text_format_test.py 93 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
7227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322
  1. #! /usr/bin/env python
  2. # -*- coding: utf-8 -*-
  3. #
  4. # Protocol Buffers - Google's data interchange format
  5. # Copyright 2008 Google Inc. All rights reserved.
  6. # https://developers.google.com/protocol-buffers/
  7. #
  8. # Redistribution and use in source and binary forms, with or without
  9. # modification, are permitted provided that the following conditions are
  10. # met:
  11. #
  12. # * Redistributions of source code must retain the above copyright
  13. # notice, this list of conditions and the following disclaimer.
  14. # * Redistributions in binary form must reproduce the above
  15. # copyright notice, this list of conditions and the following disclaimer
  16. # in the documentation and/or other materials provided with the
  17. # distribution.
  18. # * Neither the name of Google Inc. nor the names of its
  19. # contributors may be used to endorse or promote products derived from
  20. # this software without specific prior written permission.
  21. #
  22. # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  23. # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  24. # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  25. # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  26. # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  27. # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  28. # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  29. # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  30. # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  31. # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  32. # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  33. """Test for google.protobuf.text_format."""
  34. import io
  35. import math
  36. import re
  37. import string
  38. import textwrap
  39. import six
  40. # pylint: disable=g-import-not-at-top
  41. try:
  42. import unittest2 as unittest # PY26
  43. except ImportError:
  44. import unittest
  45. from google.protobuf import any_pb2
  46. from google.protobuf import any_test_pb2
  47. from google.protobuf import map_unittest_pb2
  48. from google.protobuf import unittest_custom_options_pb2
  49. from google.protobuf import unittest_mset_pb2
  50. from google.protobuf import unittest_pb2
  51. from google.protobuf import unittest_proto3_arena_pb2
  52. from google.protobuf import descriptor_pb2
  53. from google.protobuf.internal import any_test_pb2 as test_extend_any
  54. from google.protobuf.internal import message_set_extensions_pb2
  55. from google.protobuf.internal import test_util
  56. from google.protobuf import descriptor_pool
  57. from google.protobuf import text_format
  58. from google.protobuf.internal import _parameterized
  59. # pylint: enable=g-import-not-at-top
  60. # Low-level nuts-n-bolts tests.
  61. class SimpleTextFormatTests(unittest.TestCase):
  # Each member of _QUOTES is interpolated into a regexp template that expects
  # single characters, so a "quote mark" longer than one character would be an
  # error (on top of being nonsensical in the first place).
  def testQuoteMarksAreSingleChars(self):
    """Checks that every entry of text_format._QUOTES has length one."""
    for quote_mark in text_format._QUOTES:
      mark_length = len(quote_mark)
      self.assertEqual(1, mark_length)
  69. # Base class with some common functionality.
  70. class TextFormatBase(unittest.TestCase):
  def ReadGolden(self, golden_filename):
    """Reads a golden file and returns its lines.

    Args:
      golden_filename: name handed to test_util.GoldenFile.

    Returns:
      A list of lines. When `str is bytes` the lines are returned exactly as
      read; otherwise every line is decoded as UTF-8 first.
    """
    with test_util.GoldenFile(golden_filename) as golden_file:
      if str is bytes:
        return golden_file.readlines()
      # PY3
      return [raw_line.decode('utf-8') for raw_line in golden_file]
  def CompareToGoldenFile(self, text, golden_filename):
    """Asserts that text equals the joined lines of the named golden file.

    Args:
      text: the text under test.
      golden_filename: golden file name, read through self.ReadGolden.
    """
    expected_text = ''.join(self.ReadGolden(golden_filename))
    self.assertMultiLineEqual(text, expected_text)
  78. def CompareToGoldenText(self, text, golden_text):
  79. self.assertEqual(text, golden_text)
  def RemoveRedundantZeros(self, text):
    """Normalizes printed numbers so they can be compared to golden text.

    Args:
      text: text produced by the printer.

    Returns:
      text with up to two padding zeros dropped after each 'e+' / 'e-' and
      with a '.0' at the end of any line removed.
    """
    # Some platforms print 1e+5 as 1e+005. That is fine, but the padding zeros
    # have to go in order to match the golden text. Two passes per sign strip
    # up to two zeros.
    for exponent_sign in ('e+', 'e-'):
      padded_sign = exponent_sign + '0'
      text = text.replace(padded_sign, exponent_sign)
      text = text.replace(padded_sign, exponent_sign)
    # Floating point fields are printed with a .0 suffix even when they hold
    # integer values.
    trailing_point_zero = re.compile(r'\.0$', re.MULTILINE)
    return trailing_point_zero.sub('', text)
  89. @_parameterized.parameters(unittest_pb2, unittest_proto3_arena_pb2)
  90. class TextFormatMessageToStringTests(TextFormatBase):
  def testPrintExotic(self, message_module):
    """Prints extreme integers, doubles and escaped / non-ASCII strings."""
    message = message_module.TestAllTypes()
    message.repeated_int64.append(-9223372036854775808)
    message.repeated_uint64.append(18446744073709551615)
    message.repeated_double.extend([123.456, 1.23e22, 1.23e-18])
    message.repeated_string.extend(
        ['\000\001\a\b\f\n\r\t\v\\\'"', u'\u00fc\ua71f'])

    expected_pieces = [
        'repeated_int64: -9223372036854775808\n',
        'repeated_uint64: 18446744073709551615\n',
        'repeated_double: 123.456\n',
        'repeated_double: 1.23e+22\n',
        'repeated_double: 1.23e-18\n',
        'repeated_string:',
        ' "\\000\\001\\007\\010\\014\\n\\r\\t\\013\\\\\\\'\\""\n',
        'repeated_string: "\\303\\274\\352\\234\\237"\n',
    ]
    printed = self.RemoveRedundantZeros(text_format.MessageToString(message))
    self.CompareToGoldenText(printed, ''.join(expected_pieces))
  def testPrintFloatPrecision(self, message_module):
    """Checks the default number of digits printed for floats and doubles."""
    message = message_module.TestAllTypes()
    message.repeated_float.extend([
        0.0, 0.8, 1.0, 1.2, 1.23, 1.234, 1.2345, 1.23456,
        1.2e10, 1.23e10, 1.234e10, 1.2345e10, 1.23456e10,
    ])
    message.repeated_double.extend([
        0.0, 0.8, 1.0, 1.2, 1.23, 1.234, 1.2345, 1.23456, 1.234567,
        1.2345678, 1.23456789, 1.234567898, 1.2345678987, 1.23456789876,
        1.234567898765, 1.2345678987654, 1.23456789876543,
        1.2e100, 1.23e100, 1.234e100, 1.2345e100, 1.23456e100,
        1.234567e100, 1.2345678e100, 1.23456789e100, 1.234567898e100,
        1.2345678987e100, 1.23456789876e100, 1.234567898765e100,
        1.2345678987654e100, 1.23456789876543e100,
    ])

    # Output shared by both Python major versions, up to the last double that
    # prints identically on each.
    shared_head = (
        'repeated_float: 0\n'
        # This should be 0.8
        'repeated_float: 0.80000001\n'
        'repeated_float: 1\n'
        'repeated_float: 1.2\n'
        'repeated_float: 1.23\n'
        'repeated_float: 1.234\n'
        # This should be 1.2345
        'repeated_float: 1.2345001\n'
        'repeated_float: 1.23456\n'
        # Note that these don't use scientific notation.
        'repeated_float: 12000000000\n'
        'repeated_float: 12300000000\n'
        'repeated_float: 12340000000\n'
        'repeated_float: 12345000000\n'
        'repeated_float: 12345600000\n'
        'repeated_double: 0\n'
        'repeated_double: 0.8\n'
        'repeated_double: 1\n'
        'repeated_double: 1.2\n'
        'repeated_double: 1.23\n'
        'repeated_double: 1.234\n'
        'repeated_double: 1.2345\n'
        'repeated_double: 1.23456\n'
        'repeated_double: 1.234567\n'
        'repeated_double: 1.2345678\n'
        'repeated_double: 1.23456789\n'
        'repeated_double: 1.234567898\n'
        'repeated_double: 1.2345678987\n'
        'repeated_double: 1.23456789876\n')
    shared_exponent_part = (
        'repeated_double: 1.2e+100\n'
        'repeated_double: 1.23e+100\n'
        'repeated_double: 1.234e+100\n'
        'repeated_double: 1.2345e+100\n'
        'repeated_double: 1.23456e+100\n'
        'repeated_double: 1.234567e+100\n'
        'repeated_double: 1.2345678e+100\n'
        'repeated_double: 1.23456789e+100\n'
        'repeated_double: 1.234567898e+100\n'
        'repeated_double: 1.2345678987e+100\n'
        'repeated_double: 1.23456789876e+100\n')

    # The three longest doubles in each group are expected to print
    # differently under Python 2.
    if six.PY2:
      plain_tail = (
          'repeated_double: 1.23456789876\n'
          'repeated_double: 1.23456789877\n'
          'repeated_double: 1.23456789877\n')
      exponent_tail = (
          'repeated_double: 1.23456789877e+100\n'
          'repeated_double: 1.23456789877e+100\n'
          'repeated_double: 1.23456789877e+100\n')
    else:
      plain_tail = (
          'repeated_double: 1.234567898765\n'
          'repeated_double: 1.2345678987654\n'
          'repeated_double: 1.23456789876543\n')
      exponent_tail = (
          'repeated_double: 1.234567898765e+100\n'
          'repeated_double: 1.2345678987654e+100\n'
          'repeated_double: 1.23456789876543e+100\n')

    expected = shared_head + plain_tail + shared_exponent_part + exponent_tail
    printed = self.RemoveRedundantZeros(text_format.MessageToString(message))
    self.CompareToGoldenText(printed, expected)
  def testPrintExoticUnicodeSubclass(self, message_module):
    """Prints a string field holding an instance of a text-type subclass."""

    class UnicodeSub(six.text_type):
      pass

    message = message_module.TestAllTypes()
    subclassed_value = UnicodeSub(u'\u00fc\ua71f')
    message.repeated_string.append(subclassed_value)
    printed = text_format.MessageToString(message)
    self.CompareToGoldenText(
        printed, 'repeated_string: "\\303\\274\\352\\234\\237"\n')
  def testPrintNestedMessageAsOneLine(self, message_module):
    """Prints a repeated nested message with as_one_line=True."""
    message = message_module.TestAllTypes()
    nested = message.repeated_nested_message.add()
    nested.bb = 42
    one_line_text = text_format.MessageToString(message, as_one_line=True)
    self.CompareToGoldenText(
        one_line_text, 'repeated_nested_message { bb: 42 }')
  def testPrintRepeatedFieldsAsOneLine(self, message_module):
    """Prints repeated scalar fields with as_one_line=True."""
    message = message_module.TestAllTypes()
    message.repeated_int32.extend([1, 1, 3])
    message.repeated_string.extend(['Google', 'Zurich'])
    expected_fields = [
        'repeated_int32: 1',
        'repeated_int32: 1',
        'repeated_int32: 3',
        'repeated_string: "Google"',
        'repeated_string: "Zurich"',
    ]
    one_line_text = text_format.MessageToString(message, as_one_line=True)
    self.CompareToGoldenText(one_line_text, ' '.join(expected_fields))
  def VerifyPrintShortFormatRepeatedFields(self, message_module, as_one_line):
    """Checks printing and re-parsing with use_short_repeated_primitives.

    Args:
      message_module: generated module providing TestAllTypes.
      as_one_line: passed through to MessageToString; when true the expected
        text is collapsed onto a single line as well.
    """
    message = message_module.TestAllTypes()
    message.repeated_int32.append(1)
    message.repeated_string.append('Google')
    message.repeated_string.append('Hello,World')
    message.repeated_foreign_enum.append(unittest_pb2.FOREIGN_FOO)
    message.repeated_foreign_enum.append(unittest_pb2.FOREIGN_BAR)
    message.repeated_foreign_enum.append(unittest_pb2.FOREIGN_BAZ)
    message.optional_nested_message.bb = 3
    for i in (21, 32):
      msg = message.repeated_nested_message.add()
      msg.bb = i
    # Fields of a nested message are indented by two spaces in the multi-line
    # form, so the golden text must carry exactly two spaces before "bb".
    expected_ascii = (
        'optional_nested_message {\n  bb: 3\n}\n'
        'repeated_int32: [1]\n'
        'repeated_string: "Google"\n'
        'repeated_string: "Hello,World"\n'
        'repeated_nested_message {\n  bb: 21\n}\n'
        'repeated_nested_message {\n  bb: 32\n}\n'
        'repeated_foreign_enum: [FOREIGN_FOO, FOREIGN_BAR, FOREIGN_BAZ]\n')
    if as_one_line:
      # Fold newlines and indentation into single spaces, then drop the one
      # trailing space left behind by the final newline.
      expected_ascii = expected_ascii.replace('\n', ' ')
      expected_ascii = re.sub(r'\s+', ' ', expected_ascii)
      expected_ascii = re.sub(r'\s$', '', expected_ascii)
    actual_ascii = text_format.MessageToString(
        message, use_short_repeated_primitives=True,
        as_one_line=as_one_line)
    self.CompareToGoldenText(actual_ascii, expected_ascii)
    # The short repeated form has to be accepted by the parser too.
    parsed_message = message_module.TestAllTypes()
    text_format.Parse(actual_ascii, parsed_message)
    self.assertEqual(parsed_message, message)
  def testPrintShortFormatRepeatedFields(self, message_module):
    """Runs the short-repeated-format check in multi-line and one-line mode."""
    for as_one_line in (False, True):
      self.VerifyPrintShortFormatRepeatedFields(message_module, as_one_line)
  def testPrintNestedNewLineInStringAsOneLine(self, message_module):
    """Checks that newlines inside a string are escaped in one-line output."""
    message = message_module.TestAllTypes()
    message.optional_string = 'a\nnew\nline'
    one_line_text = text_format.MessageToString(message, as_one_line=True)
    self.CompareToGoldenText(
        one_line_text, 'optional_string: "a\\nnew\\nline"')
  def testPrintExoticAsOneLine(self, message_module):
    """One-line variant of the exotic integer/double/string printing test."""
    message = message_module.TestAllTypes()
    message.repeated_int64.append(-9223372036854775808)
    message.repeated_uint64.append(18446744073709551615)
    message.repeated_double.extend([123.456, 1.23e22, 1.23e-18])
    message.repeated_string.extend(
        ['\000\001\a\b\f\n\r\t\v\\\'"', u'\u00fc\ua71f'])

    # In one-line mode the fields are separated by single spaces.
    expected_fields = [
        'repeated_int64: -9223372036854775808',
        'repeated_uint64: 18446744073709551615',
        'repeated_double: 123.456',
        'repeated_double: 1.23e+22',
        'repeated_double: 1.23e-18',
        'repeated_string: '
        '"\\000\\001\\007\\010\\014\\n\\r\\t\\013\\\\\\\'\\""',
        'repeated_string: "\\303\\274\\352\\234\\237"',
    ]
    printed = self.RemoveRedundantZeros(
        text_format.MessageToString(message, as_one_line=True))
    self.CompareToGoldenText(printed, ' '.join(expected_fields))
  def testRoundTripExoticAsOneLine(self, message_module):
    """Prints exotic values on one line and parses them back, both encodings."""
    original = message_module.TestAllTypes()
    original.repeated_int64.append(-9223372036854775808)
    original.repeated_uint64.append(18446744073709551615)
    original.repeated_double.extend([123.456, 1.23e22, 1.23e-18])
    original.repeated_string.extend(
        ['\000\001\a\b\f\n\r\t\v\\\'"', u'\u00fc\ua71f'])

    # Test as_utf8 = False.
    escaped_text = text_format.MessageToString(
        original, as_one_line=True, as_utf8=False)
    from_escaped = message_module.TestAllTypes()
    parse_result = text_format.Parse(escaped_text, from_escaped)
    # Parse hands back the very message object it filled in.
    self.assertIs(parse_result, from_escaped)
    self.assertEqual(original, from_escaped)

    # Test as_utf8 = True.
    utf8_text = text_format.MessageToString(
        original, as_one_line=True, as_utf8=True)
    from_utf8 = message_module.TestAllTypes()
    parse_result = text_format.Parse(utf8_text, from_utf8)
    self.assertIs(parse_result, from_utf8)
    self.assertEqual(original, from_utf8,
                     '\n%s != %s' % (original, from_utf8))
  def testPrintRawUtf8String(self, message_module):
    """Prints a non-ASCII string with as_utf8=True and parses it back."""
    message = message_module.TestAllTypes()
    message.repeated_string.append(u'\u00fc\t\ua71f')
    printed = text_format.MessageToString(message, as_utf8=True)

    golden_unicode = u'repeated_string: "\u00fc\\t\ua71f"\n'
    # MessageToString always returns a native str.
    if six.PY3:
      golden_text = golden_unicode
    else:
      golden_text = golden_unicode.encode('utf-8')
    self.CompareToGoldenText(printed, golden_text)

    reparsed = message_module.TestAllTypes()
    text_format.Parse(printed, reparsed)
    failure_details = '\n%s != %s (%s != %s)' % (
        message, reparsed, message.repeated_string[0],
        reparsed.repeated_string[0])
    self.assertEqual(message, reparsed, failure_details)
  def testPrintFloatFormat(self, message_module):
    """Checks float_format / double_format handling in MessageToString.

    Covers sub-message formatting in both the multi-line and the as_one_line
    code paths, float_format used alone (applies to doubles too), float_format
    combined with double_format, and the default formats.
    """
    # Fields of the nested "payload" message are indented by two spaces in the
    # multi-line form; the one-line form separates everything by one space.
    multi_line_template = 'payload {{\n  {0}\n  {1}\n  {2}\n  {3}\n}}\n'
    one_line_template = 'payload {{ {0} {1} {2} {3} }}'

    # Check that float_format argument is passed to sub-message formatting.
    message = message_module.NestedTestAllTypes()
    message.payload.optional_float = 1.25
    # Check rounding at 15 significant digits
    message.payload.optional_double = -.000003456789012345678
    # Check no decimal point.
    message.payload.repeated_float.append(-5642)
    # Check no trailing zeros.
    message.payload.repeated_double.append(.000078900)
    formatted_fields = ['optional_float: 1.25',
                        'optional_double: -3.45678901234568e-6',
                        'repeated_float: -5642', 'repeated_double: 7.89e-5']
    text_message = text_format.MessageToString(message, float_format='.15g')
    self.CompareToGoldenText(
        self.RemoveRedundantZeros(text_message),
        multi_line_template.format(*formatted_fields))
    # as_one_line=True is a separate code branch where float_format is passed.
    text_message = text_format.MessageToString(message,
                                               as_one_line=True,
                                               float_format='.15g')
    self.CompareToGoldenText(
        self.RemoveRedundantZeros(text_message),
        one_line_template.format(*formatted_fields))

    # 32-bit 1.2 is noisy when extended to 64-bit:
    #  >>> struct.unpack('f', struct.pack('f', 1.2))[0]
    #  1.2000000476837158
    # TODO(jieluo): change to 1.2 with cl/241634942.
    message.payload.optional_float = 1.2000000476837158
    formatted_fields = ['optional_float: 1.2',
                        'optional_double: -3.45678901234568e-6',
                        'repeated_float: -5642', 'repeated_double: 7.89e-5']
    text_message = text_format.MessageToString(message, float_format='.7g',
                                               double_format='.15g')
    self.CompareToGoldenText(
        self.RemoveRedundantZeros(text_message),
        multi_line_template.format(*formatted_fields))

    # Test only set float_format affect both float and double fields.
    formatted_fields = ['optional_float: 1.2',
                        'optional_double: -3.456789e-6',
                        'repeated_float: -5642', 'repeated_double: 7.89e-5']
    text_message = text_format.MessageToString(message, float_format='.7g')
    self.CompareToGoldenText(
        self.RemoveRedundantZeros(text_message),
        multi_line_template.format(*formatted_fields))

    # Test default float_format has 8 valid digits.
    message.payload.optional_float = 1.2345678912
    message.payload.optional_double = 1.2345678912
    formatted_fields = ['optional_float: 1.2345679',
                        'optional_double: 1.2345678912',
                        'repeated_float: -5642', 'repeated_double: 7.89e-5']
    text_message = text_format.MessageToString(message)
    self.CompareToGoldenText(
        self.RemoveRedundantZeros(text_message),
        multi_line_template.format(*formatted_fields))
  def testMessageToString(self, message_module):
    """Checks that str() on a message yields its text format."""
    foreign = message_module.ForeignMessage()
    foreign.c = 123
    rendered = str(foreign)
    self.assertEqual('c: 123\n', rendered)
  def testMessageToStringUnicode(self, message_module):
    """Prints non-ASCII string and bytes fields with as_utf8=True."""
    unicode_value = u'Á short desçription and a 🍌.'
    message = message_module.TestAllTypes()
    message.optional_string = unicode_value
    message.optional_bytes = unicode_value.encode('utf-8')

    # The string field is expected unescaped, the bytes field octal-escaped.
    expected = textwrap.dedent(
        'optional_string: "Á short desçription and a 🍌."\n'
        'optional_bytes: '
        r'"\303\201 short des\303\247ription and a \360\237\215\214."'
        '\n')
    printed = text_format.MessageToString(message, as_utf8=True)
    self.CompareToGoldenText(printed, expected)
  def testMessageToStringASCII(self, message_module):
    """Prints non-ASCII string and bytes fields with as_utf8=False."""
    unicode_value = u'Á short desçription and a 🍌.'
    message = message_module.TestAllTypes()
    message.optional_string = unicode_value
    message.optional_bytes = unicode_value.encode('utf-8')

    # With as_utf8=False both fields are expected as the same escaped text.
    escaped_value = (
        r'"\303\201 short des\303\247ription and a \360\237\215\214."')
    expected = ('optional_string: ' + escaped_value + '\n'
                'optional_bytes: ' + escaped_value + '\n')
    printed = text_format.MessageToString(message, as_utf8=False)  # ASCII
    self.CompareToGoldenText(printed, expected)
  def testPrintField(self, message_module):
    """Checks PrintField, module-level and on _Printer, for an unset float."""
    message = message_module.TestAllTypes()
    float_descriptor = message.DESCRIPTOR.fields_by_name['optional_float']
    float_value = message.optional_float
    expected_line = 'optional_float: 0.0\n'

    # Module-level helper.
    writer = text_format.TextWriter(False)
    text_format.PrintField(float_descriptor, float_value, writer)
    self.assertEqual(expected_line, writer.getvalue())
    writer.close()

    # Test Printer
    writer = text_format.TextWriter(False)
    text_format._Printer(writer).PrintField(float_descriptor, float_value)
    self.assertEqual(expected_line, writer.getvalue())
    writer.close()
  def testPrintFieldValue(self, message_module):
    """Checks PrintFieldValue, module-level and on _Printer, for an unset float."""
    message = message_module.TestAllTypes()
    float_descriptor = message.DESCRIPTOR.fields_by_name['optional_float']
    float_value = message.optional_float
    expected_value = '0.0'

    # Module-level helper.
    writer = text_format.TextWriter(False)
    text_format.PrintFieldValue(float_descriptor, float_value, writer)
    self.assertEqual(expected_value, writer.getvalue())
    writer.close()

    # Test Printer
    writer = text_format.TextWriter(False)
    text_format._Printer(writer).PrintFieldValue(float_descriptor, float_value)
    self.assertEqual(expected_value, writer.getvalue())
    writer.close()
  def testCustomOptions(self, message_module):
    """Prints and re-parses a DescriptorProto that carries custom options.

    The descriptor of TestMessageWithCustomOptions is copied into a
    DescriptorProto, printed, compared with the golden text, and the golden
    text is then parsed back and compared with the proto.
    """
    message_descriptor = (unittest_custom_options_pb2.
                          TestMessageWithCustomOptions.DESCRIPTOR)
    message_proto = descriptor_pb2.DescriptorProto()
    message_descriptor.CopyToProto(message_proto)
    # Each nesting level of the printed text adds two spaces of indentation.
    expected_text = (
        'name: "TestMessageWithCustomOptions"\n'
        'field {\n'
        '  name: "field1"\n'
        '  number: 1\n'
        '  label: LABEL_OPTIONAL\n'
        '  type: TYPE_STRING\n'
        '  options {\n'
        '    ctype: CORD\n'
        '    [protobuf_unittest.field_opt1]: 8765432109\n'
        '  }\n'
        '}\n'
        'field {\n'
        '  name: "oneof_field"\n'
        '  number: 2\n'
        '  label: LABEL_OPTIONAL\n'
        '  type: TYPE_INT32\n'
        '  oneof_index: 0\n'
        '}\n'
        'enum_type {\n'
        '  name: "AnEnum"\n'
        '  value {\n'
        '    name: "ANENUM_VAL1"\n'
        '    number: 1\n'
        '  }\n'
        '  value {\n'
        '    name: "ANENUM_VAL2"\n'
        '    number: 2\n'
        '    options {\n'
        '      [protobuf_unittest.enum_value_opt1]: 123\n'
        '    }\n'
        '  }\n'
        '  options {\n'
        '    [protobuf_unittest.enum_opt1]: -789\n'
        '  }\n'
        '}\n'
        'options {\n'
        '  message_set_wire_format: false\n'
        '  [protobuf_unittest.message_opt1]: -56\n'
        '}\n'
        'oneof_decl {\n'
        '  name: "AnOneof"\n'
        '  options {\n'
        '    [protobuf_unittest.oneof_opt1]: -99\n'
        '  }\n'
        '}\n')
    self.assertEqual(expected_text,
                     text_format.MessageToString(message_proto))
    parsed_proto = descriptor_pb2.DescriptorProto()
    text_format.Parse(expected_text, parsed_proto)
    self.assertEqual(message_proto, parsed_proto)
  def testPrintUnknownFieldsEmbeddedMessageInBytes(self, message_module):
    """Prints unknown fields whose bytes payload is a serialized message.

    A TestAllTypes message is serialized into the optional_bytes field of
    another one; the result is parsed as TestEmptyMessage so that every field
    is unknown, then printed with print_unknown_fields=True in both the
    indented and the one-line form.
    """
    inner_msg = message_module.TestAllTypes()
    inner_msg.optional_int32 = 101
    inner_msg.optional_double = 102.0
    inner_msg.optional_string = u'hello'
    inner_msg.optional_bytes = b'103'
    inner_msg.optional_nested_message.bb = 105
    inner_data = inner_msg.SerializeToString()
    outer_message = message_module.TestAllTypes()
    outer_message.optional_int32 = 101
    outer_message.optional_bytes = inner_data
    all_data = outer_message.SerializeToString()
    empty_message = message_module.TestEmptyMessage()
    empty_message.ParseFromString(all_data)

    # indent=2 shifts the whole output right by two spaces, and each nesting
    # level adds two more.
    self.assertEqual('  1: 101\n'
                     '  15 {\n'
                     '    1: 101\n'
                     '    12: 4636878028842991616\n'
                     '    14: "hello"\n'
                     '    15: "103"\n'
                     '    18 {\n'
                     '      1: 105\n'
                     '    }\n'
                     '  }\n',
                     text_format.MessageToString(empty_message,
                                                 indent=2,
                                                 print_unknown_fields=True))
    self.assertEqual('1: 101 '
                     '15 { '
                     '1: 101 '
                     '12: 4636878028842991616 '
                     '14: "hello" '
                     '15: "103" '
                     '18 { 1: 105 } '
                     '}',
                     text_format.MessageToString(empty_message,
                                                 print_unknown_fields=True,
                                                 as_one_line=True))
  553. @_parameterized.parameters(unittest_pb2, unittest_proto3_arena_pb2)
  554. class TextFormatMessageToTextBytesTests(TextFormatBase):
  def testMessageToBytes(self, message_module):
    """MessageToBytes renders a one-field message as a bytes string."""
    foreign = message_module.ForeignMessage()
    foreign.c = 123
    rendered = text_format.MessageToBytes(foreign)
    self.assertEqual(b'c: 123\n', rendered)
  def testRawUtf8RoundTrip(self, message_module):
    """Text produced with as_utf8=True matches the golden and parses back."""
    original = message_module.TestAllTypes()
    original.repeated_string.append(u'\u00fc\t\ua71f')
    expected_bytes = b'repeated_string: "\xc3\xbc\\t\xea\x9c\x9f"\n'
    utf8_text = text_format.MessageToBytes(original, as_utf8=True)
    self.CompareToGoldenText(utf8_text, expected_bytes)

    reparsed = message_module.TestAllTypes()
    text_format.Parse(utf8_text, reparsed)
    failure_note = '\n%s != %s (%s != %s)' % (
        original, reparsed, original.repeated_string[0],
        reparsed.repeated_string[0])
    self.assertEqual(original, reparsed, failure_note)
  def testEscapedUtf8ASCIIRoundTrip(self, message_module):
    """Default (escaped) output matches the golden and parses back."""
    original = message_module.TestAllTypes()
    original.repeated_string.append(u'\u00fc\t\ua71f')
    expected_bytes = b'repeated_string: "\\303\\274\\t\\352\\234\\237"\n'
    # as_utf8 is left at its default of False.
    escaped_text = text_format.MessageToBytes(original)
    self.CompareToGoldenText(escaped_text, expected_bytes)

    reparsed = message_module.TestAllTypes()
    text_format.Parse(escaped_text, reparsed)
    failure_note = '\n%s != %s (%s != %s)' % (
        original, reparsed, original.repeated_string[0],
        reparsed.repeated_string[0])
    self.assertEqual(original, reparsed, failure_note)
  583. @_parameterized.parameters(unittest_pb2, unittest_proto3_arena_pb2)
  584. class TextFormatParserTests(TextFormatBase):
  def testParseAllFields(self, message_module):
    """A message with all fields set equals itself after print then parse."""
    source = message_module.TestAllTypes()
    test_util.SetAllFields(source)
    printed = text_format.MessageToString(source)

    round_tripped = message_module.TestAllTypes()
    text_format.Parse(printed, round_tripped)
    self.assertEqual(source, round_tripped)
    if message_module is unittest_pb2:
      test_util.ExpectAllFieldsSet(self, source)
  def testParseAndMergeUtf8(self, message_module):
    """Parse and Merge take UTF-8 encoded bytes and non-ASCII unicode text."""
    expected = message_module.TestAllTypes()
    test_util.SetAllFields(expected)
    encoded_text = text_format.MessageToString(expected).encode('utf-8')
    is_proto2 = message_module is unittest_pb2

    # First through Parse ...
    parsed = message_module.TestAllTypes()
    text_format.Parse(encoded_text, parsed)
    self.assertEqual(expected, parsed)
    if is_proto2:
      test_util.ExpectAllFieldsSet(self, expected)

    # ... then through Merge on the cleared message.
    parsed.Clear()
    text_format.Merge(encoded_text, parsed)
    self.assertEqual(expected, parsed)
    if is_proto2:
      test_util.ExpectAllFieldsSet(self, expected)

    cafe_text = u'optional_string: "café"'
    cafe_message = message_module.TestAllTypes()
    text_format.Merge(cafe_text, cafe_message)
    self.assertEqual(cafe_message.optional_string, u'café')
    cafe_message.Clear()
    self.assertEqual(cafe_message.optional_string, u'')
    text_format.Parse(cafe_text, cafe_message)
    self.assertEqual(cafe_message.optional_string, u'café')
  def testParseDoubleToFloat(self, message_module):
    """Out-of-range literals parsed into float fields: inf and a tiny value."""
    parsed = message_module.TestAllTypes()
    float_text = ('repeated_float: 3.4028235e+39\n'
                  'repeated_float: 1.4028235e-39\n')
    text_format.Parse(float_text, parsed)
    floats = parsed.repeated_float
    self.assertEqual(floats[0], float('inf'))
    self.assertAlmostEqual(floats[1], 1.4028235e-39)
  def testParseExotic(self, message_module):
    """Parse extreme integers, exponent doubles and escaped/adjacent strings."""
    parsed = message_module.TestAllTypes()
    exotic_text = ('repeated_int64: -9223372036854775808\n'
                   'repeated_uint64: 18446744073709551615\n'
                   'repeated_double: 123.456\n'
                   'repeated_double: 1.23e+22\n'
                   'repeated_double: 1.23e-18\n'
                   'repeated_string: \n'
                   '"\\000\\001\\007\\010\\014\\n\\r\\t\\013\\\\\\\'\\""\n'
                   'repeated_string: "foo" \'corge\' "grault"\n'
                   'repeated_string: "\\303\\274\\352\\234\\237"\n'
                   'repeated_string: "\\xc3\\xbc"\n'
                   'repeated_string: "\xc3\xbc"\n')
    text_format.Parse(exotic_text, parsed)

    self.assertEqual(-9223372036854775808, parsed.repeated_int64[0])
    self.assertEqual(18446744073709551615, parsed.repeated_uint64[0])

    expected_doubles = (123.456, 1.23e22, 1.23e-18)
    for index, expected in enumerate(expected_doubles):
      self.assertEqual(expected, parsed.repeated_double[index])

    # Only the first four strings are checked.
    expected_strings = (
        '\000\001\a\b\f\n\r\t\v\\\'"',
        'foocorgegrault',
        u'\u00fc\ua71f',
        u'\u00fc',
    )
    for index, expected in enumerate(expected_strings):
      self.assertEqual(expected, parsed.repeated_string[index])
  def testParseTrailingCommas(self, message_module):
    """Fields may be followed by a ',' or ';' separator."""
    parsed = message_module.TestAllTypes()
    separated_text = ('repeated_int64: 100;\n'
                      'repeated_int64: 200;\n'
                      'repeated_int64: 300,\n'
                      'repeated_string: "one",\n'
                      'repeated_string: "two";\n')
    text_format.Parse(separated_text, parsed)

    for index, expected in enumerate((100, 200, 300)):
      self.assertEqual(expected, parsed.repeated_int64[index])
    for index, expected in enumerate((u'one', u'two')):
      self.assertEqual(expected, parsed.repeated_string[index])
  def testParseRepeatedScalarShortFormat(self, message_module):
    """Repeated scalars may be given as a bracketed list, including []."""
    parsed = message_module.TestAllTypes()
    short_text = ('repeated_int64: [100, 200];\n'
                  'repeated_int64: []\n'
                  'repeated_int64: 300,\n'
                  'repeated_string: ["one", "two"];\n')
    text_format.Parse(short_text, parsed)

    int64_values = parsed.repeated_int64
    self.assertEqual(100, int64_values[0])
    self.assertEqual(200, int64_values[1])
    self.assertEqual(300, int64_values[2])
    string_values = parsed.repeated_string
    self.assertEqual(u'one', string_values[0])
    self.assertEqual(u'two', string_values[1])
  def testParseRepeatedMessageShortFormat(self, message_module):
    """Repeated messages may be given as a bracketed list of {...} blocks."""
    parsed = message_module.TestAllTypes()
    short_text = ('repeated_nested_message: [{bb: 100}, {bb: 200}],\n'
                  'repeated_nested_message: {bb: 300}\n'
                  'repeated_nested_message [{bb: 400}];\n')
    text_format.Parse(short_text, parsed)

    for index, expected_bb in enumerate((100, 200, 300, 400)):
      self.assertEqual(expected_bb, parsed.repeated_nested_message[index].bb)
  def testParseEmptyText(self, message_module):
    """Parsing the empty string leaves the message equal to a fresh one."""
    parsed = message_module.TestAllTypes()
    text_format.Parse('', parsed)
    untouched = message_module.TestAllTypes()
    self.assertEqual(untouched, parsed)
  def testParseInvalidUtf8(self, message_module):
    """Invalid UTF-8 in a string field raises ParseError at line 1, col 28."""
    target = message_module.TestAllTypes()
    bad_text = 'repeated_string: "\\xc3\\xc3"'
    with self.assertRaises(text_format.ParseError) as caught:
      text_format.Parse(bad_text, target)
    # The exception is only available once the context manager has exited.
    error = caught.exception
    self.assertEqual(error.GetLine(), 1)
    self.assertEqual(error.GetColumn(), 28)
  def testParseSingleWord(self, message_module):
    """A lone identifier is reported as an unknown field name."""
    target = message_module.TestAllTypes()
    expected_error = (
        r'1:1 : Message type "\w+.TestAllTypes" has no field named '
        r'"foo".')
    with six.assertRaisesRegex(self, text_format.ParseError, expected_error):
      text_format.Parse('foo', target)
  def testParseUnknownField(self, message_module):
    """Unknown fields raise ParseError unless allow_unknown_field=True."""
    target = message_module.TestAllTypes()
    expected_error = (
        r'1:1 : Message type "\w+.TestAllTypes" has no field named '
        r'"unknown_field".')
    with six.assertRaisesRegex(self, text_format.ParseError, expected_error):
      text_format.Parse('unknown_field: 8\n', target)

    tolerated_text = ('optional_int32: 123\n'
                      'unknown_field: 8\n'
                      'optional_nested_message { bb: 45 }')
    text_format.Parse(tolerated_text, target, allow_unknown_field=True)
    self.assertEqual(target.optional_nested_message.bb, 45)
    self.assertEqual(target.optional_int32, 123)
  def testParseBadEnumValue(self, message_module):
    """An unknown enum value name raises ParseError with its position."""
    target = message_module.TestAllTypes()
    expected_error = (r'1:23 : \'optional_nested_enum: BARR\': '
                      r'Enum type "\w+.TestAllTypes.NestedEnum" '
                      r'has no value named BARR.')
    with six.assertRaisesRegex(self, text_format.ParseError, expected_error):
      text_format.Parse('optional_nested_enum: BARR', target)
  def testParseBadIntValue(self, message_module):
    """A non-numeric value for an int32 field raises ParseError."""
    target = message_module.TestAllTypes()
    expected_error = ('1:17 : \'optional_int32: bork\': '
                      'Couldn\'t parse integer: bork')
    with six.assertRaisesRegex(self, text_format.ParseError, expected_error):
      text_format.Parse('optional_int32: bork', target)
  def testParseStringFieldUnescape(self, message_module):
    """Hex escapes are decoded; backslash pairs become one literal backslash."""
    parsed = message_module.TestAllTypes()
    # Raw strings keep every backslash exactly as the parser should see it.
    escaped_text = '\n'.join([
        r'repeated_string: "\xf\x62"',
        r'repeated_string: "\\xf\\x62"',
        r'repeated_string: "\\\xf\\\x62"',
        r'repeated_string: "\\\\xf\\\\x62"',
        r'repeated_string: "\\\\\xf\\\\\x62"',
        r'repeated_string: "\x5cx20"',
    ])
    text_format.Parse(escaped_text, parsed)

    SLASH = '\\'
    strings = parsed.repeated_string
    self.assertEqual('\x0fb', strings[0])
    self.assertEqual(SLASH + 'xf' + SLASH + 'x62', strings[1])
    self.assertEqual(SLASH + '\x0f' + SLASH + 'b', strings[2])
    self.assertEqual(SLASH + SLASH + 'xf' + SLASH + SLASH + 'x62',
                     strings[3])
    self.assertEqual(SLASH + SLASH + '\x0f' + SLASH + SLASH + 'b',
                     strings[4])
    self.assertEqual(SLASH + 'x20', strings[5])
  def testParseOneof(self, message_module):
    """The oneof case set on a message is kept across print then parse."""
    source = message_module.TestAllTypes()
    source.oneof_uint32 = 11
    printed = text_format.MessageToString(source)
    reparsed = message_module.TestAllTypes()
    text_format.Parse(printed, reparsed)
    self.assertEqual('oneof_uint32', reparsed.WhichOneof('oneof_field'))
  def testParseMultipleOneof(self, message_module):
    """Parse rejects text that sets two members of the same oneof."""
    conflicting_text = 'oneof_uint32: 11' + '\n' + 'oneof_string: "foo"'
    target = message_module.TestAllTypes()
    six.assertRaisesRegex(self, text_format.ParseError,
                          ' is specified along with field ',
                          text_format.Parse, conflicting_text, target)
  # Expected values for the sample text defined below.
  _GOLDEN_UNICODE = u'Á short desçription'
  _GOLDEN_BYTES = _GOLDEN_UNICODE.encode('utf-8')
  _GOLDEN_BYTES_1 = b'\x12\x34\x56\x78\x90\xab\xcd\xef'
  _GOLDEN_STR_0 = u'Привет'

  # The sample holds non-ASCII code points as literals; they should come
  # through as UTF-8 for bytes fields and as the unicode itself for string
  # fields. It also demonstrates escaped binary data.
  # Python 3 has no ur"" string prefix, so every backslash is doubled to make
  # the escape sequences reach the parser intact.
  _UNICODE_SAMPLE = (
      u'\n'
      u"optional_bytes: 'Á short desçription'\n"
      u"optional_string: 'Á short desçription'\n"
      u"repeated_bytes: '\\303\\201 short des\\303\\247ription'\n"
      u"repeated_bytes: '\\x12\\x34\\x56\\x78\\x90\\xab\\xcd\\xef'\n"
      u"repeated_string: '\\xd0\\x9f\\xd1\\x80\\xd0\\xb8\\xd0\\xb2\\xd0\\xb5\\xd1\\x82'\n")
  _BYTES_SAMPLE = _UNICODE_SAMPLE.encode('utf-8')
  def testParseUnicode(self, message_module):
    """Parse the unicode sample and check bytes and string fields."""
    parsed = message_module.TestAllTypes()
    text_format.Parse(self._UNICODE_SAMPLE, parsed)

    golden_bytes = self._GOLDEN_BYTES
    self.assertEqual(parsed.optional_bytes, golden_bytes)
    self.assertEqual(parsed.optional_string, self._GOLDEN_UNICODE)
    self.assertEqual(parsed.repeated_bytes[0], golden_bytes)
    # The second bytes entry is backslash-escaped raw binary, not UTF-8.
    self.assertEqual(parsed.repeated_bytes[1], self._GOLDEN_BYTES_1)
    # The string entry is the escaped UTF-8 encoding of _GOLDEN_STR_0 and
    # has to decode to exactly that.
    self.assertEqual(parsed.repeated_string[0], self._GOLDEN_STR_0)
  def testParseBytes(self, message_module):
    """Parse the UTF-8 encoded sample and check bytes and string fields."""
    parsed = message_module.TestAllTypes()
    text_format.Parse(self._BYTES_SAMPLE, parsed)

    golden_bytes = self._GOLDEN_BYTES
    self.assertEqual(parsed.optional_bytes, golden_bytes)
    self.assertEqual(parsed.optional_string, self._GOLDEN_UNICODE)
    self.assertEqual(parsed.repeated_bytes[0], golden_bytes)
    # The second bytes entry is backslash-escaped raw binary, not UTF-8.
    self.assertEqual(parsed.repeated_bytes[1], self._GOLDEN_BYTES_1)
    # The string entry is the escaped UTF-8 encoding of _GOLDEN_STR_0 and
    # has to decode to exactly that.
    self.assertEqual(parsed.repeated_string[0], self._GOLDEN_STR_0)
  def testFromBytesFile(self, message_module):
    """ParseLines reads the sample from an in-memory bytes file."""
    parsed = message_module.TestAllTypes()
    bytes_file = io.BytesIO(self._BYTES_SAMPLE)
    text_format.ParseLines(bytes_file, parsed)

    golden_bytes = self._GOLDEN_BYTES
    self.assertEqual(parsed.optional_bytes, golden_bytes)
    self.assertEqual(parsed.optional_string, self._GOLDEN_UNICODE)
    self.assertEqual(parsed.repeated_bytes[0], golden_bytes)
  def testFromUnicodeFile(self, message_module):
    """ParseLines reads the sample from an in-memory text file."""
    parsed = message_module.TestAllTypes()
    text_file = io.StringIO(self._UNICODE_SAMPLE)
    text_format.ParseLines(text_file, parsed)

    golden_bytes = self._GOLDEN_BYTES
    self.assertEqual(parsed.optional_bytes, golden_bytes)
    self.assertEqual(parsed.optional_string, self._GOLDEN_UNICODE)
    self.assertEqual(parsed.repeated_bytes[0], golden_bytes)
  def testFromBytesLines(self, message_module):
    """ParseLines accepts the bytes sample split into a list of lines."""
    parsed = message_module.TestAllTypes()
    byte_lines = self._BYTES_SAMPLE.split(b'\n')
    text_format.ParseLines(byte_lines, parsed)

    golden_bytes = self._GOLDEN_BYTES
    self.assertEqual(parsed.optional_bytes, golden_bytes)
    self.assertEqual(parsed.optional_string, self._GOLDEN_UNICODE)
    self.assertEqual(parsed.repeated_bytes[0], golden_bytes)
  def testFromUnicodeLines(self, message_module):
    """ParseLines accepts the unicode sample split into a list of lines."""
    parsed = message_module.TestAllTypes()
    text_lines = self._UNICODE_SAMPLE.split(u'\n')
    text_format.ParseLines(text_lines, parsed)

    golden_bytes = self._GOLDEN_BYTES
    self.assertEqual(parsed.optional_bytes, golden_bytes)
    self.assertEqual(parsed.optional_string, self._GOLDEN_UNICODE)
    self.assertEqual(parsed.repeated_bytes[0], golden_bytes)
  def testParseDuplicateMessages(self, message_module):
    """Parse rejects a singular message field that appears twice."""
    target = message_module.TestAllTypes()
    duplicated_text = ('optional_nested_message { bb: 1 } '
                       'optional_nested_message { bb: 2 }')
    expected_error = (
        r'1:59 : Message type "\w+.TestAllTypes" '
        r'should not have multiple "optional_nested_message" fields.')
    with six.assertRaisesRegex(self, text_format.ParseError, expected_error):
      text_format.Parse(duplicated_text, target)
  def testParseDuplicateScalars(self, message_module):
    """Parse rejects a singular scalar field that appears twice."""
    target = message_module.TestAllTypes()
    duplicated_text = 'optional_int32: 42 ' + 'optional_int32: 67'
    expected_error = (
        r'1:36 : Message type "\w+.TestAllTypes" should not '
        r'have multiple "optional_int32" fields.')
    with six.assertRaisesRegex(self, text_format.ParseError, expected_error):
      text_format.Parse(duplicated_text, target)
  def testParseExistingScalarInMessage(self, message_module):
    """Parse rejects a scalar already set on the destination message."""
    prefilled = message_module.TestAllTypes(optional_int32=42)
    expected_error = (r'Message type "\w+.TestAllTypes" should not '
                      r'have multiple "optional_int32" fields.')
    with six.assertRaisesRegex(self, text_format.ParseError, expected_error):
      text_format.Parse('optional_int32: 67', prefilled)
  845. @_parameterized.parameters(unittest_pb2, unittest_proto3_arena_pb2)
  846. class TextFormatMergeTests(TextFormatBase):
  def testMergeDuplicateScalarsInText(self, message_module):
    """Merge keeps the last value of a repeated scalar and returns its arg."""
    target = message_module.TestAllTypes()
    duplicated_text = 'optional_int32: 42 ' + 'optional_int32: 67'
    returned = text_format.Merge(duplicated_text, target)
    self.assertIs(returned, target)
    self.assertEqual(67, target.optional_int32)
  def testMergeDuplicateNestedMessageScalars(self, message_module):
    """Merge keeps the last nested scalar when a message field is repeated.

    Also checks that Merge returns the very message object it was given.

    Args:
      message_module: Proto module providing TestAllTypes.
    """
    message = message_module.TestAllTypes()
    text = ('optional_nested_message { bb: 1 } '
            'optional_nested_message { bb: 2 }')
    r = text_format.Merge(text, message)
    # assertIs reports both operands on failure and matches the other merge
    # tests, unlike assertTrue(r is message).
    self.assertIs(r, message)
    self.assertEqual(2, message.optional_nested_message.bb)
  def testReplaceScalarInMessage(self, message_module):
    """Merge overwrites a scalar that is already set on the message."""
    prefilled = message_module.TestAllTypes(optional_int32=42)
    returned = text_format.Merge('optional_int32: 67', prefilled)
    self.assertIs(returned, prefilled)
    self.assertEqual(67, prefilled.optional_int32)
  def testReplaceMessageInMessage(self, message_module):
    """Merge fills in a nested message that is already present."""
    prefilled = message_module.TestAllTypes(
        optional_int32=42, optional_nested_message={})
    self.assertTrue(prefilled.HasField('optional_nested_message'))
    returned = text_format.Merge('optional_nested_message{ bb: 3 }', prefilled)
    self.assertIs(returned, prefilled)
    self.assertEqual(3, prefilled.optional_nested_message.bb)
  def testMergeMultipleOneof(self, message_module):
    """With Merge, the last oneof member in the text wins."""
    oneof_text = 'oneof_uint32: 11' + '\n' + 'oneof_string: "foo"'
    target = message_module.TestAllTypes()
    text_format.Merge(oneof_text, target)
    self.assertEqual('oneof_string', target.WhichOneof('oneof_field'))
  879. # These are tests that aren't fundamentally specific to proto2, but are at
  880. # the moment because of differences between the proto2 and proto3 test schemas.
  881. # Ideally the schemas would be made more similar so these tests could pass.
  882. class OnlyWorksWithProto2RightNowTests(TextFormatBase):
  def testPrintAllFieldsPointy(self):
    """Pointy-bracket output of a full message matches its golden file."""
    full_message = unittest_pb2.TestAllTypes()
    test_util.SetAllFields(full_message)
    pointy_text = text_format.MessageToString(
        full_message, pointy_brackets=True)
    self.CompareToGoldenFile(
        self.RemoveRedundantZeros(pointy_text),
        'text_format_unittest_data_pointy_oneof.txt')
  def testParseGolden(self):
    """Parsing the golden file yields a message with all fields set."""
    golden_lines = self.ReadGolden(
        'text_format_unittest_data_oneof_implemented.txt')
    parsed = unittest_pb2.TestAllTypes()
    returned = text_format.Parse('\n'.join(golden_lines), parsed)
    self.assertIs(returned, parsed)

    expected = unittest_pb2.TestAllTypes()
    test_util.SetAllFields(expected)
    self.assertEqual(expected, parsed)
  def testPrintAllFields(self):
    """Default output of a full message matches its golden file."""
    full_message = unittest_pb2.TestAllTypes()
    test_util.SetAllFields(full_message)
    printed = text_format.MessageToString(full_message)
    self.CompareToGoldenFile(
        self.RemoveRedundantZeros(printed),
        'text_format_unittest_data_oneof_implemented.txt')
  def testPrintUnknownFields(self):
    """Unknown fields print by field number, indented and as one line.

    A TestAllTypes message is serialized and re-read as TestEmptyMessage, so
    every field (including the group and the nested message) is unknown.
    """
    message = unittest_pb2.TestAllTypes()
    message.optional_int32 = 101
    message.optional_double = 102.0
    message.optional_string = u'hello'
    message.optional_bytes = b'103'
    message.optionalgroup.a = 104
    message.optional_nested_message.bb = 105

    empty_message = unittest_pb2.TestEmptyMessage()
    empty_message.ParseFromString(message.SerializeToString())

    # With indent=2 the top level starts two spaces in and nested levels add
    # two more; the comparison is byte-exact.
    self.assertEqual('  1: 101\n'
                     '  12: 4636878028842991616\n'
                     '  14: "hello"\n'
                     '  15: "103"\n'
                     '  16 {\n'
                     '    17: 104\n'
                     '  }\n'
                     '  18 {\n'
                     '    1: 105\n'
                     '  }\n',
                     text_format.MessageToString(empty_message,
                                                 indent=2,
                                                 print_unknown_fields=True))
    self.assertEqual('1: 101 '
                     '12: 4636878028842991616 '
                     '14: "hello" '
                     '15: "103" '
                     '16 { 17: 104 } '
                     '18 { 1: 105 }',
                     text_format.MessageToString(empty_message,
                                                 print_unknown_fields=True,
                                                 as_one_line=True))
  def testPrintInIndexOrder(self):
    """Compare use_index_order=True output with the default ordering.

    Both golden texts indent nested fields by two spaces, which is what the
    printer emits.
    """
    message = unittest_pb2.TestFieldOrderings()
    # Fields are listed in index order instead of field number.
    message.my_string = 'str'
    message.my_int = 101
    message.my_float = 111
    message.optional_nested_message.oo = 0
    message.optional_nested_message.bb = 1
    message.Extensions[unittest_pb2.my_extension_string] = 'ext_str0'
    # Extensions are listed based on the order of extension number.
    # Extension number 12.
    message.Extensions[unittest_pb2.TestExtensionOrderings2.
                       test_ext_orderings2].my_string = 'ext_str2'
    # Extension number 13.
    message.Extensions[unittest_pb2.TestExtensionOrderings1.
                       test_ext_orderings1].my_string = 'ext_str1'
    # Extension number 14.
    message.Extensions[
        unittest_pb2.TestExtensionOrderings2.TestExtensionOrderings3.
        test_ext_orderings3].my_string = 'ext_str3'

    # Print in index order.
    self.CompareToGoldenText(
        self.RemoveRedundantZeros(
            text_format.MessageToString(message, use_index_order=True)),
        'my_string: "str"\n'
        'my_int: 101\n'
        'my_float: 111\n'
        'optional_nested_message {\n'
        '  oo: 0\n'
        '  bb: 1\n'
        '}\n'
        '[protobuf_unittest.TestExtensionOrderings2.test_ext_orderings2] {\n'
        '  my_string: "ext_str2"\n'
        '}\n'
        '[protobuf_unittest.TestExtensionOrderings1.test_ext_orderings1] {\n'
        '  my_string: "ext_str1"\n'
        '}\n'
        '[protobuf_unittest.TestExtensionOrderings2.TestExtensionOrderings3'
        '.test_ext_orderings3] {\n'
        '  my_string: "ext_str3"\n'
        '}\n'
        '[protobuf_unittest.my_extension_string]: "ext_str0"\n')
    # By default, print in field number order.
    self.CompareToGoldenText(
        self.RemoveRedundantZeros(text_format.MessageToString(message)),
        'my_int: 101\n'
        'my_string: "str"\n'
        '[protobuf_unittest.TestExtensionOrderings2.test_ext_orderings2] {\n'
        '  my_string: "ext_str2"\n'
        '}\n'
        '[protobuf_unittest.TestExtensionOrderings1.test_ext_orderings1] {\n'
        '  my_string: "ext_str1"\n'
        '}\n'
        '[protobuf_unittest.TestExtensionOrderings2.TestExtensionOrderings3'
        '.test_ext_orderings3] {\n'
        '  my_string: "ext_str3"\n'
        '}\n'
        '[protobuf_unittest.my_extension_string]: "ext_str0"\n'
        'my_float: 111\n'
        'optional_nested_message {\n'
        '  bb: 1\n'
        '  oo: 0\n'
        '}\n')
  def testMergeLinesGolden(self):
    """MergeLines over the golden file yields a message with all fields set."""
    golden_lines = self.ReadGolden(
        'text_format_unittest_data_oneof_implemented.txt')
    merged = unittest_pb2.TestAllTypes()
    returned = text_format.MergeLines(golden_lines, merged)
    self.assertIs(returned, merged)

    expected = unittest_pb2.TestAllTypes()
    test_util.SetAllFields(expected)
    self.assertEqual(expected, merged)
  def testParseLinesGolden(self):
    """ParseLines over the golden file yields a message with all fields set."""
    golden_lines = self.ReadGolden(
        'text_format_unittest_data_oneof_implemented.txt')
    parsed = unittest_pb2.TestAllTypes()
    returned = text_format.ParseLines(golden_lines, parsed)
    self.assertIs(returned, parsed)

    expected = unittest_pb2.TestAllTypes()
    test_util.SetAllFields(expected)
    self.assertEqual(expected, parsed)
  def testPrintMap(self):
    """Map fields print as one key/value block per entry.

    The golden text indents key/value lines by two spaces and the nested
    message body by four, which is what the printer emits.
    """
    message = map_unittest_pb2.TestMap()
    message.map_int32_int32[-123] = -456
    message.map_int64_int64[-2**33] = -2**34
    message.map_uint32_uint32[123] = 456
    message.map_uint64_uint64[2**33] = 2**34
    message.map_string_string['abc'] = '123'
    message.map_int32_foreign_message[111].c = 5

    # Maps are serialized to text format using their underlying repeated
    # representation.
    expected_text = ('map_int32_int32 {\n'
                     '  key: -123\n'
                     '  value: -456\n'
                     '}\n'
                     'map_int64_int64 {\n'
                     '  key: -8589934592\n'
                     '  value: -17179869184\n'
                     '}\n'
                     'map_uint32_uint32 {\n'
                     '  key: 123\n'
                     '  value: 456\n'
                     '}\n'
                     'map_uint64_uint64 {\n'
                     '  key: 8589934592\n'
                     '  value: 17179869184\n'
                     '}\n'
                     'map_string_string {\n'
                     '  key: "abc"\n'
                     '  value: "123"\n'
                     '}\n'
                     'map_int32_foreign_message {\n'
                     '  key: 111\n'
                     '  value {\n'
                     '    c: 5\n'
                     '  }\n'
                     '}\n')
    self.CompareToGoldenText(text_format.MessageToString(message),
                             expected_text)
  1054. # In cpp implementation, __str__ calls the cpp implementation of text format.
  def testPrintMapUsingCppImplementation(self):
    """str(message) reflects later changes to a message-valued map entry.

    The expected text is compared byte-exactly with str(message), so nested
    lines carry two spaces of indentation per level.
    """
    message = map_unittest_pb2.TestMap()
    inner_msg = message.map_int32_foreign_message[111]
    expected_template = ('map_int32_foreign_message {\n'
                         '  key: 111\n'
                         '  value {\n'
                         '    c: %d\n'
                         '  }\n'
                         '}\n')
    # Mutate the same entry twice; the printed text must follow each change.
    for value in (1, 2):
      inner_msg.c = value
      self.assertEqual(str(message), expected_template % value)
  def testMapOrderEnforcement(self):
    """String-keyed map entries print in key order, not insertion order.

    Keys N..Z are inserted first, then M..A in reverse; the golden text lists
    A..Z. Each entry's key/value lines are indented by two spaces, which is
    what the printer emits.
    """
    message = map_unittest_pb2.TestMap()
    for letter in string.ascii_uppercase[13:26]:
      message.map_string_string[letter] = 'dummy'
    for letter in reversed(string.ascii_uppercase[0:13]):
      message.map_string_string[letter] = 'dummy'
    entry_template = 'map_string_string {\n  key: "%c"\n  value: "dummy"\n}\n'
    golden = ''.join(
        entry_template % (letter,) for letter in string.ascii_uppercase)
    self.CompareToGoldenText(text_format.MessageToString(message), golden)
  1085. # TODO(teboring): In c/137553523, not serializing default value for map entry
  1086. # message has been fixed. This test needs to be disabled in order to submit
  1087. # that cl. Add this back when c/137553523 has been submitted.
  1088. # def testMapOrderSemantics(self):
  1089. # golden_lines = self.ReadGolden('map_test_data.txt')
  1090. # message = map_unittest_pb2.TestMap()
  1091. # text_format.ParseLines(golden_lines, message)
  1092. # candidate = text_format.MessageToString(message)
  1093. # # The Python implementation emits "1.0" for the double value that the C++
  1094. # # implementation emits as "1".
  1095. # candidate = candidate.replace('1.0', '1', 2)
  1096. # candidate = candidate.replace('0.0', '0', 2)
  1097. # self.assertMultiLineEqual(candidate, ''.join(golden_lines))
  1098. # Tests of proto2-only features (MessageSet, extensions, etc.).
  1099. class Proto2Tests(TextFormatBase):
  def testPrintMessageSet(self):
    """MessageSet extensions print under their bracketed message type name.

    Covers a MessageSet nested in a container and a top-level MessageSet. The
    golden texts indent by two spaces per nesting level, which is what the
    printer emits.
    """
    message = unittest_mset_pb2.TestMessageSetContainer()
    ext1 = unittest_mset_pb2.TestMessageSetExtension1.message_set_extension
    ext2 = unittest_mset_pb2.TestMessageSetExtension2.message_set_extension
    message.message_set.Extensions[ext1].i = 23
    message.message_set.Extensions[ext2].str = 'foo'
    self.CompareToGoldenText(
        text_format.MessageToString(message),
        'message_set {\n'
        '  [protobuf_unittest.TestMessageSetExtension1] {\n'
        '    i: 23\n'
        '  }\n'
        '  [protobuf_unittest.TestMessageSetExtension2] {\n'
        '    str: "foo"\n'
        '  }\n'
        '}\n')

    message = message_set_extensions_pb2.TestMessageSet()
    ext = message_set_extensions_pb2.message_set_extension3
    message.Extensions[ext].text = 'bar'
    self.CompareToGoldenText(
        text_format.MessageToString(message),
        '[google.protobuf.internal.TestMessageSetExtension3] {\n'
        '  text: "bar"\n'
        '}\n')
  def testPrintMessageSetByFieldNumber(self):
    """PrintMessage with use_field_number=True prints numbers, not names.

    The golden text indents by two spaces per nesting level, which is what
    the printer emits.
    """
    out = text_format.TextWriter(False)
    # Registered as a cleanup so the writer is closed even when the
    # comparison below fails.
    self.addCleanup(out.close)
    message = unittest_mset_pb2.TestMessageSetContainer()
    ext1 = unittest_mset_pb2.TestMessageSetExtension1.message_set_extension
    ext2 = unittest_mset_pb2.TestMessageSetExtension2.message_set_extension
    message.message_set.Extensions[ext1].i = 23
    message.message_set.Extensions[ext2].str = 'foo'
    text_format.PrintMessage(message, out, use_field_number=True)
    self.CompareToGoldenText(out.getvalue(),
                             '1 {\n'
                             '  1545008 {\n'
                             '    15: 23\n'
                             '  }\n'
                             '  1547769 {\n'
                             '    25: "foo"\n'
                             '  }\n'
                             '}\n')
  def testPrintMessageSetAsOneLine(self):
    """A MessageSet container prints on a single line with as_one_line."""
    container = unittest_mset_pb2.TestMessageSetContainer()
    int_ext = unittest_mset_pb2.TestMessageSetExtension1.message_set_extension
    str_ext = unittest_mset_pb2.TestMessageSetExtension2.message_set_extension
    container.message_set.Extensions[int_ext].i = 23
    container.message_set.Extensions[str_ext].str = 'foo'

    expected_line = ('message_set {'
                     ' [protobuf_unittest.TestMessageSetExtension1] {'
                     ' i: 23'
                     ' }'
                     ' [protobuf_unittest.TestMessageSetExtension2] {'
                     ' str: \"foo\"'
                     ' }'
                     ' }')
    one_line = text_format.MessageToString(container, as_one_line=True)
    self.CompareToGoldenText(one_line, expected_line)
  def testParseMessageSet(self):
    """Parse plain repeated fields, then MessageSet extensions by type name."""
    all_types = unittest_pb2.TestAllTypes()
    text_format.Parse('repeated_uint64: 1\n' 'repeated_uint64: 2\n', all_types)
    self.assertEqual(1, all_types.repeated_uint64[0])
    self.assertEqual(2, all_types.repeated_uint64[1])

    container = unittest_mset_pb2.TestMessageSetContainer()
    mset_text = ('message_set {\n'
                 ' [protobuf_unittest.TestMessageSetExtension1] {\n'
                 ' i: 23\n'
                 ' }\n'
                 ' [protobuf_unittest.TestMessageSetExtension2] {\n'
                 ' str: \"foo\"\n'
                 ' }\n'
                 '}\n')
    text_format.Parse(mset_text, container)

    int_ext = unittest_mset_pb2.TestMessageSetExtension1.message_set_extension
    str_ext = unittest_mset_pb2.TestMessageSetExtension2.message_set_extension
    extensions = container.message_set.Extensions
    self.assertEqual(23, extensions[int_ext].i)
    self.assertEqual('foo', extensions[str_ext].str)
  def testExtensionInsideAnyMessage(self):
    """An extension inside an expanded Any survives Merge then print.

    The same text is merged into the message and used as the golden for
    MessageToString, so it carries the printer's two spaces of indentation
    per nesting level.
    """
    message = test_extend_any.TestAny()
    text = ('value {\n'
            '  [type.googleapis.com/google.protobuf.internal.TestAny] {\n'
            '    [google.protobuf.internal.TestAnyExtension1.extension1] {\n'
            '      i: 10\n'
            '    }\n'
            '  }\n'
            '}\n')
    text_format.Merge(text, message, descriptor_pool=descriptor_pool.Default())
    self.CompareToGoldenText(
        text_format.MessageToString(
            message, descriptor_pool=descriptor_pool.Default()),
        text)
  def testParseMessageByFieldNumber(self):
    """Field numbers work as names only when allow_field_number=True."""
    all_types = unittest_pb2.TestAllTypes()
    text_format.Parse('34: 1\n' 'repeated_uint64: 2\n', all_types,
                      allow_field_number=True)
    self.assertEqual(1, all_types.repeated_uint64[0])
    self.assertEqual(2, all_types.repeated_uint64[1])

    container = unittest_mset_pb2.TestMessageSetContainer()
    numbered_text = ('1 {\n'
                     ' 1545008 {\n'
                     ' 15: 23\n'
                     ' }\n'
                     ' 1547769 {\n'
                     ' 25: \"foo\"\n'
                     ' }\n'
                     '}\n')
    text_format.Parse(numbered_text, container, allow_field_number=True)
    int_ext = unittest_mset_pb2.TestMessageSetExtension1.message_set_extension
    str_ext = unittest_mset_pb2.TestMessageSetExtension2.message_set_extension
    extensions = container.message_set.Extensions
    self.assertEqual(23, extensions[int_ext].i)
    self.assertEqual('foo', extensions[str_ext].str)

    # Can't parse field number without set allow_field_number=True.
    fresh = unittest_pb2.TestAllTypes()
    not_allowed_error = (
        r'1:1 : Message type "\w+.TestAllTypes" has no field named '
        r'"34".')
    with six.assertRaisesRegex(self, text_format.ParseError,
                               not_allowed_error):
      text_format.Parse('34:1\n', fresh)

    # Can't parse if field number is not found.
    not_found_error = (
        r'1:1 : Message type "\w+.TestAllTypes" has no field named '
        r'"1234".')
    with six.assertRaisesRegex(self, text_format.ParseError, not_found_error):
      text_format.Parse('1234:1\n', fresh, allow_field_number=True)
  def testPrintAllExtensions(self):
    """Prints a fully populated TestAllExtensions and checks the golden file."""
    populated = unittest_pb2.TestAllExtensions()
    test_util.SetAllExtensions(populated)
    printed = text_format.MessageToString(populated)
    self.CompareToGoldenFile(
        self.RemoveRedundantZeros(printed),
        'text_format_unittest_extensions_data.txt')
  def testPrintAllExtensionsPointy(self):
    """Same as testPrintAllExtensions but printed with pointy_brackets=True."""
    populated = unittest_pb2.TestAllExtensions()
    test_util.SetAllExtensions(populated)
    printed = text_format.MessageToString(populated, pointy_brackets=True)
    self.CompareToGoldenFile(
        self.RemoveRedundantZeros(printed),
        'text_format_unittest_extensions_data_pointy.txt')
  def testParseGoldenExtensions(self):
    """Parses the extensions golden file and compares to SetAllExtensions."""
    golden_lines = self.ReadGolden('text_format_unittest_extensions_data.txt')
    from_golden = unittest_pb2.TestAllExtensions()
    text_format.Parse('\n'.join(golden_lines), from_golden)

    expected = unittest_pb2.TestAllExtensions()
    test_util.SetAllExtensions(expected)
    self.assertEqual(expected, from_golden)
  def testParseAllExtensions(self):
    """Round-trips a fully populated TestAllExtensions through text format."""
    original = unittest_pb2.TestAllExtensions()
    test_util.SetAllExtensions(original)
    round_tripped = unittest_pb2.TestAllExtensions()
    text_format.Parse(text_format.MessageToString(original), round_tripped)
    self.assertEqual(original, round_tripped)
  def testParseAllowedUnknownExtension(self):
    """Exercises Parse() with allow_unknown_extension=True."""

    def assert_rejected(bad_text, error_regex):
      # Each rejected input is parsed into a fresh container.
      target = unittest_mset_pb2.TestMessageSetContainer()
      with six.assertRaisesRegex(self, text_format.ParseError, error_regex):
        text_format.Parse(bad_text, target, allow_unknown_extension=True)

    # Skip over unknown extension correctly.
    container = unittest_mset_pb2.TestMessageSetContainer()
    unknown_text = ('message_set {\n'
                    ' [unknown_extension] {\n'
                    ' i: 23\n'
                    ' bin: "\xe0"'
                    ' [nested_unknown_ext]: {\n'
                    ' i: 23\n'
                    ' x: x\n'
                    ' test: "test_string"\n'
                    ' floaty_float: -0.315\n'
                    ' num: -inf\n'
                    ' multiline_str: "abc"\n'
                    ' "def"\n'
                    ' "xyz."\n'
                    ' [nested_unknown_ext.ext]: <\n'
                    ' i: 23\n'
                    ' i: 24\n'
                    ' pointfloat: .3\n'
                    ' test: "test_string"\n'
                    ' floaty_float: -0.315\n'
                    ' num: -inf\n'
                    ' long_string: "test" "test2" \n'
                    ' >\n'
                    ' }\n'
                    ' }\n'
                    ' [unknown_extension]: 5\n'
                    ' [unknown_extension_with_number_field] {\n'
                    ' 1: "some_field"\n'
                    ' 2: -0.451\n'
                    ' }\n'
                    '}\n')
    text_format.Parse(unknown_text, container, allow_unknown_extension=True)
    # Nothing from the unknown extensions is retained in the printed message.
    self.CompareToGoldenText(
        text_format.MessageToString(container), 'message_set {\n}\n')

    # Catch parse errors in unknown extension.
    assert_rejected(
        ('message_set {\n'
         ' [unknown_extension] {\n'
         ' i:\n'  # Missing value.
         ' }\n'
         '}\n'),
        'Invalid field value: }')
    assert_rejected(
        ('message_set {\n'
         ' [unknown_extension] {\n'
         ' str: "malformed string\n'  # Missing closing quote.
         ' }\n'
         '}\n'),
        'Invalid field value: "')
    assert_rejected(
        ('message_set {\n'
         ' [unknown_extension] {\n'
         ' str: "malformed\n multiline\n string\n'
         ' }\n'
         '}\n'),
        'Invalid field value: "')
    assert_rejected(
        ('message_set {\n'
         ' [malformed_extension] <\n'
         ' i: -5\n'
         ' \n'  # Missing '>' here.
         '}\n'),
        '5:1 : \'}\': Expected ">".')

    # Don't allow unknown fields with allow_unknown_extension=True.
    assert_rejected(
        ('message_set {\n'
         ' unknown_field: true\n'
         '}\n'),
        ('2:3 : Message type '
         '"proto2_wireformat_unittest.TestMessageSet" has no'
         ' field named "unknown_field".'))

    # Parse known extension correctly.
    container = unittest_mset_pb2.TestMessageSetContainer()
    known_text = ('message_set {\n'
                  ' [protobuf_unittest.TestMessageSetExtension1] {\n'
                  ' i: 23\n'
                  ' }\n'
                  ' [protobuf_unittest.TestMessageSetExtension2] {\n'
                  ' str: \"foo\"\n'
                  ' }\n'
                  '}\n')
    text_format.Parse(known_text, container, allow_unknown_extension=True)
    first_ext = unittest_mset_pb2.TestMessageSetExtension1.message_set_extension
    second_ext = (
        unittest_mset_pb2.TestMessageSetExtension2.message_set_extension)
    self.assertEqual(23, container.message_set.Extensions[first_ext].i)
    self.assertEqual('foo', container.message_set.Extensions[second_ext].str)
  def testParseBadIdentifier(self):
    """A quoted field name must be rejected with a precise error message."""
    bad_text = ('optional_nested_message { "bb": 1 }')
    target = unittest_pb2.TestAllTypes()
    with self.assertRaises(text_format.ParseError) as caught:
      text_format.Parse(bad_text, target)
    expected_error = ('1:27 : \'optional_nested_message { "bb": 1 }\': '
                      'Expected identifier or number, got "bb".')
    self.assertEqual(str(caught.exception), expected_error)
  def testParseBadExtension(self):
    """Unknown extensions fail on extendable and non-extendable messages."""
    extension_text = '[unknown_extension]: 8\n'

    # Extendable message: the extension name is simply not registered.
    extendable = unittest_pb2.TestAllExtensions()
    with six.assertRaisesRegex(
        self, text_format.ParseError,
        '1:2 : Extension "unknown_extension" not registered.'):
      text_format.Parse(extension_text, extendable)

    # Message type without extensions: a different error is expected.
    plain = unittest_pb2.TestAllTypes()
    with six.assertRaisesRegex(
        self, text_format.ParseError,
        ('1:2 : Message type "protobuf_unittest.TestAllTypes" does not have '
         'extensions.')):
      text_format.Parse(extension_text, plain)
  def testParseNumericUnknownEnum(self):
    """A numeric enum value with no matching enumerator is a parse error."""
    target = unittest_pb2.TestAllTypes()
    error_regex = (r'1:23 : \'optional_nested_enum: 100\': '
                   r'Enum type "\w+.TestAllTypes.NestedEnum" '
                   r'has no value with number 100.')
    with six.assertRaisesRegex(self, text_format.ParseError, error_regex):
      text_format.Parse('optional_nested_enum: 100', target)
  def testMergeDuplicateExtensionScalars(self):
    """Merge() accepts a repeated scalar extension; the last value wins."""
    duplicated = ('[protobuf_unittest.optional_int32_extension]: 42 '
                  '[protobuf_unittest.optional_int32_extension]: 67')
    target = unittest_pb2.TestAllExtensions()
    text_format.Merge(duplicated, target)
    merged_value = target.Extensions[unittest_pb2.optional_int32_extension]
    self.assertEqual(67, merged_value)
  def testParseDuplicateExtensionScalars(self):
    """Parse() rejects a scalar extension that appears twice."""
    duplicated = ('[protobuf_unittest.optional_int32_extension]: 42 '
                  '[protobuf_unittest.optional_int32_extension]: 67')
    target = unittest_pb2.TestAllExtensions()
    error_regex = (
        '1:96 : Message type "protobuf_unittest.TestAllExtensions" '
        'should not have multiple '
        '"protobuf_unittest.optional_int32_extension" extensions.')
    with six.assertRaisesRegex(self, text_format.ParseError, error_regex):
      text_format.Parse(duplicated, target)
  def testParseDuplicateExtensionMessages(self):
    """Parse() rejects a message extension that appears twice."""
    duplicated = ('[protobuf_unittest.optional_nested_message_extension]: {} '
                  '[protobuf_unittest.optional_nested_message_extension]: {}')
    target = unittest_pb2.TestAllExtensions()
    error_regex = (
        '1:114 : Message type "protobuf_unittest.TestAllExtensions" '
        'should not have multiple '
        '"protobuf_unittest.optional_nested_message_extension" extensions.')
    with six.assertRaisesRegex(self, text_format.ParseError, error_regex):
      text_format.Parse(duplicated, target)
  def testParseGroupNotClosed(self):
    """An unterminated group reports which closing token was expected."""
    target = unittest_pb2.TestAllTypes()
    # (input text, expected error regex) for each opening-bracket flavour.
    unclosed_cases = (
        ('RepeatedGroup: <', '1:16 : Expected ">".'),
        ('RepeatedGroup: {', '1:16 : Expected "}".'),
    )
    for unclosed_text, error_regex in unclosed_cases:
      with six.assertRaisesRegex(self, text_format.ParseError, error_regex):
        text_format.Parse(unclosed_text, target)
  def testParseEmptyGroup(self):
    """An empty group marks the field as present, for both bracket styles."""
    curly = unittest_pb2.TestAllTypes()
    text_format.Parse('OptionalGroup: {}', curly)
    self.assertTrue(curly.HasField('optionalgroup'))
    curly.Clear()

    # Second pass uses a brand-new message and the pointy-bracket spelling.
    pointy = unittest_pb2.TestAllTypes()
    text_format.Parse('OptionalGroup: <>', pointy)
    self.assertTrue(pointy.HasField('optionalgroup'))
  # Maps aren't really proto2-only, but our test schema only has maps for
  # proto2.
  def testParseMap(self):
    """Parses one entry into each of several map fields and reads them back."""
    map_text = ('map_int32_int32 {\n'
                ' key: -123\n'
                ' value: -456\n'
                '}\n'
                'map_int64_int64 {\n'
                ' key: -8589934592\n'
                ' value: -17179869184\n'
                '}\n'
                'map_uint32_uint32 {\n'
                ' key: 123\n'
                ' value: 456\n'
                '}\n'
                'map_uint64_uint64 {\n'
                ' key: 8589934592\n'
                ' value: 17179869184\n'
                '}\n'
                'map_string_string {\n'
                ' key: "abc"\n'
                ' value: "123"\n'
                '}\n'
                'map_int32_foreign_message {\n'
                ' key: 111\n'
                ' value {\n'
                ' c: 5\n'
                ' }\n'
                '}\n')
    parsed = map_unittest_pb2.TestMap()
    text_format.Parse(map_text, parsed)

    # 8589934592 == 2**33 and 17179869184 == 2**34.
    self.assertEqual(-456, parsed.map_int32_int32[-123])
    self.assertEqual(-2**34, parsed.map_int64_int64[-2**33])
    self.assertEqual(456, parsed.map_uint32_uint32[123])
    self.assertEqual(2**34, parsed.map_uint64_uint64[2**33])
    self.assertEqual('123', parsed.map_string_string['abc'])
    self.assertEqual(5, parsed.map_int32_foreign_message[111].c)
  1479. class Proto3Tests(unittest.TestCase):
  1480. def testPrintMessageExpandAny(self):
  1481. packed_message = unittest_pb2.OneString()
  1482. packed_message.data = 'string'
  1483. message = any_test_pb2.TestAny()
  1484. message.any_value.Pack(packed_message)
  1485. self.assertEqual(
  1486. text_format.MessageToString(message,
  1487. descriptor_pool=descriptor_pool.Default()),
  1488. 'any_value {\n'
  1489. ' [type.googleapis.com/protobuf_unittest.OneString] {\n'
  1490. ' data: "string"\n'
  1491. ' }\n'
  1492. '}\n')
  1493. def testTopAnyMessage(self):
  1494. packed_msg = unittest_pb2.OneString()
  1495. msg = any_pb2.Any()
  1496. msg.Pack(packed_msg)
  1497. text = text_format.MessageToString(msg)
  1498. other_msg = text_format.Parse(text, any_pb2.Any())
  1499. self.assertEqual(msg, other_msg)
  1500. def testPrintMessageExpandAnyRepeated(self):
  1501. packed_message = unittest_pb2.OneString()
  1502. message = any_test_pb2.TestAny()
  1503. packed_message.data = 'string0'
  1504. message.repeated_any_value.add().Pack(packed_message)
  1505. packed_message.data = 'string1'
  1506. message.repeated_any_value.add().Pack(packed_message)
  1507. self.assertEqual(
  1508. text_format.MessageToString(message),
  1509. 'repeated_any_value {\n'
  1510. ' [type.googleapis.com/protobuf_unittest.OneString] {\n'
  1511. ' data: "string0"\n'
  1512. ' }\n'
  1513. '}\n'
  1514. 'repeated_any_value {\n'
  1515. ' [type.googleapis.com/protobuf_unittest.OneString] {\n'
  1516. ' data: "string1"\n'
  1517. ' }\n'
  1518. '}\n')
  1519. def testPrintMessageExpandAnyDescriptorPoolMissingType(self):
  1520. packed_message = unittest_pb2.OneString()
  1521. packed_message.data = 'string'
  1522. message = any_test_pb2.TestAny()
  1523. message.any_value.Pack(packed_message)
  1524. empty_pool = descriptor_pool.DescriptorPool()
  1525. self.assertEqual(
  1526. text_format.MessageToString(message, descriptor_pool=empty_pool),
  1527. 'any_value {\n'
  1528. ' type_url: "type.googleapis.com/protobuf_unittest.OneString"\n'
  1529. ' value: "\\n\\006string"\n'
  1530. '}\n')
  1531. def testPrintMessageExpandAnyPointyBrackets(self):
  1532. packed_message = unittest_pb2.OneString()
  1533. packed_message.data = 'string'
  1534. message = any_test_pb2.TestAny()
  1535. message.any_value.Pack(packed_message)
  1536. self.assertEqual(
  1537. text_format.MessageToString(message,
  1538. pointy_brackets=True),
  1539. 'any_value <\n'
  1540. ' [type.googleapis.com/protobuf_unittest.OneString] <\n'
  1541. ' data: "string"\n'
  1542. ' >\n'
  1543. '>\n')
  1544. def testPrintMessageExpandAnyAsOneLine(self):
  1545. packed_message = unittest_pb2.OneString()
  1546. packed_message.data = 'string'
  1547. message = any_test_pb2.TestAny()
  1548. message.any_value.Pack(packed_message)
  1549. self.assertEqual(
  1550. text_format.MessageToString(message,
  1551. as_one_line=True),
  1552. 'any_value {'
  1553. ' [type.googleapis.com/protobuf_unittest.OneString]'
  1554. ' { data: "string" } '
  1555. '}')
  1556. def testPrintMessageExpandAnyAsOneLinePointyBrackets(self):
  1557. packed_message = unittest_pb2.OneString()
  1558. packed_message.data = 'string'
  1559. message = any_test_pb2.TestAny()
  1560. message.any_value.Pack(packed_message)
  1561. self.assertEqual(
  1562. text_format.MessageToString(message,
  1563. as_one_line=True,
  1564. pointy_brackets=True,
  1565. descriptor_pool=descriptor_pool.Default()),
  1566. 'any_value <'
  1567. ' [type.googleapis.com/protobuf_unittest.OneString]'
  1568. ' < data: "string" > '
  1569. '>')
  1570. def testPrintAndParseMessageInvalidAny(self):
  1571. packed_message = unittest_pb2.OneString()
  1572. packed_message.data = 'string'
  1573. message = any_test_pb2.TestAny()
  1574. message.any_value.Pack(packed_message)
  1575. # Only include string after last '/' in type_url.
  1576. message.any_value.type_url = message.any_value.TypeName()
  1577. text = text_format.MessageToString(message)
  1578. self.assertEqual(
  1579. text, 'any_value {\n'
  1580. ' type_url: "protobuf_unittest.OneString"\n'
  1581. ' value: "\\n\\006string"\n'
  1582. '}\n')
  1583. parsed_message = any_test_pb2.TestAny()
  1584. text_format.Parse(text, parsed_message)
  1585. self.assertEqual(message, parsed_message)
  1586. def testUnknownEnums(self):
  1587. message = unittest_proto3_arena_pb2.TestAllTypes()
  1588. message2 = unittest_proto3_arena_pb2.TestAllTypes()
  1589. message.optional_nested_enum = 999
  1590. text_string = text_format.MessageToString(message)
  1591. text_format.Parse(text_string, message2)
  1592. self.assertEqual(999, message2.optional_nested_enum)
  1593. def testMergeExpandedAny(self):
  1594. message = any_test_pb2.TestAny()
  1595. text = ('any_value {\n'
  1596. ' [type.googleapis.com/protobuf_unittest.OneString] {\n'
  1597. ' data: "string"\n'
  1598. ' }\n'
  1599. '}\n')
  1600. text_format.Merge(text, message)
  1601. packed_message = unittest_pb2.OneString()
  1602. message.any_value.Unpack(packed_message)
  1603. self.assertEqual('string', packed_message.data)
  1604. message.Clear()
  1605. text_format.Parse(text, message)
  1606. packed_message = unittest_pb2.OneString()
  1607. message.any_value.Unpack(packed_message)
  1608. self.assertEqual('string', packed_message.data)
  1609. def testMergeExpandedAnyRepeated(self):
  1610. message = any_test_pb2.TestAny()
  1611. text = ('repeated_any_value {\n'
  1612. ' [type.googleapis.com/protobuf_unittest.OneString] {\n'
  1613. ' data: "string0"\n'
  1614. ' }\n'
  1615. '}\n'
  1616. 'repeated_any_value {\n'
  1617. ' [type.googleapis.com/protobuf_unittest.OneString] {\n'
  1618. ' data: "string1"\n'
  1619. ' }\n'
  1620. '}\n')
  1621. text_format.Merge(text, message)
  1622. packed_message = unittest_pb2.OneString()
  1623. message.repeated_any_value[0].Unpack(packed_message)
  1624. self.assertEqual('string0', packed_message.data)
  1625. message.repeated_any_value[1].Unpack(packed_message)
  1626. self.assertEqual('string1', packed_message.data)
  1627. def testMergeExpandedAnyPointyBrackets(self):
  1628. message = any_test_pb2.TestAny()
  1629. text = ('any_value {\n'
  1630. ' [type.googleapis.com/protobuf_unittest.OneString] <\n'
  1631. ' data: "string"\n'
  1632. ' >\n'
  1633. '}\n')
  1634. text_format.Merge(text, message)
  1635. packed_message = unittest_pb2.OneString()
  1636. message.any_value.Unpack(packed_message)
  1637. self.assertEqual('string', packed_message.data)
  1638. def testMergeAlternativeUrl(self):
  1639. message = any_test_pb2.TestAny()
  1640. text = ('any_value {\n'
  1641. ' [type.otherapi.com/protobuf_unittest.OneString] {\n'
  1642. ' data: "string"\n'
  1643. ' }\n'
  1644. '}\n')
  1645. text_format.Merge(text, message)
  1646. packed_message = unittest_pb2.OneString()
  1647. self.assertEqual('type.otherapi.com/protobuf_unittest.OneString',
  1648. message.any_value.type_url)
  1649. def testMergeExpandedAnyDescriptorPoolMissingType(self):
  1650. message = any_test_pb2.TestAny()
  1651. text = ('any_value {\n'
  1652. ' [type.googleapis.com/protobuf_unittest.OneString] {\n'
  1653. ' data: "string"\n'
  1654. ' }\n'
  1655. '}\n')
  1656. with self.assertRaises(text_format.ParseError) as e:
  1657. empty_pool = descriptor_pool.DescriptorPool()
  1658. text_format.Merge(text, message, descriptor_pool=empty_pool)
  1659. self.assertEqual(
  1660. str(e.exception),
  1661. 'Type protobuf_unittest.OneString not found in descriptor pool')
  1662. def testMergeUnexpandedAny(self):
  1663. text = ('any_value {\n'
  1664. ' type_url: "type.googleapis.com/protobuf_unittest.OneString"\n'
  1665. ' value: "\\n\\006string"\n'
  1666. '}\n')
  1667. message = any_test_pb2.TestAny()
  1668. text_format.Merge(text, message)
  1669. packed_message = unittest_pb2.OneString()
  1670. message.any_value.Unpack(packed_message)
  1671. self.assertEqual('string', packed_message.data)
  1672. def testMergeMissingAnyEndToken(self):
  1673. message = any_test_pb2.TestAny()
  1674. text = ('any_value {\n'
  1675. ' [type.googleapis.com/protobuf_unittest.OneString] {\n'
  1676. ' data: "string"\n')
  1677. with self.assertRaises(text_format.ParseError) as e:
  1678. text_format.Merge(text, message)
  1679. self.assertEqual(str(e.exception), '3:11 : Expected "}".')
  1680. class TokenizerTest(unittest.TestCase):
  1681. def testSimpleTokenCases(self):
  1682. text = ('identifier1:"string1"\n \n\n'
  1683. 'identifier2 : \n \n123 \n identifier3 :\'string\'\n'
  1684. 'identifiER_4 : 1.1e+2 ID5:-0.23 ID6:\'aaaa\\\'bbbb\'\n'
  1685. 'ID7 : "aa\\"bb"\n\n\n\n ID8: {A:inf B:-inf C:true D:false}\n'
  1686. 'ID9: 22 ID10: -111111111111111111 ID11: -22\n'
  1687. 'ID12: 2222222222222222222 ID13: 1.23456f ID14: 1.2e+2f '
  1688. 'false_bool: 0 true_BOOL:t \n true_bool1: 1 false_BOOL1:f '
  1689. 'False_bool: False True_bool: True X:iNf Y:-inF Z:nAN')
  1690. tokenizer = text_format.Tokenizer(text.splitlines())
  1691. methods = [(tokenizer.ConsumeIdentifier, 'identifier1'), ':',
  1692. (tokenizer.ConsumeString, 'string1'),
  1693. (tokenizer.ConsumeIdentifier, 'identifier2'), ':',
  1694. (tokenizer.ConsumeInteger, 123),
  1695. (tokenizer.ConsumeIdentifier, 'identifier3'), ':',
  1696. (tokenizer.ConsumeString, 'string'),
  1697. (tokenizer.ConsumeIdentifier, 'identifiER_4'), ':',
  1698. (tokenizer.ConsumeFloat, 1.1e+2),
  1699. (tokenizer.ConsumeIdentifier, 'ID5'), ':',
  1700. (tokenizer.ConsumeFloat, -0.23),
  1701. (tokenizer.ConsumeIdentifier, 'ID6'), ':',
  1702. (tokenizer.ConsumeString, 'aaaa\'bbbb'),
  1703. (tokenizer.ConsumeIdentifier, 'ID7'), ':',
  1704. (tokenizer.ConsumeString, 'aa\"bb'),
  1705. (tokenizer.ConsumeIdentifier, 'ID8'), ':', '{',
  1706. (tokenizer.ConsumeIdentifier, 'A'), ':',
  1707. (tokenizer.ConsumeFloat, float('inf')),
  1708. (tokenizer.ConsumeIdentifier, 'B'), ':',
  1709. (tokenizer.ConsumeFloat, -float('inf')),
  1710. (tokenizer.ConsumeIdentifier, 'C'), ':',
  1711. (tokenizer.ConsumeBool, True),
  1712. (tokenizer.ConsumeIdentifier, 'D'), ':',
  1713. (tokenizer.ConsumeBool, False), '}',
  1714. (tokenizer.ConsumeIdentifier, 'ID9'), ':',
  1715. (tokenizer.ConsumeInteger, 22),
  1716. (tokenizer.ConsumeIdentifier, 'ID10'), ':',
  1717. (tokenizer.ConsumeInteger, -111111111111111111),
  1718. (tokenizer.ConsumeIdentifier, 'ID11'), ':',
  1719. (tokenizer.ConsumeInteger, -22),
  1720. (tokenizer.ConsumeIdentifier, 'ID12'), ':',
  1721. (tokenizer.ConsumeInteger, 2222222222222222222),
  1722. (tokenizer.ConsumeIdentifier, 'ID13'), ':',
  1723. (tokenizer.ConsumeFloat, 1.23456),
  1724. (tokenizer.ConsumeIdentifier, 'ID14'), ':',
  1725. (tokenizer.ConsumeFloat, 1.2e+2),
  1726. (tokenizer.ConsumeIdentifier, 'false_bool'), ':',
  1727. (tokenizer.ConsumeBool, False),
  1728. (tokenizer.ConsumeIdentifier, 'true_BOOL'), ':',
  1729. (tokenizer.ConsumeBool, True),
  1730. (tokenizer.ConsumeIdentifier, 'true_bool1'), ':',
  1731. (tokenizer.ConsumeBool, True),
  1732. (tokenizer.ConsumeIdentifier, 'false_BOOL1'), ':',
  1733. (tokenizer.ConsumeBool, False),
  1734. (tokenizer.ConsumeIdentifier, 'False_bool'), ':',
  1735. (tokenizer.ConsumeBool, False),
  1736. (tokenizer.ConsumeIdentifier, 'True_bool'), ':',
  1737. (tokenizer.ConsumeBool, True),
  1738. (tokenizer.ConsumeIdentifier, 'X'), ':',
  1739. (tokenizer.ConsumeFloat, float('inf')),
  1740. (tokenizer.ConsumeIdentifier, 'Y'), ':',
  1741. (tokenizer.ConsumeFloat, float('-inf')),
  1742. (tokenizer.ConsumeIdentifier, 'Z'), ':',
  1743. (tokenizer.ConsumeFloat, float('nan'))]
  1744. i = 0
  1745. while not tokenizer.AtEnd():
  1746. m = methods[i]
  1747. if isinstance(m, str):
  1748. token = tokenizer.token
  1749. self.assertEqual(token, m)
  1750. tokenizer.NextToken()
  1751. elif isinstance(m[1], float) and math.isnan(m[1]):
  1752. self.assertTrue(math.isnan(m[0]()))
  1753. else:
  1754. self.assertEqual(m[1], m[0]())
  1755. i += 1
  1756. def testConsumeAbstractIntegers(self):
  1757. # This test only tests the failures in the integer parsing methods as well
  1758. # as the '0' special cases.
  1759. int64_max = (1 << 63) - 1
  1760. uint32_max = (1 << 32) - 1
  1761. text = '-1 %d %d' % (uint32_max + 1, int64_max + 1)
  1762. tokenizer = text_format.Tokenizer(text.splitlines())
  1763. self.assertEqual(-1, tokenizer.ConsumeInteger())
  1764. self.assertEqual(uint32_max + 1, tokenizer.ConsumeInteger())
  1765. self.assertEqual(int64_max + 1, tokenizer.ConsumeInteger())
  1766. self.assertTrue(tokenizer.AtEnd())
  1767. text = '-0 0 0 1.2'
  1768. tokenizer = text_format.Tokenizer(text.splitlines())
  1769. self.assertEqual(0, tokenizer.ConsumeInteger())
  1770. self.assertEqual(0, tokenizer.ConsumeInteger())
  1771. self.assertEqual(True, tokenizer.TryConsumeInteger())
  1772. self.assertEqual(False, tokenizer.TryConsumeInteger())
  1773. with self.assertRaises(text_format.ParseError):
  1774. tokenizer.ConsumeInteger()
  1775. self.assertEqual(1.2, tokenizer.ConsumeFloat())
  1776. self.assertTrue(tokenizer.AtEnd())
  1777. def testConsumeIntegers(self):
  1778. # This test only tests the failures in the integer parsing methods as well
  1779. # as the '0' special cases.
  1780. int64_max = (1 << 63) - 1
  1781. uint32_max = (1 << 32) - 1
  1782. text = '-1 %d %d' % (uint32_max + 1, int64_max + 1)
  1783. tokenizer = text_format.Tokenizer(text.splitlines())
  1784. self.assertRaises(text_format.ParseError,
  1785. text_format._ConsumeUint32, tokenizer)
  1786. self.assertRaises(text_format.ParseError,
  1787. text_format._ConsumeUint64, tokenizer)
  1788. self.assertEqual(-1, text_format._ConsumeInt32(tokenizer))
  1789. self.assertRaises(text_format.ParseError,
  1790. text_format._ConsumeUint32, tokenizer)
  1791. self.assertRaises(text_format.ParseError,
  1792. text_format._ConsumeInt32, tokenizer)
  1793. self.assertEqual(uint32_max + 1, text_format._ConsumeInt64(tokenizer))
  1794. self.assertRaises(text_format.ParseError,
  1795. text_format._ConsumeInt64, tokenizer)
  1796. self.assertEqual(int64_max + 1, text_format._ConsumeUint64(tokenizer))
  1797. self.assertTrue(tokenizer.AtEnd())
  1798. text = '-0 -0 0 0'
  1799. tokenizer = text_format.Tokenizer(text.splitlines())
  1800. self.assertEqual(0, text_format._ConsumeUint32(tokenizer))
  1801. self.assertEqual(0, text_format._ConsumeUint64(tokenizer))
  1802. self.assertEqual(0, text_format._ConsumeUint32(tokenizer))
  1803. self.assertEqual(0, text_format._ConsumeUint64(tokenizer))
  1804. self.assertTrue(tokenizer.AtEnd())
  1805. def testConsumeOctalIntegers(self):
  1806. """Test support for C style octal integers."""
  1807. text = '00 -00 04 0755 -010 007 -0033 08 -09 01'
  1808. tokenizer = text_format.Tokenizer(text.splitlines())
  1809. self.assertEqual(0, tokenizer.ConsumeInteger())
  1810. self.assertEqual(0, tokenizer.ConsumeInteger())
  1811. self.assertEqual(4, tokenizer.ConsumeInteger())
  1812. self.assertEqual(0o755, tokenizer.ConsumeInteger())
  1813. self.assertEqual(-0o10, tokenizer.ConsumeInteger())
  1814. self.assertEqual(7, tokenizer.ConsumeInteger())
  1815. self.assertEqual(-0o033, tokenizer.ConsumeInteger())
  1816. with self.assertRaises(text_format.ParseError):
  1817. tokenizer.ConsumeInteger() # 08
  1818. tokenizer.NextToken()
  1819. with self.assertRaises(text_format.ParseError):
  1820. tokenizer.ConsumeInteger() # -09
  1821. tokenizer.NextToken()
  1822. self.assertEqual(1, tokenizer.ConsumeInteger())
  1823. self.assertTrue(tokenizer.AtEnd())
  1824. def testConsumeByteString(self):
  1825. text = '"string1\''
  1826. tokenizer = text_format.Tokenizer(text.splitlines())
  1827. self.assertRaises(text_format.ParseError, tokenizer.ConsumeByteString)
  1828. text = 'string1"'
  1829. tokenizer = text_format.Tokenizer(text.splitlines())
  1830. self.assertRaises(text_format.ParseError, tokenizer.ConsumeByteString)
  1831. text = '\n"\\xt"'
  1832. tokenizer = text_format.Tokenizer(text.splitlines())
  1833. self.assertRaises(text_format.ParseError, tokenizer.ConsumeByteString)
  1834. text = '\n"\\"'
  1835. tokenizer = text_format.Tokenizer(text.splitlines())
  1836. self.assertRaises(text_format.ParseError, tokenizer.ConsumeByteString)
  1837. text = '\n"\\x"'
  1838. tokenizer = text_format.Tokenizer(text.splitlines())
  1839. self.assertRaises(text_format.ParseError, tokenizer.ConsumeByteString)
  1840. def testConsumeBool(self):
  1841. text = 'not-a-bool'
  1842. tokenizer = text_format.Tokenizer(text.splitlines())
  1843. self.assertRaises(text_format.ParseError, tokenizer.ConsumeBool)
  1844. def testSkipComment(self):
  1845. tokenizer = text_format.Tokenizer('# some comment'.splitlines())
  1846. self.assertTrue(tokenizer.AtEnd())
  1847. self.assertRaises(text_format.ParseError, tokenizer.ConsumeComment)
  1848. def testConsumeComment(self):
  1849. tokenizer = text_format.Tokenizer('# some comment'.splitlines(),
  1850. skip_comments=False)
  1851. self.assertFalse(tokenizer.AtEnd())
  1852. self.assertEqual('# some comment', tokenizer.ConsumeComment())
  1853. self.assertTrue(tokenizer.AtEnd())
  1854. def testConsumeTwoComments(self):
  1855. text = '# some comment\n# another comment'
  1856. tokenizer = text_format.Tokenizer(text.splitlines(), skip_comments=False)
  1857. self.assertEqual('# some comment', tokenizer.ConsumeComment())
  1858. self.assertFalse(tokenizer.AtEnd())
  1859. self.assertEqual('# another comment', tokenizer.ConsumeComment())
  1860. self.assertTrue(tokenizer.AtEnd())
  1861. def testConsumeTrailingComment(self):
  1862. text = 'some_number: 4\n# some comment'
  1863. tokenizer = text_format.Tokenizer(text.splitlines(), skip_comments=False)
  1864. self.assertRaises(text_format.ParseError, tokenizer.ConsumeComment)
  1865. self.assertEqual('some_number', tokenizer.ConsumeIdentifier())
  1866. self.assertEqual(tokenizer.token, ':')
  1867. tokenizer.NextToken()
  1868. self.assertRaises(text_format.ParseError, tokenizer.ConsumeComment)
  1869. self.assertEqual(4, tokenizer.ConsumeInteger())
  1870. self.assertFalse(tokenizer.AtEnd())
  1871. self.assertEqual('# some comment', tokenizer.ConsumeComment())
  1872. self.assertTrue(tokenizer.AtEnd())
  1873. def testConsumeLineComment(self):
  1874. tokenizer = text_format.Tokenizer('# some comment'.splitlines(),
  1875. skip_comments=False)
  1876. self.assertFalse(tokenizer.AtEnd())
  1877. self.assertEqual((False, '# some comment'),
  1878. tokenizer.ConsumeCommentOrTrailingComment())
  1879. self.assertTrue(tokenizer.AtEnd())
  1880. def testConsumeTwoLineComments(self):
  1881. text = '# some comment\n# another comment'
  1882. tokenizer = text_format.Tokenizer(text.splitlines(), skip_comments=False)
  1883. self.assertEqual((False, '# some comment'),
  1884. tokenizer.ConsumeCommentOrTrailingComment())
  1885. self.assertFalse(tokenizer.AtEnd())
  1886. self.assertEqual((False, '# another comment'),
  1887. tokenizer.ConsumeCommentOrTrailingComment())
  1888. self.assertTrue(tokenizer.AtEnd())
  1889. def testConsumeAndCheckTrailingComment(self):
  1890. text = 'some_number: 4 # some comment' # trailing comment on the same line
  1891. tokenizer = text_format.Tokenizer(text.splitlines(), skip_comments=False)
  1892. self.assertRaises(text_format.ParseError,
  1893. tokenizer.ConsumeCommentOrTrailingComment)
  1894. self.assertEqual('some_number', tokenizer.ConsumeIdentifier())
  1895. self.assertEqual(tokenizer.token, ':')
  1896. tokenizer.NextToken()
  1897. self.assertRaises(text_format.ParseError,
  1898. tokenizer.ConsumeCommentOrTrailingComment)
  1899. self.assertEqual(4, tokenizer.ConsumeInteger())
  1900. self.assertFalse(tokenizer.AtEnd())
  1901. self.assertEqual((True, '# some comment'),
  1902. tokenizer.ConsumeCommentOrTrailingComment())
  1903. self.assertTrue(tokenizer.AtEnd())
  1904. def testHashinComment(self):
  1905. text = 'some_number: 4 # some comment # not a new comment'
  1906. tokenizer = text_format.Tokenizer(text.splitlines(), skip_comments=False)
  1907. self.assertEqual('some_number', tokenizer.ConsumeIdentifier())
  1908. self.assertEqual(tokenizer.token, ':')
  1909. tokenizer.NextToken()
  1910. self.assertEqual(4, tokenizer.ConsumeInteger())
  1911. self.assertEqual((True, '# some comment # not a new comment'),
  1912. tokenizer.ConsumeCommentOrTrailingComment())
  1913. self.assertTrue(tokenizer.AtEnd())
  1914. def testHugeString(self):
  1915. # With pathologic backtracking, fails with Forge OOM.
  1916. text = '"' + 'a' * (10 * 1024 * 1024) + '"'
  1917. tokenizer = text_format.Tokenizer(text.splitlines(), skip_comments=False)
  1918. tokenizer.ConsumeString()
  1919. # Tests for pretty printer functionality.
  @_parameterized.parameters((unittest_pb2), (unittest_proto3_arena_pb2))
  class PrettyPrinterTest(TextFormatBase):
    """Tests for the message_formatter hook of the text_format printers.

    Each test takes the message_module supplied by the class-level
    parameters decorator. A formatter is called as
    formatter(message, indent, as_one_line) and returns either replacement
    text for the message or None to keep the default rendering.
    """

    def testPrettyPrintNoMatch(self, message_module):
      """A formatter that always returns None leaves the output unchanged."""

      def printer(message, indent, as_one_line):
        del message, indent, as_one_line  # Unused.
        return None

      message = message_module.TestAllTypes()
      msg = message.repeated_nested_message.add()
      msg.bb = 42
      self.CompareToGoldenText(
          text_format.MessageToString(
              message, as_one_line=True, message_formatter=printer),
          'repeated_nested_message { bb: 42 }')

    def testPrettyPrintOneLine(self, message_module):
      """In one-line mode the formatter text replaces the nested body."""
      nested_descriptor = message_module.TestAllTypes.NestedMessage.DESCRIPTOR

      def printer(m, indent, as_one_line):
        del indent, as_one_line  # Unused.
        if m.DESCRIPTOR == nested_descriptor:
          return 'My lucky number is %s' % m.bb
        # Explicit fall-through, matching the other formatters in this class.
        return None

      message = message_module.TestAllTypes()
      msg = message.repeated_nested_message.add()
      msg.bb = 42
      self.CompareToGoldenText(
          text_format.MessageToString(
              message, as_one_line=True, message_formatter=printer),
          'repeated_nested_message { My lucky number is 42 }')

    def testPrettyPrintMultiLine(self, message_module):
      """A formatter may emit several lines, using the indent it is given."""
      nested_descriptor = message_module.TestAllTypes.NestedMessage.DESCRIPTOR

      def printer(m, indent, as_one_line):
        if m.DESCRIPTOR == nested_descriptor:
          # Continuation lines are the formatter's job to indent.
          line_delimiter = (' ' if as_one_line else '\n') + ' ' * indent
          return 'My lucky number is:%s%s' % (line_delimiter, m.bb)
        return None

      message = message_module.TestAllTypes()
      msg = message.repeated_nested_message.add()
      msg.bb = 42
      self.CompareToGoldenText(
          text_format.MessageToString(
              message, as_one_line=True, message_formatter=printer),
          'repeated_nested_message { My lucky number is: 42 }')
      # Multi-line output nests the message body by two spaces.
      self.CompareToGoldenText(
          text_format.MessageToString(
              message, as_one_line=False, message_formatter=printer),
          'repeated_nested_message {\n  My lucky number is:\n  42\n}\n')

    def testPrettyPrintEntireMessage(self, message_module):
      """A formatter matching the top-level message replaces all output."""

      def printer(m, indent, as_one_line):
        del indent, as_one_line  # Unused.
        if m.DESCRIPTOR == message_module.TestAllTypes.DESCRIPTOR:
          return 'The is the message!'
        return None

      message = message_module.TestAllTypes()
      self.CompareToGoldenText(
          text_format.MessageToString(
              message, as_one_line=False, message_formatter=printer),
          'The is the message!\n')
      self.CompareToGoldenText(
          text_format.MessageToString(
              message, as_one_line=True, message_formatter=printer),
          'The is the message!')

    def testPrettyPrintMultipleParts(self, message_module):
      """The formatter is applied to every nested message that it matches.

      Covers MessageToString as well as the lower-level PrintField and
      PrintFieldValue entry points.
      """
      nested_descriptor = message_module.TestAllTypes.NestedMessage.DESCRIPTOR

      def printer(m, indent, as_one_line):
        del indent, as_one_line  # Unused.
        if m.DESCRIPTOR == nested_descriptor:
          return 'My lucky number is %s' % m.bb
        return None

      message = message_module.TestAllTypes()
      message.optional_int32 = 61
      msg = message.repeated_nested_message.add()
      msg.bb = 42
      msg = message.repeated_nested_message.add()
      msg.bb = 99
      msg = message.optional_nested_message
      msg.bb = 1
      self.CompareToGoldenText(
          text_format.MessageToString(
              message, as_one_line=True, message_formatter=printer),
          ('optional_int32: 61 '
           'optional_nested_message { My lucky number is 1 } '
           'repeated_nested_message { My lucky number is 42 } '
           'repeated_nested_message { My lucky number is 99 }'))

      nested_field = message_module.TestAllTypes.DESCRIPTOR.fields_by_name[
          'optional_nested_message']

      # Register close() as a cleanup so the writer is released even when
      # the assertion below fails.
      field_out = text_format.TextWriter(False)
      self.addCleanup(field_out.close)
      text_format.PrintField(
          nested_field,
          message.optional_nested_message,
          field_out,
          message_formatter=printer)
      self.assertEqual(
          'optional_nested_message {\n  My lucky number is 1\n}\n',
          field_out.getvalue())

      value_out = text_format.TextWriter(False)
      self.addCleanup(value_out.close)
      text_format.PrintFieldValue(
          nested_field,
          message.optional_nested_message,
          value_out,
          message_formatter=printer)
      self.assertEqual(
          '{\n  My lucky number is 1\n}',
          value_out.getvalue())
  class WhitespaceTest(TextFormatBase):
    """Checks the exact whitespace emitted by each text_format print entry point.

    The fixture is a NestedTestAllTypes message whose child.payload has
    optional_string set, so the golden text has two levels of nesting.
    """

    def setUp(self):
      """Builds the shared writer, message, field descriptor and field value."""
      self.out = text_format.TextWriter(False)
      # Close the writer after each test, whether or not the test passed.
      self.addCleanup(self.out.close)
      self.message = unittest_pb2.NestedTestAllTypes()
      self.message.child.payload.optional_string = 'value'
      self.field = self.message.DESCRIPTOR.fields_by_name['child']
      self.value = self.message.child

    def testMessageToString(self):
      """MessageToString indents each nesting level by two spaces."""
      self.CompareToGoldenText(
          text_format.MessageToString(self.message),
          textwrap.dedent("""\
              child {
                payload {
                  optional_string: "value"
                }
              }
              """))

    def testPrintMessage(self):
      """PrintMessage writes the same text as MessageToString returns."""
      text_format.PrintMessage(self.message, self.out)
      self.CompareToGoldenText(
          self.out.getvalue(),
          textwrap.dedent("""\
              child {
                payload {
                  optional_string: "value"
                }
              }
              """))

    def testPrintField(self):
      """PrintField writes the field name followed by the nested body."""
      text_format.PrintField(self.field, self.value, self.out)
      self.CompareToGoldenText(
          self.out.getvalue(),
          textwrap.dedent("""\
              child {
                payload {
                  optional_string: "value"
                }
              }
              """))

    def testPrintFieldValue(self):
      """PrintFieldValue writes only the braces and body, no final newline."""
      text_format.PrintFieldValue(
          self.field, self.value, self.out)
      self.CompareToGoldenText(
          self.out.getvalue(),
          textwrap.dedent("""\
              {
                payload {
                  optional_string: "value"
                }
              }"""))
  class OptionalColonMessageToStringTest(unittest.TestCase):
    """Tests MessageToString with force_colon=True."""

    def testForcePrintOptionalColon(self):
      """With force_colon=True a ':' is printed before each message's '{'."""
      packed_message = unittest_pb2.OneString()
      packed_message.data = 'string'
      message = any_test_pb2.TestAny()
      message.any_value.Pack(packed_message)
      output = text_format.MessageToString(
          message,
          force_colon=True)
      # Each nesting level adds two spaces: the expanded Any type URL sits
      # one level deep and the packed message's field two levels deep.
      expected = ('any_value: {\n'
                  '  [type.googleapis.com/protobuf_unittest.OneString]: {\n'
                  '    data: "string"\n'
                  '  }\n'
                  '}\n')
      self.assertEqual(expected, output)
  # Run every test case in this module when the file is executed directly.
  if __name__ == '__main__':
    unittest.main()