json_format.py 31 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834
  1. # Protocol Buffers - Google's data interchange format
  2. # Copyright 2008 Google Inc. All rights reserved.
  3. # https://developers.google.com/protocol-buffers/
  4. #
  5. # Redistribution and use in source and binary forms, with or without
  6. # modification, are permitted provided that the following conditions are
  7. # met:
  8. #
  9. # * Redistributions of source code must retain the above copyright
  10. # notice, this list of conditions and the following disclaimer.
  11. # * Redistributions in binary form must reproduce the above
  12. # copyright notice, this list of conditions and the following disclaimer
  13. # in the documentation and/or other materials provided with the
  14. # distribution.
  15. # * Neither the name of Google Inc. nor the names of its
  16. # contributors may be used to endorse or promote products derived from
  17. # this software without specific prior written permission.
  18. #
  19. # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  20. # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  21. # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  22. # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  23. # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  24. # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  25. # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  26. # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  27. # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  28. # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  29. # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  30. """Contains routines for printing protocol messages in JSON format.
  31. Simple usage example:
  32. # Create a proto object and serialize it to a json format string.
  33. message = my_proto_pb2.MyMessage(foo='bar')
  34. json_string = json_format.MessageToJson(message)
  35. # Parse a json format string to proto object.
  36. message = json_format.Parse(json_string, my_proto_pb2.MyMessage())
  37. """
  38. __author__ = 'jieluo@google.com (Jie Luo)'
  39. # pylint: disable=g-statement-before-imports,g-import-not-at-top
  40. try:
  41. from collections import OrderedDict
  42. except ImportError:
  43. from ordereddict import OrderedDict # PY26
  44. # pylint: enable=g-statement-before-imports,g-import-not-at-top
  45. import base64
  46. import json
  47. import math
  48. from operator import methodcaller
  49. import re
  50. import sys
  51. import six
  52. from google.protobuf.internal import type_checkers
  53. from google.protobuf import descriptor
  54. from google.protobuf import symbol_database
  55. _TIMESTAMPFOMAT = '%Y-%m-%dT%H:%M:%S'
  56. _INT_TYPES = frozenset([descriptor.FieldDescriptor.CPPTYPE_INT32,
  57. descriptor.FieldDescriptor.CPPTYPE_UINT32,
  58. descriptor.FieldDescriptor.CPPTYPE_INT64,
  59. descriptor.FieldDescriptor.CPPTYPE_UINT64])
  60. _INT64_TYPES = frozenset([descriptor.FieldDescriptor.CPPTYPE_INT64,
  61. descriptor.FieldDescriptor.CPPTYPE_UINT64])
  62. _FLOAT_TYPES = frozenset([descriptor.FieldDescriptor.CPPTYPE_FLOAT,
  63. descriptor.FieldDescriptor.CPPTYPE_DOUBLE])
  64. _INFINITY = 'Infinity'
  65. _NEG_INFINITY = '-Infinity'
  66. _NAN = 'NaN'
  67. _UNPAIRED_SURROGATE_PATTERN = re.compile(six.u(
  68. r'[\ud800-\udbff](?![\udc00-\udfff])|(?<![\ud800-\udbff])[\udc00-\udfff]'
  69. ))
  70. _VALID_EXTENSION_NAME = re.compile(r'\[[a-zA-Z0-9\._]*\]$')
  71. class Error(Exception):
  72. """Top-level module error for json_format."""
  73. class SerializeToJsonError(Error):
  74. """Thrown if serialization to JSON fails."""
  75. class ParseError(Error):
  76. """Thrown in case of parsing error."""
  77. def MessageToJson(
  78. message,
  79. including_default_value_fields=False,
  80. preserving_proto_field_name=False,
  81. indent=2,
  82. sort_keys=False,
  83. use_integers_for_enums=False,
  84. descriptor_pool=None,
  85. float_precision=None):
  86. """Converts protobuf message to JSON format.
  87. Args:
  88. message: The protocol buffers message instance to serialize.
  89. including_default_value_fields: If True, singular primitive fields,
  90. repeated fields, and map fields will always be serialized. If
  91. False, only serialize non-empty fields. Singular message fields
  92. and oneof fields are not affected by this option.
  93. preserving_proto_field_name: If True, use the original proto field
  94. names as defined in the .proto file. If False, convert the field
  95. names to lowerCamelCase.
  96. indent: The JSON object will be pretty-printed with this indent level.
  97. An indent level of 0 or negative will only insert newlines.
  98. sort_keys: If True, then the output will be sorted by field names.
  99. use_integers_for_enums: If true, print integers instead of enum names.
  100. descriptor_pool: A Descriptor Pool for resolving types. If None use the
  101. default.
  102. float_precision: If set, use this to specify float field valid digits.
  103. Returns:
  104. A string containing the JSON formatted protocol buffer message.
  105. """
  106. printer = _Printer(
  107. including_default_value_fields,
  108. preserving_proto_field_name,
  109. use_integers_for_enums,
  110. descriptor_pool,
  111. float_precision=float_precision)
  112. return printer.ToJsonString(message, indent, sort_keys)
  113. def MessageToDict(
  114. message,
  115. including_default_value_fields=False,
  116. preserving_proto_field_name=False,
  117. use_integers_for_enums=False,
  118. descriptor_pool=None,
  119. float_precision=None):
  120. """Converts protobuf message to a dictionary.
  121. When the dictionary is encoded to JSON, it conforms to proto3 JSON spec.
  122. Args:
  123. message: The protocol buffers message instance to serialize.
  124. including_default_value_fields: If True, singular primitive fields,
  125. repeated fields, and map fields will always be serialized. If
  126. False, only serialize non-empty fields. Singular message fields
  127. and oneof fields are not affected by this option.
  128. preserving_proto_field_name: If True, use the original proto field
  129. names as defined in the .proto file. If False, convert the field
  130. names to lowerCamelCase.
  131. use_integers_for_enums: If true, print integers instead of enum names.
  132. descriptor_pool: A Descriptor Pool for resolving types. If None use the
  133. default.
  134. float_precision: If set, use this to specify float field valid digits.
  135. Returns:
  136. A dict representation of the protocol buffer message.
  137. """
  138. printer = _Printer(
  139. including_default_value_fields,
  140. preserving_proto_field_name,
  141. use_integers_for_enums,
  142. descriptor_pool,
  143. float_precision=float_precision)
  144. # pylint: disable=protected-access
  145. return printer._MessageToJsonObject(message)
  146. def _IsMapEntry(field):
  147. return (field.type == descriptor.FieldDescriptor.TYPE_MESSAGE and
  148. field.message_type.has_options and
  149. field.message_type.GetOptions().map_entry)
  150. class _Printer(object):
  151. """JSON format printer for protocol message."""
  152. def __init__(
  153. self,
  154. including_default_value_fields=False,
  155. preserving_proto_field_name=False,
  156. use_integers_for_enums=False,
  157. descriptor_pool=None,
  158. float_precision=None):
  159. self.including_default_value_fields = including_default_value_fields
  160. self.preserving_proto_field_name = preserving_proto_field_name
  161. self.use_integers_for_enums = use_integers_for_enums
  162. self.descriptor_pool = descriptor_pool
  163. # TODO(jieluo): change the float precision default to 8 valid digits.
  164. if float_precision:
  165. self.float_format = '.{}g'.format(float_precision)
  166. else:
  167. self.float_format = None
  168. def ToJsonString(self, message, indent, sort_keys):
  169. js = self._MessageToJsonObject(message)
  170. return json.dumps(js, indent=indent, sort_keys=sort_keys)
  171. def _MessageToJsonObject(self, message):
  172. """Converts message to an object according to Proto3 JSON Specification."""
  173. message_descriptor = message.DESCRIPTOR
  174. full_name = message_descriptor.full_name
  175. if _IsWrapperMessage(message_descriptor):
  176. return self._WrapperMessageToJsonObject(message)
  177. if full_name in _WKTJSONMETHODS:
  178. return methodcaller(_WKTJSONMETHODS[full_name][0], message)(self)
  179. js = {}
  180. return self._RegularMessageToJsonObject(message, js)
  181. def _RegularMessageToJsonObject(self, message, js):
  182. """Converts normal message according to Proto3 JSON Specification."""
  183. fields = message.ListFields()
  184. try:
  185. for field, value in fields:
  186. if self.preserving_proto_field_name:
  187. name = field.name
  188. else:
  189. name = field.json_name
  190. if _IsMapEntry(field):
  191. # Convert a map field.
  192. v_field = field.message_type.fields_by_name['value']
  193. js_map = {}
  194. for key in value:
  195. if isinstance(key, bool):
  196. if key:
  197. recorded_key = 'true'
  198. else:
  199. recorded_key = 'false'
  200. else:
  201. recorded_key = key
  202. js_map[recorded_key] = self._FieldToJsonObject(
  203. v_field, value[key])
  204. js[name] = js_map
  205. elif field.label == descriptor.FieldDescriptor.LABEL_REPEATED:
  206. # Convert a repeated field.
  207. js[name] = [self._FieldToJsonObject(field, k)
  208. for k in value]
  209. elif field.is_extension:
  210. full_qualifier = field.full_name[:-len(field.name)]
  211. name = '[%s%s]' % (full_qualifier, name)
  212. js[name] = self._FieldToJsonObject(field, value)
  213. else:
  214. js[name] = self._FieldToJsonObject(field, value)
  215. # Serialize default value if including_default_value_fields is True.
  216. if self.including_default_value_fields:
  217. message_descriptor = message.DESCRIPTOR
  218. for field in message_descriptor.fields:
  219. # Singular message fields and oneof fields will not be affected.
  220. if ((field.label != descriptor.FieldDescriptor.LABEL_REPEATED and
  221. field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_MESSAGE) or
  222. field.containing_oneof):
  223. continue
  224. if self.preserving_proto_field_name:
  225. name = field.name
  226. else:
  227. name = field.json_name
  228. if name in js:
  229. # Skip the field which has been serialized already.
  230. continue
  231. if _IsMapEntry(field):
  232. js[name] = {}
  233. elif field.label == descriptor.FieldDescriptor.LABEL_REPEATED:
  234. js[name] = []
  235. else:
  236. js[name] = self._FieldToJsonObject(field, field.default_value)
  237. except ValueError as e:
  238. raise SerializeToJsonError(
  239. 'Failed to serialize {0} field: {1}.'.format(field.name, e))
  240. return js
  241. def _FieldToJsonObject(self, field, value):
  242. """Converts field value according to Proto3 JSON Specification."""
  243. if field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_MESSAGE:
  244. return self._MessageToJsonObject(value)
  245. elif field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_ENUM:
  246. if self.use_integers_for_enums:
  247. return value
  248. enum_value = field.enum_type.values_by_number.get(value, None)
  249. if enum_value is not None:
  250. return enum_value.name
  251. else:
  252. if field.file.syntax == 'proto3':
  253. return value
  254. raise SerializeToJsonError('Enum field contains an integer value '
  255. 'which can not mapped to an enum value.')
  256. elif field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_STRING:
  257. if field.type == descriptor.FieldDescriptor.TYPE_BYTES:
  258. # Use base64 Data encoding for bytes
  259. return base64.b64encode(value).decode('utf-8')
  260. else:
  261. return value
  262. elif field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_BOOL:
  263. return bool(value)
  264. elif field.cpp_type in _INT64_TYPES:
  265. return str(value)
  266. elif field.cpp_type in _FLOAT_TYPES:
  267. if math.isinf(value):
  268. if value < 0.0:
  269. return _NEG_INFINITY
  270. else:
  271. return _INFINITY
  272. if math.isnan(value):
  273. return _NAN
  274. if field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_FLOAT:
  275. if self.float_format:
  276. return float(format(value, self.float_format))
  277. else:
  278. return type_checkers.ToShortestFloat(value)
  279. return value
  280. def _AnyMessageToJsonObject(self, message):
  281. """Converts Any message according to Proto3 JSON Specification."""
  282. if not message.ListFields():
  283. return {}
  284. # Must print @type first, use OrderedDict instead of {}
  285. js = OrderedDict()
  286. type_url = message.type_url
  287. js['@type'] = type_url
  288. sub_message = _CreateMessageFromTypeUrl(type_url, self.descriptor_pool)
  289. sub_message.ParseFromString(message.value)
  290. message_descriptor = sub_message.DESCRIPTOR
  291. full_name = message_descriptor.full_name
  292. if _IsWrapperMessage(message_descriptor):
  293. js['value'] = self._WrapperMessageToJsonObject(sub_message)
  294. return js
  295. if full_name in _WKTJSONMETHODS:
  296. js['value'] = methodcaller(_WKTJSONMETHODS[full_name][0],
  297. sub_message)(self)
  298. return js
  299. return self._RegularMessageToJsonObject(sub_message, js)
  300. def _GenericMessageToJsonObject(self, message):
  301. """Converts message according to Proto3 JSON Specification."""
  302. # Duration, Timestamp and FieldMask have ToJsonString method to do the
  303. # convert. Users can also call the method directly.
  304. return message.ToJsonString()
  305. def _ValueMessageToJsonObject(self, message):
  306. """Converts Value message according to Proto3 JSON Specification."""
  307. which = message.WhichOneof('kind')
  308. # If the Value message is not set treat as null_value when serialize
  309. # to JSON. The parse back result will be different from original message.
  310. if which is None or which == 'null_value':
  311. return None
  312. if which == 'list_value':
  313. return self._ListValueMessageToJsonObject(message.list_value)
  314. if which == 'struct_value':
  315. value = message.struct_value
  316. else:
  317. value = getattr(message, which)
  318. oneof_descriptor = message.DESCRIPTOR.fields_by_name[which]
  319. return self._FieldToJsonObject(oneof_descriptor, value)
  320. def _ListValueMessageToJsonObject(self, message):
  321. """Converts ListValue message according to Proto3 JSON Specification."""
  322. return [self._ValueMessageToJsonObject(value)
  323. for value in message.values]
  324. def _StructMessageToJsonObject(self, message):
  325. """Converts Struct message according to Proto3 JSON Specification."""
  326. fields = message.fields
  327. ret = {}
  328. for key in fields:
  329. ret[key] = self._ValueMessageToJsonObject(fields[key])
  330. return ret
  331. def _WrapperMessageToJsonObject(self, message):
  332. return self._FieldToJsonObject(
  333. message.DESCRIPTOR.fields_by_name['value'], message.value)
  334. def _IsWrapperMessage(message_descriptor):
  335. return message_descriptor.file.name == 'google/protobuf/wrappers.proto'
  336. def _DuplicateChecker(js):
  337. result = {}
  338. for name, value in js:
  339. if name in result:
  340. raise ParseError('Failed to load JSON: duplicate key {0}.'.format(name))
  341. result[name] = value
  342. return result
  343. def _CreateMessageFromTypeUrl(type_url, descriptor_pool):
  344. """Creates a message from a type URL."""
  345. db = symbol_database.Default()
  346. pool = db.pool if descriptor_pool is None else descriptor_pool
  347. type_name = type_url.split('/')[-1]
  348. try:
  349. message_descriptor = pool.FindMessageTypeByName(type_name)
  350. except KeyError:
  351. raise TypeError(
  352. 'Can not find message descriptor by type_url: {0}.'.format(type_url))
  353. message_class = db.GetPrototype(message_descriptor)
  354. return message_class()
  355. def Parse(text, message, ignore_unknown_fields=False, descriptor_pool=None):
  356. """Parses a JSON representation of a protocol message into a message.
  357. Args:
  358. text: Message JSON representation.
  359. message: A protocol buffer message to merge into.
  360. ignore_unknown_fields: If True, do not raise errors for unknown fields.
  361. descriptor_pool: A Descriptor Pool for resolving types. If None use the
  362. default.
  363. Returns:
  364. The same message passed as argument.
  365. Raises::
  366. ParseError: On JSON parsing problems.
  367. """
  368. if not isinstance(text, six.text_type): text = text.decode('utf-8')
  369. try:
  370. js = json.loads(text, object_pairs_hook=_DuplicateChecker)
  371. except ValueError as e:
  372. raise ParseError('Failed to load JSON: {0}.'.format(str(e)))
  373. return ParseDict(js, message, ignore_unknown_fields, descriptor_pool)
  374. def ParseDict(js_dict,
  375. message,
  376. ignore_unknown_fields=False,
  377. descriptor_pool=None):
  378. """Parses a JSON dictionary representation into a message.
  379. Args:
  380. js_dict: Dict representation of a JSON message.
  381. message: A protocol buffer message to merge into.
  382. ignore_unknown_fields: If True, do not raise errors for unknown fields.
  383. descriptor_pool: A Descriptor Pool for resolving types. If None use the
  384. default.
  385. Returns:
  386. The same message passed as argument.
  387. """
  388. parser = _Parser(ignore_unknown_fields, descriptor_pool)
  389. parser.ConvertMessage(js_dict, message)
  390. return message
  391. _INT_OR_FLOAT = six.integer_types + (float,)
  392. class _Parser(object):
  393. """JSON format parser for protocol message."""
  394. def __init__(self, ignore_unknown_fields, descriptor_pool):
  395. self.ignore_unknown_fields = ignore_unknown_fields
  396. self.descriptor_pool = descriptor_pool
  397. def ConvertMessage(self, value, message):
  398. """Convert a JSON object into a message.
  399. Args:
  400. value: A JSON object.
  401. message: A WKT or regular protocol message to record the data.
  402. Raises:
  403. ParseError: In case of convert problems.
  404. """
  405. message_descriptor = message.DESCRIPTOR
  406. full_name = message_descriptor.full_name
  407. if _IsWrapperMessage(message_descriptor):
  408. self._ConvertWrapperMessage(value, message)
  409. elif full_name in _WKTJSONMETHODS:
  410. methodcaller(_WKTJSONMETHODS[full_name][1], value, message)(self)
  411. else:
  412. self._ConvertFieldValuePair(value, message)
  413. def _ConvertFieldValuePair(self, js, message):
  414. """Convert field value pairs into regular message.
  415. Args:
  416. js: A JSON object to convert the field value pairs.
  417. message: A regular protocol message to record the data.
  418. Raises:
  419. ParseError: In case of problems converting.
  420. """
  421. names = []
  422. message_descriptor = message.DESCRIPTOR
  423. fields_by_json_name = dict((f.json_name, f)
  424. for f in message_descriptor.fields)
  425. for name in js:
  426. try:
  427. field = fields_by_json_name.get(name, None)
  428. if not field:
  429. field = message_descriptor.fields_by_name.get(name, None)
  430. if not field and _VALID_EXTENSION_NAME.match(name):
  431. if not message_descriptor.is_extendable:
  432. raise ParseError('Message type {0} does not have extensions'.format(
  433. message_descriptor.full_name))
  434. identifier = name[1:-1] # strip [] brackets
  435. # pylint: disable=protected-access
  436. field = message.Extensions._FindExtensionByName(identifier)
  437. # pylint: enable=protected-access
  438. if not field:
  439. # Try looking for extension by the message type name, dropping the
  440. # field name following the final . separator in full_name.
  441. identifier = '.'.join(identifier.split('.')[:-1])
  442. # pylint: disable=protected-access
  443. field = message.Extensions._FindExtensionByName(identifier)
  444. # pylint: enable=protected-access
  445. if not field:
  446. if self.ignore_unknown_fields:
  447. continue
  448. raise ParseError(
  449. ('Message type "{0}" has no field named "{1}".\n'
  450. ' Available Fields(except extensions): {2}').format(
  451. message_descriptor.full_name, name,
  452. [f.json_name for f in message_descriptor.fields]))
  453. if name in names:
  454. raise ParseError('Message type "{0}" should not have multiple '
  455. '"{1}" fields.'.format(
  456. message.DESCRIPTOR.full_name, name))
  457. names.append(name)
  458. # Check no other oneof field is parsed.
  459. if field.containing_oneof is not None:
  460. oneof_name = field.containing_oneof.name
  461. if oneof_name in names:
  462. raise ParseError('Message type "{0}" should not have multiple '
  463. '"{1}" oneof fields.'.format(
  464. message.DESCRIPTOR.full_name, oneof_name))
  465. names.append(oneof_name)
  466. value = js[name]
  467. if value is None:
  468. if (field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_MESSAGE
  469. and field.message_type.full_name == 'google.protobuf.Value'):
  470. sub_message = getattr(message, field.name)
  471. sub_message.null_value = 0
  472. else:
  473. message.ClearField(field.name)
  474. continue
  475. # Parse field value.
  476. if _IsMapEntry(field):
  477. message.ClearField(field.name)
  478. self._ConvertMapFieldValue(value, message, field)
  479. elif field.label == descriptor.FieldDescriptor.LABEL_REPEATED:
  480. message.ClearField(field.name)
  481. if not isinstance(value, list):
  482. raise ParseError('repeated field {0} must be in [] which is '
  483. '{1}.'.format(name, value))
  484. if field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_MESSAGE:
  485. # Repeated message field.
  486. for item in value:
  487. sub_message = getattr(message, field.name).add()
  488. # None is a null_value in Value.
  489. if (item is None and
  490. sub_message.DESCRIPTOR.full_name != 'google.protobuf.Value'):
  491. raise ParseError('null is not allowed to be used as an element'
  492. ' in a repeated field.')
  493. self.ConvertMessage(item, sub_message)
  494. else:
  495. # Repeated scalar field.
  496. for item in value:
  497. if item is None:
  498. raise ParseError('null is not allowed to be used as an element'
  499. ' in a repeated field.')
  500. getattr(message, field.name).append(
  501. _ConvertScalarFieldValue(item, field))
  502. elif field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_MESSAGE:
  503. if field.is_extension:
  504. sub_message = message.Extensions[field]
  505. else:
  506. sub_message = getattr(message, field.name)
  507. sub_message.SetInParent()
  508. self.ConvertMessage(value, sub_message)
  509. else:
  510. if field.is_extension:
  511. message.Extensions[field] = _ConvertScalarFieldValue(value, field)
  512. else:
  513. setattr(message, field.name, _ConvertScalarFieldValue(value, field))
  514. except ParseError as e:
  515. if field and field.containing_oneof is None:
  516. raise ParseError('Failed to parse {0} field: {1}.'.format(name, e))
  517. else:
  518. raise ParseError(str(e))
  519. except ValueError as e:
  520. raise ParseError('Failed to parse {0} field: {1}.'.format(name, e))
  521. except TypeError as e:
  522. raise ParseError('Failed to parse {0} field: {1}.'.format(name, e))
  523. def _ConvertAnyMessage(self, value, message):
  524. """Convert a JSON representation into Any message."""
  525. if isinstance(value, dict) and not value:
  526. return
  527. try:
  528. type_url = value['@type']
  529. except KeyError:
  530. raise ParseError('@type is missing when parsing any message.')
  531. sub_message = _CreateMessageFromTypeUrl(type_url, self.descriptor_pool)
  532. message_descriptor = sub_message.DESCRIPTOR
  533. full_name = message_descriptor.full_name
  534. if _IsWrapperMessage(message_descriptor):
  535. self._ConvertWrapperMessage(value['value'], sub_message)
  536. elif full_name in _WKTJSONMETHODS:
  537. methodcaller(
  538. _WKTJSONMETHODS[full_name][1], value['value'], sub_message)(self)
  539. else:
  540. del value['@type']
  541. self._ConvertFieldValuePair(value, sub_message)
  542. value['@type'] = type_url
  543. # Sets Any message
  544. message.value = sub_message.SerializeToString()
  545. message.type_url = type_url
  546. def _ConvertGenericMessage(self, value, message):
  547. """Convert a JSON representation into message with FromJsonString."""
  548. # Duration, Timestamp, FieldMask have a FromJsonString method to do the
  549. # conversion. Users can also call the method directly.
  550. try:
  551. message.FromJsonString(value)
  552. except ValueError as e:
  553. raise ParseError(e)
  554. def _ConvertValueMessage(self, value, message):
  555. """Convert a JSON representation into Value message."""
  556. if isinstance(value, dict):
  557. self._ConvertStructMessage(value, message.struct_value)
  558. elif isinstance(value, list):
  559. self. _ConvertListValueMessage(value, message.list_value)
  560. elif value is None:
  561. message.null_value = 0
  562. elif isinstance(value, bool):
  563. message.bool_value = value
  564. elif isinstance(value, six.string_types):
  565. message.string_value = value
  566. elif isinstance(value, _INT_OR_FLOAT):
  567. message.number_value = value
  568. else:
  569. raise ParseError('Unexpected type for Value message.')
  570. def _ConvertListValueMessage(self, value, message):
  571. """Convert a JSON representation into ListValue message."""
  572. if not isinstance(value, list):
  573. raise ParseError(
  574. 'ListValue must be in [] which is {0}.'.format(value))
  575. message.ClearField('values')
  576. for item in value:
  577. self._ConvertValueMessage(item, message.values.add())
  578. def _ConvertStructMessage(self, value, message):
  579. """Convert a JSON representation into Struct message."""
  580. if not isinstance(value, dict):
  581. raise ParseError(
  582. 'Struct must be in a dict which is {0}.'.format(value))
  583. # Clear will mark the struct as modified so it will be created even if
  584. # there are no values.
  585. message.Clear()
  586. for key in value:
  587. self._ConvertValueMessage(value[key], message.fields[key])
  588. return
  589. def _ConvertWrapperMessage(self, value, message):
  590. """Convert a JSON representation into Wrapper message."""
  591. field = message.DESCRIPTOR.fields_by_name['value']
  592. setattr(message, 'value', _ConvertScalarFieldValue(value, field))
  593. def _ConvertMapFieldValue(self, value, message, field):
  594. """Convert map field value for a message map field.
  595. Args:
  596. value: A JSON object to convert the map field value.
  597. message: A protocol message to record the converted data.
  598. field: The descriptor of the map field to be converted.
  599. Raises:
  600. ParseError: In case of convert problems.
  601. """
  602. if not isinstance(value, dict):
  603. raise ParseError(
  604. 'Map field {0} must be in a dict which is {1}.'.format(
  605. field.name, value))
  606. key_field = field.message_type.fields_by_name['key']
  607. value_field = field.message_type.fields_by_name['value']
  608. for key in value:
  609. key_value = _ConvertScalarFieldValue(key, key_field, True)
  610. if value_field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_MESSAGE:
  611. self.ConvertMessage(value[key], getattr(
  612. message, field.name)[key_value])
  613. else:
  614. getattr(message, field.name)[key_value] = _ConvertScalarFieldValue(
  615. value[key], value_field)
  616. def _ConvertScalarFieldValue(value, field, require_str=False):
  617. """Convert a single scalar field value.
  618. Args:
  619. value: A scalar value to convert the scalar field value.
  620. field: The descriptor of the field to convert.
  621. require_str: If True, the field value must be a str.
  622. Returns:
  623. The converted scalar field value
  624. Raises:
  625. ParseError: In case of convert problems.
  626. """
  627. if field.cpp_type in _INT_TYPES:
  628. return _ConvertInteger(value)
  629. elif field.cpp_type in _FLOAT_TYPES:
  630. return _ConvertFloat(value)
  631. elif field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_BOOL:
  632. return _ConvertBool(value, require_str)
  633. elif field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_STRING:
  634. if field.type == descriptor.FieldDescriptor.TYPE_BYTES:
  635. return base64.b64decode(value)
  636. else:
  637. # Checking for unpaired surrogates appears to be unreliable,
  638. # depending on the specific Python version, so we check manually.
  639. if _UNPAIRED_SURROGATE_PATTERN.search(value):
  640. raise ParseError('Unpaired surrogate')
  641. return value
  642. elif field.cpp_type == descriptor.FieldDescriptor.CPPTYPE_ENUM:
  643. # Convert an enum value.
  644. enum_value = field.enum_type.values_by_name.get(value, None)
  645. if enum_value is None:
  646. try:
  647. number = int(value)
  648. enum_value = field.enum_type.values_by_number.get(number, None)
  649. except ValueError:
  650. raise ParseError('Invalid enum value {0} for enum type {1}.'.format(
  651. value, field.enum_type.full_name))
  652. if enum_value is None:
  653. if field.file.syntax == 'proto3':
  654. # Proto3 accepts unknown enums.
  655. return number
  656. raise ParseError('Invalid enum value {0} for enum type {1}.'.format(
  657. value, field.enum_type.full_name))
  658. return enum_value.number
  659. def _ConvertInteger(value):
  660. """Convert an integer.
  661. Args:
  662. value: A scalar value to convert.
  663. Returns:
  664. The integer value.
  665. Raises:
  666. ParseError: If an integer couldn't be consumed.
  667. """
  668. if isinstance(value, float) and not value.is_integer():
  669. raise ParseError('Couldn\'t parse integer: {0}.'.format(value))
  670. if isinstance(value, six.text_type) and value.find(' ') != -1:
  671. raise ParseError('Couldn\'t parse integer: "{0}".'.format(value))
  672. return int(value)
  673. def _ConvertFloat(value):
  674. """Convert an floating point number."""
  675. if value == 'nan':
  676. raise ParseError('Couldn\'t parse float "nan", use "NaN" instead.')
  677. try:
  678. # Assume Python compatible syntax.
  679. return float(value)
  680. except ValueError:
  681. # Check alternative spellings.
  682. if value == _NEG_INFINITY:
  683. return float('-inf')
  684. elif value == _INFINITY:
  685. return float('inf')
  686. elif value == _NAN:
  687. return float('nan')
  688. else:
  689. raise ParseError('Couldn\'t parse float: {0}.'.format(value))
  690. def _ConvertBool(value, require_str):
  691. """Convert a boolean value.
  692. Args:
  693. value: A scalar value to convert.
  694. require_str: If True, value must be a str.
  695. Returns:
  696. The bool parsed.
  697. Raises:
  698. ParseError: If a boolean value couldn't be consumed.
  699. """
  700. if require_str:
  701. if value == 'true':
  702. return True
  703. elif value == 'false':
  704. return False
  705. else:
  706. raise ParseError('Expected "true" or "false", not {0}.'.format(value))
  707. if not isinstance(value, bool):
  708. raise ParseError('Expected true or false without quotes.')
  709. return value
  710. _WKTJSONMETHODS = {
  711. 'google.protobuf.Any': ['_AnyMessageToJsonObject',
  712. '_ConvertAnyMessage'],
  713. 'google.protobuf.Duration': ['_GenericMessageToJsonObject',
  714. '_ConvertGenericMessage'],
  715. 'google.protobuf.FieldMask': ['_GenericMessageToJsonObject',
  716. '_ConvertGenericMessage'],
  717. 'google.protobuf.ListValue': ['_ListValueMessageToJsonObject',
  718. '_ConvertListValueMessage'],
  719. 'google.protobuf.Struct': ['_StructMessageToJsonObject',
  720. '_ConvertStructMessage'],
  721. 'google.protobuf.Timestamp': ['_GenericMessageToJsonObject',
  722. '_ConvertGenericMessage'],
  723. 'google.protobuf.Value': ['_ValueMessageToJsonObject',
  724. '_ConvertValueMessage']
  725. }