Include all dupe types (event when value is zero) in scan stats.
[chromium-blink-merge.git] / third_party / simplejson / __init__.py
blobfe2bd5a28402543ee8efa97e7d6a92a00abe22c3
1 r"""JSON (JavaScript Object Notation) <http://json.org> is a subset of
2 JavaScript syntax (ECMA-262 3rd edition) used as a lightweight data
3 interchange format.
5 :mod:`simplejson` exposes an API familiar to users of the standard library
6 :mod:`marshal` and :mod:`pickle` modules. It is the externally maintained
7 version of the :mod:`json` library contained in Python 2.6, but maintains
8 compatibility with Python 2.4 and Python 2.5 and (currently) has
9 significant performance advantages, even without using the optional C
10 extension for speedups.
12 Encoding basic Python object hierarchies::
14 >>> import simplejson as json
15 >>> json.dumps(['foo', {'bar': ('baz', None, 1.0, 2)}])
16 '["foo", {"bar": ["baz", null, 1.0, 2]}]'
17 >>> print json.dumps("\"foo\bar")
18 "\"foo\bar"
19 >>> print json.dumps(u'\u1234')
20 "\u1234"
21 >>> print json.dumps('\\')
22 "\\"
23 >>> print json.dumps({"c": 0, "b": 0, "a": 0}, sort_keys=True)
24 {"a": 0, "b": 0, "c": 0}
25 >>> from StringIO import StringIO
26 >>> io = StringIO()
27 >>> json.dump(['streaming API'], io)
28 >>> io.getvalue()
29 '["streaming API"]'
31 Compact encoding::
33 >>> import simplejson as json
34 >>> json.dumps([1,2,3,{'4': 5, '6': 7}], separators=(',',':'))
35 '[1,2,3,{"4":5,"6":7}]'
37 Pretty printing::
39 >>> import simplejson as json
40 >>> s = json.dumps({'4': 5, '6': 7}, sort_keys=True, indent=' ')
41 >>> print '\n'.join([l.rstrip() for l in s.splitlines()])
43 "4": 5,
44 "6": 7
47 Decoding JSON::
49 >>> import simplejson as json
50 >>> obj = [u'foo', {u'bar': [u'baz', None, 1.0, 2]}]
51 >>> json.loads('["foo", {"bar":["baz", null, 1.0, 2]}]') == obj
52 True
53 >>> json.loads('"\\"foo\\bar"') == u'"foo\x08ar'
54 True
55 >>> from StringIO import StringIO
56 >>> io = StringIO('["streaming API"]')
57 >>> json.load(io)[0] == 'streaming API'
58 True
60 Specializing JSON object decoding::
62 >>> import simplejson as json
63 >>> def as_complex(dct):
64 ... if '__complex__' in dct:
65 ... return complex(dct['real'], dct['imag'])
66 ... return dct
67 ...
68 >>> json.loads('{"__complex__": true, "real": 1, "imag": 2}',
69 ... object_hook=as_complex)
70 (1+2j)
71 >>> from decimal import Decimal
72 >>> json.loads('1.1', parse_float=Decimal) == Decimal('1.1')
73 True
75 Specializing JSON object encoding::
77 >>> import simplejson as json
78 >>> def encode_complex(obj):
79 ... if isinstance(obj, complex):
80 ... return [obj.real, obj.imag]
81 ... raise TypeError(repr(o) + " is not JSON serializable")
82 ...
83 >>> json.dumps(2 + 1j, default=encode_complex)
84 '[2.0, 1.0]'
85 >>> json.JSONEncoder(default=encode_complex).encode(2 + 1j)
86 '[2.0, 1.0]'
87 >>> ''.join(json.JSONEncoder(default=encode_complex).iterencode(2 + 1j))
88 '[2.0, 1.0]'
91 Using simplejson.tool from the shell to validate and pretty-print::
93 $ echo '{"json":"obj"}' | python -m simplejson.tool
95 "json": "obj"
97 $ echo '{ 1.2:3.4}' | python -m simplejson.tool
98 Expecting property name: line 1 column 2 (char 2)
99 """
100 __version__ = '2.6.2'
101 __all__ = [
102 'dump', 'dumps', 'load', 'loads',
103 'JSONDecoder', 'JSONDecodeError', 'JSONEncoder',
104 'OrderedDict', 'simple_first',
107 __author__ = 'Bob Ippolito <bob@redivi.com>'
109 from decimal import Decimal
111 from decoder import JSONDecoder, JSONDecodeError
112 from encoder import JSONEncoder, JSONEncoderForHTML
113 def _import_OrderedDict():
114 import collections
115 try:
116 return collections.OrderedDict
117 except AttributeError:
118 import ordered_dict
119 return ordered_dict.OrderedDict
120 OrderedDict = _import_OrderedDict()
122 def _import_c_make_encoder():
123 try:
124 from simplejson._speedups import make_encoder
125 return make_encoder
126 except ImportError:
127 return None
129 _default_encoder = JSONEncoder(
130 skipkeys=False,
131 ensure_ascii=True,
132 check_circular=True,
133 allow_nan=True,
134 indent=None,
135 separators=None,
136 encoding='utf-8',
137 default=None,
138 use_decimal=True,
139 namedtuple_as_object=True,
140 tuple_as_array=True,
141 bigint_as_string=False,
142 item_sort_key=None,
145 def dump(obj, fp, skipkeys=False, ensure_ascii=True, check_circular=True,
146 allow_nan=True, cls=None, indent=None, separators=None,
147 encoding='utf-8', default=None, use_decimal=True,
148 namedtuple_as_object=True, tuple_as_array=True,
149 bigint_as_string=False, sort_keys=False, item_sort_key=None,
150 **kw):
151 """Serialize ``obj`` as a JSON formatted stream to ``fp`` (a
152 ``.write()``-supporting file-like object).
154 If ``skipkeys`` is true then ``dict`` keys that are not basic types
155 (``str``, ``unicode``, ``int``, ``long``, ``float``, ``bool``, ``None``)
156 will be skipped instead of raising a ``TypeError``.
158 If ``ensure_ascii`` is false, then the some chunks written to ``fp``
159 may be ``unicode`` instances, subject to normal Python ``str`` to
160 ``unicode`` coercion rules. Unless ``fp.write()`` explicitly
161 understands ``unicode`` (as in ``codecs.getwriter()``) this is likely
162 to cause an error.
164 If ``check_circular`` is false, then the circular reference check
165 for container types will be skipped and a circular reference will
166 result in an ``OverflowError`` (or worse).
168 If ``allow_nan`` is false, then it will be a ``ValueError`` to
169 serialize out of range ``float`` values (``nan``, ``inf``, ``-inf``)
170 in strict compliance of the JSON specification, instead of using the
171 JavaScript equivalents (``NaN``, ``Infinity``, ``-Infinity``).
173 If *indent* is a string, then JSON array elements and object members
174 will be pretty-printed with a newline followed by that string repeated
175 for each level of nesting. ``None`` (the default) selects the most compact
176 representation without any newlines. For backwards compatibility with
177 versions of simplejson earlier than 2.1.0, an integer is also accepted
178 and is converted to a string with that many spaces.
180 If ``separators`` is an ``(item_separator, dict_separator)`` tuple
181 then it will be used instead of the default ``(', ', ': ')`` separators.
182 ``(',', ':')`` is the most compact JSON representation.
184 ``encoding`` is the character encoding for str instances, default is UTF-8.
186 ``default(obj)`` is a function that should return a serializable version
187 of obj or raise TypeError. The default simply raises TypeError.
189 If *use_decimal* is true (default: ``True``) then decimal.Decimal
190 will be natively serialized to JSON with full precision.
192 If *namedtuple_as_object* is true (default: ``True``),
193 :class:`tuple` subclasses with ``_asdict()`` methods will be encoded
194 as JSON objects.
196 If *tuple_as_array* is true (default: ``True``),
197 :class:`tuple` (and subclasses) will be encoded as JSON arrays.
199 If *bigint_as_string* is true (default: ``False``), ints 2**53 and higher
200 or lower than -2**53 will be encoded as strings. This is to avoid the
201 rounding that happens in Javascript otherwise. Note that this is still a
202 lossy operation that will not round-trip correctly and should be used
203 sparingly.
205 If specified, *item_sort_key* is a callable used to sort the items in
206 each dictionary. This is useful if you want to sort items other than
207 in alphabetical order by key. This option takes precedence over
208 *sort_keys*.
210 If *sort_keys* is true (default: ``False``), the output of dictionaries
211 will be sorted by item.
213 To use a custom ``JSONEncoder`` subclass (e.g. one that overrides the
214 ``.default()`` method to serialize additional types), specify it with
215 the ``cls`` kwarg.
218 # cached encoder
219 if (not skipkeys and ensure_ascii and
220 check_circular and allow_nan and
221 cls is None and indent is None and separators is None and
222 encoding == 'utf-8' and default is None and use_decimal
223 and namedtuple_as_object and tuple_as_array
224 and not bigint_as_string and not item_sort_key and not kw):
225 iterable = _default_encoder.iterencode(obj)
226 else:
227 if cls is None:
228 cls = JSONEncoder
229 iterable = cls(skipkeys=skipkeys, ensure_ascii=ensure_ascii,
230 check_circular=check_circular, allow_nan=allow_nan, indent=indent,
231 separators=separators, encoding=encoding,
232 default=default, use_decimal=use_decimal,
233 namedtuple_as_object=namedtuple_as_object,
234 tuple_as_array=tuple_as_array,
235 bigint_as_string=bigint_as_string,
236 sort_keys=sort_keys,
237 item_sort_key=item_sort_key,
238 **kw).iterencode(obj)
239 # could accelerate with writelines in some versions of Python, at
240 # a debuggability cost
241 for chunk in iterable:
242 fp.write(chunk)
245 def dumps(obj, skipkeys=False, ensure_ascii=True, check_circular=True,
246 allow_nan=True, cls=None, indent=None, separators=None,
247 encoding='utf-8', default=None, use_decimal=True,
248 namedtuple_as_object=True, tuple_as_array=True,
249 bigint_as_string=False, sort_keys=False, item_sort_key=None,
250 **kw):
251 """Serialize ``obj`` to a JSON formatted ``str``.
253 If ``skipkeys`` is false then ``dict`` keys that are not basic types
254 (``str``, ``unicode``, ``int``, ``long``, ``float``, ``bool``, ``None``)
255 will be skipped instead of raising a ``TypeError``.
257 If ``ensure_ascii`` is false, then the return value will be a
258 ``unicode`` instance subject to normal Python ``str`` to ``unicode``
259 coercion rules instead of being escaped to an ASCII ``str``.
261 If ``check_circular`` is false, then the circular reference check
262 for container types will be skipped and a circular reference will
263 result in an ``OverflowError`` (or worse).
265 If ``allow_nan`` is false, then it will be a ``ValueError`` to
266 serialize out of range ``float`` values (``nan``, ``inf``, ``-inf``) in
267 strict compliance of the JSON specification, instead of using the
268 JavaScript equivalents (``NaN``, ``Infinity``, ``-Infinity``).
270 If ``indent`` is a string, then JSON array elements and object members
271 will be pretty-printed with a newline followed by that string repeated
272 for each level of nesting. ``None`` (the default) selects the most compact
273 representation without any newlines. For backwards compatibility with
274 versions of simplejson earlier than 2.1.0, an integer is also accepted
275 and is converted to a string with that many spaces.
277 If ``separators`` is an ``(item_separator, dict_separator)`` tuple
278 then it will be used instead of the default ``(', ', ': ')`` separators.
279 ``(',', ':')`` is the most compact JSON representation.
281 ``encoding`` is the character encoding for str instances, default is UTF-8.
283 ``default(obj)`` is a function that should return a serializable version
284 of obj or raise TypeError. The default simply raises TypeError.
286 If *use_decimal* is true (default: ``True``) then decimal.Decimal
287 will be natively serialized to JSON with full precision.
289 If *namedtuple_as_object* is true (default: ``True``),
290 :class:`tuple` subclasses with ``_asdict()`` methods will be encoded
291 as JSON objects.
293 If *tuple_as_array* is true (default: ``True``),
294 :class:`tuple` (and subclasses) will be encoded as JSON arrays.
296 If *bigint_as_string* is true (not the default), ints 2**53 and higher
297 or lower than -2**53 will be encoded as strings. This is to avoid the
298 rounding that happens in Javascript otherwise.
300 If specified, *item_sort_key* is a callable used to sort the items in
301 each dictionary. This is useful if you want to sort items other than
302 in alphabetical order by key. This option takes precendence over
303 *sort_keys*.
305 If *sort_keys* is true (default: ``False``), the output of dictionaries
306 will be sorted by item.
308 To use a custom ``JSONEncoder`` subclass (e.g. one that overrides the
309 ``.default()`` method to serialize additional types), specify it with
310 the ``cls`` kwarg.
313 # cached encoder
314 if (not skipkeys and ensure_ascii and
315 check_circular and allow_nan and
316 cls is None and indent is None and separators is None and
317 encoding == 'utf-8' and default is None and use_decimal
318 and namedtuple_as_object and tuple_as_array
319 and not bigint_as_string and not sort_keys
320 and not item_sort_key and not kw):
321 return _default_encoder.encode(obj)
322 if cls is None:
323 cls = JSONEncoder
324 return cls(
325 skipkeys=skipkeys, ensure_ascii=ensure_ascii,
326 check_circular=check_circular, allow_nan=allow_nan, indent=indent,
327 separators=separators, encoding=encoding, default=default,
328 use_decimal=use_decimal,
329 namedtuple_as_object=namedtuple_as_object,
330 tuple_as_array=tuple_as_array,
331 bigint_as_string=bigint_as_string,
332 sort_keys=sort_keys,
333 item_sort_key=item_sort_key,
334 **kw).encode(obj)
337 _default_decoder = JSONDecoder(encoding=None, object_hook=None,
338 object_pairs_hook=None)
341 def load(fp, encoding=None, cls=None, object_hook=None, parse_float=None,
342 parse_int=None, parse_constant=None, object_pairs_hook=None,
343 use_decimal=False, namedtuple_as_object=True, tuple_as_array=True,
344 **kw):
345 """Deserialize ``fp`` (a ``.read()``-supporting file-like object containing
346 a JSON document) to a Python object.
348 *encoding* determines the encoding used to interpret any
349 :class:`str` objects decoded by this instance (``'utf-8'`` by
350 default). It has no effect when decoding :class:`unicode` objects.
352 Note that currently only encodings that are a superset of ASCII work,
353 strings of other encodings should be passed in as :class:`unicode`.
355 *object_hook*, if specified, will be called with the result of every
356 JSON object decoded and its return value will be used in place of the
357 given :class:`dict`. This can be used to provide custom
358 deserializations (e.g. to support JSON-RPC class hinting).
360 *object_pairs_hook* is an optional function that will be called with
361 the result of any object literal decode with an ordered list of pairs.
362 The return value of *object_pairs_hook* will be used instead of the
363 :class:`dict`. This feature can be used to implement custom decoders
364 that rely on the order that the key and value pairs are decoded (for
365 example, :func:`collections.OrderedDict` will remember the order of
366 insertion). If *object_hook* is also defined, the *object_pairs_hook*
367 takes priority.
369 *parse_float*, if specified, will be called with the string of every
370 JSON float to be decoded. By default, this is equivalent to
371 ``float(num_str)``. This can be used to use another datatype or parser
372 for JSON floats (e.g. :class:`decimal.Decimal`).
374 *parse_int*, if specified, will be called with the string of every
375 JSON int to be decoded. By default, this is equivalent to
376 ``int(num_str)``. This can be used to use another datatype or parser
377 for JSON integers (e.g. :class:`float`).
379 *parse_constant*, if specified, will be called with one of the
380 following strings: ``'-Infinity'``, ``'Infinity'``, ``'NaN'``. This
381 can be used to raise an exception if invalid JSON numbers are
382 encountered.
384 If *use_decimal* is true (default: ``False``) then it implies
385 parse_float=decimal.Decimal for parity with ``dump``.
387 To use a custom ``JSONDecoder`` subclass, specify it with the ``cls``
388 kwarg.
391 return loads(fp.read(),
392 encoding=encoding, cls=cls, object_hook=object_hook,
393 parse_float=parse_float, parse_int=parse_int,
394 parse_constant=parse_constant, object_pairs_hook=object_pairs_hook,
395 use_decimal=use_decimal, **kw)
398 def loads(s, encoding=None, cls=None, object_hook=None, parse_float=None,
399 parse_int=None, parse_constant=None, object_pairs_hook=None,
400 use_decimal=False, **kw):
401 """Deserialize ``s`` (a ``str`` or ``unicode`` instance containing a JSON
402 document) to a Python object.
404 *encoding* determines the encoding used to interpret any
405 :class:`str` objects decoded by this instance (``'utf-8'`` by
406 default). It has no effect when decoding :class:`unicode` objects.
408 Note that currently only encodings that are a superset of ASCII work,
409 strings of other encodings should be passed in as :class:`unicode`.
411 *object_hook*, if specified, will be called with the result of every
412 JSON object decoded and its return value will be used in place of the
413 given :class:`dict`. This can be used to provide custom
414 deserializations (e.g. to support JSON-RPC class hinting).
416 *object_pairs_hook* is an optional function that will be called with
417 the result of any object literal decode with an ordered list of pairs.
418 The return value of *object_pairs_hook* will be used instead of the
419 :class:`dict`. This feature can be used to implement custom decoders
420 that rely on the order that the key and value pairs are decoded (for
421 example, :func:`collections.OrderedDict` will remember the order of
422 insertion). If *object_hook* is also defined, the *object_pairs_hook*
423 takes priority.
425 *parse_float*, if specified, will be called with the string of every
426 JSON float to be decoded. By default, this is equivalent to
427 ``float(num_str)``. This can be used to use another datatype or parser
428 for JSON floats (e.g. :class:`decimal.Decimal`).
430 *parse_int*, if specified, will be called with the string of every
431 JSON int to be decoded. By default, this is equivalent to
432 ``int(num_str)``. This can be used to use another datatype or parser
433 for JSON integers (e.g. :class:`float`).
435 *parse_constant*, if specified, will be called with one of the
436 following strings: ``'-Infinity'``, ``'Infinity'``, ``'NaN'``. This
437 can be used to raise an exception if invalid JSON numbers are
438 encountered.
440 If *use_decimal* is true (default: ``False``) then it implies
441 parse_float=decimal.Decimal for parity with ``dump``.
443 To use a custom ``JSONDecoder`` subclass, specify it with the ``cls``
444 kwarg.
447 if (cls is None and encoding is None and object_hook is None and
448 parse_int is None and parse_float is None and
449 parse_constant is None and object_pairs_hook is None
450 and not use_decimal and not kw):
451 return _default_decoder.decode(s)
452 if cls is None:
453 cls = JSONDecoder
454 if object_hook is not None:
455 kw['object_hook'] = object_hook
456 if object_pairs_hook is not None:
457 kw['object_pairs_hook'] = object_pairs_hook
458 if parse_float is not None:
459 kw['parse_float'] = parse_float
460 if parse_int is not None:
461 kw['parse_int'] = parse_int
462 if parse_constant is not None:
463 kw['parse_constant'] = parse_constant
464 if use_decimal:
465 if parse_float is not None:
466 raise TypeError("use_decimal=True implies parse_float=Decimal")
467 kw['parse_float'] = Decimal
468 return cls(encoding=encoding, **kw).decode(s)
471 def _toggle_speedups(enabled):
472 import simplejson.decoder as dec
473 import simplejson.encoder as enc
474 import simplejson.scanner as scan
475 c_make_encoder = _import_c_make_encoder()
476 if enabled:
477 dec.scanstring = dec.c_scanstring or dec.py_scanstring
478 enc.c_make_encoder = c_make_encoder
479 enc.encode_basestring_ascii = (enc.c_encode_basestring_ascii or
480 enc.py_encode_basestring_ascii)
481 scan.make_scanner = scan.c_make_scanner or scan.py_make_scanner
482 else:
483 dec.scanstring = dec.py_scanstring
484 enc.c_make_encoder = None
485 enc.encode_basestring_ascii = enc.py_encode_basestring_ascii
486 scan.make_scanner = scan.py_make_scanner
487 dec.make_scanner = scan.make_scanner
488 global _default_decoder
489 _default_decoder = JSONDecoder(
490 encoding=None,
491 object_hook=None,
492 object_pairs_hook=None,
494 global _default_encoder
495 _default_encoder = JSONEncoder(
496 skipkeys=False,
497 ensure_ascii=True,
498 check_circular=True,
499 allow_nan=True,
500 indent=None,
501 separators=None,
502 encoding='utf-8',
503 default=None,
506 def simple_first(kv):
507 """Helper function to pass to item_sort_key to sort simple
508 elements to the top, then container elements.
510 return (isinstance(kv[1], (list, dict, tuple)), kv[0])