| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163 |
- """Utilities to manipulate JSON objects."""
- # Copyright (c) IPython Development Team.
- # Distributed under the terms of the Modified BSD License.
- import math
- import numbers
- import re
- import types
- from binascii import b2a_base64
- from datetime import date, datetime
- from jupyter_client._version import version_info as jupyter_client_version
- next_attr_name = "__next__"
- # -----------------------------------------------------------------------------
- # Globals and constants
- # -----------------------------------------------------------------------------
- # timestamp formats
- ISO8601 = "%Y-%m-%dT%H:%M:%S.%f"
- ISO8601_PAT = re.compile(
- r"^(\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2})(\.\d{1,6})?Z?([\+\-]\d{2}:?\d{2})?$"
- )
- # holy crap, strptime is not threadsafe.
- # Calling it once at import seems to help.
- datetime.strptime("2000-01-01", "%Y-%m-%d")
- # -----------------------------------------------------------------------------
- # Classes and functions
- # -----------------------------------------------------------------------------
- # constants for identifying png/jpeg data
- PNG = b"\x89PNG\r\n\x1a\n"
- # front of PNG base64-encoded
- PNG64 = b"iVBORw0KG"
- JPEG = b"\xff\xd8"
- # front of JPEG base64-encoded
- JPEG64 = b"/9"
- # constants for identifying gif data
- GIF_64 = b"R0lGODdh"
- GIF89_64 = b"R0lGODlh"
- # front of PDF base64-encoded
- PDF64 = b"JVBER"
- JUPYTER_CLIENT_MAJOR_VERSION = jupyter_client_version[0]
- def encode_images(format_dict):
- """b64-encodes images in a displaypub format dict
- Perhaps this should be handled in json_clean itself?
- Parameters
- ----------
- format_dict : dict
- A dictionary of display data keyed by mime-type
- Returns
- -------
- format_dict : dict
- A copy of the same dictionary,
- but binary image data ('image/png', 'image/jpeg' or 'application/pdf')
- is base64-encoded.
- """
- # no need for handling of ambiguous bytestrings on Python 3,
- # where bytes objects always represent binary data and thus
- # base64-encoded.
- return format_dict
- def json_clean(obj): # pragma: no cover
- """Deprecated, this is a no-op for jupyter-client>=7.
- Clean an object to ensure it's safe to encode in JSON.
- Atomic, immutable objects are returned unmodified. Sets and tuples are
- converted to lists, lists are copied and dicts are also copied.
- Note: dicts whose keys could cause collisions upon encoding (such as a dict
- with both the number 1 and the string '1' as keys) will cause a ValueError
- to be raised.
- Parameters
- ----------
- obj : any python object
- Returns
- -------
- out : object
- A version of the input which will not cause an encoding error when
- encoded as JSON. Note that this function does not *encode* its inputs,
- it simply sanitizes it so that there will be no encoding errors later.
- """
- if int(JUPYTER_CLIENT_MAJOR_VERSION) >= 7:
- return obj
- # types that are 'atomic' and ok in json as-is.
- atomic_ok = (str, type(None))
- # containers that we need to convert into lists
- container_to_list = (tuple, set, types.GeneratorType)
- # Since bools are a subtype of Integrals, which are a subtype of Reals,
- # we have to check them in that order.
- if isinstance(obj, bool):
- return obj
- if isinstance(obj, numbers.Integral):
- # cast int to int, in case subclasses override __str__ (e.g. boost enum, #4598)
- return int(obj)
- if isinstance(obj, numbers.Real):
- # cast out-of-range floats to their reprs
- if math.isnan(obj) or math.isinf(obj):
- return repr(obj)
- return float(obj)
- if isinstance(obj, atomic_ok):
- return obj
- if isinstance(obj, bytes):
- # unanmbiguous binary data is base64-encoded
- # (this probably should have happened upstream)
- return b2a_base64(obj).decode("ascii")
- if isinstance(obj, container_to_list) or (
- hasattr(obj, "__iter__") and hasattr(obj, next_attr_name)
- ):
- obj = list(obj)
- if isinstance(obj, list):
- return [json_clean(x) for x in obj]
- if isinstance(obj, dict):
- # First, validate that the dict won't lose data in conversion due to
- # key collisions after stringification. This can happen with keys like
- # True and 'true' or 1 and '1', which collide in JSON.
- nkeys = len(obj)
- nkeys_collapsed = len(set(map(str, obj)))
- if nkeys != nkeys_collapsed:
- msg = (
- "dict cannot be safely converted to JSON: "
- "key collision would lead to dropped values"
- )
- raise ValueError(msg)
- # If all OK, proceed by making the new dict that will be json-safe
- out = {}
- for k, v in obj.items():
- out[str(k)] = json_clean(v)
- return out
- if isinstance(obj, datetime | date):
- return obj.strftime(ISO8601)
- # we don't understand it, it's probably an unserializable object
- raise ValueError("Can't clean for JSON: %r" % obj)
|