Source code for ax.storage.json_store.encoder

#!/usr/bin/env python3
# Copyright (c) Meta Platforms, Inc. and affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.

import dataclasses
import datetime
import enum
from collections import OrderedDict
from inspect import isclass
from typing import Any, Callable, Dict, Type

import numpy as np
import pandas as pd
import torch
from ax.exceptions.storage import JSONEncodeError
from ax.storage.json_store.encoders import tensor_to_dict
from ax.storage.json_store.registry import (
    CORE_CLASS_ENCODER_REGISTRY,
    CORE_ENCODER_REGISTRY,
)
from ax.utils.common.serialization import _is_named_tuple
from ax.utils.common.typeutils import numpy_type_to_python_type
from ax.utils.common.typeutils_torch import torch_type_to_str


# pyre-fixme[3]: Return annotation cannot be `Any`.
[docs]def object_to_json( # noqa C901 # pyre-fixme[2]: Parameter annotation cannot be `Any`. obj: Any, # pyre-fixme[2]: Parameter annotation cannot contain `Any`. # pyre-fixme[24]: Generic type `type` expects 1 type parameter, use # `typing.Type` to avoid runtime subscripting errors. encoder_registry: Dict[ Type, Callable[[Any], Dict[str, Any]] ] = CORE_ENCODER_REGISTRY, # pyre-fixme[2]: Parameter annotation cannot contain `Any`. # pyre-fixme[24]: Generic type `type` expects 1 type parameter, use # `typing.Type` to avoid runtime subscripting errors. class_encoder_registry: Dict[ Type, Callable[[Any], Dict[str, Any]] ] = CORE_CLASS_ENCODER_REGISTRY, ) -> Any: """Convert an Ax object to a JSON-serializable dictionary. The root node passed to this function should always be an instance of a core Ax class or a JSON-compatible python builtin. The sub-fields of the input will then be recursively passed to this function. e.g. if we pass an instance of Experiment, we will first fall through to the line `object_dict = ENCODER_REGISTRY[_type](object)`, which will convert the Experiment to a (shallow) dictionary, where search subfield remains "unconverted", i.e.: {"name": <name: string>, "search_space": <search space: SearchSpace>}. We then pass each item of the dictionary back into this function to recursively convert the entire object. """ obj = numpy_type_to_python_type(obj) _type = type(obj) # Type[MyClass] encoding (encoding of classes, not instances) if isclass(obj): for class_type in class_encoder_registry: if issubclass(obj, class_type): obj_dict = class_encoder_registry[class_type](obj) return { k: object_to_json( v, encoder_registry=encoder_registry, class_encoder_registry=class_encoder_registry, ) for k, v in obj_dict.items() } raise ValueError( f"{obj} is a class. Add it to the CLASS_ENCODER_REGISTRY " "(and remove it from the ENCODER_REGISTRY if needed)." ) if _type in encoder_registry: obj_dict = encoder_registry[_type](obj) return { k: object_to_json( v, encoder_registry=encoder_registry, class_encoder_registry=class_encoder_registry, ) for k, v in obj_dict.items() } # Python built-in types + `typing` module types if _type in (str, int, float, bool, type(None)): return obj elif _type is list: return [ object_to_json( x, encoder_registry=encoder_registry, class_encoder_registry=class_encoder_registry, ) for x in obj ] elif _type is tuple: return tuple( object_to_json( x, encoder_registry=encoder_registry, class_encoder_registry=class_encoder_registry, ) for x in obj ) elif _type is dict: return { k: object_to_json( v, encoder_registry=encoder_registry, class_encoder_registry=class_encoder_registry, ) for k, v in obj.items() } elif _is_named_tuple(obj): return { "__type": _type.__name__, **{ k: object_to_json( v, encoder_registry=encoder_registry, class_encoder_registry=class_encoder_registry, ) for k, v in obj._asdict().items() }, } elif dataclasses.is_dataclass(obj): return { "__type": _type.__name__, **{ k: object_to_json( v, encoder_registry=encoder_registry, class_encoder_registry=class_encoder_registry, ) for k, v in obj.__dict__.items() }, } # Types from libraries, commonly used in Ax (e.g., numpy, pandas, torch) elif _type is OrderedDict: return { "__type": _type.__name__, "value": [ ( k, object_to_json( v, encoder_registry=encoder_registry, class_encoder_registry=class_encoder_registry, ), ) for k, v in obj.items() ], } elif _type is datetime.datetime: return { "__type": _type.__name__, "value": datetime.datetime.strftime(obj, "%Y-%m-%d %H:%M:%S.%f"), } elif _type is pd.DataFrame: return {"__type": _type.__name__, "value": obj.to_json()} elif issubclass(_type, enum.Enum): return {"__type": _type.__name__, "name": obj.name} elif _type is np.ndarray or issubclass(_type, np.ndarray): return {"__type": _type.__name__, "value": obj.tolist()} elif _type is set: return {"__type": _type.__name__, "value": list(obj)} elif _type is torch.Tensor: return tensor_to_dict(obj=obj) elif _type.__module__ == "torch": # Torch does not support saving to string, so save to buffer first return {"__type": f"torch_{_type.__name__}", "value": torch_type_to_str(obj)} err = ( f"Object {obj} passed to `object_to_json` (of type {_type}, module: " f"{_type.__module__}) is not registered with a corresponding encoder " "in ENCODER_REGISTRY." ) raise JSONEncodeError(err)