ray/python/ray/serialization.py

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import hashlib
import io
import logging
import time

import pyarrow
import pyarrow.plasma as plasma

import ray.cloudpickle as pickle
from ray import ray_constants, JobID
import ray.utils
from ray.utils import _random_string
from ray.gcs_utils import ErrorType
from ray.exceptions import (
    RayActorError,
    RayWorkerError,
    UnreconstructableError,
    RAY_EXCEPTION_TYPES,
)
from ray._raylet import Pickle5Writer, unpack_pickle5_buffers

logger = logging.getLogger(__name__)


class RayNotDictionarySerializable(Exception):
    pass


# This exception is used to represent situations where cloudpickle fails to
# pickle an object (cloudpickle can fail in many different ways).
class CloudPickleError(Exception):
    pass


class DeserializationError(Exception):
    pass


class SerializedObject(object):
    def __init__(self, metadata):
        self._metadata = metadata

    @property
    def total_bytes(self):
        raise NotImplementedError

    @property
    def metadata(self):
        return self._metadata


class Pickle5SerializedObject(SerializedObject):
    def __init__(self, inband, writer):
        super(Pickle5SerializedObject,
              self).__init__(ray_constants.PICKLE5_BUFFER_METADATA)
        self.inband = inband
        self.writer = writer
        # cached total bytes
        self._total_bytes = None

    @property
    def total_bytes(self):
        if self._total_bytes is None:
            self._total_bytes = self.writer.get_total_bytes(self.inband)
        return self._total_bytes


class ArrowSerializedObject(SerializedObject):
    def __init__(self, serialized_object):
        super(ArrowSerializedObject, self).__init__(b"")
        self.serialized_object = serialized_object

    @property
    def total_bytes(self):
        return self.serialized_object.total_bytes


class RawSerializedObject(SerializedObject):
    def __init__(self, value):
        super(RawSerializedObject,
              self).__init__(ray_constants.RAW_BUFFER_METADATA)
        self.value = value

    @property
    def total_bytes(self):
        return len(self.value)


def _try_to_compute_deterministic_class_id(cls, depth=5):
    """Attempt to produce a deterministic class ID for a given class.

    The goal here is for the class ID to be the same when this is run on
    different worker processes. Pickling, loading, and pickling again seems to
    produce more consistent results than simply pickling. This is a bit crazy
    and could cause problems, in which case we should revert it and figure out
    something better.

    Args:
        cls: The class to produce an ID for.
        depth: The number of times to repeatedly try to load and dump the
            string while trying to reach a fixed point.

    Returns:
        A class ID for this class. We attempt to make the class ID the same
            when this function is run on different workers, but that is not
            guaranteed.

    Raises:
        Exception: This could raise an exception if cloudpickle raises an
            exception.
    """
    # Pickling, loading, and pickling again seems to produce more consistent
    # results than simply pickling. This is a bit
    class_id = pickle.dumps(cls)
    for _ in range(depth):
        new_class_id = pickle.dumps(pickle.loads(class_id))
        if new_class_id == class_id:
            # We appear to have reached a fix point, so use this as the ID.
            return hashlib.sha1(new_class_id).digest()
        class_id = new_class_id

    # We have not reached a fixed point, so we may end up with a different
    # class ID for this custom class on each worker, which could lead to the
    # same class definition being exported many many times.
    logger.warning(
        "WARNING: Could not produce a deterministic class ID for class "
        "{}".format(cls))
    return hashlib.sha1(new_class_id).digest()


class SerializationContext(object):
    """Initialize the serialization library.

    This defines a custom serializer for object IDs and also tells ray to
    serialize several exception classes that we define for error handling.
    """

    def __init__(self, worker):
        self.worker = worker
        self.use_pickle = worker.use_pickle

        def actor_handle_serializer(obj):
            return obj._serialization_helper(True)

        def actor_handle_deserializer(serialized_obj):
            new_handle = ray.actor.ActorHandle.__new__(ray.actor.ActorHandle)
            new_handle._deserialization_helper(serialized_obj, True)
            return new_handle

        if not worker.use_pickle:
            serialization_context = pyarrow.default_serialization_context()
            # Tell the serialization context to use the cloudpickle version
            # that we ship with Ray.
            serialization_context.set_pickle(pickle.dumps, pickle.loads)
            pyarrow.register_torch_serialization_handlers(
                serialization_context)

            def id_serializer(obj):
                return pickle.dumps(obj)

            def id_deserializer(serialized_obj):
                return pickle.loads(serialized_obj)

            def object_id_serializer(obj):
                owner_id = ""
                owner_address = ""
                if obj.is_direct_call_type():
                    worker = ray.worker.get_global_worker()
                    worker.check_connected()
                    obj, owner_id, owner_address = (
                        worker.core_worker.serialize_and_promote_object_id(obj)
                    )
                obj = obj.__reduce__()
                owner_id = owner_id.__reduce__() if owner_id else owner_id
                return pickle.dumps((obj, owner_id, owner_address))

            def object_id_deserializer(serialized_obj):
                obj_id, owner_id, owner_address = pickle.loads(serialized_obj)
                # NOTE(swang): Must deserialize the object first before asking
                # the core worker to resolve the value. This is to make sure
                # that the ref count for the ObjectID is greater than 0 by the
                # time the core worker resolves the value of the object.
                deserialized_object_id = obj_id[0](obj_id[1][0])
                if owner_id:
                    worker = ray.worker.get_global_worker()
                    worker.check_connected()
                    # UniqueIDs are serialized as
                    # (class name, (unique bytes,)).
                    worker.core_worker.deserialize_and_register_object_id(
                        obj_id[1][0], owner_id[1][0], owner_address)
                return deserialized_object_id

            for id_type in ray._raylet._ID_TYPES:
                if id_type == ray._raylet.ObjectID:
                    serialization_context.register_type(
                        id_type,
                        "{}.{}".format(id_type.__module__, id_type.__name__),
                        custom_serializer=object_id_serializer,
                        custom_deserializer=object_id_deserializer)
                else:
                    serialization_context.register_type(
                        id_type,
                        "{}.{}".format(id_type.__module__, id_type.__name__),
                        custom_serializer=id_serializer,
                        custom_deserializer=id_deserializer)

            # We register this serializer on each worker instead of calling
            # _register_custom_serializer from the driver so that isinstance
            # still works.
            serialization_context.register_type(
                ray.actor.ActorHandle,
                "ray.ActorHandle",
                pickle=False,
                custom_serializer=actor_handle_serializer,
                custom_deserializer=actor_handle_deserializer)
            self.pyarrow_context = serialization_context
        else:
            self._register_cloudpickle_serializer(
                ray.actor.ActorHandle,
                custom_serializer=actor_handle_serializer,
                custom_deserializer=actor_handle_deserializer)

            def id_serializer(obj):
                return obj.__reduce__()

            def id_deserializer(serialized_obj):
                return serialized_obj[0](*serialized_obj[1])

            def object_id_serializer(obj):
                owner_id = ""
                owner_address = ""
                if obj.is_direct_call_type():
                    worker = ray.worker.get_global_worker()
                    worker.check_connected()
                    obj, owner_id, owner_address = (
                        worker.core_worker.serialize_and_promote_object_id(obj)
                    )
                obj = id_serializer(obj)
                owner_id = id_serializer(owner_id) if owner_id else owner_id
                return (obj, owner_id, owner_address)

            def object_id_deserializer(serialized_obj):
                obj_id, owner_id, owner_address = serialized_obj
                # NOTE(swang): Must deserialize the object first before asking
                # the core worker to resolve the value. This is to make sure
                # that the ref count for the ObjectID is greater than 0 by the
                # time the core worker resolves the value of the object.
                deserialized_object_id = id_deserializer(obj_id)
                if owner_id:
                    worker = ray.worker.get_global_worker()
                    worker.check_connected()
                    # UniqueIDs are serialized as
                    # (class name, (unique bytes,)).
                    worker.core_worker.deserialize_and_register_object_id(
                        obj_id[1][0], owner_id[1][0], owner_address)
                return deserialized_object_id

            for id_type in ray._raylet._ID_TYPES:
                if id_type == ray._raylet.ObjectID:
                    self._register_cloudpickle_serializer(
                        id_type, object_id_serializer, object_id_deserializer)
                else:
                    self._register_cloudpickle_serializer(
                        id_type, id_serializer, id_deserializer)

    def initialize(self):
        """ Register custom serializers """
        if not self.worker.use_pickle:
            for error_cls in RAY_EXCEPTION_TYPES:
                self.register_custom_serializer(
                    error_cls,
                    use_dict=True,
                    local=True,
                    class_id=error_cls.__module__ + ". " + error_cls.__name__,
                )
                # Tell Ray to serialize lambdas with pickle.
            self.register_custom_serializer(
                type(lambda: 0),
                use_pickle=True,
                local=True,
                class_id="lambda")
            # Tell Ray to serialize types with pickle.
            self.register_custom_serializer(
                type(int), use_pickle=True, local=True, class_id="type")
            # Tell Ray to serialize RayParameters as dictionaries. This is
            # used when passing around actor handles.
            self.register_custom_serializer(
                ray.signature.RayParameter,
                use_dict=True,
                local=True,
                class_id="ray.signature.RayParameter")
            # Tell Ray to serialize StringIO with pickle. We do this because
            # Ray's default __dict__ serialization is incorrect for this type
            # (the object's __dict__ is empty and therefore doesn't
            # contain the full state of the object).
            self.register_custom_serializer(
                io.StringIO,
                use_pickle=True,
                local=True,
                class_id="io.StringIO")

    def _register_cloudpickle_serializer(self, cls, custom_serializer,
                                         custom_deserializer):
        if pickle.FAST_CLOUDPICKLE_USED:

            def _CloudPicklerReducer(obj):
                return custom_deserializer, (custom_serializer(obj), )

            # construct a reducer
            pickle.CloudPickler.dispatch[cls] = _CloudPicklerReducer
        else:

            def _CloudPicklerReducer(_self, obj):
                _self.save_reduce(
                    custom_deserializer, (custom_serializer(obj), ), obj=obj)

            # use a placeholder for 'self' argument
            pickle.CloudPickler.dispatch[cls] = _CloudPicklerReducer

    def _deserialize_object_from_arrow(self, data, metadata, object_id):
        if metadata:
            if metadata == ray_constants.PICKLE5_BUFFER_METADATA:
                if not self.use_pickle:
                    raise ValueError("Receiving pickle5 serialized objects "
                                     "while the serialization context is "
                                     "using pyarrow as the backend.")
                try:
                    in_band, buffers = unpack_pickle5_buffers(data)
                    if len(buffers) > 0:
                        return pickle.loads(in_band, buffers=buffers)
                    else:
                        return pickle.loads(in_band)
                # cloudpickle does not provide error types
                except pickle.pickle.PicklingError:
                    raise DeserializationError()
            # Check if the object should be returned as raw bytes.
            if metadata == ray_constants.RAW_BUFFER_METADATA:
                if data is None:
                    return b""
                return data.to_pybytes()
            # Otherwise, return an exception object based on
            # the error type.
            error_type = int(metadata)
            if error_type == ErrorType.Value("WORKER_DIED"):
                return RayWorkerError()
            elif error_type == ErrorType.Value("ACTOR_DIED"):
                return RayActorError()
            elif error_type == ErrorType.Value("OBJECT_UNRECONSTRUCTABLE"):
                return UnreconstructableError(ray.ObjectID(object_id.binary()))
            else:
                assert error_type != ErrorType.Value("OBJECT_IN_PLASMA"), \
                    "Tried to get object that has been promoted to plasma."
                assert False, "Unrecognized error type " + str(error_type)
        elif data:
            if self.use_pickle:
                raise ValueError("Receiving plasma serialized objects "
                                 "while the serialization context is "
                                 "using pickle5 as the backend.")
            try:
                # If data is not empty, deserialize the object.
                return pyarrow.deserialize(data, self.pyarrow_context)
            except pyarrow.DeserializationCallbackError:
                raise DeserializationError()
        else:
            # Object isn't available in plasma. This should never be returned
            # to the user. We should only reach this line if this object was
            # deserialized as part of a list, and another object in the list
            # throws an exception.
            return plasma.ObjectNotAvailable

    def _store_and_register_pyarrow(self, value, depth=100):
        """Store an object and attempt to register its class if needed.

        Args:
            value: The value to put in the object store.
            depth: The maximum number of classes to recursively register.

        Raises:
            Exception: An exception is raised if the attempt to serialize the
                object fails.
        """
        counter = 0
        while True:
            if counter == depth:
                raise Exception("Ray exceeded the maximum number of classes "
                                "that it will recursively serialize when "
                                "attempting to serialize an object of "
                                "type {}.".format(type(value)))
            counter += 1
            try:
                return pyarrow.serialize(value, self.pyarrow_context)
            except pyarrow.SerializationCallbackError as e:
                cls_type = type(e.example_object)
                try:
                    self.register_custom_serializer(cls_type, use_dict=True)
                    warning_message = (
                        "WARNING: Serializing objects of type "
                        "{} by expanding them as dictionaries "
                        "of their fields. This behavior may "
                        "be incorrect in some cases.".format(cls_type))
                    logger.debug(warning_message)
                except (RayNotDictionarySerializable, CloudPickleError,
                        pickle.pickle.PicklingError, Exception):
                    # We also handle generic exceptions here because
                    # cloudpickle can fail with many different types of errors.
                    warning_message = (
                        "Falling back to serializing {} objects by using "
                        "pickle. Use `ray.register_custom_serializer({},...)` "
                        "to provide faster serialization.".format(
                            cls_type, cls_type))
                    try:
                        self.register_custom_serializer(
                            cls_type, use_pickle=True)
                        logger.warning(warning_message)
                    except (CloudPickleError, ValueError):
                        self.register_custom_serializer(
                            cls_type, use_pickle=True, local=True)
                        warning_message = ("WARNING: Pickling the class {} "
                                           "failed, so we are using pickle "
                                           "and only registering the class "
                                           "locally.".format(cls_type))
                        logger.warning(warning_message)

    def deserialize_objects(self,
                            data_metadata_pairs,
                            object_ids,
                            error_timeout=10):
        pass
        assert len(data_metadata_pairs) == len(object_ids)

        start_time = time.time()
        results = []
        warning_sent = False
        i = 0
        while i < len(object_ids):
            object_id = object_ids[i]
            data, metadata = data_metadata_pairs[i]
            try:
                results.append(
                    self._deserialize_object_from_arrow(
                        data, metadata, object_id))
                i += 1
            except DeserializationError:
                # Wait a little bit for the import thread to import the class.
                # If we currently have the worker lock, we need to release it
                # so that the import thread can acquire it.
                time.sleep(0.01)

                if time.time() - start_time > error_timeout:
                    warning_message = ("This worker or driver is waiting to "
                                       "receive a class definition so that it "
                                       "can deserialize an object from the "
                                       "object store. This may be fine, or it "
                                       "may be a bug.")
                    if not warning_sent:
                        ray.utils.push_error_to_driver(
                            self,
                            ray_constants.WAIT_FOR_CLASS_PUSH_ERROR,
                            warning_message,
                            job_id=self.worker.current_job_id)
                    warning_sent = True

        return results

    def serialize(self, value):
        """Serialize an object.

        Args:
            value: The value to serialize.
        """
        if isinstance(value, bytes):
            # If the object is a byte array, skip serializing it and
            # use a special metadata to indicate it's raw binary. So
            # that this object can also be read by Java.
            return RawSerializedObject(value)

        if self.worker.use_pickle:
            writer = Pickle5Writer()
            if ray.cloudpickle.FAST_CLOUDPICKLE_USED:
                inband = pickle.dumps(
                    value, protocol=5, buffer_callback=writer.buffer_callback)
            else:
                inband = pickle.dumps(value)
            return Pickle5SerializedObject(inband, writer)
        else:
            try:
                serialized_value = self._store_and_register_pyarrow(value)
            except TypeError:
                # TypeError can happen because one of the members of the object
                # may not be serializable for cloudpickle. So we need
                # these extra fallbacks here to start from the beginning.
                # Hopefully the object could have a `__reduce__` method.
                self.register_custom_serializer(type(value), use_pickle=True)
                logger.warning("WARNING: Serializing the class {} failed, "
                               "falling back to cloudpickle.".format(
                                   type(value)))
                serialized_value = self._store_and_register_pyarrow(value)

            return ArrowSerializedObject(serialized_value)

    def register_custom_serializer(self,
                                   cls,
                                   use_pickle=False,
                                   use_dict=False,
                                   serializer=None,
                                   deserializer=None,
                                   local=False,
                                   job_id=None,
                                   class_id=None):
        """Enable serialization and deserialization for a particular class.

        This method runs the register_class function defined below on
        every worker, which will enable ray to properly serialize and
        deserialize objects of this class.

        Args:
            cls (type): The class that ray should use this custom serializer
                for.
            use_pickle (bool): If true, then objects of this class will be
                serialized using pickle.
            use_dict: If true, then objects of this class be serialized
                turning their __dict__ fields into a dictionary. Must be False
                if use_pickle is true.
            serializer: The custom serializer to use. This should be provided
                if and only if use_pickle and use_dict are False.
            deserializer: The custom deserializer to use. This should be
                provided if and only if use_pickle and use_dict are False.
            local: True if the serializers should only be registered on the
                current worker. This should usually be False.
            job_id: ID of the job that we want to register the class for.
            class_id (str): Unique ID of the class. Autogenerated if None.

        Raises:
            RayNotDictionarySerializable: Raised if use_dict is true and cls
                cannot be efficiently serialized by Ray.
            ValueError: Raised if ray could not autogenerate a class_id.
        """
        assert (serializer is None) == (deserializer is None), (
            "The serializer/deserializer arguments must both be provided or "
            "both not be provided.")
        use_custom_serializer = (serializer is not None)

        assert use_custom_serializer + use_pickle + use_dict == 1, (
            "Exactly one of use_pickle, use_dict, or serializer/deserializer "
            "must be specified.")

        if self.worker.use_pickle and serializer is None:
            # In this case it should do nothing.
            return

        if use_dict:
            # Raise an exception if cls cannot be serialized
            # efficiently by Ray.
            check_serializable(cls)

        if class_id is None:
            if not local:
                # In this case, the class ID will be used to deduplicate the
                # class across workers. Note that cloudpickle unfortunately
                # does not produce deterministic strings, so these IDs could
                # be different on different workers. We could use something
                # weaker like cls.__name__, however that would run the risk
                # of having collisions.
                # TODO(rkn): We should improve this.
                try:
                    # Attempt to produce a class ID that will be the same on
                    # each worker. However, determinism is not guaranteed,
                    # and the result may be different on different workers.
                    class_id = _try_to_compute_deterministic_class_id(cls)
                except Exception:
                    raise ValueError(
                        "Failed to use pickle in generating a unique id"
                        "for '{}'. Provide a unique class_id.".format(cls))
            else:
                # In this case, the class ID only needs to be meaningful on
                # this worker and not across workers.
                class_id = _random_string()

            # Make sure class_id is a string.
            class_id = ray.utils.binary_to_hex(class_id)

        if job_id is None:
            job_id = self.worker.current_job_id
        assert isinstance(job_id, JobID)

        def register_class_for_serialization(worker_info):
            context = worker_info["worker"].get_serialization_context(job_id)
            if worker_info["worker"].use_pickle:
                context._register_cloudpickle_serializer(
                    cls, serializer, deserializer)
            else:
                # TODO(rkn): We need to be more thoughtful about what to do if
                # custom serializers have already been registered for
                # class_id. In some cases, we may want to use the last
                # user-defined serializers and ignore subsequent calls to
                # register_custom_serializer that were made by the system.
                context.pyarrow_context.register_type(
                    cls,
                    class_id,
                    pickle=use_pickle,
                    custom_serializer=serializer,
                    custom_deserializer=deserializer)

        if not local:
            self.worker.run_function_on_all_workers(
                register_class_for_serialization)
        else:
            # Since we are pickling objects of this class, we don't actually
            # need to ship the class definition.
            register_class_for_serialization({"worker": self.worker})


def check_serializable(cls):
    """Throws an exception if Ray cannot serialize this class efficiently.

    Args:
        cls (type): The class to be serialized.

    Raises:
        Exception: An exception is raised if Ray cannot serialize this class
            efficiently.
    """
    if is_named_tuple(cls):
        # This case works.
        return
    if not hasattr(cls, "__new__"):
        print("The class {} does not have a '__new__' attribute and is "
              "probably an old-stye class. Please make it a new-style class "
              "by inheriting from 'object'.")
        raise RayNotDictionarySerializable("The class {} does not have a "
                                           "'__new__' attribute and is "
                                           "probably an old-style class. We "
                                           "do not support this. Please make "
                                           "it a new-style class by "
                                           "inheriting from 'object'."
                                           .format(cls))
    try:
        obj = cls.__new__(cls)
    except Exception:
        raise RayNotDictionarySerializable("The class {} has overridden "
                                           "'__new__', so Ray may not be "
                                           "able to serialize it "
                                           "efficiently.".format(cls))
    if not hasattr(obj, "__dict__"):
        raise RayNotDictionarySerializable("Objects of the class {} do not "
                                           "have a '__dict__' attribute, so "
                                           "Ray cannot serialize it "
                                           "efficiently.".format(cls))
    if hasattr(obj, "__slots__"):
        raise RayNotDictionarySerializable("The class {} uses '__slots__', so "
                                           "Ray may not be able to serialize "
                                           "it efficiently.".format(cls))


def is_named_tuple(cls):
    """Return True if cls is a namedtuple and False otherwise."""
    b = cls.__bases__
    if len(b) != 1 or b[0] != tuple:
        return False
    f = getattr(cls, "_fields", None)
    if not isinstance(f, tuple):
        return False
    return all(type(n) == str for n in f)