mirror of
https://github.com/wassname/ray.git
synced 2026-06-29 11:17:13 +08:00
538 lines
19 KiB
C
538 lines
19 KiB
C
#include <Python.h>
|
|
#include "bytesobject.h"
|
|
#include "node.h"
|
|
|
|
#include "common.h"
|
|
#include "common_extension.h"
|
|
#include "task.h"
|
|
#include "utarray.h"
|
|
#include "utstring.h"
|
|
|
|
/* Exception object that functions in this file hand to PyErr_SetString when
 * they reject their input. It is only defined here, not assigned.
 * NOTE(review): presumably set up by the module initialization code; confirm. */
PyObject *CommonError;
|
|
|
|
/* Initialize pickle module. */
|
|
|
|
PyObject *pickle_module = NULL;
|
|
PyObject *pickle_loads = NULL;
|
|
PyObject *pickle_dumps = NULL;
|
|
PyObject *pickle_protocol = NULL;
|
|
|
|
void init_pickle_module(void) {
|
|
#if PY_MAJOR_VERSION >= 3
|
|
pickle_module = PyImport_ImportModule("pickle");
|
|
#else
|
|
pickle_module = PyImport_ImportModuleNoBlock("cPickle");
|
|
#endif
|
|
CHECK(pickle_module != NULL);
|
|
CHECK(PyObject_HasAttrString(pickle_module, "loads"));
|
|
CHECK(PyObject_HasAttrString(pickle_module, "dumps"));
|
|
CHECK(PyObject_HasAttrString(pickle_module, "HIGHEST_PROTOCOL"));
|
|
pickle_loads = PyUnicode_FromString("loads");
|
|
pickle_dumps = PyUnicode_FromString("dumps");
|
|
pickle_protocol = PyObject_GetAttrString(pickle_module, "HIGHEST_PROTOCOL");
|
|
CHECK(pickle_protocol != NULL);
|
|
}
|
|
|
|
/* Define the PyObjectID class. */
|
|
|
|
/**
 * Copy the contents of a Python bytes object into an object ID.
 *
 * The input must be a bytes object of exactly UNIQUE_ID_SIZE bytes. The
 * length is verified before copying so that a shorter input can no longer
 * cause a read past the end of its buffer.
 *
 * @param object The Python object to convert.
 * @param object_id Destination that receives the UNIQUE_ID_SIZE bytes.
 * @return 1 on success; 0 with a TypeError set otherwise.
 */
int PyStringToUniqueID(PyObject *object, object_id *object_id) {
  if (!PyBytes_Check(object) || PyBytes_Size(object) != UNIQUE_ID_SIZE) {
    PyErr_SetString(PyExc_TypeError, "must be a 20 character string");
    return 0;
  }
  memcpy(&object_id->id[0], PyBytes_AsString(object), UNIQUE_ID_SIZE);
  return 1;
}
|
|
|
|
/**
 * Extract the object ID stored in a PyObjectID instance.
 *
 * The signature matches what PyArg_ParseTuple expects for an "O&" converter,
 * which is how other functions in this file use it.
 *
 * @param object The Python object to convert.
 * @param objectid Destination that receives a copy of the stored ID.
 * @return 1 on success; 0 with an exception set otherwise.
 */
int PyObjectToUniqueID(PyObject *object, object_id *objectid) {
  int is_object_id = PyObject_IsInstance(object, (PyObject *) &PyObjectIDType);
  if (is_object_id < 0) {
    /* The instance check itself failed; keep the exception it raised instead
     * of treating the object as a PyObjectID. */
    return 0;
  }
  if (!is_object_id) {
    PyErr_SetString(PyExc_TypeError, "must be an ObjectID");
    return 0;
  }
  *objectid = ((PyObjectID *) object)->object_id;
  return 1;
}
|
|
|
|
/**
 * tp_init for ObjectID: build the ID from a single string/bytes argument.
 *
 * The argument is parsed with "s#" and must have exactly sizeof(object_id)
 * bytes. kwds is not consulted.
 *
 * @return 0 on success; -1 with an exception set on failure.
 */
static int PyObjectID_init(PyObjectID *self, PyObject *args, PyObject *kwds) {
  const char *raw_id;
  int raw_id_length;
  if (!PyArg_ParseTuple(args, "s#", &raw_id, &raw_id_length)) {
    return -1;
  }
  if (raw_id_length == sizeof(object_id)) {
    memcpy(&self->object_id.id[0], raw_id, sizeof(self->object_id.id));
    return 0;
  }
  PyErr_SetString(CommonError,
                  "ObjectID: object id string needs to have length 20");
  return -1;
}
|
|
|
|
/* Create a PyObjectID from C. */
|
|
PyObject *PyObjectID_make(object_id object_id) {
|
|
PyObjectID *result = PyObject_New(PyObjectID, &PyObjectIDType);
|
|
result = (PyObjectID *) PyObject_Init((PyObject *) result, &PyObjectIDType);
|
|
result->object_id = object_id;
|
|
return (PyObject *) result;
|
|
}
|
|
|
|
/**
|
|
* Convert a string to a Ray task specification Python object.
|
|
*
|
|
* This is called from Python like
|
|
*
|
|
* task = photon.task_from_string("...")
|
|
*
|
|
* @param task_string String representation of the task specification.
|
|
* @return Python task specification object.
|
|
*/
|
|
PyObject *PyTask_from_string(PyObject *self, PyObject *args) {
|
|
const char *data;
|
|
int size;
|
|
if (!PyArg_ParseTuple(args, "s#", &data, &size)) {
|
|
return NULL;
|
|
}
|
|
PyTask *result = PyObject_New(PyTask, &PyTaskType);
|
|
result = (PyTask *) PyObject_Init((PyObject *) result, &PyTaskType);
|
|
result->spec = malloc(size);
|
|
memcpy(result->spec, data, size);
|
|
/* TODO(pcm): Better error checking once we use flatbuffers. */
|
|
if (size != task_spec_size(result->spec)) {
|
|
PyErr_SetString(CommonError,
|
|
"task_from_string: task specification string malformed");
|
|
return NULL;
|
|
}
|
|
return (PyObject *) result;
|
|
}
|
|
|
|
/**
|
|
* Convert a Ray task specification Python object to a string.
|
|
*
|
|
* This is called from Python like
|
|
*
|
|
* s = photon.task_to_string(task)
|
|
*
|
|
* @param task Ray task specification Python object.
|
|
* @return String representing the task specification.
|
|
*/
|
|
PyObject *PyTask_to_string(PyObject *self, PyObject *args) {
|
|
PyObject *arg;
|
|
if (!PyArg_ParseTuple(args, "O", &arg)) {
|
|
return NULL;
|
|
}
|
|
PyTask *task = (PyTask *) arg;
|
|
return PyBytes_FromStringAndSize((char *) task->spec,
|
|
task_spec_size(task->spec));
|
|
}
|
|
|
|
/* Method "id": return the raw bytes of the stored object ID as a new Python
 * bytes object. */
static PyObject *PyObjectID_id(PyObject *self) {
  PyObjectID *wrapper = (PyObjectID *) self;
  const char *raw_bytes = (char *) &wrapper->object_id.id[0];
  Py_ssize_t raw_length = sizeof(wrapper->object_id.id);
  return PyBytes_FromStringAndSize(raw_bytes, raw_length);
}
|
|
|
|
/* Method "hex": format the stored object ID with object_id_to_string into a
 * stack buffer of ID_STRING_SIZE bytes and return it as a Python string. */
static PyObject *PyObjectID_hex(PyObject *self) {
  char hex_buffer[ID_STRING_SIZE];
  object_id_to_string(((PyObjectID *) self)->object_id, hex_buffer,
                      ID_STRING_SIZE);
  return PyUnicode_FromString(hex_buffer);
}
|
|
|
|
/**
 * tp_richcompare for ObjectID.
 *
 * Only == and != are supported. Ordering comparisons, and comparisons against
 * an object whose type has a different tp_richcompare slot, produce
 * Py_NotImplemented.
 *
 * @return A new reference to Py_True, Py_False or Py_NotImplemented.
 */
static PyObject *PyObjectID_richcompare(PyObjectID *self,
                                        PyObject *other,
                                        int op) {
  PyObject *answer = NULL;
  if (Py_TYPE(self)->tp_richcompare == Py_TYPE(other)->tp_richcompare) {
    /* Sharing the comparison slot is taken as proof that other is a
     * PyObjectID as well. */
    PyObjectID *rhs = (PyObjectID *) other;
    if (op == Py_EQ) {
      answer = object_ids_equal(self->object_id, rhs->object_id) ? Py_True
                                                                 : Py_False;
    } else if (op == Py_NE) {
      answer = object_ids_equal(self->object_id, rhs->object_id) ? Py_False
                                                                 : Py_True;
    } else if (op == Py_LT || op == Py_LE || op == Py_GT || op == Py_GE) {
      answer = Py_NotImplemented;
    }
  } else {
    answer = Py_NotImplemented;
  }
  /* The singletons are borrowed, so hand the caller its own reference. */
  Py_XINCREF(answer);
  return answer;
}
|
|
|
|
/**
 * tp_hash for ObjectID.
 *
 * Builds a temporary tuple holding each of the UNIQUE_ID_SIZE ID bytes as a
 * Python integer and returns the hash of that tuple.
 *
 * @return The hash value, or -1 with an exception set on failure.
 */
static long PyObjectID_hash(PyObjectID *self) {
  PyObject *tuple = PyTuple_New(UNIQUE_ID_SIZE);
  if (tuple == NULL) {
    return -1;
  }
  for (int i = 0; i < UNIQUE_ID_SIZE; ++i) {
    PyObject *byte_value = PyLong_FromLong(self->object_id.id[i]);
    if (byte_value == NULL) {
      /* Hashing a tuple with an empty slot is not valid; bail out. */
      Py_DECREF(tuple);
      return -1;
    }
    /* PyTuple_SetItem takes over the reference to byte_value. */
    PyTuple_SetItem(tuple, i, byte_value);
  }
  long hash = PyObject_Hash(tuple);
  Py_DECREF(tuple);
  return hash;
}
|
|
|
|
/* tp_repr for ObjectID: returns the Python string "ObjectID(<id>)", where
 * <id> is whatever object_id_to_string writes for the stored ID. */
static PyObject *PyObjectID_repr(PyObjectID *self) {
  char id_text[ID_STRING_SIZE];
  UT_string *buffer;
  PyObject *py_repr;

  object_id_to_string(self->object_id, id_text, ID_STRING_SIZE);
  utstring_new(buffer);
  utstring_printf(buffer, "ObjectID(%s)", id_text);
  /* Convert before releasing the buffer that backs utstring_body. */
  py_repr = PyUnicode_FromString(utstring_body(buffer));
  utstring_free(buffer);
  return py_repr;
}
|
|
|
|
/* Method "__reduce__": always fails. It sets a CommonError and returns NULL so
 * that attempts to pickle an ObjectID raise instead of succeeding. */
static PyObject *PyObjectID___reduce__(PyObjectID *self) {
  PyObject *no_result = NULL;
  PyErr_SetString(CommonError, "ObjectID objects cannot be serialized.");
  return no_result;
}
|
|
|
|
static PyMethodDef PyObjectID_methods[] = {
|
|
{"id", (PyCFunction) PyObjectID_id, METH_NOARGS,
|
|
"Return the hash associated with this ObjectID"},
|
|
{"hex", (PyCFunction) PyObjectID_hex, METH_NOARGS,
|
|
"Return the object ID as a string in hex."},
|
|
{"__reduce__", (PyCFunction) PyObjectID___reduce__, METH_NOARGS,
|
|
"Say how to pickle this ObjectID. This raises an exception to prevent"
|
|
"object IDs from being serialized."},
|
|
{NULL} /* Sentinel */
|
|
};
|
|
|
|
static PyMemberDef PyObjectID_members[] = {
|
|
{NULL} /* Sentinel */
|
|
};
|
|
|
|
PyTypeObject PyObjectIDType = {
|
|
PyVarObject_HEAD_INIT(NULL, 0) /* ob_size */
|
|
"common.ObjectID", /* tp_name */
|
|
sizeof(PyObjectID), /* tp_basicsize */
|
|
0, /* tp_itemsize */
|
|
0, /* tp_dealloc */
|
|
0, /* tp_print */
|
|
0, /* tp_getattr */
|
|
0, /* tp_setattr */
|
|
0, /* tp_compare */
|
|
(reprfunc) PyObjectID_repr, /* tp_repr */
|
|
0, /* tp_as_number */
|
|
0, /* tp_as_sequence */
|
|
0, /* tp_as_mapping */
|
|
(hashfunc) PyObjectID_hash, /* tp_hash */
|
|
0, /* tp_call */
|
|
0, /* tp_str */
|
|
0, /* tp_getattro */
|
|
0, /* tp_setattro */
|
|
0, /* tp_as_buffer */
|
|
Py_TPFLAGS_DEFAULT, /* tp_flags */
|
|
"ObjectID object", /* tp_doc */
|
|
0, /* tp_traverse */
|
|
0, /* tp_clear */
|
|
(richcmpfunc) PyObjectID_richcompare, /* tp_richcompare */
|
|
0, /* tp_weaklistoffset */
|
|
0, /* tp_iter */
|
|
0, /* tp_iternext */
|
|
PyObjectID_methods, /* tp_methods */
|
|
PyObjectID_members, /* tp_members */
|
|
0, /* tp_getset */
|
|
0, /* tp_base */
|
|
0, /* tp_dict */
|
|
0, /* tp_descr_get */
|
|
0, /* tp_descr_set */
|
|
0, /* tp_dictoffset */
|
|
(initproc) PyObjectID_init, /* tp_init */
|
|
0, /* tp_alloc */
|
|
PyType_GenericNew, /* tp_new */
|
|
};
|
|
|
|
/* Define the PyTask class. */
|
|
|
|
/**
 * tp_init for Task: build a task specification from Python arguments.
 *
 * Expected positional arguments, in order: driver ID (ObjectID), function ID
 * (ObjectID), list of task arguments, number of return values (int), parent
 * task ID (ObjectID), parent counter (int). List entries that are ObjectIDs
 * are added by reference; all other entries are pickled and added by value.
 * kwds is not consulted.
 *
 * The scratch array of pickled values is only allocated after argument
 * parsing succeeded, and every failure during pickling releases both the
 * array and the pickled objects collected so far.
 *
 * @return 0 on success; -1 with an exception set on failure.
 */
static int PyTask_init(PyTask *self, PyObject *args, PyObject *kwds) {
  unique_id driver_id;
  function_id function_id;
  /* Arguments of the task (can be PyObjectIDs or Python values). */
  PyObject *arguments;
  int num_returns;
  /* The ID of the task that called this task. */
  task_id parent_task_id;
  /* The number of tasks that the parent task has called prior to this one. */
  int parent_counter;
  if (!PyArg_ParseTuple(args, "O&O&OiO&i", &PyObjectToUniqueID, &driver_id,
                        &PyObjectToUniqueID, &function_id, &arguments,
                        &num_returns, &PyObjectToUniqueID, &parent_task_id,
                        &parent_counter)) {
    return -1;
  }
  if (!PyList_Check(arguments)) {
    /* PyList_Size and PyList_GetItem below are only valid on lists. */
    PyErr_SetString(PyExc_TypeError, "task arguments must be a list");
    return -1;
  }
  Py_ssize_t size = PyList_Size(arguments);
  /* Array of pointers to string representations of pass-by-value args. */
  UT_array *val_repr_ptrs;
  utarray_new(val_repr_ptrs, &ut_ptr_icd);
  /* Determine the size of pass by value data in bytes. */
  Py_ssize_t value_data_bytes = 0;
  for (Py_ssize_t i = 0; i < size; ++i) {
    PyObject *arg = PyList_GetItem(arguments, i);
    if (arg == NULL) {
      goto fail;
    }
    int is_object_id = PyObject_IsInstance(arg, (PyObject *) &PyObjectIDType);
    if (is_object_id < 0) {
      goto fail;
    }
    if (is_object_id) {
      continue;
    }
    CHECK(pickle_module != NULL);
    CHECK(pickle_dumps != NULL);
    PyObject *data = PyObject_CallMethodObjArgs(pickle_module, pickle_dumps,
                                                arg, pickle_protocol, NULL);
    if (data == NULL) {
      /* Pickling raised; the exception is already set. */
      goto fail;
    }
    if (!PyBytes_Check(data)) {
      Py_DECREF(data);
      PyErr_SetString(PyExc_TypeError,
                      "pickle.dumps did not return a bytes object");
      goto fail;
    }
    value_data_bytes += PyBytes_GET_SIZE(data);
    /* The array now holds the reference to data. */
    utarray_push_back(val_repr_ptrs, &data);
  }
  /* Construct the task specification. */
  int val_repr_index = 0;
  self->spec = start_construct_task_spec(driver_id, parent_task_id,
                                         parent_counter, function_id, size,
                                         num_returns, value_data_bytes);
  /* Add the task arguments. */
  for (Py_ssize_t i = 0; i < size; ++i) {
    PyObject *arg = PyList_GetItem(arguments, i);
    if (PyObject_IsInstance(arg, (PyObject *) &PyObjectIDType)) {
      task_args_add_ref(self->spec, ((PyObjectID *) arg)->object_id);
    } else {
      /* We do this check because we cast a signed int to an unsigned int. */
      CHECK(val_repr_index >= 0);
      PyObject *data = *((PyObject **) utarray_eltptr(
          val_repr_ptrs, (uint64_t) val_repr_index));
      task_args_add_val(self->spec, (uint8_t *) PyBytes_AS_STRING(data),
                        PyBytes_GET_SIZE(data));
      Py_DECREF(data);
      val_repr_index += 1;
    }
  }
  utarray_free(val_repr_ptrs);
  /* Compute the task ID and the return object IDs. */
  finish_construct_task_spec(self->spec);
  return 0;

fail:
  /* Release the pickled values collected so far, then the array itself. */
  for (unsigned j = 0; j < utarray_len(val_repr_ptrs); ++j) {
    Py_DECREF(*(PyObject **) utarray_eltptr(val_repr_ptrs, j));
  }
  utarray_free(val_repr_ptrs);
  return -1;
}
|
|
|
|
/* tp_dealloc for Task: release the task specification, if there is one, and
 * then free the Python object through its type's tp_free slot. */
static void PyTask_dealloc(PyTask *self) {
  task_spec *owned_spec = self->spec;
  if (owned_spec != NULL) {
    free_task_spec(owned_spec);
  }
  Py_TYPE(self)->tp_free((PyObject *) self);
}
|
|
|
|
/* Method "function_id": wrap the result of task_function for this task's
 * specification in a new ObjectID. */
static PyObject *PyTask_function_id(PyObject *self) {
  PyTask *task = (PyTask *) self;
  return PyObjectID_make(task_function(task->spec));
}
|
|
|
|
/* Method "driver_id": wrap the result of task_spec_driver_id for this task's
 * specification in a new ObjectID. */
static PyObject *PyTask_driver_id(PyObject *self) {
  PyTask *task = (PyTask *) self;
  return PyObjectID_make(task_spec_driver_id(task->spec));
}
|
|
|
|
/* Method "task_id": wrap the result of task_spec_id for this task's
 * specification in a new ObjectID. */
static PyObject *PyTask_task_id(PyObject *self) {
  PyTask *task = (PyTask *) self;
  return PyObjectID_make(task_spec_id(task->spec));
}
|
|
|
|
/**
 * Method "arguments": return the task's arguments as a Python list.
 *
 * Arguments stored by reference become ObjectID objects; arguments stored by
 * value are unpickled with the cached pickle module.
 *
 * @return A new list, or NULL with an exception set if allocating the list,
 *         creating an element or unpickling a value failed.
 */
static PyObject *PyTask_arguments(PyObject *self) {
  task_spec *task = ((PyTask *) self)->spec;
  int64_t num_args = task_num_args(task);
  PyObject *arg_list = PyList_New((Py_ssize_t) num_args);
  if (arg_list == NULL) {
    return NULL;
  }
  for (int64_t i = 0; i < num_args; ++i) {
    PyObject *item = NULL;
    if (task_arg_type(task, i) == ARG_BY_REF) {
      item = PyObjectID_make(task_arg_id(task, i));
    } else {
      CHECK(pickle_module != NULL);
      CHECK(pickle_loads != NULL);
      PyObject *str =
          PyBytes_FromStringAndSize((char *) task_arg_val(task, i),
                                    (Py_ssize_t) task_arg_length(task, i));
      if (str != NULL) {
        item =
            PyObject_CallMethodObjArgs(pickle_module, pickle_loads, str, NULL);
        Py_DECREF(str);
      }
    }
    if (item == NULL) {
      /* Do not hand back a partially filled list while an exception is
       * pending. */
      Py_DECREF(arg_list);
      return NULL;
    }
    /* PyList_SetItem takes over the reference to item. */
    PyList_SetItem(arg_list, (Py_ssize_t) i, item);
  }
  return arg_list;
}
|
|
|
|
/**
 * Method "returns": return the object IDs of the task's return values.
 *
 * @return A new list of ObjectID objects, or NULL with an exception set if
 *         allocating the list or one of its elements failed.
 */
static PyObject *PyTask_returns(PyObject *self) {
  task_spec *task = ((PyTask *) self)->spec;
  int64_t num_returns = task_num_returns(task);
  PyObject *return_id_list = PyList_New((Py_ssize_t) num_returns);
  if (return_id_list == NULL) {
    return NULL;
  }
  for (int64_t i = 0; i < num_returns; ++i) {
    PyObject *return_id = PyObjectID_make(task_return(task, i));
    if (return_id == NULL) {
      Py_DECREF(return_id_list);
      return NULL;
    }
    /* PyList_SetItem takes over the reference to return_id. */
    PyList_SetItem(return_id_list, (Py_ssize_t) i, return_id);
  }
  return return_id_list;
}
|
|
|
|
static PyMethodDef PyTask_methods[] = {
|
|
{"function_id", (PyCFunction) PyTask_function_id, METH_NOARGS,
|
|
"Return the function ID for this task."},
|
|
{"driver_id", (PyCFunction) PyTask_driver_id, METH_NOARGS,
|
|
"Return the driver ID for this task."},
|
|
{"task_id", (PyCFunction) PyTask_task_id, METH_NOARGS,
|
|
"Return the task ID for this task."},
|
|
{"arguments", (PyCFunction) PyTask_arguments, METH_NOARGS,
|
|
"Return the arguments for the task."},
|
|
{"returns", (PyCFunction) PyTask_returns, METH_NOARGS,
|
|
"Return the object IDs for the return values of the task."},
|
|
{NULL} /* Sentinel */
|
|
};
|
|
|
|
PyTypeObject PyTaskType = {
|
|
PyVarObject_HEAD_INIT(NULL, 0) /* ob_size */
|
|
"task.Task", /* tp_name */
|
|
sizeof(PyTask), /* tp_basicsize */
|
|
0, /* tp_itemsize */
|
|
(destructor) PyTask_dealloc, /* tp_dealloc */
|
|
0, /* tp_print */
|
|
0, /* tp_getattr */
|
|
0, /* tp_setattr */
|
|
0, /* tp_compare */
|
|
0, /* tp_repr */
|
|
0, /* tp_as_number */
|
|
0, /* tp_as_sequence */
|
|
0, /* tp_as_mapping */
|
|
0, /* tp_hash */
|
|
0, /* tp_call */
|
|
0, /* tp_str */
|
|
0, /* tp_getattro */
|
|
0, /* tp_setattro */
|
|
0, /* tp_as_buffer */
|
|
Py_TPFLAGS_DEFAULT, /* tp_flags */
|
|
"Task object", /* tp_doc */
|
|
0, /* tp_traverse */
|
|
0, /* tp_clear */
|
|
0, /* tp_richcompare */
|
|
0, /* tp_weaklistoffset */
|
|
0, /* tp_iter */
|
|
0, /* tp_iternext */
|
|
PyTask_methods, /* tp_methods */
|
|
0, /* tp_members */
|
|
0, /* tp_getset */
|
|
0, /* tp_base */
|
|
0, /* tp_dict */
|
|
0, /* tp_descr_get */
|
|
0, /* tp_descr_set */
|
|
0, /* tp_dictoffset */
|
|
(initproc) PyTask_init, /* tp_init */
|
|
0, /* tp_alloc */
|
|
PyType_GenericNew, /* tp_new */
|
|
};
|
|
|
|
/* Create a PyTask from a C struct. The resulting PyTask takes ownership of the
|
|
* task_spec and will deallocate the task_spec in the PyTask destructor. */
|
|
PyObject *PyTask_make(task_spec *task_spec) {
|
|
PyTask *result = PyObject_New(PyTask, &PyTaskType);
|
|
result = (PyTask *) PyObject_Init((PyObject *) result, &PyTaskType);
|
|
result->spec = task_spec;
|
|
return (PyObject *) result;
|
|
}
|
|
|
|
/* Define the methods for the module. */
|
|
|
|
/* A list, dict or tuple must have fewer than this many direct entries to be
 * considered by is_simple_value. */
#define SIZE_LIMIT 100
/* Upper bound on the running element count kept by is_simple_value; reaching
 * it makes the value "not simple". */
#define NUM_ELEMENTS_LIMIT 1000

/* Python 3 has no separate int type check; map the Python 2 name onto the
 * long check so the same code compiles for both. */
#if PY_MAJOR_VERSION >= 3
#define PyInt_Check PyLong_Check
#endif
|
|
|
|
/**
|
|
* This method checks if a Python object is sufficiently simple that it can be
|
|
* serialized and passed by value as an argument to a task (without being put in
|
|
* the object store). The details of which objects are sufficiently simple are
|
|
* defined by this method and are not particularly important. But for
|
|
* performance reasons, it is better to place "small" objects in the task itself
|
|
* and "large" objects in the object store.
|
|
*
|
|
* @param value The Python object in question.
|
|
* @param num_elements_contained If this method returns 1, then the number of
|
|
* objects recursively contained within this object will be added to the
|
|
* value at this address. This is used to make sure that we do not
|
|
* serialize objects that are too large.
|
|
* @return 0 if the object cannot be serialized in the task and 1 if it can.
|
|
*/
|
|
int is_simple_value(PyObject *value, int *num_elements_contained) {
|
|
*num_elements_contained += 1;
|
|
if (*num_elements_contained >= NUM_ELEMENTS_LIMIT) {
|
|
return 0;
|
|
}
|
|
if (PyInt_Check(value) || PyLong_Check(value) || value == Py_False ||
|
|
value == Py_True || PyFloat_Check(value) || value == Py_None) {
|
|
return 1;
|
|
}
|
|
if (PyBytes_CheckExact(value)) {
|
|
*num_elements_contained += PyBytes_Size(value);
|
|
return (*num_elements_contained < NUM_ELEMENTS_LIMIT);
|
|
}
|
|
if (PyUnicode_CheckExact(value)) {
|
|
*num_elements_contained += PyUnicode_GET_SIZE(value);
|
|
return (*num_elements_contained < NUM_ELEMENTS_LIMIT);
|
|
}
|
|
if (PyList_CheckExact(value) && PyList_Size(value) < SIZE_LIMIT) {
|
|
for (Py_ssize_t i = 0; i < PyList_Size(value); ++i) {
|
|
if (!is_simple_value(PyList_GetItem(value, i), num_elements_contained)) {
|
|
return 0;
|
|
}
|
|
}
|
|
return (*num_elements_contained < NUM_ELEMENTS_LIMIT);
|
|
}
|
|
if (PyDict_CheckExact(value) && PyDict_Size(value) < SIZE_LIMIT) {
|
|
PyObject *key, *val;
|
|
Py_ssize_t pos = 0;
|
|
while (PyDict_Next(value, &pos, &key, &val)) {
|
|
if (!is_simple_value(key, num_elements_contained) ||
|
|
!is_simple_value(val, num_elements_contained)) {
|
|
return 0;
|
|
}
|
|
}
|
|
return (*num_elements_contained < NUM_ELEMENTS_LIMIT);
|
|
}
|
|
if (PyTuple_CheckExact(value) && PyTuple_Size(value) < SIZE_LIMIT) {
|
|
for (Py_ssize_t i = 0; i < PyTuple_Size(value); ++i) {
|
|
if (!is_simple_value(PyTuple_GetItem(value, i), num_elements_contained)) {
|
|
return 0;
|
|
}
|
|
}
|
|
return (*num_elements_contained < NUM_ELEMENTS_LIMIT);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/**
 * Python entry point around is_simple_value.
 *
 * Takes a single object and returns True if is_simple_value accepts it,
 * starting from an element count of zero, and False otherwise.
 *
 * @return A new reference to Py_True or Py_False, or NULL if argument parsing
 *         failed.
 */
PyObject *check_simple_value(PyObject *self, PyObject *args) {
  PyObject *candidate;
  if (!PyArg_ParseTuple(args, "O", &candidate)) {
    return NULL;
  }
  int element_count = 0;
  PyObject *verdict =
      is_simple_value(candidate, &element_count) ? Py_True : Py_False;
  /* The boolean singletons are borrowed; return an owned reference. */
  Py_INCREF(verdict);
  return verdict;
}
|
|
|
|
/**
 * Python entry point around task_compute_put_id.
 *
 * Takes a task ID (an ObjectID) and an integer put index, and returns the
 * result of task_compute_put_id wrapped in a new ObjectID.
 *
 * @return A new ObjectID, or NULL if argument parsing failed.
 */
PyObject *compute_put_id(PyObject *self, PyObject *args) {
  task_id owner_task_id;
  int index_of_put;
  int parsed = PyArg_ParseTuple(args, "O&i", &PyObjectToUniqueID,
                                &owner_task_id, &index_of_put);
  if (!parsed) {
    return NULL;
  }
  return PyObjectID_make(task_compute_put_id(owner_task_id, index_of_put));
}
|