mirror of
https://github.com/wassname/ray.git
synced 2026-06-30 08:27:21 +08:00
96913be939
* Treat actor creation like a regular task. * Small cleanups. * Change semantics of actor resource handling. * Bug fix. * Minor linting * Bug fix * Fix jenkins test. * Fix actor tests * Some cleanups * Bug fix * Fix bug. * Remove cached actor tasks when a driver is removed. * Add more info to taskspec in global state API. * Fix cyclic import bug in tune. * Fix * Fix linting. * Fix linting. * Don't schedule any tasks (especially actor creaiton tasks) on local schedulers with 0 CPUs. * Bug fix. * Add test for 0 CPU case * Fix linting * Address comments. * Fix typos and add comment. * Add assertion and fix test.
605 lines
20 KiB
C++
605 lines
20 KiB
C++
#ifndef TASK_H
|
|
#define TASK_H
|
|
|
|
#include <unordered_map>
|
|
|
|
#include <stddef.h>
|
|
#include <stdint.h>
|
|
#include "common.h"
|
|
|
|
#include <string>
|
|
|
|
#include "format/common_generated.h"
|
|
|
|
using namespace ray;
|
|
|
|
typedef char TaskSpec;
|
|
|
|
class TaskExecutionSpec {
|
|
public:
|
|
TaskExecutionSpec(const std::vector<ObjectID> &execution_dependencies,
|
|
const TaskSpec *spec,
|
|
int64_t task_spec_size);
|
|
TaskExecutionSpec(const std::vector<ObjectID> &execution_dependencies,
|
|
const TaskSpec *spec,
|
|
int64_t task_spec_size,
|
|
int spillback_count);
|
|
TaskExecutionSpec(TaskExecutionSpec *execution_spec);
|
|
|
|
/// Get the task's execution dependencies.
|
|
///
|
|
/// @return A vector of object IDs representing this task's execution
|
|
/// dependencies.
|
|
std::vector<ObjectID> ExecutionDependencies() const;
|
|
|
|
/// Set the task's execution dependencies.
|
|
///
|
|
/// @param dependencies The value to set the execution dependencies to.
|
|
/// @return Void.
|
|
void SetExecutionDependencies(const std::vector<ObjectID> &dependencies);
|
|
|
|
/// Get the task spec size.
|
|
///
|
|
/// @return The size of the immutable task spec.
|
|
int64_t SpecSize() const;
|
|
|
|
/// Get the task's spillback count, which tracks the number of times
|
|
/// this task was spilled back from local to the global scheduler.
|
|
///
|
|
/// @return The spillback count for this task.
|
|
int SpillbackCount() const;
|
|
|
|
/// Increment the spillback count for this task.
|
|
///
|
|
/// @return Void.
|
|
void IncrementSpillbackCount();
|
|
|
|
/// Get the task's last timestamp.
|
|
///
|
|
/// @return The timestamp when this task was last received for scheduling.
|
|
int64_t LastTimeStamp() const;
|
|
|
|
/// Set the task's last timestamp to the specified value.
|
|
///
|
|
/// @param new_timestamp The new timestamp in millisecond to set the task's
|
|
/// time stamp to. Tracks the last time this task entered a local
|
|
/// scheduler.
|
|
/// @return Void.
|
|
void SetLastTimeStamp(int64_t new_timestamp);
|
|
|
|
/// Get the task spec.
|
|
///
|
|
/// @return A pointer to the immutable task spec.
|
|
TaskSpec *Spec() const;
|
|
|
|
/// Get the number of dependencies. This comprises the immutable task
|
|
/// arguments and the mutable execution dependencies.
|
|
///
|
|
/// @return The number of dependencies.
|
|
int64_t NumDependencies() const;
|
|
|
|
/// Get the number of object IDs at the given dependency index.
|
|
///
|
|
/// @param dependency_index The dependency index whose object IDs to count.
|
|
/// @return The number of object IDs at the given dependency_index.
|
|
int DependencyIdCount(int64_t dependency_index) const;
|
|
|
|
/// Get the object ID of a given dependency index.
|
|
///
|
|
/// @param dependency_index The index at which we should look up the object
|
|
/// ID.
|
|
/// @param id_index The index of the object ID.
|
|
ObjectID DependencyId(int64_t dependency_index, int64_t id_index) const;
|
|
|
|
/// Compute whether the task is dependent on an object ID.
|
|
///
|
|
/// @param object_id The object ID that the task may be dependent on.
|
|
/// @return bool This returns true if the task is dependent on the given
|
|
/// object ID and false otherwise.
|
|
bool DependsOn(ObjectID object_id) const;
|
|
|
|
/// Returns whether the given dependency index is a static dependency (an
|
|
/// argument of the immutable task).
|
|
///
|
|
/// @param dependency_index The requested dependency index.
|
|
/// @return bool This returns true if the requested dependency index is
|
|
/// immutable (an argument of the task).
|
|
bool IsStaticDependency(int64_t dependency_index) const;
|
|
|
|
private:
|
|
/** A list of object IDs representing this task's dependencies at execution
|
|
* time. */
|
|
std::vector<ObjectID> execution_dependencies_;
|
|
/** The size of the task specification for this task. */
|
|
int64_t task_spec_size_;
|
|
/** Last time this task was received for scheduling. */
|
|
int64_t last_timestamp_;
|
|
/** Number of times this task was spilled back by local schedulers. */
|
|
int spillback_count_;
|
|
/** The task specification for this task. */
|
|
std::unique_ptr<TaskSpec[]> spec_;
|
|
};
|
|
|
|
class TaskBuilder;
|
|
|
|
typedef UniqueID FunctionID;
|
|
|
|
/** The task ID is a deterministic hash of the function ID that the task
|
|
* executes and the argument IDs or argument values. */
|
|
typedef UniqueID TaskID;
|
|
|
|
/** The actor ID is the ID of the actor that a task must run on. If the task is
|
|
* not run on an actor, then NIL_ACTOR_ID should be used. */
|
|
typedef UniqueID ActorID;
|
|
|
|
/**
|
|
* Compare two task IDs.
|
|
*
|
|
* @param first_id The first task ID to compare.
|
|
* @param second_id The first task ID to compare.
|
|
* @return True if the task IDs are the same and false otherwise.
|
|
*/
|
|
bool TaskID_equal(TaskID first_id, TaskID second_id);
|
|
|
|
/**
|
|
* Compare a task ID to the nil ID.
|
|
*
|
|
* @param id The task ID to compare to nil.
|
|
* @return True if the task ID is equal to nil.
|
|
*/
|
|
bool TaskID_is_nil(TaskID id);
|
|
|
|
/**
|
|
* Compare two actor IDs.
|
|
*
|
|
* @param first_id The first actor ID to compare.
|
|
* @param second_id The first actor ID to compare.
|
|
* @return True if the actor IDs are the same and false otherwise.
|
|
*/
|
|
bool ActorID_equal(ActorID first_id, ActorID second_id);
|
|
|
|
/**
|
|
* Compare two function IDs.
|
|
*
|
|
* @param first_id The first function ID to compare.
|
|
* @param second_id The first function ID to compare.
|
|
* @return True if the function IDs are the same and false otherwise.
|
|
*/
|
|
bool FunctionID_equal(FunctionID first_id, FunctionID second_id);
|
|
|
|
/**
|
|
* Compare a function ID to the nil ID.
|
|
*
|
|
* @param id The function ID to compare to nil.
|
|
* @return True if the function ID is equal to nil.
|
|
*/
|
|
bool FunctionID_is_nil(FunctionID id);
|
|
|
|
/* Construct and modify task specifications. */
|
|
|
|
TaskBuilder *make_task_builder(void);
|
|
|
|
void free_task_builder(TaskBuilder *builder);
|
|
|
|
/**
|
|
* Begin constructing a task_spec. After this is called, the arguments must be
|
|
* added to the task_spec and then finish_construct_task_spec must be called.
|
|
*
|
|
* @param driver_id The ID of the driver whose job is responsible for the
|
|
* creation of this task.
|
|
* @param parent_task_id The task ID of the task that submitted this task.
|
|
* @param parent_counter A counter indicating how many tasks were submitted by
|
|
* the parent task prior to this one.
|
|
* @param actor_creation_id The actor creation ID of this task.
|
|
* @param actor_creation_dummy_object_id The dummy object for the corresponding
|
|
* actor creation task, assuming this is an actor method.
|
|
* @param actor_id The ID of the actor that this task is for. If it is not an
|
|
* actor task, then this if NIL_ACTOR_ID.
|
|
* @param actor_handle_id The ID of the actor handle that this task was
|
|
* submitted through. If it is not an actor task, or if this is the
|
|
* original handle, then this is NIL_ACTOR_ID.
|
|
* @param actor_counter A counter indicating how many tasks have been submitted
|
|
* to the same actor before this one.
|
|
* @param is_actor_checkpoint_method True if this is an actor checkpoint method
|
|
* and false otherwise.
|
|
* @param function_id The function ID of the function to execute in this task.
|
|
* @param num_args The number of arguments that this task has.
|
|
* @param num_returns The number of return values that this task has.
|
|
* @param args_value_size The total size in bytes of the arguments to this task
|
|
ignoring object ID arguments.
|
|
* @return The partially constructed task_spec.
|
|
*/
|
|
void TaskSpec_start_construct(TaskBuilder *B,
|
|
UniqueID driver_id,
|
|
TaskID parent_task_id,
|
|
int64_t parent_counter,
|
|
ActorID actor_creation_id,
|
|
ObjectID actor_creation_dummy_object_id,
|
|
ActorID actor_id,
|
|
ActorHandleID actor_handle_id,
|
|
int64_t actor_counter,
|
|
bool is_actor_checkpoint_method,
|
|
FunctionID function_id,
|
|
int64_t num_returns);
|
|
|
|
/**
|
|
* Finish constructing a task_spec. This computes the task ID and the object IDs
|
|
* of the task return values. This must be called after all of the arguments
|
|
* have been added to the task.
|
|
*
|
|
* @param spec The task spec whose ID and return object IDs should be computed.
|
|
* @return Void.
|
|
*/
|
|
TaskSpec *TaskSpec_finish_construct(TaskBuilder *builder, int64_t *size);
|
|
|
|
/**
|
|
* Return the function ID of the task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The function ID of the function to execute in this task.
|
|
*/
|
|
FunctionID TaskSpec_function(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return the actor ID of the task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The actor ID of the actor the task is part of.
|
|
*/
|
|
ActorID TaskSpec_actor_id(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return the actor handle ID of the task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The ID of the actor handle that the task was submitted through.
|
|
*/
|
|
ActorID TaskSpec_actor_handle_id(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return whether this task is for an actor.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return Whether the task is for an actor.
|
|
*/
|
|
bool TaskSpec_is_actor_task(TaskSpec *spec);
|
|
|
|
/// Return whether this task is an actor creation task or not.
|
|
///
|
|
/// \param spec The task_spec in question.
|
|
/// \return True if this task is an actor creation task and false otherwise.
|
|
bool TaskSpec_is_actor_creation_task(TaskSpec *spec);
|
|
|
|
/// Return the actor creation ID of the task. The task must be an actor creation
|
|
/// task.
|
|
///
|
|
/// \param spec The task_spec in question.
|
|
/// \return The actor creation ID if this is an actor creation task.
|
|
ActorID TaskSpec_actor_creation_id(TaskSpec *spec);
|
|
|
|
/// Return the actor creation dummy object ID of the task. The task must be an
|
|
/// actor task.
|
|
///
|
|
/// \param spec The task_spec in question.
|
|
/// \return The actor creation dummy object ID corresponding to this actor task.
|
|
ObjectID TaskSpec_actor_creation_dummy_object_id(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return the actor counter of the task. This starts at 0 and increments by 1
|
|
* every time a new task is submitted to run on the actor.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The actor counter of the task.
|
|
*/
|
|
int64_t TaskSpec_actor_counter(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return whether the task is a checkpoint method execution.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return Whether the task is a checkpoint method.
|
|
*/
|
|
bool TaskSpec_is_actor_checkpoint_method(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return an actor task's dummy return value. Dummy objects are used to
|
|
* encode an actor's state dependencies in the task graph. The dummy object
|
|
* is local if and only if the task that returned it has completed
|
|
* execution.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The dummy object ID that the actor task will return.
|
|
*/
|
|
ObjectID TaskSpec_actor_dummy_object(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return the driver ID of the task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The driver ID of the task.
|
|
*/
|
|
UniqueID TaskSpec_driver_id(const TaskSpec *spec);
|
|
|
|
/**
|
|
* Return the task ID of the parent task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The task ID of the parent task.
|
|
*/
|
|
TaskID TaskSpec_parent_task_id(const TaskSpec *spec);
|
|
|
|
/**
|
|
* Return the task counter of the parent task. For example, this equals 5 if
|
|
* this task was the 6th task submitted by the parent task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The task counter of the parent task.
|
|
*/
|
|
int64_t TaskSpec_parent_counter(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return the task ID of the task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The task ID of the task.
|
|
*/
|
|
TaskID TaskSpec_task_id(const TaskSpec *spec);
|
|
|
|
/**
|
|
* Get the number of arguments to this task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The number of arguments to this task.
|
|
*/
|
|
int64_t TaskSpec_num_args(TaskSpec *spec);
|
|
|
|
/**
|
|
* Get the number of return values expected from this task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The number of return values expected from this task.
|
|
*/
|
|
int64_t TaskSpec_num_returns(TaskSpec *spec);
|
|
|
|
/**
|
|
* Return true if this argument is passed by reference.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @param arg_index The index of the argument in question.
|
|
* @return True if this argument is passed by reference.
|
|
*/
|
|
bool TaskSpec_arg_by_ref(TaskSpec *spec, int64_t arg_index);
|
|
|
|
/**
|
|
* Get number of object IDs in a given argument
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @param arg_index The index of the argument in question.
|
|
* @return number of object IDs in this argument
|
|
*/
|
|
int TaskSpec_arg_id_count(TaskSpec *spec, int64_t arg_index);
|
|
|
|
/**
|
|
* Get a particular argument to this task. This assumes the argument is an
|
|
* object ID.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @param arg_index The index of the argument in question.
|
|
* @param id_index The index of the object ID in this arg.
|
|
* @return The argument at that index.
|
|
*/
|
|
ObjectID TaskSpec_arg_id(TaskSpec *spec, int64_t arg_index, int64_t id_index);
|
|
|
|
/**
|
|
* Get a particular argument to this task. This assumes the argument is a value.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @param arg_index The index of the argument in question.
|
|
* @return The argument at that index.
|
|
*/
|
|
const uint8_t *TaskSpec_arg_val(TaskSpec *spec, int64_t arg_index);
|
|
|
|
/**
|
|
* Get the number of bytes in a particular argument to this task. This assumes
|
|
* the argument is a value.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @param arg_index The index of the argument in question.
|
|
* @return The number of bytes in the argument.
|
|
*/
|
|
int64_t TaskSpec_arg_length(TaskSpec *spec, int64_t arg_index);
|
|
|
|
/**
|
|
* Set the next task argument. Note that this API only allows you to set the
|
|
* arguments in their order of appearance.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @param object_ids The object IDs to set the argument to.
|
|
* @param num_object_ids number of IDs in this param, usually 1.
|
|
* @return The number of task arguments that have been set before this one. This
|
|
* is only used for testing.
|
|
*/
|
|
void TaskSpec_args_add_ref(TaskBuilder *spec,
|
|
ObjectID object_ids[],
|
|
int num_object_ids);
|
|
|
|
/**
|
|
* Set the next task argument. Note that this API only allows you to set the
|
|
* arguments in their order of appearance.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @param The value to set the argument to.
|
|
* @param The length of the value to set the argument to.
|
|
* @return The number of task arguments that have been set before this one. This
|
|
* is only used for testing.
|
|
*/
|
|
void TaskSpec_args_add_val(TaskBuilder *builder,
|
|
uint8_t *value,
|
|
int64_t length);
|
|
|
|
/**
|
|
* Set the value associated to a resource index.
|
|
*
|
|
* @param spec Task specification.
|
|
* @param resource_name Name of the resource in the resource vector.
|
|
* @param value Value for the resource. This can be a quantity of this resource
|
|
* this task needs or a value for an attribute this task requires.
|
|
* @return Void.
|
|
*/
|
|
void TaskSpec_set_required_resource(TaskBuilder *builder,
|
|
const std::string &resource_name,
|
|
double value);
|
|
|
|
/**
|
|
* Get a particular return object ID of a task.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @param return_index The index of the return object ID in question.
|
|
* @return The relevant return object ID.
|
|
*/
|
|
ObjectID TaskSpec_return(TaskSpec *data, int64_t return_index);
|
|
|
|
/**
|
|
* Get the value associated to a resource name.
|
|
*
|
|
* @param spec Task specification.
|
|
* @param resource_name Name of the resource.
|
|
* @return How many of this resource the task needs to execute.
|
|
*/
|
|
double TaskSpec_get_required_resource(const TaskSpec *spec,
|
|
const std::string &resource_name);
|
|
|
|
/**
|
|
*
|
|
*/
|
|
const std::unordered_map<std::string, double> TaskSpec_get_required_resources(
|
|
const TaskSpec *spec);
|
|
|
|
/**
|
|
* Compute the object id associated to a put call.
|
|
*
|
|
* @param task_id The task id of the parent task that called the put.
|
|
* @param put_index The number of put calls in this task so far.
|
|
* @return The object ID for the object that was put.
|
|
*/
|
|
ObjectID task_compute_put_id(TaskID task_id, int64_t put_index);
|
|
|
|
/**
|
|
* Print the task as a humanly readable string.
|
|
*
|
|
* @param spec The task_spec in question.
|
|
* @return The humanly readable string.
|
|
*/
|
|
std::string TaskSpec_print(TaskSpec *spec);
|
|
|
|
/**
|
|
* Create a copy of the task spec. Must be freed with TaskSpec_free after use.
|
|
*
|
|
* @param spec The task specification that will be copied.
|
|
* @param task_spec_size The size of the task specification in bytes.
|
|
* @returns Pointer to the copy of the task specification.
|
|
*/
|
|
TaskSpec *TaskSpec_copy(TaskSpec *spec, int64_t task_spec_size);
|
|
|
|
/**
|
|
* Free a task_spec.
|
|
*
|
|
* @param The task_spec in question.
|
|
* @return Void.
|
|
*/
|
|
void TaskSpec_free(TaskSpec *spec);
|
|
|
|
/**
|
|
* ==== Task ====
|
|
* Contains information about a scheduled task: The task specification, the
|
|
* task scheduling state (WAITING, SCHEDULED, QUEUED, RUNNING, DONE), and which
|
|
* local scheduler the task is scheduled on.
|
|
*/
|
|
|
|
/** The scheduling_state can be used as a flag when we are listening
|
|
* for an event, for example TASK_WAITING | TASK_SCHEDULED. */
|
|
typedef enum {
|
|
/** The task is waiting to be scheduled. */
|
|
TASK_STATUS_WAITING = 1,
|
|
/** The task has been scheduled to a node, but has not been queued yet. */
|
|
TASK_STATUS_SCHEDULED = 2,
|
|
/** The task has been queued on a node, where it will wait for its
|
|
* dependencies to become ready and a worker to become available. */
|
|
TASK_STATUS_QUEUED = 4,
|
|
/** The task is running on a worker. */
|
|
TASK_STATUS_RUNNING = 8,
|
|
/** The task is done executing. */
|
|
TASK_STATUS_DONE = 16,
|
|
/** The task was not able to finish. */
|
|
TASK_STATUS_LOST = 32,
|
|
/** The task will be submitted for reexecution. */
|
|
TASK_STATUS_RECONSTRUCTING = 64,
|
|
/** An actor task is cached at a local scheduler and is waiting for the
|
|
* corresponding actor to be created. */
|
|
TASK_STATUS_ACTOR_CACHED = 128
|
|
} scheduling_state;
|
|
|
|
/** A task is an execution of a task specification. It has a state of execution
|
|
* (see scheduling_state) and the ID of the local scheduler it is scheduled on
|
|
* or running on. */
|
|
|
|
struct Task {
|
|
/** The scheduling state of the task. */
|
|
int state;
|
|
/** The ID of the local scheduler involved. */
|
|
DBClientID local_scheduler_id;
|
|
/** The execution specification for this task. */
|
|
std::unique_ptr<TaskExecutionSpec> execution_spec;
|
|
};
|
|
|
|
/**
|
|
* Allocate a new task. Must be freed with free_task after use.
|
|
*
|
|
* @param spec The task spec for the new task.
|
|
* @param state The scheduling state for the new task.
|
|
* @param local_scheduler_id The ID of the local scheduler that the task is
|
|
* scheduled on, if any.
|
|
*/
|
|
Task *Task_alloc(const TaskSpec *spec,
|
|
int64_t task_spec_size,
|
|
int state,
|
|
DBClientID local_scheduler_id,
|
|
const std::vector<ObjectID> &execution_dependencies);
|
|
|
|
Task *Task_alloc(TaskExecutionSpec &execution_spec,
|
|
int state,
|
|
DBClientID local_scheduler_id);
|
|
|
|
/**
|
|
* Create a copy of the task. Must be freed with Task_free after use.
|
|
*
|
|
* @param other The task that will be copied.
|
|
* @returns Pointer to the copy of the task.
|
|
*/
|
|
Task *Task_copy(Task *other);
|
|
|
|
/** Size of task structure in bytes. */
|
|
int64_t Task_size(Task *task);
|
|
|
|
/** The scheduling state of the task. */
|
|
int Task_state(Task *task);
|
|
|
|
/** Update the schedule state of the task. */
|
|
void Task_set_state(Task *task, int state);
|
|
|
|
/** Local scheduler this task has been assigned to or is running on. */
|
|
DBClientID Task_local_scheduler(Task *task);
|
|
|
|
/** Set the local scheduler ID for this task. */
|
|
void Task_set_local_scheduler(Task *task, DBClientID local_scheduler_id);
|
|
|
|
TaskExecutionSpec *Task_task_execution_spec(Task *task);
|
|
|
|
/** Task ID of this task. */
|
|
TaskID Task_task_id(Task *task);
|
|
|
|
/** Free this task datastructure. */
|
|
void Task_free(Task *task);
|
|
|
|
#endif /* TASK_H */
|