mirror of
https://github.com/wassname/ray.git
synced 2026-06-28 00:29:38 +08:00
[Java] Java worker cluster support (#2359)
This commit is contained in:
committed by
Robert Nishihara
parent
4ef9d15315
commit
fa33ea5283
@@ -0,0 +1,15 @@
|
||||
<assembly>
|
||||
<id>ear</id>
|
||||
<formats>
|
||||
<format>zip</format>
|
||||
</formats>
|
||||
<dependencySets>
|
||||
<dependencySet>
|
||||
<useProjectArtifact>true</useProjectArtifact>
|
||||
<outputDirectory>lib</outputDirectory>
|
||||
</dependencySet>
|
||||
</dependencySets>
|
||||
<fileSets>
|
||||
|
||||
</fileSets>
|
||||
</assembly>
|
||||
@@ -0,0 +1,98 @@
|
||||
<?xml version="1.0" encoding="UTF-8"?>
|
||||
|
||||
<project xmlns="http://maven.apache.org/POM/4.0.0"
|
||||
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
|
||||
xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
|
||||
<parent>
|
||||
<groupId>org.ray.parent</groupId>
|
||||
<artifactId>ray-superpom</artifactId>
|
||||
<version>1.0</version>
|
||||
</parent>
|
||||
<modelVersion>4.0.0</modelVersion>
|
||||
<groupId>org.ray</groupId>
|
||||
<artifactId>ray-cli</artifactId>
|
||||
|
||||
<name>java cli for ray</name>
|
||||
<description>java cli for ray</description>
|
||||
<url></url>
|
||||
|
||||
<packaging>jar</packaging>
|
||||
|
||||
<dependencies>
|
||||
<dependency>
|
||||
<groupId>org.ray</groupId>
|
||||
<artifactId>ray-api</artifactId>
|
||||
<version>${project.version}</version>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>org.ray</groupId>
|
||||
<artifactId>ray-runtime-native</artifactId>
|
||||
<version>${project.version}</version>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>de.ruedigermoeller</groupId>
|
||||
<artifactId>fst</artifactId>
|
||||
</dependency>
|
||||
|
||||
<dependency>
|
||||
<groupId>com.github.davidmoten</groupId>
|
||||
<artifactId>flatbuffers-java</artifactId>
|
||||
</dependency>
|
||||
|
||||
<dependency>
|
||||
<groupId>redis.clients</groupId>
|
||||
<artifactId>jedis</artifactId>
|
||||
</dependency>
|
||||
|
||||
<!-- https://mvnrepository.com/artifact/com.beust/jcommander -->
|
||||
<dependency>
|
||||
<groupId>com.beust</groupId>
|
||||
<artifactId>jcommander</artifactId>
|
||||
</dependency>
|
||||
</dependencies>
|
||||
|
||||
<build>
|
||||
<finalName>ray-cli</finalName>
|
||||
<plugins>
|
||||
<plugin>
|
||||
<groupId>org.apache.maven.plugins</groupId>
|
||||
<artifactId>maven-assembly-plugin</artifactId>
|
||||
<configuration>
|
||||
<descriptors>
|
||||
<descriptor>assembly.xml</descriptor>
|
||||
</descriptors>
|
||||
</configuration>
|
||||
<executions>
|
||||
<execution>
|
||||
<id>make-assembly</id>
|
||||
<phase>package</phase>
|
||||
<goals>
|
||||
<goal>single</goal>
|
||||
</goals>
|
||||
</execution>
|
||||
</executions>
|
||||
</plugin>
|
||||
<plugin>
|
||||
<groupId>org.apache.maven.plugins</groupId>
|
||||
<artifactId>maven-dependency-plugin</artifactId>
|
||||
<executions>
|
||||
<execution>
|
||||
<id>copy-dependencies</id>
|
||||
<phase>package</phase>
|
||||
<goals>
|
||||
<goal>copy-dependencies</goal>
|
||||
</goals>
|
||||
<configuration>
|
||||
<outputDirectory>${basedir}/lib</outputDirectory>
|
||||
<overWriteReleases>false</overWriteReleases>
|
||||
<overWriteSnapshots>false</overWriteSnapshots>
|
||||
<overWriteIfNewer>true</overWriteIfNewer>
|
||||
</configuration>
|
||||
</execution>
|
||||
</executions>
|
||||
</plugin>
|
||||
</plugins>
|
||||
|
||||
</build>
|
||||
|
||||
</project>
|
||||
@@ -0,0 +1,21 @@
|
||||
package org.ray.cli;
|
||||
|
||||
import com.beust.jcommander.Parameter;
|
||||
import com.beust.jcommander.Parameters;
|
||||
|
||||
/**
|
||||
* Arguments for command start.
|
||||
*/
|
||||
@Parameters(separators = "= ", commandDescription = "start ray daemons")
|
||||
public class CommandStart {
|
||||
|
||||
@Parameter(names = "--head", description = "start the head node")
|
||||
public boolean head;
|
||||
|
||||
@Parameter(names = "--config", description = "the config file of ray")
|
||||
public String config = "";
|
||||
|
||||
@Parameter(names = "--overwrite", description = "the overwrite items of config")
|
||||
public String overwrite = "";
|
||||
|
||||
}
|
||||
@@ -0,0 +1,11 @@
|
||||
package org.ray.cli;
|
||||
|
||||
import com.beust.jcommander.Parameters;
|
||||
|
||||
/**
|
||||
* Arguments for command stop.
|
||||
*/
|
||||
@Parameters(separators = "= ", commandDescription = "stop ray daemons")
|
||||
public class CommandStop {
|
||||
|
||||
}
|
||||
@@ -0,0 +1,27 @@
|
||||
package org.ray.cli;
|
||||
|
||||
import com.beust.jcommander.Parameter;
|
||||
import com.beust.jcommander.Parameters;
|
||||
|
||||
/**
|
||||
* Arguments for command submit.
|
||||
*/
|
||||
@Parameters(separators = "= ", commandDescription = "submit a job to ray cluster")
|
||||
public class CommandSubmit {
|
||||
|
||||
@Parameter(names = "--package", description = "java jar package zip file", required = true)
|
||||
public String packageZip;
|
||||
|
||||
@Parameter(names = "--class", description = "java class name", required = true)
|
||||
public String className;
|
||||
|
||||
@Parameter(names = "--args", description = "arguments for the java class")
|
||||
public String classArgs;
|
||||
|
||||
@Parameter(names = "--config", description = "the config file of ray")
|
||||
public String config;
|
||||
|
||||
@Parameter(names = "--redis-address", description = "ip:port for redis service", required = true)
|
||||
public String redisAddress;
|
||||
|
||||
}
|
||||
@@ -0,0 +1,290 @@
|
||||
package org.ray.cli;
|
||||
|
||||
import com.beust.jcommander.JCommander;
|
||||
import java.io.File;
|
||||
import java.io.IOException;
|
||||
import java.util.ArrayList;
|
||||
import java.util.List;
|
||||
import net.lingala.zip4j.core.ZipFile;
|
||||
import net.lingala.zip4j.exception.ZipException;
|
||||
import org.ray.api.UniqueID;
|
||||
import org.ray.cli.CommandStart;
|
||||
import org.ray.cli.CommandStop;
|
||||
import org.ray.core.RayRuntime;
|
||||
import org.ray.core.model.RayParameters;
|
||||
import org.ray.core.model.RunMode;
|
||||
import org.ray.runner.RunInfo;
|
||||
import org.ray.runner.RunManager;
|
||||
import org.ray.runner.worker.DefaultDriver;
|
||||
import org.ray.spi.KeyValueStoreLink;
|
||||
import org.ray.spi.PathConfig;
|
||||
import org.ray.spi.RemoteFunctionManager;
|
||||
import org.ray.spi.StateStoreProxy;
|
||||
import org.ray.spi.impl.NativeRemoteFunctionManager;
|
||||
import org.ray.spi.impl.RedisClient;
|
||||
import org.ray.spi.impl.StateStoreProxyImpl;
|
||||
import org.ray.util.FileUtil;
|
||||
import org.ray.util.config.ConfigReader;
|
||||
import org.ray.util.logger.RayLog;
|
||||
|
||||
|
||||
/**
|
||||
* Ray command line interface.
|
||||
*/
|
||||
public class RayCli {
|
||||
|
||||
private static RayCliArgs rayArgs = new RayCliArgs();
|
||||
|
||||
private static RunManager startRayHead(RayParameters params, PathConfig paths,
|
||||
ConfigReader configReader) {
|
||||
RunManager manager = new RunManager(params, paths, configReader);
|
||||
|
||||
try {
|
||||
manager.startRayHead();
|
||||
} catch (Exception e) {
|
||||
e.printStackTrace();
|
||||
RayLog.core.error("error at RayCli startRayHead", e);
|
||||
throw new RuntimeException("Ray head node start failed", e);
|
||||
}
|
||||
|
||||
RayLog.core.info("Started Ray head node. Redis address: " + manager.info().redisAddress);
|
||||
return manager;
|
||||
}
|
||||
|
||||
private static RunManager startRayNode(RayParameters params, PathConfig paths,
|
||||
ConfigReader configReader) {
|
||||
RunManager manager = new RunManager(params, paths, configReader);
|
||||
|
||||
try {
|
||||
manager.startRayNode();
|
||||
} catch (Exception e) {
|
||||
e.printStackTrace();
|
||||
RayLog.core.error("error at RayCli startRayNode", e);
|
||||
throw new RuntimeException("Ray work node start failed, err = " + e.getMessage());
|
||||
}
|
||||
|
||||
RayLog.core.info("Started Ray work node.");
|
||||
return manager;
|
||||
}
|
||||
|
||||
private static RunManager startProcess(CommandStart cmdStart, ConfigReader config) {
|
||||
PathConfig paths = new PathConfig(config);
|
||||
RayParameters params = new RayParameters(config);
|
||||
|
||||
RayLog.core.info("Using IP address " + params.node_ip_address + " for this node.");
|
||||
RunManager manager;
|
||||
if (cmdStart.head) {
|
||||
manager = startRayHead(params, paths, config);
|
||||
} else {
|
||||
manager = startRayNode(params, paths, config);
|
||||
}
|
||||
return manager;
|
||||
}
|
||||
|
||||
private static void start(CommandStart cmdStart, ConfigReader reader) {
|
||||
startProcess(cmdStart, reader);
|
||||
}
|
||||
|
||||
private static void stop(CommandStop cmdStop) {
|
||||
String[] cmd = {"/bin/sh", "-c", ""};
|
||||
|
||||
cmd[2] = "killall global_scheduler local_scheduler plasma_store plasma_manager";
|
||||
try {
|
||||
Runtime.getRuntime().exec(cmd);
|
||||
} catch (IOException e) {
|
||||
RayLog.core.warn("exception in killing ray processes");
|
||||
}
|
||||
|
||||
cmd[2] = "kill $(ps aux | grep redis-server | grep -v grep | "
|
||||
+ "awk \'{ print $2 }\') 2> /dev/null";
|
||||
try {
|
||||
Runtime.getRuntime().exec(cmd);
|
||||
} catch (IOException e) {
|
||||
RayLog.core.warn("exception in killing ray processes");
|
||||
}
|
||||
|
||||
cmd[2] = "kill -9 $(ps aux | grep DefaultWorker | grep -v grep | "
|
||||
+ "awk \'{ print $2 }\') 2> /dev/null";
|
||||
try {
|
||||
Runtime.getRuntime().exec(cmd);
|
||||
} catch (IOException e) {
|
||||
RayLog.core.warn("exception in killing ray processes");
|
||||
}
|
||||
}
|
||||
|
||||
private static String[] buildRayRuntimeArgs(CommandSubmit cmdSubmit) {
|
||||
|
||||
if (cmdSubmit.redisAddress == null) {
|
||||
throw new RuntimeException(
|
||||
"--redis-address must be specified to submit a job");
|
||||
}
|
||||
|
||||
List<String> argList = new ArrayList<String>();
|
||||
String section = "ray.java.start.";
|
||||
String overwrite = "--overwrite="
|
||||
+ section + "redis_address=" + cmdSubmit.redisAddress + ";"
|
||||
+ section + "run_mode=" + "CLUSTER";
|
||||
|
||||
argList.add(overwrite);
|
||||
|
||||
if (cmdSubmit.config != null) {
|
||||
String config = "--config=" + cmdSubmit.config;
|
||||
argList.add(config);
|
||||
}
|
||||
|
||||
String[] args = new String[argList.size()];
|
||||
argList.toArray(args);
|
||||
|
||||
return args;
|
||||
}
|
||||
|
||||
private static void submit(CommandSubmit cmdSubmit, String configPath) throws Exception {
|
||||
ConfigReader config = new ConfigReader(configPath, "ray.java.start.deploy=true");
|
||||
PathConfig paths = new PathConfig(config);
|
||||
RayParameters params = new RayParameters(config);
|
||||
|
||||
params.redis_address = cmdSubmit.redisAddress;
|
||||
params.run_mode = RunMode.CLUSTER;
|
||||
|
||||
|
||||
KeyValueStoreLink kvStore = new RedisClient();
|
||||
kvStore.setAddr(cmdSubmit.redisAddress);
|
||||
StateStoreProxy stateStoreProxy = new StateStoreProxyImpl(kvStore);
|
||||
stateStoreProxy.initializeGlobalState();
|
||||
|
||||
RemoteFunctionManager functionManager = new NativeRemoteFunctionManager(kvStore);
|
||||
|
||||
// Register app to Redis.
|
||||
byte[] zip = FileUtil.fileToBytes(cmdSubmit.packageZip);
|
||||
|
||||
String packageName = cmdSubmit.packageZip.substring(
|
||||
cmdSubmit.packageZip.lastIndexOf('/') + 1,
|
||||
cmdSubmit.packageZip.lastIndexOf('.'));
|
||||
|
||||
//final RemoteFunctionManager functionManager = RayRuntime
|
||||
// .getInstance().getRemoteFunctionManager();
|
||||
|
||||
UniqueID resourceId = functionManager.registerResource(zip);
|
||||
RayLog.rapp.debug(
|
||||
"registerResource " + resourceId + " for package " + packageName + " done");
|
||||
|
||||
UniqueID appId = params.driver_id;
|
||||
functionManager.registerApp(appId, resourceId);
|
||||
RayLog.rapp.debug("registerApp " + appId + " for resouorce " + resourceId + " done");
|
||||
|
||||
// Unzip the package file.
|
||||
String appDir = "/tmp/" + cmdSubmit.className;
|
||||
String extPath = appDir + "/" + packageName;
|
||||
if (!FileUtil.createDir(extPath, false)) {
|
||||
throw new RuntimeException("create dir " + extPath + " failed ");
|
||||
}
|
||||
|
||||
ZipFile zipFile = new ZipFile(cmdSubmit.packageZip);
|
||||
zipFile.extractAll(extPath);
|
||||
|
||||
// Build the args for driver process.
|
||||
File originDirFile = new File(extPath);
|
||||
File[] topFiles = originDirFile.listFiles();
|
||||
String topDir = null;
|
||||
for (File file : topFiles) {
|
||||
if (file.isDirectory()) {
|
||||
topDir = file.getName();
|
||||
}
|
||||
}
|
||||
RayLog.rapp.debug("topDir of app classes: " + topDir);
|
||||
if (topDir == null) {
|
||||
RayLog.rapp.error("Can't find topDir of app classes, the app directory " + appDir);
|
||||
return;
|
||||
}
|
||||
|
||||
String additionalClassPath = appDir + "/" + packageName + "/" + topDir + "/*";
|
||||
RayLog.rapp.debug("Find app class path " + additionalClassPath);
|
||||
|
||||
// Start driver process.
|
||||
//RunManager runManager = new RunManager(params, RayRuntime.getInstance().getPaths(),
|
||||
// RayRuntime.configReader);
|
||||
RunManager runManager = new RunManager(params, paths, config);
|
||||
Process proc = runManager.startDriver(
|
||||
DefaultDriver.class.getName(),
|
||||
cmdSubmit.redisAddress,
|
||||
appId,
|
||||
appDir,
|
||||
params.node_ip_address,
|
||||
cmdSubmit.className,
|
||||
cmdSubmit.classArgs,
|
||||
additionalClassPath,
|
||||
null);
|
||||
|
||||
if (null == proc) {
|
||||
RayLog.rapp.error(
|
||||
"Create process for app " + packageName + " in local directory " + appDir
|
||||
+ " failed");
|
||||
return;
|
||||
}
|
||||
|
||||
RayLog.rapp
|
||||
.info("Create app " + appDir + " for package " + packageName + " succeeded");
|
||||
}
|
||||
|
||||
private static String getConfigPath(String config) {
|
||||
String configPath;
|
||||
|
||||
if (config != null && !config.equals("")) {
|
||||
configPath = config;
|
||||
} else {
|
||||
configPath = System.getenv("RAY_CONFIG");
|
||||
if (configPath == null) {
|
||||
configPath = System.getProperty("ray.config");
|
||||
}
|
||||
if (configPath == null) {
|
||||
throw new RuntimeException(
|
||||
"Please set config file path in env RAY_CONFIG or property ray.config");
|
||||
}
|
||||
}
|
||||
return configPath;
|
||||
}
|
||||
|
||||
public static void main(String[] args) throws Exception {
|
||||
|
||||
CommandStart cmdStart = new CommandStart();
|
||||
CommandStop cmdStop = new CommandStop();
|
||||
CommandSubmit cmdSubmit = new CommandSubmit();
|
||||
JCommander rayCommander = JCommander.newBuilder().addObject(rayArgs)
|
||||
.addCommand("start", cmdStart)
|
||||
.addCommand("stop", cmdStop)
|
||||
.addCommand("submit", cmdSubmit)
|
||||
.build();
|
||||
rayCommander.parse(args);
|
||||
|
||||
if (rayArgs.help) {
|
||||
rayCommander.usage();
|
||||
System.exit(0);
|
||||
}
|
||||
|
||||
String cmd = rayCommander.getParsedCommand();
|
||||
if (cmd == null) {
|
||||
rayCommander.usage();
|
||||
System.exit(0);
|
||||
}
|
||||
|
||||
String configPath;
|
||||
switch (cmd) {
|
||||
case "start": {
|
||||
configPath = getConfigPath(cmdStart.config);
|
||||
ConfigReader config = new ConfigReader(configPath, cmdStart.overwrite);
|
||||
start(cmdStart, config);
|
||||
}
|
||||
break;
|
||||
case "stop":
|
||||
stop(cmdStop);
|
||||
break;
|
||||
case "submit":
|
||||
configPath = getConfigPath(cmdSubmit.config);
|
||||
submit(cmdSubmit, configPath);
|
||||
break;
|
||||
default:
|
||||
rayCommander.usage();
|
||||
}
|
||||
}
|
||||
|
||||
}
|
||||
@@ -0,0 +1,12 @@
|
||||
package org.ray.cli;
|
||||
|
||||
import com.beust.jcommander.Parameter;
|
||||
|
||||
/**
|
||||
* Arguments for Ray cli.
|
||||
*/
|
||||
public class RayCliArgs {
|
||||
|
||||
@Parameter(names = {"-h", "-help", "--help"}, description = "print this usage", help = true)
|
||||
public boolean help;
|
||||
}
|
||||
Reference in New Issue
Block a user