@Test
public void testChildProcLauncher() throws Exception {
  // This test fails on Windows because executors cannot be launched there,
  // due to the path length limitation. See SPARK-18718.
  assumeTrue(!Utils.isWindows());

  SparkSubmitOptionParser opts = new SparkSubmitOptionParser();
  Map<String, String> env = new HashMap<>();
  env.put("SPARK_PRINT_LAUNCH_COMMAND", "1");

  launcher
    .setMaster("local")
    .setAppResource(SparkLauncher.NO_RESOURCE)
    .addSparkArg(opts.CONF,
      String.format("%s=-Dfoo=ShouldBeOverriddenBelow", SparkLauncher.DRIVER_EXTRA_JAVA_OPTIONS))
    .setConf(SparkLauncher.DRIVER_EXTRA_JAVA_OPTIONS, "-Dfoo=bar -Dtest.appender=console")
    .setConf(SparkLauncher.DRIVER_EXTRA_CLASSPATH, System.getProperty("java.class.path"))
    .addSparkArg(opts.CLASS, "ShouldBeOverriddenBelow")
    .setMainClass(SparkLauncherTestApp.class.getName())
    .redirectError()
    .addAppArgs("proc");

  final Process app = launcher.launch();
  new OutputRedirector(app.getInputStream(), getClass().getName() + ".child", TF);
  assertEquals(0, app.waitFor());
}
@Test(expected = IllegalStateException.class)
public void testRedirectToLogWithOthersFails() throws Exception {
  launcher.setAppResource("fake-resource.jar")
    .setMainClass("my.fake.class.Fake")
    .redirectToLog("fakeLog")
    .redirectError(ProcessBuilder.Redirect.PIPE)
    .launch();
}
@Test(expected = IllegalStateException.class)
public void testRedirectTwiceFails() throws Exception {
  launcher.setAppResource("fake-resource.jar")
    .setMainClass("my.fake.class.Fake")
    .redirectError()
    .redirectError(ProcessBuilder.Redirect.PIPE)
    .launch();
}
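The two tests above pin down the redirect contract: redirectToLog cannot be combined with any other redirect, and the same stream cannot be redirected twice. For contrast, a minimal sketch of valid configurations that pick exactly one strategy per stream (the resource, class, and logger names here are placeholders, not taken from the snippets above):

import org.apache.spark.launcher.SparkLauncher;

public class ValidRedirectExample {
  public static void main(String[] args) throws Exception {
    // Option 1: send all child output to a java.util.logging logger.
    Process toLog = new SparkLauncher()
        .setMaster("local")
        .setAppResource("my-app.jar")           // placeholder resource
        .setMainClass("my.example.Main")        // placeholder class
        .redirectToLog("my.example.launcher")   // the only redirect: a logger name
        .launch();
    toLog.waitFor();

    // Option 2: inherit both streams from the parent process instead.
    Process inherited = new SparkLauncher()
        .setMaster("local")
        .setAppResource("my-app.jar")
        .setMainClass("my.example.Main")
        .redirectOutput(ProcessBuilder.Redirect.INHERIT)
        .redirectError(ProcessBuilder.Redirect.INHERIT)
        .launch();
    inherited.waitFor();
  }
}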
@Test
public void testChildProcLauncher() throws Exception {
  // This test fails on Windows because executors cannot be launched there,
  // due to the path length limitation. See SPARK-18718.
  assumeTrue(!Utils.isWindows());

  SparkSubmitOptionParser opts = new SparkSubmitOptionParser();
  Map<String, String> env = new HashMap<>();
  env.put("SPARK_PRINT_LAUNCH_COMMAND", "1");

  launcher
    .setMaster("local")
    .setAppResource(SparkLauncher.NO_RESOURCE)
    .addSparkArg(opts.CONF,
      String.format("%s=-Dfoo=ShouldBeOverriddenBelow", SparkLauncher.DRIVER_EXTRA_JAVA_OPTIONS))
    .setConf(SparkLauncher.DRIVER_EXTRA_JAVA_OPTIONS, "-Dfoo=bar -Dtest.appender=childproc")
    .setConf(SparkLauncher.DRIVER_EXTRA_CLASSPATH, System.getProperty("java.class.path"))
    .addSparkArg(opts.CLASS, "ShouldBeOverriddenBelow")
    .setMainClass(SparkLauncherTestApp.class.getName())
    .addAppArgs("proc");

  final Process app = launcher.launch();
  new OutputRedirector(app.getInputStream(), TF);
  new OutputRedirector(app.getErrorStream(), TF);
  assertEquals(0, app.waitFor());
}
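This variant drains stdout and stderr with separate OutputRedirector threads instead of merging them via redirectError(). Outside of test code, an alternative to managing the raw Process at all is SparkLauncher.startApplication, which returns a SparkAppHandle for state tracking. A minimal sketch, assuming SPARK_HOME is set and using placeholder resource/class names:

import java.util.concurrent.CountDownLatch;
import org.apache.spark.launcher.SparkAppHandle;
import org.apache.spark.launcher.SparkLauncher;

public class HandleLaunchExample {
  public static void main(String[] args) throws Exception {
    CountDownLatch done = new CountDownLatch(1);

    SparkAppHandle handle = new SparkLauncher()
        .setMaster("local")
        .setAppResource("my-app.jar")     // placeholder resource
        .setMainClass("my.example.Main")  // placeholder class
        .startApplication(new SparkAppHandle.Listener() {
          @Override
          public void stateChanged(SparkAppHandle h) {
            // Final states include FINISHED, FAILED, and KILLED.
            if (h.getState().isFinal()) {
              done.countDown();
            }
          }

          @Override
          public void infoChanged(SparkAppHandle h) {
            // Called when, e.g., the application ID becomes available.
          }
        });

    done.await();
    System.out.println("Final state: " + handle.getState());
  }
}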
Process proc = spark.launch();
public Process launchProcess(final SparkLauncher sparkLauncher) throws IOException {
  final Process process = sparkLauncher.launch();
  startLogger(process.getErrorStream());
  startLogger(process.getInputStream());
  return process;
}
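startLogger is not defined in this snippet; a plausible implementation, sketched here as an assumption (including the logger name), drains the stream on a daemon thread so the child process can never block on a full pipe buffer:

import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.nio.charset.StandardCharsets;
import java.util.logging.Logger;

class StreamLoggers {
  private static final Logger LOG = Logger.getLogger("spark.child");  // assumed logger name

  // Drain the stream on a daemon thread so the child never blocks writing to it.
  static void startLogger(InputStream stream) {
    Thread t = new Thread(() -> {
      try (BufferedReader reader =
               new BufferedReader(new InputStreamReader(stream, StandardCharsets.UTF_8))) {
        String line;
        while ((line = reader.readLine()) != null) {
          LOG.info(line);
        }
      } catch (Exception e) {
        LOG.warning("stream reader terminated: " + e);
      }
    });
    t.setDaemon(true);
    t.start();
  }
}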
@Test(expected = IllegalArgumentException.class)
public void testRedirectErrorTwiceFails() throws Exception {
  File err = Files.createTempFile("stderr", "txt").toFile();
  err.deleteOnExit();
  new SparkLauncher()
    .redirectError()
    .redirectError(err)
    .launch()
    .waitFor();
}
@Test(expected = IllegalArgumentException.class)
public void testBadLogRedirect() throws Exception {
  File out = Files.createTempFile("stdout", "txt").toFile();
  out.deleteOnExit();
  new SparkLauncher()
    .redirectError()
    .redirectOutput(out)
    .redirectToLog("foo")
    .launch()
    .waitFor();
}
    HoodieCLI.tableMetadata.getBasePath(), fileId, outputPathStr, "1", master, sparkMemory,
    Boolean.valueOf(skipV).toString(), Boolean.valueOf(dryRun).toString());
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();
@CliCommand(value = "repair deduplicate", help = "De-duplicate a partition path contains duplicates & produce " + "repaired files to replace with") public String deduplicate(@CliOption(key = { "duplicatedPartitionPath"}, help = "Partition Path containing the duplicates", mandatory = true) final String duplicatedPartitionPath, @CliOption(key = { "repairedOutputPath"}, help = "Location to place the repaired files", mandatory = true) final String repairedOutputPath, @CliOption(key = { "sparkProperties"}, help = "Spark Properites File Path", mandatory = true) final String sparkPropertiesPath) throws Exception { SparkLauncher sparkLauncher = SparkUtil.initLauncher(sparkPropertiesPath); sparkLauncher.addAppArgs(SparkMain.SparkCommand.DEDUPLICATE.toString(), duplicatedPartitionPath, repairedOutputPath, HoodieCLI.tableMetadata.getBasePath()); Process process = sparkLauncher.launch(); InputStreamConsumer.captureOutput(process); int exitCode = process.waitFor(); if (exitCode != 0) { return "Deduplicated files placed in: " + repairedOutputPath; } return "Deduplication failed "; }
    HoodieCLI.tableMetadata.getBasePath(), compactionInstant, outputPathStr, parallelism,
    master, sparkMemory, Boolean.valueOf(skipV).toString(), Boolean.valueOf(dryRun).toString());
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();
    HoodieCLI.tableMetadata.getBasePath(), compactionInstant, outputPathStr, parallelism,
    master, sparkMemory);
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();
@CliCommand(value = "compaction schedule", help = "Schedule Compaction") public String scheduleCompact( @CliOption(key = "sparkMemory", unspecifiedDefaultValue = "1G", help = "Spark executor memory") final String sparkMemory) throws Exception { boolean initialized = HoodieCLI.initConf(); HoodieCLI.initFS(initialized); // First get a compaction instant time and pass it to spark launcher for scheduling compaction String compactionInstantTime = HoodieActiveTimeline.createNewCommitTime(); if (HoodieCLI.tableMetadata.getTableType() == HoodieTableType.MERGE_ON_READ) { String sparkPropertiesPath = Utils.getDefaultPropertiesFile( scala.collection.JavaConversions.propertiesAsScalaMap(System.getProperties())); SparkLauncher sparkLauncher = SparkUtil.initLauncher(sparkPropertiesPath); sparkLauncher.addAppArgs(SparkCommand.COMPACT_SCHEDULE.toString(), HoodieCLI.tableMetadata.getBasePath(), HoodieCLI.tableMetadata.getTableConfig().getTableName(), compactionInstantTime, sparkMemory); Process process = sparkLauncher.launch(); InputStreamConsumer.captureOutput(process); int exitCode = process.waitFor(); if (exitCode != 0) { return "Failed to run compaction for " + compactionInstantTime; } return "Compaction successfully completed for " + compactionInstantTime; } else { throw new Exception("Compactions can only be run for table type : MERGE_ON_READ"); } }
    HoodieCLI.tableMetadata.getBasePath(), compactionInstant, outputPathStr, parallelism,
    master, sparkMemory, Boolean.valueOf(dryRun).toString());
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();
    HoodieCLI.tableMetadata.getTableConfig().getTableName(), compactionInstantTime, parallelism,
    schemaFilePath, sparkMemory, retry);
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();
@CliCommand(value = "commit rollback", help = "Rollback a commit") public String rollbackCommit(@CliOption(key = {"commit"}, help = "Commit to rollback") final String commitTime, @CliOption(key = {"sparkProperties"}, help = "Spark Properites File Path") final String sparkPropertiesPath) throws Exception { HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline(); HoodieTimeline timeline = activeTimeline.getCommitsTimeline().filterCompletedInstants(); HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime); if (!timeline.containsInstant(commitInstant)) { return "Commit " + commitTime + " not found in Commits " + timeline; } SparkLauncher sparkLauncher = SparkUtil.initLauncher(sparkPropertiesPath); sparkLauncher .addAppArgs(SparkMain.SparkCommand.ROLLBACK.toString(), commitTime, HoodieCLI.tableMetadata.getBasePath()); Process process = sparkLauncher.launch(); InputStreamConsumer.captureOutput(process); int exitCode = process.waitFor(); // Refresh the current refreshCommits(); if (exitCode != 0) { return "Commit " + commitTime + " failed to roll back"; } return "Commit " + commitTime + " rolled back"; }
@CliCommand(value = "savepoint rollback", help = "Savepoint a commit") public String rollbackToSavepoint( @CliOption(key = {"savepoint"}, help = "Savepoint to rollback") final String commitTime, @CliOption(key = {"sparkProperties"}, help = "Spark Properites File Path") final String sparkPropertiesPath) throws Exception { HoodieActiveTimeline activeTimeline = HoodieCLI.tableMetadata.getActiveTimeline(); HoodieTimeline timeline = activeTimeline.getCommitTimeline().filterCompletedInstants(); HoodieInstant commitInstant = new HoodieInstant(false, HoodieTimeline.COMMIT_ACTION, commitTime); if (!timeline.containsInstant(commitInstant)) { return "Commit " + commitTime + " not found in Commits " + timeline; } SparkLauncher sparkLauncher = SparkUtil.initLauncher(sparkPropertiesPath); sparkLauncher.addAppArgs(SparkMain.SparkCommand.ROLLBACK_TO_SAVEPOINT.toString(), commitTime, HoodieCLI.tableMetadata.getBasePath()); Process process = sparkLauncher.launch(); InputStreamConsumer.captureOutput(process); int exitCode = process.waitFor(); // Refresh the current refreshMetaClient(); if (exitCode != 0) { return "Savepoint " + commitTime + " failed to roll back"; } return "Savepoint " + commitTime + " rolled back"; }
Process process = sparkLauncher.launch();
InputStreamConsumer.captureOutput(process);
int exitCode = process.waitFor();
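InputStreamConsumer.captureOutput appears throughout the Hudi CLI snippets above but is not shown. A minimal sketch of what such a helper plausibly does (an assumption, not the actual Hudi class): consume both child streams on background threads so process.waitFor() cannot deadlock when a pipe buffer fills.

import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.nio.charset.StandardCharsets;

// Hypothetical sketch of the InputStreamConsumer helper used above.
public class InputStreamConsumer extends Thread {
  private final InputStream is;

  public InputStreamConsumer(InputStream is) {
    this.is = is;
    setDaemon(true);
  }

  @Override
  public void run() {
    try (BufferedReader br =
             new BufferedReader(new InputStreamReader(is, StandardCharsets.UTF_8))) {
      String line;
      while ((line = br.readLine()) != null) {
        System.out.println(line);  // echo child output to the CLI console
      }
    } catch (Exception e) {
      e.printStackTrace();
    }
  }

  // Drain both stdout and stderr so the child cannot block on full pipes.
  public static void captureOutput(Process p) {
    new InputStreamConsumer(p.getInputStream()).start();
    new InputStreamConsumer(p.getErrorStream()).start();
  }
}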