@Override
public DataSetAnalyticBase<T, R> run(DataSet<T> input) throws Exception {
    env = input.getExecutionEnvironment();
    return this;
}
public NoOpOperator(DataSet<IN> input, TypeInformation<IN> resultType) {
    super(input.getExecutionEnvironment(), resultType);
    this.input = input;
}
protected SingleInputOperator(DataSet<IN> input, TypeInformation<OUT> resultType) {
    super(input.getExecutionEnvironment(), resultType);
    this.input = input;
}
protected static void checkSameExecutionContext(DataSet<?> set1, DataSet<?> set2) {
    if (set1.getExecutionEnvironment() != set2.getExecutionEnvironment()) {
        throw new IllegalArgumentException("The two inputs have different execution contexts.");
    }
}
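This check runs at plan-construction time for binary operators such as union, join, and cross, since they pass through the TwoInputOperator constructor shown below. A minimal sketch, assuming two deliberately separate local environments created purely for illustration:

ExecutionEnvironment env1 = ExecutionEnvironment.createLocalEnvironment();
ExecutionEnvironment env2 = ExecutionEnvironment.createLocalEnvironment();

DataSet<Integer> a = env1.fromElements(1, 2, 3);
DataSet<Integer> b = env2.fromElements(4, 5, 6);

// Fails immediately with IllegalArgumentException("The two inputs have different execution contexts.")
// because a and b were created on different ExecutionEnvironments.
a.union(b);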
@Override
public void write(String executionName, PrintStream out, DataSet<T> data) throws Exception {
    ChecksumHashCode<T> checksumHashCode = new ChecksumHashCode<T>().run(data);

    if (printExecutionPlan.getValue()) {
        out.println();
        out.println(data.getExecutionEnvironment().getExecutionPlan());
    }

    ChecksumHashCode.Checksum checksum = checksumHashCode.execute(executionName);

    out.println();
    out.println(checksum);
}
protected TwoInputOperator(DataSet<IN1> input1, DataSet<IN2> input2, TypeInformation<OUT> resultType) {
    super(Preconditions.checkNotNull(input1, "input1 is null").getExecutionEnvironment(), resultType);
    Preconditions.checkNotNull(input2, "input2 is null");

    DataSet.checkSameExecutionContext(input1, input2);
    this.input1 = input1;
    this.input2 = input2;
}
@Override
public void write(String executionName, PrintStream out, DataSet<T> data) throws Exception {
    Collect<T> collector = new Collect<T>().run(data);

    if (printExecutionPlan.getValue()) {
        out.println();
        out.println(data.getExecutionEnvironment().getExecutionPlan());
    }

    List<T> results = collector.execute(executionName);

    if (results.size() == 0) {
        return;
    }

    out.println();

    if (results.get(0) instanceof PrintableResult) {
        for (Object result : results) {
            out.println(((PrintableResult) result).toPrintableString());
        }
    } else {
        for (Object result : results) {
            out.println(result);
        }
    }
}
/**
 * Closes the delta iteration. This method defines the end of the delta iteration's function.
 *
 * @param solutionSetDelta The delta for the solution set. The delta will be merged into the
 *                         solution set at the end of each iteration.
 * @param newWorkset The new workset (feedback data set) that will be fed back to the next iteration.
 * @return The DataSet that represents the result of the iteration, after the computation has terminated.
 *
 * @see DataSet#iterateDelta(DataSet, int, int...)
 */
public DataSet<ST> closeWith(DataSet<ST> solutionSetDelta, DataSet<WT> newWorkset) {
    return new DeltaIterationResultSet<ST, WT>(initialSolutionSet.getExecutionEnvironment(),
            initialSolutionSet.getType(), initialWorkset.getType(), this,
            solutionSetDelta, newWorkset, keys, maxIterations);
}
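A minimal usage sketch of the iterateDelta()/closeWith() pair, assuming an existing ExecutionEnvironment env, Tuple2<Long, Long> elements keyed on field 0, and a hypothetical bound of 10 supersteps (the iteration also stops early once the workset becomes empty):

DataSet<Tuple2<Long, Long>> initial = env.fromElements(Tuple2.of(1L, 5L), Tuple2.of(2L, 0L));

// The same data set serves as initial solution set and initial workset; field 0 is the solution set key.
DeltaIteration<Tuple2<Long, Long>, Tuple2<Long, Long>> iteration =
        initial.iterateDelta(initial, 10, 0);

// Step function: keep only workset elements with a positive value.
DataSet<Tuple2<Long, Long>> delta = iteration.getWorkset().filter(t -> t.f1 > 0);

// closeWith() merges the delta into the solution set and feeds the new workset into the next superstep.
DataSet<Tuple2<Long, Long>> result = iteration.closeWith(delta, delta);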
return new IterativeDataSet<>(getExecutionEnvironment(), getType(), this, maxIterations);
public <F> F clean(F f) {
    if (getExecutionEnvironment().getConfig().isClosureCleanerEnabled()) {
        ClosureCleaner.clean(f, true);
    } else {
        ClosureCleaner.ensureSerializable(f);
    }
    return f;
}
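Whether clean() actually rewrites the closure is decided by the ExecutionConfig flag queried above; a small sketch, assuming a default environment:

ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment();

// With the cleaner disabled, clean(f) skips ClosureCleaner.clean() and only verifies
// that the function is serializable as-is.
env.getConfig().disableClosureCleaner();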
protected ProjectCross(DataSet<I1> input1, DataSet<I2> input2,
        int[] fields, boolean[] isFromFirst,
        TupleTypeInfo<OUT> returnType, CrossProjection<I1, I2> crossProjection, CrossHint hint) {
    super(input1, input2,
            new ProjectCrossFunction<I1, I2, OUT>(fields, isFromFirst,
                    returnType.createSerializer(input1.getExecutionEnvironment().getConfig()).createInstance()),
            returnType, hint, "unknown");

    this.crossProjection = crossProjection;
}
protected ProjectCross(DataSet<I1> input1, DataSet<I2> input2,
        int[] fields, boolean[] isFromFirst,
        TupleTypeInfo<OUT> returnType, CrossHint hint) {
    super(input1, input2,
            new ProjectCrossFunction<I1, I2, OUT>(fields, isFromFirst,
                    returnType.createSerializer(input1.getExecutionEnvironment().getConfig()).createInstance()),
            returnType, hint, "unknown");

    crossProjection = null;
}
protected ProjectJoin(DataSet<I1> input1, DataSet<I2> input2, Keys<I1> keys1, Keys<I2> keys2,
        JoinHint hint, int[] fields, boolean[] isFromFirst,
        TupleTypeInfo<OUT> returnType, JoinProjection<I1, I2> joinProj) {
    super(input1, input2, keys1, keys2,
            new ProjectFlatJoinFunction<I1, I2, OUT>(fields, isFromFirst,
                    returnType.createSerializer(input1.getExecutionEnvironment().getConfig()).createInstance()),
            returnType, hint, Utils.getCallLocationName(4));

    this.joinProj = joinProj;
}
protected ProjectJoin(DataSet<I1> input1, DataSet<I2> input2, Keys<I1> keys1, Keys<I2> keys2,
        JoinHint hint, int[] fields, boolean[] isFromFirst, TupleTypeInfo<OUT> returnType) {
    super(input1, input2, keys1, keys2,
            new ProjectFlatJoinFunction<I1, I2, OUT>(fields, isFromFirst,
                    returnType.createSerializer(input1.getExecutionEnvironment().getConfig()).createInstance()),
            returnType, hint,
            // We need to use the 4th element in the stack because the call comes through .types().
            Utils.getCallLocationName(4));

    joinProj = null;
}
/**
 * Convenience method to get the elements of a DataSet as a List.
 * As a DataSet can contain a lot of data, this method should be used with caution.
 *
 * @return A List containing the elements of the DataSet
 */
public List<T> collect() throws Exception {
    final String id = new AbstractID().toString();
    final TypeSerializer<T> serializer = getType().createSerializer(getExecutionEnvironment().getConfig());

    this.output(new Utils.CollectHelper<>(id, serializer)).name("collect()");
    JobExecutionResult res = getExecutionEnvironment().execute();

    ArrayList<byte[]> accResult = res.getAccumulatorResult(id);
    if (accResult != null) {
        try {
            return SerializedListAccumulator.deserializeList(accResult, serializer);
        } catch (ClassNotFoundException e) {
            throw new RuntimeException("Cannot find type class of collected data type.", e);
        } catch (IOException e) {
            throw new RuntimeException("Serialization error while deserializing collected data", e);
        }
    } else {
        throw new RuntimeException("The call to collect() could not retrieve the DataSet.");
    }
}
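A brief usage sketch, assuming the usual flink-java imports; the collect() call itself submits the job through getExecutionEnvironment().execute() and reads the serialized result back from an accumulator:

ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment();

List<Long> evens = env.generateSequence(1, 100)
        .filter(i -> i % 2 == 0)
        .collect(); // runs the job and materializes the result on the client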
/**
 * Convenience method to get the count (number of elements) of a DataSet
 * as well as the checksum (sum over element hashes).
 *
 * @return A ChecksumHashCode that represents the count and checksum of elements in the data set.
 * @deprecated replaced with {@code org.apache.flink.graph.asm.dataset.ChecksumHashCode} in Gelly
 */
@Deprecated
public static <T> Utils.ChecksumHashCode checksumHashCode(DataSet<T> input) throws Exception {
    final String id = new AbstractID().toString();
    input.output(new Utils.ChecksumHashCodeHelper<T>(id)).name("ChecksumHashCode");

    JobExecutionResult res = input.getExecutionEnvironment().execute();
    return res.<Utils.ChecksumHashCode>getAccumulatorResult(id);
}
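A short sketch of the deprecated helper, assuming it is the static method exposed by DataSetUtils and an existing environment env:

DataSet<String> words = env.fromElements("flink", "dataset", "checksum");

// Executes a job and reads the combined count / hash-sum accumulator.
Utils.ChecksumHashCode checksum = DataSetUtils.checksumHashCode(words);
long elements = checksum.getCount();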
/**
 * Convenience method to get the count (number of elements) of a DataSet.
 *
 * @return A long integer that represents the number of elements in the data set.
 */
public long count() throws Exception {
    final String id = new AbstractID().toString();

    output(new Utils.CountHelper<T>(id)).name("count()");
    JobExecutionResult res = getExecutionEnvironment().execute();

    return res.<Long>getAccumulatorResult(id);
}
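count() follows the same accumulator pattern as collect(); a one-line sketch, assuming an existing environment env:

long n = env.fromElements("a", "b", "c").count(); // executes a job and reads back a Long accumulator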
@Override
public void write(String executionName, PrintStream out, DataSet<T> data) throws Exception {
    if (Tuple.class.isAssignableFrom(data.getType().getTypeClass())) {
        data
            .writeAsCsv(filename.getValue(), lineDelimiter.getValue(), fieldDelimiter.getValue())
            .name("CSV: " + filename.getValue());
    } else {
        // line and field delimiters have no effect when writing non-tuple (POJO) result types
        data
            .writeAsText(filename.getValue())
            .name("CSV: " + filename.getValue());
    }

    data.getExecutionEnvironment().execute();
}
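The Tuple check above matters because writeAsCsv() only accepts tuple data sets; a small sketch with hypothetical output paths, assuming an existing environment env:

DataSet<Tuple2<String, Integer>> pairs = env.fromElements(Tuple2.of("a", 1), Tuple2.of("b", 2));

// Tuples can be written as CSV with explicit line and field delimiters ...
pairs.writeAsCsv("/tmp/pairs.csv", "\n", ",");

// ... while non-tuple results only support writeAsText(), which falls back to toString().
env.fromElements("a=1", "b=2").writeAsText("/tmp/pairs.txt");

env.execute("write example");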
return new DeltaIteration<>(getExecutionEnvironment(), getType(), this, workset, keys, maxIterations);
Graph.fromDataSet(initialVertices, edgesWithValue, initialVertices.getExecutionEnvironment());