org.apache.gobblin.configuration.WorkUnitState.getId java code examples

/**
 * Builds a bracketed display name for the current work unit, shaped like
 * {@code [schema_entity_suffix]}.
 *
 * <p>The schema and entity parts are the stripped values of the
 * {@code SOURCE_QUERYBASED_SCHEMA} and {@code SOURCE_ENTITY} properties (empty when
 * absent). The suffix is everything after the second-to-last underscore of the work
 * unit id; it stays empty when the id does not contain two underscores at positions
 * greater than zero.
 *
 * @return the bracketed work unit name
 */
private String getWorkUnitName() {
 String schema = StringUtils.stripToEmpty(this.workUnitState.getProp(ConfigurationKeys.SOURCE_QUERYBASED_SCHEMA));
 String entity = StringUtils.stripToEmpty(this.workUnitState.getProp(ConfigurationKeys.SOURCE_ENTITY));
 String workUnitId = this.workUnitState.getId();

 // Find the last underscore, then the one preceding it; the id tail starting right
 // after that earlier underscore becomes the suffix.
 // NOTE(review): presumably the tail is "<time>_<sequence>" — confirm against the id format.
 String suffix = "";
 int lastSeparator = workUnitId.lastIndexOf('_');
 if (lastSeparator > 0) {
  int previousSeparator = workUnitId.lastIndexOf('_', lastSeparator - 1);
  if (previousSeparator > 0) {
   suffix = workUnitId.substring(previousSeparator + 1);
  }
 }

 return "[" + schema + "_" + entity + "_" + suffix + "]";
}

/**
 * Creates an extractor over the file split that was serialized into the given work
 * unit state.
 *
 * <p>All properties of the work unit state are copied into a fresh {@link JobConf},
 * which is then used to obtain the input format and open a record reader on the
 * deserialized split.
 *
 * @param workUnitState state carrying the serialized file split and reader settings
 * @return an extractor backed by a record reader for the split
 * @throws IOException if the state holds no serialized file split, or a called helper fails
 */
@Override
public Extractor<S, D> getExtractor(WorkUnitState workUnitState) throws IOException {
 final String splitKey = HadoopFileInputSource.FILE_SPLIT_BYTES_STRING_KEY;
 if (!workUnitState.contains(splitKey)) {
  throw new IOException("No serialized FileSplit found in WorkUnitState " + workUnitState.getId());
 }

 // Mirror every work unit property into the Hadoop job configuration.
 JobConf jobConf = new JobConf(new Configuration());
 for (String propertyName : workUnitState.getPropertyNames()) {
  jobConf.set(propertyName, workUnitState.getProp(propertyName));
 }

 FileSplit fileSplit =
   (FileSplit) HadoopUtils.deserializeFromString(FileSplit.class, workUnitState.getProp(splitKey));
 RecordReader<K, V> recordReader =
   getFileInputFormat(workUnitState, jobConf).getRecordReader(fileSplit, jobConf, Reporter.NULL);

 boolean readKeys = workUnitState.getPropAsBoolean(
   HadoopFileInputSource.FILE_INPUT_READ_KEYS_KEY, HadoopFileInputSource.DEFAULT_FILE_INPUT_READ_KEYS);
 return getExtractor(workUnitState, recordReader, fileSplit, readKeys);
}

// Warn that this branch of the work unit produced no data, then leave the
// enclosing method early.
LOG.warn(String.format("Branch %d of WorkUnit %s produced no data", branchId, state.getId()));
return;

/**
 * Creates an extractor over the file split that was serialized into the given work
 * unit state.
 *
 * <p>A record reader is created from the input format for the deserialized split and
 * initialized with a task attempt context built on a fresh {@link Configuration}.
 *
 * @param workUnitState state carrying the serialized file split and reader settings
 * @return an extractor backed by an initialized record reader for the split
 * @throws IOException if the state holds no serialized file split, if a called helper
 *     fails, or if the thread is interrupted while the record reader is being set up
 *     (the interrupt status is restored before throwing)
 */
@Override
public Extractor<S, D> getExtractor(WorkUnitState workUnitState) throws IOException {
 if (!workUnitState.contains(FILE_SPLIT_BYTES_STRING_KEY)) {
  throw new IOException("No serialized FileSplit found in WorkUnitState " + workUnitState.getId());
 }
 Configuration configuration = new Configuration();
 FileInputFormat<K, V> fileInputFormat = getFileInputFormat(workUnitState, configuration);
 String fileSplitBytesStr = workUnitState.getProp(FILE_SPLIT_BYTES_STRING_KEY);
 FileSplit fileSplit = (FileSplit) HadoopUtils.deserializeFromString(FileSplit.class, fileSplitBytesStr);
 TaskAttemptContext taskAttemptContext =
   getTaskAttemptContext(configuration, DummyTaskAttemptIDFactory.newTaskAttemptID());
 try {
  RecordReader<K, V> recordReader = fileInputFormat.createRecordReader(fileSplit, taskAttemptContext);
  recordReader.initialize(fileSplit, taskAttemptContext);
  boolean readKeys = workUnitState.getPropAsBoolean(FILE_INPUT_READ_KEYS_KEY, DEFAULT_FILE_INPUT_READ_KEYS);
  return getExtractor(workUnitState, recordReader, fileSplit, readKeys);
 } catch (InterruptedException ie) {
  // Catching InterruptedException clears the interrupt flag; restore it so that
  // callers further up the stack can still observe the interruption.
  Thread.currentThread().interrupt();
  throw new IOException(ie);
 }
}

/**
 * Builds a bracketed display name for the current work unit, shaped like
 * {@code [schema_entity_suffix]}.
 *
 * <p>The schema and entity parts are the stripped values of the
 * {@code SOURCE_QUERYBASED_SCHEMA} and {@code SOURCE_ENTITY} properties (empty when
 * absent). The suffix is everything after the second-to-last underscore of the work
 * unit id; it stays empty when the id does not contain two underscores at positions
 * greater than zero.
 *
 * @return the bracketed work unit name
 */
private String getWorkUnitName() {
 String schema = StringUtils.stripToEmpty(this.workUnitState.getProp(ConfigurationKeys.SOURCE_QUERYBASED_SCHEMA));
 String entity = StringUtils.stripToEmpty(this.workUnitState.getProp(ConfigurationKeys.SOURCE_ENTITY));
 String workUnitId = this.workUnitState.getId();

 // Find the last underscore, then the one preceding it; the id tail starting right
 // after that earlier underscore becomes the suffix.
 // NOTE(review): presumably the tail is "<time>_<sequence>" — confirm against the id format.
 String suffix = "";
 int lastSeparator = workUnitId.lastIndexOf('_');
 if (lastSeparator > 0) {
  int previousSeparator = workUnitId.lastIndexOf('_', lastSeparator - 1);
  if (previousSeparator > 0) {
   suffix = workUnitId.substring(previousSeparator + 1);
  }
 }

 return "[" + schema + "_" + entity + "_" + suffix + "]";
}

/**
 * Creates an extractor over the file split that was serialized into the given work
 * unit state.
 *
 * <p>All properties of the work unit state are copied into a fresh {@link JobConf},
 * which is then used to obtain the input format and open a record reader on the
 * deserialized split.
 *
 * @param workUnitState state carrying the serialized file split and reader settings
 * @return an extractor backed by a record reader for the split
 * @throws IOException if the state holds no serialized file split, or a called helper fails
 */
@Override
public Extractor<S, D> getExtractor(WorkUnitState workUnitState) throws IOException {
 final String splitKey = HadoopFileInputSource.FILE_SPLIT_BYTES_STRING_KEY;
 if (!workUnitState.contains(splitKey)) {
  throw new IOException("No serialized FileSplit found in WorkUnitState " + workUnitState.getId());
 }

 // Mirror every work unit property into the Hadoop job configuration.
 JobConf jobConf = new JobConf(new Configuration());
 for (String propertyName : workUnitState.getPropertyNames()) {
  jobConf.set(propertyName, workUnitState.getProp(propertyName));
 }

 FileSplit fileSplit =
   (FileSplit) HadoopUtils.deserializeFromString(FileSplit.class, workUnitState.getProp(splitKey));
 RecordReader<K, V> recordReader =
   getFileInputFormat(workUnitState, jobConf).getRecordReader(fileSplit, jobConf, Reporter.NULL);

 boolean readKeys = workUnitState.getPropAsBoolean(
   HadoopFileInputSource.FILE_INPUT_READ_KEYS_KEY, HadoopFileInputSource.DEFAULT_FILE_INPUT_READ_KEYS);
 return getExtractor(workUnitState, recordReader, fileSplit, readKeys);
}

// Warn that this branch of the work unit produced no data, then leave the
// enclosing method early.
LOG.warn(String.format("Branch %d of WorkUnit %s produced no data", branchId, state.getId()));
return;

/**
 * Creates an extractor over the file split that was serialized into the given work
 * unit state.
 *
 * <p>A record reader is created from the input format for the deserialized split and
 * initialized with a task attempt context built on a fresh {@link Configuration}.
 *
 * @param workUnitState state carrying the serialized file split and reader settings
 * @return an extractor backed by an initialized record reader for the split
 * @throws IOException if the state holds no serialized file split, if a called helper
 *     fails, or if the thread is interrupted while the record reader is being set up
 *     (the interrupt status is restored before throwing)
 */
@Override
public Extractor<S, D> getExtractor(WorkUnitState workUnitState) throws IOException {
 if (!workUnitState.contains(FILE_SPLIT_BYTES_STRING_KEY)) {
  throw new IOException("No serialized FileSplit found in WorkUnitState " + workUnitState.getId());
 }
 Configuration configuration = new Configuration();
 FileInputFormat<K, V> fileInputFormat = getFileInputFormat(workUnitState, configuration);
 String fileSplitBytesStr = workUnitState.getProp(FILE_SPLIT_BYTES_STRING_KEY);
 FileSplit fileSplit = (FileSplit) HadoopUtils.deserializeFromString(FileSplit.class, fileSplitBytesStr);
 TaskAttemptContext taskAttemptContext =
   getTaskAttemptContext(configuration, DummyTaskAttemptIDFactory.newTaskAttemptID());
 try {
  RecordReader<K, V> recordReader = fileInputFormat.createRecordReader(fileSplit, taskAttemptContext);
  recordReader.initialize(fileSplit, taskAttemptContext);
  boolean readKeys = workUnitState.getPropAsBoolean(FILE_INPUT_READ_KEYS_KEY, DEFAULT_FILE_INPUT_READ_KEYS);
  return getExtractor(workUnitState, recordReader, fileSplit, readKeys);
 } catch (InterruptedException ie) {
  // Catching InterruptedException clears the interrupt flag; restore it so that
  // callers further up the stack can still observe the interruption.
  Thread.currentThread().interrupt();
  throw new IOException(ie);
 }
}

Popular methods of WorkUnitState

getProp
<init>
setProp
contains
getProperties
getWorkunit
Get an ImmutableWorkUnit that wraps the internal WorkUnit.
getPropAsBoolean
getJobState
getPropAsInt
getActualHighWatermark
Get the actual high Watermark. If the WorkUnitState does not contain the actual high watermark (whic
setActualHighWatermark
This method should set the actual, runtime high Watermark for this WorkUnitState. A high Watermark i
setWorkingState
Set the current runtime state of the WorkUnit.

Popular in Java

Reading from database using SQL prepared statement
getOriginalFilename (MultipartFile)
Return the original filename in the client's filesystem. This may contain path information depending
startActivity (Activity)
notifyDataSetChanged (ArrayAdapter)
FileOutputStream (java.io)
An output stream that writes bytes to a file. If the output file exists, it can be replaced or appen
Runnable (java.lang)
Represents a command that can be executed. Often used to run code in a different Thread.
Connection (java.sql)
A connection represents a link from a Java application to a database. All SQL statements and results
Map (java.util)
A Map is a data structure consisting of a set of keys and values in which each key is mapped to a si
Cipher (javax.crypto)
This class provides access to implementations of cryptographic ciphers for encryption and decryption
JButton (javax.swing)
From CI to AI: The AI layer in your organization

How to use the getId method in org.apache.gobblin.configuration.WorkUnitState

Best Java code snippets using org.apache.gobblin.configuration.WorkUnitState.getId (Showing top 8 results out of 315)

How to use
getId
method
in
org.apache.gobblin.configuration.WorkUnitState