org.apache.gobblin.util.HadoopUtils.deserializeFromString Java code examples

/**
 * Reads a {@link Writable} back from its string-serialized form.
 *
 * <p>Convenience overload: it creates a new {@link Configuration} and hands it, together with
 * both arguments, to the three-argument {@code deserializeFromString}.
 *
 * @param writableClass the {@link Writable} implementation class to deserialize into
 * @param serializedWritableStr the string holding the serialized {@link Writable} object
 * @return the {@link Writable} deserialized from the string
 * @throws IOException if the deserialization fails
 */
public static Writable deserializeFromString(Class<? extends Writable> writableClass, String serializedWritableStr)
  throws IOException {
 Configuration freshConf = new Configuration();
 return deserializeFromString(writableClass, serializedWritableStr, freshConf);
}

/**
 * Builds an {@link Extractor} over the {@link FileSplit} serialized in the given work unit state.
 *
 * <p>Every property of the work unit state is copied into a new {@link JobConf}, which is then
 * used both to obtain the {@link FileInputFormat} and to open the {@link RecordReader}.
 *
 * @param workUnitState the work unit state carrying the serialized {@link FileSplit}
 * @return the {@link Extractor} produced by the four-argument {@code getExtractor}
 * @throws IOException if the state holds no serialized {@link FileSplit}, or a called method fails
 */
@Override
public Extractor<S, D> getExtractor(WorkUnitState workUnitState) throws IOException {
 final String splitKey = HadoopFileInputSource.FILE_SPLIT_BYTES_STRING_KEY;
 if (!workUnitState.contains(splitKey)) {
  throw new IOException("No serialized FileSplit found in WorkUnitState " + workUnitState.getId());
 }

 // Mirror all work unit properties into the job configuration.
 JobConf conf = new JobConf(new Configuration());
 for (String propName : workUnitState.getPropertyNames()) {
  conf.set(propName, workUnitState.getProp(propName));
 }

 FileSplit split =
   (FileSplit) HadoopUtils.deserializeFromString(FileSplit.class, workUnitState.getProp(splitKey));
 FileInputFormat<K, V> inputFormat = getFileInputFormat(workUnitState, conf);
 RecordReader<K, V> reader = inputFormat.getRecordReader(split, conf, Reporter.NULL);

 return getExtractor(
   workUnitState,
   reader,
   split,
   workUnitState.getPropAsBoolean(
     HadoopFileInputSource.FILE_INPUT_READ_KEYS_KEY, HadoopFileInputSource.DEFAULT_FILE_INPUT_READ_KEYS));
}

/**
 * Builds an {@link Extractor} over the {@link FileSplit} serialized in the given work unit state.
 *
 * <p>The split is deserialized from the {@code FILE_SPLIT_BYTES_STRING_KEY} property, a
 * {@link RecordReader} is created and initialized for it, and both are passed to the
 * four-argument {@code getExtractor} together with the read-keys flag.
 *
 * @param workUnitState the work unit state carrying the serialized {@link FileSplit}
 * @return the {@link Extractor} produced by the four-argument {@code getExtractor}
 * @throws IOException if the state holds no serialized {@link FileSplit}, if a called method
 *     fails, or if the thread is interrupted while the record reader is being set up (the
 *     {@link InterruptedException} is attached as the cause and the interrupt flag is restored)
 */
@Override
public Extractor<S, D> getExtractor(WorkUnitState workUnitState) throws IOException {
 if (!workUnitState.contains(FILE_SPLIT_BYTES_STRING_KEY)) {
  throw new IOException("No serialized FileSplit found in WorkUnitState " + workUnitState.getId());
 }
 Configuration configuration = new Configuration();
 FileInputFormat<K, V> fileInputFormat = getFileInputFormat(workUnitState, configuration);
 String fileSplitBytesStr = workUnitState.getProp(FILE_SPLIT_BYTES_STRING_KEY);
 FileSplit fileSplit = (FileSplit) HadoopUtils.deserializeFromString(FileSplit.class, fileSplitBytesStr);
 TaskAttemptContext taskAttemptContext =
   getTaskAttemptContext(configuration, DummyTaskAttemptIDFactory.newTaskAttemptID());
 try {
  RecordReader<K, V> recordReader = fileInputFormat.createRecordReader(fileSplit, taskAttemptContext);
  recordReader.initialize(fileSplit, taskAttemptContext);
  boolean readKeys = workUnitState.getPropAsBoolean(FILE_INPUT_READ_KEYS_KEY, DEFAULT_FILE_INPUT_READ_KEYS);
  return getExtractor(workUnitState, recordReader, fileSplit, readKeys);
 } catch (InterruptedException ie) {
  // Catching InterruptedException clears the thread's interrupt status; restore it so code
  // further up the stack can still observe the interruption after we translate the exception.
  Thread.currentThread().interrupt();
  throw new IOException(ie);
 }
}

/**
 * Turns a serialized string back into a {@link Writable} object.
 *
 * <p>A new {@link Configuration} is created here and forwarded, along with both arguments, to
 * the three-argument {@code deserializeFromString}.
 *
 * @param writableClass the {@link Writable} implementation class to deserialize into
 * @param serializedWritableStr the string that contains the serialized {@link Writable} object
 * @return the {@link Writable} obtained from the string
 * @throws IOException if something goes wrong during deserialization
 */
public static Writable deserializeFromString(Class<? extends Writable> writableClass, String serializedWritableStr)
  throws IOException {
 Configuration newConf = new Configuration();
 return deserializeFromString(writableClass, serializedWritableStr, newConf);
}

/**
 * Creates an {@link Extractor} for the {@link FileSplit} stored, in serialized form, in the
 * given work unit state.
 *
 * <p>All properties of the work unit state are first copied into a new {@link JobConf}; that
 * configuration is passed to {@code getFileInputFormat} and to
 * {@code FileInputFormat#getRecordReader}.
 *
 * @param workUnitState the work unit state carrying the serialized {@link FileSplit}
 * @return the {@link Extractor} produced by the four-argument {@code getExtractor}
 * @throws IOException if the state holds no serialized {@link FileSplit}, or a called method fails
 */
@Override
public Extractor<S, D> getExtractor(WorkUnitState workUnitState) throws IOException {
 final String serializedSplitKey = HadoopFileInputSource.FILE_SPLIT_BYTES_STRING_KEY;
 if (!workUnitState.contains(serializedSplitKey)) {
  throw new IOException("No serialized FileSplit found in WorkUnitState " + workUnitState.getId());
 }

 // Populate the job configuration with every property of the work unit state.
 JobConf jobConfiguration = new JobConf(new Configuration());
 for (String name : workUnitState.getPropertyNames()) {
  jobConfiguration.set(name, workUnitState.getProp(name));
 }

 String serializedSplit = workUnitState.getProp(serializedSplitKey);
 FileSplit inputSplit = (FileSplit) HadoopUtils.deserializeFromString(FileSplit.class, serializedSplit);
 RecordReader<K, V> splitReader = getFileInputFormat(workUnitState, jobConfiguration)
   .getRecordReader(inputSplit, jobConfiguration, Reporter.NULL);

 boolean shouldReadKeys = workUnitState.getPropAsBoolean(
   HadoopFileInputSource.FILE_INPUT_READ_KEYS_KEY, HadoopFileInputSource.DEFAULT_FILE_INPUT_READ_KEYS);
 return getExtractor(workUnitState, splitReader, inputSplit, shouldReadKeys);
}

/**
 * Creates an {@link Extractor} for the {@link FileSplit} stored, in serialized form, in the
 * given work unit state.
 *
 * <p>The split is read from the {@code FILE_SPLIT_BYTES_STRING_KEY} property and deserialized;
 * a {@link RecordReader} is then created and initialized for it before delegating to the
 * four-argument {@code getExtractor}.
 *
 * @param workUnitState the work unit state carrying the serialized {@link FileSplit}
 * @return the {@link Extractor} produced by the four-argument {@code getExtractor}
 * @throws IOException if the state holds no serialized {@link FileSplit}, if a called method
 *     fails, or if the thread is interrupted while the record reader is being set up (the
 *     {@link InterruptedException} is attached as the cause and the interrupt flag is restored)
 */
@Override
public Extractor<S, D> getExtractor(WorkUnitState workUnitState) throws IOException {
 if (!workUnitState.contains(FILE_SPLIT_BYTES_STRING_KEY)) {
  throw new IOException("No serialized FileSplit found in WorkUnitState " + workUnitState.getId());
 }
 Configuration configuration = new Configuration();
 FileInputFormat<K, V> fileInputFormat = getFileInputFormat(workUnitState, configuration);
 String fileSplitBytesStr = workUnitState.getProp(FILE_SPLIT_BYTES_STRING_KEY);
 FileSplit fileSplit = (FileSplit) HadoopUtils.deserializeFromString(FileSplit.class, fileSplitBytesStr);
 TaskAttemptContext taskAttemptContext =
   getTaskAttemptContext(configuration, DummyTaskAttemptIDFactory.newTaskAttemptID());
 try {
  RecordReader<K, V> recordReader = fileInputFormat.createRecordReader(fileSplit, taskAttemptContext);
  recordReader.initialize(fileSplit, taskAttemptContext);
  boolean readKeys = workUnitState.getPropAsBoolean(FILE_INPUT_READ_KEYS_KEY, DEFAULT_FILE_INPUT_READ_KEYS);
  return getExtractor(workUnitState, recordReader, fileSplit, readKeys);
 } catch (InterruptedException ie) {
  // The interrupt status is cleared when InterruptedException is thrown; set it again so the
  // interruption is not lost once the exception has been converted to an IOException.
  Thread.currentThread().interrupt();
  throw new IOException(ie);
 }
}

Javadoc

Deserialize a Writable object from a string.

Popular methods of HadoopUtils

getConfFromState
Provides Hadoop configuration given state. It also supports decrypting values on "encryptedPath". No
newConfiguration
renamePath
A wrapper around FileSystem#rename(Path,Path) which throws IOException if FileSystem#rename(Path,Pat
deleteIfExists
A wrapper around FileSystem#delete(Path,boolean) that only deletes a given Path if it is present on
deletePath
A wrapper around FileSystem#delete(Path,boolean) which throws IOException if the given Path exists,
sanitizePath
Remove illegal HDFS path characters from the given path. Illegal characters will be replaced with th
getOptionallyThrottledFileSystem
Calls #getOptionallyThrottledFileSystem(FileSystem,int) parsing the qps from the input State at key #
getStateFromConf
movePath
Moves a src Path from a srcFs FileSystem to a dst Path on a dstFs FileSystem. If the srcFs and the d
getSourceFileSystem
Get a FileSystem object for the uri specified at ConfigurationKeys#SOURCE_FILEBASED_FS_URI.
addGobblinSite
Add "gobblin-site.xml" as a Configuration resource.
copyFile
Copy a file from a srcFs FileSystem to a dstFs FileSystem. The src Path must be a file, that is File

Popular in Java

Running tasks concurrently on multiple threads
scheduleAtFixedRate (Timer)
setScale (BigDecimal)
notifyDataSetChanged (ArrayAdapter)
MalformedURLException (java.net)
This exception is thrown when a program attempts to create a URL from an incorrect specification.
Hashtable (java.util)
A plug-in replacement for JDK1.5 java.util.Hashtable. This version is based on org.cliffc.high_scale
LinkedList (java.util)
Doubly-linked list implementation of the List and Deque interfaces. Implements all optional list oper
TimerTask (java.util)
The TimerTask class represents a task to run at a specified time. The task may be run once or repeat
HttpServletRequest (javax.servlet.http)
Extends the javax.servlet.ServletRequest interface to provide request information for HTTP servlets.
LoggerFactory (org.slf4j)
The LoggerFactory is a utility class producing Loggers for various logging APIs, most notably for lo
Top PhpStorm plugins

How to use deserializeFromString method in org.apache.gobblin.util.HadoopUtils

Best Java code snippets using org.apache.gobblin.util.HadoopUtils.deserializeFromString (Showing top 6 results out of 315)

How to use
deserializeFromString
method
in
org.apache.gobblin.util.HadoopUtils