private void initializeSourceForTag(ReduceWork redWork, int tag, ObjectInspector[] ois, ReduceRecordSource[] sources, TableDesc valueTableDesc, String inputName) throws Exception { reducer = redWork.getReducer(); reducer.getParentOperators().clear(); reducer.setParentOperators(null); // clear out any parents as reducer is the root TableDesc keyTableDesc = redWork.getKeyDesc(); Reader reader = inputs.get(inputName).getReader(); sources[tag] = new ReduceRecordSource(); // Only the big table input source should be vectorized (if applicable) // Note this behavior may have to change if we ever implement a vectorized merge join boolean vectorizedRecordSource = (tag == bigTablePosition) && redWork.getVectorMode(); sources[tag].init(jconf, redWork.getReducer(), vectorizedRecordSource, keyTableDesc, valueTableDesc, reader, tag == bigTablePosition, (byte) tag, redWork.getVectorizedRowBatchCtx(), redWork.getVectorizedVertexNum(), redWork.getVectorizedTestingReducerBatchSize()); ois[tag] = sources[tag].getObjectInspector(); }
private boolean pushRecordVector() { try { if (!reader.next()) { return false; } BytesWritable keyWritable = (BytesWritable) reader.getCurrentKey(); valueWritables = reader.getCurrentValues(); processVectorGroup(keyWritable, valueWritables, tag); return true; } catch (Throwable e) { abort = true; if (e instanceof OutOfMemoryError) { // Don't create a new object if we are already out of memory throw (OutOfMemoryError) e; } else { l4j.error(StringUtils.stringifyException(e)); throw new RuntimeException(e); } } }
@Override void run() throws Exception { for (Entry<String, LogicalOutput> outputEntry : outputs.entrySet()) { l4j.info("Starting Output: " + outputEntry.getKey()); if (!isAborted()) { outputEntry.getValue().start(); ((TezKVOutputCollector) outMap.get(outputEntry.getKey())).initialize(); } } // run the operator pipeline startAbortChecks(); while (sources[bigTablePosition].pushRecord()) { addRowAndMaybeCheckAbort(); } }
// Vectorized path: delegate to the group-at-a-time record pump.
return pushRecordVector();
// NOTE(review): when a source's close() returns false, the abort flag is
// cleared and the remaining sources are NOT closed (the loop breaks) — the
// inline comment says this deliberately preserves legacy behavior; confirm
// the un-closed trailing sources are acceptable.
if (isAborted()) { for (ReduceRecordSource rs: sources) { if (!rs.close()) { setAborted(false); // Preserving the old logic. Hmm... break;
// Enable flush-last-record mode on the source — presumably so the final
// buffered group is emitted at close; confirm against ReduceRecordSource.
((ReduceRecordSource) source).setFlushLastRecord(true);
// Vectorized path: delegate to the group-at-a-time record pump.
return pushRecordVector();
// NOTE(review): when a source's close() returns false, the abort flag is
// cleared and the remaining sources are NOT closed (the loop breaks) — the
// inline comment says this deliberately preserves legacy behavior; confirm
// the un-closed trailing sources are acceptable.
if (isAborted()) { for (ReduceRecordSource rs: sources) { if (!rs.close()) { setAborted(false); // Preserving the old logic. Hmm... break;
private void initializeSourceForTag(ReduceWork redWork, int tag, ObjectInspector[] ois, ReduceRecordSource[] sources, TableDesc valueTableDesc, String inputName) throws Exception { reducer = redWork.getReducer(); reducer.getParentOperators().clear(); reducer.setParentOperators(null); // clear out any parents as reducer is the root TableDesc keyTableDesc = redWork.getKeyDesc(); Reader reader = inputs.get(inputName).getReader(); sources[tag] = new ReduceRecordSource(); // Only the big table input source should be vectorized (if applicable) // Note this behavior may have to change if we ever implement a vectorized merge join boolean vectorizedRecordSource = (tag == bigTablePosition) && redWork.getVectorMode(); sources[tag].init(jconf, redWork.getReducer(), vectorizedRecordSource, keyTableDesc, valueTableDesc, reader, tag == bigTablePosition, (byte) tag, redWork.getVectorizedRowBatchCtx(), redWork.getVectorizedVertexNum()); ois[tag] = sources[tag].getObjectInspector(); }
@Override void run() throws Exception { for (Entry<String, LogicalOutput> outputEntry : outputs.entrySet()) { l4j.info("Starting Output: " + outputEntry.getKey()); if (!isAborted()) { outputEntry.getValue().start(); ((TezKVOutputCollector) outMap.get(outputEntry.getKey())).initialize(); } } // run the operator pipeline startAbortChecks(); while (sources[bigTablePosition].pushRecord()) { addRowAndMaybeCheckAbort(); } }
// Feed the current key + values group into the vectorized processing path,
// then report that a record group was pushed.
processVectorGroup(keyWritable, valueWritables, tag); return true; } catch (Throwable e) {
abort = abort && rs.close();
private void initializeSourceForTag(ReduceWork redWork, int tag, ObjectInspector[] ois, ReduceRecordSource[] sources, TableDesc valueTableDesc, String inputName) throws Exception { reducer = redWork.getReducer(); reducer.getParentOperators().clear(); reducer.setParentOperators(null); // clear out any parents as reducer is the root TableDesc keyTableDesc = redWork.getKeyDesc(); KeyValuesReader reader = (KeyValuesReader) inputs.get(inputName).getReader(); sources[tag] = new ReduceRecordSource(); sources[tag].init(jconf, redWork.getReducer(), redWork.getVectorMode(), keyTableDesc, valueTableDesc, reader, tag == bigTablePosition, (byte) tag, redWork.getVectorScratchColumnTypeMap()); ois[tag] = sources[tag].getObjectInspector(); }
@Override void run() throws Exception { for (Entry<String, LogicalOutput> outputEntry : outputs.entrySet()) { l4j.info("Starting Output: " + outputEntry.getKey()); outputEntry.getValue().start(); ((TezKVOutputCollector) outMap.get(outputEntry.getKey())).initialize(); } // run the operator pipeline while (sources[bigTablePosition].pushRecord()) { } }
// Feed the current key + values group into the vectorized processing path,
// then report that a record group was pushed.
processVectorGroup(keyWritable, valueWritables, tag); return true; } catch (Throwable e) {