this.tableInputFormat.setConf(config);
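On its own, the call above is just a delegation; it typically lives inside a wrapper input format that owns a TableInputFormat instance and forwards the job configuration to it. A minimal sketch of such a wrapper, assuming only the HBase MapReduce API (the class and field names here are illustrative, not from the original source):

import org.apache.hadoop.conf.Configurable;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.mapreduce.TableInputFormat;

// Illustrative wrapper: owns a TableInputFormat and passes the job configuration through,
// so the delegate can later resolve the table name, scan, and other settings from it.
public class DelegatingTableInputFormat implements Configurable {

  private final TableInputFormat tableInputFormat = new TableInputFormat();
  private Configuration config;

  @Override
  public void setConf(Configuration config) {
    this.config = config;
    this.tableInputFormat.setConf(config);
  }

  @Override
  public Configuration getConf() {
    return config;
  }
}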
@Test
public void testNonSuccessiveSplitsAreNotMerged() throws IOException {
  JobContext context = mock(JobContext.class);
  Configuration conf = HBaseConfiguration.create();
  conf.set(ClusterConnection.HBASE_CLIENT_CONNECTION_IMPL,
    ConnectionForMergeTesting.class.getName());
  conf.set(TableInputFormat.INPUT_TABLE, "testTable");
  conf.setBoolean(TableInputFormatBase.MAPREDUCE_INPUT_AUTOBALANCE, true);
  when(context.getConfiguration()).thenReturn(conf);

  TableInputFormat tifExclude = new TableInputFormatForMergeTesting();
  tifExclude.setConf(conf);
  // split["b", "c"] is excluded, split["o", "p"] and split["p", "q"] are merged,
  // but split["a", "b"] and split["c", "d"] are not merged.
  assertEquals(ConnectionForMergeTesting.START_KEYS.length - 1 - 1,
    tifExclude.getSplits(context).size());
}
/**
 * Tests the number of input splits for an MR job when a number of mappers per region is
 * specified for TableInputFormatXXX. This test does not run the MR job.
 */
protected void testNumOfSplits(int splitsPerRegion, int expectedNumOfSplits)
    throws IOException, InterruptedException, ClassNotFoundException {
  String jobName = "TestJobForNumOfSplits";
  LOG.info("Before map/reduce startup - job " + jobName);
  Configuration c = new Configuration(TEST_UTIL.getConfiguration());
  Scan scan = new Scan();
  scan.addFamily(INPUT_FAMILYS[0]);
  scan.addFamily(INPUT_FAMILYS[1]);
  c.setInt("hbase.mapreduce.tableinput.mappers.per.region", splitsPerRegion);
  c.set(KEY_STARTROW, "");
  c.set(KEY_LASTROW, "");
  Job job = Job.getInstance(c, jobName);
  TableMapReduceUtil.initTableMapperJob(TABLE_NAME.getNameAsString(), scan, ScanMapper.class,
    ImmutableBytesWritable.class, ImmutableBytesWritable.class, job);
  TableInputFormat tif = new TableInputFormat();
  tif.setConf(job.getConfiguration());
  Assert.assertEquals(TABLE_NAME, table.getName());
  List<InputSplit> splits = tif.getSplits(job);
  Assert.assertEquals(expectedNumOfSplits, splits.size());
}
@Override
public void setConf(Configuration conf) {
  super.setConf(conf);
  if (conf.get(ROW_KEY_DISTRIBUTOR_CLASS) != null) {
    String clazz = conf.get(ROW_KEY_DISTRIBUTOR_CLASS);
    try {
      rowKeyDistributor = (AbstractRowKeyDistributor) Class.forName(clazz).newInstance();
      if (conf.get(ROW_KEY_DISTRIBUTOR_PARAMS) != null) {
        rowKeyDistributor.init(conf.get(ROW_KEY_DISTRIBUTOR_PARAMS));
      }
    } catch (Exception e) {
      throw new RuntimeException("Cannot create row key distributor, "
        + ROW_KEY_DISTRIBUTOR_CLASS + ": " + clazz, e);
    }
  }
}
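For context, the distributor above is normally wired in through the job configuration before this input format is used. A hedged sketch of that wiring, assuming an HBaseWD-style WdTableInputFormat as the declaring class (both the class name and the distributor class string are placeholders, not taken from the snippet):

// Hedged job setup: WdTableInputFormat stands in for the class declaring the setConf(...)
// override above; "com.example.MyRowKeyDistributor" is a placeholder for a concrete
// AbstractRowKeyDistributor implementation.
Configuration conf = HBaseConfiguration.create();
conf.set(TableInputFormat.INPUT_TABLE, "exampleTable");
conf.set(WdTableInputFormat.ROW_KEY_DISTRIBUTOR_CLASS, "com.example.MyRowKeyDistributor");
conf.set(WdTableInputFormat.ROW_KEY_DISTRIBUTOR_PARAMS, "8"); // distributor-specific init string
Job job = Job.getInstance(conf, "scan-with-distributed-row-keys");
job.setInputFormatClass(WdTableInputFormat.class);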
@Override
public void setConf(final Configuration config) {
  this.graph = new FaunusTitanHBaseGraph(
    GraphFactory.generateTitanConfiguration(config, FAUNUS_GRAPH_INPUT_TITAN));
  this.vertexQuery = VertexQueryFilter.create(config);
  this.pathEnabled = config.getBoolean(FaunusCompiler.PATH_ENABLED, false);

  //config.set(TableInputFormat.SCAN_COLUMN_FAMILY, Backend.EDGESTORE_NAME);
  config.set(TableInputFormat.INPUT_TABLE,
    config.get(FAUNUS_GRAPH_INPUT_TITAN_STORAGE_TABLENAME));
  config.set(HConstants.ZOOKEEPER_QUORUM,
    config.get(FAUNUS_GRAPH_INPUT_TITAN_STORAGE_HOSTNAME));
  if (config.get(FAUNUS_GRAPH_INPUT_TITAN_STORAGE_PORT, null) != null)
    config.set(HConstants.ZOOKEEPER_CLIENT_PORT,
      config.get(FAUNUS_GRAPH_INPUT_TITAN_STORAGE_PORT));
  config.set("storage.read-only", "true");
  config.set("autotype", "none");

  Scan scanner = new Scan();
  scanner.addFamily(Backend.EDGESTORE_NAME.getBytes());
  scanner.setFilter(getColumnFilter(this.vertexQuery));
  // TODO (minor): should we set other options in
  // http://hbase.apache.org/apidocs/org/apache/hadoop/hbase/client/Scan.html for optimization?

  Method converter;
  try {
    converter = TableMapReduceUtil.class.getDeclaredMethod("convertScanToString", Scan.class);
    converter.setAccessible(true);
    config.set(TableInputFormat.SCAN, (String) converter.invoke(null, scanner));
  } catch (Exception e) {
    throw new RuntimeException(e);
  }

  this.tableInputFormat.setConf(config);
}
@Override
public org.apache.hadoop.mapred.InputSplit[] getSplits(JobConf job, int numSplits)
    throws IOException {
  inputFormat.setConf(job);
  return convertSplits(inputFormat.getSplits(
    HCatMapRedUtil.createJobContext(job, null, Reporter.NULL)));
}
private TableInputFormat getDelegate(Configuration conf) throws IOException {
  TableInputFormat delegate = new TableInputFormat();
  String tableName = HBaseMetadataProvider.getTableName(dataset.getName());
  conf.set(TableInputFormat.INPUT_TABLE, tableName);
  if (view != null) {
    Job tempJob = new Job();
    Scan scan = ((BaseEntityScanner) view.newEntityScanner()).getScan();
    TableMapReduceUtil.initTableMapperJob(tableName, scan, TableMapper.class, null, null,
      tempJob);
    Configuration tempConf = Hadoop.JobContext.getConfiguration.invoke(tempJob);
    conf.set(SCAN, tempConf.get(SCAN));
  }
  delegate.setConf(conf);
  return delegate;
}
tableInputFormat.setConf(connection.getConfiguration());
tableInputFormat.setScan(scan);
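Standing alone, these two calls assume a Connection and a Scan already exist. A self-contained sketch of that setup, assuming nothing beyond the HBase client and MapReduce APIs (the table name and column family are made up for illustration):

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.hbase.HBaseConfiguration;
import org.apache.hadoop.hbase.client.Connection;
import org.apache.hadoop.hbase.client.ConnectionFactory;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.mapreduce.TableInputFormat;
import org.apache.hadoop.hbase.util.Bytes;

public class TableInputFormatSetup {
  public static void main(String[] args) throws Exception {
    Configuration conf = HBaseConfiguration.create();
    conf.set(TableInputFormat.INPUT_TABLE, "exampleTable"); // illustrative table name
    try (Connection connection = ConnectionFactory.createConnection(conf)) {
      Scan scan = new Scan();
      scan.addFamily(Bytes.toBytes("cf")); // illustrative column family
      TableInputFormat tableInputFormat = new TableInputFormat();
      // Same pattern as the fragment above: configuration first, then the scan object.
      tableInputFormat.setConf(connection.getConfiguration());
      tableInputFormat.setScan(scan);
    }
  }
}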
@Override
public RecordReader<ImmutableBytesWritable, ResultWritable> getRecordReader(
    InputSplit split, JobConf job, Reporter reporter) throws IOException {
  String jobString = job.get(HCatConstants.HCAT_KEY_JOB_INFO);
  InputJobInfo inputJobInfo = (InputJobInfo) HCatUtil.deserialize(jobString);
  String tableName = job.get(TableInputFormat.INPUT_TABLE);
  TableSplit tSplit = (TableSplit) split;
  HbaseSnapshotRecordReader recordReader = new HbaseSnapshotRecordReader(inputJobInfo, job);
  inputFormat.setConf(job);
  Scan inputScan = inputFormat.getScan();
  // TODO: Make the caching configurable by the user
  inputScan.setCaching(200);
  inputScan.setCacheBlocks(false);
  Scan sc = new Scan(inputScan);
  sc.setStartRow(tSplit.getStartRow());
  sc.setStopRow(tSplit.getEndRow());
  recordReader.setScan(sc);
  recordReader.setHTable(new HTable(job, tableName));
  recordReader.init();
  return recordReader;
}
tableInputFormat = new TableInputFormat();
tableInputFormat.setConf(configuration);
inputFormat = tableInputFormat;
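For the assignment above to yield usable splits, the Configuration handed to setConf(...) normally carries at least the table name and, optionally, scan bounds expressed as plain config keys. A hedged fragment showing that preparation with TableInputFormat's public key constants (all key values are illustrative):

Configuration configuration = HBaseConfiguration.create();
configuration.set(TableInputFormat.INPUT_TABLE, "exampleTable");  // required: table to read
configuration.set(TableInputFormat.SCAN_COLUMN_FAMILY, "cf");     // optional: restrict to one family
configuration.set(TableInputFormat.SCAN_ROW_START, "row-000");    // optional: scan lower bound
configuration.set(TableInputFormat.SCAN_ROW_STOP, "row-999");     // optional: scan upper bound

TableInputFormat tableInputFormat = new TableInputFormat();
tableInputFormat.setConf(configuration);
InputFormat<ImmutableBytesWritable, Result> inputFormat = tableInputFormat;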