@Override
public String getDataSource()
{
  return schema.getDataSource();
}
private static IndexIOConfig createIoConfig(TaskToolbox toolbox, DataSchema dataSchema, Interval interval)
{
  return new IndexIOConfig(
      new IngestSegmentFirehoseFactory(
          dataSchema.getDataSource(),
          interval,
          null, // no filter
          // set dimensions and metrics names to make sure that the generated dataSchema is used for the firehose
          dataSchema.getParser().getParseSpec().getDimensionsSpec().getDimensionNames(),
          Arrays.stream(dataSchema.getAggregators()).map(AggregatorFactory::getName).collect(Collectors.toList()),
          toolbox.getIndexIO()
      ),
      false
  );
}
public DataSchema withTransformSpec(TransformSpec transformSpec)
{
  return new DataSchema(dataSource, parser, aggregators, granularitySpec, transformSpec, jsonMapper);
}
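// A minimal usage sketch for the with-er above, not taken from the
// surrounding code: derive a filtered copy of a schema without mutating
// the original. `baseSchema` is an illustrative, pre-built DataSchema,
// and the filter shown is an assumption for demonstration only.
DataSchema filteredSchema = baseSchema.withTransformSpec(
    new TransformSpec(
        new SelectorDimFilter("status", "error", null), // keep only rows where status = "error"
        null                                            // no derived columns
    )
);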
public DataSegment getSegment()
{
  return new DataSegment(
      schema.getDataSource(),
      interval,
      version,
      ImmutableMap.of(),
      Collections.emptyList(),
      Lists.transform(Arrays.asList(schema.getAggregators()), AggregatorFactory::getName),
      shardSpec,
      null,
      0
  );
}
public void verify()
{
  Preconditions.checkNotNull(schema.getDataSchema().getDataSource(), "dataSource");
  Preconditions.checkNotNull(schema.getDataSchema().getParser().getParseSpec(), "parseSpec");
  Preconditions.checkNotNull(schema.getDataSchema().getParser().getParseSpec().getTimestampSpec(), "timestampSpec");
  Preconditions.checkNotNull(schema.getDataSchema().getGranularitySpec(), "granularitySpec");
  Preconditions.checkNotNull(pathSpec, "inputSpec");
  Preconditions.checkNotNull(schema.getTuningConfig().getWorkingPath(), "workingPath");
  Preconditions.checkNotNull(schema.getIOConfig().getSegmentOutputPath(), "segmentOutputPath");
  Preconditions.checkNotNull(schema.getTuningConfig().getVersion(), "version");
}
);

Assert.assertEquals(actual.getDataSource(), "test");

Assert.assertEquals(
    actual.getParser().getParseSpec(),
    new JSONParseSpec(
        new TimestampSpec("xXx", null, null),

Assert.assertArrayEquals(
    actual.getAggregators(),
    new AggregatorFactory[]{
        new DoubleSumAggregatorFactory("metric1", "col1")
    }
);

Assert.assertEquals(
    actual.getGranularitySpec(),
    new ArbitraryGranularitySpec(
        new DurationGranularity(86400000, null),
@Override
protected void setup(Context context)
{
  config = HadoopDruidIndexerConfig.fromConfiguration(context.getConfiguration());
  aggregators = config.getSchema().getDataSchema().getAggregators();
  combiningAggs = new AggregatorFactory[aggregators.length];
  for (int i = 0; i < aggregators.length; ++i) {
    metricNames.add(aggregators[i].getName());
    combiningAggs[i] = aggregators[i].getCombiningFactory();
  }
  typeHelperMap = InputRowSerde.getTypeHelperMap(
      config.getSchema()
            .getDataSchema()
            .getParser()
            .getParseSpec()
            .getDimensionsSpec()
  );
}
schema.getGranularitySpec().isRollup(),
schema.getAggregators(),
mergedTarget,
config.getIndexSpec(),

log.makeAlert("Failed to create marker file for [%s]", schema.getDataSource())
   .addData("interval", sink.getInterval())
   .addData("partitionNum", segment.getShardSpec().getPartitionNum())

log.makeAlert(e, "Failed to persist merged index[%s]", schema.getDataSource())
   .addData("interval", interval)
   .emit();
private SegmentIdWithShardSpec getSegmentIdentifier(long timestamp)
{
  if (!rejectionPolicy.accept(timestamp)) {
    return null;
  }

  final Granularity segmentGranularity = schema.getGranularitySpec().getSegmentGranularity();
  final VersioningPolicy versioningPolicy = config.getVersioningPolicy();

  // Truncate the timestamp to the start of its segment-granularity bucket;
  // all rows falling in the same bucket share one segment identifier.
  DateTime truncatedDateTime = segmentGranularity.bucketStart(DateTimes.utc(timestamp));
  final long truncatedTime = truncatedDateTime.getMillis();

  SegmentIdWithShardSpec retVal = segments.get(truncatedTime);
  if (retVal == null) {
    final Interval interval = new Interval(
        truncatedDateTime,
        segmentGranularity.increment(truncatedDateTime)
    );

    retVal = new SegmentIdWithShardSpec(
        schema.getDataSource(),
        interval,
        versioningPolicy.getVersion(interval),
        config.getShardSpec()
    );
    addSegment(retVal);
  }

  return retVal;
}
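// Illustrative sketch, not from the surrounding code, of the bucketing the
// method above relies on: a granularity maps any timestamp to the interval
// of its enclosing bucket via bucketStart()/increment().
Granularity hourly = Granularities.HOUR;
DateTime start = hourly.bucketStart(DateTimes.of("2019-04-01T12:34:56Z"));
Interval bucket = new Interval(start, hourly.increment(start));
// bucket is 2019-04-01T12:00:00Z/2019-04-01T13:00:00Z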
    .withTimestampSpec(schema.getParser())
    .withQueryGranularity(schema.getGranularitySpec().getQueryGranularity())
    .withDimensionsSpec(schema.getParser())
    .withMetrics(schema.getAggregators())
    .withRollup(schema.getGranularitySpec().isRollup())
    .build();

final IncrementalIndex newIndex = new IncrementalIndex.Builder()
public GranularitySpec getGranularitySpec()
{
  return schema.getDataSchema().getGranularitySpec();
}
);

DataSchema schema = new DataSchema(
    "test",
    parser,
    jsonMapper
);

schema.getParser();
indexMergerV9.mergeQueryableIndex(
    indexes,
    schema.getGranularitySpec().isRollup(),
    schema.getAggregators(),
    fileToUpload,
    config.getIndexSpec(),
    groupId,
    taskResource,
    dataSchema.getDataSource(),
    context
);
this.dataSchema = Preconditions.checkNotNull(dataSchema, "dataSchema");
this.parser = Preconditions.checkNotNull((InputRowParser<ByteBuffer>) dataSchema.getParser(), "parser");
this.tuningConfig = Preconditions.checkNotNull(tuningConfig, "tuningConfig");
this.ioConfig = Preconditions.checkNotNull(ioConfig, "ioConfig");
new DataSchema( "foo", jsonMapper.convertValue( Assert.assertEquals(schema.getDataSchema().getDataSource(), newSchema.getDataSchema().getDataSource()); Assert.assertEquals("/tmp/nonexistent", schema.getTuningConfig().getBasePersistDirectory().toString());
private static IncrementalIndex makeIncrementalIndex(
    Bucket theBucket,
    AggregatorFactory[] aggs,
    HadoopDruidIndexerConfig config,
    Iterable<String> oldDimOrder,
    Map<String, ColumnCapabilitiesImpl> oldCapabilities
)
{
  final HadoopTuningConfig tuningConfig = config.getSchema().getTuningConfig();

  final IncrementalIndexSchema indexSchema = new IncrementalIndexSchema.Builder()
      .withMinTimestamp(theBucket.time.getMillis())
      .withTimestampSpec(config.getSchema().getDataSchema().getParser().getParseSpec().getTimestampSpec())
      .withDimensionsSpec(config.getSchema().getDataSchema().getParser())
      .withQueryGranularity(config.getSchema().getDataSchema().getGranularitySpec().getQueryGranularity())
      .withMetrics(aggs)
      .withRollup(config.getSchema().getDataSchema().getGranularitySpec().isRollup())
      .build();

  IncrementalIndex newIndex = new IncrementalIndex.Builder()
      .setIndexSchema(indexSchema)
      .setReportParseExceptions(!tuningConfig.isIgnoreInvalidRows()) // only used by OffHeapIncrementalIndex
      .setMaxRowCount(tuningConfig.getRowFlushBoundary())
      .setMaxBytesInMemory(TuningConfigs.getMaxBytesInMemoryOrDefault(tuningConfig.getMaxBytesInMemory()))
      .buildOnheap();

  if (oldDimOrder != null && !indexSchema.getDimensionsSpec().hasCustomDimensions()) {
    newIndex.loadDimensionIterable(oldDimOrder, oldCapabilities);
  }

  return newIndex;
}
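// Hypothetical caller sketch for makeIncrementalIndex() above; `bucket`,
// `aggs`, `config`, and `row` are illustrative names, not taken from the
// surrounding code. It shows the usual add-then-check-flush pattern.
IncrementalIndex index = makeIncrementalIndex(bucket, aggs, config, null, null);
index.add(row); // may throw IndexSizeExceededException once the index is full
if (!index.canAppendRow()) {
  // rowFlushBoundary or maxBytesInMemory reached: persist this index
  // and start a fresh one before adding more rows.
}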
public InputRowParser getParser()
{
  return schema.getDataSchema().getParser();
}
new TaskResource("rofl", 2), new FireDepartment( new DataSchema( "foo", null, Assert.assertEquals( Granularities.HOUR, task.getRealtimeIngestionSchema().getDataSchema().getGranularitySpec().getSegmentGranularity() ); Assert.assertTrue(task.getRealtimeIngestionSchema().getTuningConfig().isReportParseExceptions()); ); Assert.assertEquals( task.getRealtimeIngestionSchema().getDataSchema().getGranularitySpec().getSegmentGranularity(), task2.getRealtimeIngestionSchema().getDataSchema().getGranularitySpec().getSegmentGranularity() );
final AggregatorFactory[] cols = config.getSchema().getDataSchema().getAggregators();
if (cols != null) {
  if (useNewAggs) {

config.getSchema().getDataSchema().getTransformSpec()
);
    .getGranularitySpec()
    .bucketIntervals()
    .isPresent();

.collect(Collectors.toMap(Entry::getKey, entry -> entry.getValue().getVersion()));

dataSchema = ingestionSchema.getDataSchema().withGranularitySpec(
    ingestionSchema.getDataSchema()
                   .getGranularitySpec()
                   .withIntervals(
                       JodaUtils.condenseIntervals(