mirror of https://github.com/apache/druid.git
add config for build v9 directly and update docs
This commit is contained in:
parent
1f2168fae5
commit
82ff98c2bf
|
@ -104,7 +104,8 @@ The spec\_file is a path to a file that contains JSON and an example looks like:
|
||||||
"ignoreInvalidRows" : false,
|
"ignoreInvalidRows" : false,
|
||||||
"jobProperties" : { },
|
"jobProperties" : { },
|
||||||
"combineText" : false,
|
"combineText" : false,
|
||||||
"rowFlushBoundary" : 300000
|
"rowFlushBoundary" : 300000,
|
||||||
|
"buildV9Directly" : false
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
```
|
```
|
||||||
|
@ -205,6 +206,7 @@ The tuningConfig is optional and default parameters will be used if no tuningCon
|
||||||
|ignoreInvalidRows|Boolean|Ignore rows found to have problems.|no (default == false)|
|
|ignoreInvalidRows|Boolean|Ignore rows found to have problems.|no (default == false)|
|
||||||
|useCombiner|Boolean|Use hadoop combiner to merge rows at mapper if possible.|no (default == false)|
|
|useCombiner|Boolean|Use hadoop combiner to merge rows at mapper if possible.|no (default == false)|
|
||||||
|jobProperties|Object|a map of properties to add to the Hadoop job configuration.|no (default == null)|
|
|jobProperties|Object|a map of properties to add to the Hadoop job configuration.|no (default == null)|
|
||||||
|
|buildV9Directly|Boolean|Whether to build v9 index directly instead of building v8 index and convert it to v9 format|no (default = false)|
|
||||||
|
|
||||||
### Partitioning specification
|
### Partitioning specification
|
||||||
|
|
||||||
|
|
|
@ -142,6 +142,7 @@ The tuningConfig is optional and default parameters will be used if no tuningCon
|
||||||
|rejectionPolicy|Object|Controls how data sets the data acceptance policy for creating and handing off segments. More on this below.|no (default=='serverTime')|
|
|rejectionPolicy|Object|Controls how data sets the data acceptance policy for creating and handing off segments. More on this below.|no (default=='serverTime')|
|
||||||
|maxPendingPersists|Integer|Maximum number of persists that can be pending, but not started. If this limit would be exceeded by a new intermediate persist, ingestion will block until the currently-running persist finishes. Maximum heap memory usage for indexing scales with maxRowsInMemory * (2 + maxPendingPersists).|no (default == 0; meaning one persist can be running concurrently with ingestion, and none can be queued up)|
|
|maxPendingPersists|Integer|Maximum number of persists that can be pending, but not started. If this limit would be exceeded by a new intermediate persist, ingestion will block until the currently-running persist finishes. Maximum heap memory usage for indexing scales with maxRowsInMemory * (2 + maxPendingPersists).|no (default == 0; meaning one persist can be running concurrently with ingestion, and none can be queued up)|
|
||||||
|shardSpec|Object|This describes the shard that is represented by this server. This must be specified properly in order to have multiple realtime nodes indexing the same data stream in a [sharded fashion](#sharding).|no (default == 'NoneShardSpec'|
|
|shardSpec|Object|This describes the shard that is represented by this server. This must be specified properly in order to have multiple realtime nodes indexing the same data stream in a [sharded fashion](#sharding).|no (default == 'NoneShardSpec'|
|
||||||
|
|buildV9Directly|Boolean|Whether to build v9 index directly instead of building v8 index and convert it to v9 format|no (default = false)|
|
||||||
|
|
||||||
#### Rejection Policy
|
#### Rejection Policy
|
||||||
|
|
||||||
|
|
|
@ -51,6 +51,7 @@ import io.druid.indexer.path.PathSpec;
|
||||||
import io.druid.initialization.Initialization;
|
import io.druid.initialization.Initialization;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.IndexSpec;
|
import io.druid.segment.IndexSpec;
|
||||||
import io.druid.segment.indexing.granularity.GranularitySpec;
|
import io.druid.segment.indexing.granularity.GranularitySpec;
|
||||||
import io.druid.server.DruidNode;
|
import io.druid.server.DruidNode;
|
||||||
|
@ -89,6 +90,7 @@ public class HadoopDruidIndexerConfig
|
||||||
public static final ObjectMapper JSON_MAPPER;
|
public static final ObjectMapper JSON_MAPPER;
|
||||||
public static final IndexIO INDEX_IO;
|
public static final IndexIO INDEX_IO;
|
||||||
public static final IndexMerger INDEX_MERGER;
|
public static final IndexMerger INDEX_MERGER;
|
||||||
|
public static final IndexMergerV9 INDEX_MERGER_V9;
|
||||||
|
|
||||||
private static final String DEFAULT_WORKING_PATH = "/tmp/druid-indexing";
|
private static final String DEFAULT_WORKING_PATH = "/tmp/druid-indexing";
|
||||||
|
|
||||||
|
@ -112,6 +114,7 @@ public class HadoopDruidIndexerConfig
|
||||||
JSON_MAPPER = injector.getInstance(ObjectMapper.class);
|
JSON_MAPPER = injector.getInstance(ObjectMapper.class);
|
||||||
INDEX_IO = injector.getInstance(IndexIO.class);
|
INDEX_IO = injector.getInstance(IndexIO.class);
|
||||||
INDEX_MERGER = injector.getInstance(IndexMerger.class);
|
INDEX_MERGER = injector.getInstance(IndexMerger.class);
|
||||||
|
INDEX_MERGER_V9 = injector.getInstance(IndexMergerV9.class);
|
||||||
}
|
}
|
||||||
|
|
||||||
public static enum IndexJobCounters
|
public static enum IndexJobCounters
|
||||||
|
@ -351,6 +354,11 @@ public class HadoopDruidIndexerConfig
|
||||||
return schema.getTuningConfig().getShardSpecs().get(bucket.time).get(bucket.partitionNum);
|
return schema.getTuningConfig().getShardSpecs().get(bucket.time).get(bucket.partitionNum);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public boolean isBuildV9Directly()
|
||||||
|
{
|
||||||
|
return schema.getTuningConfig().getBuildV9Directly();
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Job instance should have Configuration set (by calling {@link #addJobProperties(Job)}
|
* Job instance should have Configuration set (by calling {@link #addJobProperties(Job)}
|
||||||
* or via injected system properties) before this method is called. The {@link PathSpec} may
|
* or via injected system properties) before this method is called. The {@link PathSpec} may
|
||||||
|
|
|
@ -42,6 +42,7 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
private static final IndexSpec DEFAULT_INDEX_SPEC = new IndexSpec();
|
private static final IndexSpec DEFAULT_INDEX_SPEC = new IndexSpec();
|
||||||
private static final int DEFAULT_ROW_FLUSH_BOUNDARY = 80000;
|
private static final int DEFAULT_ROW_FLUSH_BOUNDARY = 80000;
|
||||||
private static final boolean DEFAULT_USE_COMBINER = false;
|
private static final boolean DEFAULT_USE_COMBINER = false;
|
||||||
|
private static final Boolean DEFAULT_BUILD_V9_DIRECTLY = Boolean.FALSE;
|
||||||
|
|
||||||
public static HadoopTuningConfig makeDefaultTuningConfig()
|
public static HadoopTuningConfig makeDefaultTuningConfig()
|
||||||
{
|
{
|
||||||
|
@ -59,7 +60,8 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
null,
|
null,
|
||||||
false,
|
false,
|
||||||
false,
|
false,
|
||||||
null
|
null,
|
||||||
|
DEFAULT_BUILD_V9_DIRECTLY
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -76,6 +78,7 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
private final Map<String, String> jobProperties;
|
private final Map<String, String> jobProperties;
|
||||||
private final boolean combineText;
|
private final boolean combineText;
|
||||||
private final boolean useCombiner;
|
private final boolean useCombiner;
|
||||||
|
private final Boolean buildV9Directly;
|
||||||
|
|
||||||
@JsonCreator
|
@JsonCreator
|
||||||
public HadoopTuningConfig(
|
public HadoopTuningConfig(
|
||||||
|
@ -93,7 +96,8 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
final @JsonProperty("combineText") boolean combineText,
|
final @JsonProperty("combineText") boolean combineText,
|
||||||
final @JsonProperty("useCombiner") Boolean useCombiner,
|
final @JsonProperty("useCombiner") Boolean useCombiner,
|
||||||
// See https://github.com/druid-io/druid/pull/1922
|
// See https://github.com/druid-io/druid/pull/1922
|
||||||
final @JsonProperty("rowFlushBoundary") Integer maxRowsInMemoryCOMPAT
|
final @JsonProperty("rowFlushBoundary") Integer maxRowsInMemoryCOMPAT,
|
||||||
|
final @JsonProperty("buildV9Directly") Boolean buildV9Directly
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
this.workingPath = workingPath;
|
this.workingPath = workingPath;
|
||||||
|
@ -111,6 +115,7 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
: ImmutableMap.copyOf(jobProperties));
|
: ImmutableMap.copyOf(jobProperties));
|
||||||
this.combineText = combineText;
|
this.combineText = combineText;
|
||||||
this.useCombiner = useCombiner == null ? DEFAULT_USE_COMBINER : useCombiner.booleanValue();
|
this.useCombiner = useCombiner == null ? DEFAULT_USE_COMBINER : useCombiner.booleanValue();
|
||||||
|
this.buildV9Directly = buildV9Directly == null ? DEFAULT_BUILD_V9_DIRECTLY : buildV9Directly;
|
||||||
}
|
}
|
||||||
|
|
||||||
@JsonProperty
|
@JsonProperty
|
||||||
|
@ -191,6 +196,11 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
return useCombiner;
|
return useCombiner;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@JsonProperty
|
||||||
|
public Boolean getBuildV9Directly() {
|
||||||
|
return buildV9Directly;
|
||||||
|
}
|
||||||
|
|
||||||
public HadoopTuningConfig withWorkingPath(String path)
|
public HadoopTuningConfig withWorkingPath(String path)
|
||||||
{
|
{
|
||||||
return new HadoopTuningConfig(
|
return new HadoopTuningConfig(
|
||||||
|
@ -207,7 +217,8 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
jobProperties,
|
jobProperties,
|
||||||
combineText,
|
combineText,
|
||||||
useCombiner,
|
useCombiner,
|
||||||
null
|
null,
|
||||||
|
buildV9Directly
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -227,7 +238,8 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
jobProperties,
|
jobProperties,
|
||||||
combineText,
|
combineText,
|
||||||
useCombiner,
|
useCombiner,
|
||||||
null
|
null,
|
||||||
|
buildV9Directly
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -247,7 +259,8 @@ public class HadoopTuningConfig implements TuningConfig
|
||||||
jobProperties,
|
jobProperties,
|
||||||
combineText,
|
combineText,
|
||||||
useCombiner,
|
useCombiner,
|
||||||
null
|
null,
|
||||||
|
buildV9Directly
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -467,10 +467,16 @@ public class IndexGeneratorJob implements Jobby
|
||||||
final ProgressIndicator progressIndicator
|
final ProgressIndicator progressIndicator
|
||||||
) throws IOException
|
) throws IOException
|
||||||
{
|
{
|
||||||
|
if (config.isBuildV9Directly()) {
|
||||||
|
return HadoopDruidIndexerConfig.INDEX_MERGER_V9.persist(
|
||||||
|
index, interval, file, null, config.getIndexSpec(), progressIndicator
|
||||||
|
);
|
||||||
|
} else {
|
||||||
return HadoopDruidIndexerConfig.INDEX_MERGER.persist(
|
return HadoopDruidIndexerConfig.INDEX_MERGER.persist(
|
||||||
index, interval, file, null, config.getIndexSpec(), progressIndicator
|
index, interval, file, null, config.getIndexSpec(), progressIndicator
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
protected File mergeQueryableIndex(
|
protected File mergeQueryableIndex(
|
||||||
final List<QueryableIndex> indexes,
|
final List<QueryableIndex> indexes,
|
||||||
|
@ -479,10 +485,16 @@ public class IndexGeneratorJob implements Jobby
|
||||||
ProgressIndicator progressIndicator
|
ProgressIndicator progressIndicator
|
||||||
) throws IOException
|
) throws IOException
|
||||||
{
|
{
|
||||||
|
if (config.isBuildV9Directly()) {
|
||||||
|
return HadoopDruidIndexerConfig.INDEX_MERGER_V9.mergeQueryableIndex(
|
||||||
|
indexes, aggs, file, config.getIndexSpec(), progressIndicator
|
||||||
|
);
|
||||||
|
} else {
|
||||||
return HadoopDruidIndexerConfig.INDEX_MERGER.mergeQueryableIndex(
|
return HadoopDruidIndexerConfig.INDEX_MERGER.mergeQueryableIndex(
|
||||||
indexes, aggs, file, config.getIndexSpec(), progressIndicator
|
indexes, aggs, file, config.getIndexSpec(), progressIndicator
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
protected void setup(Context context)
|
protected void setup(Context context)
|
||||||
|
|
|
@ -381,6 +381,7 @@ public class BatchDeltaIngestionTest
|
||||||
null,
|
null,
|
||||||
false,
|
false,
|
||||||
false,
|
false,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
|
|
@ -160,6 +160,7 @@ public class DetermineHashedPartitionsJobTest
|
||||||
null,
|
null,
|
||||||
false,
|
false,
|
||||||
false,
|
false,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
)
|
)
|
||||||
);
|
);
|
||||||
|
|
|
@ -264,6 +264,7 @@ public class DeterminePartitionsJobTest
|
||||||
null,
|
null,
|
||||||
false,
|
false,
|
||||||
false,
|
false,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
|
|
@ -207,6 +207,7 @@ public class HadoopDruidIndexerConfigTest
|
||||||
null,
|
null,
|
||||||
false,
|
false,
|
||||||
false,
|
false,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
)
|
)
|
||||||
);
|
);
|
||||||
|
|
|
@ -53,6 +53,7 @@ public class HadoopTuningConfigTest
|
||||||
null,
|
null,
|
||||||
true,
|
true,
|
||||||
true,
|
true,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
);
|
);
|
||||||
|
|
||||||
|
|
|
@ -395,6 +395,7 @@ public class IndexGeneratorJobTest
|
||||||
ImmutableMap.of(JobContext.NUM_REDUCES, "0"), //verifies that set num reducers is ignored
|
ImmutableMap.of(JobContext.NUM_REDUCES, "0"), //verifies that set num reducers is ignored
|
||||||
false,
|
false,
|
||||||
useCombiner,
|
useCombiner,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
|
|
@ -115,6 +115,7 @@ public class JobHelperTest
|
||||||
),
|
),
|
||||||
false,
|
false,
|
||||||
false,
|
false,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
|
|
@ -120,7 +120,7 @@ public class GranularityPathSpecTest
|
||||||
jsonMapper
|
jsonMapper
|
||||||
),
|
),
|
||||||
new HadoopIOConfig(null, null, null),
|
new HadoopIOConfig(null, null, null),
|
||||||
new HadoopTuningConfig(null, null, null, null, null, null, false, false, false, false, null, false, false, null)
|
new HadoopTuningConfig(null, null, null, null, null, null, false, false, false, false, null, false, false, null, null)
|
||||||
);
|
);
|
||||||
|
|
||||||
granularityPathSpec.setDataGranularity(Granularity.HOUR);
|
granularityPathSpec.setDataGranularity(Granularity.HOUR);
|
||||||
|
|
|
@ -201,6 +201,7 @@ public class HadoopConverterJobTest
|
||||||
null,
|
null,
|
||||||
false,
|
false,
|
||||||
false,
|
false,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
|
|
@ -37,6 +37,7 @@ import io.druid.indexing.common.task.Task;
|
||||||
import io.druid.query.QueryRunnerFactoryConglomerate;
|
import io.druid.query.QueryRunnerFactoryConglomerate;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.loading.DataSegmentArchiver;
|
import io.druid.segment.loading.DataSegmentArchiver;
|
||||||
import io.druid.segment.loading.DataSegmentKiller;
|
import io.druid.segment.loading.DataSegmentKiller;
|
||||||
import io.druid.segment.loading.DataSegmentMover;
|
import io.druid.segment.loading.DataSegmentMover;
|
||||||
|
@ -80,7 +81,7 @@ public class TaskToolbox
|
||||||
private final IndexIO indexIO;
|
private final IndexIO indexIO;
|
||||||
private final Cache cache;
|
private final Cache cache;
|
||||||
private final CacheConfig cacheConfig;
|
private final CacheConfig cacheConfig;
|
||||||
|
private final IndexMergerV9 indexMergerV9;
|
||||||
|
|
||||||
public TaskToolbox(
|
public TaskToolbox(
|
||||||
TaskConfig config,
|
TaskConfig config,
|
||||||
|
@ -102,7 +103,8 @@ public class TaskToolbox
|
||||||
IndexMerger indexMerger,
|
IndexMerger indexMerger,
|
||||||
IndexIO indexIO,
|
IndexIO indexIO,
|
||||||
Cache cache,
|
Cache cache,
|
||||||
CacheConfig cacheConfig
|
CacheConfig cacheConfig,
|
||||||
|
IndexMergerV9 indexMergerV9
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
this.config = config;
|
this.config = config;
|
||||||
|
@ -125,6 +127,7 @@ public class TaskToolbox
|
||||||
this.indexIO = Preconditions.checkNotNull(indexIO, "Null IndexIO");
|
this.indexIO = Preconditions.checkNotNull(indexIO, "Null IndexIO");
|
||||||
this.cache = cache;
|
this.cache = cache;
|
||||||
this.cacheConfig = cacheConfig;
|
this.cacheConfig = cacheConfig;
|
||||||
|
this.indexMergerV9 = Preconditions.checkNotNull(indexMergerV9, "Null IndexMergerV9");
|
||||||
}
|
}
|
||||||
|
|
||||||
public TaskConfig getConfig()
|
public TaskConfig getConfig()
|
||||||
|
@ -247,4 +250,8 @@ public class TaskToolbox
|
||||||
{
|
{
|
||||||
return cacheConfig;
|
return cacheConfig;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public IndexMergerV9 getIndexMergerV9() {
|
||||||
|
return indexMergerV9;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -34,6 +34,7 @@ import io.druid.indexing.common.task.Task;
|
||||||
import io.druid.query.QueryRunnerFactoryConglomerate;
|
import io.druid.query.QueryRunnerFactoryConglomerate;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.loading.DataSegmentArchiver;
|
import io.druid.segment.loading.DataSegmentArchiver;
|
||||||
import io.druid.segment.loading.DataSegmentKiller;
|
import io.druid.segment.loading.DataSegmentKiller;
|
||||||
import io.druid.segment.loading.DataSegmentMover;
|
import io.druid.segment.loading.DataSegmentMover;
|
||||||
|
@ -67,6 +68,7 @@ public class TaskToolboxFactory
|
||||||
private final IndexIO indexIO;
|
private final IndexIO indexIO;
|
||||||
private final Cache cache;
|
private final Cache cache;
|
||||||
private final CacheConfig cacheConfig;
|
private final CacheConfig cacheConfig;
|
||||||
|
private final IndexMergerV9 indexMergerV9;
|
||||||
|
|
||||||
@Inject
|
@Inject
|
||||||
public TaskToolboxFactory(
|
public TaskToolboxFactory(
|
||||||
|
@ -87,7 +89,8 @@ public class TaskToolboxFactory
|
||||||
IndexMerger indexMerger,
|
IndexMerger indexMerger,
|
||||||
IndexIO indexIO,
|
IndexIO indexIO,
|
||||||
Cache cache,
|
Cache cache,
|
||||||
CacheConfig cacheConfig
|
CacheConfig cacheConfig,
|
||||||
|
IndexMergerV9 indexMergerV9
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
this.config = config;
|
this.config = config;
|
||||||
|
@ -108,6 +111,7 @@ public class TaskToolboxFactory
|
||||||
this.indexIO = Preconditions.checkNotNull(indexIO, "Null IndexIO");
|
this.indexIO = Preconditions.checkNotNull(indexIO, "Null IndexIO");
|
||||||
this.cache = cache;
|
this.cache = cache;
|
||||||
this.cacheConfig = cacheConfig;
|
this.cacheConfig = cacheConfig;
|
||||||
|
this.indexMergerV9 = indexMergerV9;
|
||||||
}
|
}
|
||||||
|
|
||||||
public TaskToolbox build(Task task)
|
public TaskToolbox build(Task task)
|
||||||
|
@ -133,7 +137,8 @@ public class TaskToolboxFactory
|
||||||
indexMerger,
|
indexMerger,
|
||||||
indexIO,
|
indexIO,
|
||||||
cache,
|
cache,
|
||||||
cacheConfig
|
cacheConfig,
|
||||||
|
indexMergerV9
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -48,6 +48,7 @@ import io.druid.indexing.common.TaskStatus;
|
||||||
import io.druid.indexing.common.TaskToolbox;
|
import io.druid.indexing.common.TaskToolbox;
|
||||||
import io.druid.indexing.common.index.YeOldePlumberSchool;
|
import io.druid.indexing.common.index.YeOldePlumberSchool;
|
||||||
import io.druid.query.aggregation.hyperloglog.HyperLogLogCollector;
|
import io.druid.query.aggregation.hyperloglog.HyperLogLogCollector;
|
||||||
|
import io.druid.segment.IndexMerger;
|
||||||
import io.druid.segment.IndexSpec;
|
import io.druid.segment.IndexSpec;
|
||||||
import io.druid.segment.indexing.DataSchema;
|
import io.druid.segment.indexing.DataSchema;
|
||||||
import io.druid.segment.indexing.IOConfig;
|
import io.druid.segment.indexing.IOConfig;
|
||||||
|
@ -134,7 +135,8 @@ public class IndexTask extends AbstractFixedIntervalTask
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
shardSpec,
|
shardSpec,
|
||||||
indexSpec
|
indexSpec,
|
||||||
|
null
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -353,12 +355,15 @@ public class IndexTask extends AbstractFixedIntervalTask
|
||||||
final FireDepartmentMetrics metrics = new FireDepartmentMetrics();
|
final FireDepartmentMetrics metrics = new FireDepartmentMetrics();
|
||||||
final Firehose firehose = firehoseFactory.connect(ingestionSchema.getDataSchema().getParser());
|
final Firehose firehose = firehoseFactory.connect(ingestionSchema.getDataSchema().getParser());
|
||||||
final Supplier<Committer> committerSupplier = Committers.supplierFromFirehose(firehose);
|
final Supplier<Committer> committerSupplier = Committers.supplierFromFirehose(firehose);
|
||||||
|
final IndexMerger indexMerger = ingestionSchema.getTuningConfig().getBuildV9Directly()
|
||||||
|
? toolbox.getIndexMergerV9()
|
||||||
|
: toolbox.getIndexMerger();
|
||||||
final Plumber plumber = new YeOldePlumberSchool(
|
final Plumber plumber = new YeOldePlumberSchool(
|
||||||
interval,
|
interval,
|
||||||
version,
|
version,
|
||||||
wrappedDataSegmentPusher,
|
wrappedDataSegmentPusher,
|
||||||
tmpDir,
|
tmpDir,
|
||||||
toolbox.getIndexMerger(),
|
indexMerger,
|
||||||
toolbox.getIndexIO()
|
toolbox.getIndexIO()
|
||||||
).findPlumber(
|
).findPlumber(
|
||||||
schema,
|
schema,
|
||||||
|
@ -434,7 +439,7 @@ public class IndexTask extends AbstractFixedIntervalTask
|
||||||
|
|
||||||
this.dataSchema = dataSchema;
|
this.dataSchema = dataSchema;
|
||||||
this.ioConfig = ioConfig;
|
this.ioConfig = ioConfig;
|
||||||
this.tuningConfig = tuningConfig == null ? new IndexTuningConfig(0, 0, null, null) : tuningConfig;
|
this.tuningConfig = tuningConfig == null ? new IndexTuningConfig(0, 0, null, null, null) : tuningConfig;
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
@ -485,18 +490,21 @@ public class IndexTask extends AbstractFixedIntervalTask
|
||||||
private static final int DEFAULT_TARGET_PARTITION_SIZE = 5000000;
|
private static final int DEFAULT_TARGET_PARTITION_SIZE = 5000000;
|
||||||
private static final int DEFAULT_ROW_FLUSH_BOUNDARY = 500000;
|
private static final int DEFAULT_ROW_FLUSH_BOUNDARY = 500000;
|
||||||
private static final IndexSpec DEFAULT_INDEX_SPEC = new IndexSpec();
|
private static final IndexSpec DEFAULT_INDEX_SPEC = new IndexSpec();
|
||||||
|
private static final Boolean DEFAULT_BUILD_V9_DIRECTLY = Boolean.FALSE;
|
||||||
|
|
||||||
private final int targetPartitionSize;
|
private final int targetPartitionSize;
|
||||||
private final int rowFlushBoundary;
|
private final int rowFlushBoundary;
|
||||||
private final int numShards;
|
private final int numShards;
|
||||||
private final IndexSpec indexSpec;
|
private final IndexSpec indexSpec;
|
||||||
|
private final Boolean buildV9Directly;
|
||||||
|
|
||||||
@JsonCreator
|
@JsonCreator
|
||||||
public IndexTuningConfig(
|
public IndexTuningConfig(
|
||||||
@JsonProperty("targetPartitionSize") int targetPartitionSize,
|
@JsonProperty("targetPartitionSize") int targetPartitionSize,
|
||||||
@JsonProperty("rowFlushBoundary") int rowFlushBoundary,
|
@JsonProperty("rowFlushBoundary") int rowFlushBoundary,
|
||||||
@JsonProperty("numShards") @Nullable Integer numShards,
|
@JsonProperty("numShards") @Nullable Integer numShards,
|
||||||
@JsonProperty("indexSpec") @Nullable IndexSpec indexSpec
|
@JsonProperty("indexSpec") @Nullable IndexSpec indexSpec,
|
||||||
|
@JsonProperty("buildV9Directly") Boolean buildV9Directly
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
this.targetPartitionSize = targetPartitionSize == 0 ? DEFAULT_TARGET_PARTITION_SIZE : targetPartitionSize;
|
this.targetPartitionSize = targetPartitionSize == 0 ? DEFAULT_TARGET_PARTITION_SIZE : targetPartitionSize;
|
||||||
|
@ -508,6 +516,7 @@ public class IndexTask extends AbstractFixedIntervalTask
|
||||||
this.targetPartitionSize == -1 || this.numShards == -1,
|
this.targetPartitionSize == -1 || this.numShards == -1,
|
||||||
"targetPartitionsSize and shardCount both cannot be set"
|
"targetPartitionsSize and shardCount both cannot be set"
|
||||||
);
|
);
|
||||||
|
this.buildV9Directly = buildV9Directly == null ? DEFAULT_BUILD_V9_DIRECTLY : buildV9Directly;
|
||||||
}
|
}
|
||||||
|
|
||||||
@JsonProperty
|
@JsonProperty
|
||||||
|
@ -533,5 +542,11 @@ public class IndexTask extends AbstractFixedIntervalTask
|
||||||
{
|
{
|
||||||
return indexSpec;
|
return indexSpec;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@JsonProperty
|
||||||
|
public Boolean getBuildV9Directly()
|
||||||
|
{
|
||||||
|
return buildV9Directly;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -47,6 +47,7 @@ import io.druid.query.QueryRunner;
|
||||||
import io.druid.query.QueryRunnerFactory;
|
import io.druid.query.QueryRunnerFactory;
|
||||||
import io.druid.query.QueryRunnerFactoryConglomerate;
|
import io.druid.query.QueryRunnerFactoryConglomerate;
|
||||||
import io.druid.query.QueryToolChest;
|
import io.druid.query.QueryToolChest;
|
||||||
|
import io.druid.segment.IndexMerger;
|
||||||
import io.druid.segment.indexing.DataSchema;
|
import io.druid.segment.indexing.DataSchema;
|
||||||
import io.druid.segment.indexing.RealtimeIOConfig;
|
import io.druid.segment.indexing.RealtimeIOConfig;
|
||||||
import io.druid.segment.indexing.RealtimeTuningConfig;
|
import io.druid.segment.indexing.RealtimeTuningConfig;
|
||||||
|
@ -286,6 +287,9 @@ public class RealtimeIndexTask extends AbstractTask
|
||||||
);
|
);
|
||||||
this.queryRunnerFactoryConglomerate = toolbox.getQueryRunnerFactoryConglomerate();
|
this.queryRunnerFactoryConglomerate = toolbox.getQueryRunnerFactoryConglomerate();
|
||||||
|
|
||||||
|
IndexMerger indexMerger = spec.getTuningConfig().getBuildV9Directly()
|
||||||
|
? toolbox.getIndexMergerV9()
|
||||||
|
: toolbox.getIndexMerger();
|
||||||
// NOTE: This pusher selects path based purely on global configuration and the DataSegment, which means
|
// NOTE: This pusher selects path based purely on global configuration and the DataSegment, which means
|
||||||
// NOTE: that redundant realtime tasks will upload to the same location. This can cause index.zip and
|
// NOTE: that redundant realtime tasks will upload to the same location. This can cause index.zip and
|
||||||
// NOTE: descriptor.json to mismatch, or it can cause historical nodes to load different instances of the
|
// NOTE: descriptor.json to mismatch, or it can cause historical nodes to load different instances of the
|
||||||
|
@ -298,7 +302,7 @@ public class RealtimeIndexTask extends AbstractTask
|
||||||
segmentPublisher,
|
segmentPublisher,
|
||||||
toolbox.getSegmentHandoffNotifierFactory(),
|
toolbox.getSegmentHandoffNotifierFactory(),
|
||||||
toolbox.getQueryExecutorService(),
|
toolbox.getQueryExecutorService(),
|
||||||
toolbox.getIndexMerger(),
|
indexMerger,
|
||||||
toolbox.getIndexIO(),
|
toolbox.getIndexIO(),
|
||||||
toolbox.getCache(),
|
toolbox.getCache(),
|
||||||
toolbox.getCacheConfig(),
|
toolbox.getCacheConfig(),
|
||||||
|
|
|
@ -31,6 +31,7 @@ import io.druid.indexing.common.task.Task;
|
||||||
import io.druid.query.QueryRunnerFactoryConglomerate;
|
import io.druid.query.QueryRunnerFactoryConglomerate;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.loading.DataSegmentArchiver;
|
import io.druid.segment.loading.DataSegmentArchiver;
|
||||||
import io.druid.segment.loading.DataSegmentKiller;
|
import io.druid.segment.loading.DataSegmentKiller;
|
||||||
import io.druid.segment.loading.DataSegmentMover;
|
import io.druid.segment.loading.DataSegmentMover;
|
||||||
|
@ -77,6 +78,7 @@ public class TaskToolboxTest
|
||||||
private SegmentLoaderLocalCacheManager mockSegmentLoaderLocalCacheManager = EasyMock.createMock(SegmentLoaderLocalCacheManager.class);
|
private SegmentLoaderLocalCacheManager mockSegmentLoaderLocalCacheManager = EasyMock.createMock(SegmentLoaderLocalCacheManager.class);
|
||||||
private Task task = EasyMock.createMock(Task.class);
|
private Task task = EasyMock.createMock(Task.class);
|
||||||
private IndexMerger mockIndexMerger = EasyMock.createMock(IndexMerger.class);
|
private IndexMerger mockIndexMerger = EasyMock.createMock(IndexMerger.class);
|
||||||
|
private IndexMergerV9 mockIndexMergerV9 = EasyMock.createMock(IndexMergerV9.class);
|
||||||
private IndexIO mockIndexIO = EasyMock.createMock(IndexIO.class);
|
private IndexIO mockIndexIO = EasyMock.createMock(IndexIO.class);
|
||||||
private Cache mockCache = EasyMock.createMock(Cache.class);
|
private Cache mockCache = EasyMock.createMock(Cache.class);
|
||||||
private CacheConfig mockCacheConfig = EasyMock.createMock(CacheConfig.class);
|
private CacheConfig mockCacheConfig = EasyMock.createMock(CacheConfig.class);
|
||||||
|
@ -109,7 +111,8 @@ public class TaskToolboxTest
|
||||||
mockIndexMerger,
|
mockIndexMerger,
|
||||||
mockIndexIO,
|
mockIndexIO,
|
||||||
mockCache,
|
mockCache,
|
||||||
mockCacheConfig
|
mockCacheConfig,
|
||||||
|
mockIndexMergerV9
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -28,6 +28,7 @@ import io.druid.guice.ServerModule;
|
||||||
import io.druid.jackson.DefaultObjectMapper;
|
import io.druid.jackson.DefaultObjectMapper;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.column.ColumnConfig;
|
import io.druid.segment.column.ColumnConfig;
|
||||||
|
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
|
@ -39,6 +40,7 @@ public class TestUtils
|
||||||
{
|
{
|
||||||
private final ObjectMapper jsonMapper;
|
private final ObjectMapper jsonMapper;
|
||||||
private final IndexMerger indexMerger;
|
private final IndexMerger indexMerger;
|
||||||
|
private final IndexMergerV9 indexMergerV9;
|
||||||
private final IndexIO indexIO;
|
private final IndexIO indexIO;
|
||||||
|
|
||||||
public TestUtils()
|
public TestUtils()
|
||||||
|
@ -56,6 +58,7 @@ public class TestUtils
|
||||||
}
|
}
|
||||||
);
|
);
|
||||||
indexMerger = new IndexMerger(jsonMapper, indexIO);
|
indexMerger = new IndexMerger(jsonMapper, indexIO);
|
||||||
|
indexMergerV9 = new IndexMergerV9(jsonMapper, indexIO);
|
||||||
|
|
||||||
final List<? extends Module> list = new ServerModule().getJacksonModules();
|
final List<? extends Module> list = new ServerModule().getJacksonModules();
|
||||||
for (Module module : list) {
|
for (Module module : list) {
|
||||||
|
@ -80,6 +83,10 @@ public class TestUtils
|
||||||
return indexMerger;
|
return indexMerger;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public IndexMergerV9 getTestIndexMergerV9() {
|
||||||
|
return indexMergerV9;
|
||||||
|
}
|
||||||
|
|
||||||
public IndexIO getTestIndexIO()
|
public IndexIO getTestIndexIO()
|
||||||
{
|
{
|
||||||
return indexIO;
|
return indexIO;
|
||||||
|
|
|
@ -39,6 +39,7 @@ import io.druid.query.aggregation.AggregatorFactory;
|
||||||
import io.druid.query.aggregation.LongSumAggregatorFactory;
|
import io.druid.query.aggregation.LongSumAggregatorFactory;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.IndexSpec;
|
import io.druid.segment.IndexSpec;
|
||||||
import io.druid.segment.indexing.DataSchema;
|
import io.druid.segment.indexing.DataSchema;
|
||||||
import io.druid.segment.indexing.RealtimeTuningConfig;
|
import io.druid.segment.indexing.RealtimeTuningConfig;
|
||||||
|
@ -70,6 +71,7 @@ public class IndexTaskTest
|
||||||
private final IndexSpec indexSpec;
|
private final IndexSpec indexSpec;
|
||||||
private final ObjectMapper jsonMapper;
|
private final ObjectMapper jsonMapper;
|
||||||
private IndexMerger indexMerger;
|
private IndexMerger indexMerger;
|
||||||
|
private IndexMergerV9 indexMergerV9;
|
||||||
private IndexIO indexIO;
|
private IndexIO indexIO;
|
||||||
|
|
||||||
public IndexTaskTest()
|
public IndexTaskTest()
|
||||||
|
@ -78,6 +80,7 @@ public class IndexTaskTest
|
||||||
TestUtils testUtils = new TestUtils();
|
TestUtils testUtils = new TestUtils();
|
||||||
jsonMapper = testUtils.getTestObjectMapper();
|
jsonMapper = testUtils.getTestObjectMapper();
|
||||||
indexMerger = testUtils.getTestIndexMerger();
|
indexMerger = testUtils.getTestIndexMerger();
|
||||||
|
indexMergerV9 = testUtils.getTestIndexMergerV9();
|
||||||
indexIO = testUtils.getTestIndexIO();
|
indexIO = testUtils.getTestIndexIO();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -140,7 +143,8 @@ public class IndexTaskTest
|
||||||
2,
|
2,
|
||||||
0,
|
0,
|
||||||
null,
|
null,
|
||||||
indexSpec
|
indexSpec,
|
||||||
|
null
|
||||||
)
|
)
|
||||||
),
|
),
|
||||||
jsonMapper,
|
jsonMapper,
|
||||||
|
@ -252,7 +256,7 @@ public class IndexTaskTest
|
||||||
return segment;
|
return segment;
|
||||||
}
|
}
|
||||||
}, null, null, null, null, null, null, null, null, null, null, temporaryFolder.newFolder(),
|
}, null, null, null, null, null, null, null, null, null, null, temporaryFolder.newFolder(),
|
||||||
indexMerger, indexIO, null, null
|
indexMerger, indexIO, null, null, indexMergerV9
|
||||||
)
|
)
|
||||||
);
|
);
|
||||||
|
|
||||||
|
@ -332,7 +336,8 @@ public class IndexTaskTest
|
||||||
100,
|
100,
|
||||||
1000,
|
1000,
|
||||||
null,
|
null,
|
||||||
new IndexSpec()
|
new IndexSpec(),
|
||||||
|
null
|
||||||
);
|
);
|
||||||
RealtimeTuningConfig realtimeTuningConfig = IndexTask.convertTuningConfig(
|
RealtimeTuningConfig realtimeTuningConfig = IndexTask.convertTuningConfig(
|
||||||
spec,
|
spec,
|
||||||
|
|
|
@ -571,6 +571,7 @@ public class RealtimeIndexTaskTest
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
);
|
);
|
||||||
return new RealtimeIndexTask(
|
return new RealtimeIndexTask(
|
||||||
|
@ -715,7 +716,8 @@ public class RealtimeIndexTaskTest
|
||||||
testUtils.getTestIndexMerger(),
|
testUtils.getTestIndexMerger(),
|
||||||
testUtils.getTestIndexIO(),
|
testUtils.getTestIndexIO(),
|
||||||
MapCache.create(1024),
|
MapCache.create(1024),
|
||||||
new CacheConfig()
|
new CacheConfig(),
|
||||||
|
testUtils.getTestIndexMergerV9()
|
||||||
);
|
);
|
||||||
|
|
||||||
return toolboxFactory.build(task);
|
return toolboxFactory.build(task);
|
||||||
|
|
|
@ -91,7 +91,7 @@ public class TaskSerdeTest
|
||||||
jsonMapper
|
jsonMapper
|
||||||
),
|
),
|
||||||
new IndexTask.IndexIOConfig(new LocalFirehoseFactory(new File("lol"), "rofl", null)),
|
new IndexTask.IndexIOConfig(new LocalFirehoseFactory(new File("lol"), "rofl", null)),
|
||||||
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec)
|
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec, null)
|
||||||
),
|
),
|
||||||
jsonMapper,
|
jsonMapper,
|
||||||
null
|
null
|
||||||
|
@ -132,7 +132,7 @@ public class TaskSerdeTest
|
||||||
jsonMapper
|
jsonMapper
|
||||||
),
|
),
|
||||||
new IndexTask.IndexIOConfig(new LocalFirehoseFactory(new File("lol"), "rofl", null)),
|
new IndexTask.IndexIOConfig(new LocalFirehoseFactory(new File("lol"), "rofl", null)),
|
||||||
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec)
|
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec, null)
|
||||||
),
|
),
|
||||||
jsonMapper,
|
jsonMapper,
|
||||||
null
|
null
|
||||||
|
@ -332,7 +332,8 @@ public class TaskSerdeTest
|
||||||
null,
|
null,
|
||||||
1,
|
1,
|
||||||
new NoneShardSpec(),
|
new NoneShardSpec(),
|
||||||
indexSpec
|
indexSpec,
|
||||||
|
null
|
||||||
)
|
)
|
||||||
),
|
),
|
||||||
null
|
null
|
||||||
|
|
|
@ -64,6 +64,7 @@ import io.druid.query.aggregation.LongSumAggregatorFactory;
|
||||||
import io.druid.query.filter.SelectorDimFilter;
|
import io.druid.query.filter.SelectorDimFilter;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.IndexSpec;
|
import io.druid.segment.IndexSpec;
|
||||||
import io.druid.segment.incremental.IncrementalIndexSchema;
|
import io.druid.segment.incremental.IncrementalIndexSchema;
|
||||||
import io.druid.segment.incremental.OnheapIncrementalIndex;
|
import io.druid.segment.incremental.OnheapIncrementalIndex;
|
||||||
|
@ -109,12 +110,14 @@ public class IngestSegmentFirehoseFactoryTest
|
||||||
{
|
{
|
||||||
private static final ObjectMapper MAPPER;
|
private static final ObjectMapper MAPPER;
|
||||||
private static final IndexMerger INDEX_MERGER;
|
private static final IndexMerger INDEX_MERGER;
|
||||||
|
private static final IndexMergerV9 INDEX_MERGER_V9;
|
||||||
private static final IndexIO INDEX_IO;
|
private static final IndexIO INDEX_IO;
|
||||||
|
|
||||||
static {
|
static {
|
||||||
TestUtils testUtils = new TestUtils();
|
TestUtils testUtils = new TestUtils();
|
||||||
MAPPER = setupInjectablesInObjectMapper(testUtils.getTestObjectMapper());
|
MAPPER = setupInjectablesInObjectMapper(testUtils.getTestObjectMapper());
|
||||||
INDEX_MERGER = testUtils.getTestIndexMerger();
|
INDEX_MERGER = testUtils.getTestIndexMerger();
|
||||||
|
INDEX_MERGER_V9 = testUtils.getTestIndexMergerV9();
|
||||||
INDEX_IO = testUtils.getTestIndexIO();
|
INDEX_IO = testUtils.getTestIndexIO();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -274,7 +277,8 @@ public class IngestSegmentFirehoseFactoryTest
|
||||||
INDEX_MERGER,
|
INDEX_MERGER,
|
||||||
INDEX_IO,
|
INDEX_IO,
|
||||||
null,
|
null,
|
||||||
null
|
null,
|
||||||
|
INDEX_MERGER_V9
|
||||||
);
|
);
|
||||||
Collection<Object[]> values = new LinkedList<>();
|
Collection<Object[]> values = new LinkedList<>();
|
||||||
for (InputRowParser parser : Arrays.<InputRowParser>asList(
|
for (InputRowParser parser : Arrays.<InputRowParser>asList(
|
||||||
|
|
|
@ -55,6 +55,7 @@ import io.druid.query.aggregation.LongSumAggregatorFactory;
|
||||||
import io.druid.query.filter.NoopDimFilter;
|
import io.druid.query.filter.NoopDimFilter;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.IndexSpec;
|
import io.druid.segment.IndexSpec;
|
||||||
import io.druid.segment.incremental.IncrementalIndexSchema;
|
import io.druid.segment.incremental.IncrementalIndexSchema;
|
||||||
import io.druid.segment.incremental.IndexSizeExceededException;
|
import io.druid.segment.incremental.IndexSizeExceededException;
|
||||||
|
@ -111,12 +112,14 @@ public class IngestSegmentFirehoseFactoryTimelineTest
|
||||||
private static final ObjectMapper MAPPER;
|
private static final ObjectMapper MAPPER;
|
||||||
private static final IndexMerger INDEX_MERGER;
|
private static final IndexMerger INDEX_MERGER;
|
||||||
private static final IndexIO INDEX_IO;
|
private static final IndexIO INDEX_IO;
|
||||||
|
private static final IndexMergerV9 INDEX_MERGER_V9;
|
||||||
|
|
||||||
static {
|
static {
|
||||||
TestUtils testUtils = new TestUtils();
|
TestUtils testUtils = new TestUtils();
|
||||||
MAPPER = IngestSegmentFirehoseFactoryTest.setupInjectablesInObjectMapper(testUtils.getTestObjectMapper());
|
MAPPER = IngestSegmentFirehoseFactoryTest.setupInjectablesInObjectMapper(testUtils.getTestObjectMapper());
|
||||||
INDEX_MERGER = testUtils.getTestIndexMerger();
|
INDEX_MERGER = testUtils.getTestIndexMerger();
|
||||||
INDEX_IO = testUtils.getTestIndexIO();
|
INDEX_IO = testUtils.getTestIndexIO();
|
||||||
|
INDEX_MERGER_V9 = testUtils.getTestIndexMergerV9();
|
||||||
}
|
}
|
||||||
|
|
||||||
public IngestSegmentFirehoseFactoryTimelineTest(
|
public IngestSegmentFirehoseFactoryTimelineTest(
|
||||||
|
@ -334,7 +337,8 @@ public class IngestSegmentFirehoseFactoryTimelineTest
|
||||||
INDEX_MERGER,
|
INDEX_MERGER,
|
||||||
INDEX_IO,
|
INDEX_IO,
|
||||||
null,
|
null,
|
||||||
null
|
null,
|
||||||
|
INDEX_MERGER_V9
|
||||||
);
|
);
|
||||||
final Injector injector = Guice.createInjector(
|
final Injector injector = Guice.createInjector(
|
||||||
new Module()
|
new Module()
|
||||||
|
|
|
@ -82,6 +82,7 @@ import io.druid.query.aggregation.DoubleSumAggregatorFactory;
|
||||||
import io.druid.query.aggregation.LongSumAggregatorFactory;
|
import io.druid.query.aggregation.LongSumAggregatorFactory;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.IndexSpec;
|
import io.druid.segment.IndexSpec;
|
||||||
import io.druid.segment.indexing.DataSchema;
|
import io.druid.segment.indexing.DataSchema;
|
||||||
import io.druid.segment.indexing.RealtimeIOConfig;
|
import io.druid.segment.indexing.RealtimeIOConfig;
|
||||||
|
@ -132,12 +133,14 @@ public class TaskLifecycleTest
|
||||||
{
|
{
|
||||||
private static final ObjectMapper MAPPER;
|
private static final ObjectMapper MAPPER;
|
||||||
private static final IndexMerger INDEX_MERGER;
|
private static final IndexMerger INDEX_MERGER;
|
||||||
|
private static final IndexMergerV9 INDEX_MERGER_V9;
|
||||||
private static final IndexIO INDEX_IO;
|
private static final IndexIO INDEX_IO;
|
||||||
|
|
||||||
static {
|
static {
|
||||||
TestUtils testUtils = new TestUtils();
|
TestUtils testUtils = new TestUtils();
|
||||||
MAPPER = testUtils.getTestObjectMapper();
|
MAPPER = testUtils.getTestObjectMapper();
|
||||||
INDEX_MERGER = testUtils.getTestIndexMerger();
|
INDEX_MERGER = testUtils.getTestIndexMerger();
|
||||||
|
INDEX_MERGER_V9 = testUtils.getTestIndexMergerV9();
|
||||||
INDEX_IO = testUtils.getTestIndexIO();
|
INDEX_IO = testUtils.getTestIndexIO();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -532,7 +535,8 @@ public class TaskLifecycleTest
|
||||||
INDEX_MERGER,
|
INDEX_MERGER,
|
||||||
INDEX_IO,
|
INDEX_IO,
|
||||||
MapCache.create(0),
|
MapCache.create(0),
|
||||||
FireDepartmentTest.NO_CACHE_CONFIG
|
FireDepartmentTest.NO_CACHE_CONFIG,
|
||||||
|
INDEX_MERGER_V9
|
||||||
);
|
);
|
||||||
tr = new ThreadPoolTaskRunner(tb, taskConfig, emitter);
|
tr = new ThreadPoolTaskRunner(tb, taskConfig, emitter);
|
||||||
tq = new TaskQueue(tqc, ts, tr, tac, tl, emitter);
|
tq = new TaskQueue(tqc, ts, tr, tac, tl, emitter);
|
||||||
|
@ -565,7 +569,7 @@ public class TaskLifecycleTest
|
||||||
mapper
|
mapper
|
||||||
),
|
),
|
||||||
new IndexTask.IndexIOConfig(new MockFirehoseFactory(false)),
|
new IndexTask.IndexIOConfig(new MockFirehoseFactory(false)),
|
||||||
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec)
|
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec, null)
|
||||||
),
|
),
|
||||||
mapper,
|
mapper,
|
||||||
null
|
null
|
||||||
|
@ -623,7 +627,7 @@ public class TaskLifecycleTest
|
||||||
mapper
|
mapper
|
||||||
),
|
),
|
||||||
new IndexTask.IndexIOConfig(new MockExceptionalFirehoseFactory()),
|
new IndexTask.IndexIOConfig(new MockExceptionalFirehoseFactory()),
|
||||||
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec)
|
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec, null)
|
||||||
),
|
),
|
||||||
mapper,
|
mapper,
|
||||||
null
|
null
|
||||||
|
@ -969,7 +973,7 @@ public class TaskLifecycleTest
|
||||||
mapper
|
mapper
|
||||||
),
|
),
|
||||||
new IndexTask.IndexIOConfig(new MockFirehoseFactory(false)),
|
new IndexTask.IndexIOConfig(new MockFirehoseFactory(false)),
|
||||||
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec)
|
new IndexTask.IndexTuningConfig(10000, 10, -1, indexSpec, null)
|
||||||
),
|
),
|
||||||
mapper,
|
mapper,
|
||||||
null
|
null
|
||||||
|
@ -1080,6 +1084,7 @@ public class TaskLifecycleTest
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
);
|
);
|
||||||
FireDepartment fireDepartment = new FireDepartment(dataSchema, realtimeIOConfig, realtimeTuningConfig);
|
FireDepartment fireDepartment = new FireDepartment(dataSchema, realtimeIOConfig, realtimeTuningConfig);
|
||||||
|
|
|
@ -41,6 +41,7 @@ import io.druid.indexing.overlord.ThreadPoolTaskRunner;
|
||||||
import io.druid.indexing.worker.config.WorkerConfig;
|
import io.druid.indexing.worker.config.WorkerConfig;
|
||||||
import io.druid.segment.IndexIO;
|
import io.druid.segment.IndexIO;
|
||||||
import io.druid.segment.IndexMerger;
|
import io.druid.segment.IndexMerger;
|
||||||
|
import io.druid.segment.IndexMergerV9;
|
||||||
import io.druid.segment.loading.SegmentLoaderConfig;
|
import io.druid.segment.loading.SegmentLoaderConfig;
|
||||||
import io.druid.segment.loading.SegmentLoaderLocalCacheManager;
|
import io.druid.segment.loading.SegmentLoaderLocalCacheManager;
|
||||||
import io.druid.segment.loading.StorageLocationConfig;
|
import io.druid.segment.loading.StorageLocationConfig;
|
||||||
|
@ -80,6 +81,7 @@ public class WorkerTaskMonitorTest
|
||||||
private Worker worker;
|
private Worker worker;
|
||||||
private ObjectMapper jsonMapper;
|
private ObjectMapper jsonMapper;
|
||||||
private IndexMerger indexMerger;
|
private IndexMerger indexMerger;
|
||||||
|
private IndexMergerV9 indexMergerV9;
|
||||||
private IndexIO indexIO;
|
private IndexIO indexIO;
|
||||||
|
|
||||||
public WorkerTaskMonitorTest()
|
public WorkerTaskMonitorTest()
|
||||||
|
@ -87,6 +89,7 @@ public class WorkerTaskMonitorTest
|
||||||
TestUtils testUtils = new TestUtils();
|
TestUtils testUtils = new TestUtils();
|
||||||
jsonMapper = testUtils.getTestObjectMapper();
|
jsonMapper = testUtils.getTestObjectMapper();
|
||||||
indexMerger = testUtils.getTestIndexMerger();
|
indexMerger = testUtils.getTestIndexMerger();
|
||||||
|
indexMergerV9 = testUtils.getTestIndexMergerV9();
|
||||||
indexIO = testUtils.getTestIndexIO();
|
indexIO = testUtils.getTestIndexIO();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -183,7 +186,8 @@ public class WorkerTaskMonitorTest
|
||||||
indexMerger,
|
indexMerger,
|
||||||
indexIO,
|
indexIO,
|
||||||
null,
|
null,
|
||||||
null
|
null,
|
||||||
|
indexMergerV9
|
||||||
),
|
),
|
||||||
taskConfig,
|
taskConfig,
|
||||||
new NoopServiceEmitter()
|
new NoopServiceEmitter()
|
||||||
|
|
|
@ -104,12 +104,12 @@ public class IndexMerger
|
||||||
{
|
{
|
||||||
private static final Logger log = new Logger(IndexMerger.class);
|
private static final Logger log = new Logger(IndexMerger.class);
|
||||||
|
|
||||||
private static final SerializerUtils serializerUtils = new SerializerUtils();
|
protected static final SerializerUtils serializerUtils = new SerializerUtils();
|
||||||
private static final int INVALID_ROW = -1;
|
protected static final int INVALID_ROW = -1;
|
||||||
private static final Splitter SPLITTER = Splitter.on(",");
|
protected static final Splitter SPLITTER = Splitter.on(",");
|
||||||
|
|
||||||
private final ObjectMapper mapper;
|
protected final ObjectMapper mapper;
|
||||||
private final IndexIO indexIO;
|
protected final IndexIO indexIO;
|
||||||
|
|
||||||
@Inject
|
@Inject
|
||||||
public IndexMerger(
|
public IndexMerger(
|
||||||
|
@ -473,7 +473,7 @@ public class IndexMerger
|
||||||
return makeIndexFiles(indexes, outDir, progress, mergedDimensions, mergedMetrics, null, rowMergerFn, indexSpec);
|
return makeIndexFiles(indexes, outDir, progress, mergedDimensions, mergedMetrics, null, rowMergerFn, indexSpec);
|
||||||
}
|
}
|
||||||
|
|
||||||
private File makeIndexFiles(
|
protected File makeIndexFiles(
|
||||||
final List<IndexableAdapter> indexes,
|
final List<IndexableAdapter> indexes,
|
||||||
final File outDir,
|
final File outDir,
|
||||||
final ProgressIndicator progress,
|
final ProgressIndicator progress,
|
||||||
|
|
|
@ -100,335 +100,21 @@ import java.util.Map;
|
||||||
import java.util.Set;
|
import java.util.Set;
|
||||||
import java.util.TreeSet;
|
import java.util.TreeSet;
|
||||||
|
|
||||||
public class IndexMergerV9
|
public class IndexMergerV9 extends IndexMerger
|
||||||
{
|
{
|
||||||
private static final Logger log = new Logger(IndexMergerV9.class);
|
private static final Logger log = new Logger(IndexMergerV9.class);
|
||||||
|
|
||||||
private static final SerializerUtils serializerUtils = new SerializerUtils();
|
|
||||||
private static final int INVALID_ROW = -1;
|
|
||||||
private static final Splitter SPLITTER = Splitter.on(",");
|
|
||||||
|
|
||||||
private final ObjectMapper mapper;
|
|
||||||
private final IndexIO indexIO;
|
|
||||||
|
|
||||||
@Inject
|
@Inject
|
||||||
public IndexMergerV9(
|
public IndexMergerV9(
|
||||||
ObjectMapper mapper,
|
ObjectMapper mapper,
|
||||||
IndexIO indexIO
|
IndexIO indexIO
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
this.mapper = Preconditions.checkNotNull(mapper, "null ObjectMapper");
|
super(mapper, indexIO);
|
||||||
this.indexIO = Preconditions.checkNotNull(indexIO, "null IndexIO");
|
|
||||||
}
|
}
|
||||||
|
|
||||||
public File persist(
|
|
||||||
final IncrementalIndex index,
|
|
||||||
File outDir,
|
|
||||||
Map<String, Object> segmentMetadata,
|
|
||||||
IndexSpec indexSpec
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
return persist(index, index.getInterval(), outDir, segmentMetadata, indexSpec);
|
|
||||||
}
|
|
||||||
|
|
||||||
public File persist(
|
|
||||||
final IncrementalIndex index,
|
|
||||||
final Interval dataInterval,
|
|
||||||
File outDir,
|
|
||||||
Map<String, Object> segmentMetadata,
|
|
||||||
IndexSpec indexSpec
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
return persist(
|
|
||||||
index,
|
|
||||||
dataInterval,
|
|
||||||
outDir,
|
|
||||||
segmentMetadata,
|
|
||||||
indexSpec,
|
|
||||||
new BaseProgressIndicator()
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
public File persist(
|
|
||||||
final IncrementalIndex index,
|
|
||||||
final Interval dataInterval,
|
|
||||||
File outDir,
|
|
||||||
Map<String, Object> segmentMetadata,
|
|
||||||
IndexSpec indexSpec,
|
|
||||||
ProgressIndicator progress
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
if (index.isEmpty()) {
|
|
||||||
throw new IAE("Trying to persist an empty index!");
|
|
||||||
}
|
|
||||||
|
|
||||||
final long firstTimestamp = index.getMinTime().getMillis();
|
|
||||||
final long lastTimestamp = index.getMaxTime().getMillis();
|
|
||||||
if (!(dataInterval.contains(firstTimestamp) && dataInterval.contains(lastTimestamp))) {
|
|
||||||
throw new IAE(
|
|
||||||
"interval[%s] does not encapsulate the full range of timestamps[%s, %s]",
|
|
||||||
dataInterval,
|
|
||||||
new DateTime(firstTimestamp),
|
|
||||||
new DateTime(lastTimestamp)
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
if (!outDir.exists()) {
|
|
||||||
outDir.mkdirs();
|
|
||||||
}
|
|
||||||
if (!outDir.isDirectory()) {
|
|
||||||
throw new ISE("Can only persist to directories, [%s] wasn't a directory", outDir);
|
|
||||||
}
|
|
||||||
|
|
||||||
log.info("Starting persist for interval[%s], rows[%,d]", dataInterval, index.size());
|
|
||||||
return merge(
|
|
||||||
Arrays.<IndexableAdapter>asList(
|
|
||||||
new IncrementalIndexAdapter(
|
|
||||||
dataInterval,
|
|
||||||
index,
|
|
||||||
indexSpec.getBitmapSerdeFactory().getBitmapFactory()
|
|
||||||
)
|
|
||||||
),
|
|
||||||
index.getMetricAggs(),
|
|
||||||
outDir,
|
|
||||||
segmentMetadata,
|
|
||||||
indexSpec,
|
|
||||||
progress
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
public File convert(final File inDir, final File outDir, final IndexSpec indexSpec) throws IOException
|
|
||||||
{
|
|
||||||
return convert(inDir, outDir, indexSpec, new BaseProgressIndicator());
|
|
||||||
}
|
|
||||||
|
|
||||||
public File convert(
|
|
||||||
final File inDir, final File outDir, final IndexSpec indexSpec, final ProgressIndicator progress
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
try (QueryableIndex index = indexIO.loadIndex(inDir)) {
|
|
||||||
final IndexableAdapter adapter = new QueryableIndexIndexableAdapter(index);
|
|
||||||
return makeIndexFiles(
|
|
||||||
ImmutableList.of(adapter),
|
|
||||||
outDir,
|
|
||||||
progress,
|
|
||||||
Lists.newArrayList(adapter.getDimensionNames()),
|
|
||||||
Lists.newArrayList(adapter.getMetricNames()),
|
|
||||||
null,
|
|
||||||
new Function<ArrayList<Iterable<Rowboat>>, Iterable<Rowboat>>()
|
|
||||||
{
|
|
||||||
@Nullable
|
|
||||||
@Override
|
@Override
|
||||||
public Iterable<Rowboat> apply(ArrayList<Iterable<Rowboat>> input)
|
protected File makeIndexFiles(
|
||||||
{
|
|
||||||
return input.get(0);
|
|
||||||
}
|
|
||||||
},
|
|
||||||
indexSpec
|
|
||||||
);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
public File mergeQueryableIndex(
|
|
||||||
List<QueryableIndex> indexes, final AggregatorFactory[] metricAggs, File outDir, IndexSpec indexSpec
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
return mergeQueryableIndex(indexes, metricAggs, outDir, indexSpec, new BaseProgressIndicator());
|
|
||||||
}
|
|
||||||
|
|
||||||
public File mergeQueryableIndex(
|
|
||||||
List<QueryableIndex> indexes,
|
|
||||||
final AggregatorFactory[] metricAggs,
|
|
||||||
File outDir,
|
|
||||||
IndexSpec indexSpec,
|
|
||||||
ProgressIndicator progress
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
// We are materializing the list for performance reasons. Lists.transform
|
|
||||||
// only creates a "view" of the original list, meaning the function gets
|
|
||||||
// applied every time you access an element.
|
|
||||||
List<IndexableAdapter> indexAdapteres = Lists.newArrayList(
|
|
||||||
Iterables.transform(
|
|
||||||
indexes,
|
|
||||||
new Function<QueryableIndex, IndexableAdapter>()
|
|
||||||
{
|
|
||||||
@Override
|
|
||||||
public IndexableAdapter apply(final QueryableIndex input)
|
|
||||||
{
|
|
||||||
return new QueryableIndexIndexableAdapter(input);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
)
|
|
||||||
);
|
|
||||||
return merge(
|
|
||||||
indexAdapteres,
|
|
||||||
metricAggs,
|
|
||||||
outDir,
|
|
||||||
null,
|
|
||||||
indexSpec,
|
|
||||||
progress
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
public File merge(
|
|
||||||
List<IndexableAdapter> indexes,
|
|
||||||
final AggregatorFactory[] metricAggs,
|
|
||||||
File outDir,
|
|
||||||
Map<String, Object> segmentMetadata,
|
|
||||||
IndexSpec indexSpec
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
return merge(indexes, metricAggs, outDir, segmentMetadata, indexSpec, new BaseProgressIndicator());
|
|
||||||
}
|
|
||||||
|
|
||||||
public File merge(
|
|
||||||
List<IndexableAdapter> adapters,
|
|
||||||
final AggregatorFactory[] metricAggs,
|
|
||||||
File outDir,
|
|
||||||
Map<String, Object> segmentMetadata,
|
|
||||||
IndexSpec indexSpec,
|
|
||||||
ProgressIndicator progress
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
FileUtils.deleteDirectory(outDir);
|
|
||||||
if (!outDir.mkdirs()) {
|
|
||||||
throw new ISE("Couldn't make outdir[%s].", outDir);
|
|
||||||
}
|
|
||||||
|
|
||||||
final List<String> mergedDimensions = IndexMerger.getMergedDimensions(adapters);
|
|
||||||
|
|
||||||
final List<String> mergedMetrics = Lists.transform(
|
|
||||||
IndexMerger.mergeIndexed(
|
|
||||||
Lists.newArrayList(
|
|
||||||
FunctionalIterable
|
|
||||||
.create(adapters)
|
|
||||||
.transform(
|
|
||||||
new Function<IndexableAdapter, Iterable<String>>()
|
|
||||||
{
|
|
||||||
@Override
|
|
||||||
public Iterable<String> apply(@Nullable IndexableAdapter input)
|
|
||||||
{
|
|
||||||
return input.getMetricNames();
|
|
||||||
}
|
|
||||||
}
|
|
||||||
)
|
|
||||||
.concat(Arrays.<Iterable<String>>asList(new IndexMerger.AggFactoryStringIndexed(metricAggs)))
|
|
||||||
)
|
|
||||||
),
|
|
||||||
new Function<String, String>()
|
|
||||||
{
|
|
||||||
@Override
|
|
||||||
public String apply(@Nullable String input)
|
|
||||||
{
|
|
||||||
return input;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
);
|
|
||||||
if (mergedMetrics.size() != metricAggs.length) {
|
|
||||||
throw new IAE("Bad number of metrics[%d], expected [%d]", mergedMetrics.size(), metricAggs.length);
|
|
||||||
}
|
|
||||||
|
|
||||||
final AggregatorFactory[] sortedMetricAggs = new AggregatorFactory[mergedMetrics.size()];
|
|
||||||
for (int i = 0; i < metricAggs.length; i++) {
|
|
||||||
AggregatorFactory metricAgg = metricAggs[i];
|
|
||||||
sortedMetricAggs[mergedMetrics.indexOf(metricAgg.getName())] = metricAgg;
|
|
||||||
}
|
|
||||||
|
|
||||||
for (int i = 0; i < mergedMetrics.size(); i++) {
|
|
||||||
if (!sortedMetricAggs[i].getName().equals(mergedMetrics.get(i))) {
|
|
||||||
throw new IAE(
|
|
||||||
"Metric mismatch, index[%d] [%s] != [%s]",
|
|
||||||
i,
|
|
||||||
metricAggs[i].getName(),
|
|
||||||
mergedMetrics.get(i)
|
|
||||||
);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
Function<ArrayList<Iterable<Rowboat>>, Iterable<Rowboat>> rowMergerFn =
|
|
||||||
new Function<ArrayList<Iterable<Rowboat>>, Iterable<Rowboat>>()
|
|
||||||
{
|
|
||||||
@Override
|
|
||||||
public Iterable<Rowboat> apply(
|
|
||||||
@Nullable ArrayList<Iterable<Rowboat>> boats
|
|
||||||
)
|
|
||||||
{
|
|
||||||
return CombiningIterable.create(
|
|
||||||
new MergeIterable<>(
|
|
||||||
Ordering.<Rowboat>natural().nullsFirst(),
|
|
||||||
boats
|
|
||||||
),
|
|
||||||
Ordering.<Rowboat>natural().nullsFirst(),
|
|
||||||
new IndexMerger.RowboatMergeFunction(sortedMetricAggs)
|
|
||||||
);
|
|
||||||
}
|
|
||||||
};
|
|
||||||
|
|
||||||
return makeIndexFiles(
|
|
||||||
adapters, outDir, progress, mergedDimensions, mergedMetrics, segmentMetadata, rowMergerFn, indexSpec
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
public File append(
|
|
||||||
List<IndexableAdapter> indexes, File outDir, IndexSpec indexSpec
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
return append(indexes, outDir, indexSpec, new BaseProgressIndicator());
|
|
||||||
}
|
|
||||||
|
|
||||||
public File append(
|
|
||||||
List<IndexableAdapter> indexes, File outDir, IndexSpec indexSpec, ProgressIndicator progress
|
|
||||||
) throws IOException
|
|
||||||
{
|
|
||||||
FileUtils.deleteDirectory(outDir);
|
|
||||||
if (!outDir.mkdirs()) {
|
|
||||||
throw new ISE("Couldn't make outdir[%s].", outDir);
|
|
||||||
}
|
|
||||||
|
|
||||||
final List<String> mergedDimensions = IndexMerger.getMergedDimensions(indexes);
|
|
||||||
|
|
||||||
final List<String> mergedMetrics = IndexMerger.mergeIndexed(
|
|
||||||
Lists.transform(
|
|
||||||
indexes,
|
|
||||||
new Function<IndexableAdapter, Iterable<String>>()
|
|
||||||
{
|
|
||||||
@Override
|
|
||||||
public Iterable<String> apply(@Nullable IndexableAdapter input)
|
|
||||||
{
|
|
||||||
return Iterables.transform(
|
|
||||||
input.getMetricNames(),
|
|
||||||
new Function<String, String>()
|
|
||||||
{
|
|
||||||
@Override
|
|
||||||
public String apply(@Nullable String input)
|
|
||||||
{
|
|
||||||
return input;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
)
|
|
||||||
);
|
|
||||||
|
|
||||||
Function<ArrayList<Iterable<Rowboat>>, Iterable<Rowboat>> rowMergerFn = new Function<ArrayList<Iterable<Rowboat>>, Iterable<Rowboat>>()
|
|
||||||
{
|
|
||||||
@Override
|
|
||||||
public Iterable<Rowboat> apply(
|
|
||||||
@Nullable final ArrayList<Iterable<Rowboat>> boats
|
|
||||||
)
|
|
||||||
{
|
|
||||||
return new MergeIterable<Rowboat>(
|
|
||||||
Ordering.<Rowboat>natural().nullsFirst(),
|
|
||||||
boats
|
|
||||||
);
|
|
||||||
}
|
|
||||||
};
|
|
||||||
|
|
||||||
return makeIndexFiles(indexes, outDir, progress, mergedDimensions, mergedMetrics, null, rowMergerFn, indexSpec);
|
|
||||||
}
|
|
||||||
|
|
||||||
private File makeIndexFiles(
|
|
||||||
final List<IndexableAdapter> adapters,
|
final List<IndexableAdapter> adapters,
|
||||||
final File outDir,
|
final File outDir,
|
||||||
final ProgressIndicator progress,
|
final ProgressIndicator progress,
|
||||||
|
@ -829,7 +515,7 @@ public class IndexMergerV9
|
||||||
List<Iterable<Integer>> convertedInverteds = Lists.newArrayListWithCapacity(adapters.size());
|
List<Iterable<Integer>> convertedInverteds = Lists.newArrayListWithCapacity(adapters.size());
|
||||||
for (int j = 0; j < adapters.size(); ++j) {
|
for (int j = 0; j < adapters.size(); ++j) {
|
||||||
convertedInverteds.add(
|
convertedInverteds.add(
|
||||||
new IndexMerger.ConvertingIndexedInts(
|
new ConvertingIndexedInts(
|
||||||
bitmapIndexSeeker[j].seek(dimVal), rowNumConversions.get(j)
|
bitmapIndexSeeker[j].seek(dimVal), rowNumConversions.get(j)
|
||||||
)
|
)
|
||||||
);
|
);
|
||||||
|
@ -1094,7 +780,7 @@ public class IndexMergerV9
|
||||||
}
|
}
|
||||||
|
|
||||||
boats.add(
|
boats.add(
|
||||||
new IndexMerger.MMappedIndexRowIterable(
|
new MMappedIndexRowIterable(
|
||||||
Iterables.transform(
|
Iterables.transform(
|
||||||
adapters.get(i).getRows(),
|
adapters.get(i).getRows(),
|
||||||
new Function<Rowboat, Rowboat>()
|
new Function<Rowboat, Rowboat>()
|
||||||
|
@ -1177,14 +863,14 @@ public class IndexMergerV9
|
||||||
List<Indexed<String>> dimValueLookups = Lists.newArrayListWithCapacity(adapters.size());
|
List<Indexed<String>> dimValueLookups = Lists.newArrayListWithCapacity(adapters.size());
|
||||||
|
|
||||||
// each converter converts dim values of this dimension to global dictionary
|
// each converter converts dim values of this dimension to global dictionary
|
||||||
IndexMerger.DimValueConverter[] converters = new IndexMerger.DimValueConverter[adapters.size()];
|
DimValueConverter[] converters = new DimValueConverter[adapters.size()];
|
||||||
|
|
||||||
boolean existNullColumn = false;
|
boolean existNullColumn = false;
|
||||||
for (int i = 0; i < adapters.size(); i++) {
|
for (int i = 0; i < adapters.size(); i++) {
|
||||||
Indexed<String> dimValues = adapters.get(i).getDimValueLookup(dimension);
|
Indexed<String> dimValues = adapters.get(i).getDimValueLookup(dimension);
|
||||||
if (!IndexMerger.isNullColumn(dimValues)) {
|
if (!isNullColumn(dimValues)) {
|
||||||
dimValueLookups.add(dimValues);
|
dimValueLookups.add(dimValues);
|
||||||
converters[i] = new IndexMerger.DimValueConverter(dimValues);
|
converters[i] = new DimValueConverter(dimValues);
|
||||||
} else {
|
} else {
|
||||||
existNullColumn = true;
|
existNullColumn = true;
|
||||||
}
|
}
|
||||||
|
@ -1233,7 +919,7 @@ public class IndexMergerV9
|
||||||
writer.write(value);
|
writer.write(value);
|
||||||
|
|
||||||
for (int i = 0; i < adapters.size(); i++) {
|
for (int i = 0; i < adapters.size(); i++) {
|
||||||
IndexMerger.DimValueConverter converter = converters[i];
|
DimValueConverter converter = converters[i];
|
||||||
if (converter != null) {
|
if (converter != null) {
|
||||||
converter.convert(value, cardinality);
|
converter.convert(value, cardinality);
|
||||||
}
|
}
|
||||||
|
@ -1259,7 +945,7 @@ public class IndexMergerV9
|
||||||
|
|
||||||
// make the conversion
|
// make the conversion
|
||||||
for (int i = 0; i < adapters.size(); ++i) {
|
for (int i = 0; i < adapters.size(); ++i) {
|
||||||
IndexMerger.DimValueConverter converter = converters[i];
|
DimValueConverter converter = converters[i];
|
||||||
if (converter != null) {
|
if (converter != null) {
|
||||||
dimConversions.get(i).put(dimension, converters[i].getConversionBuffer());
|
dimConversions.get(i).put(dimension, converters[i].getConversionBuffer());
|
||||||
}
|
}
|
||||||
|
|
|
@ -46,6 +46,7 @@ public class RealtimeTuningConfig implements TuningConfig
|
||||||
private static final int defaultMaxPendingPersists = 0;
|
private static final int defaultMaxPendingPersists = 0;
|
||||||
private static final ShardSpec defaultShardSpec = new NoneShardSpec();
|
private static final ShardSpec defaultShardSpec = new NoneShardSpec();
|
||||||
private static final IndexSpec defaultIndexSpec = new IndexSpec();
|
private static final IndexSpec defaultIndexSpec = new IndexSpec();
|
||||||
|
private static final Boolean defaultBuildV9Directly = Boolean.FALSE;
|
||||||
|
|
||||||
// Might make sense for this to be a builder
|
// Might make sense for this to be a builder
|
||||||
public static RealtimeTuningConfig makeDefaultTuningConfig()
|
public static RealtimeTuningConfig makeDefaultTuningConfig()
|
||||||
|
@ -59,7 +60,8 @@ public class RealtimeTuningConfig implements TuningConfig
|
||||||
defaultRejectionPolicyFactory,
|
defaultRejectionPolicyFactory,
|
||||||
defaultMaxPendingPersists,
|
defaultMaxPendingPersists,
|
||||||
defaultShardSpec,
|
defaultShardSpec,
|
||||||
defaultIndexSpec
|
defaultIndexSpec,
|
||||||
|
defaultBuildV9Directly
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -72,6 +74,7 @@ public class RealtimeTuningConfig implements TuningConfig
|
||||||
private final int maxPendingPersists;
|
private final int maxPendingPersists;
|
||||||
private final ShardSpec shardSpec;
|
private final ShardSpec shardSpec;
|
||||||
private final IndexSpec indexSpec;
|
private final IndexSpec indexSpec;
|
||||||
|
private final Boolean buildV9Directly;
|
||||||
|
|
||||||
@JsonCreator
|
@JsonCreator
|
||||||
public RealtimeTuningConfig(
|
public RealtimeTuningConfig(
|
||||||
|
@ -83,7 +86,8 @@ public class RealtimeTuningConfig implements TuningConfig
|
||||||
@JsonProperty("rejectionPolicy") RejectionPolicyFactory rejectionPolicyFactory,
|
@JsonProperty("rejectionPolicy") RejectionPolicyFactory rejectionPolicyFactory,
|
||||||
@JsonProperty("maxPendingPersists") Integer maxPendingPersists,
|
@JsonProperty("maxPendingPersists") Integer maxPendingPersists,
|
||||||
@JsonProperty("shardSpec") ShardSpec shardSpec,
|
@JsonProperty("shardSpec") ShardSpec shardSpec,
|
||||||
@JsonProperty("indexSpec") IndexSpec indexSpec
|
@JsonProperty("indexSpec") IndexSpec indexSpec,
|
||||||
|
@JsonProperty("buildV9Directly") Boolean buildV9Directly
|
||||||
)
|
)
|
||||||
{
|
{
|
||||||
this.maxRowsInMemory = maxRowsInMemory == null ? defaultMaxRowsInMemory : maxRowsInMemory;
|
this.maxRowsInMemory = maxRowsInMemory == null ? defaultMaxRowsInMemory : maxRowsInMemory;
|
||||||
|
@ -99,6 +103,7 @@ public class RealtimeTuningConfig implements TuningConfig
|
||||||
this.maxPendingPersists = maxPendingPersists == null ? defaultMaxPendingPersists : maxPendingPersists;
|
this.maxPendingPersists = maxPendingPersists == null ? defaultMaxPendingPersists : maxPendingPersists;
|
||||||
this.shardSpec = shardSpec == null ? defaultShardSpec : shardSpec;
|
this.shardSpec = shardSpec == null ? defaultShardSpec : shardSpec;
|
||||||
this.indexSpec = indexSpec == null ? defaultIndexSpec : indexSpec;
|
this.indexSpec = indexSpec == null ? defaultIndexSpec : indexSpec;
|
||||||
|
this.buildV9Directly = buildV9Directly == null ? defaultBuildV9Directly : buildV9Directly;
|
||||||
}
|
}
|
||||||
|
|
||||||
@JsonProperty
|
@JsonProperty
|
||||||
|
@ -155,6 +160,11 @@ public class RealtimeTuningConfig implements TuningConfig
|
||||||
return indexSpec;
|
return indexSpec;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@JsonProperty
|
||||||
|
public Boolean getBuildV9Directly() {
|
||||||
|
return buildV9Directly;
|
||||||
|
}
|
||||||
|
|
||||||
public RealtimeTuningConfig withVersioningPolicy(VersioningPolicy policy)
|
public RealtimeTuningConfig withVersioningPolicy(VersioningPolicy policy)
|
||||||
{
|
{
|
||||||
return new RealtimeTuningConfig(
|
return new RealtimeTuningConfig(
|
||||||
|
@ -166,7 +176,8 @@ public class RealtimeTuningConfig implements TuningConfig
|
||||||
rejectionPolicyFactory,
|
rejectionPolicyFactory,
|
||||||
maxPendingPersists,
|
maxPendingPersists,
|
||||||
shardSpec,
|
shardSpec,
|
||||||
indexSpec
|
indexSpec,
|
||||||
|
buildV9Directly
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -181,7 +192,8 @@ public class RealtimeTuningConfig implements TuningConfig
|
||||||
rejectionPolicyFactory,
|
rejectionPolicyFactory,
|
||||||
maxPendingPersists,
|
maxPendingPersists,
|
||||||
shardSpec,
|
shardSpec,
|
||||||
indexSpec
|
indexSpec,
|
||||||
|
buildV9Directly
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -116,7 +116,7 @@ public class FireDepartmentTest
|
||||||
null
|
null
|
||||||
),
|
),
|
||||||
new RealtimeTuningConfig(
|
new RealtimeTuningConfig(
|
||||||
null, null, null, null, null, null, null, null, null
|
null, null, null, null, null, null, null, null, null, null
|
||||||
)
|
)
|
||||||
);
|
);
|
||||||
|
|
||||||
|
|
|
@ -150,6 +150,7 @@ public class RealtimeManagerTest
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
);
|
);
|
||||||
plumber = new TestPlumber(new Sink(new Interval("0/P5000Y"), schema, tuningConfig, new DateTime().toString()));
|
plumber = new TestPlumber(new Sink(new Interval("0/P5000Y"), schema, tuningConfig, new DateTime().toString()));
|
||||||
|
|
|
@ -185,6 +185,7 @@ public class RealtimePlumberSchoolTest
|
||||||
rejectionPolicy,
|
rejectionPolicy,
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
);
|
);
|
||||||
|
|
||||||
|
|
|
@ -66,6 +66,7 @@ public class SinkTest
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
null,
|
null,
|
||||||
|
null,
|
||||||
null
|
null
|
||||||
);
|
);
|
||||||
final Sink sink = new Sink(interval, schema, tuningConfig, version);
|
final Sink sink = new Sink(interval, schema, tuningConfig, version);
|
||||||
|
|
Loading…
Reference in New Issue