mirror of https://github.com/apache/druid.git
Merge pull request #1192 from metamx/fix-bad-rebase
fix file missing from previous PR rebase
This commit is contained in:
commit
75e92fd4dc
|
@ -0,0 +1,136 @@
|
|||
/*
|
||||
* Licensed to Metamarkets Group Inc. (Metamarkets) under one
|
||||
* or more contributor license agreements. See the NOTICE file
|
||||
* distributed with this work for additional information
|
||||
* regarding copyright ownership. Metamarkets licenses this file
|
||||
* to you under the Apache License, Version 2.0 (the
|
||||
* "License"); you may not use this file except in compliance
|
||||
* with the License. You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing,
|
||||
* software distributed under the License is distributed on an
|
||||
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
||||
* KIND, either express or implied. See the License for the
|
||||
* specific language governing permissions and limitations
|
||||
* under the License.
|
||||
*/
|
||||
|
||||
package io.druid.segment;
|
||||
|
||||
import com.google.common.collect.Iterators;
|
||||
import com.google.common.collect.Maps;
|
||||
import io.druid.query.extraction.ExtractionFn;
|
||||
import io.druid.segment.data.IndexedInts;
|
||||
|
||||
import java.util.Iterator;
|
||||
import java.util.Map;
|
||||
|
||||
public class SingleScanTimeDimSelector implements DimensionSelector
|
||||
{
|
||||
private final ExtractionFn extractionFn;
|
||||
private final LongColumnSelector selector;
|
||||
|
||||
private final Map<Integer, String> timeValues = Maps.newHashMap();
|
||||
private String currentValue = null;
|
||||
private long currentTimestamp = Long.MIN_VALUE;
|
||||
private int index = -1;
|
||||
|
||||
|
||||
// Use a special DimSelector for projected time columns
|
||||
// - it assumes time values are scanned once and values are grouped together
|
||||
// (i.e. we never revisit a timestamp we have seen before, unless it is the same as the last accessed one)
|
||||
// - it also applies and caches extraction function values at the DimSelector level to speed things up
|
||||
public SingleScanTimeDimSelector(LongColumnSelector selector, ExtractionFn extractionFn)
|
||||
{
|
||||
if (extractionFn == null) {
|
||||
throw new UnsupportedOperationException("time dimension must provide an extraction function");
|
||||
}
|
||||
|
||||
this.extractionFn = extractionFn;
|
||||
this.selector = selector;
|
||||
}
|
||||
|
||||
@Override
|
||||
public IndexedInts getRow()
|
||||
{
|
||||
// if this the first timestamp, apply and cache extraction function result
|
||||
final long timestamp = selector.get();
|
||||
if (index < 0) {
|
||||
currentTimestamp = timestamp;
|
||||
currentValue = extractionFn.apply(timestamp);
|
||||
++index;
|
||||
timeValues.put(index, currentValue);
|
||||
}
|
||||
// if this is a new timestamp, apply and cache extraction function result
|
||||
// since timestamps are assumed grouped and scanned once, we only need to
|
||||
// check if the current timestamp is different than the current timestamp.
|
||||
//
|
||||
// If this new timestamp is mapped to the same value by the extraction function,
|
||||
// we can also avoid creating a dimension value and corresponding index
|
||||
// and use the current one
|
||||
else if (timestamp != currentTimestamp) {
|
||||
if(timestamp < currentTimestamp) {
|
||||
// re-using this selector for multiple scans would cause the same rows to return different IDs
|
||||
// we might want to re-visit if we ever need to do multiple scans with this dimension selector
|
||||
throw new IllegalStateException("cannot re-use time dimension selector for multiple scans");
|
||||
}
|
||||
currentTimestamp = timestamp;
|
||||
final String value = extractionFn.apply(timestamp);
|
||||
if (!value.equals(currentValue)) {
|
||||
currentValue = value;
|
||||
++index;
|
||||
timeValues.put(index, currentValue);
|
||||
}
|
||||
// Note: this could be further optimized by checking if the new value is one we have
|
||||
// previously seen, but would require keeping track of both the current and the maximum index
|
||||
}
|
||||
// otherwise, if the current timestamp is the same as the previous timestamp,
|
||||
// keep using the same dimension value index
|
||||
|
||||
final int dimensionValueIndex = index;
|
||||
return new IndexedInts()
|
||||
{
|
||||
@Override
|
||||
public int size()
|
||||
{
|
||||
return 1;
|
||||
}
|
||||
|
||||
@Override
|
||||
public int get(int i)
|
||||
{
|
||||
return dimensionValueIndex;
|
||||
}
|
||||
|
||||
@Override
|
||||
public Iterator<Integer> iterator()
|
||||
{
|
||||
return Iterators.singletonIterator(dimensionValueIndex);
|
||||
}
|
||||
};
|
||||
}
|
||||
|
||||
@Override
|
||||
public int getValueCardinality()
|
||||
{
|
||||
return Integer.MAX_VALUE;
|
||||
}
|
||||
|
||||
@Override
|
||||
public String lookupName(int id)
|
||||
{
|
||||
if (id == index) {
|
||||
return currentValue;
|
||||
} else {
|
||||
return timeValues.get(id);
|
||||
}
|
||||
}
|
||||
|
||||
@Override
|
||||
public int lookupId(String name)
|
||||
{
|
||||
throw new UnsupportedOperationException("time column does not support lookups");
|
||||
}
|
||||
}
|
Loading…
Reference in New Issue