HBASE-11144 Filter to support scanning multiple row key ranges (Jiajia Li)
This commit is contained in:
parent
40e9c22ea2
commit
b79dbedad6
|
@ -0,0 +1,508 @@
|
|||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one
|
||||
* or more contributor license agreements. See the NOTICE file
|
||||
* distributed with this work for additional information
|
||||
* regarding copyright ownership. The ASF licenses this file
|
||||
* to you under the Apache License, Version 2.0 (the
|
||||
* "License"); you may not use this file except in compliance
|
||||
* with the License. You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
package org.apache.hadoop.hbase.filter;
|
||||
|
||||
import java.io.IOException;
|
||||
import java.util.ArrayList;
|
||||
import java.util.Collections;
|
||||
import java.util.List;
|
||||
|
||||
import org.apache.hadoop.hbase.classification.InterfaceAudience;
|
||||
import org.apache.hadoop.hbase.classification.InterfaceStability;
|
||||
import org.apache.hadoop.hbase.Cell;
|
||||
import org.apache.hadoop.hbase.HConstants;
|
||||
import org.apache.hadoop.hbase.KeyValueUtil;
|
||||
import org.apache.hadoop.hbase.exceptions.DeserializationException;
|
||||
import org.apache.hadoop.hbase.protobuf.generated.FilterProtos;
|
||||
import org.apache.hadoop.hbase.util.Bytes;
|
||||
|
||||
import com.google.protobuf.HBaseZeroCopyByteString;
|
||||
import com.google.protobuf.InvalidProtocolBufferException;
|
||||
|
||||
/**
|
||||
* Filter to support scan multiple row key ranges. It can construct the row key ranges from the
|
||||
* passed list which can be accessed by each region server.
|
||||
*
|
||||
* HBase is quite efficient when scanning only one small row key range. If user needs to specify
|
||||
* multiple row key ranges in one scan, the typical solutions are: 1. through FilterList which is a
|
||||
* list of row key Filters, 2. using the SQL layer over HBase to join with two table, such as hive,
|
||||
* phoenix etc. However, both solutions are inefficient. Both of them can't utilize the range info
|
||||
* to perform fast forwarding during scan which is quite time consuming. If the number of ranges
|
||||
* are quite big (e.g. millions), join is a proper solution though it is slow. However, there are
|
||||
* cases that user wants to specify a small number of ranges to scan (e.g. <1000 ranges). Both
|
||||
* solutions can't provide satisfactory performance in such case. MultiRowRangeFilter is to support
|
||||
* such usec ase (scan multiple row key ranges), which can construct the row key ranges from user
|
||||
* specified list and perform fast-forwarding during scan. Thus, the scan will be quite efficient.
|
||||
*/
|
||||
@InterfaceAudience.Public
|
||||
@InterfaceStability.Evolving
|
||||
public class MultiRowRangeFilter extends FilterBase {
|
||||
|
||||
private List<RowRange> rangeList;
|
||||
|
||||
private static final int ROW_BEFORE_FIRST_RANGE = -1;
|
||||
private boolean EXCLUSIVE = false;
|
||||
private boolean done = false;
|
||||
private boolean initialized = false;
|
||||
private int index;
|
||||
private RowRange range;
|
||||
private ReturnCode currentReturnCode;
|
||||
|
||||
/**
|
||||
* @param list A list of <code>RowRange</code>
|
||||
* @throws java.io.IOException
|
||||
* throw an exception if the range list is not in an natural order or any
|
||||
* <code>RowRange</code> is invalid
|
||||
*/
|
||||
public MultiRowRangeFilter(List<RowRange> list) throws IOException {
|
||||
this.rangeList = sortAndMerge(list);
|
||||
}
|
||||
|
||||
@Override
|
||||
public boolean filterAllRemaining() {
|
||||
return done;
|
||||
}
|
||||
|
||||
public List<RowRange> getRowRanges() {
|
||||
return this.rangeList;
|
||||
}
|
||||
|
||||
@Override
|
||||
public boolean filterRowKey(byte[] buffer, int offset, int length) {
|
||||
// If it is the first time of running, calculate the current range index for
|
||||
// the row key. If index is out of bound which happens when the start row
|
||||
// user sets is after the largest stop row of the ranges, stop the scan.
|
||||
// If row key is after the current range, find the next range and update index.
|
||||
if (!initialized || !range.contains(buffer, offset, length)) {
|
||||
byte[] rowkey = new byte[length];
|
||||
System.arraycopy(buffer, offset, rowkey, 0, length);
|
||||
index = getNextRangeIndex(rowkey);
|
||||
if (index >= rangeList.size()) {
|
||||
done = true;
|
||||
currentReturnCode = ReturnCode.NEXT_ROW;
|
||||
return false;
|
||||
}
|
||||
if(index != ROW_BEFORE_FIRST_RANGE) {
|
||||
range = rangeList.get(index);
|
||||
} else {
|
||||
range = rangeList.get(0);
|
||||
}
|
||||
if(EXCLUSIVE) {
|
||||
EXCLUSIVE = false;
|
||||
currentReturnCode = ReturnCode.NEXT_ROW;
|
||||
return false;
|
||||
}
|
||||
if (!initialized) {
|
||||
if(index != ROW_BEFORE_FIRST_RANGE) {
|
||||
currentReturnCode = ReturnCode.INCLUDE;
|
||||
} else {
|
||||
currentReturnCode = ReturnCode.SEEK_NEXT_USING_HINT;
|
||||
}
|
||||
initialized = true;
|
||||
} else {
|
||||
currentReturnCode = ReturnCode.SEEK_NEXT_USING_HINT;
|
||||
}
|
||||
} else {
|
||||
currentReturnCode = ReturnCode.INCLUDE;
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
@Override
|
||||
public ReturnCode filterKeyValue(Cell ignored) {
|
||||
return currentReturnCode;
|
||||
}
|
||||
|
||||
@Override
|
||||
public Cell getNextCellHint(Cell currentKV) {
|
||||
// skip to the next range's start row
|
||||
return KeyValueUtil.createFirstOnRow(range.startRow);
|
||||
}
|
||||
|
||||
/**
|
||||
* @return The filter serialized using pb
|
||||
*/
|
||||
public byte[] toByteArray() {
|
||||
FilterProtos.MultiRowRangeFilter.Builder builder = FilterProtos.MultiRowRangeFilter
|
||||
.newBuilder();
|
||||
for (RowRange range : rangeList) {
|
||||
if (range != null) {
|
||||
FilterProtos.RowRange.Builder rangebuilder = FilterProtos.RowRange.newBuilder();
|
||||
if (range.startRow != null)
|
||||
rangebuilder.setStartRow(HBaseZeroCopyByteString.wrap(range.startRow));
|
||||
rangebuilder.setStartRowInclusive(range.startRowInclusive);
|
||||
if (range.stopRow != null)
|
||||
rangebuilder.setStopRow(HBaseZeroCopyByteString.wrap(range.stopRow));
|
||||
rangebuilder.setStopRowInclusive(range.stopRowInclusive);
|
||||
range.isScan = Bytes.equals(range.startRow, range.stopRow) ? 1 : 0;
|
||||
builder.addRowRangeList(rangebuilder.build());
|
||||
}
|
||||
}
|
||||
return builder.build().toByteArray();
|
||||
}
|
||||
|
||||
/**
|
||||
* @param pbBytes A pb serialized instance
|
||||
* @return An instance of MultiRowRangeFilter
|
||||
* @throws org.apache.hadoop.hbase.exceptions.DeserializationException
|
||||
*/
|
||||
public static MultiRowRangeFilter parseFrom(final byte[] pbBytes)
|
||||
throws DeserializationException {
|
||||
FilterProtos.MultiRowRangeFilter proto;
|
||||
try {
|
||||
proto = FilterProtos.MultiRowRangeFilter.parseFrom(pbBytes);
|
||||
} catch (InvalidProtocolBufferException e) {
|
||||
throw new DeserializationException(e);
|
||||
}
|
||||
int length = proto.getRowRangeListCount();
|
||||
List<FilterProtos.RowRange> rangeProtos = proto.getRowRangeListList();
|
||||
List<RowRange> rangeList = new ArrayList<RowRange>(length);
|
||||
for (FilterProtos.RowRange rangeProto : rangeProtos) {
|
||||
RowRange range = new RowRange(rangeProto.hasStartRow() ? rangeProto.getStartRow()
|
||||
.toByteArray() : null, rangeProto.getStartRowInclusive(), rangeProto.hasStopRow() ?
|
||||
rangeProto.getStopRow().toByteArray() : null, rangeProto.getStopRowInclusive());
|
||||
rangeList.add(range);
|
||||
}
|
||||
try {
|
||||
return new MultiRowRangeFilter(rangeList);
|
||||
} catch (IOException e) {
|
||||
throw new DeserializationException("Fail to instantiate the MultiRowRangeFilter", e);
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* @param o the filter to compare
|
||||
* @return true if and only if the fields of the filter that are serialized are equal to the
|
||||
* corresponding fields in other. Used for testing.
|
||||
*/
|
||||
boolean areSerializedFieldsEqual(Filter o) {
|
||||
if (o == this)
|
||||
return true;
|
||||
if (!(o instanceof MultiRowRangeFilter))
|
||||
return false;
|
||||
|
||||
MultiRowRangeFilter other = (MultiRowRangeFilter) o;
|
||||
if (this.rangeList.size() != other.rangeList.size())
|
||||
return false;
|
||||
for (int i = 0; i < rangeList.size(); ++i) {
|
||||
RowRange thisRange = this.rangeList.get(i);
|
||||
RowRange otherRange = other.rangeList.get(i);
|
||||
if (!(Bytes.equals(thisRange.startRow, otherRange.startRow) && Bytes.equals(
|
||||
thisRange.stopRow, otherRange.stopRow) && (thisRange.startRowInclusive ==
|
||||
otherRange.startRowInclusive) && (thisRange.stopRowInclusive ==
|
||||
otherRange.stopRowInclusive))) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
/**
|
||||
* calculate the position where the row key in the ranges list.
|
||||
*
|
||||
* @param rowKey the row key to calculate
|
||||
* @return index the position of the row key
|
||||
*/
|
||||
private int getNextRangeIndex(byte[] rowKey) {
|
||||
RowRange temp = new RowRange(rowKey, true, null, true);
|
||||
int index = Collections.binarySearch(rangeList, temp);
|
||||
if (index < 0) {
|
||||
int insertionPosition = -index - 1;
|
||||
// check if the row key in the range before the insertion position
|
||||
if (insertionPosition != 0 && rangeList.get(insertionPosition - 1).contains(rowKey)) {
|
||||
return insertionPosition - 1;
|
||||
}
|
||||
// check if the row key is before the first range
|
||||
if (insertionPosition == 0 && !rangeList.get(insertionPosition).contains(rowKey)) {
|
||||
return ROW_BEFORE_FIRST_RANGE;
|
||||
}
|
||||
return insertionPosition;
|
||||
}
|
||||
// the row key equals one of the start keys, and the the range exclude the start key
|
||||
if(rangeList.get(index).startRowInclusive == false) {
|
||||
EXCLUSIVE = true;
|
||||
}
|
||||
return index;
|
||||
}
|
||||
|
||||
/**
|
||||
* sort the ranges and if the ranges with overlap, then merge them.
|
||||
*
|
||||
* @param ranges the list of ranges to sort and merge.
|
||||
* @return the ranges after sort and merge.
|
||||
*/
|
||||
public static List<RowRange> sortAndMerge(List<RowRange> ranges) {
|
||||
if (ranges.size() == 0) {
|
||||
throw new IllegalArgumentException("No ranges found.");
|
||||
}
|
||||
List<RowRange> invalidRanges = new ArrayList<RowRange>();
|
||||
List<RowRange> newRanges = new ArrayList<RowRange>(ranges.size());
|
||||
Collections.sort(ranges);
|
||||
if(ranges.get(0).isValid()) {
|
||||
if (ranges.size() == 1) {
|
||||
newRanges.add(ranges.get(0));
|
||||
}
|
||||
} else {
|
||||
invalidRanges.add(ranges.get(0));
|
||||
}
|
||||
|
||||
byte[] lastStartRow = ranges.get(0).startRow;
|
||||
boolean lastStartRowInclusive = ranges.get(0).startRowInclusive;
|
||||
byte[] lastStopRow = ranges.get(0).stopRow;
|
||||
boolean lastStopRowInclusive = ranges.get(0).stopRowInclusive;
|
||||
int i = 1;
|
||||
for (; i < ranges.size(); i++) {
|
||||
RowRange range = ranges.get(i);
|
||||
if (!range.isValid()) {
|
||||
invalidRanges.add(range);
|
||||
}
|
||||
if(Bytes.equals(lastStopRow, HConstants.EMPTY_BYTE_ARRAY)) {
|
||||
newRanges.add(new RowRange(lastStartRow, lastStartRowInclusive, lastStopRow,
|
||||
lastStopRowInclusive));
|
||||
break;
|
||||
}
|
||||
// with overlap in the ranges
|
||||
if ((Bytes.compareTo(lastStopRow, range.startRow) > 0) ||
|
||||
(Bytes.compareTo(lastStopRow, range.startRow) == 0 && !(lastStopRowInclusive == false &&
|
||||
range.isStartRowInclusive() == false))) {
|
||||
if(Bytes.equals(range.stopRow, HConstants.EMPTY_BYTE_ARRAY)) {
|
||||
newRanges.add(new RowRange(lastStartRow, lastStartRowInclusive, range.stopRow,
|
||||
range.stopRowInclusive));
|
||||
break;
|
||||
}
|
||||
// if first range contains second range, ignore the second range
|
||||
if (Bytes.compareTo(lastStopRow, range.stopRow) >= 0) {
|
||||
if((Bytes.compareTo(lastStopRow, range.stopRow) == 0)) {
|
||||
if(lastStopRowInclusive == true || range.stopRowInclusive == true) {
|
||||
lastStopRowInclusive = true;
|
||||
}
|
||||
}
|
||||
if ((i + 1) == ranges.size()) {
|
||||
newRanges.add(new RowRange(lastStartRow, lastStartRowInclusive, lastStopRow,
|
||||
lastStopRowInclusive));
|
||||
}
|
||||
} else {
|
||||
lastStopRow = range.stopRow;
|
||||
lastStopRowInclusive = range.stopRowInclusive;
|
||||
if ((i + 1) < ranges.size()) {
|
||||
i++;
|
||||
range = ranges.get(i);
|
||||
if (!range.isValid()) {
|
||||
invalidRanges.add(range);
|
||||
}
|
||||
} else {
|
||||
newRanges.add(new RowRange(lastStartRow, lastStartRowInclusive, lastStopRow,
|
||||
lastStopRowInclusive));
|
||||
break;
|
||||
}
|
||||
while ((Bytes.compareTo(lastStopRow, range.startRow) > 0) ||
|
||||
(Bytes.compareTo(lastStopRow, range.startRow) == 0 &&
|
||||
(lastStopRowInclusive == true || range.startRowInclusive==true))) {
|
||||
if(Bytes.equals(range.stopRow, HConstants.EMPTY_BYTE_ARRAY)) {
|
||||
break;
|
||||
}
|
||||
// if this first range contain second range, ignore the second range
|
||||
if (Bytes.compareTo(lastStopRow, range.stopRow) >= 0) {
|
||||
if(lastStopRowInclusive == true || range.stopRowInclusive == true) {
|
||||
lastStopRowInclusive = true;
|
||||
}
|
||||
i++;
|
||||
if (i < ranges.size()) {
|
||||
range = ranges.get(i);
|
||||
if (!range.isValid()) {
|
||||
invalidRanges.add(range);
|
||||
}
|
||||
} else {
|
||||
break;
|
||||
}
|
||||
} else {
|
||||
lastStopRow = range.stopRow;
|
||||
lastStopRowInclusive = range.stopRowInclusive;
|
||||
i++;
|
||||
if (i < ranges.size()) {
|
||||
range = ranges.get(i);
|
||||
if (!range.isValid()) {
|
||||
invalidRanges.add(range);
|
||||
}
|
||||
} else {
|
||||
break;
|
||||
}
|
||||
}
|
||||
}
|
||||
if(Bytes.equals(range.stopRow, HConstants.EMPTY_BYTE_ARRAY)) {
|
||||
if((Bytes.compareTo(lastStopRow, range.startRow) < 0) ||
|
||||
(Bytes.compareTo(lastStopRow, range.startRow) == 0 &&
|
||||
lastStopRowInclusive == false && range.startRowInclusive == false)) {
|
||||
newRanges.add(new RowRange(lastStartRow, lastStartRowInclusive, lastStopRow,
|
||||
lastStopRowInclusive));
|
||||
newRanges.add(range);
|
||||
} else {
|
||||
newRanges.add(new RowRange(lastStartRow, lastStartRowInclusive, range.stopRow,
|
||||
range.stopRowInclusive));
|
||||
break;
|
||||
}
|
||||
}
|
||||
newRanges.add(new RowRange(lastStartRow, lastStartRowInclusive, lastStopRow,
|
||||
lastStopRowInclusive));
|
||||
if ((i + 1) == ranges.size()) {
|
||||
newRanges.add(range);
|
||||
}
|
||||
lastStartRow = range.startRow;
|
||||
lastStartRowInclusive = range.startRowInclusive;
|
||||
lastStopRow = range.stopRow;
|
||||
lastStopRowInclusive = range.stopRowInclusive;
|
||||
}
|
||||
} else {
|
||||
newRanges.add(new RowRange(lastStartRow, lastStartRowInclusive, lastStopRow,
|
||||
lastStopRowInclusive));
|
||||
if ((i + 1) == ranges.size()) {
|
||||
newRanges.add(range);
|
||||
}
|
||||
lastStartRow = range.startRow;
|
||||
lastStartRowInclusive = range.startRowInclusive;
|
||||
lastStopRow = range.stopRow;
|
||||
lastStopRowInclusive = range.stopRowInclusive;
|
||||
}
|
||||
}
|
||||
// check the remaining ranges
|
||||
for(int j=i; j < ranges.size(); j++) {
|
||||
if(!ranges.get(j).isValid()) {
|
||||
invalidRanges.add(ranges.get(j));
|
||||
}
|
||||
}
|
||||
// if invalid range exists, throw the exception
|
||||
if (invalidRanges.size() != 0) {
|
||||
throwExceptionForInvalidRanges(invalidRanges, true);
|
||||
}
|
||||
// If no valid ranges found, throw the exception
|
||||
if(newRanges.size() == 0) {
|
||||
throw new IllegalArgumentException("No valid ranges found.");
|
||||
}
|
||||
return newRanges;
|
||||
}
|
||||
|
||||
private static void throwExceptionForInvalidRanges(List<RowRange> invalidRanges,
|
||||
boolean details) {
|
||||
StringBuilder sb = new StringBuilder();
|
||||
sb.append(invalidRanges.size()).append(" invaild ranges.\n");
|
||||
if (details) {
|
||||
for (RowRange range : invalidRanges) {
|
||||
sb.append(
|
||||
"Invalid range: start row => " + Bytes.toString(range.startRow) + ", stop row => "
|
||||
+ Bytes.toString(range.stopRow)).append('\n');
|
||||
}
|
||||
}
|
||||
throw new IllegalArgumentException(sb.toString());
|
||||
}
|
||||
|
||||
@InterfaceAudience.Public
|
||||
@InterfaceStability.Evolving
|
||||
public static class RowRange implements Comparable<RowRange> {
|
||||
private byte[] startRow;
|
||||
private boolean startRowInclusive = true;
|
||||
private byte[] stopRow;
|
||||
private boolean stopRowInclusive = false;
|
||||
private int isScan = 0;
|
||||
|
||||
public RowRange() {
|
||||
}
|
||||
/**
|
||||
* If the startRow is empty or null, set it to HConstants.EMPTY_BYTE_ARRAY, means begin at the
|
||||
* start row of the table. If the stopRow is empty or null, set it to
|
||||
* HConstants.EMPTY_BYTE_ARRAY, means end of the last row of table.
|
||||
*/
|
||||
public RowRange(String startRow, boolean startRowInclusive, String stopRow,
|
||||
boolean stopRowInclusive) {
|
||||
this((startRow == null || startRow.isEmpty()) ? HConstants.EMPTY_BYTE_ARRAY :
|
||||
Bytes.toBytes(startRow), startRowInclusive,
|
||||
(stopRow == null || stopRow.isEmpty()) ? HConstants.EMPTY_BYTE_ARRAY :
|
||||
Bytes.toBytes(stopRow), stopRowInclusive);
|
||||
}
|
||||
|
||||
public RowRange(byte[] startRow, boolean startRowInclusive, byte[] stopRow,
|
||||
boolean stopRowInclusive) {
|
||||
this.startRow = (startRow == null) ? HConstants.EMPTY_BYTE_ARRAY : startRow;
|
||||
this.startRowInclusive = startRowInclusive;
|
||||
this.stopRow = (stopRow == null) ? HConstants.EMPTY_BYTE_ARRAY :stopRow;
|
||||
this.stopRowInclusive = stopRowInclusive;
|
||||
isScan = Bytes.equals(startRow, stopRow) ? 1 : 0;
|
||||
}
|
||||
|
||||
public byte[] getStartRow() {
|
||||
return startRow;
|
||||
}
|
||||
|
||||
public byte[] getStopRow() {
|
||||
return stopRow;
|
||||
}
|
||||
|
||||
/**
|
||||
* @return if start row is inclusive.
|
||||
*/
|
||||
public boolean isStartRowInclusive() {
|
||||
return startRowInclusive;
|
||||
}
|
||||
|
||||
/**
|
||||
* @return if stop row is inclusive.
|
||||
*/
|
||||
public boolean isStopRowInclusive() {
|
||||
return stopRowInclusive;
|
||||
}
|
||||
|
||||
public boolean contains(byte[] row) {
|
||||
return contains(row, 0, row.length);
|
||||
}
|
||||
|
||||
public boolean contains(byte[] buffer, int offset, int length) {
|
||||
if(startRowInclusive) {
|
||||
if(stopRowInclusive) {
|
||||
return Bytes.compareTo(buffer, offset, length, startRow, 0, startRow.length) >= 0
|
||||
&& (Bytes.equals(stopRow, HConstants.EMPTY_BYTE_ARRAY) ||
|
||||
Bytes.compareTo(buffer, offset, length, stopRow, 0, stopRow.length) <= isScan);
|
||||
} else {
|
||||
return Bytes.compareTo(buffer, offset, length, startRow, 0, startRow.length) >= 0
|
||||
&& (Bytes.equals(stopRow, HConstants.EMPTY_BYTE_ARRAY) ||
|
||||
Bytes.compareTo(buffer, offset, length, stopRow, 0, stopRow.length) < isScan);
|
||||
}
|
||||
} else {
|
||||
if(stopRowInclusive) {
|
||||
return Bytes.compareTo(buffer, offset, length, startRow, 0, startRow.length) > 0
|
||||
&& (Bytes.equals(stopRow, HConstants.EMPTY_BYTE_ARRAY) ||
|
||||
Bytes.compareTo(buffer, offset, length, stopRow, 0, stopRow.length) <= isScan);
|
||||
} else {
|
||||
return Bytes.compareTo(buffer, offset, length, startRow, 0, startRow.length) > 0
|
||||
&& (Bytes.equals(stopRow, HConstants.EMPTY_BYTE_ARRAY) ||
|
||||
Bytes.compareTo(buffer, offset, length, stopRow, 0, stopRow.length) < isScan);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
@Override
|
||||
public int compareTo(RowRange other) {
|
||||
return Bytes.compareTo(this.startRow, other.startRow);
|
||||
}
|
||||
|
||||
public boolean isValid() {
|
||||
return Bytes.equals(startRow, HConstants.EMPTY_BYTE_ARRAY)
|
||||
|| Bytes.equals(stopRow, HConstants.EMPTY_BYTE_ARRAY)
|
||||
|| Bytes.compareTo(startRow, stopRow) < 0
|
||||
|| (Bytes.compareTo(startRow, stopRow) == 0 && stopRowInclusive == true);
|
||||
}
|
||||
}
|
||||
}
|
File diff suppressed because it is too large
Load Diff
|
@ -155,4 +155,15 @@ message WhileMatchFilter {
|
|||
required Filter filter = 1;
|
||||
}
|
||||
message FilterAllFilter {
|
||||
}
|
||||
|
||||
message RowRange {
|
||||
optional bytes start_row = 1;
|
||||
optional bool start_row_inclusive = 2;
|
||||
optional bytes stop_row = 3;
|
||||
optional bool stop_row_inclusive =4;
|
||||
}
|
||||
|
||||
message MultiRowRangeFilter {
|
||||
repeated RowRange row_range_list = 1;
|
||||
}
|
|
@ -32,8 +32,8 @@ import javax.xml.bind.annotation.XmlAttribute;
|
|||
import javax.xml.bind.annotation.XmlElement;
|
||||
import javax.xml.bind.annotation.XmlRootElement;
|
||||
|
||||
import org.apache.hadoop.hbase.classification.InterfaceAudience;
|
||||
import org.apache.hadoop.hbase.HConstants;
|
||||
import org.apache.hadoop.hbase.classification.InterfaceAudience;
|
||||
import org.apache.hadoop.hbase.client.Scan;
|
||||
import org.apache.hadoop.hbase.filter.BinaryComparator;
|
||||
import org.apache.hadoop.hbase.filter.BinaryPrefixComparator;
|
||||
|
@ -52,6 +52,8 @@ import org.apache.hadoop.hbase.filter.FilterList;
|
|||
import org.apache.hadoop.hbase.filter.FirstKeyOnlyFilter;
|
||||
import org.apache.hadoop.hbase.filter.InclusiveStopFilter;
|
||||
import org.apache.hadoop.hbase.filter.KeyOnlyFilter;
|
||||
import org.apache.hadoop.hbase.filter.MultiRowRangeFilter;
|
||||
import org.apache.hadoop.hbase.filter.MultiRowRangeFilter.RowRange;
|
||||
import org.apache.hadoop.hbase.filter.MultipleColumnPrefixFilter;
|
||||
import org.apache.hadoop.hbase.filter.NullComparator;
|
||||
import org.apache.hadoop.hbase.filter.PageFilter;
|
||||
|
@ -212,6 +214,7 @@ public class ScannerModel implements ProtobufMessageHandler, Serializable {
|
|||
@XmlAttribute public Boolean dropDependentColumn;
|
||||
@XmlAttribute public Float chance;
|
||||
@XmlElement public List<String> prefixes;
|
||||
@XmlElement private List<RowRange> ranges;
|
||||
@XmlElement public List<Long> timestamps;
|
||||
|
||||
static enum FilterType {
|
||||
|
@ -226,6 +229,7 @@ public class ScannerModel implements ProtobufMessageHandler, Serializable {
|
|||
InclusiveStopFilter,
|
||||
KeyOnlyFilter,
|
||||
MultipleColumnPrefixFilter,
|
||||
MultiRowRangeFilter,
|
||||
PageFilter,
|
||||
PrefixFilter,
|
||||
QualifierFilter,
|
||||
|
@ -293,6 +297,13 @@ public class ScannerModel implements ProtobufMessageHandler, Serializable {
|
|||
this.prefixes.add(Base64.encodeBytes(prefix));
|
||||
}
|
||||
break;
|
||||
case MultiRowRangeFilter:
|
||||
this.ranges = new ArrayList<RowRange>();
|
||||
for(RowRange range : ((MultiRowRangeFilter)filter).getRowRanges()) {
|
||||
this.ranges.add(new RowRange(range.getStartRow(), range.isStartRowInclusive(),
|
||||
range.getStopRow(), range.isStopRowInclusive()));
|
||||
}
|
||||
break;
|
||||
case PageFilter:
|
||||
this.value = Long.toString(((PageFilter)filter).getPageSize());
|
||||
break;
|
||||
|
@ -394,6 +405,13 @@ public class ScannerModel implements ProtobufMessageHandler, Serializable {
|
|||
}
|
||||
filter = new MultipleColumnPrefixFilter(values);
|
||||
} break;
|
||||
case MultiRowRangeFilter: {
|
||||
try {
|
||||
filter = new MultiRowRangeFilter(ranges);
|
||||
} catch (IOException e) {
|
||||
throw new RuntimeException(e);
|
||||
}
|
||||
} break;
|
||||
case PageFilter:
|
||||
filter = new PageFilter(Long.valueOf(value));
|
||||
break;
|
||||
|
|
|
@ -21,11 +21,14 @@ package org.apache.hadoop.hbase.filter;
|
|||
|
||||
import static org.junit.Assert.assertTrue;
|
||||
|
||||
import java.util.ArrayList;
|
||||
import java.util.LinkedList;
|
||||
import java.util.List;
|
||||
import java.util.TreeSet;
|
||||
|
||||
import org.apache.hadoop.hbase.testclassification.SmallTests;
|
||||
import org.apache.hadoop.hbase.filter.CompareFilter.CompareOp;
|
||||
import org.apache.hadoop.hbase.filter.MultiRowRangeFilter.RowRange;
|
||||
import org.apache.hadoop.hbase.protobuf.ProtobufUtil;
|
||||
import org.apache.hadoop.hbase.util.Bytes;
|
||||
import org.apache.hadoop.hbase.util.Pair;
|
||||
|
@ -319,4 +322,16 @@ public class TestFilterSerialization {
|
|||
ProtobufUtil.toFilter(ProtobufUtil.toFilter(whileMatchFilter))));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeFilter() throws Exception {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(40), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(60), true, Bytes.toBytes(70), false));
|
||||
|
||||
MultiRowRangeFilter multiRowRangeFilter =
|
||||
new MultiRowRangeFilter(ranges);
|
||||
assertTrue(multiRowRangeFilter.areSerializedFieldsEqual(
|
||||
ProtobufUtil.toFilter(ProtobufUtil.toFilter(multiRowRangeFilter))));
|
||||
}
|
||||
}
|
||||
|
|
|
@ -0,0 +1,465 @@
|
|||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one
|
||||
* or more contributor license agreements. See the NOTICE file
|
||||
* distributed with this work for additional information
|
||||
* regarding copyright ownership. The ASF licenses this file
|
||||
* to you under the Apache License, Version 2.0 (the
|
||||
* "License"); you may not use this file except in compliance
|
||||
* with the License. You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
package org.apache.hadoop.hbase.filter;
|
||||
|
||||
import static org.junit.Assert.assertEquals;
|
||||
|
||||
import java.io.IOException;
|
||||
import java.util.ArrayList;
|
||||
import java.util.List;
|
||||
|
||||
import org.apache.commons.logging.Log;
|
||||
import org.apache.commons.logging.LogFactory;
|
||||
import org.apache.hadoop.hbase.Cell;
|
||||
import org.apache.hadoop.hbase.HBaseTestingUtility;
|
||||
import org.apache.hadoop.hbase.client.HTable;
|
||||
import org.apache.hadoop.hbase.client.Put;
|
||||
import org.apache.hadoop.hbase.client.Result;
|
||||
import org.apache.hadoop.hbase.client.ResultScanner;
|
||||
import org.apache.hadoop.hbase.client.Scan;
|
||||
import org.apache.hadoop.hbase.filter.MultiRowRangeFilter.RowRange;
|
||||
import org.apache.hadoop.hbase.testclassification.MediumTests;
|
||||
import org.apache.hadoop.hbase.util.Bytes;
|
||||
import org.junit.AfterClass;
|
||||
import org.junit.Assert;
|
||||
import org.junit.BeforeClass;
|
||||
import org.junit.Test;
|
||||
import org.junit.experimental.categories.Category;
|
||||
|
||||
@Category(MediumTests.class)
|
||||
public class TestMultiRowRangeFilter {
|
||||
|
||||
private final static HBaseTestingUtility TEST_UTIL = new HBaseTestingUtility();
|
||||
private final Log LOG = LogFactory.getLog(this.getClass());
|
||||
private byte[] family = Bytes.toBytes("family");
|
||||
private byte[] qf = Bytes.toBytes("qf");
|
||||
private byte[] value = Bytes.toBytes("val");
|
||||
private byte[] tableName;
|
||||
private int numRows = 100;
|
||||
|
||||
/**
|
||||
* @throws Exception
|
||||
*/
|
||||
@BeforeClass
|
||||
public static void setUpBeforeClass() throws Exception {
|
||||
TEST_UTIL.startMiniCluster();
|
||||
}
|
||||
|
||||
/**
|
||||
* @throws Exception
|
||||
*/
|
||||
@AfterClass
|
||||
public static void tearDownAfterClass() throws Exception {
|
||||
TEST_UTIL.shutdownMiniCluster();
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMergeAndSortWithEmptyStartRow() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(""), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(15), true, Bytes.toBytes(40), false));
|
||||
List<RowRange> actualRanges = MultiRowRangeFilter.sortAndMerge(ranges);
|
||||
List<RowRange> expectedRanges = new ArrayList<RowRange>();
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(""), true, Bytes.toBytes(40), false));
|
||||
assertRangesEqual(expectedRanges, actualRanges);
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMergeAndSortWithEmptyStopRow() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(15), true, Bytes.toBytes(""), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(70), false));
|
||||
List<RowRange> actualRanges = MultiRowRangeFilter.sortAndMerge(ranges);
|
||||
List<RowRange> expectedRanges = new ArrayList<RowRange>();
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(""), false));
|
||||
assertRangesEqual(expectedRanges, actualRanges);
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMergeAndSortWithEmptyStartRowAndStopRow() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(""), true, Bytes.toBytes(""), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(70), false));
|
||||
List<RowRange> actualRanges = MultiRowRangeFilter.sortAndMerge(ranges);
|
||||
List<RowRange> expectedRanges = new ArrayList<RowRange>();
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(""), true, Bytes.toBytes(""), false));
|
||||
assertRangesEqual(expectedRanges, actualRanges);
|
||||
}
|
||||
|
||||
@Test(expected=IllegalArgumentException.class)
|
||||
public void testMultiRowRangeWithoutRange() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
new MultiRowRangeFilter(ranges);
|
||||
}
|
||||
|
||||
@Test(expected=IllegalArgumentException.class)
|
||||
public void testMultiRowRangeWithInvalidRange() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
// the start row larger than the stop row
|
||||
ranges.add(new RowRange(Bytes.toBytes(80), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(70), false));
|
||||
new MultiRowRangeFilter(ranges);
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMergeAndSortWithoutOverlap() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(40), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(60), true, Bytes.toBytes(70), false));
|
||||
List<RowRange> actualRanges = MultiRowRangeFilter.sortAndMerge(ranges);
|
||||
List<RowRange> expectedRanges = new ArrayList<RowRange>();
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(40), false));
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(60), true, Bytes.toBytes(70), false));
|
||||
assertRangesEqual(expectedRanges, actualRanges);
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMergeAndSortWithOverlap() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(15), true, Bytes.toBytes(40), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(20), true, Bytes.toBytes(30), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(50), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(70), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(90), true, Bytes.toBytes(100), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(95), true, Bytes.toBytes(100), false));
|
||||
List<RowRange> actualRanges = MultiRowRangeFilter.sortAndMerge(ranges);
|
||||
List<RowRange> expectedRanges = new ArrayList<RowRange>();
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(70), false));
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(90), true, Bytes.toBytes(100), false));
|
||||
assertRangesEqual(expectedRanges, actualRanges);
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMergeAndSortWithStartRowInclusive() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(20), true, Bytes.toBytes(""), false));
|
||||
List<RowRange> actualRanges = MultiRowRangeFilter.sortAndMerge(ranges);
|
||||
List<RowRange> expectedRanges = new ArrayList<RowRange>();
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(""), false));
|
||||
assertRangesEqual(expectedRanges, actualRanges);
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMergeAndSortWithRowExclusive() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(20), false, Bytes.toBytes(""), false));
|
||||
List<RowRange> actualRanges = MultiRowRangeFilter.sortAndMerge(ranges);
|
||||
List<RowRange> expectedRanges = new ArrayList<RowRange>();
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(20), false, Bytes.toBytes(""), false));
|
||||
assertRangesEqual(expectedRanges, actualRanges);
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMergeAndSortWithRowInclusive() throws IOException {
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), true));
|
||||
ranges.add(new RowRange(Bytes.toBytes(20), false, Bytes.toBytes(""), false));
|
||||
List<RowRange> actualRanges = MultiRowRangeFilter.sortAndMerge(ranges);
|
||||
List<RowRange> expectedRanges = new ArrayList<RowRange>();
|
||||
expectedRanges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(""), false));
|
||||
assertRangesEqual(expectedRanges, actualRanges);
|
||||
}
|
||||
|
||||
public void assertRangesEqual(List<RowRange> expected, List<RowRange> actual) {
|
||||
assertEquals(expected.size(), actual.size());
|
||||
for(int i = 0; i < expected.size(); i++) {
|
||||
Assert.assertTrue(Bytes.equals(expected.get(i).getStartRow(), actual.get(i).getStartRow()));
|
||||
Assert.assertTrue(expected.get(i).isStartRowInclusive() ==
|
||||
actual.get(i).isStartRowInclusive());
|
||||
Assert.assertTrue(Bytes.equals(expected.get(i).getStopRow(), actual.get(i).getStopRow()));
|
||||
Assert.assertTrue(expected.get(i).isStopRowInclusive() ==
|
||||
actual.get(i).isStopRowInclusive());
|
||||
}
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeFilterWithRangeOverlap() throws IOException {
|
||||
tableName = Bytes.toBytes("testMultiRowRangeFilterWithRangeOverlap");
|
||||
HTable ht = TEST_UTIL.createTable(tableName, family, Integer.MAX_VALUE);
|
||||
generateRows(numRows, ht, family, qf, value);
|
||||
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(15), true, Bytes.toBytes(40), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(65), true, Bytes.toBytes(75), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(60), true, null, false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(60), true, Bytes.toBytes(80), false));
|
||||
|
||||
MultiRowRangeFilter filter = new MultiRowRangeFilter(ranges);
|
||||
scan.setFilter(filter);
|
||||
int resultsSize = getResultsSize(ht, scan);
|
||||
LOG.info("found " + resultsSize + " results");
|
||||
List<Cell> results1 = getScanResult(Bytes.toBytes(10), Bytes.toBytes(40), ht);
|
||||
List<Cell> results2 = getScanResult(Bytes.toBytes(60), Bytes.toBytes(""), ht);
|
||||
|
||||
assertEquals(results1.size() + results2.size(), resultsSize);
|
||||
|
||||
ht.close();
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeFilterWithoutRangeOverlap() throws IOException {
|
||||
tableName = Bytes.toBytes("testMultiRowRangeFilterWithoutRangeOverlap");
|
||||
HTable ht = TEST_UTIL.createTable(tableName, family, Integer.MAX_VALUE);
|
||||
generateRows(numRows, ht, family, qf, value);
|
||||
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(40), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(60), true, Bytes.toBytes(70), false));
|
||||
|
||||
MultiRowRangeFilter filter = new MultiRowRangeFilter(ranges);
|
||||
scan.setFilter(filter);
|
||||
int resultsSize = getResultsSize(ht, scan);
|
||||
LOG.info("found " + resultsSize + " results");
|
||||
List<Cell> results1 = getScanResult(Bytes.toBytes(10), Bytes.toBytes(20), ht);
|
||||
List<Cell> results2 = getScanResult(Bytes.toBytes(30), Bytes.toBytes(40), ht);
|
||||
List<Cell> results3 = getScanResult(Bytes.toBytes(60), Bytes.toBytes(70), ht);
|
||||
|
||||
assertEquals(results1.size() + results2.size() + results3.size(), resultsSize);
|
||||
|
||||
ht.close();
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeFilterWithEmptyStartRow() throws IOException {
|
||||
tableName = Bytes.toBytes("testMultiRowRangeFilterWithEmptyStartRow");
|
||||
HTable ht = TEST_UTIL.createTable(tableName, family, Integer.MAX_VALUE);
|
||||
generateRows(numRows, ht, family, qf, value);
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(""), true, Bytes.toBytes(10), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(40), false));
|
||||
|
||||
MultiRowRangeFilter filter = new MultiRowRangeFilter(ranges);
|
||||
scan.setFilter(filter);
|
||||
int resultsSize = getResultsSize(ht, scan);
|
||||
List<Cell> results1 = getScanResult(Bytes.toBytes(""), Bytes.toBytes(10), ht);
|
||||
List<Cell> results2 = getScanResult(Bytes.toBytes(30), Bytes.toBytes(40), ht);
|
||||
assertEquals(results1.size() + results2.size(), resultsSize);
|
||||
|
||||
ht.close();
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeFilterWithEmptyStopRow() throws IOException {
|
||||
tableName = Bytes.toBytes("testMultiRowRangeFilterWithEmptyStopRow");
|
||||
HTable ht = TEST_UTIL.createTable(tableName, family, Integer.MAX_VALUE);
|
||||
generateRows(numRows, ht, family, qf, value);
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(""), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(40), false));
|
||||
|
||||
MultiRowRangeFilter filter = new MultiRowRangeFilter(ranges);
|
||||
scan.setFilter(filter);
|
||||
int resultsSize = getResultsSize(ht, scan);
|
||||
List<Cell> results1 = getScanResult(Bytes.toBytes(10), Bytes.toBytes(""), ht);
|
||||
assertEquals(results1.size(), resultsSize);
|
||||
|
||||
ht.close();
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeFilterWithInclusive() throws IOException {
|
||||
tableName = Bytes.toBytes("testMultiRowRangeFilterWithInclusive");
|
||||
HTable ht = TEST_UTIL.createTable(tableName, family, Integer.MAX_VALUE);
|
||||
generateRows(numRows, ht, family, qf, value);
|
||||
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(20), true, Bytes.toBytes(40), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(65), true, Bytes.toBytes(75), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(60), true, null, false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(60), true, Bytes.toBytes(80), false));
|
||||
|
||||
MultiRowRangeFilter filter = new MultiRowRangeFilter(ranges);
|
||||
scan.setFilter(filter);
|
||||
int resultsSize = getResultsSize(ht, scan);
|
||||
LOG.info("found " + resultsSize + " results");
|
||||
List<Cell> results1 = getScanResult(Bytes.toBytes(10), Bytes.toBytes(40), ht);
|
||||
List<Cell> results2 = getScanResult(Bytes.toBytes(60), Bytes.toBytes(""), ht);
|
||||
|
||||
assertEquals(results1.size() + results2.size(), resultsSize);
|
||||
|
||||
ht.close();
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeFilterWithExclusive() throws IOException {
|
||||
tableName = Bytes.toBytes("testMultiRowRangeFilterWithExclusive");
|
||||
HTable ht = TEST_UTIL.createTable(tableName, family, Integer.MAX_VALUE);
|
||||
generateRows(numRows, ht, family, qf, value);
|
||||
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
|
||||
List<RowRange> ranges = new ArrayList<RowRange>();
|
||||
ranges.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(20), false, Bytes.toBytes(40), false));
|
||||
ranges.add(new RowRange(Bytes.toBytes(65), true, Bytes.toBytes(75), false));
|
||||
|
||||
MultiRowRangeFilter filter = new MultiRowRangeFilter(ranges);
|
||||
scan.setFilter(filter);
|
||||
int resultsSize = getResultsSize(ht, scan);
|
||||
LOG.info("found " + resultsSize + " results");
|
||||
List<Cell> results1 = getScanResult(Bytes.toBytes(10), Bytes.toBytes(40), ht);
|
||||
List<Cell> results2 = getScanResult(Bytes.toBytes(65), Bytes.toBytes(75), ht);
|
||||
|
||||
assertEquals((results1.size() - 1) + results2.size(), resultsSize);
|
||||
|
||||
ht.close();
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeWithFilterListAndOperator() throws IOException {
|
||||
tableName = Bytes.toBytes("TestMultiRowRangeFilterWithFilterListAndOperator");
|
||||
HTable ht = TEST_UTIL.createTable(tableName, family, Integer.MAX_VALUE);
|
||||
generateRows(numRows, ht, family, qf, value);
|
||||
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
|
||||
List<RowRange> ranges1 = new ArrayList<RowRange>();
|
||||
ranges1.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges1.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(40), false));
|
||||
ranges1.add(new RowRange(Bytes.toBytes(60), true, Bytes.toBytes(70), false));
|
||||
|
||||
MultiRowRangeFilter filter1 = new MultiRowRangeFilter(ranges1);
|
||||
|
||||
List<RowRange> ranges2 = new ArrayList<RowRange>();
|
||||
ranges2.add(new RowRange(Bytes.toBytes(20), true, Bytes.toBytes(40), false));
|
||||
ranges2.add(new RowRange(Bytes.toBytes(80), true, Bytes.toBytes(90), false));
|
||||
|
||||
MultiRowRangeFilter filter2 = new MultiRowRangeFilter(ranges2);
|
||||
|
||||
FilterList filterList = new FilterList(FilterList.Operator.MUST_PASS_ALL);
|
||||
filterList.addFilter(filter1);
|
||||
filterList.addFilter(filter2);
|
||||
scan.setFilter(filterList);
|
||||
int resultsSize = getResultsSize(ht, scan);
|
||||
LOG.info("found " + resultsSize + " results");
|
||||
List<Cell> results1 = getScanResult(Bytes.toBytes(30), Bytes.toBytes(40), ht);
|
||||
|
||||
assertEquals(results1.size(), resultsSize);
|
||||
|
||||
ht.close();
|
||||
}
|
||||
|
||||
@Test
|
||||
public void testMultiRowRangeWithFilterListOrOperator() throws IOException {
|
||||
tableName = Bytes.toBytes("TestMultiRowRangeFilterWithFilterListOrOperator");
|
||||
HTable ht = TEST_UTIL.createTable(tableName, family, Integer.MAX_VALUE);
|
||||
generateRows(numRows, ht, family, qf, value);
|
||||
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
|
||||
List<RowRange> ranges1 = new ArrayList<RowRange>();
|
||||
ranges1.add(new RowRange(Bytes.toBytes(30), true, Bytes.toBytes(40), false));
|
||||
ranges1.add(new RowRange(Bytes.toBytes(10), true, Bytes.toBytes(20), false));
|
||||
ranges1.add(new RowRange(Bytes.toBytes(60), true, Bytes.toBytes(70), false));
|
||||
|
||||
MultiRowRangeFilter filter1 = new MultiRowRangeFilter(ranges1);
|
||||
|
||||
List<RowRange> ranges2 = new ArrayList<RowRange>();
|
||||
ranges2.add(new RowRange(Bytes.toBytes(20), true, Bytes.toBytes(40), false));
|
||||
ranges2.add(new RowRange(Bytes.toBytes(80), true, Bytes.toBytes(90), false));
|
||||
|
||||
MultiRowRangeFilter filter2 = new MultiRowRangeFilter(ranges2);
|
||||
|
||||
FilterList filterList = new FilterList(FilterList.Operator.MUST_PASS_ONE);
|
||||
filterList.addFilter(filter1);
|
||||
filterList.addFilter(filter2);
|
||||
scan.setFilter(filterList);
|
||||
int resultsSize = getResultsSize(ht, scan);
|
||||
LOG.info("found " + resultsSize + " results");
|
||||
List<Cell> results1 = getScanResult(Bytes.toBytes(10), Bytes.toBytes(40), ht);
|
||||
List<Cell> results2 = getScanResult(Bytes.toBytes(60), Bytes.toBytes(70), ht);
|
||||
List<Cell> results3 = getScanResult(Bytes.toBytes(80), Bytes.toBytes(90), ht);
|
||||
|
||||
assertEquals(results1.size() + results2.size() + results3.size(),resultsSize);
|
||||
|
||||
ht.close();
|
||||
}
|
||||
|
||||
private void generateRows(int numberOfRows, HTable ht, byte[] family, byte[] qf, byte[] value)
|
||||
throws IOException {
|
||||
for (int i = 0; i < numberOfRows; i++) {
|
||||
byte[] row = Bytes.toBytes(i);
|
||||
Put p = new Put(row);
|
||||
p.add(family, qf, value);
|
||||
ht.put(p);
|
||||
}
|
||||
TEST_UTIL.flush();
|
||||
}
|
||||
|
||||
private List<Cell> getScanResult(byte[] startRow, byte[] stopRow, HTable ht) throws IOException {
|
||||
Scan scan = new Scan();
|
||||
scan.setMaxVersions();
|
||||
if(!Bytes.toString(startRow).isEmpty()) {
|
||||
scan.setStartRow(startRow);
|
||||
}
|
||||
if(!Bytes.toString(stopRow).isEmpty()) {
|
||||
scan.setStopRow(stopRow);
|
||||
}
|
||||
ResultScanner scanner = ht.getScanner(scan);
|
||||
List<Cell> kvList = new ArrayList<Cell>();
|
||||
Result r;
|
||||
while ((r = scanner.next()) != null) {
|
||||
for (Cell kv : r.listCells()) {
|
||||
kvList.add(kv);
|
||||
}
|
||||
}
|
||||
return kvList;
|
||||
}
|
||||
|
||||
private int getResultsSize(HTable ht, Scan scan) throws IOException {
|
||||
ResultScanner scanner = ht.getScanner(scan);
|
||||
List<Cell> results = new ArrayList<Cell>();
|
||||
Result r;
|
||||
while ((r = scanner.next()) != null) {
|
||||
for (Cell kv : r.listCells()) {
|
||||
results.add(kv);
|
||||
}
|
||||
}
|
||||
return results.size();
|
||||
}
|
||||
}
|
Loading…
Reference in New Issue