HBASE-13933 DBE's seekBefore with tags corrupts the tag's offset information thus leading to incorrect results (ramkrishna.s.vasudevan)

This commit is contained in:
Nick Dimiduk 2015-06-19 14:26:02 -07:00
parent d628f95307
commit 34cd3377f8
2 changed files with 99 additions and 14 deletions

View File

@ -170,6 +170,8 @@ abstract class BufferedDataBlockEncoder implements DataBlockEncoder {
nextKvOffset = nextState.nextKvOffset; nextKvOffset = nextState.nextKvOffset;
memstoreTS = nextState.memstoreTS; memstoreTS = nextState.memstoreTS;
currentBuffer = nextState.currentBuffer; currentBuffer = nextState.currentBuffer;
tagsOffset = nextState.tagsOffset;
tagsLength = nextState.tagsLength;
if (nextState.tagCompressionContext != null) { if (nextState.tagCompressionContext != null) {
tagCompressionContext = nextState.tagCompressionContext; tagCompressionContext = nextState.tagCompressionContext;
} }

View File

@ -19,27 +19,71 @@
package org.apache.hadoop.hbase.io.hfile; package org.apache.hadoop.hbase.io.hfile;
import java.io.IOException; import java.io.IOException;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Iterator;
import java.util.List;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertTrue;
import org.junit.Before;
import org.junit.Test;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataOutputStream; import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path; import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hbase.Cell; import org.apache.hadoop.hbase.Cell;
import org.apache.hadoop.hbase.HBaseTestCase; import org.apache.hadoop.hbase.CellUtil;
import org.apache.hadoop.hbase.HBaseTestingUtility;
import org.apache.hadoop.hbase.HConstants; import org.apache.hadoop.hbase.HConstants;
import org.apache.hadoop.hbase.KeyValue; import org.apache.hadoop.hbase.KeyValue;
import org.apache.hadoop.hbase.KeyValueUtil; import org.apache.hadoop.hbase.KeyValueUtil;
import org.apache.hadoop.hbase.io.encoding.DataBlockEncoding;
import org.apache.hadoop.hbase.testclassification.SmallTests; import org.apache.hadoop.hbase.testclassification.SmallTests;
import org.apache.hadoop.hbase.Tag; import org.apache.hadoop.hbase.Tag;
import org.apache.hadoop.hbase.util.Bytes; import org.apache.hadoop.hbase.util.Bytes;
import org.junit.experimental.categories.Category; import org.junit.experimental.categories.Category;
import org.junit.runner.RunWith;
import org.junit.runners.Parameterized;
import org.junit.runners.Parameterized.Parameters;
/** /**
* Test {@link HFileScanner#seekTo(byte[])} and its variants. * Test {@link HFileScanner#seekTo(byte[])} and its variants.
*/ */
@Category(SmallTests.class) @Category(SmallTests.class)
public class TestSeekTo extends HBaseTestCase { @RunWith(Parameterized.class)
public class TestSeekTo {
private final static HBaseTestingUtility TEST_UTIL = new HBaseTestingUtility();
private final DataBlockEncoding encoding;
@Parameters
public static Collection<Object[]> parameters() {
List<Object[]> paramList = new ArrayList<Object[]>();
for (DataBlockEncoding encoding : DataBlockEncoding.values()) {
// Remove after HBASE-13939
if (encoding != DataBlockEncoding.PREFIX_TREE) {
paramList.add(new Object[] { encoding });
}
}
return paramList;
}
static boolean switchKVs = false; static boolean switchKVs = false;
public TestSeekTo(DataBlockEncoding encoding) {
this.encoding = encoding;
}
@Before
public void setUp() {
//reset
switchKVs = false;
}
static KeyValue toKV(String row, TagUsage tagUsage) { static KeyValue toKV(String row, TagUsage tagUsage) {
if (tagUsage == TagUsage.NO_TAG) { if (tagUsage == TagUsage.NO_TAG) {
return new KeyValue(Bytes.toBytes(row), Bytes.toBytes("family"), Bytes.toBytes("qualifier"), return new KeyValue(Bytes.toBytes(row), Bytes.toBytes("family"), Bytes.toBytes("qualifier"),
@ -54,7 +98,7 @@ public class TestSeekTo extends HBaseTestCase {
if (!switchKVs) { if (!switchKVs) {
switchKVs = true; switchKVs = true;
return new KeyValue(Bytes.toBytes(row), Bytes.toBytes("family"), return new KeyValue(Bytes.toBytes(row), Bytes.toBytes("family"),
Bytes.toBytes("qualifier"), Bytes.toBytes("value")); Bytes.toBytes("qualifier"), HConstants.LATEST_TIMESTAMP, Bytes.toBytes("value"));
} else { } else {
switchKVs = false; switchKVs = false;
Tag t = new Tag((byte) 1, "myTag1"); Tag t = new Tag((byte) 1, "myTag1");
@ -65,20 +109,23 @@ public class TestSeekTo extends HBaseTestCase {
} }
} }
} }
static String toRowStr(Cell kv) { static String toRowStr(Cell kv) {
return Bytes.toString(KeyValueUtil.ensureKeyValue(kv).getRow()); return Bytes.toString(KeyValueUtil.ensureKeyValue(kv).getRow());
} }
Path makeNewFile(TagUsage tagUsage) throws IOException { Path makeNewFile(TagUsage tagUsage) throws IOException {
Path ncTFile = new Path(this.testDir, "basic.hfile"); Path ncTFile = new Path(TEST_UTIL.getDataTestDir(), "basic.hfile");
FSDataOutputStream fout = TEST_UTIL.getTestFileSystem().create(ncTFile);
Configuration conf = TEST_UTIL.getConfiguration();
if (tagUsage != TagUsage.NO_TAG) { if (tagUsage != TagUsage.NO_TAG) {
conf.setInt("hfile.format.version", 3); conf.setInt("hfile.format.version", 3);
} else { } else {
conf.setInt("hfile.format.version", 2); conf.setInt("hfile.format.version", 2);
} }
FSDataOutputStream fout = this.fs.create(ncTFile);
int blocksize = toKV("a", tagUsage).getLength() * 3; int blocksize = toKV("a", tagUsage).getLength() * 3;
HFileContext context = new HFileContextBuilder().withBlockSize(blocksize) HFileContext context = new HFileContextBuilder().withBlockSize(blocksize)
.withDataBlockEncoding(encoding)
.withIncludesTags(true).build(); .withIncludesTags(true).build();
HFile.Writer writer = HFile.getWriterFactoryNoCache(conf).withOutputStream(fout) HFile.Writer writer = HFile.getWriterFactoryNoCache(conf).withOutputStream(fout)
.withFileContext(context) .withFileContext(context)
@ -96,6 +143,7 @@ public class TestSeekTo extends HBaseTestCase {
return ncTFile; return ncTFile;
} }
@Test
public void testSeekBefore() throws Exception { public void testSeekBefore() throws Exception {
testSeekBeforeInternals(TagUsage.NO_TAG); testSeekBeforeInternals(TagUsage.NO_TAG);
testSeekBeforeInternals(TagUsage.ONLY_TAG); testSeekBeforeInternals(TagUsage.ONLY_TAG);
@ -104,6 +152,8 @@ public class TestSeekTo extends HBaseTestCase {
protected void testSeekBeforeInternals(TagUsage tagUsage) throws IOException { protected void testSeekBeforeInternals(TagUsage tagUsage) throws IOException {
Path p = makeNewFile(tagUsage); Path p = makeNewFile(tagUsage);
FileSystem fs = TEST_UTIL.getTestFileSystem();
Configuration conf = TEST_UTIL.getConfiguration();
HFile.Reader reader = HFile.createReader(fs, p, new CacheConfig(conf), conf); HFile.Reader reader = HFile.createReader(fs, p, new CacheConfig(conf), conf);
reader.loadFileInfo(); reader.loadFileInfo();
HFileScanner scanner = reader.getScanner(false, true); HFileScanner scanner = reader.getScanner(false, true);
@ -129,14 +179,25 @@ public class TestSeekTo extends HBaseTestCase {
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
assertEquals(true, scanner.seekBefore(toKV("j", tagUsage))); assertEquals(true, scanner.seekBefore(toKV("j", tagUsage)));
assertEquals("i", toRowStr(scanner.getKeyValue())); assertEquals("i", toRowStr(scanner.getKeyValue()));
Cell cell = scanner.getKeyValue();
if (tagUsage != TagUsage.NO_TAG && cell.getTagsLength() > 0) {
Iterator<Tag> tagsIterator = CellUtil.tagsIterator(cell.getTagsArray(), cell.getTagsOffset(),
cell.getTagsLength());
while (tagsIterator.hasNext()) {
Tag next = tagsIterator.next();
assertEquals("myTag1", Bytes.toString(next.getValue()));
}
}
assertEquals(true, scanner.seekBefore(toKV("k", tagUsage))); assertEquals(true, scanner.seekBefore(toKV("k", tagUsage)));
assertEquals("i", toRowStr(scanner.getKeyValue())); assertEquals("i", toRowStr(scanner.getKeyValue()));
assertEquals(true, scanner.seekBefore(toKV("l", tagUsage))); assertEquals(true, scanner.seekBefore(toKV("l", tagUsage)));
assertEquals("k", toRowStr(scanner.getKeyValue())); assertEquals("k", toRowStr(scanner.getKeyValue()));
reader.close(); reader.close();
deleteTestDir(fs);
} }
@Test
public void testSeekBeforeWithReSeekTo() throws Exception { public void testSeekBeforeWithReSeekTo() throws Exception {
testSeekBeforeWithReSeekToInternals(TagUsage.NO_TAG); testSeekBeforeWithReSeekToInternals(TagUsage.NO_TAG);
testSeekBeforeWithReSeekToInternals(TagUsage.ONLY_TAG); testSeekBeforeWithReSeekToInternals(TagUsage.ONLY_TAG);
@ -145,6 +206,8 @@ public class TestSeekTo extends HBaseTestCase {
protected void testSeekBeforeWithReSeekToInternals(TagUsage tagUsage) throws IOException { protected void testSeekBeforeWithReSeekToInternals(TagUsage tagUsage) throws IOException {
Path p = makeNewFile(tagUsage); Path p = makeNewFile(tagUsage);
FileSystem fs = TEST_UTIL.getTestFileSystem();
Configuration conf = TEST_UTIL.getConfiguration();
HFile.Reader reader = HFile.createReader(fs, p, new CacheConfig(conf), conf); HFile.Reader reader = HFile.createReader(fs, p, new CacheConfig(conf), conf);
reader.loadFileInfo(); reader.loadFileInfo();
HFileScanner scanner = reader.getScanner(false, true); HFileScanner scanner = reader.getScanner(false, true);
@ -162,7 +225,7 @@ public class TestSeekTo extends HBaseTestCase {
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
// seekBefore e, so the scanner points to c // seekBefore e, so the scanner points to c
assertEquals(true, scanner.seekBefore(toKV("e", tagUsage))); assertTrue(scanner.seekBefore(toKV("e", tagUsage)));
assertEquals("c", toRowStr(scanner.getKeyValue())); assertEquals("c", toRowStr(scanner.getKeyValue()));
// reseekTo e and g // reseekTo e and g
assertEquals(0, scanner.reseekTo(toKV("e", tagUsage))); assertEquals(0, scanner.reseekTo(toKV("e", tagUsage)));
@ -171,7 +234,7 @@ public class TestSeekTo extends HBaseTestCase {
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
// seekBefore f, so the scanner points to e // seekBefore f, so the scanner points to e
assertEquals(true, scanner.seekBefore(toKV("f", tagUsage))); assertTrue(scanner.seekBefore(toKV("f", tagUsage)));
assertEquals("e", toRowStr(scanner.getKeyValue())); assertEquals("e", toRowStr(scanner.getKeyValue()));
// reseekTo e and g // reseekTo e and g
assertEquals(0, scanner.reseekTo(toKV("e", tagUsage))); assertEquals(0, scanner.reseekTo(toKV("e", tagUsage)));
@ -180,7 +243,7 @@ public class TestSeekTo extends HBaseTestCase {
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
// seekBefore g, so the scanner points to e // seekBefore g, so the scanner points to e
assertEquals(true, scanner.seekBefore(toKV("g", tagUsage))); assertTrue(scanner.seekBefore(toKV("g", tagUsage)));
assertEquals("e", toRowStr(scanner.getKeyValue())); assertEquals("e", toRowStr(scanner.getKeyValue()));
// reseekTo e and g again // reseekTo e and g again
assertEquals(0, scanner.reseekTo(toKV("e", tagUsage))); assertEquals(0, scanner.reseekTo(toKV("e", tagUsage)));
@ -189,28 +252,28 @@ public class TestSeekTo extends HBaseTestCase {
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
// seekBefore h, so the scanner points to g // seekBefore h, so the scanner points to g
assertEquals(true, scanner.seekBefore(toKV("h", tagUsage))); assertTrue(scanner.seekBefore(toKV("h", tagUsage)));
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
// reseekTo g // reseekTo g
assertEquals(0, scanner.reseekTo(toKV("g", tagUsage))); assertEquals(0, scanner.reseekTo(toKV("g", tagUsage)));
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
// seekBefore i, so the scanner points to g // seekBefore i, so the scanner points to g
assertEquals(true, scanner.seekBefore(toKV("i", tagUsage))); assertTrue(scanner.seekBefore(toKV("i", tagUsage)));
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
// reseekTo g // reseekTo g
assertEquals(0, scanner.reseekTo(toKV("g", tagUsage))); assertEquals(0, scanner.reseekTo(toKV("g", tagUsage)));
assertEquals("g", toRowStr(scanner.getKeyValue())); assertEquals("g", toRowStr(scanner.getKeyValue()));
// seekBefore j, so the scanner points to i // seekBefore j, so the scanner points to i
assertEquals(true, scanner.seekBefore(toKV("j", tagUsage))); assertTrue(scanner.seekBefore(toKV("j", tagUsage)));
assertEquals("i", toRowStr(scanner.getKeyValue())); assertEquals("i", toRowStr(scanner.getKeyValue()));
// reseekTo i // reseekTo i
assertEquals(0, scanner.reseekTo(toKV("i", tagUsage))); assertEquals(0, scanner.reseekTo(toKV("i", tagUsage)));
assertEquals("i", toRowStr(scanner.getKeyValue())); assertEquals("i", toRowStr(scanner.getKeyValue()));
// seekBefore k, so the scanner points to i // seekBefore k, so the scanner points to i
assertEquals(true, scanner.seekBefore(toKV("k", tagUsage))); assertTrue(scanner.seekBefore(toKV("k", tagUsage)));
assertEquals("i", toRowStr(scanner.getKeyValue())); assertEquals("i", toRowStr(scanner.getKeyValue()));
// reseekTo i and k // reseekTo i and k
assertEquals(0, scanner.reseekTo(toKV("i", tagUsage))); assertEquals(0, scanner.reseekTo(toKV("i", tagUsage)));
@ -224,8 +287,10 @@ public class TestSeekTo extends HBaseTestCase {
// reseekTo k // reseekTo k
assertEquals(0, scanner.reseekTo(toKV("k", tagUsage))); assertEquals(0, scanner.reseekTo(toKV("k", tagUsage)));
assertEquals("k", toRowStr(scanner.getKeyValue())); assertEquals("k", toRowStr(scanner.getKeyValue()));
deleteTestDir(fs);
} }
@Test
public void testSeekTo() throws Exception { public void testSeekTo() throws Exception {
testSeekToInternals(TagUsage.NO_TAG); testSeekToInternals(TagUsage.NO_TAG);
testSeekToInternals(TagUsage.ONLY_TAG); testSeekToInternals(TagUsage.ONLY_TAG);
@ -234,6 +299,8 @@ public class TestSeekTo extends HBaseTestCase {
protected void testSeekToInternals(TagUsage tagUsage) throws IOException { protected void testSeekToInternals(TagUsage tagUsage) throws IOException {
Path p = makeNewFile(tagUsage); Path p = makeNewFile(tagUsage);
FileSystem fs = TEST_UTIL.getTestFileSystem();
Configuration conf = TEST_UTIL.getConfiguration();
HFile.Reader reader = HFile.createReader(fs, p, new CacheConfig(conf), conf); HFile.Reader reader = HFile.createReader(fs, p, new CacheConfig(conf), conf);
reader.loadFileInfo(); reader.loadFileInfo();
assertEquals(2, reader.getDataBlockIndexReader().getRootBlockCount()); assertEquals(2, reader.getDataBlockIndexReader().getRootBlockCount());
@ -248,20 +315,35 @@ public class TestSeekTo extends HBaseTestCase {
// 'h' does not exist so we will get a '1' back for not found. // 'h' does not exist so we will get a '1' back for not found.
assertEquals(0, scanner.seekTo(toKV("i", tagUsage))); assertEquals(0, scanner.seekTo(toKV("i", tagUsage)));
assertEquals("i", toRowStr(scanner.getKeyValue())); assertEquals("i", toRowStr(scanner.getKeyValue()));
assertEquals(1, scanner.seekTo(toKV("l", tagUsage))); assertEquals(1, scanner.seekTo(toKV("l", tagUsage)));
assertEquals("k", toRowStr(scanner.getKeyValue())); if (encoding == DataBlockEncoding.PREFIX_TREE) {
// TODO : Fix this
assertEquals(null, scanner.getKeyValue());
} else {
assertEquals("k", toRowStr(scanner.getKeyValue()));
}
reader.close(); reader.close();
deleteTestDir(fs);
} }
@Test
public void testBlockContainingKey() throws Exception { public void testBlockContainingKey() throws Exception {
testBlockContainingKeyInternals(TagUsage.NO_TAG); testBlockContainingKeyInternals(TagUsage.NO_TAG);
testBlockContainingKeyInternals(TagUsage.ONLY_TAG); testBlockContainingKeyInternals(TagUsage.ONLY_TAG);
testBlockContainingKeyInternals(TagUsage.PARTIAL_TAG); testBlockContainingKeyInternals(TagUsage.PARTIAL_TAG);
} }
protected void deleteTestDir(FileSystem fs) throws IOException {
Path dataTestDir = TEST_UTIL.getDataTestDir();
if (fs.exists(dataTestDir)) {
fs.delete(dataTestDir, true);
}
}
protected void testBlockContainingKeyInternals(TagUsage tagUsage) throws IOException { protected void testBlockContainingKeyInternals(TagUsage tagUsage) throws IOException {
Path p = makeNewFile(tagUsage); Path p = makeNewFile(tagUsage);
FileSystem fs = TEST_UTIL.getTestFileSystem();
Configuration conf = TEST_UTIL.getConfiguration();
HFile.Reader reader = HFile.createReader(fs, p, new CacheConfig(conf), conf); HFile.Reader reader = HFile.createReader(fs, p, new CacheConfig(conf), conf);
reader.loadFileInfo(); reader.loadFileInfo();
HFileBlockIndex.BlockIndexReader blockIndexReader = HFileBlockIndex.BlockIndexReader blockIndexReader =
@ -288,5 +370,6 @@ public class TestSeekTo extends HBaseTestCase {
assertEquals(1, blockIndexReader.rootBlockContainingKey( assertEquals(1, blockIndexReader.rootBlockContainingKey(
toKV("l", tagUsage))); toKV("l", tagUsage)));
reader.close(); reader.close();
deleteTestDir(fs);
} }
} }