HBASE-15287 mapreduce.RowCounter returns incorrect result with binary row key inputs (Matt Warhaftig)

This commit is contained in:
tedyu 2016-04-16 12:46:21 -07:00
parent d815211f5a
commit e9211e415a
12 changed files with 79 additions and 28 deletions

View File

@ -154,6 +154,6 @@ implements TableMap<ImmutableBytesWritable,Result> {
} }
sb.append(Bytes.toString(vals[i])); sb.append(Bytes.toString(vals[i]));
} }
return new ImmutableBytesWritable(Bytes.toBytes(sb.toString())); return new ImmutableBytesWritable(Bytes.toBytesBinary(sb.toString()));
} }
} }

View File

@ -241,7 +241,7 @@ public class CellCounter extends Configured implements Tool {
String regexPattern = filterCriteria.substring(1, filterCriteria.length()); String regexPattern = filterCriteria.substring(1, filterCriteria.length());
rowFilter = new RowFilter(CompareFilter.CompareOp.EQUAL, new RegexStringComparator(regexPattern)); rowFilter = new RowFilter(CompareFilter.CompareOp.EQUAL, new RegexStringComparator(regexPattern));
} else { } else {
rowFilter = new PrefixFilter(Bytes.toBytes(filterCriteria)); rowFilter = new PrefixFilter(Bytes.toBytesBinary(filterCriteria));
} }
return rowFilter; return rowFilter;
} }

View File

@ -111,11 +111,11 @@ public class CopyTable extends Configured implements Tool {
} }
if (startRow != null) { if (startRow != null) {
scan.setStartRow(Bytes.toBytes(startRow)); scan.setStartRow(Bytes.toBytesBinary(startRow));
} }
if (stopRow != null) { if (stopRow != null) {
scan.setStopRow(Bytes.toBytes(stopRow)); scan.setStopRow(Bytes.toBytesBinary(stopRow));
} }
if(families != null) { if(families != null) {

View File

@ -100,10 +100,10 @@ public class Export extends Configured implements Tool {
s.setCacheBlocks(false); s.setCacheBlocks(false);
// set Start and Stop row // set Start and Stop row
if (conf.get(TableInputFormat.SCAN_ROW_START) != null) { if (conf.get(TableInputFormat.SCAN_ROW_START) != null) {
s.setStartRow(Bytes.toBytes(conf.get(TableInputFormat.SCAN_ROW_START))); s.setStartRow(Bytes.toBytesBinary(conf.get(TableInputFormat.SCAN_ROW_START)));
} }
if (conf.get(TableInputFormat.SCAN_ROW_STOP) != null) { if (conf.get(TableInputFormat.SCAN_ROW_STOP) != null) {
s.setStopRow(Bytes.toBytes(conf.get(TableInputFormat.SCAN_ROW_STOP))); s.setStopRow(Bytes.toBytesBinary(conf.get(TableInputFormat.SCAN_ROW_STOP)));
} }
// Set Scan Column Family // Set Scan Column Family
boolean raw = Boolean.parseBoolean(conf.get(RAW_SCAN)); boolean raw = Boolean.parseBoolean(conf.get(RAW_SCAN));
@ -142,7 +142,7 @@ public class Export extends Configured implements Tool {
String regexPattern = filterCriteria.substring(1, filterCriteria.length()); String regexPattern = filterCriteria.substring(1, filterCriteria.length());
exportFilter = new RowFilter(CompareOp.EQUAL, new RegexStringComparator(regexPattern)); exportFilter = new RowFilter(CompareOp.EQUAL, new RegexStringComparator(regexPattern));
} else { } else {
exportFilter = new PrefixFilter(Bytes.toBytes(filterCriteria)); exportFilter = new PrefixFilter(Bytes.toBytesBinary(filterCriteria));
} }
return exportFilter; return exportFilter;
} }

View File

@ -145,7 +145,7 @@ extends TableMapper<ImmutableBytesWritable,Result> implements Configurable {
} }
sb.append(Bytes.toString(vals[i])); sb.append(Bytes.toString(vals[i]));
} }
return new ImmutableBytesWritable(Bytes.toBytes(sb.toString())); return new ImmutableBytesWritable(Bytes.toBytesBinary(sb.toString()));
} }
/** /**

View File

@ -147,10 +147,10 @@ public class RowCounter extends Configured implements Tool {
Scan scan = new Scan(); Scan scan = new Scan();
scan.setCacheBlocks(false); scan.setCacheBlocks(false);
if (startKey != null && !startKey.equals("")) { if (startKey != null && !startKey.equals("")) {
scan.setStartRow(Bytes.toBytes(startKey)); scan.setStartRow(Bytes.toBytesBinary(startKey));
} }
if (endKey != null && !endKey.equals("")) { if (endKey != null && !endKey.equals("")) {
scan.setStopRow(Bytes.toBytes(endKey)); scan.setStopRow(Bytes.toBytesBinary(endKey));
} }
if (sb.length() > 0) { if (sb.length() > 0) {
for (String columnName : sb.toString().trim().split(" ")) { for (String columnName : sb.toString().trim().split(" ")) {

View File

@ -94,7 +94,7 @@ implements Configurable {
} }
LOG.warn("Using deprecated configuration " + deprecatedKey + LOG.warn("Using deprecated configuration " + deprecatedKey +
" - please use static accessor methods instead."); " - please use static accessor methods instead.");
return Bytes.toBytes(oldStyleVal); return Bytes.toBytesBinary(oldStyleVal);
} }
@Override @Override

View File

@ -129,11 +129,11 @@ implements Configurable {
scan = new Scan(); scan = new Scan();
if (conf.get(SCAN_ROW_START) != null) { if (conf.get(SCAN_ROW_START) != null) {
scan.setStartRow(Bytes.toBytes(conf.get(SCAN_ROW_START))); scan.setStartRow(Bytes.toBytesBinary(conf.get(SCAN_ROW_START)));
} }
if (conf.get(SCAN_ROW_STOP) != null) { if (conf.get(SCAN_ROW_STOP) != null) {
scan.setStopRow(Bytes.toBytes(conf.get(SCAN_ROW_STOP))); scan.setStopRow(Bytes.toBytesBinary(conf.get(SCAN_ROW_STOP)));
} }
if (conf.get(SCAN_COLUMNS) != null) { if (conf.get(SCAN_COLUMNS) != null) {

View File

@ -47,8 +47,8 @@ import static org.junit.Assert.fail;
@Category({MapReduceTests.class, LargeTests.class}) @Category({MapReduceTests.class, LargeTests.class})
public class TestCellCounter { public class TestCellCounter {
private static final HBaseTestingUtility UTIL = new HBaseTestingUtility(); private static final HBaseTestingUtility UTIL = new HBaseTestingUtility();
private static final byte[] ROW1 = Bytes.toBytes("row1"); private static final byte[] ROW1 = Bytes.toBytesBinary("\\x01row1");
private static final byte[] ROW2 = Bytes.toBytes("row2"); private static final byte[] ROW2 = Bytes.toBytesBinary("\\x01row2");
private static final String FAMILY_A_STRING = "a"; private static final String FAMILY_A_STRING = "a";
private static final String FAMILY_B_STRING = "b"; private static final String FAMILY_B_STRING = "b";
private static final byte[] FAMILY_A = Bytes.toBytes(FAMILY_A_STRING); private static final byte[] FAMILY_A = Bytes.toBytes(FAMILY_A_STRING);
@ -111,6 +111,44 @@ public class TestCellCounter {
} }
} }
/**
* Test CellCounter all data should print to output
*/
@Test(timeout = 300000)
public void testCellCounterPrefix() throws Exception {
TableName sourceTable = TableName.valueOf("testCellCounterPrefix");
byte[][] families = { FAMILY_A, FAMILY_B };
Table t = UTIL.createTable(sourceTable, families);
try {
Put p = new Put(ROW1);
p.addColumn(FAMILY_A, QUALIFIER, now, Bytes.toBytes("Data11"));
p.addColumn(FAMILY_B, QUALIFIER, now + 1, Bytes.toBytes("Data12"));
p.addColumn(FAMILY_A, QUALIFIER, now + 2, Bytes.toBytes("Data13"));
t.put(p);
p = new Put(ROW2);
p.addColumn(FAMILY_B, QUALIFIER, now, Bytes.toBytes("Dat21"));
p.addColumn(FAMILY_A, QUALIFIER, now + 1, Bytes.toBytes("Data22"));
p.addColumn(FAMILY_B, QUALIFIER, now + 2, Bytes.toBytes("Data23"));
t.put(p);
String[] args = { sourceTable.getNameAsString(), FQ_OUTPUT_DIR.toString(), ";", "\\x01row1" };
runCount(args);
FileInputStream inputStream =
new FileInputStream(OUTPUT_DIR + File.separator + "part-r-00000");
String data = IOUtils.toString(inputStream);
inputStream.close();
assertTrue(data.contains("Total Families Across all Rows" + "\t" + "2"));
assertTrue(data.contains("Total Qualifiers across all Rows" + "\t" + "2"));
assertTrue(data.contains("Total ROWS" + "\t" + "1"));
assertTrue(data.contains("b;q" + "\t" + "1"));
assertTrue(data.contains("a;q" + "\t" + "1"));
assertTrue(data.contains("row1;a;q_Versions" + "\t" + "1"));
assertTrue(data.contains("row1;b;q_Versions" + "\t" + "1"));
} finally {
t.close();
FileUtil.fullyDelete(new File(OUTPUT_DIR));
}
}
/** /**
* Test CellCounter with time range all data should print to output * Test CellCounter with time range all data should print to output
*/ */

View File

@ -134,9 +134,9 @@ public class TestCopyTable {
final TableName TABLENAME2 = TableName.valueOf("testStartStopRow2"); final TableName TABLENAME2 = TableName.valueOf("testStartStopRow2");
final byte[] FAMILY = Bytes.toBytes("family"); final byte[] FAMILY = Bytes.toBytes("family");
final byte[] COLUMN1 = Bytes.toBytes("c1"); final byte[] COLUMN1 = Bytes.toBytes("c1");
final byte[] ROW0 = Bytes.toBytes("row0"); final byte[] ROW0 = Bytes.toBytesBinary("\\x01row0");
final byte[] ROW1 = Bytes.toBytes("row1"); final byte[] ROW1 = Bytes.toBytesBinary("\\x01row1");
final byte[] ROW2 = Bytes.toBytes("row2"); final byte[] ROW2 = Bytes.toBytesBinary("\\x01row2");
Table t1 = TEST_UTIL.createTable(TABLENAME1, FAMILY); Table t1 = TEST_UTIL.createTable(TABLENAME1, FAMILY);
Table t2 = TEST_UTIL.createTable(TABLENAME2, FAMILY); Table t2 = TEST_UTIL.createTable(TABLENAME2, FAMILY);
@ -156,8 +156,8 @@ public class TestCopyTable {
assertEquals( assertEquals(
0, 0,
ToolRunner.run(new Configuration(TEST_UTIL.getConfiguration()), ToolRunner.run(new Configuration(TEST_UTIL.getConfiguration()),
copy, new String[] { "--new.name=" + TABLENAME2, "--startrow=row1", copy, new String[] { "--new.name=" + TABLENAME2, "--startrow=\\x01row1",
"--stoprow=row2", TABLENAME1.getNameAsString() })); "--stoprow=\\x01row2", TABLENAME1.getNameAsString() }));
// verify the data was copied into table 2 // verify the data was copied into table 2
// row1 exist, row0, row2 do not exist // row1 exist, row0, row2 do not exist

View File

@ -93,8 +93,9 @@ import org.mockito.stubbing.Answer;
public class TestImportExport { public class TestImportExport {
private static final Log LOG = LogFactory.getLog(TestImportExport.class); private static final Log LOG = LogFactory.getLog(TestImportExport.class);
private static final HBaseTestingUtility UTIL = new HBaseTestingUtility(); private static final HBaseTestingUtility UTIL = new HBaseTestingUtility();
private static final byte[] ROW1 = Bytes.toBytes("row1"); private static final byte[] ROW1 = Bytes.toBytesBinary("\\x32row1");
private static final byte[] ROW2 = Bytes.toBytes("row2"); private static final byte[] ROW2 = Bytes.toBytesBinary("\\x32row2");
private static final byte[] ROW3 = Bytes.toBytesBinary("\\x32row3");
private static final String FAMILYA_STRING = "a"; private static final String FAMILYA_STRING = "a";
private static final String FAMILYB_STRING = "b"; private static final String FAMILYB_STRING = "b";
private static final byte[] FAMILYA = Bytes.toBytes(FAMILYA_STRING); private static final byte[] FAMILYA = Bytes.toBytes(FAMILYA_STRING);
@ -181,9 +182,17 @@ public class TestImportExport {
p.addColumn(FAMILYA, QUAL, now + 1, QUAL); p.addColumn(FAMILYA, QUAL, now + 1, QUAL);
p.addColumn(FAMILYA, QUAL, now + 2, QUAL); p.addColumn(FAMILYA, QUAL, now + 2, QUAL);
t.put(p); t.put(p);
p = new Put(ROW3);
p.addColumn(FAMILYA, QUAL, now, QUAL);
p.addColumn(FAMILYA, QUAL, now + 1, QUAL);
p.addColumn(FAMILYA, QUAL, now + 2, QUAL);
t.put(p);
} }
String[] args = new String[] { String[] args = new String[] {
// Only export row1 & row2.
"-D" + TableInputFormat.SCAN_ROW_START + "=\\x32row1",
"-D" + TableInputFormat.SCAN_ROW_STOP + "=\\x32row3",
EXPORT_TABLE, EXPORT_TABLE,
FQ_OUTPUT_DIR, FQ_OUTPUT_DIR,
"1000", // max number of key versions per key to export "1000", // max number of key versions per key to export
@ -207,6 +216,9 @@ public class TestImportExport {
g.setMaxVersions(); g.setMaxVersions();
r = t.get(g); r = t.get(g);
assertEquals(3, r.size()); assertEquals(3, r.size());
g = new Get(ROW3);
r = t.get(g);
assertEquals(0, r.size());
} }
} }

View File

@ -149,7 +149,7 @@ public class TestRowCounter {
@Test @Test
public void testRowCounterColumnAndRowRange() throws Exception { public void testRowCounterColumnAndRowRange() throws Exception {
String[] args = new String[] { String[] args = new String[] {
TABLE_NAME, "--range=rov,rox", COL_FAM + ":" + COL1 TABLE_NAME, "--range=\\x00rov,\\x00rox", COL_FAM + ":" + COL1
}; };
runRowCount(args, 8); runRowCount(args, 8);
} }
@ -245,7 +245,8 @@ public class TestRowCounter {
// write few rows with two columns // write few rows with two columns
int i = 0; int i = 0;
for (; i < TOTAL_ROWS - ROWS_WITH_ONE_COL; i++) { for (; i < TOTAL_ROWS - ROWS_WITH_ONE_COL; i++) {
byte[] row = Bytes.toBytes("row" + i); // Use binary rows values to test for HBASE-15287.
byte[] row = Bytes.toBytesBinary("\\x00row" + i);
Put put = new Put(row); Put put = new Put(row);
put.addColumn(family, col1, value); put.addColumn(family, col1, value);
put.addColumn(family, col2, value); put.addColumn(family, col2, value);