From a6e9de3a0edd8b1d9320e48d47f594c75b80f4e3 Mon Sep 17 00:00:00 2001 From: Tomu Tsuruhara Date: Wed, 5 Apr 2017 21:42:28 +0900 Subject: [PATCH] HBASE-17871 scan#setBatch(int) call leads wrong result of VerifyReplication Signed-off-by: tedyu --- .../replication/VerifyReplication.java | 19 +++++++++++++++---- 1 file changed, 15 insertions(+), 4 deletions(-) diff --git a/hbase-server/src/main/java/org/apache/hadoop/hbase/mapreduce/replication/VerifyReplication.java b/hbase-server/src/main/java/org/apache/hadoop/hbase/mapreduce/replication/VerifyReplication.java index 365211033ef..1d429dcc6b4 100644 --- a/hbase-server/src/main/java/org/apache/hadoop/hbase/mapreduce/replication/VerifyReplication.java +++ b/hbase-server/src/main/java/org/apache/hadoop/hbase/mapreduce/replication/VerifyReplication.java @@ -78,7 +78,7 @@ public class VerifyReplication extends Configured implements Tool { private final static String PEER_CONFIG_PREFIX = NAME + ".peer."; static long startTime = 0; static long endTime = Long.MAX_VALUE; - static int batch = Integer.MAX_VALUE; + static int batch = -1; static int versions = -1; static String tableName = null; static String families = null; @@ -105,6 +105,7 @@ public class VerifyReplication extends Configured implements Tool { private int sleepMsBeforeReCompare; private String delimiter = ""; private boolean verbose = false; + private int batch = -1; /** * Map method that compares every scanned row with the equivalent from @@ -123,8 +124,11 @@ public class VerifyReplication extends Configured implements Tool { sleepMsBeforeReCompare = conf.getInt(NAME +".sleepMsBeforeReCompare", 0); delimiter = conf.get(NAME + ".delimiter", ""); verbose = conf.getBoolean(NAME +".verbose", false); + batch = conf.getInt(NAME + ".batch", -1); final Scan scan = new Scan(); - scan.setBatch(batch); + if (batch > 0) { + scan.setBatch(batch); + } scan.setCacheBlocks(false); scan.setCaching(conf.getInt(TableInputFormat.SCAN_CACHEDROWS, 1)); long startTime = conf.getLong(NAME + ".startTime", 0); @@ -318,6 +322,7 @@ public class VerifyReplication extends Configured implements Tool { conf.setLong(NAME+".endTime", endTime); conf.setInt(NAME +".sleepMsBeforeReCompare", sleepMsBeforeReCompare); conf.set(NAME + ".delimiter", delimiter); + conf.setInt(NAME + ".batch", batch); conf.setBoolean(NAME +".verbose", verbose); conf.setBoolean(NAME +".includeDeletedCells", includeDeletedCells); if (families != null) { @@ -345,6 +350,10 @@ public class VerifyReplication extends Configured implements Tool { Scan scan = new Scan(); scan.setTimeRange(startTime, endTime); scan.setRaw(includeDeletedCells); + scan.setCacheBlocks(false); + if (batch > 0) { + scan.setBatch(batch); + } if (versions >= 0) { scan.setMaxVersions(versions); LOG.info("Number of versions set to " + versions); @@ -493,7 +502,7 @@ public class VerifyReplication extends Configured implements Tool { private static void restoreDefaults() { startTime = 0; endTime = Long.MAX_VALUE; - batch = Integer.MAX_VALUE; + batch = -1; versions = -1; tableName = null; families = null; @@ -511,13 +520,15 @@ public class VerifyReplication extends Configured implements Tool { } System.err.println("Usage: verifyrep [--starttime=X]" + " [--endtime=Y] [--families=A] [--row-prefixes=B] [--delimiter=] [--recomparesleep=] " + - "[--verbose] "); + "[--batch=] [--verbose] "); System.err.println(); System.err.println("Options:"); System.err.println(" starttime beginning of the time range"); System.err.println(" without endtime means from starttime to forever"); System.err.println(" endtime end of the time range"); System.err.println(" versions number of cell versions to verify"); + System.err.println(" batch batch count for scan, " + + "note that result row counts will no longer be actual number of rows when you use this option"); System.err.println(" raw includes raw scan if given in options"); System.err.println(" families comma-separated list of families to copy"); System.err.println(" row-prefixes comma-separated list of row key prefixes to filter on ");