HBASE-2399 Forced splits only act on the first family in a table (Ming Ma)

git-svn-id: https://svn.apache.org/repos/asf/hbase/trunk@1158080 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Zhihong Yu 2011-08-16 01:16:43 +00:00
parent 4fae472fe1
commit 4b1b49635a
4 changed files with 119 additions and 31 deletions

View File

@ -199,6 +199,7 @@ Release 0.91.0 - Unreleased
   set in config file (Ming Ma)
   HBASE-4186  No region is added to regionsInTransitionInRS
   HBASE-4194  RegionSplitter: Split on under-loaded region servers first
   HBASE-2399  Forced splits only act on the first family in a table (Ming Ma)
  IMPROVEMENTS
   HBASE-3290  Max Compaction Size (Nicolas Spiegelberg via Stack)

View File

@ -3875,18 +3875,27 @@ public class HRegion implements HeapSize { // , Writable{
// nothing // nothing
} }
/**
* Return the splitpoint. null indicates the region isn't splittable
* If the splitpoint isn't explicitly specified, it will go over the stores
* to find the best splitpoint. Currently the criteria of best splitpoint
* is based on the size of the store.
*/
public byte[] checkSplit() { public byte[] checkSplit() {
if (this.splitPoint != null) { if (this.splitPoint != null) {
return this.splitPoint; return this.splitPoint;
} }
byte[] splitPoint = null; byte[] splitPointFromLargestStore = null;
long largestStoreSize = 0;
for (Store s : stores.values()) { for (Store s : stores.values()) {
splitPoint = s.checkSplit(); byte[] splitPoint = s.checkSplit();
if (splitPoint != null) { long storeSize = s.getSize();
return splitPoint; if (splitPoint != null && largestStoreSize < storeSize) {
splitPointFromLargestStore = splitPoint;
largestStoreSize = storeSize;
} }
} }
return null; return splitPointFromLargestStore;
} }
/** /**

View File

@ -699,6 +699,31 @@ public class HBaseTestingUtility {
return new HTable(new Configuration(getConfiguration()), tableName); return new HTable(new Configuration(getConfiguration()), tableName);
} }
/**
 * Create a table with the given column families, number of versions and
 * HFile block size, then return a client handle to it.
 *
 * @param tableName name of the table to create
 * @param families column family names; one HColumnDescriptor is created per entry
 * @param numVersions max number of versions kept for every family
 * @param blockSize HFile block size (bytes) applied to every family; small
 *        values yield many blocks per file, useful for split testing
 * @return An HTable instance for the created table.
 * @throws IOException if table creation fails
 */
public HTable createTable(byte[] tableName, byte[][] families,
int numVersions, int blockSize) throws IOException {
HTableDescriptor desc = new HTableDescriptor(tableName);
for (byte[] family : families) {
// All other HColumnDescriptor settings are left at their defaults.
HColumnDescriptor hcd = new HColumnDescriptor(family, numVersions,
HColumnDescriptor.DEFAULT_COMPRESSION,
HColumnDescriptor.DEFAULT_IN_MEMORY,
HColumnDescriptor.DEFAULT_BLOCKCACHE,
blockSize, HColumnDescriptor.DEFAULT_TTL,
HColumnDescriptor.DEFAULT_BLOOMFILTER,
HColumnDescriptor.DEFAULT_REPLICATION_SCOPE);
desc.addFamily(hcd);
}
getHBaseAdmin().createTable(desc);
// Hand back a fresh HTable bound to a copy of the test configuration.
return new HTable(new Configuration(getConfiguration()), tableName);
}
/** /**
* Create a table. * Create a table.
* @param tableName * @param tableName

View File

@ -564,29 +564,71 @@ public class TestAdmin {
*/ */
@Test @Test
public void testForceSplit() throws Exception { public void testForceSplit() throws Exception {
splitTest(null); byte[][] familyNames = new byte[][] { Bytes.toBytes("cf") };
splitTest(Bytes.toBytes("pwn")); int[] rowCounts = new int[] { 6000 };
} int numVersions = HColumnDescriptor.DEFAULT_VERSIONS;
int blockSize = 256;
splitTest(null, familyNames, rowCounts, numVersions, blockSize);
void splitTest(byte[] splitPoint) throws Exception { byte[] splitKey = Bytes.toBytes(3500);
byte [] familyName = HConstants.CATALOG_FAMILY; splitTest(splitKey, familyNames, rowCounts, numVersions, blockSize);
}
/**
 * Multi-family scenario. Tests forcing split from client and
 * having scanners successfully ride over split.
 * Covers both an unsplittable family alongside a splittable one, and two
 * splittable families of very different sizes (the split key must come from
 * the larger one — HBASE-2399).
 * @throws Exception on any test failure
 */
@Test
public void testForceSplitMultiFamily() throws Exception {
int numVersions = HColumnDescriptor.DEFAULT_VERSIONS;
// use small HFile block size so that we can have lots of blocks in HFile
// Otherwise, if there is only one block,
// HFileBlockIndex.midKey()'s value == startKey
int blockSize = 256;
byte[][] familyNames = new byte[][] { Bytes.toBytes("cf1"),
Bytes.toBytes("cf2") };

// one of the column families isn't splittable
int[] rowCounts = new int[] { 6000, 1 };
splitTest(null, familyNames, rowCounts, numVersions, blockSize);

rowCounts = new int[] { 1, 6000 };
splitTest(null, familyNames, rowCounts, numVersions, blockSize);

// one column family has much smaller data than the other
// the split key should be based on the largest column family
rowCounts = new int[] { 6000, 300 };
splitTest(null, familyNames, rowCounts, numVersions, blockSize);

rowCounts = new int[] { 300, 6000 };
splitTest(null, familyNames, rowCounts, numVersions, blockSize);
}
void splitTest(byte[] splitPoint, byte[][] familyNames, int[] rowCounts,
int numVersions, int blockSize) throws Exception {
byte [] tableName = Bytes.toBytes("testForceSplit"); byte [] tableName = Bytes.toBytes("testForceSplit");
assertFalse(admin.tableExists(tableName)); assertFalse(admin.tableExists(tableName));
final HTable table = TEST_UTIL.createTable(tableName, familyName); final HTable table = TEST_UTIL.createTable(tableName, familyNames,
numVersions, blockSize);
try { try {
byte[] k = new byte[3];
int rowCount = 0; int rowCount = 0;
for (byte b1 = 'a'; b1 < 'z'; b1++) {
for (byte b2 = 'a'; b2 < 'z'; b2++) { // insert rows into column families. The number of rows that have values
for (byte b3 = 'a'; b3 < 'z'; b3++) { // in a specific column family is decided by rowCounts[familyIndex]
k[0] = b1; for (int index = 0; index < familyNames.length; index++) {
k[1] = b2; for (int i = 0; i < rowCounts[index]; i++) {
k[2] = b3; byte[] k = Bytes.toBytes(i);
Put put = new Put(k); Put put = new Put(k);
put.add(familyName, new byte[0], k); put.add(familyNames[index], new byte[0], k);
table.put(put); table.put(put);
rowCount++; }
}
if ( rowCount < rowCounts[index] ) {
rowCount = rowCounts[index];
} }
} }
@ -651,21 +693,32 @@ public class TestAdmin {
scanner.close(); scanner.close();
assertEquals(rowCount, rows); assertEquals(rowCount, rows);
Map<HRegionInfo, HServerAddress> regions = null;
try {
regions = table.getRegionsInfo();
} catch (IOException e) {
e.printStackTrace();
}
assertEquals(2, regions.size());
HRegionInfo[] r = regions.keySet().toArray(new HRegionInfo[0]);
if (splitPoint != null) { if (splitPoint != null) {
// make sure the split point matches our explicit configuration // make sure the split point matches our explicit configuration
Map<HRegionInfo, HServerAddress> regions = null;
try {
regions = table.getRegionsInfo();
} catch (IOException e) {
e.printStackTrace();
}
assertEquals(2, regions.size());
HRegionInfo[] r = regions.keySet().toArray(new HRegionInfo[0]);
assertEquals(Bytes.toString(splitPoint), assertEquals(Bytes.toString(splitPoint),
Bytes.toString(r[0].getEndKey())); Bytes.toString(r[0].getEndKey()));
assertEquals(Bytes.toString(splitPoint), assertEquals(Bytes.toString(splitPoint),
Bytes.toString(r[1].getStartKey())); Bytes.toString(r[1].getStartKey()));
LOG.debug("Properly split on " + Bytes.toString(splitPoint)); LOG.debug("Properly split on " + Bytes.toString(splitPoint));
} else {
if (familyNames.length > 1) {
int splitKey = Bytes.toInt(r[0].getEndKey());
// check if splitKey is based on the largest column family
// in terms of it store size
int deltaForLargestFamily = Math.abs(rowCount/2 - splitKey);
for (int index = 0; index < familyNames.length; index++) {
int delta = Math.abs(rowCounts[index]/2 - splitKey);
assertTrue(delta >= deltaForLargestFamily);
}
}
} }
} finally { } finally {
TEST_UTIL.deleteTable(tableName); TEST_UTIL.deleteTable(tableName);