Refactor ByteBlockPool so it is just a "shift/mask big array" (#12625)

Moved all the hairy allocSlice stuff as static method in TermsHashPerField and I introduce a BytesRefBlockPool to encapsulate of the BytesRefHash write/read logic.
2023-10-18 08:10:48 +02:00 · 2023-10-18 08:10:48 +02:00 · 17ea6d5a0d
parent ea272d0eda
commit 17ea6d5a0d
15 changed files with 335 additions and 279 deletions
--- a/lucene/CHANGES.txt
+++ b/lucene/CHANGES.txt
@ -363,6 +363,8 @@ Other

 * GITHUB#12512: Remove unused variable in BKDWriter. (Chao Zhang)

+* GITHUB#12625: Refactor ByteBlockPool so it is just a "shift/mask big array". (Ignacio Vera)
+
 ======================== Lucene 9.7.0 =======================

 API Changes
--- a/lucene/core/src/java/org/apache/lucene/index/ByteSliceReader.java
+++ b/lucene/core/src/java/org/apache/lucene/index/ByteSliceReader.java
@ -53,7 +53,7 @@ final class ByteSliceReader extends DataInput {
    buffer = pool.buffers[bufferUpto];
    upto = startIndex & ByteBlockPool.BYTE_BLOCK_MASK;

-    final int firstSize = ByteBlockPool.LEVEL_SIZE_ARRAY[0];
+    final int firstSize = TermsHashPerField.LEVEL_SIZE_ARRAY[0];

    if (startIndex + firstSize >= endIndex) {
      // There is only this one slice to read
@ -97,8 +97,8 @@ final class ByteSliceReader extends DataInput {
    // Skip to our next slice
    final int nextIndex = (int) BitUtil.VH_LE_INT.get(buffer, limit);

-    level = ByteBlockPool.NEXT_LEVEL_ARRAY[level];
-    final int newSize = ByteBlockPool.LEVEL_SIZE_ARRAY[level];
+    level = TermsHashPerField.NEXT_LEVEL_ARRAY[level];
+    final int newSize = TermsHashPerField.LEVEL_SIZE_ARRAY[level];

    bufferUpto = nextIndex / ByteBlockPool.BYTE_BLOCK_SIZE;
    bufferOffset = bufferUpto * ByteBlockPool.BYTE_BLOCK_SIZE;
--- a/lucene/core/src/java/org/apache/lucene/index/FreqProxFields.java
+++ b/lucene/core/src/java/org/apache/lucene/index/FreqProxFields.java
@ -24,6 +24,7 @@ import java.util.Map;
 import org.apache.lucene.index.FreqProxTermsWriterPerField.FreqProxPostingsArray;
 import org.apache.lucene.util.AttributeSource;
 import org.apache.lucene.util.BytesRef;
+import org.apache.lucene.util.BytesRefBlockPool;
 import org.apache.lucene.util.BytesRefBuilder;

 /**
@ -120,6 +121,7 @@ class FreqProxFields extends Fields {

  private static class FreqProxTermsEnum extends BaseTermsEnum {
    final FreqProxTermsWriterPerField terms;
+    final BytesRefBlockPool termsPool;
    final int[] sortedTermIDs;
    final FreqProxPostingsArray postingsArray;
    final BytesRef scratch = new BytesRef();
@ -128,6 +130,7 @@ class FreqProxFields extends Fields {

    FreqProxTermsEnum(FreqProxTermsWriterPerField terms) {
      this.terms = terms;
+      this.termsPool = new BytesRefBlockPool(terms.bytePool);
      this.numTerms = terms.getNumTerms();
      sortedTermIDs = terms.getSortedTermIDs();
      assert sortedTermIDs != null;
@ -149,7 +152,7 @@ class FreqProxFields extends Fields {
      while (hi >= lo) {
        int mid = (lo + hi) >>> 1;
        int textStart = postingsArray.textStarts[sortedTermIDs[mid]];
-        terms.bytePool.setBytesRef(scratch, textStart);
+        termsPool.fillBytesRef(scratch, textStart);
        int cmp = scratch.compareTo(text);
        if (cmp < 0) {
          lo = mid + 1;
@ -169,7 +172,7 @@ class FreqProxFields extends Fields {
        return SeekStatus.END;
      } else {
        int textStart = postingsArray.textStarts[sortedTermIDs[ord]];
-        terms.bytePool.setBytesRef(scratch, textStart);
+        termsPool.fillBytesRef(scratch, textStart);
        assert term().compareTo(text) > 0;
        return SeekStatus.NOT_FOUND;
      }
@ -179,7 +182,7 @@ class FreqProxFields extends Fields {
    public void seekExact(long ord) {
      this.ord = (int) ord;
      int textStart = postingsArray.textStarts[sortedTermIDs[this.ord]];
-      terms.bytePool.setBytesRef(scratch, textStart);
+      termsPool.fillBytesRef(scratch, textStart);
    }

    @Override
@ -189,7 +192,7 @@ class FreqProxFields extends Fields {
        return null;
      } else {
        int textStart = postingsArray.textStarts[sortedTermIDs[ord]];
-        terms.bytePool.setBytesRef(scratch, textStart);
+        termsPool.fillBytesRef(scratch, textStart);
        return scratch;
      }
    }
--- a/lucene/core/src/java/org/apache/lucene/index/TermVectorsConsumerPerField.java
+++ b/lucene/core/src/java/org/apache/lucene/index/TermVectorsConsumerPerField.java
@ -21,8 +21,8 @@ import org.apache.lucene.analysis.tokenattributes.OffsetAttribute;
 import org.apache.lucene.analysis.tokenattributes.PayloadAttribute;
 import org.apache.lucene.analysis.tokenattributes.TermFrequencyAttribute;
 import org.apache.lucene.codecs.TermVectorsWriter;
-import org.apache.lucene.util.ByteBlockPool;
 import org.apache.lucene.util.BytesRef;
+import org.apache.lucene.util.BytesRefBlockPool;

 final class TermVectorsConsumerPerField extends TermsHashPerField {

@ -40,7 +40,7 @@ final class TermVectorsConsumerPerField extends TermsHashPerField {
  private OffsetAttribute offsetAttribute;
  private PayloadAttribute payloadAttribute;
  private TermFrequencyAttribute termFreqAtt;
-  private final ByteBlockPool termBytePool;
+  private final BytesRefBlockPool termBytePool;

  private boolean hasPayloads; // if enabled, and we actually saw any for this field

@ -58,7 +58,7 @@ final class TermVectorsConsumerPerField extends TermsHashPerField {
    this.termsWriter = termsHash;
    this.fieldInfo = fieldInfo;
    this.fieldState = invertState;
-    termBytePool = termsHash.termBytePool;
+    termBytePool = new BytesRefBlockPool(termsHash.termBytePool);
  }

  /**
@ -106,7 +106,7 @@ final class TermVectorsConsumerPerField extends TermsHashPerField {
      final int freq = postings.freqs[termID];

      // Get BytesRef
-      termBytePool.setBytesRef(flushTerm, postings.textStarts[termID]);
+      termBytePool.fillBytesRef(flushTerm, postings.textStarts[termID]);
      tv.startTerm(flushTerm, freq);

      if (doVectorPositions || doVectorOffsets) {
--- a/lucene/core/src/java/org/apache/lucene/index/TermsHashPerField.java
+++ b/lucene/core/src/java/org/apache/lucene/index/TermsHashPerField.java
@ -17,6 +17,7 @@
 package org.apache.lucene.index;

 import java.io.IOException;
+import org.apache.lucene.util.BitUtil;
 import org.apache.lucene.util.ByteBlockPool;
 import org.apache.lucene.util.BytesRef;
 import org.apache.lucene.util.BytesRefHash;
@ -97,7 +98,7 @@ abstract class TermsHashPerField implements Comparable<TermsHashPerField> {
    final int offsetInAddressBuffer = streamStartOffset & IntBlockPool.INT_BLOCK_MASK;
    reader.init(
        bytePool,
-        postingsArray.byteStarts[termID] + stream * ByteBlockPool.FIRST_LEVEL_SIZE,
+        postingsArray.byteStarts[termID] + stream * FIRST_LEVEL_SIZE,
        streamAddressBuffer[offsetInAddressBuffer + stream]);
  }

@ -153,8 +154,7 @@ abstract class TermsHashPerField implements Comparable<TermsHashPerField> {
      intPool.nextBuffer();
    }

-    if (ByteBlockPool.BYTE_BLOCK_SIZE - bytePool.byteUpto
-        < (2 * streamCount) * ByteBlockPool.FIRST_LEVEL_SIZE) {
+    if (ByteBlockPool.BYTE_BLOCK_SIZE - bytePool.byteUpto < (2 * streamCount) * FIRST_LEVEL_SIZE) {
      // can we fit at least one byte per stream in the current buffer, if not allocate a new one
      bytePool.nextBuffer();
    }
@ -168,7 +168,7 @@ abstract class TermsHashPerField implements Comparable<TermsHashPerField> {
    for (int i = 0; i < streamCount; i++) {
      // initialize each stream with a slice we start with ByteBlockPool.FIRST_LEVEL_SIZE)
      // and grow as we need more space. see ByteBlockPool.LEVEL_SIZE_ARRAY
-      final int upto = bytePool.newSlice(ByteBlockPool.FIRST_LEVEL_SIZE);
+      final int upto = newSlice(bytePool, FIRST_LEVEL_SIZE, 0);
      termStreamAddressBuffer[streamAddressOffset + i] = upto + bytePool.byteOffset;
    }
    postingsArray.byteStarts[termID] = termStreamAddressBuffer[streamAddressOffset];
@ -221,7 +221,7 @@ abstract class TermsHashPerField implements Comparable<TermsHashPerField> {
    int offset = upto & ByteBlockPool.BYTE_BLOCK_MASK;
    if (bytes[offset] != 0) {
      // End of slice; allocate a new one
-      offset = bytePool.allocSlice(bytes, offset);
+      offset = allocSlice(bytePool, bytes, offset);
      bytes = bytePool.buffer;
      termStreamAddressBuffer[streamAddress] = offset + bytePool.byteOffset;
    }
@ -243,7 +243,7 @@ abstract class TermsHashPerField implements Comparable<TermsHashPerField> {
    }

    while (offset < end) {
-      int offsetAndLength = bytePool.allocKnownSizeSlice(slice, sliceOffset);
+      int offsetAndLength = allocKnownSizeSlice(bytePool, slice, sliceOffset);
      sliceOffset = offsetAndLength >> 8;
      int sliceLength = offsetAndLength & 0xff;
      slice = bytePool.buffer;
@ -255,6 +255,81 @@ abstract class TermsHashPerField implements Comparable<TermsHashPerField> {
    }
  }

+  // Size of each slice.  These arrays should be at most 16
+  // elements (index is encoded with 4 bits).  First array
+  // is just a compact way to encode X+1 with a max.  Second
+  // array is the length of each slice, ie first slice is 5
+  // bytes, next slice is 14 bytes, etc.
+
+  /**
+   * An array holding the offset into the {@link #LEVEL_SIZE_ARRAY} to quickly navigate to the next
+   * slice level.
+   */
+  static final int[] NEXT_LEVEL_ARRAY = {1, 2, 3, 4, 5, 6, 7, 8, 9, 9};
+
+  /** An array holding the level sizes for byte slices. */
+  static final int[] LEVEL_SIZE_ARRAY = {5, 14, 20, 30, 40, 40, 80, 80, 120, 200};
+
+  /** The first level size for new slices */
+  static final int FIRST_LEVEL_SIZE = LEVEL_SIZE_ARRAY[0];
+
+  /**
+   * Allocates a new slice with the given size. As each slice is filled with 0's initially, we mark
+   * the end with a non-zero byte. This way we don't need to record its length and instead allocate
+   * new slice once they hit a non-zero byte.
+   */
+  // pkg private for access by tests
+  static int newSlice(ByteBlockPool bytePool, final int size, final int level) {
+    assert LEVEL_SIZE_ARRAY[level] == size;
+    // Maybe allocate another block
+    if (bytePool.byteUpto > ByteBlockPool.BYTE_BLOCK_SIZE - size) {
+      bytePool.nextBuffer();
+    }
+    final int upto = bytePool.byteUpto;
+    bytePool.byteUpto += size;
+    bytePool.buffer[bytePool.byteUpto - 1] = (byte) (16 | level);
+    return upto;
+  }
+
+  /**
+   * Creates a new byte slice with the given starting size and returns the slices offset in the
+   * pool.
+   */
+  // pkg private for access by tests
+  static int allocSlice(ByteBlockPool bytePool, final byte[] slice, final int upto) {
+    return allocKnownSizeSlice(bytePool, slice, upto) >> 8;
+  }
+
+  /**
+   * Create a new byte slice with the given starting size return the slice offset in the pool and
+   * length. The lower 8 bits of the returned int represent the length of the slice, and the upper
+   * 24 bits represent the offset.
+   */
+  // pkg private for access by tests
+  static int allocKnownSizeSlice(ByteBlockPool bytePool, final byte[] slice, final int upto) {
+    // The idea is to allocate the next slice and then write the address of the new slice
+    // into the last 4 bytes of the previous slice (the "forwarding address").
+    final int level = slice[upto] & 15;
+    final int newLevel = NEXT_LEVEL_ARRAY[level];
+    final int newSize = LEVEL_SIZE_ARRAY[newLevel];
+
+    final int newUpto = newSlice(bytePool, newSize, newLevel);
+    final int offset = newUpto + bytePool.byteOffset;
+
+    // Copy forward the past 3 bytes (which we are about to overwrite with the forwarding address).
+    // We actually copy 4 bytes at once since VarHandles make it cheap.
+    final int past3Bytes = ((int) BitUtil.VH_LE_INT.get(slice, upto - 3)) & 0xFFFFFF;
+    // Ensure we're not changing the content of `buffer` by setting 4 bytes instead of 3. This
+    // should never happen since the next `newSize` bytes must be equal to 0.
+    assert bytePool.buffer[newUpto + 3] == 0;
+    BitUtil.VH_LE_INT.set(bytePool.buffer, newUpto, past3Bytes);
+
+    // Write forwarding address at end of last slice:
+    BitUtil.VH_LE_INT.set(slice, upto - 3, offset);
+
+    return ((newUpto + 3) << 8) | (newSize - 3);
+  }
+
  final void writeVInt(int stream, int i) {
    assert stream < streamCount;
    while ((i & ~0x7F) != 0) {
--- a/lucene/core/src/java/org/apache/lucene/util/ByteBlockPool.java
+++ b/lucene/core/src/java/org/apache/lucene/util/ByteBlockPool.java
@ -22,15 +22,9 @@ import java.util.Arrays;
 import java.util.List;

 /**
- * Class that Posting and PostingVector use to write byte streams into shared fixed-size byte[]
- * arrays. The idea is to allocate slices of increasing lengths For example, the first slice is 5
- * bytes, the next slice is 14, etc. We start by writing our bytes into the first 5 bytes. When we
- * hit the end of the slice, we allocate the next slice and then write the address of the new slice
- * into the last 4 bytes of the previous slice (the "forwarding address").
- *
- * <p>Each slice is filled with 0's initially, and we mark the end with a non-zero byte. This way
- * the methods that are writing into the slice don't need to record its length and instead allocate
- * a new slice once they hit a non-zero byte.
+ * Represents a logical byte[] as a series of blocks. You can write into it by using append and read
+ * using the offset position (random access). The buffers can be reset to reuse the allocated
+ * buffers.
 *
 * @lucene.internal
 */
@ -66,11 +60,7 @@ public final class ByteBlockPool implements Accountable {
  public static final class DirectAllocator extends Allocator {

    public DirectAllocator() {
-      this(BYTE_BLOCK_SIZE);
-    }
-
-    public DirectAllocator(int blockSize) {
-      super(blockSize);
+      super(BYTE_BLOCK_SIZE);
    }

    @Override
@ -82,11 +72,7 @@ public final class ByteBlockPool implements Accountable {
    private final Counter bytesUsed;

    public DirectTrackingAllocator(Counter bytesUsed) {
-      this(BYTE_BLOCK_SIZE, bytesUsed);
-    }
-
-    public DirectTrackingAllocator(int blockSize, Counter bytesUsed) {
-      super(blockSize);
+      super(BYTE_BLOCK_SIZE);
      this.bytesUsed = bytesUsed;
    }

@ -202,85 +188,6 @@ public final class ByteBlockPool implements Accountable {
    byteOffset = Math.addExact(byteOffset, BYTE_BLOCK_SIZE);
  }

-  /**
-   * Allocates a new slice with the given size.
-   *
-   * @see ByteBlockPool#FIRST_LEVEL_SIZE
-   */
-  public int newSlice(final int size) {
-    if (byteUpto > BYTE_BLOCK_SIZE - size) nextBuffer();
-    final int upto = byteUpto;
-    byteUpto += size;
-    buffer[byteUpto - 1] = 16;
-    return upto;
-  }
-
-  // Size of each slice.  These arrays should be at most 16
-  // elements (index is encoded with 4 bits).  First array
-  // is just a compact way to encode X+1 with a max.  Second
-  // array is the length of each slice, ie first slice is 5
-  // bytes, next slice is 14 bytes, etc.
-
-  /**
-   * An array holding the offset into the {@link ByteBlockPool#LEVEL_SIZE_ARRAY} to quickly navigate
-   * to the next slice level.
-   */
-  public static final int[] NEXT_LEVEL_ARRAY = {1, 2, 3, 4, 5, 6, 7, 8, 9, 9};
-
-  /** An array holding the level sizes for byte slices. */
-  public static final int[] LEVEL_SIZE_ARRAY = {5, 14, 20, 30, 40, 40, 80, 80, 120, 200};
-
-  /**
-   * The first level size for new slices
-   *
-   * @see ByteBlockPool#newSlice(int)
-   */
-  public static final int FIRST_LEVEL_SIZE = LEVEL_SIZE_ARRAY[0];
-
-  /**
-   * Creates a new byte slice with the given starting size and returns the slices offset in the
-   * pool.
-   */
-  public int allocSlice(final byte[] slice, final int upto) {
-    return allocKnownSizeSlice(slice, upto) >> 8;
-  }
-
-  /**
-   * Create a new byte slice with the given starting size return the slice offset in the pool and
-   * length. The lower 8 bits of the returned int represent the length of the slice, and the upper
-   * 24 bits represent the offset.
-   */
-  public int allocKnownSizeSlice(final byte[] slice, final int upto) {
-    final int level = slice[upto] & 15;
-    final int newLevel = NEXT_LEVEL_ARRAY[level];
-    final int newSize = LEVEL_SIZE_ARRAY[newLevel];
-
-    // Maybe allocate another block
-    if (byteUpto > BYTE_BLOCK_SIZE - newSize) {
-      nextBuffer();
-    }
-
-    final int newUpto = byteUpto;
-    final int offset = newUpto + byteOffset;
-    byteUpto += newSize;
-
-    // Copy forward the past 3 bytes (which we are about to overwrite with the forwarding address).
-    // We actually copy 4 bytes at once since VarHandles make it cheap.
-    int past3Bytes = ((int) BitUtil.VH_LE_INT.get(slice, upto - 3)) & 0xFFFFFF;
-    // Ensure we're not changing the content of `buffer` by setting 4 bytes instead of 3. This
-    // should never happen since the next `newSize` bytes must be equal to 0.
-    assert buffer[newUpto + 3] == 0;
-    BitUtil.VH_LE_INT.set(buffer, newUpto, past3Bytes);
-
-    // Write forwarding address at end of last slice:
-    BitUtil.VH_LE_INT.set(slice, upto - 3, offset);
-
-    // Write new level:
-    buffer[byteUpto - 1] = (byte) (16 | newLevel);
-
-    return ((newUpto + 3) << 8) | (newSize - 3);
-  }
-
  /**
   * Fill the provided {@link BytesRef} with the bytes at the specified offset/length slice. This
   * will avoid copying the bytes, if the slice fits into a single block; otherwise, it uses the
@ -306,23 +213,6 @@ public final class ByteBlockPool implements Accountable {
    }
  }

-  // Fill in a BytesRef from term's length & bytes encoded in
-  // byte block
-  public void setBytesRef(BytesRef term, int textStart) {
-    final byte[] bytes = term.bytes = buffers[textStart >> BYTE_BLOCK_SHIFT];
-    int pos = textStart & BYTE_BLOCK_MASK;
-    if ((bytes[pos] & 0x80) == 0) {
-      // length is 1 byte
-      term.length = bytes[pos];
-      term.offset = pos + 1;
-    } else {
-      // length is 2 bytes
-      term.length = ((short) BitUtil.VH_BE_SHORT.get(bytes, pos)) & 0x7FFF;
-      term.offset = pos + 2;
-    }
-    assert term.length >= 0;
-  }
-
  /** Appends the bytes in the provided {@link BytesRef} at the current position. */
  public void append(final BytesRef bytes) {
    int bytesLeft = bytes.length;
@ -366,26 +256,6 @@ public final class ByteBlockPool implements Accountable {
    }
  }

-  /**
-   * Set the given {@link BytesRef} so that its content is equal to the {@code ref.length} bytes
-   * starting at {@code offset}. Most of the time this method will set pointers to internal
-   * data-structures. However, in case a value crosses a boundary, a fresh copy will be returned. On
-   * the contrary to {@link #setBytesRef(BytesRef, int)}, this does not expect the length to be
-   * encoded with the data.
-   */
-  public void setRawBytesRef(BytesRef ref, final long offset) {
-    int bufferIndex = (int) (offset >> BYTE_BLOCK_SHIFT);
-    int pos = (int) (offset & BYTE_BLOCK_MASK);
-    if (pos + ref.length <= BYTE_BLOCK_SIZE) {
-      ref.bytes = buffers[bufferIndex];
-      ref.offset = pos;
-    } else {
-      ref.bytes = new byte[ref.length];
-      ref.offset = 0;
-      readBytes(offset, ref.bytes, 0, ref.length);
-    }
-  }
-
  @Override
  public long ramBytesUsed() {
    long size = BASE_RAM_BYTES;
--- a/lucene/core/src/java/org/apache/lucene/util/BytesRefBlockPool.java
+++ b/lucene/core/src/java/org/apache/lucene/util/BytesRefBlockPool.java
@ -0,0 +1,176 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.lucene.util;
+
+import static org.apache.lucene.util.ByteBlockPool.BYTE_BLOCK_MASK;
+import static org.apache.lucene.util.ByteBlockPool.BYTE_BLOCK_SHIFT;
+import static org.apache.lucene.util.ByteBlockPool.BYTE_BLOCK_SIZE;
+
+import java.util.Arrays;
+
+/**
+ * Represents a logical list of ByteRef backed by a {@link ByteBlockPool}. It uses up to two bytes
+ * to record the length of the BytesRef followed by the actual bytes. They can be read using the
+ * start position returned when they are appended.
+ *
+ * <p>The {@link BytesRef} is written so it never crosses the {@link ByteBlockPool#BYTE_BLOCK_SIZE}
+ * boundary. The limit of the largest {@link BytesRef} is therefore {@link
+ * ByteBlockPool#BYTE_BLOCK_SIZE}-2 bytes.
+ *
+ * @lucene.internal
+ */
+public class BytesRefBlockPool implements Accountable {
+
+  private static final long BASE_RAM_BYTES =
+      RamUsageEstimator.shallowSizeOfInstance(BytesRefBlockPool.class);
+
+  private final ByteBlockPool byteBlockPool;
+
+  public BytesRefBlockPool() {
+    this.byteBlockPool = new ByteBlockPool(new ByteBlockPool.DirectAllocator());
+  }
+
+  public BytesRefBlockPool(ByteBlockPool byteBlockPool) {
+    this.byteBlockPool = byteBlockPool;
+  }
+
+  /** Reset this buffer to the empty state. */
+  void reset() {
+    byteBlockPool.reset(false, false); // we don't need to 0-fill the buffers
+  }
+
+  /**
+   * Populates the given BytesRef with the term starting at <i>start</i>.
+   *
+   * @see #fillBytesRef(BytesRef, int)
+   */
+  public void fillBytesRef(BytesRef term, int start) {
+    final byte[] bytes = term.bytes = byteBlockPool.buffers[start >> BYTE_BLOCK_SHIFT];
+    int pos = start & BYTE_BLOCK_MASK;
+    if ((bytes[pos] & 0x80) == 0) {
+      // length is 1 byte
+      term.length = bytes[pos];
+      term.offset = pos + 1;
+    } else {
+      // length is 2 bytes
+      term.length = ((short) BitUtil.VH_BE_SHORT.get(bytes, pos)) & 0x7FFF;
+      term.offset = pos + 2;
+    }
+    assert term.length >= 0;
+  }
+
+  /**
+   * Add a term returning the start position on the underlying {@link ByteBlockPool}. THis can be
+   * used to read back the value using {@link #fillBytesRef(BytesRef, int)}.
+   *
+   * @see #fillBytesRef(BytesRef, int)
+   */
+  public int addBytesRef(BytesRef bytes) {
+    final int length = bytes.length;
+    final int len2 = 2 + bytes.length;
+    if (len2 + byteBlockPool.byteUpto > BYTE_BLOCK_SIZE) {
+      if (len2 > BYTE_BLOCK_SIZE) {
+        throw new BytesRefHash.MaxBytesLengthExceededException(
+            "bytes can be at most " + (BYTE_BLOCK_SIZE - 2) + " in length; got " + bytes.length);
+      }
+      byteBlockPool.nextBuffer();
+    }
+    final byte[] buffer = byteBlockPool.buffer;
+    final int bufferUpto = byteBlockPool.byteUpto;
+    final int textStart = bufferUpto + byteBlockPool.byteOffset;
+
+    // We first encode the length, followed by the
+    // bytes. Length is encoded as vInt, but will consume
+    // 1 or 2 bytes at most (we reject too-long terms,
+    // above).
+    if (length < 128) {
+      // 1 byte to store length
+      buffer[bufferUpto] = (byte) length;
+      byteBlockPool.byteUpto += length + 1;
+      assert length >= 0 : "Length must be positive: " + length;
+      System.arraycopy(bytes.bytes, bytes.offset, buffer, bufferUpto + 1, length);
+    } else {
+      // 2 byte to store length
+      BitUtil.VH_BE_SHORT.set(buffer, bufferUpto, (short) (length | 0x8000));
+      byteBlockPool.byteUpto += length + 2;
+      System.arraycopy(bytes.bytes, bytes.offset, buffer, bufferUpto + 2, length);
+    }
+    return textStart;
+  }
+
+  /**
+   * Computes the hash of the BytesRef at the given start. This is equivalent of doing:
+   *
+   * <pre>
+   *     BytesRef bytes = new BytesRef();
+   *     fillTerm(bytes, start);
+   *     BytesRefHash.doHash(bytes.bytes, bytes.pos, bytes.len);
+   *  </pre>
+   *
+   * It just saves the work of filling the BytesRef.
+   */
+  int hash(int start) {
+    final int offset = start & BYTE_BLOCK_MASK;
+    final byte[] bytes = byteBlockPool.buffers[start >> BYTE_BLOCK_SHIFT];
+    final int len;
+    int pos;
+    if ((bytes[offset] & 0x80) == 0) {
+      // length is 1 byte
+      len = bytes[offset];
+      pos = offset + 1;
+    } else {
+      len = ((short) BitUtil.VH_BE_SHORT.get(bytes, offset)) & 0x7FFF;
+      pos = offset + 2;
+    }
+    return BytesRefHash.doHash(bytes, pos, len);
+  }
+
+  /**
+   * Computes the equality between the BytesRef at the start position with the provided BytesRef.
+   * This is equivalent of doing:
+   *
+   * <pre>
+   *     BytesRef bytes = new BytesRef();
+   *     fillTerm(bytes, start);
+   *     Arrays.equals(bytes.bytes, bytes.offset, bytes.offset + length, b.bytes, b.offset, b.offset + b.length);
+   *  </pre>
+   *
+   * It just saves the work of filling the BytesRef.
+   */
+  boolean equals(int start, BytesRef b) {
+    final byte[] bytes = byteBlockPool.buffers[start >> BYTE_BLOCK_SHIFT];
+    int pos = start & BYTE_BLOCK_MASK;
+    final int length;
+    final int offset;
+    if ((bytes[pos] & 0x80) == 0) {
+      // length is 1 byte
+      length = bytes[pos];
+      offset = pos + 1;
+    } else {
+      // length is 2 bytes
+      length = ((short) BitUtil.VH_BE_SHORT.get(bytes, pos)) & 0x7FFF;
+      offset = pos + 2;
+    }
+    return Arrays.equals(bytes, offset, offset + length, b.bytes, b.offset, b.offset + b.length);
+  }
+
+  @Override
+  public long ramBytesUsed() {
+    return BASE_RAM_BYTES + byteBlockPool.ramBytesUsed();
+  }
+}
--- a/lucene/core/src/java/org/apache/lucene/util/BytesRefHash.java
+++ b/lucene/core/src/java/org/apache/lucene/util/BytesRefHash.java
@ -16,10 +16,6 @@
 */
 package org.apache.lucene.util;

-import static org.apache.lucene.util.ByteBlockPool.BYTE_BLOCK_MASK;
-import static org.apache.lucene.util.ByteBlockPool.BYTE_BLOCK_SHIFT;
-import static org.apache.lucene.util.ByteBlockPool.BYTE_BLOCK_SIZE;
-
 import java.util.Arrays;
 import java.util.concurrent.atomic.AtomicLong;
 import org.apache.lucene.util.ByteBlockPool.DirectAllocator;
@ -48,7 +44,7 @@ public final class BytesRefHash implements Accountable {

  // the following fields are needed by comparator,
  // so package private to prevent access$-methods:
-  final ByteBlockPool pool;
+  final BytesRefBlockPool pool;
  int[] bytesStart;

  private int hashSize;
@ -58,7 +54,7 @@ public final class BytesRefHash implements Accountable {
  private int lastCount = -1;
  private int[] ids;
  private final BytesStartArray bytesStartArray;
-  private Counter bytesUsed;
+  private final Counter bytesUsed;

  /**
   * Creates a new {@link BytesRefHash} with a {@link ByteBlockPool} using a {@link
@ -78,7 +74,7 @@ public final class BytesRefHash implements Accountable {
    hashSize = capacity;
    hashHalfSize = hashSize >> 1;
    hashMask = hashSize - 1;
-    this.pool = pool;
+    this.pool = new BytesRefBlockPool(pool);
    ids = new int[hashSize];
    Arrays.fill(ids, -1);
    this.bytesStartArray = bytesStartArray;
@ -110,7 +106,7 @@ public final class BytesRefHash implements Accountable {
  public BytesRef get(int bytesID, BytesRef ref) {
    assert bytesStart != null : "bytesStart is null - not initialized";
    assert bytesID < bytesStart.length : "bytesID exceeds byteStart len: " + bytesStart.length;
-    pool.setBytesRef(ref, bytesStart[bytesID]);
+    pool.fillBytesRef(ref, bytesStart[bytesID]);
    return ref;
  }

@ -160,30 +156,12 @@ public final class BytesRefHash implements Accountable {

      @Override
      protected void get(BytesRefBuilder builder, BytesRef result, int i) {
-        pool.setBytesRef(result, bytesStart[compact[i]]);
+        pool.fillBytesRef(result, bytesStart[compact[i]]);
      }
    }.sort(0, count);
    return compact;
  }

-  private boolean equals(int id, BytesRef b) {
-    final int textStart = bytesStart[id];
-    final byte[] bytes = pool.buffers[textStart >> BYTE_BLOCK_SHIFT];
-    int pos = textStart & BYTE_BLOCK_MASK;
-    final int length;
-    final int offset;
-    if ((bytes[pos] & 0x80) == 0) {
-      // length is 1 byte
-      length = bytes[pos];
-      offset = pos + 1;
-    } else {
-      // length is 2 bytes
-      length = ((short) BitUtil.VH_BE_SHORT.get(bytes, pos)) & 0x7FFF;
-      offset = pos + 2;
-    }
-    return Arrays.equals(bytes, offset, offset + length, b.bytes, b.offset, b.offset + b.length);
-  }
-
  private boolean shrink(int targetSize) {
    // Cannot use ArrayUtil.shrink because we require power
    // of 2:
@ -209,7 +187,7 @@ public final class BytesRefHash implements Accountable {
    lastCount = count;
    count = 0;
    if (resetPool) {
-      pool.reset(false, false); // we don't need to 0-fill the buffers
+      pool.reset();
    }
    bytesStart = bytesStartArray.clear();
    if (lastCount != -1 && shrink(lastCount)) {
@ -242,47 +220,18 @@ public final class BytesRefHash implements Accountable {
   */
  public int add(BytesRef bytes) {
    assert bytesStart != null : "Bytesstart is null - not initialized";
-    final int length = bytes.length;
    // final position
    final int hashPos = findHash(bytes);
    int e = ids[hashPos];

    if (e == -1) {
      // new entry
-      final int len2 = 2 + bytes.length;
-      if (len2 + pool.byteUpto > BYTE_BLOCK_SIZE) {
-        if (len2 > BYTE_BLOCK_SIZE) {
-          throw new MaxBytesLengthExceededException(
-              "bytes can be at most " + (BYTE_BLOCK_SIZE - 2) + " in length; got " + bytes.length);
-        }
-        pool.nextBuffer();
-      }
-      final byte[] buffer = pool.buffer;
-      final int bufferUpto = pool.byteUpto;
      if (count >= bytesStart.length) {
        bytesStart = bytesStartArray.grow();
        assert count < bytesStart.length + 1 : "count: " + count + " len: " + bytesStart.length;
      }
+      bytesStart[count] = pool.addBytesRef(bytes);
      e = count++;
-
-      bytesStart[e] = bufferUpto + pool.byteOffset;
-
-      // We first encode the length, followed by the
-      // bytes. Length is encoded as vInt, but will consume
-      // 1 or 2 bytes at most (we reject too-long terms,
-      // above).
-      if (length < 128) {
-        // 1 byte to store length
-        buffer[bufferUpto] = (byte) length;
-        pool.byteUpto += length + 1;
-        assert length >= 0 : "Length must be positive: " + length;
-        System.arraycopy(bytes.bytes, bytes.offset, buffer, bufferUpto + 1, length);
-      } else {
-        // 2 byte to store length
-        BitUtil.VH_BE_SHORT.set(buffer, bufferUpto, (short) (length | 0x8000));
-        pool.byteUpto += length + 2;
-        System.arraycopy(bytes.bytes, bytes.offset, buffer, bufferUpto + 2, length);
-      }
      assert ids[hashPos] == -1;
      ids[hashPos] = e;

@ -312,14 +261,14 @@ public final class BytesRefHash implements Accountable {
    // final position
    int hashPos = code & hashMask;
    int e = ids[hashPos];
-    if (e != -1 && !equals(e, bytes)) {
+    if (e != -1 && pool.equals(bytesStart[e], bytes) == false) {
      // Conflict; use linear probe to find an open slot
      // (see LUCENE-5604):
      do {
        code++;
        hashPos = code & hashMask;
        e = ids[hashPos];
-      } while (e != -1 && !equals(e, bytes));
+      } while (e != -1 && pool.equals(bytesStart[e], bytes) == false);
    }

    return hashPos;
@ -378,20 +327,7 @@ public final class BytesRefHash implements Accountable {
      if (e0 != -1) {
        int code;
        if (hashOnData) {
-          final int off = bytesStart[e0];
-          final int start = off & BYTE_BLOCK_MASK;
-          final byte[] bytes = pool.buffers[off >> BYTE_BLOCK_SHIFT];
-          final int len;
-          int pos;
-          if ((bytes[start] & 0x80) == 0) {
-            // length is 1 byte
-            len = bytes[start];
-            pos = start + 1;
-          } else {
-            len = ((short) BitUtil.VH_BE_SHORT.get(bytes, start)) & 0x7FFF;
-            pos = start + 2;
-          }
-          code = doHash(bytes, pos, len);
+          code = pool.hash(bytesStart[e0]);
        } else {
          code = bytesStart[e0];
        }
@ -418,7 +354,7 @@ public final class BytesRefHash implements Accountable {
  }

  // TODO: maybe use long?  But our keys are typically short...
-  private int doHash(byte[] bytes, int offset, int length) {
+  static int doHash(byte[] bytes, int offset, int length) {
    return StringHelper.murmurhash3_x86_32(bytes, offset, length, StringHelper.GOOD_FAST_HASH_SEED);
  }

--- a/lucene/core/src/java/org/apache/lucene/util/RecyclingByteBlockAllocator.java
+++ b/lucene/core/src/java/org/apache/lucene/util/RecyclingByteBlockAllocator.java
@ -36,12 +36,11 @@ public final class RecyclingByteBlockAllocator extends ByteBlockPool.Allocator {
  /**
   * Creates a new {@link RecyclingByteBlockAllocator}
   *
-   * @param blockSize the block size in bytes
   * @param maxBufferedBlocks maximum number of buffered byte block
   * @param bytesUsed {@link Counter} reference counting internally allocated bytes
   */
-  public RecyclingByteBlockAllocator(int blockSize, int maxBufferedBlocks, Counter bytesUsed) {
-    super(blockSize);
+  public RecyclingByteBlockAllocator(int maxBufferedBlocks, Counter bytesUsed) {
+    super(ByteBlockPool.BYTE_BLOCK_SIZE);
    freeByteBlocks = new byte[maxBufferedBlocks][];
    this.maxBufferedBlocks = maxBufferedBlocks;
    this.bytesUsed = bytesUsed;
@ -50,11 +49,10 @@ public final class RecyclingByteBlockAllocator extends ByteBlockPool.Allocator {
  /**
   * Creates a new {@link RecyclingByteBlockAllocator}.
   *
-   * @param blockSize the block size in bytes
   * @param maxBufferedBlocks maximum number of buffered byte block
   */
-  public RecyclingByteBlockAllocator(int blockSize, int maxBufferedBlocks) {
-    this(blockSize, maxBufferedBlocks, Counter.newCounter(false));
+  public RecyclingByteBlockAllocator(int maxBufferedBlocks) {
+    this(maxBufferedBlocks, Counter.newCounter(false));
  }

  /**
@ -63,7 +61,7 @@ public final class RecyclingByteBlockAllocator extends ByteBlockPool.Allocator {
   * ({@value #DEFAULT_BUFFERED_BLOCKS}).
   */
  public RecyclingByteBlockAllocator() {
-    this(ByteBlockPool.BYTE_BLOCK_SIZE, 64, Counter.newCounter(false));
+    this(DEFAULT_BUFFERED_BLOCKS, Counter.newCounter(false));
  }

  @Override
--- a/lucene/core/src/test/org/apache/lucene/index/TestByteSliceReader.java
+++ b/lucene/core/src/test/org/apache/lucene/index/TestByteSliceReader.java
@ -37,10 +37,10 @@ public class TestByteSliceReader extends LuceneTestCase {
    BLOCK_POOL = new ByteBlockPool(new ByteBlockPool.DirectAllocator());
    BLOCK_POOL.nextBuffer();
    byte[] buffer = BLOCK_POOL.buffer;
-    int upto = BLOCK_POOL.newSlice(ByteBlockPool.FIRST_LEVEL_SIZE);
+    int upto = TermsHashPerField.newSlice(BLOCK_POOL, TermsHashPerField.FIRST_LEVEL_SIZE, 0);
    for (byte randomByte : RANDOM_DATA) {
      if ((buffer[upto] & 16) != 0) {
-        upto = BLOCK_POOL.allocSlice(buffer, upto);
+        upto = TermsHashPerField.allocSlice(BLOCK_POOL, buffer, upto);
        buffer = BLOCK_POOL.buffer;
      }
      buffer[upto++] = randomByte;
--- a/lucene/core/src/test/org/apache/lucene/index/TestTermsHashPerField.java
+++ b/lucene/core/src/test/org/apache/lucene/index/TestTermsHashPerField.java
@ -323,4 +323,38 @@ public class TestTermsHashPerField extends LuceneTestCase {
      }
    }
  }
+
+  public void testAllocKnowSizeSlice() {
+    Counter bytesUsed = Counter.newCounter();
+    ByteBlockPool pool = new ByteBlockPool(new ByteBlockPool.DirectTrackingAllocator(bytesUsed));
+    pool.nextBuffer();
+    for (int i = 0; i < 100; i++) {
+      int size;
+      if (random().nextBoolean()) {
+        size = TestUtil.nextInt(random(), 100, 1000);
+      } else {
+        size = TestUtil.nextInt(random(), 50000, 100000);
+      }
+      byte[] randomData = new byte[size];
+      random().nextBytes(randomData);
+
+      int upto = TermsHashPerField.newSlice(pool, TermsHashPerField.FIRST_LEVEL_SIZE, 0);
+
+      for (int offset = 0; offset < size; ) {
+        if ((pool.buffer[upto] & 16) == 0) {
+          pool.buffer[upto++] = randomData[offset++];
+        } else {
+          int offsetAndLength = TermsHashPerField.allocKnownSizeSlice(pool, pool.buffer, upto);
+          int sliceLength = offsetAndLength & 0xff;
+          upto = offsetAndLength >> 8;
+          assertNotEquals(0, pool.buffer[upto + sliceLength - 1]);
+          assertEquals(0, pool.buffer[upto]);
+          int writeLength = Math.min(sliceLength - 1, size - offset);
+          System.arraycopy(randomData, offset, pool.buffer, upto, writeLength);
+          offset += writeLength;
+          upto += writeLength;
+        }
+      }
+    }
+  }
 }
--- a/lucene/core/src/test/org/apache/lucene/util/TestByteBlockPool.java
+++ b/lucene/core/src/test/org/apache/lucene/util/TestByteBlockPool.java
@ -44,6 +44,7 @@ public class TestByteBlockPool extends LuceneTestCase {
      }
      // verify
      long position = 0;
+      BytesRefBuilder builder = new BytesRefBuilder();
      for (BytesRef expected : list) {
        ref.grow(expected.length);
        ref.setLength(expected.length);
@ -54,8 +55,7 @@ public class TestByteBlockPool extends LuceneTestCase {
            break;
          case 1:
            BytesRef scratch = new BytesRef();
-            scratch.length = ref.length();
-            pool.setRawBytesRef(scratch, position);
+            pool.setBytesRef(builder, scratch, position, ref.length());
            System.arraycopy(scratch.bytes, scratch.offset, ref.bytes(), 0, ref.length());
            break;
          default:
@ -102,40 +102,6 @@ public class TestByteBlockPool extends LuceneTestCase {
    }
  }

-  public void testAllocKnowSizeSlice() throws IOException {
-    Counter bytesUsed = Counter.newCounter();
-    ByteBlockPool pool = new ByteBlockPool(new ByteBlockPool.DirectTrackingAllocator(bytesUsed));
-    pool.nextBuffer();
-    for (int i = 0; i < 100; i++) {
-      int size;
-      if (random().nextBoolean()) {
-        size = TestUtil.nextInt(random(), 100, 1000);
-      } else {
-        size = TestUtil.nextInt(random(), 50000, 100000);
-      }
-      byte[] randomData = new byte[size];
-      random().nextBytes(randomData);
-
-      int upto = pool.newSlice(ByteBlockPool.FIRST_LEVEL_SIZE);
-
-      for (int offset = 0; offset < size; ) {
-        if ((pool.buffer[upto] & 16) == 0) {
-          pool.buffer[upto++] = randomData[offset++];
-        } else {
-          int offsetAndLength = pool.allocKnownSizeSlice(pool.buffer, upto);
-          int sliceLength = offsetAndLength & 0xff;
-          upto = offsetAndLength >> 8;
-          assertNotEquals(0, pool.buffer[upto + sliceLength - 1]);
-          assertEquals(0, pool.buffer[upto]);
-          int writeLength = Math.min(sliceLength - 1, size - offset);
-          System.arraycopy(randomData, offset, pool.buffer, upto, writeLength);
-          offset += writeLength;
-          upto += writeLength;
-        }
-      }
-    }
-  }
-
  public void testTooManyAllocs() {
    // Use a mock allocator that doesn't waste memory
    ByteBlockPool pool =
--- a/lucene/core/src/test/org/apache/lucene/util/TestBytesRefHash.java
+++ b/lucene/core/src/test/org/apache/lucene/util/TestBytesRefHash.java
@ -50,8 +50,7 @@ public class TestBytesRefHash extends LuceneTestCase {
  private ByteBlockPool newPool() {
    return random().nextBoolean() && pool != null
        ? pool
-        : new ByteBlockPool(
-            new RecyclingByteBlockAllocator(ByteBlockPool.BYTE_BLOCK_SIZE, random().nextInt(25)));
+        : new ByteBlockPool(new RecyclingByteBlockAllocator(random().nextInt(25)));
  }

  private BytesRefHash newHash(ByteBlockPool blockPool) {
--- a/lucene/core/src/test/org/apache/lucene/util/TestRecyclingByteBlockAllocator.java
+++ b/lucene/core/src/test/org/apache/lucene/util/TestRecyclingByteBlockAllocator.java
@ -34,8 +34,7 @@ public class TestRecyclingByteBlockAllocator extends LuceneTestCase {
  }

  private RecyclingByteBlockAllocator newAllocator() {
-    return new RecyclingByteBlockAllocator(
-        1 << (2 + random().nextInt(15)), random().nextInt(97), Counter.newCounter());
+    return new RecyclingByteBlockAllocator(random().nextInt(97), Counter.newCounter());
  }

  @Test
--- a/lucene/memory/src/java/org/apache/lucene/index/memory/MemoryIndex.java
+++ b/lucene/memory/src/java/org/apache/lucene/index/memory/MemoryIndex.java
@ -446,9 +446,7 @@ public class MemoryIndex {
            + (maxBufferedIntBlocks * SlicedIntBlockPool.INT_BLOCK_SIZE * Integer.BYTES)
        <= maxReusedBytes;
    byteBlockPool =
-        new ByteBlockPool(
-            new RecyclingByteBlockAllocator(
-                ByteBlockPool.BYTE_BLOCK_SIZE, maxBufferedByteBlocks, bytesUsed));
+        new ByteBlockPool(new RecyclingByteBlockAllocator(maxBufferedByteBlocks, bytesUsed));
    slicedIntBlockPool =
        new SlicedIntBlockPool(
            new RecyclingIntBlockAllocator(