Merge pull request #2002 from navis/DRUID-2001

fixed #2001 GenericIndexed.fromIterable compares all values even when it's not sorted
This commit is contained in:
Xavier Léauté 2015-12-09 08:56:49 -08:00
commit 9015a68c03
2 changed files with 63 additions and 54 deletions

View File

@ -35,9 +35,9 @@ import java.util.Iterator;
/**
* A generic, flat storage mechanism. Use static methods fromArray() or fromIterable() to construct. If input
* is sorted, supports binary search index lookups. If input is not sorted, only supports array-like index lookups.
*
*
* V1 Storage Format:
*
*
* byte 1: version (0x1)
* byte 2 == 0x1 => allowReverseLookup
* bytes 3-6 => numBytesUsed
@ -66,48 +66,42 @@ public class GenericIndexed<T> implements Indexed<T>
}
boolean allowReverseLookup = true;
int count = 1;
T prevVal = objects.next();
while (objects.hasNext()) {
T next = objects.next();
if (!(strategy.compare(prevVal, next) < 0)) {
allowReverseLookup = false;
}
if (prevVal instanceof Closeable) {
CloseQuietly.close((Closeable) prevVal);
}
int count = 0;
prevVal = next;
++count;
}
if (prevVal instanceof Closeable) {
CloseQuietly.close((Closeable) prevVal);
}
ByteArrayOutputStream headerBytes = new ByteArrayOutputStream(4 + (count * 4));
ByteArrayOutputStream headerBytes = new ByteArrayOutputStream();
ByteArrayOutputStream valueBytes = new ByteArrayOutputStream();
int offset = 0;
try {
headerBytes.write(Ints.toByteArray(count));
int offset = 0;
T prevVal = null;
do {
count++;
T next = objects.next();
if (allowReverseLookup && prevVal != null && !(strategy.compare(prevVal, next) < 0)) {
allowReverseLookup = false;
}
for (T object : objectsIterable) {
final byte[] bytes = strategy.toBytes(object);
final byte[] bytes = strategy.toBytes(next);
offset += 4 + bytes.length;
headerBytes.write(Ints.toByteArray(offset));
valueBytes.write(Ints.toByteArray(bytes.length));
valueBytes.write(bytes);
if (object instanceof Closeable) {
CloseQuietly.close((Closeable) object);
if (prevVal instanceof Closeable) {
CloseQuietly.close((Closeable) prevVal);
}
prevVal = next;
} while (objects.hasNext());
if (prevVal instanceof Closeable) {
CloseQuietly.close((Closeable) prevVal);
}
}
catch (IOException e) {
throw new RuntimeException(e);
}
ByteBuffer theBuffer = ByteBuffer.allocate(headerBytes.size() + valueBytes.size());
ByteBuffer theBuffer = ByteBuffer.allocate(Ints.BYTES + headerBytes.size() + valueBytes.size());
theBuffer.put(Ints.toByteArray(count));
theBuffer.put(headerBytes.toByteArray());
theBuffer.put(valueBytes.toByteArray());
theBuffer.flip();

View File

@ -57,19 +57,7 @@ public class GenericIndexedTest
final String[] strings = {"a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l"};
Indexed<String> indexed = GenericIndexed.fromArray(strings, GenericIndexed.STRING_STRATEGY);
Assert.assertEquals(strings.length, indexed.size());
for (int i = 0; i < strings.length; i++) {
Assert.assertEquals(strings[i], indexed.get(i));
}
HashMap<String, Integer> mixedUp = Maps.newHashMap();
for (int i = 0; i < strings.length; i++) {
mixedUp.put(strings[i], i);
}
for (Map.Entry<String, Integer> entry : mixedUp.entrySet()) {
Assert.assertEquals(entry.getValue().intValue(), indexed.indexOf(entry.getKey()));
}
checkBasicAPIs(strings, indexed, true);
Assert.assertEquals(-13, indexed.indexOf("q"));
Assert.assertEquals(-9, indexed.indexOf("howdydo"));
@ -87,25 +75,52 @@ public class GenericIndexedTest
)
);
Assert.assertEquals(strings.length, deserialized.size());
for (int i = 0; i < strings.length; i++) {
Assert.assertEquals(strings[i], deserialized.get(i));
}
HashMap<String, Integer> mixedUp = Maps.newHashMap();
for (int i = 0; i < strings.length; i++) {
mixedUp.put(strings[i], i);
}
for (Map.Entry<String, Integer> entry : mixedUp.entrySet()) {
Assert.assertEquals(entry.getValue().intValue(), deserialized.indexOf(entry.getKey()));
}
checkBasicAPIs(strings, deserialized, true);
Assert.assertEquals(-13, deserialized.indexOf("q"));
Assert.assertEquals(-9, deserialized.indexOf("howdydo"));
Assert.assertEquals(-1, deserialized.indexOf("1111"));
}
@Test
public void testNotSortedSerialization() throws Exception
{
final String[] strings = {"a", "b", "c", "d", "e", "f", "g", "h", "i", "k", "j", "l"};
GenericIndexed<String> deserialized = serializeAndDeserialize(
GenericIndexed.fromArray(
strings, GenericIndexed.STRING_STRATEGY
)
);
checkBasicAPIs(strings, deserialized, false);
}
private void checkBasicAPIs(String[] strings, Indexed<String> index, boolean allowReverseLookup)
{
Assert.assertEquals(strings.length, index.size());
for (int i = 0; i < strings.length; i++) {
Assert.assertEquals(strings[i], index.get(i));
}
if (allowReverseLookup) {
HashMap<String, Integer> mixedUp = Maps.newHashMap();
for (int i = 0; i < strings.length; i++) {
mixedUp.put(strings[i], i);
}
for (Map.Entry<String, Integer> entry : mixedUp.entrySet()) {
Assert.assertEquals(entry.getValue().intValue(), index.indexOf(entry.getKey()));
}
} else {
try {
index.indexOf("xxx");
Assert.fail("should throw exception");
}
catch (UnsupportedOperationException e) {
// not supported
}
}
}
private GenericIndexed<String> serializeAndDeserialize(GenericIndexed<String> indexed) throws IOException
{
ByteArrayOutputStream baos = new ByteArrayOutputStream();