From 07619aa516deb9094a18e0c64ce66ff9c8b05e92 Mon Sep 17 00:00:00 2001 From: Colin Patrick Mccabe Date: Thu, 18 Dec 2014 11:05:06 -0800 Subject: [PATCH] HADOOP-11427. ChunkedArrayList: fix removal via iterator and implement get (cmccabe) --- .../hadoop-common/CHANGES.txt | 3 + .../apache/hadoop/util/ChunkedArrayList.java | 42 +++++++++- .../hadoop/util/TestChunkedArrayList.java | 78 +++++++++++++++++++ 3 files changed, 119 insertions(+), 4 deletions(-) diff --git a/hadoop-common-project/hadoop-common/CHANGES.txt b/hadoop-common-project/hadoop-common/CHANGES.txt index 2378b5bd14a..167bf384c8e 100644 --- a/hadoop-common-project/hadoop-common/CHANGES.txt +++ b/hadoop-common-project/hadoop-common/CHANGES.txt @@ -429,6 +429,9 @@ Release 2.7.0 - UNRELEASED HADOOP-11421. Add IOUtils#listDirectory (cmccabe) + HADOOP-11427. ChunkedArrayList: fix removal via iterator and implement get + (cmccabe) + OPTIMIZATIONS HADOOP-11323. WritableComparator#compare keeps reference to byte array. diff --git a/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/util/ChunkedArrayList.java b/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/util/ChunkedArrayList.java index 42cd324a86c..84ddc32f88c 100644 --- a/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/util/ChunkedArrayList.java +++ b/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/util/ChunkedArrayList.java @@ -110,11 +110,33 @@ public class ChunkedArrayList extends AbstractList { @Override public Iterator iterator() { - return Iterables.concat(chunks).iterator(); + final Iterator it = Iterables.concat(chunks).iterator(); + + return new Iterator() { + @Override + public boolean hasNext() { + return it.hasNext(); + } + + @Override + public T next() { + return it.next(); + } + + @Override + public void remove() { + it.remove(); + size--; + } + }; } @Override public boolean add(T e) { + if (size == Integer.MAX_VALUE) { + throw new RuntimeException("Can't add an additional element to the " + + "list; list already has INT_MAX elements."); + } if (lastChunk == null) { addChunk(initialChunkCapacity); } else if (lastChunk.size() >= lastChunkCapacity) { @@ -164,8 +186,20 @@ public class ChunkedArrayList extends AbstractList { } @Override - public T get(int arg0) { - throw new UnsupportedOperationException( - this.getClass().getName() + " does not support random access"); + public T get(int idx) { + if (idx < 0) { + throw new IndexOutOfBoundsException(); + } + int base = 0; + Iterator> it = chunks.iterator(); + while (it.hasNext()) { + List list = it.next(); + int size = list.size(); + if (idx < base + size) { + return list.get(idx - base); + } + base += size; + } + throw new IndexOutOfBoundsException(); } } diff --git a/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/TestChunkedArrayList.java b/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/TestChunkedArrayList.java index ad170944c7b..f8a2d49c580 100644 --- a/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/TestChunkedArrayList.java +++ b/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/TestChunkedArrayList.java @@ -20,7 +20,9 @@ package org.apache.hadoop.util; import static org.junit.Assert.*; import java.util.ArrayList; +import java.util.Iterator; +import org.junit.Assert; import org.junit.Test; import com.google.common.base.Stopwatch; @@ -90,4 +92,80 @@ public class TestChunkedArrayList { } } } + + @Test + public void testRemovals() throws Exception { + final int NUM_ELEMS = 100000; + ChunkedArrayList list = new ChunkedArrayList(); + for (int i = 0; i < NUM_ELEMS; i++) { + list.add(i); + } + + // Iterate through all list elements. + Iterator iter = list.iterator(); + for (int i = 0; i < NUM_ELEMS; i++) { + Assert.assertTrue(iter.hasNext()); + Integer val = iter.next(); + Assert.assertEquals(Integer.valueOf(i), val); + } + Assert.assertFalse(iter.hasNext()); + Assert.assertEquals(NUM_ELEMS, list.size()); + + // Remove even elements. + iter = list.iterator(); + for (int i = 0; i < NUM_ELEMS; i++) { + Assert.assertTrue(iter.hasNext()); + Integer val = iter.next(); + Assert.assertEquals(Integer.valueOf(i), val); + if (i % 2 == 0) { + iter.remove(); + } + } + Assert.assertFalse(iter.hasNext()); + Assert.assertEquals(NUM_ELEMS / 2, list.size()); + + // Iterate through all odd list elements. + iter = list.iterator(); + for (int i = 0; i < NUM_ELEMS / 2; i++) { + Assert.assertTrue(iter.hasNext()); + Integer val = iter.next(); + Assert.assertEquals(Integer.valueOf(1 + (2 * i)), val); + iter.remove(); + } + Assert.assertFalse(iter.hasNext()); + + // Check that list is now empty. + Assert.assertEquals(0, list.size()); + Assert.assertTrue(list.isEmpty()); + iter = list.iterator(); + Assert.assertFalse(iter.hasNext()); + } + + @Test + public void testGet() throws Exception { + final int NUM_ELEMS = 100001; + ChunkedArrayList list = new ChunkedArrayList(); + for (int i = 0; i < NUM_ELEMS; i++) { + list.add(i); + } + + Assert.assertEquals(Integer.valueOf(100), list.get(100)); + Assert.assertEquals(Integer.valueOf(1000), list.get(1000)); + Assert.assertEquals(Integer.valueOf(10000), list.get(10000)); + Assert.assertEquals(Integer.valueOf(100000), list.get(100000)); + + Iterator iter = list.iterator(); + iter.next(); + iter.remove(); + Assert.assertEquals(Integer.valueOf(1), list.get(0)); + + iter = list.iterator(); + for (int i = 0; i < 500; i++) { + iter.next(); + } + iter.remove(); + + Assert.assertEquals(Integer.valueOf(502), list.get(500)); + Assert.assertEquals(Integer.valueOf(602), list.get(600)); + } }