LUCENE-2764: Allow tests to use random codec per field

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1036543 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Simon Willnauer 2010-11-18 17:28:27 +00:00
parent e60764241b
commit a5d73e7dec
9 changed files with 80 additions and 31 deletions

View File

@ -65,6 +65,7 @@
</condition> </condition>
<property name="tests.multiplier" value="1" /> <property name="tests.multiplier" value="1" />
<property name="tests.codec" value="random" /> <property name="tests.codec" value="random" />
<property name="tests.randomCodecPerField" value="true"/>
<property name="tests.locale" value="random" /> <property name="tests.locale" value="random" />
<property name="tests.timezone" value="random" /> <property name="tests.timezone" value="random" />
<property name="tests.directory" value="random" /> <property name="tests.directory" value="random" />

View File

@ -133,7 +133,6 @@ public class CreateIndexTask extends PerfTask {
final String defaultCodec = config.get("default.codec", null); final String defaultCodec = config.get("default.codec", null);
if (defaultCodec != null) { if (defaultCodec != null) {
CodecProvider.setDefaultCodec(defaultCodec);
CodecProvider.getDefault().setDefaultFieldCodec(defaultCodec); CodecProvider.getDefault().setDefaultFieldCodec(defaultCodec);
} }

View File

@ -39,7 +39,7 @@ import org.apache.lucene.index.codecs.standard.StandardCodec;
public class CodecProvider { public class CodecProvider {
private SegmentInfosWriter infosWriter = new DefaultSegmentInfosWriter(); private SegmentInfosWriter infosWriter = new DefaultSegmentInfosWriter();
private SegmentInfosReader infosReader = new DefaultSegmentInfosReader(); private SegmentInfosReader infosReader = new DefaultSegmentInfosReader();
private String defaultFieldCodec = defaultCodec; private String defaultFieldCodec = "Standard";
private final Map<String, String> perFieldMap = new HashMap<String, String>(); private final Map<String, String> perFieldMap = new HashMap<String, String>();
@ -47,7 +47,6 @@ public class CodecProvider {
private final Set<String> knownExtensions = new HashSet<String>(); private final Set<String> knownExtensions = new HashSet<String>();
private static String defaultCodec = "Standard";
public final static String[] CORE_CODECS = new String[] {"Standard", "Pulsing", "PreFlex", "SimpleText"}; public final static String[] CORE_CODECS = new String[] {"Standard", "Pulsing", "PreFlex", "SimpleText"};
@ -103,15 +102,6 @@ public class CodecProvider {
return defaultCodecs; return defaultCodecs;
} }
/** Used for testing. @lucene.internal */
public synchronized static void setDefaultCodec(String s) {
defaultCodec = s;
}
/** Used for testing. @lucene.internal */
public synchronized static String getDefaultCodec() {
return defaultCodec;
}
/** /**
* Sets the {@link Codec} for a given field. Not that setting a fields code is * Sets the {@link Codec} for a given field. Not that setting a fields code is
* write-once. If the fields codec is already set this method will throw an * write-once. If the fields codec is already set this method will throw an
@ -175,6 +165,5 @@ class DefaultCodecProvider extends CodecProvider {
register(new PreFlexCodec()); register(new PreFlexCodec());
register(new PulsingCodec(1)); register(new PulsingCodec(1));
register(new SimpleTextCodec()); register(new SimpleTextCodec());
setDefaultFieldCodec(CodecProvider.getDefaultCodec());
} }
} }

View File

@ -24,7 +24,6 @@ import java.util.Random;
import org.apache.lucene.analysis.Analyzer; import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.MockAnalyzer; import org.apache.lucene.analysis.MockAnalyzer;
import org.apache.lucene.document.Document; import org.apache.lucene.document.Document;
import org.apache.lucene.index.codecs.CodecProvider;
import org.apache.lucene.store.Directory; import org.apache.lucene.store.Directory;
import org.apache.lucene.util.LuceneTestCase; import org.apache.lucene.util.LuceneTestCase;
import org.apache.lucene.util.Version; import org.apache.lucene.util.Version;
@ -84,7 +83,7 @@ public class RandomIndexWriter implements Closeable {
flushAt = _TestUtil.nextInt(r, 10, 1000); flushAt = _TestUtil.nextInt(r, 10, 1000);
if (LuceneTestCase.VERBOSE) { if (LuceneTestCase.VERBOSE) {
System.out.println("RIW config=" + w.getConfig()); System.out.println("RIW config=" + w.getConfig());
System.out.println("codec default=" + CodecProvider.getDefaultCodec()); System.out.println("codec default=" + w.getConfig().getCodecProvider().getDefaultFieldCodec());
} }
} }

View File

@ -123,7 +123,7 @@ public class Test2BTerms extends LuceneTestCase {
@Ignore("Takes ~4 hours to run on a fast machine!! And requires that you don't use PreFlex codec.") @Ignore("Takes ~4 hours to run on a fast machine!! And requires that you don't use PreFlex codec.")
public void test2BTerms() throws IOException { public void test2BTerms() throws IOException {
if ("PreFlex".equals(CodecProvider.getDefaultCodec())) { if ("PreFlex".equals(CodecProvider.getDefault().getDefaultFieldCodec())) {
throw new RuntimeException("thist test cannot run with PreFlex codec"); throw new RuntimeException("thist test cannot run with PreFlex codec");
} }

View File

@ -69,7 +69,7 @@ public class TestLazyProxSkipping extends LuceneTestCase {
int numDocs = 500; int numDocs = 500;
Directory directory = new SeekCountingDirectory(new RAMDirectory()); Directory directory = new SeekCountingDirectory(new RAMDirectory());
IndexWriter writer = new IndexWriter(directory, newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer(MockTokenizer.WHITESPACE, true, false)).setMaxBufferedDocs(10)); IndexWriter writer = new IndexWriter(directory, newIndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer(MockTokenizer.WHITESPACE, true, false)).setMaxBufferedDocs(10));
((LogMergePolicy) writer.getConfig().getMergePolicy()).setUseCompoundFile(false); ((LogMergePolicy) writer.getConfig().getMergePolicy()).setUseCompoundFile(false);
((LogMergePolicy) writer.getConfig().getMergePolicy()).setUseCompoundDocStore(false); ((LogMergePolicy) writer.getConfig().getMergePolicy()).setUseCompoundDocStore(false);
for (int i = 0; i < numDocs; i++) { for (int i = 0; i < numDocs; i++) {
@ -120,7 +120,7 @@ public class TestLazyProxSkipping extends LuceneTestCase {
} }
public void testLazySkipping() throws IOException { public void testLazySkipping() throws IOException {
assumeFalse("This test cannot run with SimpleText codec", CodecProvider.getDefaultCodec().equals("SimpleText")); assumeFalse("This test cannot run with SimpleText codec", getRandomFieldCodec(this.field).equals("SimpleText"));
// test whether only the minimum amount of seeks() // test whether only the minimum amount of seeks()
// are performed // are performed
performTest(5); performTest(5);

View File

@ -27,7 +27,6 @@ import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.Term; import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermsEnum; import org.apache.lucene.index.TermsEnum;
import org.apache.lucene.index.RandomIndexWriter; import org.apache.lucene.index.RandomIndexWriter;
import org.apache.lucene.index.codecs.CodecProvider;
import org.apache.lucene.store.Directory; import org.apache.lucene.store.Directory;
import org.apache.lucene.util.AttributeSource; import org.apache.lucene.util.AttributeSource;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
@ -57,7 +56,7 @@ public class TestPrefixRandom extends LuceneTestCase {
// we generate aweful prefixes: good for testing. // we generate aweful prefixes: good for testing.
// but for preflex codec, the test can be very slow, so use less iterations. // but for preflex codec, the test can be very slow, so use less iterations.
String codec = CodecProvider.getDefaultCodec(); final String codec = getRandomFieldCodec("field");
int num = codec.equals("PreFlex") ? 200 * RANDOM_MULTIPLIER : 2000 * RANDOM_MULTIPLIER; int num = codec.equals("PreFlex") ? 200 * RANDOM_MULTIPLIER : 2000 * RANDOM_MULTIPLIER;
for (int i = 0; i < num; i++) { for (int i = 0; i < num; i++) {
field.setValue(_TestUtil.randomUnicodeString(random, 10)); field.setValue(_TestUtil.randomUnicodeString(random, 10));

View File

@ -58,7 +58,6 @@ public class TestRegexpRandom2 extends LuceneTestCase {
RandomIndexWriter writer = new RandomIndexWriter(random, dir, RandomIndexWriter writer = new RandomIndexWriter(random, dir,
newIndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer(MockTokenizer.KEYWORD, false)) newIndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer(MockTokenizer.KEYWORD, false))
.setMaxBufferedDocs(_TestUtil.nextInt(random, 50, 1000))); .setMaxBufferedDocs(_TestUtil.nextInt(random, 50, 1000)));
Document doc = new Document(); Document doc = new Document();
Field field = newField("field", "", Field.Store.NO, Field.Index.NOT_ANALYZED); Field field = newField("field", "", Field.Store.NO, Field.Index.NOT_ANALYZED);
doc.add(field); doc.add(field);
@ -135,8 +134,7 @@ public class TestRegexpRandom2 extends LuceneTestCase {
public void testRegexps() throws Exception { public void testRegexps() throws Exception {
// we generate aweful regexps: good for testing. // we generate aweful regexps: good for testing.
// but for preflex codec, the test can be very slow, so use less iterations. // but for preflex codec, the test can be very slow, so use less iterations.
String codec = CodecProvider.getDefaultCodec(); int num = getRandomFieldCodec("field").equals("PreFlex") ? 100 * RANDOM_MULTIPLIER : 1000 * RANDOM_MULTIPLIER;
int num = codec.equals("PreFlex") ? 100 * RANDOM_MULTIPLIER : 1000 * RANDOM_MULTIPLIER;
for (int i = 0; i < num; i++) { for (int i = 0; i < num; i++) {
String reg = AutomatonTestUtil.randomRegexp(random); String reg = AutomatonTestUtil.randomRegexp(random);
assertSame(reg); assertSame(reg);

View File

@ -35,6 +35,8 @@ import org.apache.lucene.index.codecs.mocksep.MockSepCodec;
import org.apache.lucene.index.codecs.preflex.PreFlexCodec; import org.apache.lucene.index.codecs.preflex.PreFlexCodec;
import org.apache.lucene.index.codecs.preflexrw.PreFlexRWCodec; import org.apache.lucene.index.codecs.preflexrw.PreFlexRWCodec;
import org.apache.lucene.index.codecs.pulsing.PulsingCodec; import org.apache.lucene.index.codecs.pulsing.PulsingCodec;
import org.apache.lucene.index.codecs.simpletext.SimpleTextCodec;
import org.apache.lucene.index.codecs.standard.StandardCodec;
import org.apache.lucene.search.BooleanQuery; import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.FieldCache; import org.apache.lucene.search.FieldCache;
import org.apache.lucene.search.FieldCache.CacheEntry; import org.apache.lucene.search.FieldCache.CacheEntry;
@ -73,6 +75,7 @@ import java.lang.reflect.Modifier;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Arrays; import java.util.Arrays;
import java.util.Collections; import java.util.Collections;
import java.util.HashMap;
import java.util.IdentityHashMap; import java.util.IdentityHashMap;
import java.util.Iterator; import java.util.Iterator;
import java.util.List; import java.util.List;
@ -146,6 +149,8 @@ public abstract class LuceneTestCase extends Assert {
// tests) // tests)
/** Gets the codec to run tests with. */ /** Gets the codec to run tests with. */
static final String TEST_CODEC = System.getProperty("tests.codec", "random"); static final String TEST_CODEC = System.getProperty("tests.codec", "random");
/** Get if a random codec per field should be used */ // only use random per field if no explicit codec is set
static final boolean TEST_RANDOM_CODEC_PER_FIELD = "random".equals(TEST_CODEC) && Boolean.parseBoolean(System.getProperty("tests.randomCodecPerField", "true"));
/** Gets the locale to run tests with */ /** Gets the locale to run tests with */
static final String TEST_LOCALE = System.getProperty("tests.locale", "random"); static final String TEST_LOCALE = System.getProperty("tests.locale", "random");
/** Gets the timezone to run tests with */ /** Gets the timezone to run tests with */
@ -215,7 +220,7 @@ public abstract class LuceneTestCase extends Assert {
static Codec installTestCodecs() { static Codec installTestCodecs() {
final CodecProvider cp = CodecProvider.getDefault(); final CodecProvider cp = CodecProvider.getDefault();
savedDefaultCodec = CodecProvider.getDefaultCodec(); savedDefaultCodec = cp.getDefaultFieldCodec();
String codec = TEST_CODEC; String codec = TEST_CODEC;
final boolean codecHasParam; final boolean codecHasParam;
@ -235,7 +240,6 @@ public abstract class LuceneTestCase extends Assert {
} }
} }
CodecProvider.setDefaultCodec(codec);
cp.setDefaultFieldCodec(codec); cp.setDefaultFieldCodec(codec);
if (codec.equals("PreFlex")) { if (codec.equals("PreFlex")) {
@ -268,7 +272,6 @@ public abstract class LuceneTestCase extends Assert {
cp.unregister(cp.lookup("MockFixedIntBlock")); cp.unregister(cp.lookup("MockFixedIntBlock"));
cp.unregister(cp.lookup("MockVariableIntBlock")); cp.unregister(cp.lookup("MockVariableIntBlock"));
swapCodec(new PulsingCodec(1)); swapCodec(new PulsingCodec(1));
CodecProvider.setDefaultCodec(savedDefaultCodec);
cp.setDefaultFieldCodec(savedDefaultCodec); cp.setDefaultFieldCodec(savedDefaultCodec);
} }
@ -322,6 +325,7 @@ public abstract class LuceneTestCase extends Assert {
timeZone = TEST_TIMEZONE.equals("random") ? randomTimeZone(random) : TimeZone.getTimeZone(TEST_TIMEZONE); timeZone = TEST_TIMEZONE.equals("random") ? randomTimeZone(random) : TimeZone.getTimeZone(TEST_TIMEZONE);
TimeZone.setDefault(timeZone); TimeZone.setDefault(timeZone);
testsFailed = false; testsFailed = false;
randomCodecProvider = new RandomCodecProvider(random);
} }
@AfterClass @AfterClass
@ -342,11 +346,11 @@ public abstract class LuceneTestCase extends Assert {
} }
stores = null; stores = null;
// if tests failed, report some information back // if tests failed, report some information back
if (testsFailed) if (testsFailed) {
System.out.println("NOTE: test params are: codec=" + codec + System.out.println("NOTE: test params are: codec=" + codec +
", locale=" + locale + ", locale=" + locale +
", timezone=" + (timeZone == null ? "(null)" : timeZone.getID())); ", timezone=" + (timeZone == null ? "(null)" : timeZone.getID()) +
if (testsFailed) { (TEST_RANDOM_CODEC_PER_FIELD?", "+randomCodecProvider.toString():""));
System.err.println("NOTE: all tests run in this JVM:"); System.err.println("NOTE: all tests run in this JVM:");
System.err.println(Arrays.toString(testClassesRun.toArray())); System.err.println(Arrays.toString(testClassesRun.toArray()));
} }
@ -617,8 +621,9 @@ public abstract class LuceneTestCase extends Assert {
return newIndexWriterConfig(random, v, a); return newIndexWriterConfig(random, v, a);
} }
/** create a new index writer config with random defaults */
public static IndexWriterConfig newIndexWriterConfig(Random r, Version v, Analyzer a) { public static IndexWriterConfig newIndexWriterConfig(Random r, Version v, Analyzer a) {
IndexWriterConfig c = new IndexWriterConfig(v, a); final IndexWriterConfig c = new IndexWriterConfig(v, a);
if (r.nextBoolean()) { if (r.nextBoolean()) {
c.setMergePolicy(new LogDocMergePolicy()); c.setMergePolicy(new LogDocMergePolicy());
} }
@ -642,7 +647,9 @@ public abstract class LuceneTestCase extends Assert {
logmp.setCalibrateSizeByDeletes(r.nextBoolean()); logmp.setCalibrateSizeByDeletes(r.nextBoolean());
logmp.setMergeFactor(_TestUtil.nextInt(r, 2, 20)); logmp.setMergeFactor(_TestUtil.nextInt(r, 2, 20));
} }
if (TEST_RANDOM_CODEC_PER_FIELD) {
c.setCodecProvider(randomCodecProvider);
}
c.setReaderPooling(r.nextBoolean()); c.setReaderPooling(r.nextBoolean());
c.setReaderTermsIndexDivisor(_TestUtil.nextInt(r, 1, 4)); c.setReaderTermsIndexDivisor(_TestUtil.nextInt(r, 1, 4));
return c; return c;
@ -844,6 +851,8 @@ public abstract class LuceneTestCase extends Assert {
// seed for individual test methods, changed in @before // seed for individual test methods, changed in @before
private long seed; private long seed;
protected static CodecProvider randomCodecProvider;
private static final Random seedRand = new Random(); private static final Random seedRand = new Random();
protected static final Random random = new Random(); protected static final Random random = new Random();
@ -944,6 +953,61 @@ public abstract class LuceneTestCase extends Assert {
} }
} }
/** Returns the codec for the given field uses in this testcase */
public static String getRandomFieldCodec(String field) {
final CodecProvider provider = TEST_RANDOM_CODEC_PER_FIELD ? randomCodecProvider : CodecProvider.getDefault();
return provider.getFieldCodec(field);
}
static class RandomCodecProvider extends CodecProvider {
private final Codec[] codecs;
private final Map<String, String> perFieldMap = new HashMap<String, String>();
private final Random random;
RandomCodecProvider(Random random) {
if (random.nextInt(5) == 0) {
/*
* We randomly swap in a exclusive PreFlexCodec to provide random test coverage
* for preFlex indexes. In realistic a PreFlex-Environment newer codecs don't occur.
*/
this.codecs = new Codec[] { new PreFlexRWCodec() };
} else {
this.codecs = new Codec[] { new StandardCodec(), new SimpleTextCodec(),
new MockSepCodec(), new PulsingCodec(1 + random.nextInt(10)),
new MockVariableIntBlockCodec(1 + random.nextInt(10)),
new MockFixedIntBlockCodec(1 + random.nextInt(10)), };
register(new PreFlexCodec()); // register this for read support
}
for (int i = 0; i < codecs.length; i++) {
register(codecs[i]);
}
this.random = random;
}
@Override
public synchronized String getFieldCodec(String name) {
if (!perFieldMap.containsKey(name)) { // select a codec at random
setFieldCodec(name, codecs[random.nextInt(codecs.length)].name);
}
return super.getFieldCodec(name);
}
@Override
public synchronized void setFieldCodec(String field, String codec) {
if (!perFieldMap.containsKey(field)) {
perFieldMap.put(field, codec);
}
super.setFieldCodec(field, codec);
}
@Override
public String toString() {
return "RandomCodecProvider [perFieldMap=" + perFieldMap + "]";
}
}
@Ignore("just a hack") @Ignore("just a hack")
public final void alwaysIgnoredTestMethod() {} public final void alwaysIgnoredTestMethod() {}
} }