mirror of https://github.com/apache/lucene.git
LUCENE-5889: add commit method to AnalyzingInfixSuggester
git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1619635 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
f84135de7c
commit
4a485d6877
|
@ -103,6 +103,9 @@ New Features
|
||||||
* LUCENE-5895: Lucene now stores a unique id per-segment and per-commit to aid
|
* LUCENE-5895: Lucene now stores a unique id per-segment and per-commit to aid
|
||||||
in accurate replication of index files (Robert Muir, Mike McCandless)
|
in accurate replication of index files (Robert Muir, Mike McCandless)
|
||||||
|
|
||||||
|
* LUCENE-5889: Add commit method to AnalyzingInfixSuggester, and allow just using .add
|
||||||
|
to build up the suggester. (Varun Thacker via Mike McCandless)
|
||||||
|
|
||||||
======================= Lucene 4.10.0 ======================
|
======================= Lucene 4.10.0 ======================
|
||||||
|
|
||||||
New Features
|
New Features
|
||||||
|
|
|
@ -126,6 +126,7 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
final Version matchVersion;
|
final Version matchVersion;
|
||||||
private final Directory dir;
|
private final Directory dir;
|
||||||
final int minPrefixChars;
|
final int minPrefixChars;
|
||||||
|
private final boolean commitOnBuild;
|
||||||
|
|
||||||
/** Used for ongoing NRT additions/updates. */
|
/** Used for ongoing NRT additions/updates. */
|
||||||
private IndexWriter writer;
|
private IndexWriter writer;
|
||||||
|
@ -146,7 +147,7 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
* Lucene index). Note that {@link #close}
|
* Lucene index). Note that {@link #close}
|
||||||
* will also close the provided directory. */
|
* will also close the provided directory. */
|
||||||
public AnalyzingInfixSuggester(Version matchVersion, Directory dir, Analyzer analyzer) throws IOException {
|
public AnalyzingInfixSuggester(Version matchVersion, Directory dir, Analyzer analyzer) throws IOException {
|
||||||
this(matchVersion, dir, analyzer, analyzer, DEFAULT_MIN_PREFIX_CHARS);
|
this(matchVersion, dir, analyzer, analyzer, DEFAULT_MIN_PREFIX_CHARS, false);
|
||||||
}
|
}
|
||||||
|
|
||||||
/** Create a new instance, loading from a previously built
|
/** Create a new instance, loading from a previously built
|
||||||
|
@ -160,8 +161,12 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
* Prefixes shorter than this are indexed as character
|
* Prefixes shorter than this are indexed as character
|
||||||
* ngrams (increasing index size but making lookups
|
* ngrams (increasing index size but making lookups
|
||||||
* faster).
|
* faster).
|
||||||
|
*
|
||||||
|
* @param commitOnBuild Call commit after the index has finished building. This would persist the
|
||||||
|
* suggester index to disk and future instances of this suggester can use this pre-built dictionary.
|
||||||
*/
|
*/
|
||||||
public AnalyzingInfixSuggester(Version matchVersion, Directory dir, Analyzer indexAnalyzer, Analyzer queryAnalyzer, int minPrefixChars) throws IOException {
|
public AnalyzingInfixSuggester(Version matchVersion, Directory dir, Analyzer indexAnalyzer, Analyzer queryAnalyzer, int minPrefixChars,
|
||||||
|
boolean commitOnBuild) throws IOException {
|
||||||
|
|
||||||
if (minPrefixChars < 0) {
|
if (minPrefixChars < 0) {
|
||||||
throw new IllegalArgumentException("minPrefixChars must be >= 0; got: " + minPrefixChars);
|
throw new IllegalArgumentException("minPrefixChars must be >= 0; got: " + minPrefixChars);
|
||||||
|
@ -172,6 +177,7 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
this.matchVersion = matchVersion;
|
this.matchVersion = matchVersion;
|
||||||
this.dir = dir;
|
this.dir = dir;
|
||||||
this.minPrefixChars = minPrefixChars;
|
this.minPrefixChars = minPrefixChars;
|
||||||
|
this.commitOnBuild = commitOnBuild;
|
||||||
|
|
||||||
if (DirectoryReader.indexExists(dir)) {
|
if (DirectoryReader.indexExists(dir)) {
|
||||||
// Already built; open it:
|
// Already built; open it:
|
||||||
|
@ -237,7 +243,9 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
}
|
}
|
||||||
|
|
||||||
//System.out.println("initial indexing time: " + ((System.nanoTime()-t0)/1000000) + " msec");
|
//System.out.println("initial indexing time: " + ((System.nanoTime()-t0)/1000000) + " msec");
|
||||||
|
if (commitOnBuild) {
|
||||||
|
commit();
|
||||||
|
}
|
||||||
searcherMgr = new SearcherManager(writer, true, null);
|
searcherMgr = new SearcherManager(writer, true, null);
|
||||||
success = true;
|
success = true;
|
||||||
} finally {
|
} finally {
|
||||||
|
@ -248,6 +256,13 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public void commit() throws IOException {
|
||||||
|
if (writer == null) {
|
||||||
|
throw new IllegalStateException("Cannot commit on an closed writer. Add documents first");
|
||||||
|
}
|
||||||
|
writer.commit();
|
||||||
|
}
|
||||||
|
|
||||||
private Analyzer getGramAnalyzer() {
|
private Analyzer getGramAnalyzer() {
|
||||||
return new AnalyzerWrapper(Analyzer.PER_FIELD_REUSE_STRATEGY) {
|
return new AnalyzerWrapper(Analyzer.PER_FIELD_REUSE_STRATEGY) {
|
||||||
@Override
|
@Override
|
||||||
|
@ -273,12 +288,25 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
private synchronized void ensureOpen() throws IOException {
|
||||||
|
if (writer == null) {
|
||||||
|
if (searcherMgr != null) {
|
||||||
|
searcherMgr.close();
|
||||||
|
searcherMgr = null;
|
||||||
|
}
|
||||||
|
writer = new IndexWriter(dir,
|
||||||
|
getIndexWriterConfig(getGramAnalyzer(), IndexWriterConfig.OpenMode.CREATE));
|
||||||
|
searcherMgr = new SearcherManager(writer, true, null);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
/** Adds a new suggestion. Be sure to use {@link #update}
|
/** Adds a new suggestion. Be sure to use {@link #update}
|
||||||
* instead if you want to replace a previous suggestion.
|
* instead if you want to replace a previous suggestion.
|
||||||
* After adding or updating a batch of new suggestions,
|
* After adding or updating a batch of new suggestions,
|
||||||
* you must call {@link #refresh} in the end in order to
|
* you must call {@link #refresh} in the end in order to
|
||||||
* see the suggestions in {@link #lookup} */
|
* see the suggestions in {@link #lookup} */
|
||||||
public void add(BytesRef text, Set<BytesRef> contexts, long weight, BytesRef payload) throws IOException {
|
public void add(BytesRef text, Set<BytesRef> contexts, long weight, BytesRef payload) throws IOException {
|
||||||
|
ensureOpen();
|
||||||
writer.addDocument(buildDocument(text, contexts, weight, payload));
|
writer.addDocument(buildDocument(text, contexts, weight, payload));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -290,6 +318,7 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
* new suggestions, you must call {@link #refresh} in the
|
* new suggestions, you must call {@link #refresh} in the
|
||||||
* end in order to see the suggestions in {@link #lookup} */
|
* end in order to see the suggestions in {@link #lookup} */
|
||||||
public void update(BytesRef text, Set<BytesRef> contexts, long weight, BytesRef payload) throws IOException {
|
public void update(BytesRef text, Set<BytesRef> contexts, long weight, BytesRef payload) throws IOException {
|
||||||
|
ensureOpen();
|
||||||
writer.updateDocument(new Term(EXACT_TEXT_FIELD_NAME, text.utf8ToString()),
|
writer.updateDocument(new Term(EXACT_TEXT_FIELD_NAME, text.utf8ToString()),
|
||||||
buildDocument(text, contexts, weight, payload));
|
buildDocument(text, contexts, weight, payload));
|
||||||
}
|
}
|
||||||
|
@ -321,6 +350,9 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
* up" many additions/updates, and then call refresh
|
* up" many additions/updates, and then call refresh
|
||||||
* once in the end. */
|
* once in the end. */
|
||||||
public void refresh() throws IOException {
|
public void refresh() throws IOException {
|
||||||
|
if (searcherMgr == null) {
|
||||||
|
throw new IllegalStateException("suggester was not built");
|
||||||
|
}
|
||||||
searcherMgr.maybeRefreshBlocking();
|
searcherMgr.maybeRefreshBlocking();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -673,6 +705,9 @@ public class AnalyzingInfixSuggester extends Lookup implements Closeable {
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public long getCount() throws IOException {
|
public long getCount() throws IOException {
|
||||||
|
if (searcherMgr == null) {
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
IndexSearcher searcher = searcherMgr.acquire();
|
IndexSearcher searcher = searcherMgr.acquire();
|
||||||
try {
|
try {
|
||||||
return searcher.getIndexReader().numDocs();
|
return searcher.getIndexReader().numDocs();
|
||||||
|
|
|
@ -106,11 +106,13 @@ public class BlendedInfixSuggester extends AnalyzingInfixSuggester {
|
||||||
*
|
*
|
||||||
* @param blenderType Type of blending strategy, see BlenderType for more precisions
|
* @param blenderType Type of blending strategy, see BlenderType for more precisions
|
||||||
* @param numFactor Factor to multiply the number of searched elements before ponderate
|
* @param numFactor Factor to multiply the number of searched elements before ponderate
|
||||||
|
* @param commitOnBuild Call commit after the index has finished building. This would persist the
|
||||||
|
* suggester index to disk and future instances of this suggester can use this pre-built dictionary.
|
||||||
* @throws IOException If there are problems opening the underlying Lucene index.
|
* @throws IOException If there are problems opening the underlying Lucene index.
|
||||||
*/
|
*/
|
||||||
public BlendedInfixSuggester(Version matchVersion, Directory dir, Analyzer indexAnalyzer, Analyzer queryAnalyzer,
|
public BlendedInfixSuggester(Version matchVersion, Directory dir, Analyzer indexAnalyzer, Analyzer queryAnalyzer,
|
||||||
int minPrefixChars, BlenderType blenderType, int numFactor) throws IOException {
|
int minPrefixChars, BlenderType blenderType, int numFactor, boolean commitOnBuild) throws IOException {
|
||||||
super(matchVersion, dir, indexAnalyzer, queryAnalyzer, minPrefixChars);
|
super(matchVersion, dir, indexAnalyzer, queryAnalyzer, minPrefixChars, commitOnBuild);
|
||||||
this.blenderType = blenderType;
|
this.blenderType = blenderType;
|
||||||
this.numFactor = numFactor;
|
this.numFactor = numFactor;
|
||||||
}
|
}
|
||||||
|
|
|
@ -51,7 +51,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
};
|
};
|
||||||
|
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
|
|
||||||
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("ear", random()), 10, true, true);
|
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("ear", random()), 10, true, true);
|
||||||
|
@ -94,12 +94,12 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
File tempDir = createTempDir("AnalyzingInfixSuggesterTest");
|
File tempDir = createTempDir("AnalyzingInfixSuggesterTest");
|
||||||
|
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
assertEquals(2, suggester.getCount());
|
assertEquals(2, suggester.getCount());
|
||||||
suggester.close();
|
suggester.close();
|
||||||
|
|
||||||
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3);
|
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3, false);
|
||||||
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("ear", random()), 10, true, true);
|
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("ear", random()), 10, true, true);
|
||||||
assertEquals(2, results.size());
|
assertEquals(2, results.size());
|
||||||
assertEquals("a penny saved is a penny <b>ear</b>ned", results.get(0).key);
|
assertEquals("a penny saved is a penny <b>ear</b>ned", results.get(0).key);
|
||||||
|
@ -138,7 +138,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
};
|
};
|
||||||
|
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3) {
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false) {
|
||||||
@Override
|
@Override
|
||||||
protected Object highlight(String text, Set<String> matchedTokens, String prefixToken) throws IOException {
|
protected Object highlight(String text, Set<String> matchedTokens, String prefixToken) throws IOException {
|
||||||
try (TokenStream ts = queryAnalyzer.tokenStream("text", new StringReader(text))) {
|
try (TokenStream ts = queryAnalyzer.tokenStream("text", new StringReader(text))) {
|
||||||
|
@ -214,7 +214,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
int minPrefixLength = random().nextInt(10);
|
int minPrefixLength = random().nextInt(10);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, minPrefixLength);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, minPrefixLength, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
|
|
||||||
for(int i=0;i<2;i++) {
|
for(int i=0;i<2;i++) {
|
||||||
|
@ -271,7 +271,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
// Make sure things still work after close and reopen:
|
// Make sure things still work after close and reopen:
|
||||||
suggester.close();
|
suggester.close();
|
||||||
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, minPrefixLength);
|
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, minPrefixLength, false);
|
||||||
}
|
}
|
||||||
suggester.close();
|
suggester.close();
|
||||||
}
|
}
|
||||||
|
@ -282,7 +282,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
};
|
};
|
||||||
|
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("penn", random()), 10, true, true);
|
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("penn", random()), 10, true, true);
|
||||||
assertEquals(1, results.size());
|
assertEquals(1, results.size());
|
||||||
|
@ -296,7 +296,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
};
|
};
|
||||||
|
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, true);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, true);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("penn", random()), 10, true, true);
|
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("penn", random()), 10, true, true);
|
||||||
assertEquals(1, results.size());
|
assertEquals(1, results.size());
|
||||||
|
@ -305,7 +305,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
// Try again, but overriding addPrefixMatch to highlight
|
// Try again, but overriding addPrefixMatch to highlight
|
||||||
// the entire hit:
|
// the entire hit:
|
||||||
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3) {
|
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false) {
|
||||||
@Override
|
@Override
|
||||||
protected void addPrefixMatch(StringBuilder sb, String surface, String analyzed, String prefixToken) {
|
protected void addPrefixMatch(StringBuilder sb, String surface, String analyzed, String prefixToken) {
|
||||||
sb.append("<b>");
|
sb.append("<b>");
|
||||||
|
@ -326,7 +326,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
};
|
};
|
||||||
|
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
suggester.close();
|
suggester.close();
|
||||||
suggester.close();
|
suggester.close();
|
||||||
|
@ -352,7 +352,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), indexAnalyzer, queryAnalyzer, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), indexAnalyzer, queryAnalyzer, 3, false);
|
||||||
|
|
||||||
Input keys[] = new Input[] {
|
Input keys[] = new Input[] {
|
||||||
new Input("a bob for apples", 10, new BytesRef("foobaz")),
|
new Input("a bob for apples", 10, new BytesRef("foobaz")),
|
||||||
|
@ -367,7 +367,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
public void testEmptyAtStart() throws Exception {
|
public void testEmptyAtStart() throws Exception {
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(new Input[0]));
|
suggester.build(new InputArrayIterator(new Input[0]));
|
||||||
suggester.add(new BytesRef("a penny saved is a penny earned"), null, 10, new BytesRef("foobaz"));
|
suggester.add(new BytesRef("a penny saved is a penny earned"), null, 10, new BytesRef("foobaz"));
|
||||||
suggester.add(new BytesRef("lend me your ear"), null, 8, new BytesRef("foobar"));
|
suggester.add(new BytesRef("lend me your ear"), null, 8, new BytesRef("foobar"));
|
||||||
|
@ -405,7 +405,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
public void testBothExactAndPrefix() throws Exception {
|
public void testBothExactAndPrefix() throws Exception {
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(new Input[0]));
|
suggester.build(new InputArrayIterator(new Input[0]));
|
||||||
suggester.add(new BytesRef("the pen is pretty"), null, 10, new BytesRef("foobaz"));
|
suggester.add(new BytesRef("the pen is pretty"), null, 10, new BytesRef("foobaz"));
|
||||||
suggester.refresh();
|
suggester.refresh();
|
||||||
|
@ -478,7 +478,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
System.out.println(" minPrefixChars=" + minPrefixChars);
|
System.out.println(" minPrefixChars=" + minPrefixChars);
|
||||||
}
|
}
|
||||||
|
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, minPrefixChars);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, minPrefixChars, false);
|
||||||
|
|
||||||
// Initial suggester built with nothing:
|
// Initial suggester built with nothing:
|
||||||
suggester.build(new InputArrayIterator(new Input[0]));
|
suggester.build(new InputArrayIterator(new Input[0]));
|
||||||
|
@ -558,7 +558,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
}
|
}
|
||||||
lookupThread.finish();
|
lookupThread.finish();
|
||||||
suggester.close();
|
suggester.close();
|
||||||
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, minPrefixChars);
|
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, minPrefixChars, false);
|
||||||
lookupThread = new LookupThread(suggester);
|
lookupThread = new LookupThread(suggester);
|
||||||
lookupThread.start();
|
lookupThread.start();
|
||||||
|
|
||||||
|
@ -730,7 +730,7 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
};
|
};
|
||||||
|
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3);
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newDirectory(), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
|
|
||||||
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("ear", random()), 10, true, true);
|
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("ear", random()), 10, true, true);
|
||||||
|
@ -790,6 +790,65 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
suggester.close();
|
suggester.close();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
public void testNRTWithParallelAdds() throws IOException, InterruptedException {
|
||||||
|
String[] keys = new String[] {"python", "java", "c", "scala", "ruby", "clojure", "erlang", "go", "swift", "lisp"};
|
||||||
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
|
File tempDir = createTempDir("AIS_NRT_PERSIST_TEST");
|
||||||
|
AnalyzingInfixSuggester suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3, false);
|
||||||
|
Thread[] multiAddThreads = new Thread[10];
|
||||||
|
try {
|
||||||
|
suggester.refresh();
|
||||||
|
fail("Cannot call refresh on an suggester when no docs are added to the index");
|
||||||
|
} catch(IllegalStateException e) {
|
||||||
|
//Expected
|
||||||
|
}
|
||||||
|
for(int i=0; i<10; i++) {
|
||||||
|
multiAddThreads[i] = new Thread(new IndexDocument(suggester, keys[i]));
|
||||||
|
}
|
||||||
|
for(int i=0; i<10; i++) {
|
||||||
|
multiAddThreads[i].start();
|
||||||
|
}
|
||||||
|
//Make sure all threads have completed indexing
|
||||||
|
for(int i=0; i<10; i++) {
|
||||||
|
multiAddThreads[i].join();
|
||||||
|
}
|
||||||
|
|
||||||
|
suggester.refresh();
|
||||||
|
List<LookupResult> results = suggester.lookup(TestUtil.stringToCharSequence("python", random()), 10, true, false);
|
||||||
|
assertEquals(1, results.size());
|
||||||
|
assertEquals("python", results.get(0).key);
|
||||||
|
|
||||||
|
//Test if the index is getting persisted correctly and can be reopened.
|
||||||
|
suggester.commit();
|
||||||
|
suggester.close();
|
||||||
|
|
||||||
|
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3, false);
|
||||||
|
results = suggester.lookup(TestUtil.stringToCharSequence("python", random()), 10, true, false);
|
||||||
|
assertEquals(1, results.size());
|
||||||
|
assertEquals("python", results.get(0).key);
|
||||||
|
|
||||||
|
suggester.close();
|
||||||
|
}
|
||||||
|
|
||||||
|
private class IndexDocument implements Runnable {
|
||||||
|
AnalyzingInfixSuggester suggester;
|
||||||
|
String key;
|
||||||
|
|
||||||
|
private IndexDocument(AnalyzingInfixSuggester suggester, String key) {
|
||||||
|
this.suggester = suggester;
|
||||||
|
this.key = key;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void run() {
|
||||||
|
try {
|
||||||
|
suggester.add(new BytesRef(key), null, 10, null);
|
||||||
|
} catch (IOException e) {
|
||||||
|
fail("Could not build suggest dictionary correctly");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
private Set<BytesRef> asSet(String... values) {
|
private Set<BytesRef> asSet(String... values) {
|
||||||
HashSet<BytesRef> result = new HashSet<>();
|
HashSet<BytesRef> result = new HashSet<>();
|
||||||
for(String value : values) {
|
for(String value : values) {
|
||||||
|
@ -812,11 +871,11 @@ public class AnalyzingInfixSuggesterTest extends LuceneTestCase {
|
||||||
AnalyzingInfixSuggester suggester;
|
AnalyzingInfixSuggester suggester;
|
||||||
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
Analyzer a = new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false);
|
||||||
if (iter == 0) {
|
if (iter == 0) {
|
||||||
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3);
|
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
} else {
|
} else {
|
||||||
// Test again, after close/reopen:
|
// Test again, after close/reopen:
|
||||||
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3);
|
suggester = new AnalyzingInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a, 3, false);
|
||||||
}
|
}
|
||||||
|
|
||||||
// No context provided, all results returned
|
// No context provided, all results returned
|
||||||
|
|
|
@ -50,7 +50,7 @@ public class BlendedInfixSuggesterTest extends LuceneTestCase {
|
||||||
BlendedInfixSuggester suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
BlendedInfixSuggester suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
||||||
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS,
|
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS,
|
||||||
BlendedInfixSuggester.BlenderType.POSITION_LINEAR,
|
BlendedInfixSuggester.BlenderType.POSITION_LINEAR,
|
||||||
BlendedInfixSuggester.DEFAULT_NUM_FACTOR);
|
BlendedInfixSuggester.DEFAULT_NUM_FACTOR, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
|
|
||||||
// we query for star wars and check that the weight
|
// we query for star wars and check that the weight
|
||||||
|
@ -98,7 +98,8 @@ public class BlendedInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
// BlenderType.RECIPROCAL is using 1/(1+p) * w where w is weight and p the position of the word
|
// BlenderType.RECIPROCAL is using 1/(1+p) * w where w is weight and p the position of the word
|
||||||
suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
||||||
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS, BlendedInfixSuggester.BlenderType.POSITION_RECIPROCAL, 1);
|
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS,
|
||||||
|
BlendedInfixSuggester.BlenderType.POSITION_RECIPROCAL, 1, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
|
|
||||||
assertEquals(w, getInResults(suggester, "top", pl, 1));
|
assertEquals(w, getInResults(suggester, "top", pl, 1));
|
||||||
|
@ -129,7 +130,8 @@ public class BlendedInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
// if factor is small, we don't get the expected element
|
// if factor is small, we don't get the expected element
|
||||||
BlendedInfixSuggester suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
BlendedInfixSuggester suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
||||||
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS, BlendedInfixSuggester.BlenderType.POSITION_RECIPROCAL, 1);
|
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS,
|
||||||
|
BlendedInfixSuggester.BlenderType.POSITION_RECIPROCAL, 1, false);
|
||||||
|
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
|
|
||||||
|
@ -148,7 +150,8 @@ public class BlendedInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
// if we increase the factor we have it
|
// if we increase the factor we have it
|
||||||
suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
||||||
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS, BlendedInfixSuggester.BlenderType.POSITION_RECIPROCAL, 2);
|
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS,
|
||||||
|
BlendedInfixSuggester.BlenderType.POSITION_RECIPROCAL, 2, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
|
|
||||||
// we have it
|
// we have it
|
||||||
|
@ -179,8 +182,9 @@ public class BlendedInfixSuggesterTest extends LuceneTestCase {
|
||||||
|
|
||||||
// if factor is small, we don't get the expected element
|
// if factor is small, we don't get the expected element
|
||||||
BlendedInfixSuggester suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
BlendedInfixSuggester suggester = new BlendedInfixSuggester(TEST_VERSION_CURRENT, newFSDirectory(tempDir), a, a,
|
||||||
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS, BlendedInfixSuggester.BlenderType.POSITION_RECIPROCAL,
|
AnalyzingInfixSuggester.DEFAULT_MIN_PREFIX_CHARS,
|
||||||
BlendedInfixSuggester.DEFAULT_NUM_FACTOR);
|
BlendedInfixSuggester.BlenderType.POSITION_RECIPROCAL,
|
||||||
|
BlendedInfixSuggester.DEFAULT_NUM_FACTOR, false);
|
||||||
suggester.build(new InputArrayIterator(keys));
|
suggester.build(new InputArrayIterator(keys));
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -94,7 +94,7 @@ public class AnalyzingInfixLookupFactory extends LookupFactory {
|
||||||
try {
|
try {
|
||||||
return new AnalyzingInfixSuggester(core.getSolrConfig().luceneMatchVersion,
|
return new AnalyzingInfixSuggester(core.getSolrConfig().luceneMatchVersion,
|
||||||
FSDirectory.open(new File(indexPath)), indexAnalyzer,
|
FSDirectory.open(new File(indexPath)), indexAnalyzer,
|
||||||
queryAnalyzer, minPrefixChars);
|
queryAnalyzer, minPrefixChars, true);
|
||||||
} catch (IOException e) {
|
} catch (IOException e) {
|
||||||
throw new RuntimeException();
|
throw new RuntimeException();
|
||||||
}
|
}
|
||||||
|
|
|
@ -100,7 +100,7 @@ public class BlendedInfixLookupFactory extends AnalyzingInfixLookupFactory {
|
||||||
return new BlendedInfixSuggester(core.getSolrConfig().luceneMatchVersion,
|
return new BlendedInfixSuggester(core.getSolrConfig().luceneMatchVersion,
|
||||||
FSDirectory.open(new File(indexPath)),
|
FSDirectory.open(new File(indexPath)),
|
||||||
indexAnalyzer, queryAnalyzer, minPrefixChars,
|
indexAnalyzer, queryAnalyzer, minPrefixChars,
|
||||||
blenderType, numFactor);
|
blenderType, numFactor, true);
|
||||||
} catch (IOException e) {
|
} catch (IOException e) {
|
||||||
throw new RuntimeException();
|
throw new RuntimeException();
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue