mirror of
https://github.com/apache/lucene.git
synced 2025-02-09 11:35:14 +00:00
add comment and test for ngram token filter
This commit is contained in:
parent
01f2a87c67
commit
80e2854247
@ -79,6 +79,28 @@ public class TestNGramFilters extends BaseTokenStreamFactoryTestCase {
|
|||||||
new String[] { "te", "tes", "es", "est", "st" });
|
new String[] { "te", "tes", "es", "est", "st" });
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Test NGramFilterFactory on tokens with payloads
|
||||||
|
*/
|
||||||
|
public void testNGramFilterPayload() throws Exception {
|
||||||
|
Reader reader = new StringReader("test|0.1");
|
||||||
|
TokenStream stream = whitespaceMockTokenizer(reader);
|
||||||
|
stream = tokenFilterFactory("DelimitedPayload", "encoder", "float").create(stream);
|
||||||
|
stream = tokenFilterFactory("NGram", "minGramSize", "1", "maxGramSize", "2").create(stream);
|
||||||
|
|
||||||
|
stream.reset();
|
||||||
|
while (stream.incrementToken()) {
|
||||||
|
PayloadAttribute payAttr = stream.getAttribute(PayloadAttribute.class);
|
||||||
|
assertNotNull(payAttr);
|
||||||
|
BytesRef payData = payAttr.getPayload();
|
||||||
|
assertNotNull(payData);
|
||||||
|
float payFloat = PayloadHelper.decodeFloat(payData.bytes);
|
||||||
|
assertEquals(0.1f, payFloat, 0.0f);
|
||||||
|
}
|
||||||
|
stream.end();
|
||||||
|
stream.close();
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Test EdgeNGramTokenizerFactory
|
* Test EdgeNGramTokenizerFactory
|
||||||
*/
|
*/
|
||||||
@ -127,6 +149,9 @@ public class TestNGramFilters extends BaseTokenStreamFactoryTestCase {
|
|||||||
new String[] { "t", "te" });
|
new String[] { "t", "te" });
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Test EdgeNGramFilterFactory on tokens with payloads
|
||||||
|
*/
|
||||||
public void testEdgeNGramFilterPayload() throws Exception {
|
public void testEdgeNGramFilterPayload() throws Exception {
|
||||||
Reader reader = new StringReader("test|0.1");
|
Reader reader = new StringReader("test|0.1");
|
||||||
TokenStream stream = whitespaceMockTokenizer(reader);
|
TokenStream stream = whitespaceMockTokenizer(reader);
|
||||||
|
Loading…
x
Reference in New Issue
Block a user