Fix numeric terms aggregations with includes/excludes and minDocCount=0 (#22141)

For minDocCount=0 the numeric terms aggregator should also check the includes/excludes when buckets with empty count are added to the result.
This change fixes this bug and adds a test for it.

Fixes #22140
This commit is contained in:
Jim Ferenczi 2016-12-14 12:37:11 +01:00 committed by GitHub
parent 571b20137a
commit 23d11ed729
2 changed files with 33 additions and 18 deletions

View File

@ -113,7 +113,10 @@ public class LongTermsAggregator extends TermsAggregator {
values.setDocument(docId); values.setDocument(docId);
final int valueCount = values.count(); final int valueCount = values.count();
for (int i = 0; i < valueCount; ++i) { for (int i = 0; i < valueCount; ++i) {
bucketOrds.add(values.valueAt(i)); long value = values.valueAt(i);
if (longFilter == null || longFilter.accept(value)) {
bucketOrds.add(value);
}
} }
} }
} }

View File

@ -305,41 +305,53 @@ public class LongTermsIT extends AbstractTermsTestCase {
long includes[] = { 1, 2, 3, 98 }; long includes[] = { 1, 2, 3, 98 };
long excludes[] = { -1, 2, 4 }; long excludes[] = { -1, 2, 4 };
long empty[] = {}; long empty[] = {};
testIncludeExcludeResults(includes, empty, new long[] { 1, 2, 3 }); testIncludeExcludeResults(1, includes, empty, new long[] { 1, 2, 3 }, new long[0]);
testIncludeExcludeResults(includes, excludes, new long[] { 1, 3 }); testIncludeExcludeResults(1, includes, excludes, new long[] { 1, 3 }, new long[0]);
testIncludeExcludeResults(empty, excludes, new long[] { 0, 1, 3 }); testIncludeExcludeResults(1, empty, excludes, new long[] { 0, 1, 3 }, new long[0]);
testIncludeExcludeResults(0, includes, empty, new long[] { 1, 2, 3}, new long[] { 98 });
testIncludeExcludeResults(0, includes, excludes, new long[] { 1, 3 }, new long[] { 98 });
testIncludeExcludeResults(0, empty, excludes, new long[] { 0, 1, 3 }, new long[] {5, 6, 7, 8, 9, 10, 11});
} }
private void testIncludeExcludeResults(long[] includes, long[] excludes, long[] expecteds) { private void testIncludeExcludeResults(int minDocCount, long[] includes, long[] excludes,
long[] expectedWithCounts, long[] expectedZeroCounts) {
SearchResponse response = client().prepareSearch("idx").setTypes("type") SearchResponse response = client().prepareSearch("idx").setTypes("type")
.addAggregation(terms("terms") .addAggregation(terms("terms")
.field(SINGLE_VALUED_FIELD_NAME) .field(SINGLE_VALUED_FIELD_NAME)
.includeExclude(new IncludeExclude(includes, excludes)) .includeExclude(new IncludeExclude(includes, excludes))
.collectMode(randomFrom(SubAggCollectionMode.values()))) .collectMode(randomFrom(SubAggCollectionMode.values()))
.minDocCount(minDocCount))
.execute().actionGet(); .execute().actionGet();
assertSearchResponse(response); assertSearchResponse(response);
Terms terms = response.getAggregations().get("terms"); Terms terms = response.getAggregations().get("terms");
assertThat(terms, notNullValue()); assertThat(terms, notNullValue());
assertThat(terms.getName(), equalTo("terms")); assertThat(terms.getName(), equalTo("terms"));
assertThat(terms.getBuckets().size(), equalTo(expecteds.length)); assertThat(terms.getBuckets().size(), equalTo(expectedWithCounts.length + expectedZeroCounts.length));
for (int i = 0; i < expecteds.length; i++) { for (int i = 0; i < expectedWithCounts.length; i++) {
Terms.Bucket bucket = terms.getBucketByKey("" + expecteds[i]); Terms.Bucket bucket = terms.getBucketByKey("" + expectedWithCounts[i]);
assertThat(bucket, notNullValue()); assertThat(bucket, notNullValue());
assertThat(bucket.getDocCount(), equalTo(1L)); assertThat(bucket.getDocCount(), equalTo(1L));
} }
for (int i = 0; i < expectedZeroCounts.length; i++) {
Terms.Bucket bucket = terms.getBucketByKey("" + expectedZeroCounts[i]);
assertThat(bucket, notNullValue());
assertThat(bucket.getDocCount(), equalTo(0L));
}
} }
public void testSingleValueFieldWithPartitionedFiltering() throws Exception { public void testSingleValueFieldWithPartitionedFiltering() throws Exception {
runTestFieldWithPartitionedFiltering(SINGLE_VALUED_FIELD_NAME); runTestFieldWithPartitionedFiltering(SINGLE_VALUED_FIELD_NAME);
} }
public void testMultiValueFieldWithPartitionedFiltering() throws Exception { public void testMultiValueFieldWithPartitionedFiltering() throws Exception {
runTestFieldWithPartitionedFiltering(MULTI_VALUED_FIELD_NAME); runTestFieldWithPartitionedFiltering(MULTI_VALUED_FIELD_NAME);
} }
private void runTestFieldWithPartitionedFiltering(String field) throws Exception { private void runTestFieldWithPartitionedFiltering(String field) throws Exception {
// Find total number of unique terms // Find total number of unique terms
SearchResponse allResponse = client().prepareSearch("idx").setTypes("type") SearchResponse allResponse = client().prepareSearch("idx").setTypes("type")
@ -348,8 +360,8 @@ public class LongTermsIT extends AbstractTermsTestCase {
Terms terms = allResponse.getAggregations().get("terms"); Terms terms = allResponse.getAggregations().get("terms");
assertThat(terms, notNullValue()); assertThat(terms, notNullValue());
assertThat(terms.getName(), equalTo("terms")); assertThat(terms.getName(), equalTo("terms"));
int expectedCardinality = terms.getBuckets().size(); int expectedCardinality = terms.getBuckets().size();
// Gather terms using partitioned aggregations // Gather terms using partitioned aggregations
final int numPartitions = randomIntBetween(2, 4); final int numPartitions = randomIntBetween(2, 4);
Set<Number> foundTerms = new HashSet<>(); Set<Number> foundTerms = new HashSet<>();
@ -368,9 +380,9 @@ public class LongTermsIT extends AbstractTermsTestCase {
foundTerms.add(bucket.getKeyAsNumber()); foundTerms.add(bucket.getKeyAsNumber());
} }
} }
assertEquals(expectedCardinality, foundTerms.size()); assertEquals(expectedCardinality, foundTerms.size());
} }
public void testSingleValueFieldWithMaxSize() throws Exception { public void testSingleValueFieldWithMaxSize() throws Exception {
SearchResponse response = client().prepareSearch("idx").setTypes("high_card_type") SearchResponse response = client().prepareSearch("idx").setTypes("high_card_type")