diff --git a/docs/reference/rest-api/common-parms.asciidoc b/docs/reference/rest-api/common-parms.asciidoc index 7877ee7ae16..670551b75ff 100644 --- a/docs/reference/rest-api/common-parms.asciidoc +++ b/docs/reference/rest-api/common-parms.asciidoc @@ -666,6 +666,8 @@ are supported: * <> * <> * <> +* <> +* <> * <> * <> * <> diff --git a/x-pack/plugin/src/test/resources/rest-api-spec/test/transform/preview_transforms.yml b/x-pack/plugin/src/test/resources/rest-api-spec/test/transform/preview_transforms.yml index 1064cb54148..771f599a029 100644 --- a/x-pack/plugin/src/test/resources/rest-api-spec/test/transform/preview_transforms.yml +++ b/x-pack/plugin/src/test/resources/rest-api-spec/test/transform/preview_transforms.yml @@ -265,12 +265,12 @@ setup: "group_by": { "time": {"date_histogram": {"fixed_interval": "1h", "field": "time"}}}, "aggs": { - "vals": {"terms": {"field":"airline"}} + "vals": {"significant_terms": {"field":"airline"}} } } } - do: - catch: /Unsupported aggregation type \[terms\]/ + catch: /Unsupported aggregation type \[significant_terms\]/ transform.preview_transform: body: > { @@ -280,7 +280,7 @@ setup: "group_by": { "time": {"date_histogram": {"fixed_interval": "1h", "field": "time"}}}, "aggs": { - "vals": {"terms": {"field":"airline"}} + "vals": {"significant_terms": {"field":"airline"}} } } } diff --git a/x-pack/plugin/transform/qa/single-node-tests/src/test/java/org/elasticsearch/xpack/transform/integration/TransformPivotRestIT.java b/x-pack/plugin/transform/qa/single-node-tests/src/test/java/org/elasticsearch/xpack/transform/integration/TransformPivotRestIT.java index 992d0ad5fd4..3e39f2cbb8d 100644 --- a/x-pack/plugin/transform/qa/single-node-tests/src/test/java/org/elasticsearch/xpack/transform/integration/TransformPivotRestIT.java +++ b/x-pack/plugin/transform/qa/single-node-tests/src/test/java/org/elasticsearch/xpack/transform/integration/TransformPivotRestIT.java @@ -18,6 +18,8 @@ import org.junit.Before; import java.io.IOException; import java.time.Instant; import java.util.Arrays; +import java.util.Collections; +import java.util.HashMap; import java.util.HashSet; import java.util.List; import java.util.Map; @@ -25,11 +27,11 @@ import java.util.Set; import static org.elasticsearch.common.xcontent.XContentFactory.jsonBuilder; import static org.elasticsearch.xpack.core.security.authc.support.UsernamePasswordToken.basicAuthHeaderValue; -import static org.hamcrest.CoreMatchers.is; import static org.hamcrest.Matchers.containsString; import static org.hamcrest.Matchers.equalTo; import static org.hamcrest.Matchers.greaterThan; import static org.hamcrest.Matchers.hasSize; +import static org.hamcrest.Matchers.is; import static org.hamcrest.Matchers.lessThan; import static org.hamcrest.Matchers.not; import static org.hamcrest.Matchers.nullValue; @@ -508,6 +510,97 @@ public class TransformPivotRestIT extends TransformRestTestCase { assertDateHistogramPivot(REVIEWS_DATE_NANO_INDEX_NAME); } + @SuppressWarnings("unchecked") + public void testPivotWithTermsAgg() throws Exception { + String transformId = "simple_terms_agg_pivot"; + String transformIndex = "pivot_reviews_via_histogram_with_terms_agg"; + setupDataAccessRole(DATA_ACCESS_ROLE, REVIEWS_INDEX_NAME, transformIndex); + + final Request createTransformRequest = createRequestWithAuth( + "PUT", + getTransformEndpoint() + transformId, + BASIC_AUTH_VALUE_TRANSFORM_ADMIN_WITH_SOME_DATA_ACCESS + ); + + String config = "{" + + " \"source\": {\"index\":\"" + + REVIEWS_INDEX_NAME + + "\"}," + + " \"dest\": {\"index\":\"" + + transformIndex + + "\"},"; + + config += " \"pivot\": {" + + " \"group_by\": {" + + " \"every_2\": {" + + " \"histogram\": {" + + " \"interval\": 2,\"field\":\"stars\"" + + " } } }," + + " \"aggregations\": {" + + " \"common_users\": {" + + " \"terms\": {" + + " \"field\": \"user_id\"," + + " \"size\": 2" + + " }," + + " \"aggs\" : {" + + " \"common_businesses\": {" + + " \"terms\": {" + + " \"field\": \"business_id\"," + + " \"size\": 2" + + " }}" + + " } " + +" }," + + " \"rare_users\": {" + + " \"rare_terms\": {" + + " \"field\": \"user_id\"" + + " } } } }" + + "}"; + + createTransformRequest.setJsonEntity(config); + Map createTransformResponse = entityAsMap(client().performRequest(createTransformRequest)); + assertThat(createTransformResponse.get("acknowledged"), equalTo(Boolean.TRUE)); + + startAndWaitForTransform(transformId, transformIndex); + assertTrue(indexExists(transformIndex)); + + // we expect 3 documents as there shall be 5 unique star values and we are bucketing every 2 starting at 0 + Map indexStats = getAsMap(transformIndex + "/_stats"); + assertEquals(3, XContentMapValues.extractValue("_all.total.docs.count", indexStats)); + + // get and check some term results + Map searchResult = getAsMap(transformIndex + "/_search?q=every_2:2.0"); + + assertEquals(1, XContentMapValues.extractValue("hits.total.value", searchResult)); + Map commonUsers = (Map) ((List) XContentMapValues.extractValue( + "hits.hits._source.common_users", + searchResult + )).get(0); + Map rareUsers = (Map) ((List) XContentMapValues.extractValue( + "hits.hits._source.rare_users", + searchResult + )).get(0); + assertThat(commonUsers, is(not(nullValue()))); + assertThat(commonUsers, equalTo(new HashMap(){{ + put("user_10", + Collections.singletonMap( + "common_businesses", + new HashMap(){{ + put("business_12", 6); + put("business_9", 4); + }})); + put("user_0", Collections.singletonMap( + "common_businesses", + new HashMap(){{ + put("business_0", 35); + }})); + }})); + assertThat(rareUsers, is(not(nullValue()))); + assertThat(rareUsers, equalTo(new HashMap(){{ + put("user_5", 1); + put("user_12", 1); + }})); + } + private void assertDateHistogramPivot(String indexName) throws Exception { String transformId = "simple_date_histogram_pivot_" + indexName; String transformIndex = "pivot_reviews_via_date_histogram_" + indexName; diff --git a/x-pack/plugin/transform/src/main/java/org/elasticsearch/xpack/transform/transforms/pivot/AggregationResultUtils.java b/x-pack/plugin/transform/src/main/java/org/elasticsearch/xpack/transform/transforms/pivot/AggregationResultUtils.java index 1475cd0babd..fbdffd1ec86 100644 --- a/x-pack/plugin/transform/src/main/java/org/elasticsearch/xpack/transform/transforms/pivot/AggregationResultUtils.java +++ b/x-pack/plugin/transform/src/main/java/org/elasticsearch/xpack/transform/transforms/pivot/AggregationResultUtils.java @@ -16,6 +16,7 @@ import org.elasticsearch.common.geo.parsers.ShapeParser; import org.elasticsearch.search.aggregations.Aggregation; import org.elasticsearch.search.aggregations.AggregationBuilder; import org.elasticsearch.search.aggregations.PipelineAggregationBuilder; +import org.elasticsearch.search.aggregations.bucket.MultiBucketsAggregation; import org.elasticsearch.search.aggregations.bucket.SingleBucketAggregation; import org.elasticsearch.search.aggregations.bucket.composite.CompositeAggregation; import org.elasticsearch.search.aggregations.metrics.GeoBounds; @@ -52,6 +53,7 @@ public final class AggregationResultUtils { tempMap.put(GeoBounds.class.getName(), new GeoBoundsAggExtractor()); tempMap.put(Percentiles.class.getName(), new PercentilesAggExtractor()); tempMap.put(SingleBucketAggregation.class.getName(), new SingleBucketAggExtractor()); + tempMap.put(MultiBucketsAggregation.class.getName(), new MultiBucketsAggExtractor()); TYPE_VALUE_EXTRACTOR_MAP = Collections.unmodifiableMap(tempMap); } @@ -120,6 +122,8 @@ public final class AggregationResultUtils { return TYPE_VALUE_EXTRACTOR_MAP.get(Percentiles.class.getName()); } else if (aggregation instanceof SingleBucketAggregation) { return TYPE_VALUE_EXTRACTOR_MAP.get(SingleBucketAggregation.class.getName()); + } else if (aggregation instanceof MultiBucketsAggregation) { + return TYPE_VALUE_EXTRACTOR_MAP.get(MultiBucketsAggregation.class.getName()); } else { // Execution should never reach this point! // Creating transforms with unsupported aggregations shall not be possible @@ -246,6 +250,35 @@ public final class AggregationResultUtils { } } + static class MultiBucketsAggExtractor implements AggValueExtractor { + @Override + public Object value(Aggregation agg, Map fieldTypeMap, String lookupFieldPrefix) { + MultiBucketsAggregation aggregation = (MultiBucketsAggregation) agg; + + HashMap nested = new HashMap<>(); + + for (MultiBucketsAggregation.Bucket bucket : aggregation.getBuckets()) { + if (bucket.getAggregations().iterator().hasNext() == false) { + nested.put(bucket.getKeyAsString(), bucket.getDocCount()); + } else { + HashMap nestedBucketObject = new HashMap<>(); + for (Aggregation subAgg : bucket.getAggregations()) { + nestedBucketObject.put( + subAgg.getName(), + getExtractor(subAgg).value( + subAgg, + fieldTypeMap, + lookupFieldPrefix.isEmpty() ? agg.getName() : lookupFieldPrefix + "." + agg.getName() + ) + ); + } + nested.put(bucket.getKeyAsString(), nestedBucketObject); + } + } + return nested; + } + } + static class ScriptedMetricAggExtractor implements AggValueExtractor { @Override public Object value(Aggregation agg, Map fieldTypeMap, String lookupFieldPrefix) { diff --git a/x-pack/plugin/transform/src/main/java/org/elasticsearch/xpack/transform/transforms/pivot/Aggregations.java b/x-pack/plugin/transform/src/main/java/org/elasticsearch/xpack/transform/transforms/pivot/Aggregations.java index 7a626150500..a011931a57a 100644 --- a/x-pack/plugin/transform/src/main/java/org/elasticsearch/xpack/transform/transforms/pivot/Aggregations.java +++ b/x-pack/plugin/transform/src/main/java/org/elasticsearch/xpack/transform/transforms/pivot/Aggregations.java @@ -31,6 +31,7 @@ public final class Aggregations { private static final String SOURCE = "_source"; public static final String FLOAT = "float"; + public static final String FLATTENED = "flattened"; public static final String SCALED_FLOAT = "scaled_float"; public static final String DOUBLE = "double"; public static final String LONG = "long"; @@ -69,14 +70,12 @@ public final class Aggregations { "nested", "percentile_ranks", "range", - "rare_terms", "reverse_nested", "sampler", "significant_terms", // https://github.com/elastic/elasticsearch/issues/51073 "significant_text", "stats", // https://github.com/elastic/elasticsearch/issues/51925 "string_stats", // https://github.com/elastic/elasticsearch/issues/51925 - "terms", // https://github.com/elastic/elasticsearch/issues/51073 "top_hits", "top_metrics", // https://github.com/elastic/elasticsearch/issues/52236 "t_test" // https://github.com/elastic/elasticsearch/issues/54503 @@ -107,7 +106,9 @@ public final class Aggregations { BUCKET_SELECTOR("bucket_selector", DYNAMIC), BUCKET_SCRIPT("bucket_script", DYNAMIC), PERCENTILES("percentiles", DOUBLE), - FILTER("filter", LONG); + FILTER("filter", LONG), + TERMS("terms", FLATTENED), + RARE_TERMS("rare_terms", FLATTENED); private final String aggregationType; private final String targetMapping; diff --git a/x-pack/plugin/transform/src/test/java/org/elasticsearch/xpack/transform/transforms/pivot/AggregationsTests.java b/x-pack/plugin/transform/src/test/java/org/elasticsearch/xpack/transform/transforms/pivot/AggregationsTests.java index a2afbddb412..f1ed70be07c 100644 --- a/x-pack/plugin/transform/src/test/java/org/elasticsearch/xpack/transform/transforms/pivot/AggregationsTests.java +++ b/x-pack/plugin/transform/src/test/java/org/elasticsearch/xpack/transform/transforms/pivot/AggregationsTests.java @@ -90,6 +90,16 @@ public class AggregationsTests extends ESTestCase { assertEquals("long", Aggregations.resolveTargetMapping("filter", "long")); assertEquals("long", Aggregations.resolveTargetMapping("filter", "double")); + // terms + assertEquals("flattened", Aggregations.resolveTargetMapping("terms", null)); + assertEquals("flattened", Aggregations.resolveTargetMapping("terms", "keyword")); + assertEquals("flattened", Aggregations.resolveTargetMapping("terms", "text")); + + // rare_terms + assertEquals("flattened", Aggregations.resolveTargetMapping("rare_terms", null)); + assertEquals("flattened", Aggregations.resolveTargetMapping("rare_terms", "text")); + assertEquals("flattened", Aggregations.resolveTargetMapping("rare_terms", "keyword")); + // corner case: source type null assertEquals(null, Aggregations.resolveTargetMapping("min", null)); }