From dd63f543251927ef2410baa69666db638d1ede04 Mon Sep 17 00:00:00 2001 From: Gian Merlino Date: Fri, 16 Dec 2016 17:15:59 -0800 Subject: [PATCH] Built-in SQL. (#3682) --- NOTICE | 6 + benchmarks/pom.xml | 17 + .../druid/benchmark/query/SqlBenchmark.java | 237 ++ docs/content/configuration/broker.md | 24 + docs/content/querying/sql.md | 128 +- pom.xml | 42 +- server/pom.xml | 4 + .../initialization/jetty/JettyBindings.java | 10 +- .../jetty/JettyServerModule.java | 6 +- services/pom.xml | 5 + .../src/main/java/io/druid/cli/CliBroker.java | 5 +- .../cli/QueryJettyServerInitializer.java | 23 +- sql/pom.xml | 99 + .../io/druid/sql/avatica/AvaticaMonitor.java | 183 ++ .../sql/avatica/DruidAvaticaHandler.java | 77 + .../io/druid/sql/avatica/ServerConfig.java | 41 + .../io/druid/sql/calcite/DruidSchema.java | 358 +++ .../sql/calcite/aggregation/Aggregation.java | 196 ++ .../aggregation/PostAggregatorFactory.java | 57 + .../AbstractExpressionConversion.java | 57 + .../CharLengthExpressionConversion.java | 61 + .../expression/ExpressionConversion.java | 54 + .../expression/ExpressionConverter.java | 108 + .../sql/calcite/expression/Expressions.java | 519 ++++ .../ExtractExpressionConversion.java | 87 + .../sql/calcite/expression/ExtractionFns.java | 87 + .../expression/FloorExpressionConversion.java | 89 + .../sql/calcite/expression/RowExtraction.java | 185 ++ .../SubstringExpressionConversion.java | 71 + .../sql/calcite/expression/TimeUnits.java | 76 + .../calcite/filtration/BottomUpTransform.java | 95 + .../sql/calcite/filtration/BoundRefKey.java | 112 + .../sql/calcite/filtration/BoundValue.java | 87 + .../druid/sql/calcite/filtration/Bounds.java | 117 + .../filtration/CombineAndSimplifyBounds.java | 230 ++ .../filtration/ConvertBoundsToSelectors.java | 72 + .../filtration/ConvertSelectorsToIns.java | 106 + .../sql/calcite/filtration/Filtration.java | 189 ++ .../MoveMarkerFiltersToIntervals.java | 50 + .../MoveTimeFiltersToIntervals.java | 172 ++ .../sql/calcite/filtration/RangeSets.java | 136 + .../ValidateNoMarkerFiltersRemain.java | 47 + .../calcite/planner/AggregateValuesRule.java | 98 + .../druid/sql/calcite/planner/Calcites.java | 89 + .../calcite/planner/DruidConvertletTable.java | 59 + .../sql/calcite/planner/DruidPlannerImpl.java | 68 + .../sql/calcite/planner/PlannerConfig.java | 145 + .../io/druid/sql/calcite/planner/Rules.java | 214 ++ .../sql/calcite/rel/DruidConvention.java | 84 + .../sql/calcite/rel/DruidQueryBuilder.java | 388 +++ .../druid/sql/calcite/rel/DruidQueryRel.java | 168 ++ .../io/druid/sql/calcite/rel/DruidRel.java | 70 + .../druid/sql/calcite/rel/DruidSemiJoin.java | 317 +++ .../io/druid/sql/calcite/rel/Grouping.java | 139 + .../io/druid/sql/calcite/rel/QueryMaker.java | 435 +++ .../sql/calcite/rel/SelectProjection.java | 116 + .../rule/DruidBindableConverterRule.java | 53 + .../sql/calcite/rule/DruidFilterRule.java | 66 + .../rule/DruidSelectProjectionRule.java | 125 + .../sql/calcite/rule/DruidSelectSortRule.java | 74 + .../sql/calcite/rule/DruidSemiJoinRule.java | 59 + .../druid/sql/calcite/rule/GroupByRules.java | 787 ++++++ .../druid/sql/calcite/table/DruidTable.java | 210 ++ .../druid/sql/calcite/table/DruidTables.java | 76 + .../java/io/druid/sql/guice/SqlModule.java | 88 + .../main/java/io/druid/sql/http/SqlQuery.java | 72 + .../java/io/druid/sql/http/SqlResource.java | 152 + .../sql/avatica/DruidAvaticaHandlerTest.java | 268 ++ .../druid/sql/calcite/CalciteQueryTest.java | 2483 +++++++++++++++++ .../io/druid/sql/calcite/DruidSchemaTest.java | 133 + .../calcite/filtration/FiltrationTest.java | 62 + .../sql/calcite/http/SqlResourceTest.java | 161 ++ .../druid/sql/calcite/util/CalciteTests.java | 247 ++ .../SpecificSegmentsQuerySegmentWalker.java | 217 ++ .../calcite/util/TestServerInventoryView.java | 95 + 75 files changed, 12132 insertions(+), 11 deletions(-) create mode 100644 benchmarks/src/main/java/io/druid/benchmark/query/SqlBenchmark.java create mode 100644 sql/pom.xml create mode 100644 sql/src/main/java/io/druid/sql/avatica/AvaticaMonitor.java create mode 100644 sql/src/main/java/io/druid/sql/avatica/DruidAvaticaHandler.java create mode 100644 sql/src/main/java/io/druid/sql/avatica/ServerConfig.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/DruidSchema.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/aggregation/Aggregation.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/aggregation/PostAggregatorFactory.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/AbstractExpressionConversion.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/CharLengthExpressionConversion.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/ExpressionConversion.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/ExpressionConverter.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/Expressions.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/ExtractExpressionConversion.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/ExtractionFns.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/FloorExpressionConversion.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/RowExtraction.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/SubstringExpressionConversion.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/expression/TimeUnits.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/BottomUpTransform.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/BoundRefKey.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/BoundValue.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/Bounds.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/CombineAndSimplifyBounds.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/ConvertBoundsToSelectors.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/ConvertSelectorsToIns.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/Filtration.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/MoveMarkerFiltersToIntervals.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/MoveTimeFiltersToIntervals.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/RangeSets.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/filtration/ValidateNoMarkerFiltersRemain.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/planner/AggregateValuesRule.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/planner/Calcites.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/planner/DruidConvertletTable.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/planner/DruidPlannerImpl.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/planner/PlannerConfig.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/planner/Rules.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rel/DruidConvention.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rel/DruidQueryBuilder.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rel/DruidQueryRel.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rel/DruidRel.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rel/DruidSemiJoin.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rel/Grouping.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rel/QueryMaker.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rel/SelectProjection.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rule/DruidBindableConverterRule.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rule/DruidFilterRule.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rule/DruidSelectProjectionRule.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rule/DruidSelectSortRule.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rule/DruidSemiJoinRule.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/rule/GroupByRules.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/table/DruidTable.java create mode 100644 sql/src/main/java/io/druid/sql/calcite/table/DruidTables.java create mode 100644 sql/src/main/java/io/druid/sql/guice/SqlModule.java create mode 100644 sql/src/main/java/io/druid/sql/http/SqlQuery.java create mode 100644 sql/src/main/java/io/druid/sql/http/SqlResource.java create mode 100644 sql/src/test/java/io/druid/sql/avatica/DruidAvaticaHandlerTest.java create mode 100644 sql/src/test/java/io/druid/sql/calcite/CalciteQueryTest.java create mode 100644 sql/src/test/java/io/druid/sql/calcite/DruidSchemaTest.java create mode 100644 sql/src/test/java/io/druid/sql/calcite/filtration/FiltrationTest.java create mode 100644 sql/src/test/java/io/druid/sql/calcite/http/SqlResourceTest.java create mode 100644 sql/src/test/java/io/druid/sql/calcite/util/CalciteTests.java create mode 100644 sql/src/test/java/io/druid/sql/calcite/util/SpecificSegmentsQuerySegmentWalker.java create mode 100644 sql/src/test/java/io/druid/sql/calcite/util/TestServerInventoryView.java diff --git a/NOTICE b/NOTICE index 1f91649e555..cb8a439535b 100644 --- a/NOTICE +++ b/NOTICE @@ -44,3 +44,9 @@ This product contains a modified version of Metamarkets bytebuffer-collections l * https://github.com/metamx/bytebuffer-collections * COMMIT TAG: * https://github.com/metamx/bytebuffer-collections/commit/3d1e7c8 + +This product contains SQL query planning code adapted from Apache Calcite + * LICENSE: + * https://github.com/apache/calcite/blob/master/LICENSE (Apache License, Version 2.0) + * HOMEPAGE: + * https://calcite.apache.org/ diff --git a/benchmarks/pom.xml b/benchmarks/pom.xml index 732ff2ab8eb..d87cd693eb3 100644 --- a/benchmarks/pom.xml +++ b/benchmarks/pom.xml @@ -56,6 +56,23 @@ druid-server ${project.parent.version} + + io.druid + druid-sql + ${project.parent.version} + + + io.druid + druid-processing + ${project.parent.version} + test-jar + + + io.druid + druid-sql + ${project.parent.version} + test-jar + com.github.wnameless json-flattener diff --git a/benchmarks/src/main/java/io/druid/benchmark/query/SqlBenchmark.java b/benchmarks/src/main/java/io/druid/benchmark/query/SqlBenchmark.java new file mode 100644 index 00000000000..8e40734c713 --- /dev/null +++ b/benchmarks/src/main/java/io/druid/benchmark/query/SqlBenchmark.java @@ -0,0 +1,237 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.benchmark.query; + +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +import com.google.common.collect.ImmutableMap; +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import com.google.common.hash.Hashing; +import com.google.common.io.Files; +import io.druid.benchmark.datagen.BenchmarkDataGenerator; +import io.druid.benchmark.datagen.BenchmarkSchemaInfo; +import io.druid.benchmark.datagen.BenchmarkSchemas; +import io.druid.common.utils.JodaUtils; +import io.druid.data.input.InputRow; +import io.druid.data.input.Row; +import io.druid.granularity.QueryGranularities; +import io.druid.java.util.common.guava.Sequence; +import io.druid.java.util.common.guava.Sequences; +import io.druid.java.util.common.logger.Logger; +import io.druid.query.TableDataSource; +import io.druid.query.aggregation.AggregatorFactory; +import io.druid.query.aggregation.CountAggregatorFactory; +import io.druid.query.aggregation.hyperloglog.HyperUniquesSerde; +import io.druid.query.dimension.DefaultDimensionSpec; +import io.druid.query.dimension.DimensionSpec; +import io.druid.query.groupby.GroupByQuery; +import io.druid.segment.column.ValueType; +import io.druid.segment.serde.ComplexMetrics; +import io.druid.sql.calcite.planner.Calcites; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.table.DruidTable; +import io.druid.sql.calcite.util.CalciteTests; +import io.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker; +import org.apache.calcite.jdbc.CalciteConnection; +import org.apache.calcite.schema.Schema; +import org.apache.calcite.schema.Table; +import org.apache.calcite.schema.impl.AbstractSchema; +import org.apache.commons.io.FileUtils; +import org.joda.time.Interval; +import org.openjdk.jmh.annotations.Benchmark; +import org.openjdk.jmh.annotations.BenchmarkMode; +import org.openjdk.jmh.annotations.Fork; +import org.openjdk.jmh.annotations.Level; +import org.openjdk.jmh.annotations.Measurement; +import org.openjdk.jmh.annotations.Mode; +import org.openjdk.jmh.annotations.OutputTimeUnit; +import org.openjdk.jmh.annotations.Param; +import org.openjdk.jmh.annotations.Scope; +import org.openjdk.jmh.annotations.Setup; +import org.openjdk.jmh.annotations.State; +import org.openjdk.jmh.annotations.TearDown; +import org.openjdk.jmh.annotations.Warmup; +import org.openjdk.jmh.infra.Blackhole; + +import java.io.File; +import java.sql.ResultSet; +import java.sql.ResultSetMetaData; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.List; +import java.util.Map; +import java.util.concurrent.TimeUnit; + +/** + * Benchmark that compares the same groupBy query through the native query layer and through the SQL layer. + */ +@State(Scope.Benchmark) +@Fork(jvmArgsPrepend = "-server", value = 1) +@Warmup(iterations = 15) +@Measurement(iterations = 30) +public class SqlBenchmark +{ + @Param({"10000", "100000", "200000"}) + private int rowsPerSegment; + + private static final Logger log = new Logger(SqlBenchmark.class); + private static final int RNG_SEED = 9999; + + private File tmpDir; + private SpecificSegmentsQuerySegmentWalker walker; + private CalciteConnection calciteConnection; + private GroupByQuery groupByQuery; + private String sqlQuery; + + @Setup(Level.Trial) + public void setup() throws Exception + { + tmpDir = Files.createTempDir(); + log.info("Starting benchmark setup using tmpDir[%s], rows[%,d].", tmpDir, rowsPerSegment); + + if (ComplexMetrics.getSerdeForType("hyperUnique") == null) { + ComplexMetrics.registerSerde("hyperUnique", new HyperUniquesSerde(Hashing.murmur3_128())); + } + + final BenchmarkSchemaInfo schemaInfo = BenchmarkSchemas.SCHEMA_MAP.get("basic"); + final BenchmarkDataGenerator dataGenerator = new BenchmarkDataGenerator( + schemaInfo.getColumnSchemas(), + RNG_SEED + 1, + schemaInfo.getDataInterval(), + rowsPerSegment + ); + + final List rows = Lists.newArrayList(); + for (int i = 0; i < rowsPerSegment; i++) { + final InputRow row = dataGenerator.nextRow(); + if (i % 20000 == 0) { + log.info("%,d/%,d rows generated.", i, rowsPerSegment); + } + rows.add(row); + } + + log.info("%,d/%,d rows generated.", rows.size(), rowsPerSegment); + + final PlannerConfig plannerConfig = new PlannerConfig(); + walker = CalciteTests.createWalker(tmpDir, rows); + final Map tableMap = ImmutableMap.of( + "foo", + new DruidTable( + walker, + new TableDataSource("foo"), + plannerConfig, + ImmutableMap.of( + "__time", ValueType.LONG, + "dimSequential", ValueType.STRING, + "dimZipf", ValueType.STRING, + "dimUniform", ValueType.STRING + ) + ) + ); + final Schema druidSchema = new AbstractSchema() + { + @Override + protected Map getTableMap() + { + return tableMap; + } + }; + calciteConnection = Calcites.jdbc(druidSchema, plannerConfig); + groupByQuery = GroupByQuery + .builder() + .setDataSource("foo") + .setInterval(new Interval(JodaUtils.MIN_INSTANT, JodaUtils.MAX_INSTANT)) + .setDimensions( + Arrays.asList( + new DefaultDimensionSpec("dimZipf", "d0"), + new DefaultDimensionSpec("dimSequential", "d1") + ) + ) + .setAggregatorSpecs(Arrays.asList(new CountAggregatorFactory("c"))) + .setGranularity(QueryGranularities.ALL) + .build(); + + sqlQuery = "SELECT\n" + + " dimZipf AS d0," + + " dimSequential AS d1,\n" + + " COUNT(*) AS c\n" + + "FROM druid.foo\n" + + "GROUP BY dimZipf, dimSequential"; + } + + @TearDown(Level.Trial) + public void tearDown() throws Exception + { + if (walker != null) { + walker.close(); + walker = null; + } + + if (tmpDir != null) { + FileUtils.deleteDirectory(tmpDir); + } + } + + @Benchmark + @BenchmarkMode(Mode.AverageTime) + @OutputTimeUnit(TimeUnit.MILLISECONDS) + public void queryNative(Blackhole blackhole) throws Exception + { + final Sequence resultSequence = groupByQuery.run(walker, Maps.newHashMap()); + final ArrayList resultList = Sequences.toList(resultSequence, Lists.newArrayList()); + + for (Row row : resultList) { + blackhole.consume(row); + } + } + + @Benchmark + @BenchmarkMode(Mode.AverageTime) + @OutputTimeUnit(TimeUnit.MILLISECONDS) + public void querySql(Blackhole blackhole) throws Exception + { + final ResultSet resultSet = calciteConnection.createStatement().executeQuery(sqlQuery); + final ResultSetMetaData metaData = resultSet.getMetaData(); + + while (resultSet.next()) { + for (int i = 0; i < metaData.getColumnCount(); i++) { + blackhole.consume(resultSet.getObject(i + 1)); + } + } + } +} diff --git a/docs/content/configuration/broker.md b/docs/content/configuration/broker.md index 55c1ccf8059..0e85d94b0a6 100644 --- a/docs/content/configuration/broker.md +++ b/docs/content/configuration/broker.md @@ -85,6 +85,30 @@ See [groupBy server configuration](../querying/groupbyquery.html#server-configur |--------|-----------|-------| |`druid.query.segmentMetadata.defaultHistory`|When no interval is specified in the query, use a default interval of defaultHistory before the end time of the most recent segment, specified in ISO8601 format. This property also controls the duration of the default interval used by GET /druid/v2/datasources/{dataSourceName} interactions for retrieving datasource dimensions/metrics.|P1W| +#### SQL Server Configuration + +The broker's [built-in SQL server](../querying/sql.html) can be configured through the following properties. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.sql.enable`|Whether to enable SQL at all, including background metadata fetching. If false, this overrides all other SQL-related properties and disables SQL metadata, serving, and planning completely.|false| +|`druid.sql.server.enableAvatica`|Whether to enable an Avatica server at `/druid/v2/sql/avatica/`.|false| +|`druid.sql.server.enableJsonOverHttp`|Whether to enable a simple JSON over HTTP route at `/druid/v2/sql/`.|true| + +#### SQL Planner Configuration + +The broker's [SQL planner](../querying/sql.html) can be configured through the following properties. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.sql.planner.maxSemiJoinRowsInMemory`|Maximum number of rows to keep in memory for executing two-stage semi-join queries like `SELECT * FROM Employee WHERE DeptName IN (SELECT DeptName FROM Dept)`.|100000| +|`druid.sql.planner.maxTopNLimit`|Maximum threshold for a [TopN query](../querying/topnquery.html). Higher limits will be planned as [GroupBy queries](../querying/groupbyquery.html) instead.|100000| +|`druid.sql.planner.metadataRefreshPeriod`|Throttle for metadata refreshes.|PT1M| +|`druid.sql.planner.selectPageSize`|Page size threshold for [Select queries](../querying/select-query.html). Select queries for larger resultsets will be issued back-to-back using pagination.|1000| +|`druid.sql.planner.useApproximateCountDistinct`|Whether to use an approximate cardinalty algorithm for `COUNT(DISTINCT foo)`.|true| +|`druid.sql.planner.useApproximateTopN`|Whether to use approximate [TopN queries](../querying/topnquery.html) when a SQL query could be expressed as such. If false, exact [GroupBy queries](../querying/groupbyquery.html) will be used instead.|true| +|`druid.sql.planner.useFallback`|Whether to evaluate operations on the broker when they cannot be expressed as Druid queries. This option is not recommended for production since it can generate unscalable query plans. If false, SQL queries that cannot be translated to Druid queries will fail.|false| + ### Caching You can optionally only configure caching to be enabled on the broker by setting caching configs here. diff --git a/docs/content/querying/sql.md b/docs/content/querying/sql.md index 10e928b85c9..98da2be86aa 100644 --- a/docs/content/querying/sql.md +++ b/docs/content/querying/sql.md @@ -2,6 +2,130 @@ layout: doc_page --- # SQL Support for Druid -Full SQL is currently not supported with Druid. SQL libraries on top of Druid have been contributed by the community and can be found on our [libraries](../development/libraries.html) page. -The community SQL libraries are not yet as expressive as Druid's native query language. +## Built-in SQL + +
+Built-in SQL is an experimental feature. The API described here is +subject to change. +
+ +Druid includes a native SQL layer with an [Apache Calcite](https://calcite.apache.org/)-based parser and planner. All +parsing and planning takes place on the Broker, where SQL is converted to native Druid queries. Those native Druid +queries are then passed down to data nodes. Each Druid dataSource appears as a table in the "druid" schema. + +Add "EXPLAIN PLAN FOR" to the beginning of any query to see how Druid will plan that query. + +### Querying with JDBC + +You can make Druid SQL queries using the [Avatica JDBC driver](https://calcite.apache.org/avatica/downloads/). Once +you've downloaded the Avatica client jar, add it to your classpath and use the connect string: + +``` +jdbc:avatica:remote:url=http://BROKER:8082/druid/v2/sql/avatica/ +``` + +Example code: + +```java +Connection connection = DriverManager.getConnection("jdbc:avatica:remote:url=http://localhost:8082/druid/v2/sql/avatica/"); +ResultSet resultSet = connection.createStatement().executeQuery("SELECT COUNT(*) AS cnt FROM druid.foo"); +while (resultSet.next()) { + // Do something +} +``` + +Table metadata is available over JDBC using `connection.getMetaData()`. + +Parameterized queries don't work properly, so avoid those. + +### Querying with JSON over HTTP + +You can make Druid SQL queries using JSON over HTTP by POSTing to the endpoint `/druid/v2/sql/`. The request format +is: + +```json +{ + "query" : "SELECT COUNT(*) FROM druid.ds WHERE foo = ?" +} +``` + +You can use _curl_ to send these queries from the command-line: + +```bash +curl -XPOST -H'Content-Type: application/json' http://BROKER:8082/druid/v2/sql/ -d '{"query":"SELECT COUNT(*) FROM druid.ds"}' +``` + +Metadata is not available over the HTTP API. + +### Metadata + +Druid brokers cache column type metadata for each dataSource and use it to plan SQL queries. This cache is updated +on broker startup and also periodically in the background through +[SegmentMetadata queries](../querying/segmentmetadataquery.html). Background metadata refreshing is triggered by +segments entering and exiting the cluster, and can also be throttled through configuration. + +This cached metadata is queryable through the "metadata.COLUMNS" and "metadata.TABLES" tables. When +`druid.sql.planner.useFallback` is disabled (the default), only full scans of this table are possible. For example, to +retrieve column metadata, use the query: + +```sql +SELECT * FROM metadata.COLUMNS +``` + +If `druid.sql.planner.useFallback` is enabled, full SQL is possible on metadata tables. However, useFallback is not +recommended in production since it can generate unscalable query plans. The JDBC driver allows accessing +table and column metadata through `connection.getMetaData()` even if useFallback is off. + +### Time functions + +Druid's SQL language supports a number of time operations, including: + +- `FLOOR(__time TO )` for grouping or filtering on time buckets, like `SELECT FLOOR(__time TO MONTH), SUM(cnt) FROM druid.foo GROUP BY FLOOR(__time TO MONTH)` +- `EXTRACT( FROM __time)` for grouping or filtering on time parts, like `SELECT EXTRACT(HOUR FROM __time), SUM(cnt) FROM druid.foo GROUP BY EXTRACT(HOUR FROM __time)` +- Comparisons to `TIMESTAMP '
+ + org.apache.calcite + calcite-core + ${calcite.version} + + + org.apache.calcite + calcite-linq4j + ${calcite.version} + + + org.apache.calcite.avatica + avatica-core + ${avatica.version} + + + org.apache.calcite.avatica + avatica-server + ${avatica.version} + com.google.guava guava @@ -391,6 +415,16 @@ jetty-proxy ${jetty.version} + + org.eclipse.jetty + jetty-util + ${jetty.version} + + + io.netty + netty-all + ${netty.version} + joda-time joda-time @@ -478,7 +512,7 @@ com.google.protobuf protobuf-java - 2.5.0 + 3.1.0 io.tesla.aether @@ -584,6 +618,12 @@ slf4j-api 1.6.4 + + org.apache.calcite + calcite-core + ${calcite.version} + test-jar + org.easymock easymock diff --git a/server/pom.xml b/server/pom.xml index 6a15740e2b5..485e8a51b4d 100644 --- a/server/pom.xml +++ b/server/pom.xml @@ -120,6 +120,10 @@ org.eclipse.jetty jetty-server + + org.eclipse.jetty + jetty-util + org.eclipse.jetty jetty-proxy diff --git a/server/src/main/java/io/druid/server/initialization/jetty/JettyBindings.java b/server/src/main/java/io/druid/server/initialization/jetty/JettyBindings.java index 8b738f038fa..e05b664e14c 100644 --- a/server/src/main/java/io/druid/server/initialization/jetty/JettyBindings.java +++ b/server/src/main/java/io/druid/server/initialization/jetty/JettyBindings.java @@ -22,9 +22,8 @@ package io.druid.server.initialization.jetty; import com.google.common.collect.ImmutableMap; import com.google.inject.Binder; import com.google.inject.multibindings.Multibinder; - import io.druid.java.util.common.logger.Logger; - +import org.eclipse.jetty.server.Handler; import org.eclipse.jetty.servlets.QoSFilter; import javax.servlet.DispatcherType; @@ -52,6 +51,13 @@ public class JettyBindings .toInstance(new QosFilterHolder(path, maxRequests)); } + public static void addHandler(Binder binder, Class handlerClass) + { + Multibinder.newSetBinder(binder, Handler.class) + .addBinding() + .to(handlerClass); + } + private static class QosFilterHolder implements ServletFilterHolder { private final String path; diff --git a/server/src/main/java/io/druid/server/initialization/jetty/JettyServerModule.java b/server/src/main/java/io/druid/server/initialization/jetty/JettyServerModule.java index 69a08e7c152..7de440c07d5 100644 --- a/server/src/main/java/io/druid/server/initialization/jetty/JettyServerModule.java +++ b/server/src/main/java/io/druid/server/initialization/jetty/JettyServerModule.java @@ -59,6 +59,7 @@ import io.druid.server.metrics.MetricsModule; import io.druid.server.metrics.MonitorsConfig; import org.eclipse.jetty.server.ConnectionFactory; import org.eclipse.jetty.server.Connector; +import org.eclipse.jetty.server.Handler; import org.eclipse.jetty.server.Server; import org.eclipse.jetty.server.ServerConnector; import org.eclipse.jetty.util.thread.QueuedThreadPool; @@ -95,8 +96,9 @@ public class JettyServerModule extends JerseyServletModule Jerseys.addResource(binder, StatusResource.class); binder.bind(StatusResource.class).in(LazySingleton.class); - //Adding empty binding for ServletFilterHolders so that injector returns - //an empty set when no external modules provide ServletFilterHolder impls + // Adding empty binding for ServletFilterHolders and Handlers so that injector returns an empty set if none + // are provided by extensions. + Multibinder.newSetBinder(binder, Handler.class); Multibinder.newSetBinder(binder, ServletFilterHolder.class); MetricsModule.register(binder, JettyMonitor.class); diff --git a/services/pom.xml b/services/pom.xml index 5ab6fcb64e2..cb292b66820 100644 --- a/services/pom.xml +++ b/services/pom.xml @@ -51,6 +51,11 @@ druid-indexing-service ${project.parent.version} + + io.druid + druid-sql + ${project.parent.version} + io.airlift airline diff --git a/services/src/main/java/io/druid/cli/CliBroker.java b/services/src/main/java/io/druid/cli/CliBroker.java index 8b4e069e402..5c6df160c0f 100644 --- a/services/src/main/java/io/druid/cli/CliBroker.java +++ b/services/src/main/java/io/druid/cli/CliBroker.java @@ -23,7 +23,6 @@ import com.google.common.collect.ImmutableList; import com.google.inject.Binder; import com.google.inject.Module; import com.google.inject.name.Names; - import io.airlift.airline.Command; import io.druid.client.BrokerSegmentWatcherConfig; import io.druid.client.BrokerServerView; @@ -51,6 +50,7 @@ import io.druid.server.http.BrokerResource; import io.druid.server.initialization.jetty.JettyServerInitializer; import io.druid.server.metrics.MetricsModule; import io.druid.server.router.TieredBrokerConfig; +import io.druid.sql.guice.SqlModule; import org.eclipse.jetty.server.Server; import java.util.List; @@ -111,7 +111,8 @@ public class CliBroker extends ServerRunnable LifecycleModule.register(binder, Server.class); } }, - new LookupModule() + new LookupModule(), + new SqlModule() ); } } diff --git a/services/src/main/java/io/druid/cli/QueryJettyServerInitializer.java b/services/src/main/java/io/druid/cli/QueryJettyServerInitializer.java index 7ca03c10841..c4bbf32acf7 100644 --- a/services/src/main/java/io/druid/cli/QueryJettyServerInitializer.java +++ b/services/src/main/java/io/druid/cli/QueryJettyServerInitializer.java @@ -19,6 +19,8 @@ package io.druid.cli; +import com.google.common.collect.ImmutableList; +import com.google.inject.Inject; import com.google.inject.Injector; import com.google.inject.servlet.GuiceFilter; import io.druid.server.initialization.jetty.JettyServerInitUtils; @@ -30,10 +32,21 @@ import org.eclipse.jetty.servlet.DefaultServlet; import org.eclipse.jetty.servlet.ServletContextHandler; import org.eclipse.jetty.servlet.ServletHolder; +import java.util.List; +import java.util.Set; + /** -*/ + */ public class QueryJettyServerInitializer implements JettyServerInitializer { + private final List extensionHandlers; + + @Inject + public QueryJettyServerInitializer(Set extensionHandlers) + { + this.extensionHandlers = ImmutableList.copyOf(extensionHandlers); + } + @Override public void initialize(Server server, Injector injector) { @@ -45,7 +58,13 @@ public class QueryJettyServerInitializer implements JettyServerInitializer root.addFilter(GuiceFilter.class, "/*", null); final HandlerList handlerList = new HandlerList(); - handlerList.setHandlers(new Handler[]{JettyServerInitUtils.getJettyRequestLogHandler(), root}); + final Handler[] handlers = new Handler[extensionHandlers.size() + 2]; + handlers[0] = JettyServerInitUtils.getJettyRequestLogHandler(); + handlers[handlers.length - 1] = root; + for (int i = 0; i < extensionHandlers.size(); i++) { + handlers[i + 1] = extensionHandlers.get(i); + } + handlerList.setHandlers(handlers); server.setHandler(handlerList); } } diff --git a/sql/pom.xml b/sql/pom.xml new file mode 100644 index 00000000000..7027584da94 --- /dev/null +++ b/sql/pom.xml @@ -0,0 +1,99 @@ + + + + + 4.0.0 + + druid-sql + druid-sql + Druid SQL + + + io.druid + druid + 0.9.3-SNAPSHOT + + + + + io.druid + druid-server + ${project.parent.version} + + + org.apache.calcite + calcite-core + + + org.apache.calcite + calcite-linq4j + + + org.apache.calcite.avatica + avatica-core + + + org.apache.calcite.avatica + avatica-server + + + io.netty + netty-all + + + + + junit + junit + test + + + org.apache.calcite + calcite-core + test-jar + test + + + io.druid + druid-processing + ${project.parent.version} + test-jar + test + + + + + + + org.apache.maven.plugins + maven-jar-plugin + + + + test-jar + + + + + + + + diff --git a/sql/src/main/java/io/druid/sql/avatica/AvaticaMonitor.java b/sql/src/main/java/io/druid/sql/avatica/AvaticaMonitor.java new file mode 100644 index 00000000000..03b074cb8dd --- /dev/null +++ b/sql/src/main/java/io/druid/sql/avatica/AvaticaMonitor.java @@ -0,0 +1,183 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.avatica; + +import com.google.common.collect.Maps; +import com.metamx.emitter.service.ServiceEmitter; +import com.metamx.emitter.service.ServiceMetricEvent; +import com.metamx.metrics.AbstractMonitor; +import io.druid.java.util.common.logger.Logger; +import org.apache.calcite.avatica.metrics.Counter; +import org.apache.calcite.avatica.metrics.Gauge; +import org.apache.calcite.avatica.metrics.Histogram; +import org.apache.calcite.avatica.metrics.Meter; +import org.apache.calcite.avatica.metrics.MetricsSystem; +import org.apache.calcite.avatica.metrics.Timer; + +import java.util.Map; +import java.util.concurrent.ConcurrentMap; +import java.util.concurrent.atomic.AtomicBoolean; +import java.util.concurrent.atomic.AtomicLong; + +public class AvaticaMonitor extends AbstractMonitor implements MetricsSystem +{ + private static final Logger log = new Logger(AvaticaMonitor.class); + + private final ConcurrentMap counters = Maps.newConcurrentMap(); + private final ConcurrentMap> gauges = Maps.newConcurrentMap(); + + @Override + public boolean doMonitor(final ServiceEmitter emitter) + { + for (final Map.Entry entry : counters.entrySet()) { + final String name = entry.getKey(); + final long value = entry.getValue().getAndSet(0); + emitter.emit(ServiceMetricEvent.builder().build(fullMetricName(name), value)); + } + + for (Map.Entry> entry : gauges.entrySet()) { + final String name = entry.getKey(); + final Object value = entry.getValue().getValue(); + if (value instanceof Number) { + emitter.emit(ServiceMetricEvent.builder().build(fullMetricName(name), (Number) value)); + } else { + log.debug("Not emitting gauge[%s] since value[%s] type was[%s].", name, value, value.getClass().getName()); + } + } + + return true; + } + + @Override + public Timer getTimer(final String name) + { + final AtomicLong counter = makeCounter(name); + return new Timer() + { + @Override + public Context start() + { + final long start = System.currentTimeMillis(); + final AtomicBoolean closed = new AtomicBoolean(); + return new Context() + { + @Override + public void close() + { + if (closed.compareAndSet(false, true)) { + counter.addAndGet(System.currentTimeMillis() - start); + } + } + }; + } + }; + } + + @Override + public Histogram getHistogram(final String name) + { + // Return a dummy Histogram. We don't support Histogram metrics. + return new Histogram() + { + @Override + public void update(int i) + { + // Do nothing. + } + + @Override + public void update(long l) + { + // Do nothing. + } + }; + } + + @Override + public Meter getMeter(final String name) + { + final AtomicLong counter = makeCounter(name); + return new Meter() + { + @Override + public void mark() + { + counter.incrementAndGet(); + } + + @Override + public void mark(long events) + { + counter.addAndGet(events); + } + }; + } + + @Override + public Counter getCounter(final String name) + { + final AtomicLong counter = makeCounter(name); + return new Counter() + { + @Override + public void increment() + { + counter.incrementAndGet(); + } + + @Override + public void increment(long n) + { + counter.addAndGet(n); + } + + @Override + public void decrement() + { + counter.decrementAndGet(); + } + + @Override + public void decrement(long n) + { + counter.addAndGet(-n); + } + }; + } + + @Override + public void register(final String name, final Gauge gauge) + { + if (gauges.putIfAbsent(name, gauge) != null) { + log.warn("Ignoring gauge[%s], one with the same name was already registered.", name); + } + } + + private AtomicLong makeCounter(final String name) + { + counters.putIfAbsent(name, new AtomicLong()); + return counters.get(name); + } + + private String fullMetricName(final String name) + { + return name.replace("org.apache.calcite.avatica", "avatica").replace(".", "/"); + } +} diff --git a/sql/src/main/java/io/druid/sql/avatica/DruidAvaticaHandler.java b/sql/src/main/java/io/druid/sql/avatica/DruidAvaticaHandler.java new file mode 100644 index 00000000000..8ae03ba94f6 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/avatica/DruidAvaticaHandler.java @@ -0,0 +1,77 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.avatica; + +import com.google.inject.Inject; +import io.druid.guice.annotations.Self; +import io.druid.server.DruidNode; +import org.apache.calcite.avatica.Meta; +import org.apache.calcite.avatica.remote.LocalService; +import org.apache.calcite.avatica.remote.Service; +import org.apache.calcite.avatica.server.AvaticaJsonHandler; +import org.apache.calcite.jdbc.CalciteConnection; +import org.apache.calcite.jdbc.CalciteMetaImpl; +import org.eclipse.jetty.server.Request; + +import javax.servlet.ServletException; +import javax.servlet.http.HttpServletRequest; +import javax.servlet.http.HttpServletResponse; +import java.io.IOException; +import java.lang.reflect.InvocationTargetException; + +public class DruidAvaticaHandler extends AvaticaJsonHandler +{ + static final String AVATICA_PATH = "/druid/v2/sql/avatica/"; + + private final ServerConfig config; + + @Inject + public DruidAvaticaHandler( + final CalciteConnection connection, + @Self final DruidNode druidNode, + final AvaticaMonitor avaticaMonitor, + final ServerConfig config + ) throws InstantiationException, IllegalAccessException, InvocationTargetException + { + super( + new LocalService((Meta) CalciteMetaImpl.class.getConstructors()[0].newInstance(connection), avaticaMonitor), + avaticaMonitor + ); + + this.config = config; + setServerRpcMetadata(new Service.RpcMetadataResponse(druidNode.getHostAndPort())); + } + + @Override + public void handle( + final String target, + final Request baseRequest, + final HttpServletRequest request, + final HttpServletResponse response + ) throws IOException, ServletException + { + // This is not integrated with the experimental authorization framework. + // (Non-trivial since we don't know the dataSources up-front) + + if (config.isEnableAvatica() && request.getRequestURI().equals(AVATICA_PATH)) { + super.handle(target, baseRequest, request, response); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/avatica/ServerConfig.java b/sql/src/main/java/io/druid/sql/avatica/ServerConfig.java new file mode 100644 index 00000000000..fff36f59b6b --- /dev/null +++ b/sql/src/main/java/io/druid/sql/avatica/ServerConfig.java @@ -0,0 +1,41 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.avatica; + +import com.fasterxml.jackson.annotation.JsonProperty; + +public class ServerConfig +{ + @JsonProperty + private boolean enableAvatica = false; + + @JsonProperty + private boolean enableJsonOverHttp = true; + + public boolean isEnableAvatica() + { + return enableAvatica; + } + + public boolean isEnableJsonOverHttp() + { + return enableJsonOverHttp; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/DruidSchema.java b/sql/src/main/java/io/druid/sql/calcite/DruidSchema.java new file mode 100644 index 00000000000..2aa467366d1 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/DruidSchema.java @@ -0,0 +1,358 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite; + +import com.google.common.annotations.VisibleForTesting; +import com.google.common.base.Joiner; +import com.google.common.base.Preconditions; +import com.google.common.collect.ImmutableMap; +import com.google.common.collect.ImmutableMultimap; +import com.google.common.collect.Iterables; +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import com.google.common.collect.Multimap; +import com.google.common.collect.Sets; +import com.google.common.util.concurrent.MoreExecutors; +import com.google.inject.Inject; +import com.metamx.emitter.EmittingLogger; +import io.druid.client.DruidDataSource; +import io.druid.client.DruidServer; +import io.druid.client.ServerView; +import io.druid.client.TimelineServerView; +import io.druid.guice.ManageLifecycle; +import io.druid.java.util.common.concurrent.ScheduledExecutors; +import io.druid.java.util.common.guava.Sequence; +import io.druid.java.util.common.guava.Sequences; +import io.druid.java.util.common.lifecycle.LifecycleStart; +import io.druid.java.util.common.lifecycle.LifecycleStop; +import io.druid.query.QuerySegmentWalker; +import io.druid.query.TableDataSource; +import io.druid.query.metadata.metadata.ColumnAnalysis; +import io.druid.query.metadata.metadata.SegmentAnalysis; +import io.druid.query.metadata.metadata.SegmentMetadataQuery; +import io.druid.segment.column.ValueType; +import io.druid.server.coordination.DruidServerMetadata; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.table.DruidTable; +import io.druid.timeline.DataSegment; +import org.apache.calcite.linq4j.tree.Expression; +import org.apache.calcite.schema.Function; +import org.apache.calcite.schema.Schema; +import org.apache.calcite.schema.SchemaPlus; +import org.apache.calcite.schema.Table; +import org.apache.calcite.schema.impl.AbstractSchema; +import org.joda.time.DateTime; + +import java.util.EnumSet; +import java.util.List; +import java.util.Map; +import java.util.Set; +import java.util.concurrent.ConcurrentMap; +import java.util.concurrent.CountDownLatch; +import java.util.concurrent.ExecutorService; + +@ManageLifecycle +public class DruidSchema extends AbstractSchema +{ + private static final EmittingLogger log = new EmittingLogger(DruidSchema.class); + + private final QuerySegmentWalker walker; + private final TimelineServerView serverView; + private final PlannerConfig config; + private final ExecutorService cacheExec; + private final ConcurrentMap tables; + + // For awaitInitialization. + private final CountDownLatch initializationLatch = new CountDownLatch(1); + + // Protects access to dataSourcesNeedingRefresh, lastRefresh, isServerViewInitialized + private final Object lock = new Object(); + + // List of dataSources that need metadata refreshes. + private final Set dataSourcesNeedingRefresh = Sets.newHashSet(); + private boolean refreshImmediately = false; + private long lastRefresh = 0L; + private boolean isServerViewInitialized = false; + + @Inject + public DruidSchema( + final QuerySegmentWalker walker, + final TimelineServerView serverView, + final PlannerConfig config + ) + { + this.walker = Preconditions.checkNotNull(walker, "walker"); + this.serverView = Preconditions.checkNotNull(serverView, "serverView"); + this.config = Preconditions.checkNotNull(config, "config"); + this.cacheExec = ScheduledExecutors.fixed(1, "DruidSchema-Cache-%d"); + this.tables = Maps.newConcurrentMap(); + } + + @LifecycleStart + public void start() + { + cacheExec.submit( + new Runnable() + { + @Override + public void run() + { + try { + while (!Thread.currentThread().isInterrupted()) { + final Set dataSources = Sets.newHashSet(); + + try { + synchronized (lock) { + final long nextRefresh = new DateTime(lastRefresh).plus(config.getMetadataRefreshPeriod()) + .getMillis(); + + while (!( + isServerViewInitialized + && !dataSourcesNeedingRefresh.isEmpty() + && (refreshImmediately || nextRefresh < System.currentTimeMillis()) + )) { + lock.wait(Math.max(1, nextRefresh - System.currentTimeMillis())); + } + + dataSources.addAll(dataSourcesNeedingRefresh); + dataSourcesNeedingRefresh.clear(); + lastRefresh = System.currentTimeMillis(); + refreshImmediately = false; + } + + // Refresh dataSources. + for (final String dataSource : dataSources) { + log.debug("Refreshing metadata for dataSource[%s].", dataSource); + final long startTime = System.currentTimeMillis(); + final DruidTable druidTable = computeTable(dataSource); + if (druidTable == null) { + if (tables.remove(dataSource) != null) { + log.info("Removed dataSource[%s] from the list of active dataSources.", dataSource); + } + } else { + tables.put(dataSource, druidTable); + log.info( + "Refreshed metadata for dataSource[%s] in %,dms.", + dataSource, + System.currentTimeMillis() - startTime + ); + } + } + + initializationLatch.countDown(); + } + catch (InterruptedException e) { + // Fall through. + throw e; + } + catch (Exception e) { + log.warn( + e, + "Metadata refresh failed for dataSources[%s], trying again soon.", + Joiner.on(", ").join(dataSources) + ); + + synchronized (lock) { + // Add dataSources back to the refresh list. + dataSourcesNeedingRefresh.addAll(dataSources); + lock.notifyAll(); + } + } + } + } + catch (InterruptedException e) { + // Just exit. + } + catch (Throwable e) { + // Throwables that fall out to here (not caught by an inner try/catch) are potentially gnarly, like + // OOMEs. Anyway, let's just emit an alert and stop refreshing metadata. + log.makeAlert(e, "Metadata refresh failed permanently").emit(); + throw e; + } + finally { + log.info("Metadata refresh stopped."); + } + } + } + ); + + serverView.registerSegmentCallback( + MoreExecutors.sameThreadExecutor(), + new ServerView.SegmentCallback() + { + @Override + public ServerView.CallbackAction segmentViewInitialized() + { + synchronized (lock) { + isServerViewInitialized = true; + lock.notifyAll(); + } + + return ServerView.CallbackAction.CONTINUE; + } + + @Override + public ServerView.CallbackAction segmentAdded(DruidServerMetadata server, DataSegment segment) + { + synchronized (lock) { + dataSourcesNeedingRefresh.add(segment.getDataSource()); + if (!tables.containsKey(segment.getDataSource())) { + refreshImmediately = true; + } + + lock.notifyAll(); + } + + return ServerView.CallbackAction.CONTINUE; + } + + @Override + public ServerView.CallbackAction segmentRemoved(DruidServerMetadata server, DataSegment segment) + { + synchronized (lock) { + dataSourcesNeedingRefresh.add(segment.getDataSource()); + lock.notifyAll(); + } + + return ServerView.CallbackAction.CONTINUE; + } + } + ); + + serverView.registerServerCallback( + MoreExecutors.sameThreadExecutor(), + new ServerView.ServerCallback() + { + @Override + public ServerView.CallbackAction serverRemoved(DruidServer server) + { + final List dataSourceNames = Lists.newArrayList(); + for (DruidDataSource druidDataSource : server.getDataSources()) { + dataSourceNames.add(druidDataSource.getName()); + } + + synchronized (lock) { + dataSourcesNeedingRefresh.addAll(dataSourceNames); + lock.notifyAll(); + } + + return ServerView.CallbackAction.CONTINUE; + } + } + ); + } + + @LifecycleStop + public void stop() + { + cacheExec.shutdownNow(); + } + + @VisibleForTesting + public void awaitInitialization() throws InterruptedException + { + initializationLatch.await(); + } + + @Override + public boolean isMutable() + { + return true; + } + + @Override + public boolean contentsHaveChangedSince(final long lastCheck, final long now) + { + return false; + } + + @Override + public Expression getExpression(final SchemaPlus parentSchema, final String name) + { + return super.getExpression(parentSchema, name); + } + + @Override + protected Map getTableMap() + { + return ImmutableMap.copyOf(tables); + } + + @Override + protected Multimap getFunctionMultimap() + { + return ImmutableMultimap.of(); + } + + @Override + protected Map getSubSchemaMap() + { + return ImmutableMap.of(); + } + + private DruidTable computeTable(final String dataSource) + { + final SegmentMetadataQuery segmentMetadataQuery = new SegmentMetadataQuery( + new TableDataSource(dataSource), + null, + null, + true, + null, + EnumSet.noneOf(SegmentMetadataQuery.AnalysisType.class), + null, + true + ); + + final Sequence sequence = segmentMetadataQuery.run(walker, Maps.newHashMap()); + final List results = Sequences.toList(sequence, Lists.newArrayList()); + if (results.isEmpty()) { + return null; + } + + final Map columnMetadata = Iterables.getOnlyElement(results).getColumns(); + final Map columnValueTypes = Maps.newHashMap(); + + for (Map.Entry entry : columnMetadata.entrySet()) { + if (entry.getValue().isError()) { + // Ignore columns with metadata consistency errors. + continue; + } + + final ValueType valueType; + try { + valueType = ValueType.valueOf(entry.getValue().getType().toUpperCase()); + } + catch (IllegalArgumentException e) { + // Ignore unrecognized types. This includes complex types like hyperUnique, etc. + // So, that means currently they are not supported. + continue; + } + + columnValueTypes.put(entry.getKey(), valueType); + } + + return new DruidTable( + walker, + new TableDataSource(dataSource), + config, + columnValueTypes + ); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/aggregation/Aggregation.java b/sql/src/main/java/io/druid/sql/calcite/aggregation/Aggregation.java new file mode 100644 index 00000000000..64d4fb1ac27 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/aggregation/Aggregation.java @@ -0,0 +1,196 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.aggregation; + +import com.google.common.base.Preconditions; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Iterables; +import com.google.common.collect.Lists; +import com.google.common.collect.Sets; +import io.druid.java.util.common.IAE; +import io.druid.java.util.common.ISE; +import io.druid.query.aggregation.AggregatorFactory; +import io.druid.query.aggregation.FilteredAggregatorFactory; +import io.druid.query.aggregation.PostAggregator; +import io.druid.query.filter.DimFilter; + +import java.util.List; +import java.util.Set; + +public class Aggregation +{ + private final List aggregatorFactories; + private final PostAggregator postAggregator; + private final PostAggregatorFactory finalizingPostAggregatorFactory; + + private Aggregation( + final List aggregatorFactories, + final PostAggregator postAggregator, + final PostAggregatorFactory finalizingPostAggregatorFactory + ) + { + this.aggregatorFactories = Preconditions.checkNotNull(aggregatorFactories, "aggregatorFactories"); + this.postAggregator = postAggregator; + this.finalizingPostAggregatorFactory = finalizingPostAggregatorFactory; + + if (postAggregator == null) { + Preconditions.checkArgument(aggregatorFactories.size() == 1, "aggregatorFactories.size == 1"); + } else { + // Verify that there are no "useless" fields in the aggregatorFactories. + // Don't verify that the PostAggregator inputs are all present; they might not be. + final Set dependentFields = postAggregator.getDependentFields(); + for (AggregatorFactory aggregatorFactory : aggregatorFactories) { + if (!dependentFields.contains(aggregatorFactory.getName())) { + throw new IAE("Unused field[%s] in Aggregation", aggregatorFactory.getName()); + } + } + } + } + + public static Aggregation create(final AggregatorFactory aggregatorFactory) + { + return new Aggregation(ImmutableList.of(aggregatorFactory), null, null); + } + + public static Aggregation create(final PostAggregator postAggregator) + { + return new Aggregation(ImmutableList.of(), postAggregator, null); + } + + public static Aggregation create( + final List aggregatorFactories, + final PostAggregator postAggregator + ) + { + return new Aggregation(aggregatorFactories, postAggregator, null); + } + + public static Aggregation createFinalizable( + final List aggregatorFactories, + final PostAggregator postAggregator, + final PostAggregatorFactory finalizingPostAggregatorFactory + ) + { + return new Aggregation( + aggregatorFactories, + postAggregator, + Preconditions.checkNotNull(finalizingPostAggregatorFactory, "finalizingPostAggregatorFactory") + ); + } + + public List getAggregatorFactories() + { + return aggregatorFactories; + } + + public PostAggregator getPostAggregator() + { + return postAggregator; + } + + public PostAggregatorFactory getFinalizingPostAggregatorFactory() + { + return finalizingPostAggregatorFactory; + } + + public String getOutputName() + { + return postAggregator != null + ? postAggregator.getName() + : Iterables.getOnlyElement(aggregatorFactories).getName(); + } + + public Aggregation filter(final DimFilter filter) + { + if (filter == null) { + return this; + } + + if (postAggregator != null) { + // Verify that this Aggregation contains all inputs. If not, this "filter" call won't work right. + final Set dependentFields = postAggregator.getDependentFields(); + final Set aggregatorNames = Sets.newHashSet(); + for (AggregatorFactory aggregatorFactory : aggregatorFactories) { + aggregatorNames.add(aggregatorFactory.getName()); + } + for (String field : dependentFields) { + if (!aggregatorNames.contains(field)) { + throw new ISE("Cannot filter an Aggregation that does not contain its inputs: %s", this); + } + } + } + + final List newAggregators = Lists.newArrayList(); + + for (AggregatorFactory agg : aggregatorFactories) { + newAggregators.add(new FilteredAggregatorFactory(agg, filter)); + } + + return new Aggregation( + newAggregators, + postAggregator, + finalizingPostAggregatorFactory + ); + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + Aggregation that = (Aggregation) o; + + if (aggregatorFactories != null + ? !aggregatorFactories.equals(that.aggregatorFactories) + : that.aggregatorFactories != null) { + return false; + } + if (postAggregator != null ? !postAggregator.equals(that.postAggregator) : that.postAggregator != null) { + return false; + } + return finalizingPostAggregatorFactory != null + ? finalizingPostAggregatorFactory.equals(that.finalizingPostAggregatorFactory) + : that.finalizingPostAggregatorFactory == null; + } + + @Override + public int hashCode() + { + int result = aggregatorFactories != null ? aggregatorFactories.hashCode() : 0; + result = 31 * result + (postAggregator != null ? postAggregator.hashCode() : 0); + result = 31 * result + (finalizingPostAggregatorFactory != null ? finalizingPostAggregatorFactory.hashCode() : 0); + return result; + } + + @Override + public String toString() + { + return "Aggregation{" + + "aggregatorFactories=" + aggregatorFactories + + ", postAggregator=" + postAggregator + + ", finalizingPostAggregatorFactory=" + finalizingPostAggregatorFactory + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/aggregation/PostAggregatorFactory.java b/sql/src/main/java/io/druid/sql/calcite/aggregation/PostAggregatorFactory.java new file mode 100644 index 00000000000..4048ad7a9f3 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/aggregation/PostAggregatorFactory.java @@ -0,0 +1,57 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.aggregation; + +import io.druid.query.aggregation.PostAggregator; + +/** + * Can create PostAggregators with specific output names. + */ +public abstract class PostAggregatorFactory +{ + public abstract PostAggregator factorize(final String outputName); + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + PostAggregatorFactory that = (PostAggregatorFactory) o; + + return factorize(null).equals(that.factorize(null)); + } + + @Override + public int hashCode() + { + return factorize(null).hashCode(); + } + + @Override + public String toString() + { + return factorize(null).toString(); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/AbstractExpressionConversion.java b/sql/src/main/java/io/druid/sql/calcite/expression/AbstractExpressionConversion.java new file mode 100644 index 00000000000..3633dc0b88a --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/AbstractExpressionConversion.java @@ -0,0 +1,57 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import org.apache.calcite.sql.SqlKind; + +public abstract class AbstractExpressionConversion implements ExpressionConversion +{ + private final SqlKind kind; + private final String operatorName; + + public AbstractExpressionConversion(SqlKind kind) + { + this(kind, null); + } + + public AbstractExpressionConversion(SqlKind kind, String operatorName) + { + this.kind = kind; + this.operatorName = operatorName; + + if (kind == SqlKind.OTHER_FUNCTION && operatorName == null) { + throw new NullPointerException("operatorName must be non-null for kind OTHER_FUNCTION"); + } else if (kind != SqlKind.OTHER_FUNCTION && operatorName != null) { + throw new NullPointerException("operatorName must be non-null for kind " + kind); + } + } + + @Override + public SqlKind sqlKind() + { + return kind; + } + + @Override + public String operatorName() + { + return operatorName; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/CharLengthExpressionConversion.java b/sql/src/main/java/io/druid/sql/calcite/expression/CharLengthExpressionConversion.java new file mode 100644 index 00000000000..eb35f1c676d --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/CharLengthExpressionConversion.java @@ -0,0 +1,61 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import io.druid.query.extraction.StrlenExtractionFn; +import org.apache.calcite.rex.RexCall; +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlKind; + +import java.util.List; + +public class CharLengthExpressionConversion extends AbstractExpressionConversion +{ + private static final CharLengthExpressionConversion INSTANCE = new CharLengthExpressionConversion(); + + private CharLengthExpressionConversion() + { + super(SqlKind.OTHER_FUNCTION, "CHAR_LENGTH"); + } + + public static CharLengthExpressionConversion instance() + { + return INSTANCE; + } + + @Override + public RowExtraction convert( + final ExpressionConverter converter, + final List rowOrder, + final RexNode expression + ) + { + final RexCall call = (RexCall) expression; + final RowExtraction arg = converter.convert(rowOrder, call.getOperands().get(0)); + if (arg == null) { + return null; + } + + return RowExtraction.of( + arg.getColumn(), + ExtractionFns.compose(StrlenExtractionFn.instance(), arg.getExtractionFn()) + ); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/ExpressionConversion.java b/sql/src/main/java/io/druid/sql/calcite/expression/ExpressionConversion.java new file mode 100644 index 00000000000..4060224dc9d --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/ExpressionConversion.java @@ -0,0 +1,54 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlKind; + +import java.util.List; + +public interface ExpressionConversion +{ + /** + * SQL kind that this converter knows how to convert. + * + * @return sql kind + */ + SqlKind sqlKind(); + + /** + * Operator name, if {@link #sqlKind()} is {@code OTHER_FUNCTION}. + * + * @return operator name, or null + */ + String operatorName(); + + /** + * Translate a row-expression to a Druid column reference. Note that this signature will probably need to change + * once we support extractions from multiple columns. + * + * @param converter converter that can be used to convert sub-expressions + * @param rowOrder order of fields in the Druid rows to be extracted from + * @param expression expression meant to be applied on top of the table + * + * @return (columnName, extractionFn) or null + */ + RowExtraction convert(ExpressionConverter converter, List rowOrder, RexNode expression); +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/ExpressionConverter.java b/sql/src/main/java/io/druid/sql/calcite/expression/ExpressionConverter.java new file mode 100644 index 00000000000..9c27db640ae --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/ExpressionConverter.java @@ -0,0 +1,108 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import com.google.common.collect.Maps; +import io.druid.java.util.common.ISE; +import org.apache.calcite.rex.RexCall; +import org.apache.calcite.rex.RexInputRef; +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlKind; + +import java.util.List; +import java.util.Map; + +public class ExpressionConverter +{ + private final Map kindMap; + private final Map otherFunctionMap; + + private ExpressionConverter( + Map kindMap, + Map otherFunctionMap + ) + { + this.kindMap = kindMap; + this.otherFunctionMap = otherFunctionMap; + } + + public static ExpressionConverter create(final List conversions) + { + final Map kindMap = Maps.newHashMap(); + final Map otherFunctionMap = Maps.newHashMap(); + + for (final ExpressionConversion conversion : conversions) { + if (conversion.sqlKind() != SqlKind.OTHER_FUNCTION) { + if (kindMap.put(conversion.sqlKind(), conversion) != null) { + throw new ISE("Oops, can't have two conversions for sqlKind[%s]", conversion.sqlKind()); + } + } else { + // kind is OTHER_FUNCTION + if (otherFunctionMap.put(conversion.operatorName(), conversion) != null) { + throw new ISE( + "Oops, can't have two conversions for sqlKind[%s], operatorName[%s]", + conversion.sqlKind(), + conversion.operatorName() + ); + } + } + } + + return new ExpressionConverter(kindMap, otherFunctionMap); + } + + /** + * Translate a row-expression to a Druid row extraction. Note that this signature will probably need to change + * once we support extractions from multiple columns. + * + * @param rowOrder order of fields in the Druid rows to be extracted from + * @param expression expression meant to be applied on top of the table + * + * @return (columnName, extractionFn) or null + */ + public RowExtraction convert(List rowOrder, RexNode expression) + { + if (expression.getKind() == SqlKind.INPUT_REF) { + final RexInputRef ref = (RexInputRef) expression; + final String columnName = rowOrder.get(ref.getIndex()); + if (columnName == null) { + throw new ISE("WTF?! Expression referred to nonexistent index[%d]", ref.getIndex()); + } + + return RowExtraction.of(columnName, null); + } else if (expression.getKind() == SqlKind.CAST) { + // TODO(gianm): Probably not a good idea to ignore CAST like this. + return convert(rowOrder, ((RexCall) expression).getOperands().get(0)); + } else { + // Try conversion using an ExpressionConversion specific to this operator. + final RowExtraction retVal; + + if (expression.getKind() == SqlKind.OTHER_FUNCTION) { + final ExpressionConversion conversion = otherFunctionMap.get(((RexCall) expression).getOperator().getName()); + retVal = conversion != null ? conversion.convert(this, rowOrder, expression) : null; + } else { + final ExpressionConversion conversion = kindMap.get(expression.getKind()); + retVal = conversion != null ? conversion.convert(this, rowOrder, expression) : null; + } + + return retVal; + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/Expressions.java b/sql/src/main/java/io/druid/sql/calcite/expression/Expressions.java new file mode 100644 index 00000000000..d052378e212 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/Expressions.java @@ -0,0 +1,519 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import com.google.common.base.Joiner; +import com.google.common.base.Preconditions; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.ImmutableMap; +import com.google.common.collect.Iterables; +import com.google.common.collect.Lists; +import com.google.common.io.BaseEncoding; +import com.google.common.primitives.Chars; +import io.druid.granularity.QueryGranularity; +import io.druid.java.util.common.ISE; +import io.druid.math.expr.ExprType; +import io.druid.query.aggregation.PostAggregator; +import io.druid.query.aggregation.post.ArithmeticPostAggregator; +import io.druid.query.aggregation.post.ConstantPostAggregator; +import io.druid.query.aggregation.post.ExpressionPostAggregator; +import io.druid.query.aggregation.post.FieldAccessPostAggregator; +import io.druid.query.extraction.ExtractionFn; +import io.druid.query.filter.AndDimFilter; +import io.druid.query.filter.BoundDimFilter; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.LikeDimFilter; +import io.druid.query.filter.NotDimFilter; +import io.druid.query.filter.OrDimFilter; +import io.druid.query.ordering.StringComparator; +import io.druid.query.ordering.StringComparators; +import io.druid.segment.column.Column; +import io.druid.sql.calcite.aggregation.PostAggregatorFactory; +import io.druid.sql.calcite.filtration.Filtration; +import io.druid.sql.calcite.table.DruidTable; +import org.apache.calcite.jdbc.JavaTypeFactoryImpl; +import org.apache.calcite.rel.core.Project; +import org.apache.calcite.rex.RexCall; +import org.apache.calcite.rex.RexInputRef; +import org.apache.calcite.rex.RexLiteral; +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlKind; +import org.apache.calcite.sql.type.SqlTypeName; + +import java.util.Calendar; +import java.util.List; +import java.util.Map; + +/** + * A collection of functions for translating from Calcite expressions into Druid objects. + */ +public class Expressions +{ + private static final ExpressionConverter EXPRESSION_CONVERTER = ExpressionConverter.create( + ImmutableList.of( + CharLengthExpressionConversion.instance(), + ExtractExpressionConversion.instance(), + FloorExpressionConversion.instance(), + SubstringExpressionConversion.instance() + ) + ); + + private static final Map MATH_FUNCTIONS = ImmutableMap.builder() + .put("ABS", "abs") + .put("CEIL", "ceil") + .put("EXP", "exp") + .put("FLOOR", "floor") + .put("LN", "log") + .put("LOG10", "log10") + .put("POWER", "pow") + .put("SQRT", "sqrt") + .build(); + + private static final Map MATH_TYPES; + + static { + final ImmutableMap.Builder builder = ImmutableMap.builder(); + + for (SqlTypeName type : SqlTypeName.APPROX_TYPES) { + builder.put(type, ExprType.DOUBLE); + } + + for (SqlTypeName type : SqlTypeName.EXACT_TYPES) { + builder.put(type, ExprType.LONG); + } + + for (SqlTypeName type : SqlTypeName.STRING_TYPES) { + builder.put(type, ExprType.STRING); + } + + MATH_TYPES = builder.build(); + } + + private Expressions() + { + // No instantiation. + } + + /** + * Translate a field access, possibly through a projection, to an underlying Druid table. + * + * @param druidTable underlying Druid table + * @param project projection, or null + * @param fieldNumber number of the field to access + * + * @return row expression + */ + public static RexNode fromFieldAccess( + final DruidTable druidTable, + final Project project, + final int fieldNumber + ) + { + if (project == null) { + // I don't think the factory impl matters here. + return RexInputRef.of(fieldNumber, druidTable.getRowType(new JavaTypeFactoryImpl())); + } else { + return project.getChildExps().get(fieldNumber); + } + } + + /** + * Translate a Calcite row-expression to a Druid row extraction. Note that this signature will probably need to + * change once we support extractions from multiple columns. + * + * @param rowOrder order of fields in the Druid rows to be extracted from + * @param expression expression meant to be applied on top of the rows + * + * @return RowExtraction or null if not possible + */ + public static RowExtraction toRowExtraction( + final List rowOrder, + final RexNode expression + ) + { + return EXPRESSION_CONVERTER.convert(rowOrder, expression); + } + + /** + * Translate a Calcite row-expression to a Druid PostAggregator. One day, when possible, this could be folded + * into {@link #toRowExtraction(List, RexNode)}. + * + * @param name name of the PostAggregator + * @param rowOrder order of fields in the Druid rows to be extracted from + * @param finalizingPostAggregatorFactories post-aggregators that should be used for specific entries in rowOrder. + * May be empty, and individual values may be null. Missing or null values + * will lead to creation of {@link FieldAccessPostAggregator}. + * @param expression expression meant to be applied on top of the rows + * + * @return PostAggregator or null if not possible + */ + public static PostAggregator toPostAggregator( + final String name, + final List rowOrder, + final List finalizingPostAggregatorFactories, + final RexNode expression + ) + { + final PostAggregator retVal; + + if (expression.getKind() == SqlKind.INPUT_REF) { + final RexInputRef ref = (RexInputRef) expression; + final PostAggregatorFactory finalizingPostAggregatorFactory = finalizingPostAggregatorFactories.get(ref.getIndex()); + retVal = finalizingPostAggregatorFactory != null + ? finalizingPostAggregatorFactory.factorize(name) + : new FieldAccessPostAggregator(name, rowOrder.get(ref.getIndex())); + } else if (expression.getKind() == SqlKind.CAST) { + // Ignore CAST when translating to PostAggregators and hope for the best. They are really loosey-goosey with + // types internally and there isn't much we can do to respect + // TODO(gianm): Probably not a good idea to ignore CAST like this. + final RexNode operand = ((RexCall) expression).getOperands().get(0); + retVal = toPostAggregator(name, rowOrder, finalizingPostAggregatorFactories, operand); + } else if (expression.getKind() == SqlKind.LITERAL + && SqlTypeName.NUMERIC_TYPES.contains(expression.getType().getSqlTypeName())) { + retVal = new ConstantPostAggregator(name, (Number) RexLiteral.value(expression)); + } else if (expression.getKind() == SqlKind.TIMES + || expression.getKind() == SqlKind.DIVIDE + || expression.getKind() == SqlKind.PLUS + || expression.getKind() == SqlKind.MINUS) { + final String fnName = ImmutableMap.builder() + .put(SqlKind.TIMES, "*") + .put(SqlKind.DIVIDE, "quotient") + .put(SqlKind.PLUS, "+") + .put(SqlKind.MINUS, "-") + .build().get(expression.getKind()); + final List operands = Lists.newArrayList(); + for (RexNode operand : ((RexCall) expression).getOperands()) { + final PostAggregator translatedOperand = toPostAggregator( + null, + rowOrder, + finalizingPostAggregatorFactories, + operand + ); + if (translatedOperand == null) { + return null; + } + operands.add(translatedOperand); + } + retVal = new ArithmeticPostAggregator(name, fnName, operands); + } else { + // Try converting to a math expression. + final String mathExpression = Expressions.toMathExpression(rowOrder, expression); + if (mathExpression == null) { + retVal = null; + } else { + retVal = new ExpressionPostAggregator(name, mathExpression); + } + } + + if (retVal != null && name != null && !name.equals(retVal.getName())) { + throw new ISE("WTF?! Was about to return a PostAggregator with bad name, [%s] != [%s]", name, retVal.getName()); + } + + return retVal; + } + + /** + * Translate a row-expression to a Druid math expression. One day, when possible, this could be folded into + * {@link #toRowExtraction(List, RexNode)}. + * + * @param rowOrder order of fields in the Druid rows to be extracted from + * @param expression expression meant to be applied on top of the rows + * + * @return expression referring to fields in rowOrder, or null if not possible + */ + public static String toMathExpression( + final List rowOrder, + final RexNode expression + ) + { + final SqlKind kind = expression.getKind(); + final SqlTypeName sqlTypeName = expression.getType().getSqlTypeName(); + + if (kind == SqlKind.INPUT_REF) { + // Translate field references. + final RexInputRef ref = (RexInputRef) expression; + final String columnName = rowOrder.get(ref.getIndex()); + if (columnName == null) { + throw new ISE("WTF?! Expression referred to nonexistent index[%d]", ref.getIndex()); + } + + return String.format("\"%s\"", escape(columnName)); + } else if (kind == SqlKind.CAST || kind == SqlKind.REINTERPRET) { + // Translate casts. + final RexNode operand = ((RexCall) expression).getOperands().get(0); + final String operandExpression = toMathExpression(rowOrder, operand); + if (operandExpression == null) { + return null; + } + + final ExprType fromType = MATH_TYPES.get(operand.getType().getSqlTypeName()); + final ExprType toType = MATH_TYPES.get(sqlTypeName); + if (fromType != toType) { + return String.format("CAST(%s, '%s')", operandExpression, toType.toString()); + } else { + return operandExpression; + } + } else if (kind == SqlKind.TIMES || kind == SqlKind.DIVIDE || kind == SqlKind.PLUS || kind == SqlKind.MINUS) { + // Translate simple arithmetic. + final List operands = ((RexCall) expression).getOperands(); + final String lhsExpression = toMathExpression(rowOrder, operands.get(0)); + final String rhsExpression = toMathExpression(rowOrder, operands.get(1)); + if (lhsExpression == null || rhsExpression == null) { + return null; + } + + final String op = ImmutableMap.of( + SqlKind.TIMES, "*", + SqlKind.DIVIDE, "/", + SqlKind.PLUS, "+", + SqlKind.MINUS, "-" + ).get(kind); + + return String.format("(%s %s %s)", lhsExpression, op, rhsExpression); + } else if (kind == SqlKind.OTHER_FUNCTION) { + final String calciteFunction = ((RexCall) expression).getOperator().getName(); + final String druidFunction = MATH_FUNCTIONS.get(calciteFunction); + final List functionArgs = Lists.newArrayList(); + + for (final RexNode operand : ((RexCall) expression).getOperands()) { + final String operandExpression = toMathExpression(rowOrder, operand); + if (operandExpression == null) { + return null; + } + functionArgs.add(operandExpression); + } + + if ("MOD".equals(calciteFunction)) { + // Special handling for MOD, which is a function in Calcite but a binary operator in Druid. + Preconditions.checkState(functionArgs.size() == 2, "WTF?! Expected 2 args for MOD."); + return String.format("(%s %s %s)", functionArgs.get(0), "%", functionArgs.get(1)); + } + + if (druidFunction == null) { + return null; + } + + return String.format("%s(%s)", druidFunction, Joiner.on(", ").join(functionArgs)); + } else if (kind == SqlKind.LITERAL) { + // Translate literal. + if (SqlTypeName.NUMERIC_TYPES.contains(sqlTypeName)) { + // Include literal numbers as-is. + return String.valueOf(RexLiteral.value(expression)); + } else if (SqlTypeName.STRING_TYPES.contains(sqlTypeName)) { + // Quote literal strings. + return "\'" + escape(RexLiteral.stringValue(expression)) + "\'"; + } else { + // Can't translate other literals. + return null; + } + } else { + // Can't translate other kinds of expressions. + return null; + } + } + + /** + * Translates "condition" to a Druid filter, or returns null if we cannot translate the condition. + * + * @param druidTable Druid table, if the rows come from a table scan; null otherwise + * @param rowOrder order of columns in the rows to be filtered + * @param expression Calcite row expression + */ + public static DimFilter toFilter( + final DruidTable druidTable, + final List rowOrder, + final RexNode expression + ) + { + if (expression.getKind() == SqlKind.AND + || expression.getKind() == SqlKind.OR + || expression.getKind() == SqlKind.NOT) { + final List filters = Lists.newArrayList(); + for (final RexNode rexNode : ((RexCall) expression).getOperands()) { + final DimFilter nextFilter = toFilter(druidTable, rowOrder, rexNode); + if (nextFilter == null) { + return null; + } + filters.add(nextFilter); + } + + if (expression.getKind() == SqlKind.AND) { + return new AndDimFilter(filters); + } else if (expression.getKind() == SqlKind.OR) { + return new OrDimFilter(filters); + } else { + assert expression.getKind() == SqlKind.NOT; + return new NotDimFilter(Iterables.getOnlyElement(filters)); + } + } else { + // Handle filter conditions on everything else. + return toLeafFilter(druidTable, rowOrder, expression); + } + } + + /** + * Translates "condition" to a Druid filter, assuming it does not contain any boolean expressions. Returns null + * if we cannot translate the condition. + * + * @param druidTable Druid table, if the rows come from a table scan; null otherwise + * @param rowOrder order of columns in the rows to be filtered + * @param expression Calcite row expression + */ + private static DimFilter toLeafFilter( + final DruidTable druidTable, + final List rowOrder, + final RexNode expression + ) + { + if (expression.isAlwaysTrue()) { + return Filtration.matchEverything(); + } else if (expression.isAlwaysFalse()) { + return Filtration.matchNothing(); + } + + final SqlKind kind = expression.getKind(); + + if (kind == SqlKind.LIKE) { + final List operands = ((RexCall) expression).getOperands(); + final RowExtraction rex = EXPRESSION_CONVERTER.convert(rowOrder, operands.get(0)); + if (rex == null || !rex.isFilterable(druidTable)) { + return null; + } + return new LikeDimFilter( + rex.getColumn(), + RexLiteral.stringValue(operands.get(1)), + operands.size() > 2 ? RexLiteral.stringValue(operands.get(2)) : null, + rex.getExtractionFn() + ); + } else if (kind == SqlKind.EQUALS + || kind == SqlKind.NOT_EQUALS + || kind == SqlKind.GREATER_THAN + || kind == SqlKind.GREATER_THAN_OR_EQUAL + || kind == SqlKind.LESS_THAN + || kind == SqlKind.LESS_THAN_OR_EQUAL) { + final List operands = ((RexCall) expression).getOperands(); + Preconditions.checkState(operands.size() == 2, "WTF?! Expected 2 operands, got[%,d]", operands.size()); + boolean flip = false; + RexNode lhs = operands.get(0); + RexNode rhs = operands.get(1); + + if (lhs.getKind() == SqlKind.LITERAL && rhs.getKind() != SqlKind.LITERAL) { + // swap lhs, rhs + RexNode x = lhs; + lhs = rhs; + rhs = x; + flip = true; + } + + // rhs must be a literal + if (rhs.getKind() != SqlKind.LITERAL) { + return null; + } + + // lhs must be translatable to a RowExtraction to be filterable + final RowExtraction rex = EXPRESSION_CONVERTER.convert(rowOrder, lhs); + if (rex == null || !rex.isFilterable(druidTable)) { + return null; + } + + final String column = rex.getColumn(); + final ExtractionFn extractionFn = rex.getExtractionFn(); + + if (column.equals(Column.TIME_COLUMN_NAME) && ExtractionFns.toQueryGranularity(extractionFn) != null) { + // lhs is FLOOR(__time TO gran); convert to range + final QueryGranularity gran = ExtractionFns.toQueryGranularity(extractionFn); + final long rhsMillis = ((Calendar) RexLiteral.value(rhs)).getTimeInMillis(); + if (gran.truncate(rhsMillis) != rhsMillis) { + // Nothing matches. + return Filtration.matchNothing(); + } else { + // Match any __time within the granular bucket. + return new BoundDimFilter( + Column.TIME_COLUMN_NAME, + String.valueOf(gran.truncate(rhsMillis)), + String.valueOf(gran.next(gran.truncate(rhsMillis))), + false, + true, + null, + null, + StringComparators.NUMERIC + ); + } + } + + final String val; + final RexLiteral rhsLiteral = (RexLiteral) rhs; + if (SqlTypeName.NUMERIC_TYPES.contains(rhsLiteral.getTypeName())) { + val = String.valueOf(RexLiteral.value(rhsLiteral)); + } else if (rhsLiteral.getTypeName() == SqlTypeName.CHAR) { + val = String.valueOf(RexLiteral.stringValue(rhsLiteral)); + } else if (SqlTypeName.DATETIME_TYPES.contains(rhsLiteral.getTypeName())) { + val = String.valueOf(((Calendar) RexLiteral.value(rhsLiteral)).getTimeInMillis()); + } else { + // Hope for the best. + val = String.valueOf(RexLiteral.value(rhsLiteral)); + } + + // Numeric lhs needs a numeric comparison. + final boolean lhsIsNumeric = SqlTypeName.NUMERIC_TYPES.contains(lhs.getType().getSqlTypeName()) + || SqlTypeName.DATETIME_TYPES.contains(lhs.getType().getSqlTypeName()); + final StringComparator comparator = lhsIsNumeric ? StringComparators.NUMERIC : StringComparators.LEXICOGRAPHIC; + + final DimFilter filter; + + // Always use BoundDimFilters, to simplify filter optimization later (it helps to remember the comparator). + if (kind == SqlKind.EQUALS) { + filter = new BoundDimFilter(column, val, val, false, false, null, extractionFn, comparator); + } else if (kind == SqlKind.NOT_EQUALS) { + filter = new NotDimFilter( + new BoundDimFilter(column, val, val, false, false, null, extractionFn, comparator) + ); + } else if ((!flip && kind == SqlKind.GREATER_THAN) || (flip && kind == SqlKind.LESS_THAN)) { + filter = new BoundDimFilter(column, val, null, true, false, null, extractionFn, comparator); + } else if ((!flip && kind == SqlKind.GREATER_THAN_OR_EQUAL) || (flip && kind == SqlKind.LESS_THAN_OR_EQUAL)) { + filter = new BoundDimFilter(column, val, null, false, false, null, extractionFn, comparator); + } else if ((!flip && kind == SqlKind.LESS_THAN) || (flip && kind == SqlKind.GREATER_THAN)) { + filter = new BoundDimFilter(column, null, val, false, true, null, extractionFn, comparator); + } else if ((!flip && kind == SqlKind.LESS_THAN_OR_EQUAL) || (flip && kind == SqlKind.GREATER_THAN_OR_EQUAL)) { + filter = new BoundDimFilter(column, null, val, false, false, null, extractionFn, comparator); + } else { + throw new IllegalStateException("WTF?! Shouldn't have got here..."); + } + + return filter; + } else { + return null; + } + } + + private static String escape(final String s) + { + final StringBuilder escaped = new StringBuilder(); + for (int i = 0; i < s.length(); i++) { + final char c = s.charAt(i); + if (Character.isLetterOrDigit(c) || Character.isWhitespace(c)) { + escaped.append(c); + } else { + escaped.append("\\u").append(BaseEncoding.base16().encode(Chars.toByteArray(c))); + } + } + return escaped.toString(); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/ExtractExpressionConversion.java b/sql/src/main/java/io/druid/sql/calcite/expression/ExtractExpressionConversion.java new file mode 100644 index 00000000000..1f2017800fc --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/ExtractExpressionConversion.java @@ -0,0 +1,87 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import io.druid.query.extraction.ExtractionFn; +import io.druid.query.extraction.TimeFormatExtractionFn; +import org.apache.calcite.avatica.util.TimeUnitRange; +import org.apache.calcite.rex.RexCall; +import org.apache.calcite.rex.RexLiteral; +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlKind; + +import java.util.List; + +public class ExtractExpressionConversion extends AbstractExpressionConversion +{ + private static final ExtractExpressionConversion INSTANCE = new ExtractExpressionConversion(); + + private ExtractExpressionConversion() + { + super(SqlKind.EXTRACT); + } + + public static ExtractExpressionConversion instance() + { + return INSTANCE; + } + + @Override + public RowExtraction convert( + final ExpressionConverter converter, + final List rowOrder, + final RexNode expression + ) + { + // EXTRACT(timeUnit FROM expr) + final RexCall call = (RexCall) expression; + final RexLiteral flag = (RexLiteral) call.getOperands().get(0); + final TimeUnitRange timeUnit = (TimeUnitRange) flag.getValue(); + final RexNode expr = call.getOperands().get(1); + + final RowExtraction rex = converter.convert(rowOrder, expr); + if (rex == null) { + return null; + } + + final String dateTimeFormat = TimeUnits.toDateTimeFormat(timeUnit); + if (dateTimeFormat == null) { + return null; + } + + final ExtractionFn baseExtractionFn; + + if (call.getOperator().getName().equals("EXTRACT_DATE")) { + // Expr will be in number of days since the epoch. Can't translate. + return null; + } else { + // Expr will be in millis since the epoch + baseExtractionFn = rex.getExtractionFn(); + } + + return RowExtraction.of( + rex.getColumn(), + ExtractionFns.compose( + new TimeFormatExtractionFn(dateTimeFormat, null, null, null, true), + baseExtractionFn + ) + ); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/ExtractionFns.java b/sql/src/main/java/io/druid/sql/calcite/expression/ExtractionFns.java new file mode 100644 index 00000000000..ab46ad5340f --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/ExtractionFns.java @@ -0,0 +1,87 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import com.google.common.collect.Lists; +import io.druid.granularity.QueryGranularity; +import io.druid.query.extraction.CascadeExtractionFn; +import io.druid.query.extraction.ExtractionFn; +import io.druid.query.extraction.TimeFormatExtractionFn; + +import java.util.Arrays; +import java.util.List; + +public class ExtractionFns +{ + /** + * Converts extractionFn to a QueryGranularity, if possible. + * + * @param extractionFn function + * + * @return + */ + public static QueryGranularity toQueryGranularity(final ExtractionFn extractionFn) + { + if (extractionFn instanceof TimeFormatExtractionFn) { + final TimeFormatExtractionFn fn = (TimeFormatExtractionFn) extractionFn; + if (fn.getFormat() == null && fn.getTimeZone() == null && fn.getLocale() == null) { + return fn.getGranularity(); + } + } + + return null; + } + + /** + * Compose f and g, returning an ExtractionFn that computes f(g(x)). Null f or g are treated like identity functions. + * + * @param f function + * @param g function + * + * @return composed function, or null if both f and g were null + */ + public static ExtractionFn compose(final ExtractionFn f, final ExtractionFn g) + { + if (f == null) { + // Treat null like identity. + return g; + } else if (g == null) { + return f; + } else { + final List extractionFns = Lists.newArrayList(); + + // Apply g, then f, unwrapping if they are already cascades. + + if (g instanceof CascadeExtractionFn) { + extractionFns.addAll(Arrays.asList(((CascadeExtractionFn) g).getExtractionFns())); + } else { + extractionFns.add(g); + } + + if (f instanceof CascadeExtractionFn) { + extractionFns.addAll(Arrays.asList(((CascadeExtractionFn) f).getExtractionFns())); + } else { + extractionFns.add(f); + } + + return new CascadeExtractionFn(extractionFns.toArray(new ExtractionFn[extractionFns.size()])); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/FloorExpressionConversion.java b/sql/src/main/java/io/druid/sql/calcite/expression/FloorExpressionConversion.java new file mode 100644 index 00000000000..2b1df5a88ae --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/FloorExpressionConversion.java @@ -0,0 +1,89 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import io.druid.granularity.QueryGranularity; +import io.druid.query.extraction.BucketExtractionFn; +import io.druid.query.extraction.TimeFormatExtractionFn; +import org.apache.calcite.avatica.util.TimeUnitRange; +import org.apache.calcite.rex.RexCall; +import org.apache.calcite.rex.RexLiteral; +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlKind; + +import java.util.List; + +public class FloorExpressionConversion extends AbstractExpressionConversion +{ + private static final FloorExpressionConversion INSTANCE = new FloorExpressionConversion(); + + private FloorExpressionConversion() + { + super(SqlKind.FLOOR); + } + + public static FloorExpressionConversion instance() + { + return INSTANCE; + } + + @Override + public RowExtraction convert( + final ExpressionConverter converter, + final List rowOrder, + final RexNode expression + ) + { + final RexCall call = (RexCall) expression; + final RexNode arg = call.getOperands().get(0); + + final RowExtraction rex = converter.convert(rowOrder, arg); + if (rex == null) { + return null; + } else if (call.getOperands().size() == 1) { + // FLOOR(expr) + return RowExtraction.of( + rex.getColumn(), + ExtractionFns.compose(new BucketExtractionFn(1.0, 0.0), rex.getExtractionFn()) + ); + } else if (call.getOperands().size() == 2) { + // FLOOR(expr TO timeUnit) + final RexLiteral flag = (RexLiteral) call.getOperands().get(1); + final TimeUnitRange timeUnit = (TimeUnitRange) flag.getValue(); + + final QueryGranularity queryGranularity = TimeUnits.toQueryGranularity(timeUnit); + if (queryGranularity != null) { + return RowExtraction.of( + rex.getColumn(), + ExtractionFns.compose( + new TimeFormatExtractionFn(null, null, null, queryGranularity, true), + rex.getExtractionFn() + ) + ); + } else { + // We don't have a queryGranularity for this timeUnit. + return null; + } + } else { + // WTF? FLOOR with 3 arguments? + return null; + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/RowExtraction.java b/sql/src/main/java/io/druid/sql/calcite/expression/RowExtraction.java new file mode 100644 index 00000000000..0f943fecbe5 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/RowExtraction.java @@ -0,0 +1,185 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import com.google.common.base.Preconditions; +import io.druid.query.dimension.DefaultDimensionSpec; +import io.druid.query.dimension.DimensionSpec; +import io.druid.query.dimension.ExtractionDimensionSpec; +import io.druid.query.extraction.ExtractionFn; +import io.druid.segment.column.Column; +import io.druid.segment.column.ValueType; +import io.druid.segment.filter.Filters; +import io.druid.sql.calcite.rel.DruidQueryBuilder; +import io.druid.sql.calcite.table.DruidTable; + +/** + * Represents an extraction of a value from a Druid row. Can be used for grouping, filtering, etc. + * + * Currently this is a column plus an extractionFn, but it's expected that as time goes on, this will become more + * general and allow for variously-typed extractions from multiple columns. + */ +public class RowExtraction +{ + private final String column; + private final ExtractionFn extractionFn; + + public RowExtraction(String column, ExtractionFn extractionFn) + { + this.column = Preconditions.checkNotNull(column, "column"); + this.extractionFn = extractionFn; + } + + public static RowExtraction of(String column, ExtractionFn extractionFn) + { + return new RowExtraction(column, extractionFn); + } + + public static RowExtraction fromDimensionSpec(final DimensionSpec dimensionSpec) + { + if (dimensionSpec instanceof ExtractionDimensionSpec) { + return RowExtraction.of( + dimensionSpec.getDimension(), + ((ExtractionDimensionSpec) dimensionSpec).getExtractionFn() + ); + } else if (dimensionSpec instanceof DefaultDimensionSpec) { + return RowExtraction.of(dimensionSpec.getDimension(), null); + } else { + return null; + } + } + + public static RowExtraction fromQueryBuilder( + final DruidQueryBuilder queryBuilder, + final int fieldNumber + ) + { + final String fieldName = queryBuilder.getRowOrder().get(fieldNumber); + + if (queryBuilder.getGrouping() != null) { + for (DimensionSpec dimensionSpec : queryBuilder.getGrouping().getDimensions()) { + if (dimensionSpec.getOutputName().equals(fieldName)) { + return RowExtraction.fromDimensionSpec(dimensionSpec); + } + } + + return null; + } else if (queryBuilder.getSelectProjection() != null) { + for (DimensionSpec dimensionSpec : queryBuilder.getSelectProjection().getDimensions()) { + if (dimensionSpec.getOutputName().equals(fieldName)) { + return RowExtraction.fromDimensionSpec(dimensionSpec); + } + } + + for (String metricName : queryBuilder.getSelectProjection().getMetrics()) { + if (metricName.equals(fieldName)) { + return RowExtraction.of(metricName, null); + } + } + + return null; + } else { + // No select projection or grouping. + return RowExtraction.of(queryBuilder.getRowOrder().get(fieldNumber), null); + } + } + + public String getColumn() + { + return column; + } + + public ExtractionFn getExtractionFn() + { + return extractionFn; + } + + /** + * Check if this extraction can be used to build a filter on a Druid table. This method exists because we can't + * filter on floats (yet) and things like DruidFilterRule need to check for that. + * + * If a null table is passed in, this method always returns true. + * + * @param druidTable Druid table, or null + * + * @return whether or not this extraction is filterable; will be true if druidTable is null + */ + public boolean isFilterable(final DruidTable druidTable) + { + return druidTable == null || + Filters.FILTERABLE_TYPES.contains(druidTable.getColumnType(druidTable.getColumnNumber(column))); + } + + public DimensionSpec toDimensionSpec(final DruidTable druidTable, final String outputName) + { + final int columnNumber = druidTable.getColumnNumber(column); + if (columnNumber < 0) { + return null; + } + + final ValueType columnType = druidTable.getColumnType(columnNumber); + + if (columnType == ValueType.STRING || (column.equals(Column.TIME_COLUMN_NAME) && extractionFn != null)) { + return extractionFn == null + ? new DefaultDimensionSpec(column, outputName) + : new ExtractionDimensionSpec(column, outputName, extractionFn); + } else { + // Can't create dimensionSpecs for non-string, non-time. + return null; + } + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + RowExtraction that = (RowExtraction) o; + + if (column != null ? !column.equals(that.column) : that.column != null) { + return false; + } + return extractionFn != null ? extractionFn.equals(that.extractionFn) : that.extractionFn == null; + + } + + @Override + public int hashCode() + { + int result = column != null ? column.hashCode() : 0; + result = 31 * result + (extractionFn != null ? extractionFn.hashCode() : 0); + return result; + } + + @Override + public String toString() + { + if (extractionFn != null) { + return String.format("%s(%s)", extractionFn, column); + } else { + return column; + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/SubstringExpressionConversion.java b/sql/src/main/java/io/druid/sql/calcite/expression/SubstringExpressionConversion.java new file mode 100644 index 00000000000..946a56b8469 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/SubstringExpressionConversion.java @@ -0,0 +1,71 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import io.druid.query.extraction.SubstringDimExtractionFn; +import org.apache.calcite.rex.RexCall; +import org.apache.calcite.rex.RexLiteral; +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlKind; + +import java.util.List; + +public class SubstringExpressionConversion extends AbstractExpressionConversion +{ + private static final SubstringExpressionConversion INSTANCE = new SubstringExpressionConversion(); + + private SubstringExpressionConversion() + { + super(SqlKind.OTHER_FUNCTION, "SUBSTRING"); + } + + public static SubstringExpressionConversion instance() + { + return INSTANCE; + } + + @Override + public RowExtraction convert( + final ExpressionConverter converter, + final List rowOrder, + final RexNode expression + ) + { + final RexCall call = (RexCall) expression; + final RowExtraction arg = converter.convert(rowOrder, call.getOperands().get(0)); + if (arg == null) { + return null; + } + final int index = RexLiteral.intValue(call.getOperands().get(1)) - 1; + final Integer length; + if (call.getOperands().size() > 2) { + length = RexLiteral.intValue(call.getOperands().get(2)); + } else { + length = null; + } + + return RowExtraction.of(arg.getColumn(), + ExtractionFns.compose( + new SubstringDimExtractionFn(index, length), + arg.getExtractionFn() + ) + ); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/expression/TimeUnits.java b/sql/src/main/java/io/druid/sql/calcite/expression/TimeUnits.java new file mode 100644 index 00000000000..f1d1fa1c3db --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/expression/TimeUnits.java @@ -0,0 +1,76 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.expression; + +import com.google.common.collect.ImmutableMap; +import io.druid.granularity.QueryGranularities; +import io.druid.granularity.QueryGranularity; +import org.apache.calcite.avatica.util.TimeUnitRange; + +import java.util.Map; + +public class TimeUnits +{ + private static final Map QUERY_GRANULARITY_MAP = ImmutableMap.builder() + .put(TimeUnitRange.SECOND, QueryGranularities.SECOND) + .put(TimeUnitRange.MINUTE, QueryGranularities.MINUTE) + .put(TimeUnitRange.HOUR, QueryGranularities.HOUR) + .put(TimeUnitRange.DAY, QueryGranularities.DAY) + .put(TimeUnitRange.WEEK, QueryGranularities.WEEK) + .put(TimeUnitRange.MONTH, QueryGranularities.MONTH) + .put(TimeUnitRange.QUARTER, QueryGranularities.QUARTER) + .put(TimeUnitRange.YEAR, QueryGranularities.YEAR) + .build(); + + // Note that QUARTER is not supported here. + private static final Map EXTRACT_FORMAT_MAP = ImmutableMap.builder() + .put(TimeUnitRange.SECOND, "s") + .put(TimeUnitRange.MINUTE, "m") + .put(TimeUnitRange.HOUR, "H") + .put(TimeUnitRange.DAY, "d") + .put(TimeUnitRange.WEEK, "w") + .put(TimeUnitRange.MONTH, "M") + .put(TimeUnitRange.YEAR, "Y") + .build(); + + /** + * Returns the Druid QueryGranularity corresponding to a Calcite TimeUnitRange, or null if there is none. + * + * @param timeUnitRange timeUnit + * + * @return queryGranularity, or null + */ + public static QueryGranularity toQueryGranularity(final TimeUnitRange timeUnitRange) + { + return QUERY_GRANULARITY_MAP.get(timeUnitRange); + } + + /** + * Returns the Joda format string corresponding to extracting on a Calcite TimeUnitRange, or null if there is none. + * + * @param timeUnitRange timeUnit + * + * @return queryGranularity, or null + */ + public static String toDateTimeFormat(final TimeUnitRange timeUnitRange) + { + return EXTRACT_FORMAT_MAP.get(timeUnitRange); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/BottomUpTransform.java b/sql/src/main/java/io/druid/sql/calcite/filtration/BottomUpTransform.java new file mode 100644 index 00000000000..8ef80c8fe52 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/BottomUpTransform.java @@ -0,0 +1,95 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.base.Function; +import com.google.common.base.Preconditions; +import com.google.common.collect.Lists; +import io.druid.query.filter.AndDimFilter; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.NotDimFilter; +import io.druid.query.filter.OrDimFilter; + +import java.util.List; + +public abstract class BottomUpTransform implements Function +{ + protected abstract DimFilter process(final DimFilter filter); + + private DimFilter checkedProcess(final DimFilter filter) + { + final DimFilter retVal = process(Preconditions.checkNotNull(filter, "filter")); + return Preconditions.checkNotNull(retVal, "process(filter) result in %s", getClass().getSimpleName()); + } + + @Override + public Filtration apply(final Filtration filtration) + { + if (filtration.getDimFilter() != null) { + final Filtration retVal = Filtration.create(apply0(filtration.getDimFilter()), filtration.getIntervals()); + return filtration.equals(retVal) ? retVal : apply(retVal); + } else { + return filtration; + } + } + + private DimFilter apply0(final DimFilter filter) + { + if (filter instanceof AndDimFilter) { + final List oldFilters = ((AndDimFilter) filter).getFields(); + final List newFilters = Lists.newArrayList(); + for (DimFilter oldFilter : oldFilters) { + final DimFilter newFilter = apply0(oldFilter); + if (newFilter != null) { + newFilters.add(newFilter); + } + } + if (!newFilters.equals(oldFilters)) { + return checkedProcess(new AndDimFilter(newFilters)); + } else { + return checkedProcess(filter); + } + } else if (filter instanceof OrDimFilter) { + final List oldFilters = ((OrDimFilter) filter).getFields(); + final List newFilters = Lists.newArrayList(); + for (DimFilter oldFilter : oldFilters) { + final DimFilter newFilter = apply0(oldFilter); + if (newFilter != null) { + newFilters.add(newFilter); + } + } + if (!newFilters.equals(oldFilters)) { + return checkedProcess(new OrDimFilter(newFilters)); + } else { + return checkedProcess(filter); + } + } else if (filter instanceof NotDimFilter) { + final DimFilter oldFilter = ((NotDimFilter) filter).getField(); + final DimFilter newFilter = apply0(oldFilter); + if (!oldFilter.equals(newFilter)) { + return checkedProcess(new NotDimFilter(newFilter)); + } else { + return checkedProcess(filter); + } + } else { + return checkedProcess(filter); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/BoundRefKey.java b/sql/src/main/java/io/druid/sql/calcite/filtration/BoundRefKey.java new file mode 100644 index 00000000000..30d206036ad --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/BoundRefKey.java @@ -0,0 +1,112 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import io.druid.query.extraction.ExtractionFn; +import io.druid.query.filter.BoundDimFilter; +import io.druid.query.filter.SelectorDimFilter; +import io.druid.query.ordering.StringComparator; + +public class BoundRefKey +{ + private final String dimension; + private final ExtractionFn extractionFn; + private final StringComparator comparator; + + public BoundRefKey(String dimension, ExtractionFn extractionFn, StringComparator comparator) + { + this.dimension = dimension; + this.extractionFn = extractionFn; + this.comparator = comparator; + } + + public static BoundRefKey from(BoundDimFilter filter) + { + return new BoundRefKey( + filter.getDimension(), + filter.getExtractionFn(), + filter.getOrdering() + ); + } + + public static BoundRefKey from(SelectorDimFilter filter, StringComparator comparator) + { + return new BoundRefKey( + filter.getDimension(), + filter.getExtractionFn(), + comparator + ); + } + + public String getDimension() + { + return dimension; + } + + public ExtractionFn getExtractionFn() + { + return extractionFn; + } + + public StringComparator getComparator() + { + return comparator; + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + BoundRefKey boundRefKey = (BoundRefKey) o; + + if (dimension != null ? !dimension.equals(boundRefKey.dimension) : boundRefKey.dimension != null) { + return false; + } + if (extractionFn != null ? !extractionFn.equals(boundRefKey.extractionFn) : boundRefKey.extractionFn != null) { + return false; + } + return comparator != null ? comparator.equals(boundRefKey.comparator) : boundRefKey.comparator == null; + } + + @Override + public int hashCode() + { + int result = dimension != null ? dimension.hashCode() : 0; + result = 31 * result + (extractionFn != null ? extractionFn.hashCode() : 0); + result = 31 * result + (comparator != null ? comparator.hashCode() : 0); + return result; + } + + @Override + public String toString() + { + return "BoundRefKey{" + + "dimension='" + dimension + '\'' + + ", extractionFn=" + extractionFn + + ", comparator=" + comparator + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/BoundValue.java b/sql/src/main/java/io/druid/sql/calcite/filtration/BoundValue.java new file mode 100644 index 00000000000..c695d5f045e --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/BoundValue.java @@ -0,0 +1,87 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import io.druid.java.util.common.ISE; +import io.druid.query.ordering.StringComparator; + +public class BoundValue implements Comparable +{ + private final String value; + private final StringComparator comparator; + + public BoundValue(String value, StringComparator comparator) + { + this.value = value; + this.comparator = comparator; + } + + public String getValue() + { + return value; + } + + public StringComparator getComparator() + { + return comparator; + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + BoundValue that = (BoundValue) o; + + if (value != null ? !value.equals(that.value) : that.value != null) { + return false; + } + return comparator != null ? comparator.equals(that.comparator) : that.comparator == null; + + } + + @Override + public int hashCode() + { + int result = value != null ? value.hashCode() : 0; + result = 31 * result + (comparator != null ? comparator.hashCode() : 0); + return result; + } + + @Override + public int compareTo(BoundValue o) + { + if (!comparator.equals(o.comparator)) { + throw new ISE("WTF?! Comparator mismatch?!"); + } + return comparator.compare(value, o.value); + } + + @Override + public String toString() + { + return value; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/Bounds.java b/sql/src/main/java/io/druid/sql/calcite/filtration/Bounds.java new file mode 100644 index 00000000000..01952a0e663 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/Bounds.java @@ -0,0 +1,117 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.base.Function; +import com.google.common.collect.BoundType; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Lists; +import com.google.common.collect.Range; +import io.druid.query.filter.BoundDimFilter; + +import java.util.List; + +public class Bounds +{ + /** + * Negates single-ended Bound filters. + * + * @param bound filter + * + * @return negated filter, or null if this bound is double-ended. + */ + public static BoundDimFilter not(final BoundDimFilter bound) + { + if (bound.getUpper() != null && bound.getLower() != null) { + return null; + } else if (bound.getUpper() != null) { + return new BoundDimFilter( + bound.getDimension(), + bound.getUpper(), + null, + !bound.isUpperStrict(), + false, + null, + bound.getExtractionFn(), + bound.getOrdering() + ); + } else { + // bound.getLower() != null + return new BoundDimFilter( + bound.getDimension(), + null, + bound.getLower(), + false, + !bound.isLowerStrict(), + null, + bound.getExtractionFn(), + bound.getOrdering() + ); + } + } + + public static Range toRange(final BoundDimFilter bound) + { + final BoundValue upper = bound.getUpper() != null ? new BoundValue(bound.getUpper(), bound.getOrdering()) : null; + final BoundValue lower = bound.getLower() != null ? new BoundValue(bound.getLower(), bound.getOrdering()) : null; + + if (lower == null) { + return bound.isUpperStrict() ? Range.lessThan(upper) : Range.atMost(upper); + } else if (upper == null) { + return bound.isLowerStrict() ? Range.greaterThan(lower) : Range.atLeast(lower); + } else { + return Range.range( + lower, bound.isLowerStrict() ? BoundType.OPEN : BoundType.CLOSED, + upper, bound.isUpperStrict() ? BoundType.OPEN : BoundType.CLOSED + ); + } + } + + public static List> toRanges(final List bounds) + { + return ImmutableList.copyOf( + Lists.transform( + bounds, + new Function>() + { + @Override + public Range apply(BoundDimFilter bound) + { + return toRange(bound); + } + } + ) + ); + } + + public static BoundDimFilter toFilter(final BoundRefKey boundRefKey, final Range range) + { + return new BoundDimFilter( + boundRefKey.getDimension(), + range.hasLowerBound() ? range.lowerEndpoint().getValue() : null, + range.hasUpperBound() ? range.upperEndpoint().getValue() : null, + range.hasLowerBound() && range.lowerBoundType() == BoundType.OPEN, + range.hasUpperBound() && range.upperBoundType() == BoundType.OPEN, + null, + boundRefKey.getExtractionFn(), + boundRefKey.getComparator() + ); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/CombineAndSimplifyBounds.java b/sql/src/main/java/io/druid/sql/calcite/filtration/CombineAndSimplifyBounds.java new file mode 100644 index 00000000000..54d45c3c72e --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/CombineAndSimplifyBounds.java @@ -0,0 +1,230 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.base.Preconditions; +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import com.google.common.collect.Range; +import com.google.common.collect.RangeSet; +import io.druid.java.util.common.ISE; +import io.druid.query.filter.AndDimFilter; +import io.druid.query.filter.BoundDimFilter; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.NotDimFilter; +import io.druid.query.filter.OrDimFilter; + +import java.util.Iterator; +import java.util.List; +import java.util.Map; + +public class CombineAndSimplifyBounds extends BottomUpTransform +{ + private static final CombineAndSimplifyBounds INSTANCE = new CombineAndSimplifyBounds(); + + private CombineAndSimplifyBounds() + { + } + + public static CombineAndSimplifyBounds instance() + { + return INSTANCE; + } + + @Override + public DimFilter process(DimFilter filter) + { + if (filter instanceof AndDimFilter) { + final List children = ((AndDimFilter) filter).getFields(); + final DimFilter one = doSimplifyAnd(children); + final DimFilter two = negate(doSimplifyOr(negateAll(children))); + return computeCost(one) <= computeCost(two) ? one : two; + } else if (filter instanceof OrDimFilter) { + final List children = ((OrDimFilter) filter).getFields(); + final DimFilter one = doSimplifyOr(children); + final DimFilter two = negate(doSimplifyAnd(negateAll(children))); + return computeCost(one) <= computeCost(two) ? one : two; + } else if (filter instanceof NotDimFilter) { + return negate(((NotDimFilter) filter).getField()); + } else { + return filter; + } + } + + private static DimFilter doSimplifyAnd(final List children) + { + return doSimplify(children, false); + } + + private static DimFilter doSimplifyOr(final List children) + { + return doSimplify(children, true); + } + + /** + * Simplify BoundDimFilters that are children of an OR or an AND. + * + * @param children the filters + * @param disjunction true for disjunction, false for conjunction + * + * @return simplified filters + */ + private static DimFilter doSimplify(final List children, boolean disjunction) + { + // Copy children list + final List newChildren = Lists.newArrayList(children); + + // Group Bound filters by dimension, extractionFn, and comparator and compute a RangeSet for each one. + final Map> bounds = Maps.newHashMap(); + + final Iterator iterator = newChildren.iterator(); + while (iterator.hasNext()) { + final DimFilter child = iterator.next(); + + if (child.equals(Filtration.matchNothing())) { + // Child matches nothing, equivalent to FALSE + // OR with FALSE => ignore + // AND with FALSE => always false, short circuit + if (disjunction) { + iterator.remove(); + } else { + return Filtration.matchNothing(); + } + } else if (child.equals(Filtration.matchEverything())) { + // Child matches everything, equivalent to TRUE + // OR with TRUE => always true, short circuit + // AND with TRUE => ignore + if (disjunction) { + return Filtration.matchEverything(); + } else { + iterator.remove(); + } + } else if (child instanceof BoundDimFilter) { + final BoundDimFilter bound = (BoundDimFilter) child; + final BoundRefKey boundRefKey = BoundRefKey.from(bound); + List filterList = bounds.get(boundRefKey); + if (filterList == null) { + filterList = Lists.newArrayList(); + bounds.put(boundRefKey, filterList); + } + filterList.add(bound); + } + } + + // Try to simplify filters within each group. + for (Map.Entry> entry : bounds.entrySet()) { + final BoundRefKey boundRefKey = entry.getKey(); + final List filterList = entry.getValue(); + + // Create a RangeSet for this group. + final RangeSet rangeSet = disjunction + ? RangeSets.unionRanges(Bounds.toRanges(filterList)) + : RangeSets.intersectRanges(Bounds.toRanges(filterList)); + + if (rangeSet.asRanges().size() < filterList.size()) { + // We found a simplification. Remove the old filters and add new ones. + for (final BoundDimFilter bound : filterList) { + if (!newChildren.remove(bound)) { + throw new ISE("WTF?! Tried to remove bound but couldn't?"); + } + } + + if (rangeSet.asRanges().isEmpty()) { + // range set matches nothing, equivalent to FALSE + // OR with FALSE => ignore + // AND with FALSE => always false, short circuit + if (disjunction) { + newChildren.add(Filtration.matchNothing()); + } else { + return Filtration.matchNothing(); + } + } + + for (final Range range : rangeSet.asRanges()) { + if (!range.hasLowerBound() && !range.hasUpperBound()) { + // range matches all, equivalent to TRUE + // AND with TRUE => ignore + // OR with TRUE => always true; short circuit + if (disjunction) { + return Filtration.matchEverything(); + } else { + newChildren.add(Filtration.matchEverything()); + } + } else { + newChildren.add(Bounds.toFilter(boundRefKey, range)); + } + } + } + } + + Preconditions.checkState(newChildren.size() > 0, "newChildren.size > 0"); + if (newChildren.size() == 1) { + return newChildren.get(0); + } else { + return disjunction ? new OrDimFilter(newChildren) : new AndDimFilter(newChildren); + } + } + + private static DimFilter negate(final DimFilter filter) + { + if (Filtration.matchEverything().equals(filter)) { + return Filtration.matchNothing(); + } else if (Filtration.matchNothing().equals(filter)) { + return Filtration.matchEverything(); + } else if (filter instanceof NotDimFilter) { + return ((NotDimFilter) filter).getField(); + } else if (filter instanceof BoundDimFilter) { + final BoundDimFilter negated = Bounds.not((BoundDimFilter) filter); + return negated != null ? negated : new NotDimFilter(filter); + } else { + return new NotDimFilter(filter); + } + } + + private static List negateAll(final List children) + { + final List newChildren = Lists.newArrayListWithCapacity(children.size()); + for (final DimFilter child : children) { + newChildren.add(negate(child)); + } + return newChildren; + } + + private static int computeCost(final DimFilter filter) + { + if (filter instanceof NotDimFilter) { + return computeCost(((NotDimFilter) filter).getField()); + } else if (filter instanceof AndDimFilter) { + int cost = 0; + for (DimFilter field : ((AndDimFilter) filter).getFields()) { + cost += computeCost(field); + } + return cost; + } else if (filter instanceof OrDimFilter) { + int cost = 0; + for (DimFilter field : ((OrDimFilter) filter).getFields()) { + cost += computeCost(field); + } + return cost; + } else { + return 1; + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/ConvertBoundsToSelectors.java b/sql/src/main/java/io/druid/sql/calcite/filtration/ConvertBoundsToSelectors.java new file mode 100644 index 00000000000..d587a2b6639 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/ConvertBoundsToSelectors.java @@ -0,0 +1,72 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import io.druid.query.filter.BoundDimFilter; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.SelectorDimFilter; +import io.druid.query.ordering.StringComparator; +import io.druid.sql.calcite.expression.RowExtraction; +import io.druid.sql.calcite.table.DruidTable; +import io.druid.sql.calcite.table.DruidTables; + +public class ConvertBoundsToSelectors extends BottomUpTransform +{ + private final DruidTable druidTable; + + private ConvertBoundsToSelectors(final DruidTable druidTable) + { + this.druidTable = druidTable; + } + + public static ConvertBoundsToSelectors create(final DruidTable druidTable) + { + return new ConvertBoundsToSelectors(druidTable); + } + + @Override + public DimFilter process(DimFilter filter) + { + if (filter instanceof BoundDimFilter) { + final BoundDimFilter bound = (BoundDimFilter) filter; + final StringComparator naturalStringComparator = DruidTables.naturalStringComparator( + druidTable, + RowExtraction.of(bound.getDimension(), bound.getExtractionFn()) + ); + + if (bound.hasUpperBound() + && bound.hasLowerBound() + && bound.getUpper().equals(bound.getLower()) + && !bound.isUpperStrict() + && !bound.isLowerStrict() + && bound.getOrdering().equals(naturalStringComparator)) { + return new SelectorDimFilter( + bound.getDimension(), + bound.getUpper(), + bound.getExtractionFn() + ); + } else { + return filter; + } + } else { + return filter; + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/ConvertSelectorsToIns.java b/sql/src/main/java/io/druid/sql/calcite/filtration/ConvertSelectorsToIns.java new file mode 100644 index 00000000000..7a01afe8475 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/ConvertSelectorsToIns.java @@ -0,0 +1,106 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import io.druid.java.util.common.ISE; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.InDimFilter; +import io.druid.query.filter.OrDimFilter; +import io.druid.query.filter.SelectorDimFilter; +import io.druid.sql.calcite.expression.RowExtraction; +import io.druid.sql.calcite.table.DruidTable; +import io.druid.sql.calcite.table.DruidTables; + +import java.util.List; +import java.util.Map; + +public class ConvertSelectorsToIns extends BottomUpTransform +{ + private final DruidTable druidTable; + + private ConvertSelectorsToIns(final DruidTable druidTable) + { + this.druidTable = druidTable; + } + + public static ConvertSelectorsToIns create(final DruidTable druidTable) + { + return new ConvertSelectorsToIns(druidTable); + } + + @Override + public DimFilter process(DimFilter filter) + { + if (filter instanceof OrDimFilter) { + // Copy children list + final List children = Lists.newArrayList(((OrDimFilter) filter).getFields()); + + // Group filters by dimension and extractionFn. + final Map> selectors = Maps.newHashMap(); + + for (DimFilter child : children) { + if (child instanceof SelectorDimFilter) { + final SelectorDimFilter selector = (SelectorDimFilter) child; + final BoundRefKey boundRefKey = BoundRefKey.from( + selector, + DruidTables.naturalStringComparator( + druidTable, + RowExtraction.of(selector.getDimension(), selector.getExtractionFn()) + ) + ); + List filterList = selectors.get(boundRefKey); + if (filterList == null) { + filterList = Lists.newArrayList(); + selectors.put(boundRefKey, filterList); + } + filterList.add(selector); + } + } + + // Emit IN filters for each group of size > 1. + for (Map.Entry> entry : selectors.entrySet()) { + final List filterList = entry.getValue(); + if (filterList.size() > 1) { + // We found a simplification. Remove the old filters and add new ones. + final List values = Lists.newArrayList(); + + for (final SelectorDimFilter selector : filterList) { + values.add(selector.getValue()); + if (!children.remove(selector)) { + throw new ISE("WTF?! Tried to remove selector but couldn't?"); + } + } + + children.add(new InDimFilter(entry.getKey().getDimension(), values, entry.getKey().getExtractionFn())); + } + } + + if (!children.equals(((OrDimFilter) filter).getFields())) { + return children.size() == 1 ? children.get(0) : new OrDimFilter(children); + } else { + return filter; + } + } else { + return filter; + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/Filtration.java b/sql/src/main/java/io/druid/sql/calcite/filtration/Filtration.java new file mode 100644 index 00000000000..37448a6780d --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/Filtration.java @@ -0,0 +1,189 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.base.Function; +import com.google.common.collect.ImmutableList; +import io.druid.common.utils.JodaUtils; +import io.druid.java.util.common.ISE; +import io.druid.js.JavaScriptConfig; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.JavaScriptDimFilter; +import io.druid.query.spec.MultipleIntervalSegmentSpec; +import io.druid.query.spec.QuerySegmentSpec; +import io.druid.sql.calcite.table.DruidTable; +import org.joda.time.Interval; + +import java.util.List; + +public class Filtration +{ + private static final Interval ETERNITY = new Interval(JodaUtils.MIN_INSTANT, JodaUtils.MAX_INSTANT); + private static final DimFilter MATCH_NOTHING = new JavaScriptDimFilter( + "dummy", "function(x){return false;}", null, JavaScriptConfig.getDefault() + ); + private static final DimFilter MATCH_EVERYTHING = new JavaScriptDimFilter( + "dummy", "function(x){return true;}", null, JavaScriptConfig.getDefault() + ); + + // 1) If "dimFilter" is null, it should be ignored and not affect filtration. + // 2) There is an implicit AND between "intervals" and "dimFilter" (if dimFilter is non-null). + // 3) There is an implicit OR between the intervals in "intervals". + private final DimFilter dimFilter; + private final List intervals; + + private Filtration(final DimFilter dimFilter, final List intervals) + { + this.intervals = intervals != null ? intervals : ImmutableList.of(ETERNITY); + this.dimFilter = dimFilter; + } + + public static Interval eternity() + { + return ETERNITY; + } + + public static DimFilter matchNothing() + { + return MATCH_NOTHING; + } + + public static DimFilter matchEverything() + { + return MATCH_EVERYTHING; + } + + public static Filtration create(final DimFilter dimFilter) + { + return new Filtration(dimFilter, null); + } + + public static Filtration create(final DimFilter dimFilter, final List intervals) + { + return new Filtration(dimFilter, intervals); + } + + private static Filtration transform(final Filtration filtration, final List> fns) + { + Filtration retVal = filtration; + for (Function fn : fns) { + retVal = fn.apply(retVal); + } + return retVal; + } + + public QuerySegmentSpec getQuerySegmentSpec() + { + return new MultipleIntervalSegmentSpec(intervals); + } + + public List getIntervals() + { + return intervals; + } + + public DimFilter getDimFilter() + { + return dimFilter; + } + + /** + * Optimize a Filtration for querying, possibly pulling out intervals and simplifying the dimFilter in the process. + * + * @return equivalent Filtration + */ + public Filtration optimize(final DruidTable druidTable) + { + return transform( + this, + ImmutableList.of( + CombineAndSimplifyBounds.instance(), + MoveTimeFiltersToIntervals.instance(), + ConvertBoundsToSelectors.create(druidTable), + ConvertSelectorsToIns.create(druidTable), + MoveMarkerFiltersToIntervals.instance(), + ValidateNoMarkerFiltersRemain.instance() + ) + ); + } + + /** + * Optimize a Filtration containing only a DimFilter, avoiding pulling out intervals. + * + * @return equivalent Filtration + */ + public Filtration optimizeFilterOnly(final DruidTable druidTable) + { + if (!intervals.equals(ImmutableList.of(eternity()))) { + throw new ISE("Cannot optimizeFilterOnly when intervals are set"); + } + + final Filtration transformed = transform( + this, + ImmutableList.>of( + CombineAndSimplifyBounds.instance(), + ConvertBoundsToSelectors.create(druidTable), + ConvertSelectorsToIns.create(druidTable) + ) + ); + + if (!transformed.getIntervals().equals(ImmutableList.of(eternity()))) { + throw new ISE("WTF?! optimizeFilterOnly was about to return filtration with intervals?!"); + } + + return transformed; + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + Filtration that = (Filtration) o; + + if (intervals != null ? !intervals.equals(that.intervals) : that.intervals != null) { + return false; + } + return dimFilter != null ? dimFilter.equals(that.dimFilter) : that.dimFilter == null; + + } + + @Override + public int hashCode() + { + int result = intervals != null ? intervals.hashCode() : 0; + result = 31 * result + (dimFilter != null ? dimFilter.hashCode() : 0); + return result; + } + + @Override + public String toString() + { + return "Filtration{" + + "intervals=" + intervals + + ", dimFilter=" + dimFilter + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/MoveMarkerFiltersToIntervals.java b/sql/src/main/java/io/druid/sql/calcite/filtration/MoveMarkerFiltersToIntervals.java new file mode 100644 index 00000000000..89290177ab9 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/MoveMarkerFiltersToIntervals.java @@ -0,0 +1,50 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.base.Function; +import com.google.common.collect.ImmutableList; +import org.joda.time.Interval; + +public class MoveMarkerFiltersToIntervals implements Function +{ + private static final MoveMarkerFiltersToIntervals INSTANCE = new MoveMarkerFiltersToIntervals(); + + private MoveMarkerFiltersToIntervals() + { + } + + public static MoveMarkerFiltersToIntervals instance() + { + return INSTANCE; + } + + @Override + public Filtration apply(final Filtration filtration) + { + if (Filtration.matchEverything().equals(filtration.getDimFilter())) { + return Filtration.create(null, filtration.getIntervals()); + } else if (Filtration.matchNothing().equals(filtration.getDimFilter())) { + return Filtration.create(null, ImmutableList.of()); + } else { + return filtration; + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/MoveTimeFiltersToIntervals.java b/sql/src/main/java/io/druid/sql/calcite/filtration/MoveTimeFiltersToIntervals.java new file mode 100644 index 00000000000..1ec9f0691d1 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/MoveTimeFiltersToIntervals.java @@ -0,0 +1,172 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.base.Function; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Lists; +import com.google.common.collect.Range; +import com.google.common.collect.RangeSet; +import io.druid.java.util.common.Pair; +import io.druid.query.filter.AndDimFilter; +import io.druid.query.filter.BoundDimFilter; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.NotDimFilter; +import io.druid.query.filter.OrDimFilter; +import io.druid.query.ordering.StringComparators; +import io.druid.segment.column.Column; + +import java.util.List; + +public class MoveTimeFiltersToIntervals implements Function +{ + private static final MoveTimeFiltersToIntervals INSTANCE = new MoveTimeFiltersToIntervals(); + private static final BoundRefKey TIME_BOUND_REF_KEY = new BoundRefKey( + Column.TIME_COLUMN_NAME, + null, + StringComparators.NUMERIC + ); + + private MoveTimeFiltersToIntervals() + { + } + + public static MoveTimeFiltersToIntervals instance() + { + return INSTANCE; + } + + @Override + public Filtration apply(final Filtration filtration) + { + if (filtration.getDimFilter() == null) { + return filtration; + } + + // Convert existing filtration intervals to a RangeSet. + final RangeSet rangeSet = RangeSets.fromIntervals(filtration.getIntervals()); + + // Remove anything outside eternity. + rangeSet.removeAll(RangeSets.fromIntervals(ImmutableList.of(Filtration.eternity())).complement()); + + // Extract time bounds from the dimFilter. + final Pair> pair = extractConvertibleTimeBounds(filtration.getDimFilter()); + + if (pair.rhs != null) { + rangeSet.removeAll(pair.rhs.complement()); + } + + return Filtration.create(pair.lhs, RangeSets.toIntervals(rangeSet)); + } + + /** + * Extract bound filters on __time that can be converted to query-level "intervals". + * + * @return pair of new dimFilter + RangeSet of __time that should be ANDed together. Either can be null but not both. + */ + private static Pair> extractConvertibleTimeBounds(final DimFilter filter) + { + if (filter instanceof AndDimFilter) { + final List children = ((AndDimFilter) filter).getFields(); + final List newChildren = Lists.newArrayList(); + final List> rangeSets = Lists.newArrayList(); + + for (DimFilter child : children) { + final Pair> pair = extractConvertibleTimeBounds(child); + if (pair.lhs != null) { + newChildren.add(pair.lhs); + } + if (pair.rhs != null) { + rangeSets.add(pair.rhs); + } + } + + final DimFilter newFilter; + if (newChildren.size() == 0) { + newFilter = null; + } else if (newChildren.size() == 1) { + newFilter = newChildren.get(0); + } else { + newFilter = new AndDimFilter(newChildren); + } + + return Pair.of( + newFilter, + rangeSets.isEmpty() ? null : RangeSets.intersectRangeSets(rangeSets) + ); + } else if (filter instanceof OrDimFilter) { + final List children = ((OrDimFilter) filter).getFields(); + final List> rangeSets = Lists.newArrayList(); + + boolean allCompletelyConverted = true; + boolean allHadIntervals = true; + for (DimFilter child : children) { + final Pair> pair = extractConvertibleTimeBounds(child); + if (pair.lhs != null) { + allCompletelyConverted = false; + } + if (pair.rhs != null) { + rangeSets.add(pair.rhs); + } else { + allHadIntervals = false; + } + } + + if (allCompletelyConverted) { + return Pair.of(null, RangeSets.unionRangeSets(rangeSets)); + } else { + return Pair.of(filter, allHadIntervals ? RangeSets.unionRangeSets(rangeSets) : null); + } + } else if (filter instanceof NotDimFilter) { + final DimFilter child = ((NotDimFilter) filter).getField(); + final Pair> pair = extractConvertibleTimeBounds(child); + if (pair.rhs != null && pair.lhs == null) { + return Pair.of(null, pair.rhs.complement()); + } else { + return Pair.of(filter, null); + } + } else if (filter instanceof BoundDimFilter) { + final BoundDimFilter bound = (BoundDimFilter) filter; + if (BoundRefKey.from(bound).equals(TIME_BOUND_REF_KEY)) { + return Pair.of(null, RangeSets.of(toLongRange(Bounds.toRange(bound)))); + } else { + return Pair.of(filter, null); + } + } else { + return Pair.of(filter, null); + } + } + + private static Range toLongRange(final Range range) + { + if (!range.hasUpperBound() && !range.hasLowerBound()) { + return Range.all(); + } else if (range.hasUpperBound() && !range.hasLowerBound()) { + return Range.upTo(Long.parseLong(range.upperEndpoint().getValue()), range.upperBoundType()); + } else if (!range.hasUpperBound() && range.hasLowerBound()) { + return Range.downTo(Long.parseLong(range.lowerEndpoint().getValue()), range.lowerBoundType()); + } else { + return Range.range( + Long.parseLong(range.lowerEndpoint().getValue()), range.lowerBoundType(), + Long.parseLong(range.upperEndpoint().getValue()), range.upperBoundType() + ); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/RangeSets.java b/sql/src/main/java/io/druid/sql/calcite/filtration/RangeSets.java new file mode 100644 index 00000000000..345a7e748d2 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/RangeSets.java @@ -0,0 +1,136 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.collect.BoundType; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Lists; +import com.google.common.collect.Range; +import com.google.common.collect.RangeSet; +import com.google.common.collect.TreeRangeSet; +import org.joda.time.Interval; + +import java.util.List; + +public class RangeSets +{ + public static > RangeSet of(final Range range) + { + return unionRanges(ImmutableList.of(range)); + } + + /** + * Unions a set of ranges, or returns null if the set is empty. + */ + public static > RangeSet unionRanges(final Iterable> ranges) + { + RangeSet rangeSet = null; + for (Range range : ranges) { + if (rangeSet == null) { + rangeSet = TreeRangeSet.create(); + } + rangeSet.add(range); + } + return rangeSet; + } + + /** + * Unions a set of rangeSets, or returns null if the set is empty. + */ + public static > RangeSet unionRangeSets(final Iterable> rangeSets) + { + final RangeSet rangeSet = TreeRangeSet.create(); + for (RangeSet set : rangeSets) { + rangeSet.addAll(set); + } + return rangeSet; + } + + /** + * Intersects a set of ranges, or returns null if the set is empty. + */ + public static > RangeSet intersectRanges(final Iterable> ranges) + { + RangeSet rangeSet = null; + for (final Range range : ranges) { + if (rangeSet == null) { + rangeSet = TreeRangeSet.create(); + rangeSet.add(range); + } else { + rangeSet = TreeRangeSet.create(rangeSet.subRangeSet(range)); + } + } + return rangeSet; + } + + /** + * Intersects a set of rangeSets, or returns null if the set is empty. + */ + public static > RangeSet intersectRangeSets(final Iterable> rangeSets) + { + RangeSet rangeSet = null; + for (final RangeSet set : rangeSets) { + if (rangeSet == null) { + rangeSet = TreeRangeSet.create(); + rangeSet.addAll(set); + } else { + rangeSet.removeAll(set.complement()); + } + } + return rangeSet; + } + + public static RangeSet fromIntervals(final Iterable intervals) + { + final RangeSet retVal = TreeRangeSet.create(); + for (Interval interval : intervals) { + retVal.add(Range.closedOpen(interval.getStartMillis(), interval.getEndMillis())); + } + return retVal; + } + + public static List toIntervals(final RangeSet rangeSet) + { + final List retVal = Lists.newArrayList(); + + for (Range range : rangeSet.asRanges()) { + final long start; + final long end; + + if (range.hasLowerBound()) { + final long millis = range.lowerEndpoint(); + start = millis + (range.lowerBoundType() == BoundType.OPEN ? 1 : 0); + } else { + start = Filtration.eternity().getStartMillis(); + } + + if (range.hasUpperBound()) { + final long millis = range.upperEndpoint(); + end = millis + (range.upperBoundType() == BoundType.OPEN ? 0 : 1); + } else { + end = Filtration.eternity().getEndMillis(); + } + + retVal.add(new Interval(start, end)); + } + + return retVal; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/filtration/ValidateNoMarkerFiltersRemain.java b/sql/src/main/java/io/druid/sql/calcite/filtration/ValidateNoMarkerFiltersRemain.java new file mode 100644 index 00000000000..0758cca40da --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/filtration/ValidateNoMarkerFiltersRemain.java @@ -0,0 +1,47 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import io.druid.java.util.common.ISE; +import io.druid.query.filter.DimFilter; + +public class ValidateNoMarkerFiltersRemain extends BottomUpTransform +{ + private static final ValidateNoMarkerFiltersRemain INSTANCE = new ValidateNoMarkerFiltersRemain(); + + private ValidateNoMarkerFiltersRemain() + { + } + + public static ValidateNoMarkerFiltersRemain instance() + { + return INSTANCE; + } + + @Override + protected DimFilter process(DimFilter filter) + { + if (Filtration.matchNothing().equals(filter) || Filtration.matchEverything().equals(filter)) { + throw new ISE("Marker filters shouldn't exist in the final filter, but found: %s", filter); + } + + return filter; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/planner/AggregateValuesRule.java b/sql/src/main/java/io/druid/sql/calcite/planner/AggregateValuesRule.java new file mode 100644 index 00000000000..c80fb7ab7d2 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/planner/AggregateValuesRule.java @@ -0,0 +1,98 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.planner; + +import com.google.common.base.Predicates; +import com.google.common.collect.ImmutableList; +import org.apache.calcite.plan.RelOptRule; +import org.apache.calcite.plan.RelOptRuleCall; +import org.apache.calcite.rel.core.Aggregate; +import org.apache.calcite.rel.core.AggregateCall; +import org.apache.calcite.rel.core.Values; +import org.apache.calcite.rel.logical.LogicalValues; +import org.apache.calcite.rex.RexBuilder; +import org.apache.calcite.rex.RexLiteral; + +import java.math.BigDecimal; + +/** + * Rule that applies Aggregate to Values. Currently only applies to empty Values. + * + * This is still useful because PruneEmptyRules doesn't handle Aggregate, which is in turn because + * Aggregate of empty relations need some special handling: a single row will be generated, where + * each column's value depends on the specific aggregate calls (e.g. COUNT is 0, SUM is NULL). + * Sample query where this matters: SELECT COUNT(*) FROM s.foo WHERE 1 = 0. + * + * Can be replaced by AggregateValuesRule in Calcite 1.11.0, when released. + */ +public class AggregateValuesRule extends RelOptRule +{ + public static final AggregateValuesRule INSTANCE = new AggregateValuesRule(); + + private AggregateValuesRule() + { + super( + operand(Aggregate.class, null, Predicates.not(Aggregate.IS_NOT_GRAND_TOTAL), + operand(Values.class, null, Values.IS_EMPTY, none()) + ) + ); + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Aggregate aggregate = call.rel(0); + final Values values = call.rel(1); + + final ImmutableList.Builder literals = ImmutableList.builder(); + + final RexBuilder rexBuilder = call.builder().getRexBuilder(); + for (final AggregateCall aggregateCall : aggregate.getAggCallList()) { + switch (aggregateCall.getAggregation().getKind()) { + case COUNT: + case SUM0: + literals.add((RexLiteral) rexBuilder.makeLiteral( + BigDecimal.ZERO, aggregateCall.getType(), false)); + break; + + case MIN: + case MAX: + case SUM: + literals.add(rexBuilder.constantNull()); + break; + + default: + // Unknown what this aggregate call should do on empty Values. Bail out to be safe. + return; + } + } + + call.transformTo( + LogicalValues.create( + values.getCluster(), + aggregate.getRowType(), + ImmutableList.of(literals.build()) + ) + ); + + // New plan is absolutely better than old plan. + call.getPlanner().setImportance(aggregate, 0.0); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/planner/Calcites.java b/sql/src/main/java/io/druid/sql/calcite/planner/Calcites.java new file mode 100644 index 00000000000..28e7c6254c0 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/planner/Calcites.java @@ -0,0 +1,89 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.planner; + +import org.apache.calcite.jdbc.CalciteConnection; +import org.apache.calcite.jdbc.CalciteJdbc41Factory; +import org.apache.calcite.jdbc.CalcitePrepare; +import org.apache.calcite.jdbc.Driver; +import org.apache.calcite.linq4j.function.Function0; +import org.apache.calcite.schema.Schema; +import org.apache.calcite.schema.SchemaPlus; + +import java.sql.SQLException; +import java.util.Properties; + +/** + * Entry points for Calcite. + */ +public class Calcites +{ + private static final String DRUID_SCHEMA_NAME = "druid"; + + private Calcites() + { + // No instantiation. + } + + /** + * Create a Calcite JDBC driver. + * + * @param druidSchema "druid" schema + * + * @return JDBC driver + */ + public static CalciteConnection jdbc( + final Schema druidSchema, + final PlannerConfig plannerConfig + ) throws SQLException + { + final Properties props = new Properties(); + props.setProperty("caseSensitive", "true"); + props.setProperty("unquotedCasing", "UNCHANGED"); + + final CalciteJdbc41Factory jdbcFactory = new CalciteJdbc41Factory(); + final Function0 prepareFactory = new Function0() + { + @Override + public CalcitePrepare apply() + { + return new DruidPlannerImpl(plannerConfig); + } + }; + final Driver driver = new Driver() + { + @Override + protected Function0 createPrepareFactory() + { + return prepareFactory; + } + }; + final CalciteConnection calciteConnection = (CalciteConnection) jdbcFactory.newConnection( + driver, + jdbcFactory, + "jdbc:calcite:", + props + ); + + final SchemaPlus druidSchemaPlus = calciteConnection.getRootSchema().add(DRUID_SCHEMA_NAME, druidSchema); + druidSchemaPlus.setCacheEnabled(false); + return calciteConnection; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/planner/DruidConvertletTable.java b/sql/src/main/java/io/druid/sql/calcite/planner/DruidConvertletTable.java new file mode 100644 index 00000000000..3675602a1ca --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/planner/DruidConvertletTable.java @@ -0,0 +1,59 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.planner; + +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlCall; +import org.apache.calcite.sql.SqlKind; +import org.apache.calcite.sql2rel.SqlRexContext; +import org.apache.calcite.sql2rel.SqlRexConvertlet; +import org.apache.calcite.sql2rel.SqlRexConvertletTable; +import org.apache.calcite.sql2rel.StandardConvertletTable; + +public class DruidConvertletTable implements SqlRexConvertletTable +{ + private static final DruidConvertletTable INSTANCE = new DruidConvertletTable(); + + private DruidConvertletTable() + { + } + + public static DruidConvertletTable instance() + { + return INSTANCE; + } + + @Override + public SqlRexConvertlet get(SqlCall call) + { + if (call.getKind() == SqlKind.EXTRACT && call.getOperandList().get(1).getKind() != SqlKind.LITERAL) { + return new SqlRexConvertlet() + { + @Override + public RexNode convertCall(SqlRexContext cx, SqlCall call) + { + return StandardConvertletTable.INSTANCE.convertCall(cx, call); + } + }; + } else { + return StandardConvertletTable.INSTANCE.get(call); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/planner/DruidPlannerImpl.java b/sql/src/main/java/io/druid/sql/calcite/planner/DruidPlannerImpl.java new file mode 100644 index 00000000000..4665a94ccd9 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/planner/DruidPlannerImpl.java @@ -0,0 +1,68 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.planner; + +import org.apache.calcite.plan.Contexts; +import org.apache.calcite.plan.ConventionTraitDef; +import org.apache.calcite.plan.RelOptCostFactory; +import org.apache.calcite.plan.RelOptPlanner; +import org.apache.calcite.plan.RelOptRule; +import org.apache.calcite.plan.volcano.VolcanoPlanner; +import org.apache.calcite.prepare.CalcitePrepareImpl; +import org.apache.calcite.rel.RelCollationTraitDef; + +/** + * Our very own subclass of CalcitePrepareImpl, used to alter behaviors of the JDBC driver as necessary. + * + * When Calcite 1.11.0 is released, we should override "createConvertletTable" and provide the + * DruidConvertletTable. + */ +public class DruidPlannerImpl extends CalcitePrepareImpl +{ + private final PlannerConfig plannerConfig; + + public DruidPlannerImpl(PlannerConfig plannerConfig) + { + this.plannerConfig = plannerConfig; + } + + @Override + protected RelOptPlanner createPlanner( + final Context prepareContext, + final org.apache.calcite.plan.Context externalContext0, + final RelOptCostFactory costFactory + ) + { + final org.apache.calcite.plan.Context externalContext = externalContext0 != null + ? externalContext0 + : Contexts.of(prepareContext.config()); + + final VolcanoPlanner planner = new VolcanoPlanner(costFactory, externalContext); + planner.addRelTraitDef(ConventionTraitDef.INSTANCE); + planner.addRelTraitDef(RelCollationTraitDef.INSTANCE); + + // Register planner rules. + for (RelOptRule rule : Rules.ruleSet(plannerConfig)) { + planner.addRule(rule); + } + + return planner; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/planner/PlannerConfig.java b/sql/src/main/java/io/druid/sql/calcite/planner/PlannerConfig.java new file mode 100644 index 00000000000..7ed2f4d630e --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/planner/PlannerConfig.java @@ -0,0 +1,145 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.planner; + +import com.fasterxml.jackson.annotation.JsonProperty; +import org.joda.time.Period; + +public class PlannerConfig +{ + @JsonProperty + private Period metadataRefreshPeriod = new Period("PT1M"); + + @JsonProperty + private int maxSemiJoinRowsInMemory = 100000; + + @JsonProperty + private int maxTopNLimit = 100000; + + @JsonProperty + private int selectThreshold = 1000; + + @JsonProperty + private boolean useApproximateCountDistinct = true; + + @JsonProperty + private boolean useApproximateTopN = true; + + @JsonProperty + private boolean useFallback = false; + + public Period getMetadataRefreshPeriod() + { + return metadataRefreshPeriod; + } + + public int getMaxSemiJoinRowsInMemory() + { + return maxSemiJoinRowsInMemory; + } + + public int getMaxTopNLimit() + { + return maxTopNLimit; + } + + public int getSelectThreshold() + { + return selectThreshold; + } + + public boolean isUseApproximateCountDistinct() + { + return useApproximateCountDistinct; + } + + public boolean isUseApproximateTopN() + { + return useApproximateTopN; + } + + public boolean isUseFallback() + { + return useFallback; + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + PlannerConfig that = (PlannerConfig) o; + + if (maxSemiJoinRowsInMemory != that.maxSemiJoinRowsInMemory) { + return false; + } + if (maxTopNLimit != that.maxTopNLimit) { + return false; + } + if (selectThreshold != that.selectThreshold) { + return false; + } + if (useApproximateCountDistinct != that.useApproximateCountDistinct) { + return false; + } + if (useApproximateTopN != that.useApproximateTopN) { + return false; + } + if (useFallback != that.useFallback) { + return false; + } + return metadataRefreshPeriod != null + ? metadataRefreshPeriod.equals(that.metadataRefreshPeriod) + : that.metadataRefreshPeriod == null; + + } + + @Override + public int hashCode() + { + int result = metadataRefreshPeriod != null ? metadataRefreshPeriod.hashCode() : 0; + result = 31 * result + maxSemiJoinRowsInMemory; + result = 31 * result + maxTopNLimit; + result = 31 * result + selectThreshold; + result = 31 * result + (useApproximateCountDistinct ? 1 : 0); + result = 31 * result + (useApproximateTopN ? 1 : 0); + result = 31 * result + (useFallback ? 1 : 0); + return result; + } + + @Override + public String toString() + { + return "PlannerConfig{" + + "metadataRefreshPeriod=" + metadataRefreshPeriod + + ", maxSemiJoinRowsInMemory=" + maxSemiJoinRowsInMemory + + ", maxTopNLimit=" + maxTopNLimit + + ", selectThreshold=" + selectThreshold + + ", useApproximateCountDistinct=" + useApproximateCountDistinct + + ", useApproximateTopN=" + useApproximateTopN + + ", useFallback=" + useFallback + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/planner/Rules.java b/sql/src/main/java/io/druid/sql/calcite/planner/Rules.java new file mode 100644 index 00000000000..aea79f0b246 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/planner/Rules.java @@ -0,0 +1,214 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.planner; + +import com.google.common.collect.ImmutableList; +import io.druid.sql.calcite.rule.DruidBindableConverterRule; +import io.druid.sql.calcite.rule.DruidFilterRule; +import io.druid.sql.calcite.rule.DruidSelectProjectionRule; +import io.druid.sql.calcite.rule.DruidSelectSortRule; +import io.druid.sql.calcite.rule.DruidSemiJoinRule; +import io.druid.sql.calcite.rule.GroupByRules; +import org.apache.calcite.adapter.enumerable.EnumerableInterpreterRule; +import org.apache.calcite.adapter.enumerable.EnumerableRules; +import org.apache.calcite.interpreter.Bindables; +import org.apache.calcite.plan.RelOptRule; +import org.apache.calcite.plan.volcano.AbstractConverter; +import org.apache.calcite.rel.rules.AggregateJoinTransposeRule; +import org.apache.calcite.rel.rules.AggregateProjectMergeRule; +import org.apache.calcite.rel.rules.AggregateProjectPullUpConstantsRule; +import org.apache.calcite.rel.rules.AggregateRemoveRule; +import org.apache.calcite.rel.rules.AggregateStarTableRule; +import org.apache.calcite.rel.rules.CalcRemoveRule; +import org.apache.calcite.rel.rules.DateRangeRules; +import org.apache.calcite.rel.rules.FilterAggregateTransposeRule; +import org.apache.calcite.rel.rules.FilterJoinRule; +import org.apache.calcite.rel.rules.FilterMergeRule; +import org.apache.calcite.rel.rules.FilterProjectTransposeRule; +import org.apache.calcite.rel.rules.FilterTableScanRule; +import org.apache.calcite.rel.rules.JoinCommuteRule; +import org.apache.calcite.rel.rules.JoinPushExpressionsRule; +import org.apache.calcite.rel.rules.JoinPushThroughJoinRule; +import org.apache.calcite.rel.rules.ProjectFilterTransposeRule; +import org.apache.calcite.rel.rules.ProjectMergeRule; +import org.apache.calcite.rel.rules.ProjectRemoveRule; +import org.apache.calcite.rel.rules.ProjectTableScanRule; +import org.apache.calcite.rel.rules.ProjectToWindowRule; +import org.apache.calcite.rel.rules.ProjectWindowTransposeRule; +import org.apache.calcite.rel.rules.PruneEmptyRules; +import org.apache.calcite.rel.rules.ReduceExpressionsRule; +import org.apache.calcite.rel.rules.SemiJoinRule; +import org.apache.calcite.rel.rules.SortJoinTransposeRule; +import org.apache.calcite.rel.rules.SortProjectTransposeRule; +import org.apache.calcite.rel.rules.SortRemoveRule; +import org.apache.calcite.rel.rules.SortUnionTransposeRule; +import org.apache.calcite.rel.rules.TableScanRule; +import org.apache.calcite.rel.rules.UnionMergeRule; +import org.apache.calcite.rel.rules.UnionPullUpConstantsRule; +import org.apache.calcite.rel.rules.UnionToDistinctRule; +import org.apache.calcite.rel.rules.ValuesReduceRule; + +import java.util.List; + +public class Rules +{ + // Rules from CalcitePrepareImpl's DEFAULT_RULES, minus AggregateExpandDistinctAggregatesRule + // and AggregateReduceFunctionsRule. + private static final List DEFAULT_RULES = + ImmutableList.of( + AggregateStarTableRule.INSTANCE, + AggregateStarTableRule.INSTANCE2, + TableScanRule.INSTANCE, + ProjectMergeRule.INSTANCE, + FilterTableScanRule.INSTANCE, + ProjectFilterTransposeRule.INSTANCE, + FilterProjectTransposeRule.INSTANCE, + FilterJoinRule.FILTER_ON_JOIN, + JoinPushExpressionsRule.INSTANCE, + FilterAggregateTransposeRule.INSTANCE, + ProjectWindowTransposeRule.INSTANCE, + JoinCommuteRule.INSTANCE, + JoinPushThroughJoinRule.RIGHT, + JoinPushThroughJoinRule.LEFT, + SortProjectTransposeRule.INSTANCE, + SortJoinTransposeRule.INSTANCE, + SortUnionTransposeRule.INSTANCE + ); + + // Rules from CalcitePrepareImpl's createPlanner. + private static final List MISCELLANEOUS_RULES = + ImmutableList.of( + Bindables.BINDABLE_TABLE_SCAN_RULE, + ProjectTableScanRule.INSTANCE, + ProjectTableScanRule.INTERPRETER, + EnumerableInterpreterRule.INSTANCE, + EnumerableRules.ENUMERABLE_VALUES_RULE + ); + + // Rules from CalcitePrepareImpl's CONSTANT_REDUCTION_RULES. + private static final List CONSTANT_REDUCTION_RULES = + ImmutableList.of( + ReduceExpressionsRule.PROJECT_INSTANCE, + ReduceExpressionsRule.CALC_INSTANCE, + ReduceExpressionsRule.JOIN_INSTANCE, + ReduceExpressionsRule.FILTER_INSTANCE, + ValuesReduceRule.FILTER_INSTANCE, + ValuesReduceRule.PROJECT_FILTER_INSTANCE, + ValuesReduceRule.PROJECT_INSTANCE, + AggregateValuesRule.INSTANCE + ); + + // Rules from CalcitePrepareImpl's ENUMERABLE_RULES. + private static final List ENUMERABLE_RULES = + ImmutableList.of( + EnumerableRules.ENUMERABLE_JOIN_RULE, + EnumerableRules.ENUMERABLE_MERGE_JOIN_RULE, + EnumerableRules.ENUMERABLE_SEMI_JOIN_RULE, + EnumerableRules.ENUMERABLE_CORRELATE_RULE, + EnumerableRules.ENUMERABLE_PROJECT_RULE, + EnumerableRules.ENUMERABLE_FILTER_RULE, + EnumerableRules.ENUMERABLE_AGGREGATE_RULE, + EnumerableRules.ENUMERABLE_SORT_RULE, + EnumerableRules.ENUMERABLE_LIMIT_RULE, + EnumerableRules.ENUMERABLE_COLLECT_RULE, + EnumerableRules.ENUMERABLE_UNCOLLECT_RULE, + EnumerableRules.ENUMERABLE_UNION_RULE, + EnumerableRules.ENUMERABLE_INTERSECT_RULE, + EnumerableRules.ENUMERABLE_MINUS_RULE, + EnumerableRules.ENUMERABLE_TABLE_MODIFICATION_RULE, + EnumerableRules.ENUMERABLE_VALUES_RULE, + EnumerableRules.ENUMERABLE_WINDOW_RULE, + EnumerableRules.ENUMERABLE_TABLE_SCAN_RULE, + EnumerableRules.ENUMERABLE_TABLE_FUNCTION_SCAN_RULE + ); + + // Rules from VolcanoPlanner's registerAbstractRelationalRules. + private static final List VOLCANO_ABSTRACT_RULES = + ImmutableList.of( + FilterJoinRule.FILTER_ON_JOIN, + FilterJoinRule.JOIN, + AbstractConverter.ExpandConversionRule.INSTANCE, + JoinCommuteRule.INSTANCE, + SemiJoinRule.INSTANCE, + AggregateRemoveRule.INSTANCE, + UnionToDistinctRule.INSTANCE, + ProjectRemoveRule.INSTANCE, + AggregateJoinTransposeRule.INSTANCE, + AggregateProjectMergeRule.INSTANCE, + CalcRemoveRule.INSTANCE, + SortRemoveRule.INSTANCE + ); + + // Rules from RelOptUtil's registerAbstractRels. + private static final List RELOPTUTIL_ABSTRACT_RULES = + ImmutableList.of( + AggregateProjectPullUpConstantsRule.INSTANCE2, + UnionPullUpConstantsRule.INSTANCE, + PruneEmptyRules.UNION_INSTANCE, + PruneEmptyRules.PROJECT_INSTANCE, + PruneEmptyRules.FILTER_INSTANCE, + PruneEmptyRules.SORT_INSTANCE, + PruneEmptyRules.AGGREGATE_INSTANCE, + PruneEmptyRules.JOIN_LEFT_INSTANCE, + PruneEmptyRules.JOIN_RIGHT_INSTANCE, + PruneEmptyRules.SORT_FETCH_ZERO_INSTANCE, + UnionMergeRule.INSTANCE, + ProjectToWindowRule.PROJECT, + FilterMergeRule.INSTANCE, + DateRangeRules.FILTER_INSTANCE + ); + + private Rules() + { + // No instantiation. + } + + public static List ruleSet(final PlannerConfig plannerConfig) + { + final ImmutableList.Builder rules = ImmutableList.builder(); + + // Calcite rules. + rules.addAll(DEFAULT_RULES); + rules.addAll(MISCELLANEOUS_RULES); + rules.addAll(CONSTANT_REDUCTION_RULES); + rules.addAll(VOLCANO_ABSTRACT_RULES); + rules.addAll(RELOPTUTIL_ABSTRACT_RULES); + + if (plannerConfig.isUseFallback()) { + rules.addAll(ENUMERABLE_RULES); + } + + // Druid-specific rules. + rules.add(DruidFilterRule.instance()); + rules.add(DruidSelectSortRule.instance()); + rules.add(DruidSelectProjectionRule.instance()); + + if (plannerConfig.getMaxSemiJoinRowsInMemory() > 0) { + rules.add(DruidSemiJoinRule.instance()); + } + + rules.addAll(GroupByRules.rules(plannerConfig)); + + // Allow conversion of Druid queries to Bindable convention. + rules.add(DruidBindableConverterRule.instance()); + + return rules.build(); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rel/DruidConvention.java b/sql/src/main/java/io/druid/sql/calcite/rel/DruidConvention.java new file mode 100644 index 00000000000..f4eaa5f1502 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rel/DruidConvention.java @@ -0,0 +1,84 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rel; + +import org.apache.calcite.plan.Convention; +import org.apache.calcite.plan.RelOptPlanner; +import org.apache.calcite.plan.RelTrait; +import org.apache.calcite.plan.RelTraitDef; +import org.apache.calcite.plan.RelTraitSet; + +public class DruidConvention implements Convention +{ + private static final DruidConvention INSTANCE = new DruidConvention(); + + private DruidConvention() + { + } + + public static DruidConvention instance() + { + return INSTANCE; + } + + @Override + public Class getInterface() + { + return null; + } + + @Override + public String getName() + { + return null; + } + + @Override + public boolean canConvertConvention(Convention toConvention) + { + return false; + } + + @Override + public boolean useAbstractConvertersForConversion( + RelTraitSet fromTraits, RelTraitSet toTraits + ) + { + return false; + } + + @Override + public RelTraitDef getTraitDef() + { + return null; + } + + @Override + public boolean satisfies(RelTrait trait) + { + return false; + } + + @Override + public void register(RelOptPlanner planner) + { + + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rel/DruidQueryBuilder.java b/sql/src/main/java/io/druid/sql/calcite/rel/DruidQueryBuilder.java new file mode 100644 index 00000000000..5916463f350 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rel/DruidQueryBuilder.java @@ -0,0 +1,388 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rel; + +import com.google.common.base.Function; +import com.google.common.base.Preconditions; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Iterables; +import com.google.common.collect.Lists; +import io.druid.granularity.QueryGranularities; +import io.druid.granularity.QueryGranularity; +import io.druid.java.util.common.ISE; +import io.druid.query.dimension.DimensionSpec; +import io.druid.query.filter.DimFilter; +import io.druid.query.groupby.orderby.DefaultLimitSpec; +import io.druid.query.groupby.orderby.OrderByColumnSpec; +import io.druid.query.topn.DimensionTopNMetricSpec; +import io.druid.query.topn.InvertedTopNMetricSpec; +import io.druid.query.topn.NumericTopNMetricSpec; +import io.druid.query.topn.TopNMetricSpec; +import io.druid.segment.column.Column; +import io.druid.sql.calcite.expression.ExtractionFns; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.table.DruidTable; +import org.apache.calcite.interpreter.Row; +import org.apache.calcite.plan.RelTrait; +import org.apache.calcite.rel.RelCollations; +import org.apache.calcite.rel.RelFieldCollation; +import org.apache.calcite.rel.type.RelDataType; +import org.apache.calcite.rel.type.RelDataTypeFactory; +import org.apache.calcite.rel.type.RelDataTypeField; + +import java.util.List; + +public class DruidQueryBuilder +{ + private final DimFilter filter; + private final SelectProjection selectProjection; + private final Grouping grouping; + private final DimFilter having; + private final DefaultLimitSpec limitSpec; + private final RelDataType rowType; + private final List rowOrder; + + private DruidQueryBuilder( + final DimFilter filter, + final SelectProjection selectProjection, + final Grouping grouping, + final DimFilter having, + final DefaultLimitSpec limitSpec, + final RelDataType rowType, + final List rowOrder + ) + { + this.filter = filter; + this.selectProjection = selectProjection; + this.grouping = grouping; + this.having = having; + this.limitSpec = limitSpec; + this.rowType = Preconditions.checkNotNull(rowType, "rowType"); + this.rowOrder = Preconditions.checkNotNull(ImmutableList.copyOf(rowOrder), "rowOrder"); + + if (selectProjection != null && grouping != null) { + throw new ISE("Cannot have both selectProjection and grouping"); + } + } + + public static DruidQueryBuilder fullScan(final DruidTable druidTable, final RelDataTypeFactory relDataTypeFactory) + { + final RelDataType rowType = druidTable.getRowType(relDataTypeFactory); + final List rowOrder = Lists.newArrayListWithCapacity(rowType.getFieldCount()); + for (RelDataTypeField field : rowType.getFieldList()) { + rowOrder.add(field.getName()); + } + return new DruidQueryBuilder(null, null, null, null, null, rowType, rowOrder); + } + + public DruidQueryBuilder withFilter(final DimFilter newFilter) + { + Preconditions.checkNotNull(newFilter, "newFilter"); + return new DruidQueryBuilder(newFilter, selectProjection, grouping, having, limitSpec, rowType, rowOrder); + } + + public DruidQueryBuilder withSelectProjection(final SelectProjection newProjection, final List newRowOrder) + { + Preconditions.checkState(selectProjection == null, "cannot project twice"); + Preconditions.checkState(grouping == null, "cannot project after grouping"); + Preconditions.checkNotNull(newProjection, "newProjection"); + Preconditions.checkState( + newProjection.getProject().getChildExps().size() == newRowOrder.size(), + "project size[%,d] != rowOrder size[%,d]", + newProjection.getProject().getChildExps().size(), + newRowOrder.size() + ); + return new DruidQueryBuilder( + filter, + newProjection, + grouping, + having, + limitSpec, + newProjection.getProject().getRowType(), + newRowOrder + ); + } + + public DruidQueryBuilder withGrouping( + final Grouping newGrouping, + final RelDataType newRowType, + final List newRowOrder + ) + { + Preconditions.checkState(grouping == null, "cannot add grouping twice"); + Preconditions.checkState(having == null, "cannot add grouping after having"); + Preconditions.checkState(limitSpec == null, "cannot add grouping after limitSpec"); + Preconditions.checkNotNull(newGrouping, "newGrouping"); + // Set selectProjection to null now that we're grouping. Grouping subsumes select projection. + return new DruidQueryBuilder(filter, null, newGrouping, having, limitSpec, newRowType, newRowOrder); + } + + public DruidQueryBuilder withAdjustedGrouping( + final Grouping newGrouping, + final RelDataType newRowType, + final List newRowOrder + ) + { + // Like withGrouping, but without any sanity checks. It's assumed that callers will pass something that makes sense. + // This is used when adjusting the Grouping while pushing down a post-Aggregate Project or Sort. + Preconditions.checkNotNull(newGrouping, "newGrouping"); + return new DruidQueryBuilder(filter, null, newGrouping, having, limitSpec, newRowType, newRowOrder); + } + + public DruidQueryBuilder withHaving(final DimFilter newHaving) + { + Preconditions.checkState(having == null, "cannot add having twice"); + Preconditions.checkState(limitSpec == null, "cannot add having after limitSpec"); + Preconditions.checkState(grouping != null, "cannot add having before grouping"); + Preconditions.checkNotNull(newHaving, "newHaving"); + return new DruidQueryBuilder(filter, selectProjection, grouping, newHaving, limitSpec, rowType, rowOrder); + } + + public DruidQueryBuilder withLimitSpec(final DefaultLimitSpec newLimitSpec) + { + Preconditions.checkState(limitSpec == null, "cannot add limitSpec twice"); + Preconditions.checkNotNull(newLimitSpec, "newLimitSpec"); + return new DruidQueryBuilder(filter, selectProjection, grouping, having, newLimitSpec, rowType, rowOrder); + } + + public DimFilter getFilter() + { + return filter; + } + + public SelectProjection getSelectProjection() + { + return selectProjection; + } + + public Grouping getGrouping() + { + return grouping; + } + + public DimFilter getHaving() + { + return having; + } + + public DefaultLimitSpec getLimitSpec() + { + return limitSpec; + } + + public RelDataType getRowType() + { + return rowType; + } + + public List getRowOrder() + { + return rowOrder; + } + + public RelTrait[] getRelTraits() + { + final List collations = Lists.newArrayList(); + if (limitSpec != null) { + for (OrderByColumnSpec orderBy : limitSpec.getColumns()) { + final int i = rowOrder.indexOf(orderBy.getDimension()); + final RelFieldCollation.Direction direction = orderBy.getDirection() == OrderByColumnSpec.Direction.ASCENDING + ? RelFieldCollation.Direction.ASCENDING + : RelFieldCollation.Direction.DESCENDING; + collations.add(new RelFieldCollation(i, direction)); + } + } + + if (!collations.isEmpty()) { + return new RelTrait[]{RelCollations.of(collations)}; + } else { + return new RelTrait[]{}; + } + } + + public void accumulate( + final DruidTable druidTable, + final Function sink + ) + { + final PlannerConfig config = druidTable.getPlannerConfig(); + + if (grouping == null) { + QueryMaker.executeSelect(druidTable, this, sink); + } else if (asQueryGranularityIfTimeseries() != null) { + QueryMaker.executeTimeseries(druidTable, this, sink); + } else if (asTopNMetricSpecIfTopN(config.getMaxTopNLimit(), config.isUseApproximateTopN()) != null) { + QueryMaker.executeTopN(druidTable, this, sink); + } else { + QueryMaker.executeGroupBy(druidTable, this, sink); + } + } + + /** + * Determine if this query can be run as a Timeseries query, and if so, return the query granularity. + * + * @return query granularity, or null + */ + public QueryGranularity asQueryGranularityIfTimeseries() + { + if (grouping == null) { + return null; + } + + final List dimensions = grouping.getDimensions(); + + if (dimensions.isEmpty()) { + return QueryGranularities.ALL; + } else if (dimensions.size() == 1) { + final DimensionSpec dimensionSpec = Iterables.getOnlyElement(dimensions); + final QueryGranularity gran = ExtractionFns.toQueryGranularity(dimensionSpec.getExtractionFn()); + + if (gran == null || !dimensionSpec.getDimension().equals(Column.TIME_COLUMN_NAME)) { + // Timeseries only applies if the single dimension is granular __time. + return null; + } + + if (having != null) { + // Timeseries does not offer HAVING. + return null; + } + + // Timeseries only applies if sort is null, or if sort is on the time dimension. + final boolean sortingOnTime = + limitSpec == null || limitSpec.getColumns().isEmpty() + || (limitSpec.getLimit() == Integer.MAX_VALUE + && limitSpec.getColumns().size() == 1 + && limitSpec.getColumns().get(0).getDimension().equals(dimensionSpec.getOutputName()) + && limitSpec.getColumns().get(0).getDirection() == OrderByColumnSpec.Direction.ASCENDING); + + if (sortingOnTime) { + return ExtractionFns.toQueryGranularity(dimensionSpec.getExtractionFn()); + } + } + + return null; + } + + /** + * Determine if this query can be run as a topN query, and if so, returns the metric spec for ordering. + * + * @param maxTopNLimit maximum limit to consider for conversion to a topN + * @param useApproximateTopN true if we should allow approximate topNs, false otherwise + * + * @return metric spec, or null + */ + public TopNMetricSpec asTopNMetricSpecIfTopN( + final int maxTopNLimit, + final boolean useApproximateTopN + ) + { + // Must have GROUP BY one column, ORDER BY one column, limit less than maxTopNLimit, and no HAVING. + if (grouping == null + || grouping.getDimensions().size() != 1 + || limitSpec == null + || limitSpec.getColumns().size() != 1 + || limitSpec.getLimit() > maxTopNLimit + || having != null) { + return null; + } + + final DimensionSpec dimensionSpec = Iterables.getOnlyElement(grouping.getDimensions()); + final OrderByColumnSpec limitColumn = Iterables.getOnlyElement(limitSpec.getColumns()); + + if (limitColumn.getDimension().equals(dimensionSpec.getOutputName())) { + // DimensionTopNMetricSpec is exact; always return it even if allowApproximate is false. + final DimensionTopNMetricSpec baseMetricSpec = new DimensionTopNMetricSpec( + null, + limitColumn.getDimensionComparator() + ); + return limitColumn.getDirection() == OrderByColumnSpec.Direction.ASCENDING + ? baseMetricSpec + : new InvertedTopNMetricSpec(baseMetricSpec); + } else if (useApproximateTopN) { + // ORDER BY metric + final NumericTopNMetricSpec baseMetricSpec = new NumericTopNMetricSpec(limitColumn.getDimension()); + return limitColumn.getDirection() == OrderByColumnSpec.Direction.ASCENDING + ? new InvertedTopNMetricSpec(baseMetricSpec) + : baseMetricSpec; + } else { + return null; + } + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + DruidQueryBuilder that = (DruidQueryBuilder) o; + + if (filter != null ? !filter.equals(that.filter) : that.filter != null) { + return false; + } + if (selectProjection != null ? !selectProjection.equals(that.selectProjection) : that.selectProjection != null) { + return false; + } + if (grouping != null ? !grouping.equals(that.grouping) : that.grouping != null) { + return false; + } + if (having != null ? !having.equals(that.having) : that.having != null) { + return false; + } + if (limitSpec != null ? !limitSpec.equals(that.limitSpec) : that.limitSpec != null) { + return false; + } + if (rowType != null ? !rowType.equals(that.rowType) : that.rowType != null) { + return false; + } + return rowOrder != null ? rowOrder.equals(that.rowOrder) : that.rowOrder == null; + + } + + @Override + public int hashCode() + { + int result = filter != null ? filter.hashCode() : 0; + result = 31 * result + (selectProjection != null ? selectProjection.hashCode() : 0); + result = 31 * result + (grouping != null ? grouping.hashCode() : 0); + result = 31 * result + (having != null ? having.hashCode() : 0); + result = 31 * result + (limitSpec != null ? limitSpec.hashCode() : 0); + result = 31 * result + (rowType != null ? rowType.hashCode() : 0); + result = 31 * result + (rowOrder != null ? rowOrder.hashCode() : 0); + return result; + } + + @Override + public String toString() + { + return "DruidQueryBuilder{" + + "filter=" + filter + + ", selectProjection=" + selectProjection + + ", grouping=" + grouping + + ", having=" + having + + ", limitSpec=" + limitSpec + + ", rowOrder=" + rowOrder + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rel/DruidQueryRel.java b/sql/src/main/java/io/druid/sql/calcite/rel/DruidQueryRel.java new file mode 100644 index 00000000000..4007712e4cc --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rel/DruidQueryRel.java @@ -0,0 +1,168 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rel; + +import com.google.common.base.Function; +import com.google.common.base.Preconditions; +import com.google.common.collect.ImmutableList; +import io.druid.sql.calcite.filtration.Filtration; +import io.druid.sql.calcite.table.DruidTable; +import org.apache.calcite.interpreter.BindableConvention; +import org.apache.calcite.interpreter.Row; +import org.apache.calcite.plan.RelOptCluster; +import org.apache.calcite.plan.RelOptCost; +import org.apache.calcite.plan.RelOptPlanner; +import org.apache.calcite.plan.RelOptTable; +import org.apache.calcite.plan.RelTraitSet; +import org.apache.calcite.rel.RelWriter; +import org.apache.calcite.rel.metadata.RelMetadataQuery; +import org.apache.calcite.rel.type.RelDataType; + +public class DruidQueryRel extends DruidRel +{ + private final RelOptTable table; + private final DruidTable druidTable; + private final DruidQueryBuilder queryBuilder; + + private DruidQueryRel( + final RelOptCluster cluster, + final RelTraitSet traitSet, + final RelOptTable table, + final DruidTable druidTable, + final DruidQueryBuilder queryBuilder + ) + { + super(cluster, traitSet); + this.table = Preconditions.checkNotNull(table, "table"); + this.druidTable = Preconditions.checkNotNull(druidTable, "druidTable"); + this.queryBuilder = Preconditions.checkNotNull(queryBuilder, "queryBuilder"); + } + + /** + * Create a DruidQueryRel representing a full scan. + */ + public static DruidQueryRel fullScan( + final RelOptCluster cluster, + final RelTraitSet traitSet, + final RelOptTable table, + final DruidTable druidTable + ) + { + return new DruidQueryRel( + cluster, + traitSet, + table, + druidTable, + DruidQueryBuilder.fullScan(druidTable, cluster.getTypeFactory()) + ); + } + + public DruidQueryRel asBindable() + { + return new DruidQueryRel( + getCluster(), + getTraitSet().plus(BindableConvention.INSTANCE), + table, + druidTable, + queryBuilder + ); + } + + public DruidTable getDruidTable() + { + return druidTable; + } + + public DruidQueryBuilder getQueryBuilder() + { + return queryBuilder; + } + + public DruidQueryRel withQueryBuilder(final DruidQueryBuilder newQueryBuilder) + { + return new DruidQueryRel( + getCluster(), + getTraitSet().plusAll(newQueryBuilder.getRelTraits()), + table, + druidTable, + newQueryBuilder + ); + } + + @Override + public void accumulate(final Function sink) + { + queryBuilder.accumulate(druidTable, sink); + } + + @Override + public RelOptTable getTable() + { + return table; + } + + @Override + public Class getElementType() + { + return Object[].class; + } + + @Override + protected RelDataType deriveRowType() + { + return queryBuilder.getRowType(); + } + + @Override + public RelWriter explainTerms(final RelWriter pw) + { + pw.item("dataSource", druidTable.getDataSource()); + if (queryBuilder != null) { + final Filtration filtration = Filtration.create(queryBuilder.getFilter()).optimize(druidTable); + if (!filtration.getIntervals().equals(ImmutableList.of(Filtration.eternity()))) { + pw.item("intervals", filtration.getIntervals()); + } + if (filtration.getDimFilter() != null) { + pw.item("filter", filtration.getDimFilter()); + } + if (queryBuilder.getSelectProjection() != null) { + pw.item("selectDimensions", queryBuilder.getSelectProjection().getDimensions()); + pw.item("selectMetrics", queryBuilder.getSelectProjection().getMetrics()); + } + if (queryBuilder.getGrouping() != null) { + pw.item("dimensions", queryBuilder.getGrouping().getDimensions()); + pw.item("aggregations", queryBuilder.getGrouping().getAggregations()); + } + if (queryBuilder.getHaving() != null) { + pw.item("having", queryBuilder.getHaving()); + } + if (queryBuilder.getLimitSpec() != null) { + pw.item("limitSpec", queryBuilder.getLimitSpec()); + } + } + return pw; + } + + @Override + public RelOptCost computeSelfCost(final RelOptPlanner planner, final RelMetadataQuery mq) + { + return super.computeSelfCost(planner, mq).multiplyBy(0.1); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rel/DruidRel.java b/sql/src/main/java/io/druid/sql/calcite/rel/DruidRel.java new file mode 100644 index 00000000000..a72847d65e9 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rel/DruidRel.java @@ -0,0 +1,70 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rel; + +import com.google.common.base.Function; +import io.druid.sql.calcite.table.DruidTable; +import org.apache.calcite.DataContext; +import org.apache.calcite.interpreter.BindableRel; +import org.apache.calcite.interpreter.Node; +import org.apache.calcite.interpreter.Row; +import org.apache.calcite.interpreter.Sink; +import org.apache.calcite.linq4j.Enumerable; +import org.apache.calcite.plan.RelOptCluster; +import org.apache.calcite.plan.RelTraitSet; +import org.apache.calcite.rel.AbstractRelNode; + +public abstract class DruidRel extends AbstractRelNode implements BindableRel +{ + public DruidRel(RelOptCluster cluster, RelTraitSet traitSet) + { + super(cluster, traitSet); + } + + public abstract DruidTable getDruidTable(); + + public abstract DruidQueryBuilder getQueryBuilder(); + + public abstract void accumulate(Function sink); + + public abstract T withQueryBuilder(DruidQueryBuilder newQueryBuilder); + + public abstract T asBindable(); + + @Override + public Node implement(InterpreterImplementor implementor) + { + final Sink sink = implementor.interpreter.sink(this); + return new Node() + { + @Override + public void run() throws InterruptedException + { + accumulate(QueryMaker.sinkFunction(sink)); + } + }; + } + + @Override + public Enumerable bind(final DataContext dataContext) + { + throw new UnsupportedOperationException(); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rel/DruidSemiJoin.java b/sql/src/main/java/io/druid/sql/calcite/rel/DruidSemiJoin.java new file mode 100644 index 00000000000..9aafcf6a963 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rel/DruidSemiJoin.java @@ -0,0 +1,317 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rel; + +import com.google.common.base.Function; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Lists; +import com.google.common.collect.Sets; +import io.druid.java.util.common.ISE; +import io.druid.java.util.common.Pair; +import io.druid.query.ResourceLimitExceededException; +import io.druid.query.dimension.DimensionSpec; +import io.druid.query.filter.AndDimFilter; +import io.druid.query.filter.BoundDimFilter; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.OrDimFilter; +import io.druid.sql.calcite.aggregation.Aggregation; +import io.druid.sql.calcite.expression.RowExtraction; +import io.druid.sql.calcite.table.DruidTable; +import io.druid.sql.calcite.table.DruidTables; +import org.apache.calcite.DataContext; +import org.apache.calcite.interpreter.BindableConvention; +import org.apache.calcite.interpreter.Row; +import org.apache.calcite.linq4j.Enumerable; +import org.apache.calcite.plan.RelOptCluster; +import org.apache.calcite.plan.RelOptCost; +import org.apache.calcite.plan.RelOptPlanner; +import org.apache.calcite.plan.RelTraitSet; +import org.apache.calcite.rel.RelWriter; +import org.apache.calcite.rel.core.SemiJoin; +import org.apache.calcite.rel.metadata.RelMetadataQuery; +import org.apache.calcite.rel.type.RelDataType; +import org.apache.calcite.rex.RexNode; + +import java.util.List; +import java.util.Set; + +public class DruidSemiJoin extends DruidRel +{ + private final SemiJoin semiJoin; + private final DruidRel left; + private final DruidRel right; + private final RexNode condition; + private final List leftRowExtractions; + private final List rightKeys; + private final int maxSemiJoinRowsInMemory; + + private DruidSemiJoin( + final RelOptCluster cluster, + final RelTraitSet traitSet, + final SemiJoin semiJoin, + final DruidRel left, + final DruidRel right, + final RexNode condition, + final List leftRowExtractions, + final List rightKeys, + final int maxSemiJoinRowsInMemory + ) + { + super(cluster, traitSet); + this.semiJoin = semiJoin; + this.left = left; + this.right = right; + this.condition = condition; + this.leftRowExtractions = ImmutableList.copyOf(leftRowExtractions); + this.rightKeys = ImmutableList.copyOf(rightKeys); + this.maxSemiJoinRowsInMemory = maxSemiJoinRowsInMemory; + } + + public static DruidSemiJoin from( + final SemiJoin semiJoin, + final RelTraitSet traitSet, + final DruidRel left, + final DruidRel right + ) + { + if (semiJoin.getLeftKeys().size() != semiJoin.getRightKeys().size()) { + throw new ISE("WTF?! SemiJoin with different left/right key count?"); + } + + final ImmutableList.Builder listBuilder = ImmutableList.builder(); + for (Integer key : semiJoin.getLeftKeys()) { + final RowExtraction rex = RowExtraction.fromQueryBuilder(left.getQueryBuilder(), key); + if (rex == null) { + // Can't figure out what to filter the left-hand side on... + return null; + } + listBuilder.add(rex); + } + + return new DruidSemiJoin( + semiJoin.getCluster(), + traitSet, + semiJoin, + left, + right, + semiJoin.getCondition(), + listBuilder.build(), + semiJoin.getRightKeys(), + right.getDruidTable().getPlannerConfig().getMaxSemiJoinRowsInMemory() + ); + } + + @Override + public Class getElementType() + { + return Object[].class; + } + + @Override + public DruidTable getDruidTable() + { + return left.getDruidTable(); + } + + @Override + public DruidQueryBuilder getQueryBuilder() + { + return left.getQueryBuilder(); + } + + @Override + public DruidSemiJoin withQueryBuilder(final DruidQueryBuilder newQueryBuilder) + { + return new DruidSemiJoin( + getCluster(), + getTraitSet().plusAll(newQueryBuilder.getRelTraits()), + semiJoin, + left.withQueryBuilder(newQueryBuilder), + right, + condition, + leftRowExtractions, + rightKeys, + maxSemiJoinRowsInMemory + ); + } + + @Override + public DruidSemiJoin asBindable() + { + return new DruidSemiJoin( + getCluster(), + getTraitSet().plus(BindableConvention.INSTANCE), + semiJoin, + left, + right, + condition, + leftRowExtractions, + rightKeys, + maxSemiJoinRowsInMemory + ); + } + + @Override + public void accumulate(final Function sink) + { + final Pair> pair = getRightQueryBuilderWithGrouping(); + final DruidQueryBuilder rightQueryBuilderAdjusted = pair.lhs; + final List rightKeysAdjusted = pair.rhs; + + // Build list of acceptable values from right side. + final Set> valuess = Sets.newHashSet(); + final List filters = Lists.newArrayList(); + rightQueryBuilderAdjusted.accumulate( + right.getDruidTable(), + new Function() + { + @Override + public Void apply(final Row row) + { + final List values = Lists.newArrayListWithCapacity(rightKeysAdjusted.size()); + + for (int i : rightKeysAdjusted) { + final Object value = row.getObject(i); + final String stringValue = value != null ? String.valueOf(value) : ""; + values.add(stringValue); + if (values.size() > maxSemiJoinRowsInMemory) { + throw new ResourceLimitExceededException( + String.format("maxSemiJoinRowsInMemory[%,d] exceeded", maxSemiJoinRowsInMemory) + ); + } + } + + if (valuess.add(values)) { + final List bounds = Lists.newArrayList(); + for (int i = 0; i < values.size(); i++) { + bounds.add( + new BoundDimFilter( + leftRowExtractions.get(i).getColumn(), + values.get(i), + values.get(i), + false, + false, + null, + leftRowExtractions.get(i).getExtractionFn(), + DruidTables.naturalStringComparator(getDruidTable(), leftRowExtractions.get(i)) + ) + ); + } + filters.add(new AndDimFilter(bounds)); + } + return null; + } + } + ); + + valuess.clear(); + + if (!filters.isEmpty()) { + // Add a filter to the left side. Use OR of singleton Bound filters so they can be simplified later. + final DimFilter semiJoinFilter = new OrDimFilter(filters); + final DimFilter newFilter = left.getQueryBuilder().getFilter() == null + ? semiJoinFilter + : new AndDimFilter( + ImmutableList.of( + semiJoinFilter, + left.getQueryBuilder().getFilter() + ) + ); + + left.getQueryBuilder().withFilter(newFilter).accumulate( + left.getDruidTable(), + sink + ); + } + } + + @Override + public Enumerable bind(final DataContext dataContext) + { + throw new UnsupportedOperationException(); + } + + @Override + protected RelDataType deriveRowType() + { + return left.getRowType(); + } + + @Override + public RelWriter explainTerms(RelWriter pw) + { + final Pair> rightQueryBuilderWithGrouping = getRightQueryBuilderWithGrouping(); + return pw + .item("leftDataSource", left.getDruidTable().getDataSource()) + .item("leftRowExtractions", leftRowExtractions) + .item("leftQuery", left.getQueryBuilder()) + .item("rightDataSource", right.getDruidTable().getDataSource()) + .item("rightKeysAdjusted", rightQueryBuilderWithGrouping.rhs) + .item("rightQuery", rightQueryBuilderWithGrouping.lhs); + } + + @Override + public RelOptCost computeSelfCost(final RelOptPlanner planner, final RelMetadataQuery mq) + { + return semiJoin.computeSelfCost(planner, mq).multiplyBy(0.1); + } + + private Pair> getRightQueryBuilderWithGrouping() + { + if (right.getQueryBuilder().getGrouping() != null) { + return Pair.of(right.getQueryBuilder(), rightKeys); + } else { + // Add grouping on the join key to limit resultset from data nodes. + final List dimensionSpecs = Lists.newArrayList(); + final List rowTypes = Lists.newArrayList(); + final List rowOrder = Lists.newArrayList(); + final List rightKeysAdjusted = Lists.newArrayList(); + + int counter = 0; + for (final int key : rightKeys) { + final String keyDimensionOutputName = "v" + key; + final RowExtraction rex = RowExtraction.fromQueryBuilder(right.getQueryBuilder(), key); + if (rex == null) { + throw new ISE("WTF?! Can't find dimensionSpec to group on!"); + } + + final DimensionSpec dimensionSpec = rex.toDimensionSpec(left.getDruidTable(), keyDimensionOutputName); + if (dimensionSpec == null) { + throw new ISE("WTF?! Can't translate row expression to dimensionSpec: %s", rex); + } + + dimensionSpecs.add(dimensionSpec); + rowTypes.add(right.getQueryBuilder().getRowType().getFieldList().get(key).getType()); + rowOrder.add(dimensionSpec.getOutputName()); + rightKeysAdjusted.add(counter++); + } + + final DruidQueryBuilder newQueryBuilder = right + .getQueryBuilder() + .withGrouping( + Grouping.create(dimensionSpecs, ImmutableList.of()), + getCluster().getTypeFactory().createStructType(rowTypes, rowOrder), + rowOrder + ); + + return Pair.of(newQueryBuilder, rightKeysAdjusted); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rel/Grouping.java b/sql/src/main/java/io/druid/sql/calcite/rel/Grouping.java new file mode 100644 index 00000000000..ae6152b0877 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rel/Grouping.java @@ -0,0 +1,139 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rel; + +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Lists; +import com.google.common.collect.Sets; +import io.druid.java.util.common.ISE; +import io.druid.query.aggregation.AggregatorFactory; +import io.druid.query.aggregation.PostAggregator; +import io.druid.query.dimension.DimensionSpec; +import io.druid.sql.calcite.aggregation.Aggregation; + +import java.util.List; +import java.util.Set; + +public class Grouping +{ + private final List dimensions; + private final List aggregations; + + private Grouping( + final List dimensions, + final List aggregations + ) + { + this.dimensions = ImmutableList.copyOf(dimensions); + this.aggregations = ImmutableList.copyOf(aggregations); + + // Verify no collisions. + final Set seen = Sets.newHashSet(); + for (DimensionSpec dimensionSpec : dimensions) { + if (!seen.add(dimensionSpec.getOutputName())) { + throw new ISE("Duplicate field name: %s", dimensionSpec.getOutputName()); + } + } + for (Aggregation aggregation : aggregations) { + for (AggregatorFactory aggregatorFactory : aggregation.getAggregatorFactories()) { + if (!seen.add(aggregatorFactory.getName())) { + throw new ISE("Duplicate field name: %s", aggregatorFactory.getName()); + } + } + if (aggregation.getPostAggregator() != null && !seen.add(aggregation.getPostAggregator().getName())) { + throw new ISE("Duplicate field name in rowOrder: %s", aggregation.getPostAggregator().getName()); + } + } + } + + public static Grouping create( + final List dimensions, + final List aggregations + ) + { + return new Grouping(dimensions, aggregations); + } + + public List getDimensions() + { + return dimensions; + } + + public List getAggregations() + { + return aggregations; + } + + public List getAggregatorFactories() + { + final List retVal = Lists.newArrayList(); + for (final Aggregation aggregation : aggregations) { + retVal.addAll(aggregation.getAggregatorFactories()); + } + return retVal; + } + + public List getPostAggregators() + { + final List retVal = Lists.newArrayList(); + for (final Aggregation aggregation : aggregations) { + if (aggregation.getPostAggregator() != null) { + retVal.add(aggregation.getPostAggregator()); + } + } + return retVal; + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + Grouping grouping = (Grouping) o; + + if (dimensions != null ? !dimensions.equals(grouping.dimensions) : grouping.dimensions != null) { + return false; + } + return aggregations != null ? aggregations.equals(grouping.aggregations) : grouping.aggregations == null; + + } + + @Override + public int hashCode() + { + int result = dimensions != null ? dimensions.hashCode() : 0; + result = 31 * result + (aggregations != null ? aggregations.hashCode() : 0); + return result; + } + + @Override + public String toString() + { + return "Grouping{" + + "dimensions=" + dimensions + + ", aggregations=" + aggregations + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rel/QueryMaker.java b/sql/src/main/java/io/druid/sql/calcite/rel/QueryMaker.java new file mode 100644 index 00000000000..20820ae2c35 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rel/QueryMaker.java @@ -0,0 +1,435 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rel; + +import com.google.common.base.Function; +import com.google.common.base.Preconditions; +import com.google.common.base.Strings; +import com.google.common.base.Throwables; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Iterables; +import com.google.common.collect.Maps; +import com.google.common.primitives.Doubles; +import com.google.common.primitives.Ints; +import io.druid.common.guava.GuavaUtils; +import io.druid.granularity.QueryGranularities; +import io.druid.granularity.QueryGranularity; +import io.druid.java.util.common.ISE; +import io.druid.java.util.common.guava.Accumulator; +import io.druid.java.util.common.logger.Logger; +import io.druid.query.Result; +import io.druid.query.dimension.DimensionSpec; +import io.druid.query.groupby.GroupByQuery; +import io.druid.query.groupby.having.DimFilterHavingSpec; +import io.druid.query.groupby.orderby.OrderByColumnSpec; +import io.druid.query.select.EventHolder; +import io.druid.query.select.PagingSpec; +import io.druid.query.select.SelectQuery; +import io.druid.query.select.SelectResultValue; +import io.druid.query.timeseries.TimeseriesQuery; +import io.druid.query.timeseries.TimeseriesResultValue; +import io.druid.query.topn.DimensionAndMetricValueExtractor; +import io.druid.query.topn.TopNMetricSpec; +import io.druid.query.topn.TopNQuery; +import io.druid.query.topn.TopNResultValue; +import io.druid.segment.column.Column; +import io.druid.sql.calcite.filtration.Filtration; +import io.druid.sql.calcite.table.DruidTable; +import org.apache.calcite.interpreter.Row; +import org.apache.calcite.interpreter.Sink; +import org.apache.calcite.rel.type.RelDataTypeField; +import org.apache.calcite.runtime.Hook; +import org.apache.calcite.sql.type.SqlTypeName; +import org.apache.calcite.util.NlsString; +import org.joda.time.DateTime; + +import java.util.Calendar; +import java.util.List; +import java.util.Map; +import java.util.concurrent.atomic.AtomicBoolean; +import java.util.concurrent.atomic.AtomicLong; +import java.util.concurrent.atomic.AtomicReference; + +public class QueryMaker +{ + private final static Logger log = new Logger(QueryMaker.class); + + private QueryMaker() + { + // No instantiation. + } + + public static Function sinkFunction(final Sink sink) + { + return new Function() + { + @Override + public Void apply(final Row row) + { + try { + sink.send(row); + return null; + } + catch (InterruptedException e) { + throw Throwables.propagate(e); + } + } + }; + } + + public static void executeSelect( + final DruidTable druidTable, + final DruidQueryBuilder queryBuilder, + final Function sink + ) + { + Preconditions.checkState(queryBuilder.getGrouping() == null, "grouping must be null"); + + final List fieldList = queryBuilder.getRowType().getFieldList(); + final Row.RowBuilder rowBuilder = Row.newBuilder(fieldList.size()); + final Filtration filtration = Filtration.create(queryBuilder.getFilter()).optimize(druidTable); + final SelectProjection selectProjection = queryBuilder.getSelectProjection(); + final Integer limit; + final boolean descending; + + if (queryBuilder.getLimitSpec() != null) { + limit = queryBuilder.getLimitSpec().getLimit(); + + // Safe to assume limitSpec has zero or one entry; DruidSelectSortRule wouldn't push in anything else. + if (queryBuilder.getLimitSpec().getColumns().size() > 0) { + final OrderByColumnSpec orderBy = Iterables.getOnlyElement(queryBuilder.getLimitSpec().getColumns()); + if (!orderBy.getDimension().equals(Column.TIME_COLUMN_NAME)) { + throw new ISE("WTF?! Got select with non-time orderBy[%s]", orderBy); + } + descending = orderBy.getDirection() == OrderByColumnSpec.Direction.DESCENDING; + } else { + descending = false; + } + } else { + limit = null; + descending = false; + } + + // Loop through pages. + final AtomicBoolean morePages = new AtomicBoolean(true); + final AtomicReference> pagingIdentifiers = new AtomicReference<>(); + final AtomicLong rowsRead = new AtomicLong(); + + while (morePages.get()) { + final SelectQuery query = new SelectQuery( + druidTable.getDataSource(), + filtration.getQuerySegmentSpec(), + descending, + filtration.getDimFilter(), + QueryGranularities.ALL, + selectProjection != null ? selectProjection.getDimensions() : ImmutableList.of(), + selectProjection != null ? selectProjection.getMetrics() : ImmutableList.of(), + null, + new PagingSpec(pagingIdentifiers.get(), druidTable.getPlannerConfig().getSelectThreshold(), true), + null + ); + + Hook.QUERY_PLAN.run(query); + + morePages.set(false); + final AtomicBoolean gotResult = new AtomicBoolean(); + + query.run(druidTable.getQuerySegmentWalker(), Maps.newHashMap()).accumulate( + null, + new Accumulator>() + { + @Override + public Object accumulate(final Object accumulated, final Result result) + { + if (!gotResult.compareAndSet(false, true)) { + throw new ISE("WTF?! Expected single result from Select query but got multiple!"); + } + + pagingIdentifiers.set(result.getValue().getPagingIdentifiers()); + + for (EventHolder holder : result.getValue().getEvents()) { + morePages.set(true); + final Map map = holder.getEvent(); + for (RelDataTypeField field : fieldList) { + final String outputName = queryBuilder.getRowOrder().get(field.getIndex()); + if (outputName.equals(Column.TIME_COLUMN_NAME)) { + rowBuilder.set( + field.getIndex(), + coerce(holder.getTimestamp().getMillis(), field.getType().getSqlTypeName()) + ); + } else { + rowBuilder.set( + field.getIndex(), + coerce(map.get(outputName), field.getType().getSqlTypeName()) + ); + } + } + if (limit == null || rowsRead.incrementAndGet() <= limit) { + sink.apply(rowBuilder.build()); + } else { + morePages.set(false); + break; + } + rowBuilder.reset(); + } + + return null; + } + } + ); + } + } + + public static void executeTimeseries( + final DruidTable druidTable, + final DruidQueryBuilder queryBuilder, + final Function sink + ) + { + final QueryGranularity queryGranularity = queryBuilder.asQueryGranularityIfTimeseries(); + + if (queryGranularity == null) { + throw new ISE("WTF?! executeTimeseries called on query that cannot become a timeseries?!"); + } + + final String timeOutputName = queryBuilder.getGrouping().getDimensions().size() == 1 + ? queryBuilder.getGrouping().getDimensions().get(0).getOutputName() + : null; + + final List fieldList = queryBuilder.getRowType().getFieldList(); + final Row.RowBuilder rowBuilder = Row.newBuilder(fieldList.size()); + final Filtration filtration = Filtration.create(queryBuilder.getFilter()).optimize(druidTable); + + final Map context = Maps.newHashMap(); + context.put("skipEmptyBuckets", true); + + final TimeseriesQuery query = new TimeseriesQuery( + druidTable.getDataSource(), + filtration.getQuerySegmentSpec(), + false, + filtration.getDimFilter(), + queryGranularity, + queryBuilder.getGrouping().getAggregatorFactories(), + queryBuilder.getGrouping().getPostAggregators(), + context + ); + + Hook.QUERY_PLAN.run(query); + + query.run(druidTable.getQuerySegmentWalker(), Maps.newHashMap()).accumulate( + null, + new Accumulator>() + { + @Override + public Object accumulate(final Object accumulated, final Result result) + { + final Map row = result.getValue().getBaseObject(); + + for (final RelDataTypeField field : fieldList) { + final String outputName = queryBuilder.getRowOrder().get(field.getIndex()); + if (outputName.equals(timeOutputName)) { + rowBuilder.set(field.getIndex(), coerce(result.getTimestamp(), field.getType().getSqlTypeName())); + } else { + rowBuilder.set(field.getIndex(), coerce(row.get(outputName), field.getType().getSqlTypeName())); + } + } + + sink.apply(rowBuilder.build()); + rowBuilder.reset(); + + return null; + } + } + ); + } + + public static void executeTopN( + final DruidTable druidTable, + final DruidQueryBuilder queryBuilder, + final Function sink + ) + { + // OK to hard-code permissive values here; this method is only called if we really do want a topN. + final TopNMetricSpec topNMetricSpec = queryBuilder.asTopNMetricSpecIfTopN(Integer.MAX_VALUE, true); + + if (topNMetricSpec == null) { + throw new ISE("WTF?! executeTopN called on query that cannot become a topN?!"); + } + + final List fieldList = queryBuilder.getRowType().getFieldList(); + final Row.RowBuilder rowBuilder = Row.newBuilder(fieldList.size()); + final Filtration filtration = Filtration.create(queryBuilder.getFilter()).optimize(druidTable); + + final TopNQuery query = new TopNQuery( + druidTable.getDataSource(), + Iterables.getOnlyElement(queryBuilder.getGrouping().getDimensions()), + topNMetricSpec, + queryBuilder.getLimitSpec().getLimit(), + filtration.getQuerySegmentSpec(), + filtration.getDimFilter(), + QueryGranularities.ALL, + queryBuilder.getGrouping().getAggregatorFactories(), + queryBuilder.getGrouping().getPostAggregators(), + null + ); + + Hook.QUERY_PLAN.run(query); + + query.run(druidTable.getQuerySegmentWalker(), Maps.newHashMap()).accumulate( + null, + new Accumulator>() + { + @Override + public Object accumulate(final Object accumulated, final Result result) + { + final List values = result.getValue().getValue(); + + for (DimensionAndMetricValueExtractor value : values) { + for (final RelDataTypeField field : fieldList) { + final String outputName = queryBuilder.getRowOrder().get(field.getIndex()); + rowBuilder.set(field.getIndex(), coerce(value.getMetric(outputName), field.getType().getSqlTypeName())); + } + + sink.apply(rowBuilder.build()); + rowBuilder.reset(); + } + + return null; + } + } + ); + } + + public static void executeGroupBy( + final DruidTable druidTable, + final DruidQueryBuilder queryBuilder, + final Function sink + ) + { + Preconditions.checkState(queryBuilder.getGrouping() != null, "grouping must be non-null"); + + final List fieldList = queryBuilder.getRowType().getFieldList(); + final Row.RowBuilder rowBuilder = Row.newBuilder(fieldList.size()); + final Filtration filtration = Filtration.create(queryBuilder.getFilter()).optimize(druidTable); + + final GroupByQuery query = new GroupByQuery( + druidTable.getDataSource(), + filtration.getQuerySegmentSpec(), + filtration.getDimFilter(), + QueryGranularities.ALL, + queryBuilder.getGrouping().getDimensions(), + queryBuilder.getGrouping().getAggregatorFactories(), + queryBuilder.getGrouping().getPostAggregators(), + queryBuilder.getHaving() != null ? new DimFilterHavingSpec(queryBuilder.getHaving()) : null, + queryBuilder.getLimitSpec(), + null + ); + + Hook.QUERY_PLAN.run(query); + + query.run(druidTable.getQuerySegmentWalker(), Maps.newHashMap()).accumulate( + null, + new Accumulator() + { + @Override + public Object accumulate(final Object accumulated, final io.druid.data.input.Row row) + { + for (RelDataTypeField field : fieldList) { + rowBuilder.set( + field.getIndex(), + coerce( + row.getRaw(queryBuilder.getRowOrder().get(field.getIndex())), + field.getType().getSqlTypeName() + ) + ); + } + sink.apply(rowBuilder.build()); + rowBuilder.reset(); + + return null; + } + } + ); + } + + private static Object coerce(final Object value, final SqlTypeName sqlType) + { + final Object coercedValue; + + if (SqlTypeName.CHAR_TYPES.contains(sqlType)) { + if (value == null || value instanceof String) { + coercedValue = Strings.nullToEmpty((String) value); + } else if (value instanceof NlsString) { + coercedValue = ((NlsString) value).getValue(); + } else { + throw new ISE("Cannot coerce[%s] to %s", value.getClass().getName(), sqlType); + } + } else if (value == null) { + coercedValue = null; + } else if (sqlType == SqlTypeName.DATE) { + final Long millis = (Long) coerce(value, SqlTypeName.TIMESTAMP); + if (millis == null) { + return null; + } else { + return new DateTime(millis.longValue()).dayOfMonth().roundFloorCopy().getMillis(); + } + } else if (sqlType == SqlTypeName.TIMESTAMP) { + if (value instanceof Number) { + coercedValue = new DateTime(((Number) value).longValue()).getMillis(); + } else if (value instanceof String) { + coercedValue = Long.parseLong((String) value); + } else if (value instanceof Calendar) { + coercedValue = ((Calendar) value).getTimeInMillis(); + } else if (value instanceof DateTime) { + coercedValue = ((DateTime) value).getMillis(); + } else { + throw new ISE("Cannot coerce[%s] to %s", value.getClass().getName(), sqlType); + } + } else if (sqlType == SqlTypeName.INTEGER) { + if (value instanceof String) { + coercedValue = Ints.tryParse((String) value); + } else if (value instanceof Number) { + coercedValue = ((Number) value).intValue(); + } else { + throw new ISE("Cannot coerce[%s] to %s", value.getClass().getName(), sqlType); + } + } else if (sqlType == SqlTypeName.BIGINT) { + if (value instanceof String) { + coercedValue = GuavaUtils.tryParseLong((String) value); + } else if (value instanceof Number) { + coercedValue = ((Number) value).longValue(); + } else { + throw new ISE("Cannot coerce[%s] to %s", value.getClass().getName(), sqlType); + } + } else if (sqlType == SqlTypeName.FLOAT || sqlType == SqlTypeName.DOUBLE) { + if (value instanceof String) { + coercedValue = Doubles.tryParse((String) value); + } else if (value instanceof Number) { + coercedValue = ((Number) value).doubleValue(); + } else { + throw new ISE("Cannot coerce[%s] to %s", value.getClass().getName(), sqlType); + } + } else { + throw new ISE("Cannot coerce[%s] to %s", value.getClass().getName(), sqlType); + } + + return coercedValue; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rel/SelectProjection.java b/sql/src/main/java/io/druid/sql/calcite/rel/SelectProjection.java new file mode 100644 index 00000000000..04889760983 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rel/SelectProjection.java @@ -0,0 +1,116 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rel; + +import com.google.common.collect.Sets; +import io.druid.java.util.common.ISE; +import io.druid.query.dimension.DimensionSpec; +import io.druid.segment.column.Column; +import org.apache.calcite.rel.core.Project; + +import java.util.List; +import java.util.Set; + +public class SelectProjection +{ + private final Project project; + private final List dimensions; + private final List metrics; + + public SelectProjection( + final Project project, + final List dimensions, + final List metrics + ) + { + this.project = project; + this.dimensions = dimensions; + this.metrics = metrics; + + // Verify no collisions. Start with TIME_COLUMN_NAME because QueryMaker.executeSelect hard-codes it. + final Set seen = Sets.newHashSet(Column.TIME_COLUMN_NAME); + for (DimensionSpec dimensionSpec : dimensions) { + if (!seen.add(dimensionSpec.getOutputName())) { + throw new ISE("Duplicate field name: %s", dimensionSpec.getOutputName()); + } + } + for (String fieldName : metrics) { + if (!seen.add(fieldName)) { + throw new ISE("Duplicate field name: %s", fieldName); + } + } + } + + public Project getProject() + { + return project; + } + + public List getDimensions() + { + return dimensions; + } + + public List getMetrics() + { + return metrics; + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + SelectProjection that = (SelectProjection) o; + + if (project != null ? !project.equals(that.project) : that.project != null) { + return false; + } + if (dimensions != null ? !dimensions.equals(that.dimensions) : that.dimensions != null) { + return false; + } + return metrics != null ? metrics.equals(that.metrics) : that.metrics == null; + + } + + @Override + public int hashCode() + { + int result = project != null ? project.hashCode() : 0; + result = 31 * result + (dimensions != null ? dimensions.hashCode() : 0); + result = 31 * result + (metrics != null ? metrics.hashCode() : 0); + return result; + } + + @Override + public String toString() + { + return "SelectProjection{" + + "project=" + project + + ", dimensions=" + dimensions + + ", metrics=" + metrics + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rule/DruidBindableConverterRule.java b/sql/src/main/java/io/druid/sql/calcite/rule/DruidBindableConverterRule.java new file mode 100644 index 00000000000..d9e4a89232b --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rule/DruidBindableConverterRule.java @@ -0,0 +1,53 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rule; + +import io.druid.sql.calcite.rel.DruidRel; +import org.apache.calcite.interpreter.BindableConvention; +import org.apache.calcite.plan.Convention; +import org.apache.calcite.rel.RelNode; +import org.apache.calcite.rel.convert.ConverterRule; + +public class DruidBindableConverterRule extends ConverterRule +{ + private static DruidBindableConverterRule INSTANCE = new DruidBindableConverterRule(); + + private DruidBindableConverterRule() + { + super( + DruidRel.class, + Convention.NONE, + BindableConvention.INSTANCE, + DruidBindableConverterRule.class.getSimpleName() + ); + } + + public static DruidBindableConverterRule instance() + { + return INSTANCE; + } + + @Override + public RelNode convert(RelNode rel) + { + final DruidRel druidRel = (DruidRel) rel; + return druidRel.asBindable(); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rule/DruidFilterRule.java b/sql/src/main/java/io/druid/sql/calcite/rule/DruidFilterRule.java new file mode 100644 index 00000000000..f40592ff342 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rule/DruidFilterRule.java @@ -0,0 +1,66 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rule; + +import io.druid.query.filter.DimFilter; +import io.druid.sql.calcite.expression.Expressions; +import io.druid.sql.calcite.rel.DruidRel; +import org.apache.calcite.plan.RelOptRule; +import org.apache.calcite.plan.RelOptRuleCall; +import org.apache.calcite.rel.core.Filter; + +public class DruidFilterRule extends RelOptRule +{ + private static final DruidFilterRule INSTANCE = new DruidFilterRule(); + + private DruidFilterRule() + { + super(operand(Filter.class, operand(DruidRel.class, none()))); + } + + public static DruidFilterRule instance() + { + return INSTANCE; + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Filter filter = call.rel(0); + final DruidRel druidRel = call.rel(1); + + if (druidRel.getQueryBuilder().getFilter() != null + || druidRel.getQueryBuilder().getSelectProjection() != null + || druidRel.getQueryBuilder().getGrouping() != null) { + return; + } + + final DimFilter dimFilter = Expressions.toFilter( + druidRel.getDruidTable(), + druidRel.getQueryBuilder().getRowOrder(), + filter.getCondition() + ); + if (dimFilter != null) { + call.transformTo( + druidRel.withQueryBuilder(druidRel.getQueryBuilder().withFilter(dimFilter)) + ); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rule/DruidSelectProjectionRule.java b/sql/src/main/java/io/druid/sql/calcite/rule/DruidSelectProjectionRule.java new file mode 100644 index 00000000000..13995f3a9f7 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rule/DruidSelectProjectionRule.java @@ -0,0 +1,125 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rule; + +import com.google.common.collect.Lists; +import io.druid.query.dimension.DefaultDimensionSpec; +import io.druid.query.dimension.DimensionSpec; +import io.druid.query.dimension.ExtractionDimensionSpec; +import io.druid.query.extraction.ExtractionFn; +import io.druid.segment.column.Column; +import io.druid.segment.column.ValueType; +import io.druid.sql.calcite.expression.Expressions; +import io.druid.sql.calcite.expression.RowExtraction; +import io.druid.sql.calcite.rel.DruidRel; +import io.druid.sql.calcite.rel.SelectProjection; +import io.druid.sql.calcite.table.DruidTables; +import org.apache.calcite.plan.RelOptRule; +import org.apache.calcite.plan.RelOptRuleCall; +import org.apache.calcite.rel.core.Project; + +import java.util.List; + +public class DruidSelectProjectionRule extends RelOptRule +{ + private static final DruidSelectProjectionRule INSTANCE = new DruidSelectProjectionRule(); + + private DruidSelectProjectionRule() + { + super(operand(Project.class, operand(DruidRel.class, none()))); + } + + public static DruidSelectProjectionRule instance() + { + return INSTANCE; + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Project project = call.rel(0); + final DruidRel druidRel = call.rel(1); + + if (druidRel.getQueryBuilder().getSelectProjection() != null + || druidRel.getQueryBuilder().getGrouping() != null + || druidRel.getQueryBuilder().getLimitSpec() != null) { + return; + } + + // Only push in projections that can be used by the Select query. + // Leave anything more complicated to DruidAggregateProjectRule for possible handling in a GroupBy query. + + final List dimensions = Lists.newArrayList(); + final List metrics = Lists.newArrayList(); + final List rowOrder = Lists.newArrayList(); + + int dimOutputNameCounter = 0; + for (int i = 0; i < project.getRowType().getFieldCount(); i++) { + final RowExtraction rex = Expressions.toRowExtraction( + DruidTables.rowOrder(druidRel.getDruidTable()), + project.getChildExps().get(i) + ); + + if (rex == null) { + return; + } + + final String column = rex.getColumn(); + final ExtractionFn extractionFn = rex.getExtractionFn(); + + // Check if this field should be a dimension, a metric, or a reference to __time. + final ValueType columnType = druidRel.getDruidTable() + .getColumnType(druidRel.getDruidTable().getColumnNumber(column)); + + if (columnType == ValueType.STRING || (column.equals(Column.TIME_COLUMN_NAME) && extractionFn != null)) { + // Add to dimensions. + do { + dimOutputNameCounter++; + } while (druidRel.getDruidTable().getColumnNumber(GroupByRules.dimOutputName(dimOutputNameCounter)) >= 0); + final String outputName = GroupByRules.dimOutputName(dimOutputNameCounter); + final DimensionSpec dimensionSpec = extractionFn == null + ? new DefaultDimensionSpec(column, outputName) + : new ExtractionDimensionSpec(column, outputName, extractionFn); + dimensions.add(dimensionSpec); + rowOrder.add(outputName); + } else if (extractionFn == null && !column.equals(Column.TIME_COLUMN_NAME)) { + // Add to metrics. + metrics.add(column); + rowOrder.add(column); + } else if (extractionFn == null && column.equals(Column.TIME_COLUMN_NAME)) { + // This is __time. + rowOrder.add(Column.TIME_COLUMN_NAME); + } else { + // Don't know what to do! + return; + } + } + + call.transformTo( + druidRel.withQueryBuilder( + druidRel.getQueryBuilder() + .withSelectProjection( + new SelectProjection(project, dimensions, metrics), + rowOrder + ) + ) + ); + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rule/DruidSelectSortRule.java b/sql/src/main/java/io/druid/sql/calcite/rule/DruidSelectSortRule.java new file mode 100644 index 00000000000..85534e0682e --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rule/DruidSelectSortRule.java @@ -0,0 +1,74 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rule; + +import io.druid.query.groupby.orderby.DefaultLimitSpec; +import io.druid.query.groupby.orderby.OrderByColumnSpec; +import io.druid.segment.column.Column; +import io.druid.sql.calcite.rel.DruidRel; +import org.apache.calcite.plan.RelOptRule; +import org.apache.calcite.plan.RelOptRuleCall; +import org.apache.calcite.rel.core.Sort; + +import java.util.List; + +public class DruidSelectSortRule extends RelOptRule +{ + private static final DruidSelectSortRule INSTANCE = new DruidSelectSortRule(); + + private DruidSelectSortRule() + { + super(operand(Sort.class, operand(DruidRel.class, none()))); + } + + public static DruidSelectSortRule instance() + { + return INSTANCE; + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Sort sort = call.rel(0); + final DruidRel druidRel = call.rel(1); + + if (druidRel.getQueryBuilder().getGrouping() != null + || druidRel.getQueryBuilder().getLimitSpec() != null) { + return; + } + + final DefaultLimitSpec limitSpec = GroupByRules.toLimitSpec(druidRel.getQueryBuilder().getRowOrder(), sort); + if (limitSpec == null) { + return; + } + + // Only push in sorts that can be used by the Select query. + final List orderBys = limitSpec.getColumns(); + if (orderBys.isEmpty() || + (orderBys.size() == 1 && orderBys.get(0).getDimension().equals(Column.TIME_COLUMN_NAME))) { + call.transformTo( + druidRel.withQueryBuilder( + druidRel.getQueryBuilder() + .withLimitSpec(limitSpec) + ) + ); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rule/DruidSemiJoinRule.java b/sql/src/main/java/io/druid/sql/calcite/rule/DruidSemiJoinRule.java new file mode 100644 index 00000000000..6c6533c12b7 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rule/DruidSemiJoinRule.java @@ -0,0 +1,59 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rule; + +import io.druid.sql.calcite.rel.DruidRel; +import io.druid.sql.calcite.rel.DruidSemiJoin; +import org.apache.calcite.plan.RelOptRule; +import org.apache.calcite.plan.RelOptRuleCall; +import org.apache.calcite.rel.core.SemiJoin; + +public class DruidSemiJoinRule extends RelOptRule +{ + private static final DruidSemiJoinRule INSTANCE = new DruidSemiJoinRule(); + + private DruidSemiJoinRule() + { + super( + operand( + SemiJoin.class, + operand(DruidRel.class, none()), + operand(DruidRel.class, none()) + ) + ); + } + + public static DruidSemiJoinRule instance() + { + return INSTANCE; + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final SemiJoin semiJoin = call.rel(0); + final DruidRel left = call.rel(1); + final DruidRel right = call.rel(2); + final DruidSemiJoin druidSemiJoin = DruidSemiJoin.from(semiJoin, semiJoin.getTraitSet(), left, right); + if (druidSemiJoin != null) { + call.transformTo(druidSemiJoin); + } + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/rule/GroupByRules.java b/sql/src/main/java/io/druid/sql/calcite/rule/GroupByRules.java new file mode 100644 index 00000000000..ec79cfbbc50 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/rule/GroupByRules.java @@ -0,0 +1,787 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.rule; + +import com.google.common.base.Preconditions; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.Iterables; +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import io.druid.java.util.common.ISE; +import io.druid.query.aggregation.AggregatorFactory; +import io.druid.query.aggregation.CountAggregatorFactory; +import io.druid.query.aggregation.DoubleMaxAggregatorFactory; +import io.druid.query.aggregation.DoubleMinAggregatorFactory; +import io.druid.query.aggregation.DoubleSumAggregatorFactory; +import io.druid.query.aggregation.LongMaxAggregatorFactory; +import io.druid.query.aggregation.LongMinAggregatorFactory; +import io.druid.query.aggregation.LongSumAggregatorFactory; +import io.druid.query.aggregation.PostAggregator; +import io.druid.query.aggregation.cardinality.CardinalityAggregatorFactory; +import io.druid.query.aggregation.hyperloglog.HyperUniqueFinalizingPostAggregator; +import io.druid.query.aggregation.post.ArithmeticPostAggregator; +import io.druid.query.aggregation.post.FieldAccessPostAggregator; +import io.druid.query.dimension.DefaultDimensionSpec; +import io.druid.query.dimension.DimensionSpec; +import io.druid.query.dimension.ExtractionDimensionSpec; +import io.druid.query.filter.AndDimFilter; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.NotDimFilter; +import io.druid.query.groupby.orderby.DefaultLimitSpec; +import io.druid.query.groupby.orderby.OrderByColumnSpec; +import io.druid.query.ordering.StringComparator; +import io.druid.query.ordering.StringComparators; +import io.druid.segment.column.Column; +import io.druid.segment.column.ValueType; +import io.druid.sql.calcite.aggregation.Aggregation; +import io.druid.sql.calcite.aggregation.PostAggregatorFactory; +import io.druid.sql.calcite.expression.Expressions; +import io.druid.sql.calcite.expression.RowExtraction; +import io.druid.sql.calcite.filtration.Filtration; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.rel.DruidRel; +import io.druid.sql.calcite.rel.Grouping; +import io.druid.sql.calcite.table.DruidTable; +import io.druid.sql.calcite.table.DruidTables; +import org.apache.calcite.plan.RelOptRule; +import org.apache.calcite.plan.RelOptRuleCall; +import org.apache.calcite.rel.RelFieldCollation; +import org.apache.calcite.rel.core.Aggregate; +import org.apache.calcite.rel.core.AggregateCall; +import org.apache.calcite.rel.core.Filter; +import org.apache.calcite.rel.core.Project; +import org.apache.calcite.rel.core.Sort; +import org.apache.calcite.rex.RexCall; +import org.apache.calcite.rex.RexInputRef; +import org.apache.calcite.rex.RexLiteral; +import org.apache.calcite.rex.RexNode; +import org.apache.calcite.sql.SqlKind; +import org.apache.calcite.sql.type.SqlTypeName; +import org.apache.calcite.util.ImmutableBitSet; + +import java.util.List; +import java.util.Map; + +public class GroupByRules +{ + private GroupByRules() + { + // No instantiation. + } + + public static List rules(final PlannerConfig plannerConfig) + { + return ImmutableList.of( + new DruidAggregateRule(plannerConfig.isUseApproximateCountDistinct()), + new DruidAggregateProjectRule(plannerConfig.isUseApproximateCountDistinct()), + new DruidProjectAfterAggregationRule(), + new DruidFilterAfterAggregationRule(), + new DruidGroupBySortRule() + ); + } + + /** + * Used to represent inputs to aggregators. Ideally this should be folded into {@link RowExtraction}, but we + * can't do that until RowExtractions are a bit more versatile. + */ + private static class FieldOrExpression + { + private final String fieldName; + private final String expression; + + public FieldOrExpression(String fieldName, String expression) + { + this.fieldName = fieldName; + this.expression = expression; + Preconditions.checkArgument(fieldName == null ^ expression == null, "must have either fieldName or expression"); + } + + public static FieldOrExpression fromRexNode(final List rowOrder, final RexNode rexNode) + { + final RowExtraction rex = Expressions.toRowExtraction(rowOrder, rexNode); + if (rex != null && rex.getExtractionFn() == null) { + // This was a simple field access. + return fieldName(rex.getColumn()); + } + + // Try as a math expression. + final String mathExpression = Expressions.toMathExpression(rowOrder, rexNode); + if (mathExpression != null) { + return expression(mathExpression); + } + + return null; + } + + public static FieldOrExpression fieldName(final String fieldName) + { + return new FieldOrExpression(fieldName, null); + } + + public static FieldOrExpression expression(final String expression) + { + return new FieldOrExpression(null, expression); + } + + public String getFieldName() + { + return fieldName; + } + + public String getExpression() + { + return expression; + } + } + + public static class DruidAggregateRule extends RelOptRule + { + final boolean approximateCountDistinct; + + private DruidAggregateRule(final boolean approximateCountDistinct) + { + super(operand(Aggregate.class, operand(DruidRel.class, none()))); + this.approximateCountDistinct = approximateCountDistinct; + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Aggregate aggregate = call.rel(0); + final DruidRel druidRel = call.rel(1); + final DruidRel newDruidRel = GroupByRules.applyAggregate( + druidRel, + null, + aggregate, + approximateCountDistinct + ); + if (newDruidRel != null) { + call.transformTo(newDruidRel); + } + } + } + + public static class DruidAggregateProjectRule extends RelOptRule + { + final boolean approximateCountDistinct; + + private DruidAggregateProjectRule(final boolean approximateCountDistinct) + { + super(operand(Aggregate.class, operand(Project.class, operand(DruidRel.class, none())))); + this.approximateCountDistinct = approximateCountDistinct; + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Aggregate aggregate = call.rel(0); + final Project project = call.rel(1); + final DruidRel druidRel = call.rel(2); + final DruidRel newDruidRel = GroupByRules.applyAggregate( + druidRel, + project, + aggregate, + approximateCountDistinct + ); + if (newDruidRel != null) { + call.transformTo(newDruidRel); + } + } + } + + public static class DruidProjectAfterAggregationRule extends RelOptRule + { + private DruidProjectAfterAggregationRule() + { + super(operand(Project.class, operand(DruidRel.class, none()))); + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Project postProject = call.rel(0); + final DruidRel druidRel = call.rel(1); + final DruidRel newDruidRel = GroupByRules.applyProjectAfterAggregate(druidRel, postProject); + if (newDruidRel != null) { + call.transformTo(newDruidRel); + } + } + } + + public static class DruidFilterAfterAggregationRule extends RelOptRule + { + private DruidFilterAfterAggregationRule() + { + super(operand(Filter.class, operand(DruidRel.class, none()))); + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Filter postFilter = call.rel(0); + final DruidRel druidRel = call.rel(1); + final DruidRel newDruidRel = GroupByRules.applyFilterAfterAggregate(druidRel, postFilter); + if (newDruidRel != null) { + call.transformTo(newDruidRel); + } + } + } + + public static class DruidGroupBySortRule extends RelOptRule + { + private DruidGroupBySortRule() + { + super(operand(Sort.class, operand(DruidRel.class, none()))); + } + + @Override + public void onMatch(RelOptRuleCall call) + { + final Sort sort = call.rel(0); + final DruidRel druidRel = call.rel(1); + final DruidRel newDruidRel = GroupByRules.applySort(druidRel, sort); + if (newDruidRel != null) { + call.transformTo(newDruidRel); + } + } + } + + private static DruidRel applyAggregate( + final DruidRel druidRel, + final Project project0, + final Aggregate aggregate, + final boolean approximateCountDistinct + ) + { + if ((project0 != null && druidRel.getQueryBuilder().getSelectProjection() != null /* can't project twice */) + || druidRel.getQueryBuilder().getGrouping() != null + || aggregate.indicator + || aggregate.getGroupSets().size() != 1) { + return null; + } + + final Project project; + if (project0 != null) { + project = project0; + } else if (druidRel.getQueryBuilder().getSelectProjection() != null) { + project = druidRel.getQueryBuilder().getSelectProjection().getProject(); + } else { + project = null; + } + + final List dimensions = Lists.newArrayList(); + final List aggregations = Lists.newArrayList(); + final List rowOrder = Lists.newArrayList(); + + // Translate groupSet. + final ImmutableBitSet groupSet = aggregate.getGroupSet(); + + int dimOutputNameCounter = 0; + for (int i : groupSet) { + if (project != null && project.getChildExps().get(i) instanceof RexLiteral) { + // Ignore literals in GROUP BY, so a user can write e.g. "GROUP BY 'dummy'" to group everything into a single + // row. Add dummy rowOrder entry so NULLs come out. This is not strictly correct but it works as long as + // nobody actually expects to see the literal. + rowOrder.add(dimOutputName(dimOutputNameCounter++)); + } else { + final DimensionSpec dimensionSpec = toDimensionSpec( + druidRel.getDruidTable(), + Expressions.toRowExtraction( + DruidTables.rowOrder(druidRel.getDruidTable()), + Expressions.fromFieldAccess(druidRel.getDruidTable(), project, i) + ), + dimOutputName(dimOutputNameCounter++) + ); + if (dimensionSpec == null) { + return null; + } + dimensions.add(dimensionSpec); + rowOrder.add(dimensionSpec.getOutputName()); + } + } + + // Translate aggregates. + for (int i = 0; i < aggregate.getAggCallList().size(); i++) { + final AggregateCall aggCall = aggregate.getAggCallList().get(i); + final Aggregation aggregation = translateAggregateCall( + druidRel, + project, + aggCall, + i, + approximateCountDistinct + ); + + if (aggregation == null) { + return null; + } + + aggregations.add(aggregation); + rowOrder.add(aggregation.getOutputName()); + } + + return druidRel.withQueryBuilder( + druidRel.getQueryBuilder() + .withGrouping( + Grouping.create(dimensions, aggregations), + aggregate.getRowType(), + rowOrder + ) + ); + } + + private static DruidRel applyProjectAfterAggregate( + final DruidRel druidRel, + final Project postProject + ) + { + if (druidRel.getQueryBuilder().getGrouping() == null || druidRel.getQueryBuilder().getLimitSpec() != null) { + return null; + } + + final List rowOrder = druidRel.getQueryBuilder().getRowOrder(); + final Grouping grouping = druidRel.getQueryBuilder().getGrouping(); + final List newAggregations = Lists.newArrayList(grouping.getAggregations()); + final List finalizingPostAggregatorFactories = Lists.newArrayList(); + final List newRowOrder = Lists.newArrayList(); + + // Build list of finalizingPostAggregatorFactories. + final Map aggregationMap = Maps.newHashMap(); + for (final Aggregation aggregation : grouping.getAggregations()) { + aggregationMap.put(aggregation.getOutputName(), aggregation); + } + for (final String field : rowOrder) { + final Aggregation aggregation = aggregationMap.get(field); + finalizingPostAggregatorFactories.add( + aggregation == null + ? null + : aggregation.getFinalizingPostAggregatorFactory() + ); + } + + // Walk through the postProject expressions. + for (final RexNode projectExpression : postProject.getChildExps()) { + if (projectExpression.isA(SqlKind.INPUT_REF)) { + final RexInputRef ref = (RexInputRef) projectExpression; + final String fieldName = rowOrder.get(ref.getIndex()); + newRowOrder.add(fieldName); + finalizingPostAggregatorFactories.add(null); + } else { + // Attempt to convert to PostAggregator. + final String postAggregatorName = aggOutputName(newAggregations.size()); + final PostAggregator postAggregator = Expressions.toPostAggregator( + postAggregatorName, + rowOrder, + finalizingPostAggregatorFactories, + projectExpression + ); + if (postAggregator != null) { + newAggregations.add(Aggregation.create(postAggregator)); + newRowOrder.add(postAggregator.getName()); + finalizingPostAggregatorFactories.add(null); + } else { + return null; + } + } + } + + return druidRel.withQueryBuilder( + druidRel.getQueryBuilder() + .withAdjustedGrouping( + Grouping.create(grouping.getDimensions(), newAggregations), + postProject.getRowType(), + newRowOrder + ) + ); + } + + private static DruidRel applyFilterAfterAggregate( + final DruidRel druidRel, + final Filter postFilter + ) + { + if (druidRel.getQueryBuilder().getGrouping() == null + || druidRel.getQueryBuilder().getHaving() != null + || druidRel.getQueryBuilder().getLimitSpec() != null) { + return null; + } + + final DimFilter dimFilter = Expressions.toFilter( + null, // null table; this filter is being applied as a HAVING on result rows + druidRel.getQueryBuilder().getRowOrder(), + postFilter.getCondition() + ); + + if (dimFilter != null) { + return druidRel.withQueryBuilder( + druidRel.getQueryBuilder() + .withHaving(dimFilter) + ); + } else { + return null; + } + } + + private static DruidRel applySort( + final DruidRel druidRel, + final Sort sort + ) + { + if (druidRel.getQueryBuilder().getGrouping() == null || druidRel.getQueryBuilder().getLimitSpec() != null) { + // Can only sort when grouping and not already sorting. + return null; + } + + final Grouping grouping = druidRel.getQueryBuilder().getGrouping(); + final DefaultLimitSpec limitSpec = toLimitSpec(druidRel.getQueryBuilder().getRowOrder(), sort); + if (limitSpec == null) { + return null; + } + + final List orderBys = limitSpec.getColumns(); + final List newDimensions = Lists.newArrayList(grouping.getDimensions()); + + // Reorder dimensions, maybe, to allow groupBy to consider pushing down sorting (see DefaultLimitSpec). + if (!orderBys.isEmpty()) { + final Map dimensionOrderByOutputName = Maps.newHashMap(); + for (int i = 0; i < newDimensions.size(); i++) { + dimensionOrderByOutputName.put(newDimensions.get(i).getOutputName(), i); + } + for (int i = 0; i < orderBys.size(); i++) { + final OrderByColumnSpec orderBy = orderBys.get(i); + final Integer dimensionOrder = dimensionOrderByOutputName.get(orderBy.getDimension()); + if (dimensionOrder != null + && dimensionOrder != i + && orderBy.getDirection() == OrderByColumnSpec.Direction.ASCENDING + && orderBy.getDimensionComparator().equals(StringComparators.LEXICOGRAPHIC)) { + final DimensionSpec tmp = newDimensions.get(i); + newDimensions.set(i, newDimensions.get(dimensionOrder)); + newDimensions.set(dimensionOrder, tmp); + dimensionOrderByOutputName.put(newDimensions.get(i).getOutputName(), i); + dimensionOrderByOutputName.put(newDimensions.get(dimensionOrder).getOutputName(), dimensionOrder); + } + } + } + + if (!orderBys.isEmpty() || limitSpec.getLimit() < Integer.MAX_VALUE) { + return druidRel.withQueryBuilder( + druidRel.getQueryBuilder() + .withAdjustedGrouping( + Grouping.create(newDimensions, grouping.getAggregations()), + druidRel.getQueryBuilder().getRowType(), + druidRel.getQueryBuilder().getRowOrder() + ) + .withLimitSpec(limitSpec) + ); + } else { + return druidRel; + } + } + + public static DefaultLimitSpec toLimitSpec( + final List rowOrder, + final Sort sort + ) + { + final Integer limit = sort.fetch != null ? RexLiteral.intValue(sort.fetch) : null; + final List orderBys = Lists.newArrayListWithCapacity(sort.getChildExps().size()); + + if (sort.offset != null) { + // LimitSpecs don't accept offsets. + return null; + } + + // Extract orderBy column specs. + for (int sortKey = 0; sortKey < sort.getChildExps().size(); sortKey++) { + final RexNode sortExpression = sort.getChildExps().get(sortKey); + final RelFieldCollation collation = sort.getCollation().getFieldCollations().get(sortKey); + final OrderByColumnSpec.Direction direction; + final StringComparator comparator; + + if (collation.getDirection() == RelFieldCollation.Direction.ASCENDING) { + direction = OrderByColumnSpec.Direction.ASCENDING; + } else if (collation.getDirection() == RelFieldCollation.Direction.DESCENDING) { + direction = OrderByColumnSpec.Direction.DESCENDING; + } else { + throw new ISE("WTF?! Don't know what to do with direction[%s]", collation.getDirection()); + } + + if (SqlTypeName.NUMERIC_TYPES.contains(sortExpression.getType().getSqlTypeName()) + || SqlTypeName.DATETIME_TYPES.contains(sortExpression.getType().getSqlTypeName())) { + comparator = StringComparators.NUMERIC; + } else { + comparator = StringComparators.LEXICOGRAPHIC; + } + + if (sortExpression.isA(SqlKind.INPUT_REF)) { + final RexInputRef ref = (RexInputRef) sortExpression; + final String fieldName = rowOrder.get(ref.getIndex()); + orderBys.add(new OrderByColumnSpec(fieldName, direction, comparator)); + } else { + // We don't support sorting by anything other than refs which actually appear in the query result. + return null; + } + } + + return new DefaultLimitSpec(orderBys, limit); + } + + private static DimensionSpec toDimensionSpec( + final DruidTable druidTable, + final RowExtraction rex, + final String name + ) + { + if (rex == null) { + return null; + } + + final int columnNumber = druidTable.getColumnNumber(rex.getColumn()); + if (columnNumber < 0) { + return null; + } + + final ValueType columnType = druidTable.getColumnType(columnNumber); + + if (columnType == ValueType.STRING || + (rex.getColumn().equals(Column.TIME_COLUMN_NAME) && rex.getExtractionFn() != null)) { + return rex.getExtractionFn() == null + ? new DefaultDimensionSpec(rex.getColumn(), name) + : new ExtractionDimensionSpec(rex.getColumn(), name, rex.getExtractionFn()); + } else { + // Can't create dimensionSpecs for non-string, non-time. + return null; + } + } + + /** + * Translate an AggregateCall to Druid equivalents. + * + * @return translated aggregation, or null if translation failed. + */ + private static Aggregation translateAggregateCall( + final DruidRel druidRel, + final Project project, + final AggregateCall call, + final int aggNumber, + final boolean approximateCountDistinct + ) + { + final List filters = Lists.newArrayList(); + final List rowOrder = DruidTables.rowOrder(druidRel.getDruidTable()); + final String name = aggOutputName(aggNumber); + final SqlKind kind = call.getAggregation().getKind(); + final SqlTypeName outputType = call.getType().getSqlTypeName(); + final Aggregation retVal; + + if (call.filterArg >= 0) { + // AGG(xxx) FILTER(WHERE yyy) + if (project == null) { + // We need some kind of projection to support filtered aggregations. + return null; + } + + final RexNode expression = project.getChildExps().get(call.filterArg); + final DimFilter filter = Expressions.toFilter(druidRel.getDruidTable(), rowOrder, expression); + if (filter == null) { + return null; + } + + filters.add(filter); + } + + if (call.getAggregation().getKind() == SqlKind.COUNT && call.getArgList().isEmpty()) { + // COUNT(*) + retVal = Aggregation.create(new CountAggregatorFactory(name)); + } else if (call.getAggregation().getKind() == SqlKind.COUNT && call.isDistinct() && approximateCountDistinct) { + // COUNT(DISTINCT x) + final DimensionSpec dimensionSpec = toDimensionSpec( + druidRel.getDruidTable(), + Expressions.toRowExtraction( + rowOrder, + Expressions.fromFieldAccess( + druidRel.getDruidTable(), + project, + Iterables.getOnlyElement(call.getArgList()) + ) + ), + aggInternalName(aggNumber, "dimSpec") + ); + + if (dimensionSpec == null) { + return null; + } + + retVal = Aggregation.createFinalizable( + ImmutableList.of( + new CardinalityAggregatorFactory(name, ImmutableList.of(dimensionSpec), false) + ), + null, + new PostAggregatorFactory() + { + @Override + public PostAggregator factorize(String outputName) + { + return new HyperUniqueFinalizingPostAggregator(outputName, name); + } + } + ); + } else if (!call.isDistinct() && call.getArgList().size() == 1) { + // AGG(xxx), not distinct, not COUNT(*) + boolean forceCount = false; + final FieldOrExpression input; + + final int inputField = Iterables.getOnlyElement(call.getArgList()); + final RexNode rexNode = Expressions.fromFieldAccess(druidRel.getDruidTable(), project, inputField); + final FieldOrExpression foe = FieldOrExpression.fromRexNode(rowOrder, rexNode); + + if (foe != null) { + input = foe; + } else if (rexNode.getKind() == SqlKind.CASE && ((RexCall) rexNode).getOperands().size() == 3) { + // Possibly a CASE-style filtered aggregation. Styles supported: + // A: SUM(CASE WHEN x = 'foo' THEN cnt END) => operands (x = 'foo', cnt, null) + // B: SUM(CASE WHEN x = 'foo' THEN 1 ELSE 0 END) => operands (x = 'foo', 1, 0) + // C: COUNT(CASE WHEN x = 'foo' THEN 'dummy' END) => operands (x = 'foo', 'dummy', null) + // If the null and non-null args are switched, "flip" is set, which negates the filter. + + final RexCall caseCall = (RexCall) rexNode; + final boolean flip = RexLiteral.isNullLiteral(caseCall.getOperands().get(1)) + && !RexLiteral.isNullLiteral(caseCall.getOperands().get(2)); + final RexNode arg1 = caseCall.getOperands().get(flip ? 2 : 1); + final RexNode arg2 = caseCall.getOperands().get(flip ? 1 : 2); + + // Operand 1: Filter + final DimFilter filter = Expressions.toFilter( + druidRel.getDruidTable(), + rowOrder, + caseCall.getOperands().get(0) + ); + if (filter == null) { + return null; + } else { + filters.add(flip ? new NotDimFilter(filter) : filter); + } + + if (call.getAggregation().getKind() == SqlKind.COUNT + && arg1 instanceof RexLiteral + && !RexLiteral.isNullLiteral(arg1) + && RexLiteral.isNullLiteral(arg2)) { + // Case C + forceCount = true; + input = null; + } else if (call.getAggregation().getKind() == SqlKind.SUM + && arg1 instanceof RexLiteral + && ((Number) RexLiteral.value(arg1)).intValue() == 1 + && arg2 instanceof RexLiteral + && ((Number) RexLiteral.value(arg2)).intValue() == 0) { + // Case B + forceCount = true; + input = null; + } else if (RexLiteral.isNullLiteral(arg2)) { + // Maybe case A + input = FieldOrExpression.fromRexNode(rowOrder, arg1); + if (input == null) { + return null; + } + } else { + // Can't translate CASE into a filter. + return null; + } + } else { + // Can't translate aggregator expression. + return null; + } + + if (!forceCount) { + Preconditions.checkNotNull(input, "WTF?! input was null for non-COUNT aggregation"); + } + + if (forceCount || kind == SqlKind.COUNT) { + // COUNT(x) + retVal = Aggregation.create(new CountAggregatorFactory(name)); + } else { + // All aggregators other than COUNT expect a single argument with no extractionFn. + final String fieldName = input.getFieldName(); + final String expression = input.getExpression(); + + final boolean isLong = SqlTypeName.INT_TYPES.contains(outputType) + || SqlTypeName.DATETIME_TYPES.contains(outputType); + + if (kind == SqlKind.SUM || kind == SqlKind.SUM0) { + retVal = isLong + ? Aggregation.create(new LongSumAggregatorFactory(name, fieldName, expression)) + : Aggregation.create(new DoubleSumAggregatorFactory(name, fieldName, expression)); + } else if (kind == SqlKind.MIN) { + retVal = isLong + ? Aggregation.create(new LongMinAggregatorFactory(name, fieldName, expression)) + : Aggregation.create(new DoubleMinAggregatorFactory(name, fieldName, expression)); + } else if (kind == SqlKind.MAX) { + retVal = isLong + ? Aggregation.create(new LongMaxAggregatorFactory(name, fieldName, expression)) + : Aggregation.create(new DoubleMaxAggregatorFactory(name, fieldName, expression)); + } else if (kind == SqlKind.AVG) { + final String sumName = aggInternalName(aggNumber, "sum"); + final String countName = aggInternalName(aggNumber, "count"); + final AggregatorFactory sum = isLong + ? new LongSumAggregatorFactory(sumName, fieldName, expression) + : new DoubleSumAggregatorFactory(sumName, fieldName, expression); + final AggregatorFactory count = new CountAggregatorFactory(countName); + retVal = Aggregation.create( + ImmutableList.of(sum, count), + new ArithmeticPostAggregator( + name, + "quotient", + ImmutableList.of( + new FieldAccessPostAggregator(null, sumName), + new FieldAccessPostAggregator(null, countName) + ) + ) + ); + } else { + retVal = null; + } + } + } else { + retVal = null; + } + + final DimFilter filter = filters.isEmpty() + ? null + : Filtration.create(new AndDimFilter(filters)) + .optimizeFilterOnly(druidRel.getDruidTable()) + .getDimFilter(); + + return retVal != null ? retVal.filter(filter) : null; + } + + public static String dimOutputName(final int dimNumber) + { + return "d" + dimNumber; + } + + private static String aggOutputName(final int aggNumber) + { + return "a" + aggNumber; + } + + private static String aggInternalName(final int aggNumber, final String key) + { + return "A" + aggNumber + ":" + key; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/table/DruidTable.java b/sql/src/main/java/io/druid/sql/calcite/table/DruidTable.java new file mode 100644 index 00000000000..1a92ae49d13 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/table/DruidTable.java @@ -0,0 +1,210 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.table; + +import com.google.common.base.Preconditions; +import com.google.common.collect.ImmutableSortedMap; +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import io.druid.java.util.common.ISE; +import io.druid.query.DataSource; +import io.druid.query.QuerySegmentWalker; +import io.druid.segment.column.Column; +import io.druid.segment.column.ValueType; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.rel.DruidQueryRel; +import org.apache.calcite.plan.RelOptCluster; +import org.apache.calcite.plan.RelOptTable; +import org.apache.calcite.rel.RelNode; +import org.apache.calcite.rel.type.RelDataType; +import org.apache.calcite.rel.type.RelDataTypeFactory; +import org.apache.calcite.schema.Schema; +import org.apache.calcite.schema.Statistic; +import org.apache.calcite.schema.Statistics; +import org.apache.calcite.schema.TranslatableTable; +import org.apache.calcite.sql.type.SqlTypeName; + +import java.util.List; +import java.util.Map; + +public class DruidTable implements TranslatableTable +{ + private final QuerySegmentWalker walker; + private final DataSource dataSource; + private final PlannerConfig config; + private final Map columnNumbers; + private final List columnTypes; + private final List columnNames; + + public DruidTable( + final QuerySegmentWalker walker, + final DataSource dataSource, + final PlannerConfig config, + final Map columns + ) + { + this.walker = Preconditions.checkNotNull(walker, "walker"); + this.dataSource = Preconditions.checkNotNull(dataSource, "dataSource"); + this.config = Preconditions.checkNotNull(config, "config"); + this.columnNumbers = Maps.newLinkedHashMap(); + this.columnTypes = Lists.newArrayList(); + this.columnNames = Lists.newArrayList(); + + int i = 0; + for (Map.Entry entry : ImmutableSortedMap.copyOf(columns).entrySet()) { + columnNumbers.put(entry.getKey(), i++); + columnTypes.add(entry.getValue()); + columnNames.add(entry.getKey()); + } + } + + public QuerySegmentWalker getQuerySegmentWalker() + { + return walker; + } + + public DataSource getDataSource() + { + return dataSource; + } + + public PlannerConfig getPlannerConfig() + { + return config; + } + + public int getColumnCount() + { + return columnNames.size(); + } + + public int getColumnNumber(final String name) + { + final Integer number = columnNumbers.get(name); + return number != null ? number : -1; + } + + public String getColumnName(final int n) + { + return columnNames.get(n); + } + + public ValueType getColumnType(final int n) + { + return columnTypes.get(n); + } + + @Override + public Schema.TableType getJdbcTableType() + { + return Schema.TableType.TABLE; + } + + @Override + public Statistic getStatistic() + { + return Statistics.UNKNOWN; + } + + @Override + public RelDataType getRowType(final RelDataTypeFactory typeFactory) + { + final RelDataTypeFactory.FieldInfoBuilder builder = typeFactory.builder(); + for (Map.Entry entry : columnNumbers.entrySet()) { + final RelDataType sqlTypeName; + + if (entry.getKey().equals(Column.TIME_COLUMN_NAME)) { + sqlTypeName = typeFactory.createSqlType(SqlTypeName.TIMESTAMP); + } else { + final ValueType valueType = columnTypes.get(entry.getValue()); + switch (valueType) { + case STRING: + // Note that there is no attempt here to handle multi-value in any special way. Maybe one day... + sqlTypeName = typeFactory.createSqlType(SqlTypeName.VARCHAR, RelDataType.PRECISION_NOT_SPECIFIED); + break; + case LONG: + sqlTypeName = typeFactory.createSqlType(SqlTypeName.BIGINT); + break; + case FLOAT: + sqlTypeName = typeFactory.createSqlType(SqlTypeName.FLOAT); + break; + default: + throw new ISE("WTF?! valueType[%s] not translatable?", valueType); + } + } + + builder.add(entry.getKey(), sqlTypeName); + } + return builder.build(); + } + + @Override + public RelNode toRel(final RelOptTable.ToRelContext context, final RelOptTable table) + { + final RelOptCluster cluster = context.getCluster(); + return DruidQueryRel.fullScan( + cluster, + cluster.traitSet(), + table, + this + ); + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + DruidTable that = (DruidTable) o; + + if (dataSource != null ? !dataSource.equals(that.dataSource) : that.dataSource != null) { + return false; + } + if (columnNumbers != null ? !columnNumbers.equals(that.columnNumbers) : that.columnNumbers != null) { + return false; + } + return columnTypes != null ? columnTypes.equals(that.columnTypes) : that.columnTypes == null; + + } + + @Override + public int hashCode() + { + int result = dataSource != null ? dataSource.hashCode() : 0; + result = 31 * result + (columnNumbers != null ? columnNumbers.hashCode() : 0); + result = 31 * result + (columnTypes != null ? columnTypes.hashCode() : 0); + return result; + } + + @Override + public String toString() + { + return "DruidTable{" + + "dataSource=" + dataSource + + ", columnNumbers=" + columnNumbers + + ", columnTypes=" + columnTypes + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/calcite/table/DruidTables.java b/sql/src/main/java/io/druid/sql/calcite/table/DruidTables.java new file mode 100644 index 00000000000..58e5268ddc2 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/calcite/table/DruidTables.java @@ -0,0 +1,76 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.table; + +import com.google.common.collect.Lists; +import io.druid.query.ordering.StringComparator; +import io.druid.query.ordering.StringComparators; +import io.druid.segment.column.ValueType; +import io.druid.sql.calcite.expression.RowExtraction; + +import java.util.List; + +public class DruidTables +{ + private DruidTables() + { + // No instantiation. + } + + /** + * Returns the "natural" rowOrder for a Druid table. This is the order that a scan without projection would return. + * + * @param druidTable druid table + * + * @return natural row order + */ + public static List rowOrder( + final DruidTable druidTable + ) + { + final List rowOrder = Lists.newArrayListWithCapacity(druidTable.getColumnCount()); + for (int i = 0; i < druidTable.getColumnCount(); i++) { + rowOrder.add(druidTable.getColumnName(i)); + } + return rowOrder; + } + + /** + * Return the "natural" {@link StringComparator} for an extraction from a Druid table. This will be a lexicographic + * comparator for String types and a numeric comparator for Number types. + * + * @param druidTable underlying Druid table + * @param rowExtraction extraction from the table + * + * @return natural comparator + */ + public static StringComparator naturalStringComparator( + final DruidTable druidTable, + final RowExtraction rowExtraction + ) + { + if (rowExtraction.getExtractionFn() != null + || druidTable.getColumnType(druidTable.getColumnNumber(rowExtraction.getColumn())) == ValueType.STRING) { + return StringComparators.LEXICOGRAPHIC; + } else { + return StringComparators.NUMERIC; + } + } +} diff --git a/sql/src/main/java/io/druid/sql/guice/SqlModule.java b/sql/src/main/java/io/druid/sql/guice/SqlModule.java new file mode 100644 index 00000000000..c5b3906f816 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/guice/SqlModule.java @@ -0,0 +1,88 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.guice; + +import com.google.common.base.Preconditions; +import com.google.inject.Binder; +import com.google.inject.Inject; +import com.google.inject.Module; +import com.google.inject.Provides; +import io.druid.guice.Jerseys; +import io.druid.guice.JsonConfigProvider; +import io.druid.guice.LazySingleton; +import io.druid.guice.LifecycleModule; +import io.druid.server.initialization.jetty.JettyBindings; +import io.druid.server.metrics.MetricsModule; +import io.druid.sql.avatica.AvaticaMonitor; +import io.druid.sql.avatica.DruidAvaticaHandler; +import io.druid.sql.avatica.ServerConfig; +import io.druid.sql.calcite.DruidSchema; +import io.druid.sql.calcite.planner.Calcites; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.http.SqlResource; +import org.apache.calcite.jdbc.CalciteConnection; + +import java.sql.SQLException; +import java.util.Properties; + +public class SqlModule implements Module +{ + private static final String PROPERTY_SQL_ENABLE = "druid.sql.enable"; + + @Inject + private Properties props; + + public SqlModule() + { + } + + @Override + public void configure(Binder binder) + { + if (isEnabled()) { + JsonConfigProvider.bind(binder, "druid.sql.server", ServerConfig.class); + JsonConfigProvider.bind(binder, "druid.sql.planner", PlannerConfig.class); + Jerseys.addResource(binder, SqlResource.class); + binder.bind(AvaticaMonitor.class).in(LazySingleton.class); + JettyBindings.addHandler(binder, DruidAvaticaHandler.class); + MetricsModule.register(binder, AvaticaMonitor.class); + LifecycleModule.register(binder, DruidSchema.class); + } + } + + @Provides + public CalciteConnection createCalciteConnection( + final DruidSchema druidSchema, + final PlannerConfig plannerConfig + ) throws SQLException + { + if (isEnabled()) { + return Calcites.jdbc(druidSchema, plannerConfig); + } else { + throw new IllegalStateException("Cannot provide CalciteConnection when SQL is disabled."); + } + } + + private boolean isEnabled() + { + Preconditions.checkNotNull(props, "props"); + return Boolean.valueOf(props.getProperty(PROPERTY_SQL_ENABLE, "false")); + } +} diff --git a/sql/src/main/java/io/druid/sql/http/SqlQuery.java b/sql/src/main/java/io/druid/sql/http/SqlQuery.java new file mode 100644 index 00000000000..cca0e598ca6 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/http/SqlQuery.java @@ -0,0 +1,72 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.http; + +import com.fasterxml.jackson.annotation.JsonCreator; +import com.fasterxml.jackson.annotation.JsonProperty; +import com.google.common.base.Preconditions; + +public class SqlQuery +{ + private final String query; + + @JsonCreator + public SqlQuery( + @JsonProperty("query") final String query + ) + { + this.query = Preconditions.checkNotNull(query, "query"); + } + + @JsonProperty + public String getQuery() + { + return query; + } + + @Override + public boolean equals(Object o) + { + if (this == o) { + return true; + } + if (o == null || getClass() != o.getClass()) { + return false; + } + + SqlQuery sqlQuery = (SqlQuery) o; + + return query != null ? query.equals(sqlQuery.query) : sqlQuery.query == null; + } + + @Override + public int hashCode() + { + return query != null ? query.hashCode() : 0; + } + + @Override + public String toString() + { + return "SqlQuery{" + + "query='" + query + '\'' + + '}'; + } +} diff --git a/sql/src/main/java/io/druid/sql/http/SqlResource.java b/sql/src/main/java/io/druid/sql/http/SqlResource.java new file mode 100644 index 00000000000..527d2e09686 --- /dev/null +++ b/sql/src/main/java/io/druid/sql/http/SqlResource.java @@ -0,0 +1,152 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.http; + +import com.fasterxml.jackson.core.JsonGenerator; +import com.fasterxml.jackson.databind.ObjectMapper; +import com.google.common.base.Preconditions; +import com.google.common.base.Throwables; +import com.google.inject.Inject; +import io.druid.guice.annotations.Json; +import io.druid.java.util.common.logger.Logger; +import io.druid.query.QueryInterruptedException; +import org.apache.calcite.jdbc.CalciteConnection; +import org.joda.time.DateTime; + +import javax.ws.rs.Consumes; +import javax.ws.rs.POST; +import javax.ws.rs.Path; +import javax.ws.rs.Produces; +import javax.ws.rs.WebApplicationException; +import javax.ws.rs.core.MediaType; +import javax.ws.rs.core.Response; +import javax.ws.rs.core.StreamingOutput; +import java.io.IOException; +import java.io.OutputStream; +import java.sql.Connection; +import java.sql.ResultSet; +import java.sql.ResultSetMetaData; +import java.sql.SQLException; +import java.sql.Types; + +@Path("/druid/v2/sql/") +public class SqlResource +{ + private static final Logger log = new Logger(SqlResource.class); + + private final ObjectMapper jsonMapper; + private final Connection connection; + + @Inject + public SqlResource( + @Json ObjectMapper jsonMapper, + CalciteConnection connection + ) + { + this.jsonMapper = Preconditions.checkNotNull(jsonMapper, "jsonMapper"); + this.connection = Preconditions.checkNotNull(connection, "connection"); + } + + @POST + @Produces(MediaType.APPLICATION_JSON) + @Consumes(MediaType.APPLICATION_JSON) + public Response doPost(final SqlQuery sqlQuery) throws SQLException, IOException + { + // This is not integrated with the experimental authorization framework. + // (Non-trivial since we don't know the dataSources up-front) + + try { + final ResultSet resultSet = connection.createStatement().executeQuery(sqlQuery.getQuery()); + final ResultSetMetaData metaData = resultSet.getMetaData(); + + // Remember which columns are time-typed, so we can emit ISO8601 instead of millis values. + final boolean[] timeColumns = new boolean[metaData.getColumnCount()]; + for (int i = 0; i < metaData.getColumnCount(); i++) { + final int columnType = metaData.getColumnType(i + 1); + if (columnType == Types.TIMESTAMP || columnType == Types.TIME || columnType == Types.DATE) { + timeColumns[i] = true; + } else { + timeColumns[i] = false; + } + } + + return Response.ok( + new StreamingOutput() + { + @Override + public void write(final OutputStream outputStream) throws IOException, WebApplicationException + { + try (final JsonGenerator jsonGenerator = jsonMapper.getFactory().createGenerator(outputStream)) { + jsonGenerator.writeStartArray(); + while (resultSet.next()) { + jsonGenerator.writeStartObject(); + for (int i = 0; i < metaData.getColumnCount(); i++) { + final Object value; + + if (timeColumns[i]) { + value = new DateTime(resultSet.getLong(i + 1)); + } else { + value = resultSet.getObject(i + 1); + } + + jsonGenerator.writeObjectField(metaData.getColumnName(i + 1), value); + } + jsonGenerator.writeEndObject(); + } + jsonGenerator.writeEndArray(); + jsonGenerator.flush(); + + // End with CRLF + outputStream.write('\r'); + outputStream.write('\n'); + } + catch (SQLException e) { + throw Throwables.propagate(e); + } + finally { + try { + resultSet.close(); + } + catch (SQLException e) { + log.warn(e, "Failed to close ResultSet, ignoring."); + } + } + } + } + ).build(); + } + catch (Exception e) { + log.warn(e, "Failed to handle query: %s", sqlQuery); + + // Unwrap preparing exceptions into potentially more useful exceptions. + final Throwable maybeUnwrapped; + if (e instanceof SQLException && e.getMessage().contains("Error while preparing statement")) { + maybeUnwrapped = e.getCause(); + } else { + maybeUnwrapped = e; + } + + return Response.serverError() + .type(MediaType.APPLICATION_JSON_TYPE) + .entity(jsonMapper.writeValueAsBytes(QueryInterruptedException.wrapIfNeeded(maybeUnwrapped))) + .build(); + } + } +} diff --git a/sql/src/test/java/io/druid/sql/avatica/DruidAvaticaHandlerTest.java b/sql/src/test/java/io/druid/sql/avatica/DruidAvaticaHandlerTest.java new file mode 100644 index 00000000000..2784450fbed --- /dev/null +++ b/sql/src/test/java/io/druid/sql/avatica/DruidAvaticaHandlerTest.java @@ -0,0 +1,268 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.avatica; + +import com.google.common.collect.ImmutableList; +import com.google.common.collect.ImmutableMap; +import com.google.common.collect.ImmutableSet; +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import io.druid.java.util.common.Pair; +import io.druid.server.DruidNode; +import io.druid.sql.calcite.planner.Calcites; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.util.CalciteTests; +import org.apache.calcite.jdbc.CalciteConnection; +import org.eclipse.jetty.server.Server; +import org.junit.After; +import org.junit.Assert; +import org.junit.Before; +import org.junit.Rule; +import org.junit.Test; +import org.junit.rules.ExpectedException; +import org.junit.rules.TemporaryFolder; + +import java.net.InetSocketAddress; +import java.sql.Connection; +import java.sql.DatabaseMetaData; +import java.sql.DriverManager; +import java.sql.ResultSet; +import java.sql.ResultSetMetaData; +import java.sql.SQLException; +import java.util.List; +import java.util.Map; +import java.util.Random; +import java.util.Set; + +public class DruidAvaticaHandlerTest +{ + @Rule + public ExpectedException expectedException = ExpectedException.none(); + + @Rule + public TemporaryFolder temporaryFolder = new TemporaryFolder(); + + private CalciteConnection serverConnection; + private Server server; + private Connection client; + + @Before + public void setUp() throws Exception + { + final PlannerConfig plannerConfig = new PlannerConfig(); + serverConnection = Calcites.jdbc( + CalciteTests.createMockSchema( + CalciteTests.createWalker(temporaryFolder.newFolder()), + plannerConfig + ), + plannerConfig + ); + final ServerConfig serverConfig = new ServerConfig() + { + @Override + public boolean isEnableAvatica() + { + return true; + } + }; + final DruidAvaticaHandler handler = new DruidAvaticaHandler( + serverConnection, + new DruidNode("dummy", "dummy", 1), + new AvaticaMonitor(), + serverConfig + ); + final int port = new Random().nextInt(9999) + 10000; + server = new Server(new InetSocketAddress("127.0.0.1", port)); + server.setHandler(handler); + server.start(); + final String url = String.format( + "jdbc:avatica:remote:url=http://127.0.0.1:%d%s", + port, + DruidAvaticaHandler.AVATICA_PATH + ); + client = DriverManager.getConnection(url); + } + + @After + public void tearDown() throws Exception + { + client.close(); + server.stop(); + serverConnection.close(); + client = null; + server = null; + serverConnection = null; + } + + @Test + public void testSelectCount() throws Exception + { + final ResultSet resultSet = client.createStatement().executeQuery("SELECT COUNT(*) AS cnt FROM druid.foo"); + final List> rows = getRows(resultSet); + Assert.assertEquals( + ImmutableList.of( + ImmutableMap.of("cnt", 6L) + ), + rows + ); + } + + @Test + public void testExplainSelectCount() throws Exception + { + final ResultSet resultSet = client.createStatement().executeQuery( + "EXPLAIN PLAN FOR SELECT COUNT(*) AS cnt FROM druid.foo" + ); + final List> rows = getRows(resultSet); + Assert.assertEquals( + ImmutableList.of( + ImmutableMap.of( + "PLAN", + "EnumerableInterpreter\n" + + " DruidQueryRel(dataSource=[foo], dimensions=[[]], aggregations=[[Aggregation{aggregatorFactories=[CountAggregatorFactory{name='a0'}], postAggregator=null, finalizingPostAggregatorFactory=null}]])\n" + ) + ), + rows + ); + } + + @Test + public void testDatabaseMetaDataSchemas() throws Exception + { + final DatabaseMetaData metaData = client.getMetaData(); + Assert.assertEquals( + ImmutableList.of( + ROW(Pair.of("TABLE_CATALOG", null), Pair.of("TABLE_SCHEM", "druid")) + ), + getRows(metaData.getSchemas(null, "druid")) + ); + } + + @Test + public void testDatabaseMetaDataTables() throws Exception + { + final DatabaseMetaData metaData = client.getMetaData(); + Assert.assertEquals( + ImmutableList.of( + ROW( + Pair.of("TABLE_CAT", null), + Pair.of("TABLE_NAME", "foo"), + Pair.of("TABLE_SCHEM", "druid"), + Pair.of("TABLE_TYPE", "TABLE") + ) + ), + getRows( + metaData.getTables(null, "druid", "%", null), + ImmutableSet.of("TABLE_CAT", "TABLE_NAME", "TABLE_SCHEM", "TABLE_TYPE") + ) + ); + } + + @Test + public void testDatabaseMetaDataColumns() throws Exception + { + final DatabaseMetaData metaData = client.getMetaData(); + final String varcharDescription = "VARCHAR(1) CHARACTER SET \"ISO-8859-1\" COLLATE \"ISO-8859-1$en_US$primary\" NOT NULL"; + Assert.assertEquals( + ImmutableList.of( + ROW( + Pair.of("TABLE_SCHEM", "druid"), + Pair.of("TABLE_NAME", "foo"), + Pair.of("COLUMN_NAME", "__time"), + Pair.of("DATA_TYPE", 93), + Pair.of("TYPE_NAME", "TIMESTAMP(0) NOT NULL"), + Pair.of("IS_NULLABLE", "NO") + ), + ROW( + Pair.of("TABLE_SCHEM", "druid"), + Pair.of("TABLE_NAME", "foo"), + Pair.of("COLUMN_NAME", "cnt"), + Pair.of("DATA_TYPE", -5), + Pair.of("TYPE_NAME", "BIGINT NOT NULL"), + Pair.of("IS_NULLABLE", "NO") + ), + ROW( + Pair.of("TABLE_SCHEM", "druid"), + Pair.of("TABLE_NAME", "foo"), + Pair.of("COLUMN_NAME", "dim1"), + Pair.of("DATA_TYPE", 12), + Pair.of("TYPE_NAME", varcharDescription), + Pair.of("IS_NULLABLE", "NO") + ), + ROW( + Pair.of("TABLE_SCHEM", "druid"), + Pair.of("TABLE_NAME", "foo"), + Pair.of("COLUMN_NAME", "dim2"), + Pair.of("DATA_TYPE", 12), + Pair.of("TYPE_NAME", varcharDescription), + Pair.of("IS_NULLABLE", "NO") + ), + ROW( + Pair.of("TABLE_SCHEM", "druid"), + Pair.of("TABLE_NAME", "foo"), + Pair.of("COLUMN_NAME", "m1"), + Pair.of("DATA_TYPE", 6), + Pair.of("TYPE_NAME", "FLOAT NOT NULL"), + Pair.of("IS_NULLABLE", "NO") + ) + ), + getRows( + metaData.getColumns(null, "druid", "foo", "%"), + ImmutableSet.of("IS_NULLABLE", "TABLE_NAME", "TABLE_SCHEM", "COLUMN_NAME", "DATA_TYPE", "TYPE_NAME") + ) + ); + } + + private static List> getRows(final ResultSet resultSet) throws SQLException + { + return getRows(resultSet, null); + } + + private static List> getRows(final ResultSet resultSet, final Set returnKeys) + throws SQLException + { + try { + final ResultSetMetaData metaData = resultSet.getMetaData(); + final List> rows = Lists.newArrayList(); + while (resultSet.next()) { + final Map row = Maps.newHashMap(); + for (int i = 0; i < metaData.getColumnCount(); i++) { + if (returnKeys == null || returnKeys.contains(metaData.getColumnName(i + 1))) { + row.put(metaData.getColumnName(i + 1), resultSet.getObject(i + 1)); + } + } + rows.add(row); + } + return rows; + } + finally { + resultSet.close(); + } + } + + private static Map ROW(final Pair... entries) + { + final Map m = Maps.newHashMap(); + for (Pair entry : entries) { + m.put(entry.lhs, entry.rhs); + } + return m; + } +} diff --git a/sql/src/test/java/io/druid/sql/calcite/CalciteQueryTest.java b/sql/src/test/java/io/druid/sql/calcite/CalciteQueryTest.java new file mode 100644 index 00000000000..fe4b8131de0 --- /dev/null +++ b/sql/src/test/java/io/druid/sql/calcite/CalciteQueryTest.java @@ -0,0 +1,2483 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite; + +import com.google.common.base.Function; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.ImmutableMap; +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import io.druid.granularity.QueryGranularities; +import io.druid.java.util.common.logger.Logger; +import io.druid.query.Druids; +import io.druid.query.Query; +import io.druid.query.QuerySegmentWalker; +import io.druid.query.aggregation.AggregatorFactory; +import io.druid.query.aggregation.CountAggregatorFactory; +import io.druid.query.aggregation.DoubleMaxAggregatorFactory; +import io.druid.query.aggregation.DoubleMinAggregatorFactory; +import io.druid.query.aggregation.DoubleSumAggregatorFactory; +import io.druid.query.aggregation.FilteredAggregatorFactory; +import io.druid.query.aggregation.LongMaxAggregatorFactory; +import io.druid.query.aggregation.LongMinAggregatorFactory; +import io.druid.query.aggregation.LongSumAggregatorFactory; +import io.druid.query.aggregation.PostAggregator; +import io.druid.query.aggregation.cardinality.CardinalityAggregatorFactory; +import io.druid.query.aggregation.hyperloglog.HyperUniqueFinalizingPostAggregator; +import io.druid.query.aggregation.post.ArithmeticPostAggregator; +import io.druid.query.aggregation.post.ConstantPostAggregator; +import io.druid.query.aggregation.post.ExpressionPostAggregator; +import io.druid.query.aggregation.post.FieldAccessPostAggregator; +import io.druid.query.dimension.DefaultDimensionSpec; +import io.druid.query.dimension.DimensionSpec; +import io.druid.query.dimension.ExtractionDimensionSpec; +import io.druid.query.extraction.BucketExtractionFn; +import io.druid.query.extraction.CascadeExtractionFn; +import io.druid.query.extraction.ExtractionFn; +import io.druid.query.extraction.StrlenExtractionFn; +import io.druid.query.extraction.SubstringDimExtractionFn; +import io.druid.query.extraction.TimeFormatExtractionFn; +import io.druid.query.filter.AndDimFilter; +import io.druid.query.filter.BoundDimFilter; +import io.druid.query.filter.DimFilter; +import io.druid.query.filter.InDimFilter; +import io.druid.query.filter.LikeDimFilter; +import io.druid.query.filter.NotDimFilter; +import io.druid.query.filter.OrDimFilter; +import io.druid.query.filter.SelectorDimFilter; +import io.druid.query.groupby.GroupByQuery; +import io.druid.query.groupby.having.DimFilterHavingSpec; +import io.druid.query.groupby.orderby.DefaultLimitSpec; +import io.druid.query.groupby.orderby.OrderByColumnSpec; +import io.druid.query.ordering.StringComparator; +import io.druid.query.ordering.StringComparators; +import io.druid.query.select.PagingSpec; +import io.druid.query.spec.MultipleIntervalSegmentSpec; +import io.druid.query.spec.QuerySegmentSpec; +import io.druid.query.topn.DimensionTopNMetricSpec; +import io.druid.query.topn.InvertedTopNMetricSpec; +import io.druid.query.topn.NumericTopNMetricSpec; +import io.druid.query.topn.TopNQueryBuilder; +import io.druid.segment.column.Column; +import io.druid.sql.calcite.filtration.Filtration; +import io.druid.sql.calcite.planner.Calcites; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.util.CalciteTests; +import io.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker; +import org.apache.calcite.jdbc.CalciteConnection; +import org.apache.calcite.plan.RelOptPlanner; +import org.apache.calcite.runtime.Hook; +import org.joda.time.DateTime; +import org.joda.time.Interval; +import org.junit.After; +import org.junit.Assert; +import org.junit.Before; +import org.junit.Rule; +import org.junit.Test; +import org.junit.rules.TemporaryFolder; + +import java.sql.Connection; +import java.sql.ResultSet; +import java.sql.ResultSetMetaData; +import java.sql.SQLException; +import java.util.Arrays; +import java.util.Date; +import java.util.List; +import java.util.Map; + +public class CalciteQueryTest +{ + private static final Logger log = new Logger(CalciteQueryTest.class); + + // Used to mark tests that should pass once Calcite 1.11.0 is released. + private static final boolean CALCITE_1_11_0 = false; + + private static final PlannerConfig PLANNER_CONFIG_DEFAULT = new PlannerConfig(); + private static final PlannerConfig PLANNER_CONFIG_NO_TOPN = new PlannerConfig() + { + @Override + public int getMaxTopNLimit() + { + return 0; + } + }; + private static final PlannerConfig PLANNER_CONFIG_SELECT_PAGING = new PlannerConfig() + { + @Override + public int getSelectThreshold() + { + return 2; + } + }; + private static final PlannerConfig PLANNER_CONFIG_FALLBACK = new PlannerConfig() + { + @Override + public boolean isUseFallback() + { + return true; + } + }; + + private static final Map TIMESERIES_CONTEXT = ImmutableMap.of( + "skipEmptyBuckets", + true + ); + private static final PagingSpec FIRST_PAGING_SPEC = new PagingSpec(null, 1000, true); + + @Rule + public TemporaryFolder temporaryFolder = new TemporaryFolder(); + + private SpecificSegmentsQuerySegmentWalker walker = null; + private final Map connections = Maps.newHashMap(); + private Hook.Closeable unhook = null; + private List recordedQueries = Lists.newCopyOnWriteArrayList(); + + @Before + public void setUp() throws Exception + { + walker = CalciteTests.createWalker(temporaryFolder.newFolder()); + connections.put(PLANNER_CONFIG_DEFAULT, connectJdbc(walker, PLANNER_CONFIG_DEFAULT)); + connections.put(PLANNER_CONFIG_NO_TOPN, connectJdbc(walker, PLANNER_CONFIG_NO_TOPN)); + connections.put(PLANNER_CONFIG_SELECT_PAGING, connectJdbc(walker, PLANNER_CONFIG_SELECT_PAGING)); + connections.put(PLANNER_CONFIG_FALLBACK, connectJdbc(walker, PLANNER_CONFIG_FALLBACK)); + + unhook = Hook.QUERY_PLAN.add( + new Function() + { + @Override + public Object apply(Object input) + { + log.info("Issued query: %s", input); + recordedQueries.add((Query) input); + return null; + } + } + ); + } + + @After + public void tearDown() throws Exception + { + if (unhook != null) { + unhook.close(); + } + walker.close(); + walker = null; + for (CalciteConnection connection : connections.values()) { + connection.close(); + } + connections.clear(); + } + + private static CalciteConnection connectJdbc( + final QuerySegmentWalker walker, + final PlannerConfig plannerConfig + ) throws SQLException + { + return Calcites.jdbc(CalciteTests.createMockSchema(walker, plannerConfig), plannerConfig); + } + + @Test + public void testSelectConstantExpression() throws Exception + { + testQuery( + "SELECT 1 + 1", + ImmutableList.of(), + ImmutableList.of( + new Object[]{2} + ) + ); + } + + @Test + public void testExplainSelectConstantExpression() throws Exception + { + testQuery( + "EXPLAIN PLAN FOR SELECT 1 + 1", + ImmutableList.of(), + ImmutableList.of( + new Object[]{"EnumerableValues(tuples=[[{ 2 }]])\n"} + ) + ); + } + + @Test + public void testMetadata() throws Exception + { + final String varcharDescription = "VARCHAR(1) CHARACTER SET \"ISO-8859-1\" COLLATE \"ISO-8859-1$en_US$primary\" NOT NULL"; + + // Fallback is necessary since without it, we don't have the Enumerable operators necessary to do this query. + testQuery( + PLANNER_CONFIG_FALLBACK, + "SELECT columnName, dataType, typeName FROM metadata.COLUMNS WHERE tableName = 'foo'", + ImmutableList.of(), + ImmutableList.of( + new Object[]{"__time", 93, "TIMESTAMP(0) NOT NULL"}, + new Object[]{"cnt", -5, "BIGINT NOT NULL"}, + new Object[]{"dim1", 12, varcharDescription}, + new Object[]{"dim2", 12, varcharDescription}, + new Object[]{"m1", 6, "FLOAT NOT NULL"} + ) + ); + } + + + @Test + public void testSelectStar() throws Exception + { + testQuery( + "SELECT * FROM druid.foo", + ImmutableList.of( + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec(FIRST_PAGING_SPEC) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec( + new PagingSpec( + ImmutableMap.of("foo_1970-01-01T00:00:00.000Z_2001-01-03T00:00:00.001Z_1", 5), + 1000, + true + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{T("2000-01-01"), 1L, "", "a", 1.0}, + new Object[]{T("2000-01-02"), 1L, "10.1", "", 2.0}, + new Object[]{T("2000-01-03"), 1L, "2", "", 3.0}, + new Object[]{T("2001-01-01"), 1L, "1", "a", 4.0}, + new Object[]{T("2001-01-02"), 1L, "def", "abc", 5.0}, + new Object[]{T("2001-01-03"), 1L, "abc", "", 6.0} + ) + ); + } + + @Test + public void testExplainSelectStar() throws Exception + { + testQuery( + "EXPLAIN PLAN FOR SELECT * FROM druid.foo", + ImmutableList.of(), + ImmutableList.of( + new Object[]{ + "EnumerableInterpreter\n" + + " DruidQueryRel(dataSource=[foo])\n" + } + ) + ); + } + + @Test + public void testSelectStarWithLimit() throws Exception + { + testQuery( + "SELECT * FROM druid.foo LIMIT 2", + ImmutableList.of( + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec(FIRST_PAGING_SPEC) + .build() + ), + ImmutableList.of( + new Object[]{T("2000-01-01"), 1L, "", "a", 1.0}, + new Object[]{T("2000-01-02"), 1L, "10.1", "", 2.0} + ) + ); + } + + @Test + public void testSelectStarWithLimitDescending() throws Exception + { + testQuery( + "SELECT * FROM druid.foo ORDER BY __time DESC LIMIT 2", + ImmutableList.of( + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .descending(true) + .pagingSpec(FIRST_PAGING_SPEC) + .build() + ), + ImmutableList.of( + new Object[]{T("2001-01-03"), 1L, "abc", "", 6.0}, + new Object[]{T("2001-01-02"), 1L, "def", "abc", 5.0} + ) + ); + } + + @Test + public void testSelectSingleColumnWithLimitDescending() throws Exception + { + testQuery( + "SELECT dim1 FROM druid.foo ORDER BY __time DESC LIMIT 2", + ImmutableList.of( + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .dimensionSpecs(DIMS(new DefaultDimensionSpec("dim1", "d1"))) + .granularity(QueryGranularities.ALL) + .descending(true) + .pagingSpec(FIRST_PAGING_SPEC) + .build() + ), + ImmutableList.of( + new Object[]{"abc"}, + new Object[]{"def"} + ) + ); + } + + @Test + public void testSelfJoinWithFallback() throws Exception + { + testQuery( + PLANNER_CONFIG_FALLBACK, + "SELECT x.dim1, y.dim1, y.dim2\n" + + "FROM\n" + + " druid.foo x INNER JOIN druid.foo y ON x.dim1 = y.dim2\n" + + "WHERE\n" + + " x.dim1 <> ''", + ImmutableList.of( + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(NOT(SELECTOR("dim1", "", null))) + .pagingSpec(FIRST_PAGING_SPEC) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(NOT(SELECTOR("dim1", "", null))) + .pagingSpec( + new PagingSpec( + ImmutableMap.of("foo_1970-01-01T00:00:00.000Z_2001-01-03T00:00:00.001Z_1", 4), + 1000, + true + ) + ) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec(FIRST_PAGING_SPEC) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec( + new PagingSpec( + ImmutableMap.of("foo_1970-01-01T00:00:00.000Z_2001-01-03T00:00:00.001Z_1", 5), + 1000, + true + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{"abc", "def", "abc"} + ) + ); + } + + @Test + public void testExplainSelfJoinWithFallback() throws Exception + { + testQuery( + PLANNER_CONFIG_FALLBACK, + "EXPLAIN PLAN FOR\n" + + "SELECT x.dim1, y.dim1, y.dim2\n" + + "FROM\n" + + " druid.foo x INNER JOIN druid.foo y ON x.dim1 = y.dim2\n" + + "WHERE\n" + + " x.dim1 <> ''", + ImmutableList.of(), + ImmutableList.of( + new Object[]{ + "EnumerableCalc(expr#0..9=[{inputs}], dim1=[$t7], dim10=[$t2], dim2=[$t3])\n" + + " EnumerableJoin(condition=[=($3, $7)], joinType=[inner])\n" + + " EnumerableInterpreter\n" + + " DruidQueryRel(dataSource=[foo])\n" + + " EnumerableInterpreter\n" + + " DruidQueryRel(dataSource=[foo], filter=[!dim1 = ])\n" + } + ) + ); + } + + @Test + public void testUnplannableQueries() throws Exception + { + // All of these queries are unplannable because they rely on features Druid doesn't support. + // This test is here to confirm that we don't fall back to Calcite's interpreter or enumerable implementation. + // It's also here so when we do support these features, we can have "real" tests for these queries. + + final List queries = ImmutableList.of( + "SELECT (dim1 || ' ' || dim2) AS cc, COUNT(*) FROM druid.foo GROUP BY dim1 || ' ' || dim2", // Concat two dims + "SELECT dim1 FROM druid.foo ORDER BY dim1", // SELECT query with order by + "SELECT TRIM(dim1) FROM druid.foo", // TRIM function + "SELECT cnt, COUNT(*) FROM druid.foo GROUP BY cnt", // GROUP BY long + "SELECT m1, COUNT(*) FROM druid.foo GROUP BY m1", // GROUP BY float + "SELECT COUNT(*) FROM druid.foo WHERE m1 = 1.0", // Filter on float + "SELECT COUNT(*) FROM druid.foo WHERE dim1 = dim2", // Filter on two columns equaling each other + "SELECT COUNT(*) FROM druid.foo WHERE CHARACTER_LENGTH(dim1) = CHARACTER_LENGTH(dim2)", // Similar to above + "SELECT CHARACTER_LENGTH(dim1) + 1 FROM druid.foo GROUP BY CHARACTER_LENGTH(dim1) + 1", // Group by math + "SELECT COUNT(*) FROM druid.foo x, druid.foo y", // Self-join + "SELECT\n" + + " (CAST(__time AS DATE) + EXTRACT(HOUR FROM __time) * INTERVAL '1' HOUR) AS t,\n" + + " SUM(cnt) AS cnt\n" + + "FROM druid.foo\n" + + "GROUP BY (CAST(__time AS DATE) + EXTRACT(HOUR FROM __time) * INTERVAL '1' HOUR)", // Time arithmetic + "SELECT columnName, typeName FROM metadata.COLUMNS WHERE tableName = 'foo'" // Metadata tables without fallback + ); + + for (final String query : queries) { + Exception e = null; + try { + testQuery(query, ImmutableList.of(), ImmutableList.of()); + } + catch (Exception e1) { + e = e1; + } + + if (!(e instanceof SQLException) || !(e.getCause() instanceof RelOptPlanner.CannotPlanException)) { + log.error(e, "Expected SQLException caused by CannotPlanException for query: %s", query); + Assert.fail(query); + } + } + } + + @Test + public void testSelectStarWithDimFilter() throws Exception + { + testQuery( + "SELECT * FROM druid.foo WHERE dim1 > 'd' OR dim2 = 'a'", + ImmutableList.of( + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec(FIRST_PAGING_SPEC) + .filters( + OR( + BOUND("dim1", "d", null, true, false, null, StringComparators.LEXICOGRAPHIC), + SELECTOR("dim2", "a", null) + ) + ) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec( + new PagingSpec( + ImmutableMap.of("foo_1970-01-01T00:00:00.000Z_2001-01-03T00:00:00.001Z_1", 2), + 1000, + true + ) + ) + .filters( + OR( + BOUND("dim1", "d", null, true, false, null, StringComparators.LEXICOGRAPHIC), + SELECTOR("dim2", "a", null) + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{T("2000-01-01"), 1L, "", "a", 1.0}, + new Object[]{T("2001-01-01"), 1L, "1", "a", 4.0}, + new Object[]{T("2001-01-02"), 1L, "def", "abc", 5.0} + ) + ); + } + + @Test + public void testSelectStarWithDimFilterAndPaging() throws Exception + { + testQuery( + PLANNER_CONFIG_SELECT_PAGING, + "SELECT * FROM druid.foo WHERE dim1 > 'd' OR dim2 = 'a'", + ImmutableList.of( + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec(new PagingSpec(null, 2, true)) + .filters( + OR( + BOUND("dim1", "d", null, true, false, null, StringComparators.LEXICOGRAPHIC), + SELECTOR("dim2", "a", null) + ) + ) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec( + new PagingSpec( + ImmutableMap.of("foo_1970-01-01T00:00:00.000Z_2001-01-03T00:00:00.001Z_1", 1), + 2, + true + ) + ) + .filters( + OR( + BOUND("dim1", "d", null, true, false, null, StringComparators.LEXICOGRAPHIC), + SELECTOR("dim2", "a", null) + ) + ) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .pagingSpec( + new PagingSpec( + ImmutableMap.of("foo_1970-01-01T00:00:00.000Z_2001-01-03T00:00:00.001Z_1", 2), + 2, + true + ) + ) + .filters( + OR( + BOUND("dim1", "d", null, true, false, null, StringComparators.LEXICOGRAPHIC), + SELECTOR("dim2", "a", null) + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{T("2000-01-01"), 1L, "", "a", 1.0}, + new Object[]{T("2001-01-01"), 1L, "1", "a", 4.0}, + new Object[]{T("2001-01-02"), 1L, "def", "abc", 5.0} + ) + ); + } + + @Test + public void testGroupByNothingWithLiterallyFalseFilter() throws Exception + { + if (!CALCITE_1_11_0) { + // https://issues.apache.org/jira/browse/CALCITE-1488 + return; + } + + testQuery( + "SELECT COUNT(*), MAX(cnt) FROM druid.foo WHERE 1 = 0", + ImmutableList.of(), + ImmutableList.of( + new Object[]{0L, null} + ) + ); + } + + @Test + public void testGroupByOneColumnWithLiterallyFalseFilter() throws Exception + { + if (!CALCITE_1_11_0) { + // https://issues.apache.org/jira/browse/CALCITE-1488 + return; + } + + testQuery( + "SELECT COUNT(*), MAX(cnt) FROM druid.foo WHERE 1 = 0 GROUP BY dim1", + ImmutableList.of(), + ImmutableList.of() + ); + } + + @Test + public void testGroupByWithFilterMatchingNothing() throws Exception + { + // This query should actually return [0, null] rather than an empty result set, but it doesn't. + // This test just "documents" the current behavior. + + testQuery( + "SELECT COUNT(*), MAX(cnt) FROM druid.foo WHERE dim1 = 'foobar'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .filters(SELECTOR("dim1", "foobar", null)) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS( + new CountAggregatorFactory("a0"), + new LongMaxAggregatorFactory("a1", "cnt") + )) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of() + ); + } + + @Test + public void testGroupByWithFilterMatchingNothingWithGroupByLiteral() throws Exception + { + testQuery( + "SELECT COUNT(*), MAX(cnt) FROM druid.foo WHERE dim1 = 'foobar' GROUP BY 'dummy'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .filters(SELECTOR("dim1", "foobar", null)) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS( + new CountAggregatorFactory("a0"), + new LongMaxAggregatorFactory("a1", "cnt") + )) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of() + ); + } + + @Test + public void testCountStar() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{6L} + ) + ); + } + + @Test + public void testCountStarWithLikeFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE dim1 like 'a%' OR dim2 like '%xb%' escape 'x'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters( + OR( + new LikeDimFilter("dim1", "a%", null, null), + new LikeDimFilter("dim2", "%xb%", "x", null) + ) + ) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{2L} + ) + ); + } + + @Test + public void testCountStarWithLongColumnFilters() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE cnt >= 3 OR cnt = 1", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters( + OR( + BOUND("cnt", "3", null, false, false, null, StringComparators.NUMERIC), + SELECTOR("cnt", "1", null) + ) + ) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{6L} + ) + ); + } + + @Test + public void testCountStarWithLongColumnFiltersOnTwoPoints() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE cnt = 1 OR cnt = 2", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(IN("cnt", ImmutableList.of("1", "2"), null)) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{6L} + ) + ); + } + + @Test + public void testFilterOnStringAsNumber() throws Exception + { + testQuery( + "SELECT distinct dim1 FROM druid.foo WHERE " + + "dim1 = 10 OR " + + "(floor(CAST(dim1 AS float)) = 10.00 and CAST(dim1 AS float) > 9 and CAST(dim1 AS float) <= 10.5)", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions(DIMS(new DefaultDimensionSpec("dim1", "d0"))) + .setDimFilter( + OR( + SELECTOR("dim1", "10", null), + AND( + NUMERIC_SELECTOR("dim1", "10.00", new BucketExtractionFn(1.0, 0.0)), + BOUND("dim1", "9", "10.5", true, false, null, StringComparators.NUMERIC) + ) + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{"10.1"} + ) + ); + } + + @Test + public void testSimpleAggregations() throws Exception + { + testQuery( + "SELECT COUNT(*), COUNT(cnt), COUNT(dim1), AVG(cnt), SUM(cnt), SUM(cnt) + MIN(cnt) + MAX(cnt) FROM druid.foo", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .aggregators( + AGGS( + new CountAggregatorFactory("a0"), + new LongSumAggregatorFactory("A1:sum", "cnt"), + new CountAggregatorFactory("A1:count"), + new LongSumAggregatorFactory("a2", "cnt"), + new LongMinAggregatorFactory("a3", "cnt"), + new LongMaxAggregatorFactory("a4", "cnt") + ) + ) + .postAggregators( + ImmutableList.of( + new ArithmeticPostAggregator( + "a1", + "quotient", + ImmutableList.of( + new FieldAccessPostAggregator(null, "A1:sum"), + new FieldAccessPostAggregator(null, "A1:count") + ) + ), + new ArithmeticPostAggregator( + "a5", + "+", + ImmutableList.of( + new ArithmeticPostAggregator( + null, + "+", + ImmutableList.of( + new FieldAccessPostAggregator(null, "a2"), + new FieldAccessPostAggregator(null, "a3") + ) + ), + new FieldAccessPostAggregator(null, "a4") + ) + ) + ) + ) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{6L, 6L, 6L, 1L, 6L, 8L} + ) + ); + } + + @Test + public void testGroupByWithSortOnPostAggregation() throws Exception + { + testQuery( + "SELECT dim1, MIN(m1) + MAX(m1) AS x FROM druid.foo GROUP BY dim1 ORDER BY x LIMIT 3", + ImmutableList.of( + new TopNQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .dimension(new DefaultDimensionSpec("dim1", "d0")) + .metric(new InvertedTopNMetricSpec(new NumericTopNMetricSpec("a2"))) + .aggregators(AGGS( + new DoubleMinAggregatorFactory("a0", "m1"), + new DoubleMaxAggregatorFactory("a1", "m1") + )) + .postAggregators( + ImmutableList.of( + new ArithmeticPostAggregator( + "a2", + "+", + ImmutableList.of( + new FieldAccessPostAggregator(null, "a0"), + new FieldAccessPostAggregator(null, "a1") + ) + ) + ) + ) + .threshold(3) + .build() + ), + ImmutableList.of( + new Object[]{"", 2.0}, + new Object[]{"10.1", 4.0}, + new Object[]{"2", 6.0} + ) + ); + } + + @Test + public void testGroupByWithSortOnPostAggregationNoTopN() throws Exception + { + testQuery( + PLANNER_CONFIG_NO_TOPN, + "SELECT dim1, MIN(m1) + MAX(m1) AS x FROM druid.foo GROUP BY dim1 ORDER BY x LIMIT 3", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions(DIMS(new DefaultDimensionSpec("dim1", "d0"))) + .setAggregatorSpecs( + ImmutableList.of( + new DoubleMinAggregatorFactory("a0", "m1"), + new DoubleMaxAggregatorFactory("a1", "m1") + ) + ) + .setPostAggregatorSpecs( + ImmutableList.of( + new ArithmeticPostAggregator( + "a2", + "+", + ImmutableList.of( + new FieldAccessPostAggregator(null, "a0"), + new FieldAccessPostAggregator(null, "a1") + ) + ) + ) + ) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec( + "a2", + OrderByColumnSpec.Direction.ASCENDING, + StringComparators.NUMERIC + ) + ), + 3 + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{"", 2.0}, + new Object[]{"10.1", 4.0}, + new Object[]{"2", 6.0} + ) + ); + } + + @Test + public void testFilteredAggregations() throws Exception + { + testQuery( + "SELECT " + + "SUM(case dim1 when 'abc' then cnt end), " + + "SUM(case dim1 when 'abc' then null else cnt end), " + + "SUM(case substring(dim1, 1, 1) when 'a' then cnt end), " + + "COUNT(dim2) filter(WHERE dim1 <> '1'), " + + "COUNT(CASE WHEN dim1 <> '1' THEN 'dummy' END), " + + "SUM(CASE WHEN dim1 <> '1' THEN 1 ELSE 0 END), " + + "SUM(cnt) filter(WHERE dim2 = 'a'), " + + "SUM(case when dim1 <> '1' then cnt end) filter(WHERE dim2 = 'a') " + + "FROM druid.foo", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS( + new FilteredAggregatorFactory( + new LongSumAggregatorFactory("a0", "cnt"), + SELECTOR("dim1", "abc", null) + ), + new FilteredAggregatorFactory( + new LongSumAggregatorFactory("a1", "cnt"), + NOT(SELECTOR("dim1", "abc", null)) + ), + new FilteredAggregatorFactory( + new LongSumAggregatorFactory("a2", "cnt"), + SELECTOR("dim1", "a", new SubstringDimExtractionFn(0, 1)) + ), + new FilteredAggregatorFactory( + new CountAggregatorFactory("a3"), + NOT(SELECTOR("dim1", "1", null)) + ), + new FilteredAggregatorFactory( + new CountAggregatorFactory("a4"), + NOT(SELECTOR("dim1", "1", null)) + ), + new FilteredAggregatorFactory( + new CountAggregatorFactory("a5"), + NOT(SELECTOR("dim1", "1", null)) + ), + new FilteredAggregatorFactory( + new LongSumAggregatorFactory("a6", "cnt"), + SELECTOR("dim2", "a", null) + ), + new FilteredAggregatorFactory( + new LongSumAggregatorFactory("a7", "cnt"), + AND( + SELECTOR("dim2", "a", null), + NOT(SELECTOR("dim1", "1", null)) + ) + ) + )) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{1L, 5L, 1L, 5L, 5L, 5, 2L, 1L} + ) + ); + } + + @Test + public void testExpressionAggregations() throws Exception + { + testQuery( + "SELECT SUM(cnt * 3), LN(SUM(cnt) + SUM(m1)) FROM druid.foo", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS( + new LongSumAggregatorFactory("a0", null, "(\"cnt\" * 3)"), + new LongSumAggregatorFactory("a1", "cnt", null), + new DoubleSumAggregatorFactory("a2", "m1", null) + )) + .postAggregators(ImmutableList.of( + new ExpressionPostAggregator("a3", "log((\"a1\" + \"a2\"))") + )) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{18L, 3.295836866004329} + ) + ); + } + + @Test + public void testInFilter() throws Exception + { + testQuery( + "SELECT dim1, COUNT(*) FROM druid.foo WHERE dim1 IN ('abc', 'def', 'ghi') GROUP BY dim1", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions(DIMS(new DefaultDimensionSpec("dim1", "d0"))) + .setDimFilter(new InDimFilter("dim1", ImmutableList.of("abc", "def", "ghi"), null)) + .setAggregatorSpecs( + AGGS( + new CountAggregatorFactory("a0") + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{"abc", 1L}, + new Object[]{"def", 1L} + ) + ); + } + + @Test + public void testCountStarWithDegenerateFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE dim2 = 'a' and (dim1 > 'a' OR dim1 < 'b')", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(SELECTOR("dim2", "a", null)) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{2L} + ) + ); + } + + @Test + public void testCountStarWithNotOfDegenerateFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE dim2 = 'a' and not (dim1 > 'a' OR dim1 < 'b')", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS()) + .granularity(QueryGranularities.ALL) + .filters(null) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of() + ); + } + + @Test + public void testCountStarWithBoundFilterSimplifyOr() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE (dim1 >= 'a' and dim1 < 'b') OR dim1 = 'ab'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(BOUND("dim1", "a", "b", false, true, null, StringComparators.LEXICOGRAPHIC)) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{1L} + ) + ); + } + + @Test + public void testCountStarWithBoundFilterSimplifyAnd() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE (dim1 >= 'a' and dim1 < 'b') and dim1 = 'abc'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(SELECTOR("dim1", "abc", null)) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{1L} + ) + ); + } + + @Test + public void testCountStarWithFilterOnCastedString() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE CAST(dim1 AS bigint) = 2", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(NUMERIC_SELECTOR("dim1", "2", null)) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{1L} + ) + ); + } + + @Test + public void testCountStarWithTimeFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo " + + "WHERE __time >= TIMESTAMP '2000-01-01 00:00:00' AND __time < TIMESTAMP '2001-01-01 00:00:00'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(new Interval("2000-01-01/2001-01-01"))) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{3L} + ) + ); + } + + @Test + public void testCountStarWithSinglePointInTime() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE __time = TIMESTAMP '2000-01-01 00:00:00'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(new Interval("2000-01-01/2000-01-01T00:00:00.001"))) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{1L} + ) + ); + } + + @Test + public void testCountStarWithTwoPointsInTime() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE " + + "__time = TIMESTAMP '2000-01-01 00:00:00' OR __time = TIMESTAMP '2000-01-01 00:00:00' + INTERVAL '1' DAY", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals( + QSS( + new Interval("2000-01-01/2000-01-01T00:00:00.001"), + new Interval("2000-01-02/2000-01-02T00:00:00.001") + ) + ) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{2L} + ) + ); + } + + @Test + public void testCountStarWithComplexDisjointTimeFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo " + + "WHERE dim2 = 'a' and (" + + " (__time >= TIMESTAMP '2000-01-01 00:00:00' AND __time < TIMESTAMP '2001-01-01 00:00:00')" + + " OR (" + + " (__time >= TIMESTAMP '2002-01-01 00:00:00' AND __time < TIMESTAMP '2003-05-01 00:00:00')" + + " and (__time >= TIMESTAMP '2002-05-01 00:00:00' AND __time < TIMESTAMP '2004-01-01 00:00:00')" + + " and dim1 = 'abc'" + + " )" + + ")", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(new Interval("2000/2001"), new Interval("2002-05-01/2003-05-01"))) + .granularity(QueryGranularities.ALL) + .filters( + AND( + SELECTOR("dim2", "a", null), + OR( + TIME_BOUND("2000/2001"), + AND( + SELECTOR("dim1", "abc", null), + TIME_BOUND("2002-05-01/2003-05-01") + ) + ) + ) + ) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{1L} + ) + ); + } + + @Test + public void testCountStarWithNotOfComplexDisjointTimeFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo " + + "WHERE not (dim2 = 'a' and (" + + " (__time >= TIMESTAMP '2000-01-01 00:00:00' AND __time < TIMESTAMP '2001-01-01 00:00:00')" + + " OR (" + + " (__time >= TIMESTAMP '2002-01-01 00:00:00' AND __time < TIMESTAMP '2004-01-01 00:00:00')" + + " and (__time >= TIMESTAMP '2002-05-01 00:00:00' AND __time < TIMESTAMP '2003-05-01 00:00:00')" + + " and dim1 = 'abc'" + + " )" + + " )" + + ")", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .filters( + OR( + NOT(SELECTOR("dim2", "a", null)), + AND( + NOT(TIME_BOUND("2000/2001")), + NOT( + AND( + SELECTOR("dim1", "abc", null), + TIME_BOUND("2002-05-01/2003-05-01") + ) + ) + ) + ) + ) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{5L} + ) + ); + } + + @Test + public void testCountStarWithNotTimeFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo " + + "WHERE dim1 <> 'xxx' and not (" + + " (__time >= TIMESTAMP '2000-01-01 00:00:00' AND __time < TIMESTAMP '2001-01-01 00:00:00')" + + " OR (__time >= TIMESTAMP '2003-01-01 00:00:00' AND __time < TIMESTAMP '2004-01-01 00:00:00'))", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals( + QSS( + new Interval(Filtration.eternity().getStart(), new DateTime("2000")), + new Interval("2001/2003"), + new Interval(new DateTime("2004"), Filtration.eternity().getEnd()) + ) + ) + .filters(NOT(SELECTOR("dim1", "xxx", null))) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{3L} + ) + ); + } + + @Test + public void testCountStarWithTimeAndDimFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo " + + "WHERE dim2 <> 'a' " + + "and __time BETWEEN TIMESTAMP '2000-01-01 00:00:00' AND TIMESTAMP '2000-12-31 23:59:59.999'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(new Interval("2000-01-01/2001-01-01"))) + .filters(NOT(SELECTOR("dim2", "a", null))) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{2L} + ) + ); + } + + @Test + public void testCountStarWithTimeOrDimFilter() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo " + + "WHERE dim2 <> 'a' " + + "or __time BETWEEN TIMESTAMP '2000-01-01 00:00:00' AND TIMESTAMP '2000-12-31 23:59:59.999'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .filters( + OR( + NOT(SELECTOR("dim2", "a", null)), + BOUND( + "__time", + String.valueOf(T("2000-01-01").getTime()), + String.valueOf(T("2000-12-31T23:59:59.999").getTime()), + false, + false, + null, + StringComparators.NUMERIC + ) + ) + ) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{5L} + ) + ); + } + + @Test + public void testCountStarWithTimeFilterOnLongColumn() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo WHERE " + + "cnt >= EXTRACT(EPOCH FROM TIMESTAMP '1970-01-01 00:00:00') * 1000 " + + "AND cnt < EXTRACT(EPOCH FROM TIMESTAMP '1970-01-02 00:00:00') * 1000", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters( + BOUND( + "cnt", + String.valueOf(new DateTime("1970-01-01").getMillis()), + String.valueOf(new DateTime("1970-01-02").getMillis()), + false, + true, + null, + StringComparators.NUMERIC + ) + ) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{6L} + ) + ); + } + + @Test + public void testSelectDistinctWithCascadeExtractionFilter() throws Exception + { + testQuery( + "SELECT distinct dim1 FROM druid.foo WHERE substring(substring(dim1, 2), 1, 1) = 'e' OR dim2 = 'a'", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions(DIMS(new DefaultDimensionSpec("dim1", "d0"))) + .setDimFilter( + OR( + SELECTOR( + "dim1", + "e", + CASCADE( + new SubstringDimExtractionFn(1, null), + new SubstringDimExtractionFn(0, 1) + ) + ), + SELECTOR("dim2", "a", null) + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{""}, + new Object[]{"1"}, + new Object[]{"def"} + ) + ); + } + + @Test + public void testSelectDistinctWithStrlenFilter() throws Exception + { + testQuery( + "SELECT distinct dim1 FROM druid.foo " + + "WHERE CHARACTER_LENGTH(dim1) = 3 OR CAST(CHARACTER_LENGTH(dim1) AS varchar) = 3", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions(DIMS(new DefaultDimensionSpec("dim1", "d0"))) + .setDimFilter( + OR( + NUMERIC_SELECTOR("dim1", "3", StrlenExtractionFn.instance()), + SELECTOR("dim1", "3", StrlenExtractionFn.instance()) + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{"abc"}, + new Object[]{"def"} + ) + ); + } + + @Test + public void testCountDistinct() throws Exception + { + testQuery( + "SELECT SUM(cnt), COUNT(distinct dim2) FROM druid.foo", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .aggregators( + AGGS( + new LongSumAggregatorFactory("a0", "cnt"), + new CardinalityAggregatorFactory( + "a1", + null, + DIMS(new DefaultDimensionSpec("dim2", "A1:dimSpec")), + false + ) + ) + ) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{6L, 3L} + ) + ); + } + + @Test + public void testCountDistinctArithmetic() throws Exception + { + testQuery( + "SELECT\n" + + " SUM(cnt),\n" + + " COUNT(DISTINCT dim2),\n" + + " CAST(COUNT(DISTINCT dim2) AS FLOAT),\n" + + " SUM(cnt) / COUNT(DISTINCT dim2),\n" + + " SUM(cnt) / COUNT(DISTINCT dim2) + 3,\n" + + " CAST(SUM(cnt) AS FLOAT) / CAST(COUNT(DISTINCT dim2) AS FLOAT) + 3\n" + + "FROM druid.foo", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .aggregators( + AGGS( + new LongSumAggregatorFactory("a0", "cnt"), + new CardinalityAggregatorFactory( + "a1", + null, + DIMS(new DefaultDimensionSpec("dim2", "A1:dimSpec")), + false + ) + ) + ) + .postAggregators(ImmutableList.of( + new HyperUniqueFinalizingPostAggregator("a2", "a1"), + new ArithmeticPostAggregator("a3", "quotient", ImmutableList.of( + new FieldAccessPostAggregator(null, "a0"), + new HyperUniqueFinalizingPostAggregator(null, "a1") + )), + new ArithmeticPostAggregator("a4", "+", ImmutableList.of( + new ArithmeticPostAggregator(null, "quotient", ImmutableList.of( + new FieldAccessPostAggregator(null, "a0"), + new HyperUniqueFinalizingPostAggregator(null, "a1") + )), + new ConstantPostAggregator(null, 3) + )), + new ArithmeticPostAggregator("a5", "+", ImmutableList.of( + new ArithmeticPostAggregator(null, "quotient", ImmutableList.of( + new FieldAccessPostAggregator(null, "a0"), + new HyperUniqueFinalizingPostAggregator(null, "a1") + )), + new ConstantPostAggregator(null, 3) + )) + )) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{6L, 3L, 3.0021994137521975, 1L, 4L, 4.9985347983600805} + ) + ); + } + + @Test + public void testCountDistinctOfSubstring() throws Exception + { + testQuery( + "SELECT COUNT(distinct substring(dim1, 1, 1)) FROM druid.foo WHERE dim1 <> ''", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .filters(NOT(SELECTOR("dim1", "", null))) + .granularity(QueryGranularities.ALL) + .aggregators( + AGGS( + new CardinalityAggregatorFactory( + "a0", + DIMS( + new ExtractionDimensionSpec( + "dim1", + "A0:dimSpec", + new SubstringDimExtractionFn(0, 1) + ) + ), + false + ) + ) + ) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{4L} + ) + ); + } + + @Test + public void testGroupByLimitPushDown() throws Exception + { + testQuery( + "SELECT dim1, dim2, SUM(cnt) FROM druid.foo GROUP BY dim1, dim2 ORDER BY dim2 LIMIT 4", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new DefaultDimensionSpec("dim2", "d1"), + new DefaultDimensionSpec("dim1", "d0") + ) + ) + .setAggregatorSpecs( + AGGS( + new LongSumAggregatorFactory("a0", "cnt") + ) + ) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec("d1", OrderByColumnSpec.Direction.ASCENDING) + ), + 4 + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{"10.1", "", 1L}, + new Object[]{"2", "", 1L}, + new Object[]{"abc", "", 1L}, + new Object[]{"", "a", 1L} + ) + ); + } + + @Test + public void testGroupByLimitPushDownWithHavingOnLong() throws Exception + { + testQuery( + "SELECT dim1, dim2, SUM(cnt) AS thecnt " + + "FROM druid.foo " + + "group by dim1, dim2 " + + "having SUM(cnt) = 1 " + + "order by dim2 " + + "limit 4", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new DefaultDimensionSpec("dim2", "d1"), + new DefaultDimensionSpec("dim1", "d0") + ) + ) + .setAggregatorSpecs( + AGGS( + new LongSumAggregatorFactory("a0", "cnt") + ) + ) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec("d1", OrderByColumnSpec.Direction.ASCENDING) + ), + 4 + ) + ) + .setHavingSpec(new DimFilterHavingSpec(NUMERIC_SELECTOR("a0", "1", null))) + .build() + ), + ImmutableList.of( + new Object[]{"10.1", "", 1L}, + new Object[]{"2", "", 1L}, + new Object[]{"abc", "", 1L}, + new Object[]{"", "a", 1L} + ) + ); + } + + @Test + public void testGroupByLimitPushDownWithHavingOnDouble() throws Exception + { + testQuery( + "SELECT dim1, dim2, SUM(m1) AS m1_sum " + + "FROM druid.foo " + + "group by dim1, dim2 " + + "having SUM(m1) > 1 " + + "order by dim2 " + + "limit 4", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new DefaultDimensionSpec("dim2", "d1"), + new DefaultDimensionSpec("dim1", "d0") + ) + ) + .setAggregatorSpecs( + AGGS( + new DoubleSumAggregatorFactory("a0", "m1") + ) + ) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec("d1", OrderByColumnSpec.Direction.ASCENDING) + ), + 4 + ) + ) + .setHavingSpec(new DimFilterHavingSpec( + BOUND("a0", "1", null, true, false, null, StringComparators.NUMERIC) + )) + .build() + ), + ImmutableList.of( + new Object[]{"10.1", "", 2.0}, + new Object[]{"2", "", 3.0}, + new Object[]{"abc", "", 6.0}, + new Object[]{"1", "a", 4.0} + ) + ); + } + + @Test + public void testFilterOnTimeFloor() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo " + + "WHERE floor(__time TO month) = TIMESTAMP '2000-01-01 00:00:00'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(new Interval("2000/P1M"))) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{3L} + ) + ); + } + + @Test + public void testFilterOnTimeFloorMisaligned() throws Exception + { + testQuery( + "SELECT COUNT(*) FROM druid.foo " + + "WHERE floor(__time TO month) = TIMESTAMP '2000-01-01 00:00:01'", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS()) + .granularity(QueryGranularities.ALL) + .aggregators(AGGS(new CountAggregatorFactory("a0"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of() + ); + } + + @Test + public void testGroupByFloor() throws Exception + { + testQuery( + "SELECT floor(CAST(dim1 AS float)), COUNT(*) FROM druid.foo GROUP BY floor(CAST(dim1 AS float))", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions(DIMS( + new ExtractionDimensionSpec("dim1", "d0", new BucketExtractionFn(1.0, 0.0)) + )) + .setAggregatorSpecs(AGGS(new CountAggregatorFactory("a0"))) + .build() + ), + ImmutableList.of( + new Object[]{null, 3L}, + new Object[]{1.0, 1L}, + new Object[]{10.0, 1L}, + new Object[]{2.0, 1L} + ) + ); + } + + @Test + public void testGroupByFloorWithOrderBy() throws Exception + { + testQuery( + "SELECT floor(CAST(dim1 AS float)) AS fl, COUNT(*) FROM druid.foo GROUP BY floor(CAST(dim1 AS float)) ORDER BY fl DESC", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new ExtractionDimensionSpec("dim1", "d0", new BucketExtractionFn(1.0, 0.0)) + ) + ) + .setAggregatorSpecs(AGGS(new CountAggregatorFactory("a0"))) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec( + "d0", + OrderByColumnSpec.Direction.DESCENDING, + StringComparators.NUMERIC + ) + ), + Integer.MAX_VALUE + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{10.0, 1L}, + new Object[]{2.0, 1L}, + new Object[]{1.0, 1L}, + new Object[]{null, 3L} + ) + ); + } + + @Test + public void testGroupByFloorTimeAndOneOtherDimensionWithOrderBy() throws Exception + { + testQuery( + "SELECT floor(__time TO year), dim2, COUNT(*)" + + " FROM druid.foo" + + " GROUP BY floor(__time TO year), dim2" + + " ORDER BY floor(__time TO year), dim2, COUNT(*) DESC", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new ExtractionDimensionSpec( + "__time", + "d0", + new TimeFormatExtractionFn(null, null, null, QueryGranularities.YEAR, true) + ), + new DefaultDimensionSpec("dim2", "d1") + ) + ) + .setAggregatorSpecs( + AGGS( + new CountAggregatorFactory("a0") + ) + ) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec( + "d0", + OrderByColumnSpec.Direction.ASCENDING, + StringComparators.NUMERIC + ), + new OrderByColumnSpec( + "d1", + OrderByColumnSpec.Direction.ASCENDING, + StringComparators.LEXICOGRAPHIC + ), + new OrderByColumnSpec( + "a0", + OrderByColumnSpec.Direction.DESCENDING, + StringComparators.NUMERIC + ) + ), + Integer.MAX_VALUE + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{T("2000"), "", 2L}, + new Object[]{T("2000"), "a", 1L}, + new Object[]{T("2001"), "", 1L}, + new Object[]{T("2001"), "a", 1L}, + new Object[]{T("2001"), "abc", 1L} + ) + ); + } + + @Test + public void testGroupByStringLength() throws Exception + { + testQuery( + "SELECT CHARACTER_LENGTH(dim1), COUNT(*) FROM druid.foo GROUP BY CHARACTER_LENGTH(dim1)", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new ExtractionDimensionSpec( + "dim1", + "d0", + StrlenExtractionFn.instance() + ) + ) + ) + .setAggregatorSpecs( + AGGS( + new CountAggregatorFactory("a0") + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{0, 1L}, + new Object[]{1, 2L}, + new Object[]{3, 2L}, + new Object[]{4, 1L} + ) + ); + } + + @Test + public void testTimeseries() throws Exception + { + testQuery( + "SELECT gran, SUM(cnt) FROM (SELECT floor(__time TO month) AS gran, cnt FROM druid.foo) AS x GROUP BY gran ORDER BY gran", + ImmutableList.of( + Druids.newTimeseriesQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.MONTH) + .aggregators(AGGS(new LongSumAggregatorFactory("a0", "cnt"))) + .context(TIMESERIES_CONTEXT) + .build() + ), + ImmutableList.of( + new Object[]{T("2000-01-01"), 3L}, + new Object[]{T("2001-01-01"), 3L} + ) + ); + } + + @Test + public void testGroupByExtractYear() throws Exception + { + if (!CALCITE_1_11_0) { + // https://issues.apache.org/jira/browse/CALCITE-1509 + return; + } + + testQuery( + "SELECT\n" + + " EXTRACT(YEAR FROM __time) AS \"year\",\n" + + " SUM(cnt)\n" + + "FROM druid.foo\n" + + "GROUP BY EXTRACT(YEAR FROM __time)\n" + + "ORDER BY 1", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new ExtractionDimensionSpec( + "__time", + "d0", + new TimeFormatExtractionFn("Y", null, null, QueryGranularities.NONE, true) + ) + ) + ) + .setAggregatorSpecs(AGGS(new LongSumAggregatorFactory("a0", "cnt"))) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec( + "d0", + OrderByColumnSpec.Direction.ASCENDING, + StringComparators.NUMERIC + ) + ), + Integer.MAX_VALUE + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{2000L, 3L}, + new Object[]{2001L, 3L} + ) + ); + } + + @Test + public void testExtractFloorTime() throws Exception + { + if (!CALCITE_1_11_0) { + // https://issues.apache.org/jira/browse/CALCITE-1509 + return; + } + + testQuery( + "SELECT\n" + + "EXTRACT(YEAR FROM FLOOR(__time TO YEAR)) AS \"year\", SUM(cnt)\n" + + "FROM druid.foo\n" + + "GROUP BY EXTRACT(YEAR FROM FLOOR(__time TO YEAR))", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new ExtractionDimensionSpec( + "__time", + "d0", + CASCADE( + new TimeFormatExtractionFn(null, null, null, QueryGranularities.YEAR, true), + new TimeFormatExtractionFn("Y", null, null, QueryGranularities.NONE, true) + ) + ) + ) + ) + .setAggregatorSpecs(AGGS(new LongSumAggregatorFactory("a0", "cnt"))) + .build() + ), + ImmutableList.of( + new Object[]{2000L, 3L}, + new Object[]{2001L, 3L} + ) + ); + } + + @Test + public void testTimeseriesWithLimitNoTopN() throws Exception + { + testQuery( + PLANNER_CONFIG_NO_TOPN, + "SELECT gran, SUM(cnt)\n" + + "FROM (\n" + + " SELECT floor(__time TO month) AS gran, cnt\n" + + " FROM druid.foo\n" + + ") AS x\n" + + "GROUP BY gran\n" + + "ORDER BY gran\n" + + "LIMIT 1", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new ExtractionDimensionSpec( + "__time", + "d0", + new TimeFormatExtractionFn(null, null, null, QueryGranularities.MONTH, true) + ) + ) + ) + .setAggregatorSpecs(AGGS(new LongSumAggregatorFactory("a0", "cnt"))) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec( + "d0", + OrderByColumnSpec.Direction.ASCENDING, + StringComparators.NUMERIC + ) + ), + 1 + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{T("2000-01-01"), 3L} + ) + ); + } + + @Test + public void testTimeseriesWithLimit() throws Exception + { + testQuery( + "SELECT gran, SUM(cnt)\n" + + "FROM (\n" + + " SELECT floor(__time TO month) AS gran, cnt\n" + + " FROM druid.foo\n" + + ") AS x\n" + + "GROUP BY gran\n" + + "ORDER BY gran\n" + + "LIMIT 1", + ImmutableList.of( + new TopNQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .dimension( + new ExtractionDimensionSpec( + "__time", + "d0", + new TimeFormatExtractionFn(null, null, null, QueryGranularities.MONTH, true) + ) + ) + .aggregators(AGGS(new LongSumAggregatorFactory("a0", "cnt"))) + .metric(new DimensionTopNMetricSpec(null, StringComparators.NUMERIC)) + .threshold(1) + .build() + ), + ImmutableList.of( + new Object[]{T("2000-01-01"), 3L} + ) + ); + } + + @Test + public void testGroupByTimeAndOtherDimension() throws Exception + { + testQuery( + "SELECT dim2, gran, SUM(cnt)\n" + + "FROM (SELECT FLOOR(__time TO MONTH) AS gran, dim2, cnt FROM druid.foo) AS x\n" + + "GROUP BY dim2, gran\n" + + "ORDER BY dim2, gran", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimensions( + DIMS( + new DefaultDimensionSpec("dim2", "d1"), + new ExtractionDimensionSpec( + "__time", + "d0", + new TimeFormatExtractionFn(null, null, null, QueryGranularities.MONTH, true) + ) + ) + ) + .setAggregatorSpecs(AGGS(new LongSumAggregatorFactory("a0", "cnt"))) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of( + new OrderByColumnSpec("d1", OrderByColumnSpec.Direction.ASCENDING), + new OrderByColumnSpec( + "d0", + OrderByColumnSpec.Direction.ASCENDING, + StringComparators.NUMERIC + ) + ), + Integer.MAX_VALUE + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{"", T("2000-01-01"), 2L}, + new Object[]{"", T("2001-01-01"), 1L}, + new Object[]{"a", T("2000-01-01"), 1L}, + new Object[]{"a", T("2001-01-01"), 1L}, + new Object[]{"abc", T("2001-01-01"), 1L} + ) + ); + } + + @Test + public void testUsingSubqueryAsFilter() throws Exception + { + testQuery( + "SELECT dim1, dim2, COUNT(*) FROM druid.foo " + + "WHERE dim2 IN (SELECT dim1 FROM druid.foo WHERE dim1 <> '')" + + "AND dim1 <> 'xxx'" + + "group by dim1, dim2 ORDER BY dim2", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimFilter(NOT(SELECTOR("dim1", "", null))) + .setDimensions(DIMS(new DefaultDimensionSpec("dim1", "v2"))) + .build(), + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimFilter( + AND( + IN("dim2", ImmutableList.of("1", "10.1", "2", "abc", "def"), null), + NOT(SELECTOR("dim1", "xxx", null)) + ) + ) + .setDimensions( + DIMS( + new DefaultDimensionSpec("dim2", "d1"), + new DefaultDimensionSpec("dim1", "d0") + ) + ) + .setAggregatorSpecs(AGGS(new CountAggregatorFactory("a0"))) + .setLimitSpec( + new DefaultLimitSpec( + ImmutableList.of(new OrderByColumnSpec("d1", OrderByColumnSpec.Direction.ASCENDING)), + Integer.MAX_VALUE + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{"def", "abc", 1L} + ) + ); + } + + @Test + public void testUsingSubqueryAsFilterOnTwoColumns() throws Exception + { + if (!CALCITE_1_11_0) { + // https://issues.apache.org/jira/browse/CALCITE-1479 + return; + } + + testQuery( + "SELECT __time, cnt, dim1, dim2 FROM druid.foo " + + " WHERE (dim1, dim2) IN (" + + " SELECT dim1, dim2 FROM (" + + " SELECT dim1, dim2, COUNT(*)" + + " FROM druid.foo" + + " WHERE dim2 = 'abc'" + + " GROUP BY dim1, dim2" + + " HAVING COUNT(*) = 1" + + " )" + + " )", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimFilter(SELECTOR("dim2", "abc", null)) + .setDimensions(DIMS( + new DefaultDimensionSpec("dim1", "d0"), + new DefaultDimensionSpec("dim2", "d1") + )) + .setAggregatorSpecs(AGGS(new CountAggregatorFactory("a0"))) + .setHavingSpec(new DimFilterHavingSpec(NUMERIC_SELECTOR("a0", "1", null))) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .dimensionSpecs(DIMS( + new DefaultDimensionSpec("dim1", "d1"), + new DefaultDimensionSpec("dim2", "d2") + )) + .metrics(ImmutableList.of("cnt")) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(AND(SELECTOR("dim1", "def", null), SELECTOR("dim2", "abc", null))) + .pagingSpec(FIRST_PAGING_SPEC) + .build(), + Druids.newSelectQueryBuilder() + .dataSource(CalciteTests.DATASOURCE) + .dimensionSpecs(DIMS( + new DefaultDimensionSpec("dim1", "d1"), + new DefaultDimensionSpec("dim2", "d2") + )) + .metrics(ImmutableList.of("cnt")) + .intervals(QSS(Filtration.eternity())) + .granularity(QueryGranularities.ALL) + .filters(AND(SELECTOR("dim1", "def", null), SELECTOR("dim2", "abc", null))) + .pagingSpec( + new PagingSpec( + ImmutableMap.of("foo_1970-01-01T00:00:00.000Z_2001-01-03T00:00:00.001Z_1", 0), + 1000, + true + ) + ) + .build() + ), + ImmutableList.of( + new Object[]{T("2001-01-02"), 1L, "def", "abc"} + ) + ); + } + + @Test + public void testUsingSubqueryWithExtractionFns() throws Exception + { + testQuery( + "SELECT dim2, COUNT(*) FROM druid.foo " + + "WHERE substring(dim2, 1, 1) IN (SELECT substring(dim1, 1, 1) FROM druid.foo WHERE dim1 <> '')" + + "group by dim2", + ImmutableList.of( + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimFilter(NOT(SELECTOR("dim1", "", null))) + .setDimensions( + DIMS(new ExtractionDimensionSpec("dim1", "v0", new SubstringDimExtractionFn(0, 1))) + ) + .build(), + GroupByQuery.builder() + .setDataSource(CalciteTests.DATASOURCE) + .setInterval(QSS(Filtration.eternity())) + .setGranularity(QueryGranularities.ALL) + .setDimFilter( + IN( + "dim2", + ImmutableList.of("1", "2", "a", "d"), + new SubstringDimExtractionFn(0, 1) + ) + ) + .setDimensions(DIMS(new DefaultDimensionSpec("dim2", "d0"))) + .setAggregatorSpecs(AGGS(new CountAggregatorFactory("a0"))) + .build() + ), + ImmutableList.of( + new Object[]{"a", 2L}, + new Object[]{"abc", 1L} + ) + ); + } + + private void testQuery( + final String sql, + final List expectedQueries, + final List expectedResults + ) throws Exception + { + testQuery(PLANNER_CONFIG_DEFAULT, sql, expectedQueries, expectedResults); + } + + private void testQuery( + final PlannerConfig plannerConfig, + final String sql, + final List expectedQueries, + final List expectedResults + ) throws Exception + { + recordedQueries.clear(); + + log.info("SQL: %s", sql); + + final Connection theConnection = connections.get(plannerConfig); + final ResultSet resultSet = theConnection.createStatement().executeQuery(sql); + final ResultSetMetaData metaData = resultSet.getMetaData(); + final List results = Lists.newArrayList(); + + while (resultSet.next()) { + final Object[] row = new Object[metaData.getColumnCount()]; + for (int i = 0; i < row.length; i++) { + row[i] = resultSet.getObject(i + 1); + } + log.info("Result row: %s", Arrays.toString(row)); + results.add(row); + } + + Assert.assertEquals("result count", expectedResults.size(), results.size()); + for (int i = 0; i < results.size(); i++) { + Assert.assertArrayEquals("result #" + (i + 1), expectedResults.get(i), results.get(i)); + } + + if (expectedQueries != null) { + Assert.assertEquals("query count", expectedQueries.size(), recordedQueries.size()); + for (int i = 0; i < expectedQueries.size(); i++) { + Assert.assertEquals("query #" + (i + 1), expectedQueries.get(i), recordedQueries.get(i)); + } + } + } + + // Generate java.util.Date, for expected results + private static Date T(final String timeString) + { + return new Date(new DateTime(timeString).getMillis()); + } + + private static QuerySegmentSpec QSS(final Interval... intervals) + { + return new MultipleIntervalSegmentSpec(Arrays.asList(intervals)); + } + + private static AndDimFilter AND(DimFilter... filters) + { + return new AndDimFilter(Arrays.asList(filters)); + } + + private static OrDimFilter OR(DimFilter... filters) + { + return new OrDimFilter(Arrays.asList(filters)); + } + + private static NotDimFilter NOT(DimFilter filter) + { + return new NotDimFilter(filter); + } + + private static InDimFilter IN(String dimension, List values, ExtractionFn extractionFn) + { + return new InDimFilter(dimension, values, extractionFn); + } + + private static SelectorDimFilter SELECTOR(final String fieldName, final String value, final ExtractionFn extractionFn) + { + return new SelectorDimFilter(fieldName, value, extractionFn); + } + + private static DimFilter NUMERIC_SELECTOR( + final String fieldName, + final String value, + final ExtractionFn extractionFn + ) + { + // We use Bound filters for numeric equality to achieve "10.0" = "10" + return BOUND(fieldName, value, value, false, false, extractionFn, StringComparators.NUMERIC); + } + + private static BoundDimFilter BOUND( + final String fieldName, + final String lower, + final String upper, + final boolean lowerStrict, + final boolean upperStrict, + final ExtractionFn extractionFn, + final StringComparator comparator + ) + { + return new BoundDimFilter(fieldName, lower, upper, lowerStrict, upperStrict, null, extractionFn, comparator); + } + + private static BoundDimFilter TIME_BOUND(final Object intervalObj) + { + final Interval interval = new Interval(intervalObj); + return new BoundDimFilter( + Column.TIME_COLUMN_NAME, + String.valueOf(interval.getStartMillis()), + String.valueOf(interval.getEndMillis()), + false, + true, + null, + null, + StringComparators.NUMERIC + ); + } + + private static CascadeExtractionFn CASCADE(final ExtractionFn... fns) + { + return new CascadeExtractionFn(fns); + } + + private static List DIMS(final DimensionSpec... dimensionSpecs) + { + return Arrays.asList(dimensionSpecs); + } + + private static List AGGS(final AggregatorFactory... aggregators) + { + return Arrays.asList(aggregators); + } +} diff --git a/sql/src/test/java/io/druid/sql/calcite/DruidSchemaTest.java b/sql/src/test/java/io/druid/sql/calcite/DruidSchemaTest.java new file mode 100644 index 00000000000..35d1e94acb2 --- /dev/null +++ b/sql/src/test/java/io/druid/sql/calcite/DruidSchemaTest.java @@ -0,0 +1,133 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite; + +import com.google.common.collect.ImmutableSet; +import com.google.common.collect.Iterables; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.table.DruidTable; +import io.druid.sql.calcite.util.CalciteTests; +import io.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker; +import io.druid.sql.calcite.util.TestServerInventoryView; +import org.apache.calcite.jdbc.CalciteConnection; +import org.apache.calcite.jdbc.JavaTypeFactoryImpl; +import org.apache.calcite.rel.type.RelDataType; +import org.apache.calcite.rel.type.RelDataTypeField; +import org.apache.calcite.schema.Table; +import org.apache.calcite.sql.type.SqlTypeName; +import org.junit.After; +import org.junit.Assert; +import org.junit.Before; +import org.junit.Rule; +import org.junit.Test; +import org.junit.rules.TemporaryFolder; + +import java.sql.Connection; +import java.sql.DriverManager; +import java.util.List; +import java.util.Map; +import java.util.Properties; + +public class DruidSchemaTest +{ + private static final PlannerConfig PLANNER_CONFIG_DEFAULT = new PlannerConfig(); + private static final PlannerConfig PLANNER_CONFIG_NO_TOPN = new PlannerConfig() + { + @Override + public int getMaxTopNLimit() + { + return 0; + } + + @Override + public boolean isUseApproximateTopN() + { + return false; + } + }; + + @Rule + public TemporaryFolder temporaryFolder = new TemporaryFolder(); + + private SpecificSegmentsQuerySegmentWalker walker = null; + private DruidSchema schema = null; + private Connection connection = null; + + @Before + public void setUp() throws Exception + { + walker = CalciteTests.createWalker(temporaryFolder.newFolder()); + + Properties props = new Properties(); + props.setProperty("caseSensitive", "true"); + props.setProperty("unquotedCasing", "UNCHANGED"); + connection = DriverManager.getConnection("jdbc:calcite:", props); + CalciteConnection calciteConnection = connection.unwrap(CalciteConnection.class); + + schema = new DruidSchema( + walker, + new TestServerInventoryView(walker.getSegments()), + PLANNER_CONFIG_DEFAULT + ); + + calciteConnection.getRootSchema().add("s", schema); + schema.start(); + schema.awaitInitialization(); + } + + @After + public void tearDown() throws Exception + { + schema.stop(); + walker.close(); + connection.close(); + } + + @Test + public void testGetTableMap() + { + Assert.assertEquals(ImmutableSet.of("foo"), schema.getTableNames()); + + final Map tableMap = schema.getTableMap(); + Assert.assertEquals(1, tableMap.size()); + Assert.assertEquals("foo", Iterables.getOnlyElement(tableMap.keySet())); + + final DruidTable druidTable = (DruidTable) Iterables.getOnlyElement(tableMap.values()); + final RelDataType rowType = druidTable.getRowType(new JavaTypeFactoryImpl()); + final List fields = rowType.getFieldList(); + + Assert.assertEquals(5, fields.size()); + + Assert.assertEquals("__time", fields.get(0).getName()); + Assert.assertEquals(SqlTypeName.TIMESTAMP, fields.get(0).getType().getSqlTypeName()); + + Assert.assertEquals("cnt", fields.get(1).getName()); + Assert.assertEquals(SqlTypeName.BIGINT, fields.get(1).getType().getSqlTypeName()); + + Assert.assertEquals("dim1", fields.get(2).getName()); + Assert.assertEquals(SqlTypeName.VARCHAR, fields.get(2).getType().getSqlTypeName()); + + Assert.assertEquals("dim2", fields.get(3).getName()); + Assert.assertEquals(SqlTypeName.VARCHAR, fields.get(3).getType().getSqlTypeName()); + + Assert.assertEquals("m1", fields.get(4).getName()); + Assert.assertEquals(SqlTypeName.FLOAT, fields.get(4).getType().getSqlTypeName()); + } +} diff --git a/sql/src/test/java/io/druid/sql/calcite/filtration/FiltrationTest.java b/sql/src/test/java/io/druid/sql/calcite/filtration/FiltrationTest.java new file mode 100644 index 00000000000..e38d12c399c --- /dev/null +++ b/sql/src/test/java/io/druid/sql/calcite/filtration/FiltrationTest.java @@ -0,0 +1,62 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.filtration; + +import com.google.common.collect.ImmutableList; +import io.druid.query.filter.IntervalDimFilter; +import io.druid.query.filter.NotDimFilter; +import io.druid.segment.column.Column; +import org.joda.time.Interval; +import org.junit.Assert; +import org.junit.Test; + +public class FiltrationTest +{ + @Test + public void testNotIntervals() + { + final Filtration filtration = Filtration.create( + new NotDimFilter( + new IntervalDimFilter( + Column.TIME_COLUMN_NAME, + ImmutableList.of(new Interval("2000/2001"), new Interval("2002/2003")), + null + ) + ), + null + ).optimize(null); + + Assert.assertEquals( + ImmutableList.of(Filtration.eternity()), + filtration.getIntervals() + ); + + Assert.assertEquals( + new NotDimFilter( + new IntervalDimFilter( + Column.TIME_COLUMN_NAME, + ImmutableList.of(new Interval("2000/2001"), new Interval("2002/2003")), + null + ) + ), + filtration.getDimFilter() + ); + } +} diff --git a/sql/src/test/java/io/druid/sql/calcite/http/SqlResourceTest.java b/sql/src/test/java/io/druid/sql/calcite/http/SqlResourceTest.java new file mode 100644 index 00000000000..625631b99c2 --- /dev/null +++ b/sql/src/test/java/io/druid/sql/calcite/http/SqlResourceTest.java @@ -0,0 +1,161 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.http; + +import com.fasterxml.jackson.core.type.TypeReference; +import com.fasterxml.jackson.databind.ObjectMapper; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.ImmutableMap; +import io.druid.jackson.DefaultObjectMapper; +import io.druid.query.QueryInterruptedException; +import io.druid.sql.calcite.planner.Calcites; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.util.CalciteTests; +import io.druid.sql.http.SqlQuery; +import io.druid.sql.http.SqlResource; +import org.apache.calcite.jdbc.CalciteConnection; +import org.junit.After; +import org.junit.Assert; +import org.junit.Before; +import org.junit.Rule; +import org.junit.Test; +import org.junit.rules.ExpectedException; +import org.junit.rules.TemporaryFolder; + +import javax.ws.rs.core.Response; +import javax.ws.rs.core.StreamingOutput; +import java.io.ByteArrayOutputStream; +import java.util.List; +import java.util.Map; + +public class SqlResourceTest +{ + private static final ObjectMapper JSON_MAPPER = new DefaultObjectMapper(); + + @Rule + public ExpectedException expectedException = ExpectedException.none(); + + @Rule + public TemporaryFolder temporaryFolder = new TemporaryFolder(); + + private CalciteConnection connection; + private SqlResource resource; + + @Before + public void setUp() throws Exception + { + final PlannerConfig plannerConfig = new PlannerConfig(); + connection = Calcites.jdbc( + CalciteTests.createMockSchema( + CalciteTests.createWalker(temporaryFolder.newFolder()), + plannerConfig + ), + plannerConfig + ); + resource = new SqlResource(JSON_MAPPER, connection); + } + + @After + public void tearDown() throws Exception + { + connection.close(); + connection = null; + } + + @Test + public void testCountStar() throws Exception + { + final List> rows = doPost( + new SqlQuery("SELECT COUNT(*) AS cnt FROM druid.foo") + ); + + Assert.assertEquals( + ImmutableList.of( + ImmutableMap.of("cnt", 6) + ), + rows + ); + } + + @Test + public void testTimestampsInResponse() throws Exception + { + final List> rows = doPost( + new SqlQuery("SELECT __time FROM druid.foo LIMIT 1") + ); + + Assert.assertEquals( + ImmutableList.of( + ImmutableMap.of("__time", "2000-01-01T00:00:00.000Z") + ), + rows + ); + } + + @Test + public void testExplainCountStar() throws Exception + { + final List> rows = doPost( + new SqlQuery("EXPLAIN PLAN FOR SELECT COUNT(*) AS cnt FROM druid.foo") + ); + + Assert.assertEquals( + ImmutableList.of( + ImmutableMap.of( + "PLAN", + "EnumerableInterpreter\n" + + " DruidQueryRel(dataSource=[foo], dimensions=[[]], aggregations=[[Aggregation{aggregatorFactories=[CountAggregatorFactory{name='a0'}], postAggregator=null, finalizingPostAggregatorFactory=null}]])\n" + ) + ), + rows + ); + } + + @Test + public void testCannotPlan() throws Exception + { + expectedException.expect(QueryInterruptedException.class); + expectedException.expectMessage("Column 'dim3' not found in any table"); + + doPost( + new SqlQuery("SELECT dim3 FROM druid.foo") + ); + + Assert.fail(); + } + + private List> doPost(final SqlQuery query) throws Exception + { + final Response response = resource.doPost(query); + if (response.getStatus() == 200) { + final StreamingOutput output = (StreamingOutput) response.getEntity(); + final ByteArrayOutputStream baos = new ByteArrayOutputStream(); + output.write(baos); + return JSON_MAPPER.readValue( + baos.toByteArray(), + new TypeReference>>() + { + } + ); + } else { + throw JSON_MAPPER.readValue((byte[]) response.getEntity(), QueryInterruptedException.class); + } + } +} diff --git a/sql/src/test/java/io/druid/sql/calcite/util/CalciteTests.java b/sql/src/test/java/io/druid/sql/calcite/util/CalciteTests.java new file mode 100644 index 00000000000..7b25ed5cfb2 --- /dev/null +++ b/sql/src/test/java/io/druid/sql/calcite/util/CalciteTests.java @@ -0,0 +1,247 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.util; + +import com.google.common.base.Supplier; +import com.google.common.collect.ImmutableList; +import com.google.common.collect.ImmutableMap; +import io.druid.collections.StupidPool; +import io.druid.data.input.InputRow; +import io.druid.data.input.impl.DimensionsSpec; +import io.druid.data.input.impl.InputRowParser; +import io.druid.data.input.impl.MapInputRowParser; +import io.druid.data.input.impl.TimeAndDimsParseSpec; +import io.druid.data.input.impl.TimestampSpec; +import io.druid.query.DefaultQueryRunnerFactoryConglomerate; +import io.druid.query.Query; +import io.druid.query.QueryRunnerFactory; +import io.druid.query.QueryRunnerFactoryConglomerate; +import io.druid.query.QueryRunnerTestHelper; +import io.druid.query.QuerySegmentWalker; +import io.druid.query.TableDataSource; +import io.druid.query.aggregation.AggregatorFactory; +import io.druid.query.aggregation.CountAggregatorFactory; +import io.druid.query.aggregation.DoubleSumAggregatorFactory; +import io.druid.query.aggregation.hyperloglog.HyperUniquesAggregatorFactory; +import io.druid.query.groupby.GroupByQuery; +import io.druid.query.groupby.GroupByQueryConfig; +import io.druid.query.groupby.GroupByQueryRunnerTest; +import io.druid.query.groupby.strategy.GroupByStrategySelector; +import io.druid.query.metadata.SegmentMetadataQueryConfig; +import io.druid.query.metadata.SegmentMetadataQueryQueryToolChest; +import io.druid.query.metadata.SegmentMetadataQueryRunnerFactory; +import io.druid.query.metadata.metadata.SegmentMetadataQuery; +import io.druid.query.select.SelectQuery; +import io.druid.query.select.SelectQueryEngine; +import io.druid.query.select.SelectQueryQueryToolChest; +import io.druid.query.select.SelectQueryRunnerFactory; +import io.druid.query.timeseries.TimeseriesQuery; +import io.druid.query.timeseries.TimeseriesQueryEngine; +import io.druid.query.timeseries.TimeseriesQueryQueryToolChest; +import io.druid.query.timeseries.TimeseriesQueryRunnerFactory; +import io.druid.query.topn.TopNQuery; +import io.druid.query.topn.TopNQueryConfig; +import io.druid.query.topn.TopNQueryQueryToolChest; +import io.druid.query.topn.TopNQueryRunnerFactory; +import io.druid.segment.IndexBuilder; +import io.druid.segment.QueryableIndex; +import io.druid.segment.TestHelper; +import io.druid.segment.column.ValueType; +import io.druid.segment.incremental.IncrementalIndexSchema; +import io.druid.sql.calcite.planner.PlannerConfig; +import io.druid.sql.calcite.table.DruidTable; +import io.druid.timeline.DataSegment; +import io.druid.timeline.partition.LinearShardSpec; +import org.apache.calcite.schema.Schema; +import org.apache.calcite.schema.Table; +import org.apache.calcite.schema.impl.AbstractSchema; + +import java.io.File; +import java.nio.ByteBuffer; +import java.util.List; +import java.util.Map; + +/** + * Utility functions for Calcite tests. + */ +public class CalciteTests +{ + public static final String DATASOURCE = "foo"; + + private static final String TIMESTAMP_COLUMN = "t"; + private static final InputRowParser> PARSER = new MapInputRowParser( + new TimeAndDimsParseSpec( + new TimestampSpec(TIMESTAMP_COLUMN, "iso", null), + new DimensionsSpec( + DimensionsSpec.getDefaultSchemas(ImmutableList.of("dim1", "dim2")), + null, + null + ) + ) + ); + private static final List ROWS = ImmutableList.of( + ROW(ImmutableMap.of("t", "2000-01-01", "m1", "1.0", "dim1", "", "dim2", ImmutableList.of("a"))), + ROW(ImmutableMap.of("t", "2000-01-02", "m1", "2.0", "dim1", "10.1", "dim2", ImmutableList.of())), + ROW(ImmutableMap.of("t", "2000-01-03", "m1", "3.0", "dim1", "2", "dim2", ImmutableList.of(""))), + ROW(ImmutableMap.of("t", "2001-01-01", "m1", "4.0", "dim1", "1", "dim2", ImmutableList.of("a"))), + ROW(ImmutableMap.of("t", "2001-01-02", "m1", "5.0", "dim1", "def", "dim2", ImmutableList.of("abc"))), + ROW(ImmutableMap.of("t", "2001-01-03", "m1", "6.0", "dim1", "abc")) + ); + private static final Map COLUMN_TYPES = ImmutableMap.of( + "__time", ValueType.LONG, + "cnt", ValueType.LONG, + "dim1", ValueType.STRING, + "dim2", ValueType.STRING, + "m1", ValueType.FLOAT + ); + + private CalciteTests() + { + // No instantiation. + } + + public static SpecificSegmentsQuerySegmentWalker createWalker(final File tmpDir) + { + return createWalker(tmpDir, ROWS); + } + + public static SpecificSegmentsQuerySegmentWalker createWalker(final File tmpDir, final List rows) + { + final QueryableIndex index = IndexBuilder.create() + .tmpDir(tmpDir) + .indexMerger(TestHelper.getTestIndexMergerV9()) + .schema( + new IncrementalIndexSchema.Builder() + .withMetrics( + new AggregatorFactory[]{ + new CountAggregatorFactory("cnt"), + new DoubleSumAggregatorFactory("m1", "m1"), + new HyperUniquesAggregatorFactory("unique_dim1", "dim1") + } + ) + .withRollup(false) + .build() + ) + .rows(rows) + .buildMMappedIndex(); + + final QueryRunnerFactoryConglomerate conglomerate = new DefaultQueryRunnerFactoryConglomerate( + ImmutableMap., QueryRunnerFactory>builder() + .put( + SegmentMetadataQuery.class, + new SegmentMetadataQueryRunnerFactory( + new SegmentMetadataQueryQueryToolChest( + new SegmentMetadataQueryConfig("P1W") + ), + QueryRunnerTestHelper.NOOP_QUERYWATCHER + ) + ) + .put( + SelectQuery.class, + new SelectQueryRunnerFactory( + new SelectQueryQueryToolChest( + TestHelper.getObjectMapper(), + QueryRunnerTestHelper.NoopIntervalChunkingQueryRunnerDecorator() + ), + new SelectQueryEngine(), + QueryRunnerTestHelper.NOOP_QUERYWATCHER + ) + ) + .put( + TimeseriesQuery.class, + new TimeseriesQueryRunnerFactory( + new TimeseriesQueryQueryToolChest( + QueryRunnerTestHelper.NoopIntervalChunkingQueryRunnerDecorator() + ), + new TimeseriesQueryEngine(), + QueryRunnerTestHelper.NOOP_QUERYWATCHER + ) + ) + .put( + TopNQuery.class, + new TopNQueryRunnerFactory( + new StupidPool<>( + new Supplier() + { + @Override + public ByteBuffer get() + { + return ByteBuffer.allocate(10 * 1024 * 1024); + } + } + ), + new TopNQueryQueryToolChest( + new TopNQueryConfig(), + QueryRunnerTestHelper.NoopIntervalChunkingQueryRunnerDecorator() + ), + QueryRunnerTestHelper.NOOP_QUERYWATCHER + ) + ) + .put( + GroupByQuery.class, + GroupByQueryRunnerTest.makeQueryRunnerFactory( + new GroupByQueryConfig() + { + @Override + public String getDefaultStrategy() + { + return GroupByStrategySelector.STRATEGY_V2; + } + } + ) + ) + .build() + ); + + return new SpecificSegmentsQuerySegmentWalker(conglomerate).add( + DataSegment.builder() + .dataSource(DATASOURCE) + .interval(index.getDataInterval()) + .version("1") + .shardSpec(new LinearShardSpec(0)) + .build(), + index + ); + } + + public static DruidTable createDruidTable(final QuerySegmentWalker walker, final PlannerConfig plannerConfig) + { + return new DruidTable(walker, new TableDataSource(DATASOURCE), plannerConfig, COLUMN_TYPES); + } + + public static Schema createMockSchema(final QuerySegmentWalker walker, final PlannerConfig plannerConfig) + { + final DruidTable druidTable = createDruidTable(walker, plannerConfig); + final Map tableMap = ImmutableMap.of(DATASOURCE, druidTable); + return new AbstractSchema() + { + @Override + protected Map getTableMap() + { + return tableMap; + } + }; + } + + private static InputRow ROW(final ImmutableMap map) + { + return PARSER.parse((Map) map); + } +} diff --git a/sql/src/test/java/io/druid/sql/calcite/util/SpecificSegmentsQuerySegmentWalker.java b/sql/src/test/java/io/druid/sql/calcite/util/SpecificSegmentsQuerySegmentWalker.java new file mode 100644 index 00000000000..332f9189671 --- /dev/null +++ b/sql/src/test/java/io/druid/sql/calcite/util/SpecificSegmentsQuerySegmentWalker.java @@ -0,0 +1,217 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.util; + +import com.google.common.base.Function; +import com.google.common.collect.Iterables; +import com.google.common.collect.Lists; +import com.google.common.collect.Maps; +import com.google.common.collect.Ordering; +import com.google.common.io.Closeables; +import com.google.common.util.concurrent.MoreExecutors; +import io.druid.java.util.common.ISE; +import io.druid.java.util.common.guava.FunctionalIterable; +import io.druid.query.FinalizeResultsQueryRunner; +import io.druid.query.NoopQueryRunner; +import io.druid.query.Query; +import io.druid.query.QueryRunner; +import io.druid.query.QueryRunnerFactory; +import io.druid.query.QueryRunnerFactoryConglomerate; +import io.druid.query.QuerySegmentWalker; +import io.druid.query.QueryToolChest; +import io.druid.query.SegmentDescriptor; +import io.druid.query.TableDataSource; +import io.druid.query.spec.SpecificSegmentQueryRunner; +import io.druid.query.spec.SpecificSegmentSpec; +import io.druid.segment.QueryableIndex; +import io.druid.segment.QueryableIndexSegment; +import io.druid.segment.Segment; +import io.druid.timeline.DataSegment; +import io.druid.timeline.TimelineObjectHolder; +import io.druid.timeline.VersionedIntervalTimeline; +import io.druid.timeline.partition.PartitionChunk; +import io.druid.timeline.partition.PartitionHolder; +import org.joda.time.Interval; + +import java.io.Closeable; +import java.io.IOException; +import java.util.List; +import java.util.Map; + +public class SpecificSegmentsQuerySegmentWalker implements QuerySegmentWalker, Closeable +{ + private final QueryRunnerFactoryConglomerate conglomerate; + private final Map> timelines = Maps.newHashMap(); + private final List closeables = Lists.newArrayList(); + private final List segments = Lists.newArrayList(); + + public SpecificSegmentsQuerySegmentWalker(QueryRunnerFactoryConglomerate conglomerate) + { + this.conglomerate = conglomerate; + } + + public SpecificSegmentsQuerySegmentWalker add( + final DataSegment descriptor, + final QueryableIndex index + ) + { + final Segment segment = new QueryableIndexSegment(descriptor.getIdentifier(), index); + if (!timelines.containsKey(descriptor.getDataSource())) { + timelines.put(descriptor.getDataSource(), new VersionedIntervalTimeline(Ordering.natural())); + } + + final VersionedIntervalTimeline timeline = timelines.get(descriptor.getDataSource()); + timeline.add(descriptor.getInterval(), descriptor.getVersion(), descriptor.getShardSpec().createChunk(segment)); + segments.add(descriptor); + return this; + } + + public List getSegments() + { + return segments; + } + + @Override + public QueryRunner getQueryRunnerForIntervals( + final Query query, + final Iterable intervals + ) + { + final VersionedIntervalTimeline timeline = getTimeline(query); + if (timeline == null) { + return new NoopQueryRunner<>(); + } + + final Iterable specs = FunctionalIterable + .create(intervals) + .transformCat( + new Function>>() + { + @Override + public Iterable> apply(final Interval interval) + { + return timeline.lookup(interval); + } + } + ) + .transformCat( + new Function, Iterable>() + { + @Override + public Iterable apply(final TimelineObjectHolder holder) + { + return FunctionalIterable + .create(holder.getObject()) + .transform( + new Function, SegmentDescriptor>() + { + @Override + public SegmentDescriptor apply(final PartitionChunk chunk) + { + return new SegmentDescriptor( + holder.getInterval(), + holder.getVersion(), + chunk.getChunkNumber() + ); + } + } + ); + } + } + ); + + return getQueryRunnerForSegments(query, specs); + } + + @Override + public QueryRunner getQueryRunnerForSegments( + final Query query, + final Iterable specs + ) + { + final VersionedIntervalTimeline timeline = getTimeline(query); + if (timeline == null) { + return new NoopQueryRunner<>(); + } + + final QueryRunnerFactory> factory = conglomerate.findFactory(query); + if (factory == null) { + throw new ISE("Unknown query type[%s].", query.getClass()); + } + + final QueryToolChest> toolChest = factory.getToolchest(); + + return new FinalizeResultsQueryRunner<>( + toolChest.mergeResults( + factory.mergeRunners( + MoreExecutors.sameThreadExecutor(), + FunctionalIterable + .create(specs) + .transformCat( + new Function>>() + { + @Override + public Iterable> apply(final SegmentDescriptor descriptor) + { + final PartitionHolder holder = timeline.findEntry( + descriptor.getInterval(), + descriptor.getVersion() + ); + + return Iterables.transform( + holder, + new Function, QueryRunner>() + { + @Override + public QueryRunner apply(PartitionChunk chunk) + { + return new SpecificSegmentQueryRunner( + factory.createRunner(chunk.getObject()), + new SpecificSegmentSpec(descriptor) + ); + } + } + ); + } + } + ) + ) + ), + toolChest + ); + } + + @Override + public void close() throws IOException + { + for (Closeable closeable : closeables) { + Closeables.close(closeable, true); + } + } + + private VersionedIntervalTimeline getTimeline(Query query) + { + if (query.getDataSource() instanceof TableDataSource) { + return timelines.get(((TableDataSource) query.getDataSource()).getName()); + } else { + return null; + } + } +} diff --git a/sql/src/test/java/io/druid/sql/calcite/util/TestServerInventoryView.java b/sql/src/test/java/io/druid/sql/calcite/util/TestServerInventoryView.java new file mode 100644 index 00000000000..193cc91c18c --- /dev/null +++ b/sql/src/test/java/io/druid/sql/calcite/util/TestServerInventoryView.java @@ -0,0 +1,95 @@ +/* + * Licensed to Metamarkets Group Inc. (Metamarkets) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. Metamarkets licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +package io.druid.sql.calcite.util; + +import com.google.common.collect.ImmutableList; +import io.druid.client.DruidServer; +import io.druid.client.ServerView; +import io.druid.client.TimelineServerView; +import io.druid.client.selector.ServerSelector; +import io.druid.query.DataSource; +import io.druid.query.QueryRunner; +import io.druid.server.coordination.DruidServerMetadata; +import io.druid.timeline.DataSegment; +import io.druid.timeline.TimelineLookup; + +import java.util.List; +import java.util.concurrent.Executor; + +public class TestServerInventoryView implements TimelineServerView +{ + private final List segments; + + public TestServerInventoryView(List segments) + { + this.segments = ImmutableList.copyOf(segments); + } + + @Override + public TimelineLookup getTimeline(DataSource dataSource) + { + throw new UnsupportedOperationException(); + } + + @Override + public void registerSegmentCallback(Executor exec, final SegmentCallback callback) + { + final DruidServerMetadata dummyServer = new DruidServerMetadata("dummy", "dummy", 0, "dummy", "dummy", 0); + + for (final DataSegment segment : segments) { + exec.execute( + new Runnable() + { + @Override + public void run() + { + callback.segmentAdded(dummyServer, segment); + } + } + ); + } + + exec.execute( + new Runnable() + { + @Override + public void run() + { + callback.segmentViewInitialized(); + } + } + ); + } + + @Override + public QueryRunner getQueryRunner(DruidServer server) + { + throw new UnsupportedOperationException(); + } + + @Override + public void registerServerCallback( + Executor exec, + ServerView.ServerCallback callback + ) + { + // Do nothing + } +}