SQL: Add support for explicit types in CsvSpecTests (elastic/x-pack-elasticsearch#2306)

Adds support for specifying column types in CSV Spec tests.
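Column types can be declared directly in the header of the expected results using a name:type suffix, for example: gender:s | p1:double. The single-letter shorthands s, b, i, l, f and d expand to the CsvJdbc types string, boolean, integer, long, float and double; full type names are passed through as-is, and headers without type annotations keep the existing auto-detection behavior.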

Original commit: elastic/x-pack-elasticsearch@4d5622f298
Igor Motov, 2017-08-18 12:12:06 -04:00 (committed by GitHub)
parent a68d839edc
commit 4c597a2944
2 changed files with 87 additions and 16 deletions

CsvSpecIT.java

@@ -7,40 +7,37 @@ package org.elasticsearch.xpack.sql.jdbc;
import com.carrotsearch.randomizedtesting.annotations.ParametersFactory;
import org.elasticsearch.common.Strings;
import org.elasticsearch.common.collect.Tuple;
import org.elasticsearch.common.io.Streams;
import org.elasticsearch.xpack.sql.jdbc.framework.SpecBaseIntegrationTestCase;
import org.elasticsearch.xpack.sql.util.CollectionUtils;
import org.relique.io.TableReader;
import org.relique.jdbc.csv.CsvConnection;
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.IOException;
import java.io.Reader;
import java.io.StringReader;
import java.io.StringWriter;
import java.nio.file.Path;
import java.sql.Connection;
import java.sql.ResultSet;
import java.sql.SQLException;
import java.sql.Statement;
import java.util.List;
import java.util.Locale;
import java.util.Properties;
import static org.elasticsearch.xpack.sql.jdbc.framework.JdbcAssert.assertResultSets;
import static org.hamcrest.Matchers.arrayWithSize;
/**
* Tests comparing SQL queries executed against our JDBC client
* with hard-coded result sets.
*/
public class CsvSpecIT extends SpecBaseIntegrationTestCase {
/**
* Properties used when setting up a CSV-based JDBC connection.
*/
private static final Properties CSV_PROPERTIES = new Properties();
static {
CSV_PROPERTIES.setProperty("charset", "UTF-8");
// trigger auto-detection
CSV_PROPERTIES.setProperty("columnTypes", "");
CSV_PROPERTIES.setProperty("separator", "|");
CSV_PROPERTIES.setProperty("trimValues", "true");
}
private final CsvTestCase testCase;
@ParametersFactory(argumentFormatting = PARAM_FORMATTING)
@@ -49,7 +46,8 @@ public class CsvSpecIT extends SpecBaseIntegrationTestCase {
return CollectionUtils.combine(
readScriptSpec("/command.csv-spec", parser),
readScriptSpec("/fulltext.csv-spec", parser),
readScriptSpec("/agg.csv-spec", parser)
readScriptSpec("/agg.csv-spec", parser),
readScriptSpec("/columns.csv-spec", parser)
);
}
@@ -66,8 +64,14 @@
}
}
- private void assertMatchesCsv(String query, String csvTableName, String expectedResults) throws SQLException {
- Reader reader = new StringReader(expectedResults);
+ private void assertMatchesCsv(String query, String csvTableName, String expectedResults) throws SQLException, IOException {
+ Properties csvProperties = new Properties();
+ csvProperties.setProperty("charset", "UTF-8");
+ csvProperties.setProperty("separator", "|");
+ csvProperties.setProperty("trimValues", "true");
+ Tuple<String,String> resultsAndTypes = extractColumnTypes(expectedResults);
+ csvProperties.setProperty("columnTypes", resultsAndTypes.v2());
+ Reader reader = new StringReader(resultsAndTypes.v1());
TableReader tableReader = new TableReader() {
@Override
public Reader getReader(Statement statement, String tableName) throws SQLException {
@@ -79,7 +83,7 @@
throw new UnsupportedOperationException();
}
};
- try (Connection csv = new CsvConnection(tableReader, CSV_PROPERTIES, "") {};
+ try (Connection csv = new CsvConnection(tableReader, csvProperties, "") {};
Connection es = esJdbc()) {
// pass the testName as table for debugging purposes (in case the underlying reader is missing)
ResultSet expected = csv.createStatement(ResultSet.TYPE_SCROLL_INSENSITIVE, ResultSet.CONCUR_READ_ONLY)
@@ -91,6 +95,58 @@
}
}
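/**
* Splits the expected results into the CSV payload and the declared column types.
* If the header carries no ":" type annotations, the spec is returned untouched
* together with an empty type list, so CsvJdbc falls back to auto-detection.
*/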
private Tuple<String,String> extractColumnTypes(String expectedResults) throws IOException {
try (StringReader reader = new StringReader(expectedResults)) {
try (BufferedReader bufferedReader = new BufferedReader(reader)) {
String header = bufferedReader.readLine();
if (!header.contains(":")) {
// No type information in headers, no need to parse columns - trigger auto-detection
return new Tuple<>(expectedResults, "");
}
try (StringWriter writer = new StringWriter()) {
try (BufferedWriter bufferedWriter = new BufferedWriter(writer)) {
Tuple<String, String> headerAndColumns = extractColumnTypesFromHeader(header);
bufferedWriter.write(headerAndColumns.v1());
bufferedWriter.newLine();
bufferedWriter.flush();
// Copy the rest of the test spec unchanged
Streams.copy(bufferedReader, bufferedWriter);
return new Tuple<>(writer.toString(), headerAndColumns.v2());
}
}
}
}
}
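/**
* Parses a typed header such as "gender:s | p1:double" into the plain header
* "gender|p1" (v1) and the comma-separated CsvJdbc type list "string,double" (v2).
* Fails the test if only some of the columns carry a type annotation.
*/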
private Tuple<String,String> extractColumnTypesFromHeader(String header) {
String[] columnTypes = Strings.delimitedListToStringArray(header, "|", " \t");
StringBuilder types = new StringBuilder();
StringBuilder columns = new StringBuilder();
for (String column : columnTypes) {
String[] nameType = Strings.delimitedListToStringArray(column, ":");
assertThat("If at least one column has a type associated with it, all columns should have types", nameType, arrayWithSize(2));
if (types.length() > 0) {
types.append(",");
columns.append("|");
}
columns.append(nameType[0]);
types.append(resolveColumnType(nameType[1]));
}
return new Tuple<>(columns.toString(), types.toString());
}
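/**
* Expands the single-letter shorthands used in spec files to CsvJdbc type names;
* any other value (e.g. "double" or "timestamp") is passed through verbatim.
*/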
private String resolveColumnType(String type) {
switch (type.toLowerCase(Locale.ROOT)) {
case "s": return "string";
case "b": return "boolean";
case "i": return "integer";
case "l": return "long";
case "f": return "float";
case "d": return "double";
default: return type;
}
}
protected void assertResults(ResultSet expected, ResultSet actual) throws SQLException {
assertResultSets(expected, actual);
}

columns.csv-spec

@@ -0,0 +1,15 @@
//
// Test of explicit column types
// Columns can be specified as <ColumnName:ColumnType> or as <ColumnName>.
// If at least one column has an explicit type, all columns must have explicit types.
// If no column has a type, all types are auto-detected.
// Supported shorthands: s - string, b - boolean, i - integer, l - long, f - float, d - double;
// full CsvJdbc type names (e.g. double, timestamp, date) can also be used.
columnDetectionOverride
SELECT gender, FLOOR(PERCENTILE(emp_no, 97.76)) p1 FROM test_emp GROUP BY gender;
gender:s | p1:double
M | 10095
F | 10099
;