diff --git a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/Facet2DStream.java b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/Facet2DStream.java index 6e3dd0a7910..2ccb147d472 100644 --- a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/Facet2DStream.java +++ b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/Facet2DStream.java @@ -115,6 +115,11 @@ public class Facet2DStream extends TupleStream implements Expressible { params.add(namedParam.getName(), namedParam.getParameter().toString().trim()); } } + + if(params.get("q") == null) { + params.set("q", "*:*"); + } + Bucket x = null; if (bucketXExpression != null) { if (bucketXExpression.getParameter() instanceof StreamExpressionValue) { @@ -148,8 +153,8 @@ public class Facet2DStream extends TupleStream implements Expressible { String bucketSortString = metric.getIdentifier() + " desc"; FieldComparator bucketSort = parseBucketSort(bucketSortString, x, y); - int dimensionX = 0; - int dimensionY = 0; + int dimensionX = 10; + int dimensionY = 10; if (dimensionsExpression != null) { if (dimensionsExpression.getParameter() instanceof StreamExpressionValue) { String[] strDimensions = ((StreamExpressionValue) dimensionsExpression.getParameter()).getValue().split(","); diff --git a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/FacetStream.java b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/FacetStream.java index 9257df3435e..b2b28095b22 100644 --- a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/FacetStream.java +++ b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/FacetStream.java @@ -47,6 +47,7 @@ import org.apache.solr.client.solrj.io.stream.expr.StreamExpressionParameter; import org.apache.solr.client.solrj.io.stream.expr.StreamExpressionValue; import org.apache.solr.client.solrj.io.stream.expr.StreamFactory; import org.apache.solr.client.solrj.io.stream.metrics.Bucket; +import org.apache.solr.client.solrj.io.stream.metrics.CountMetric; import org.apache.solr.client.solrj.io.stream.metrics.Metric; import org.apache.solr.client.solrj.request.QueryRequest; import org.apache.solr.common.params.ModifiableSolrParams; @@ -148,6 +149,10 @@ public class FacetStream extends TupleStream implements Expressible { } } + if(params.get("q") == null) { + params.set("q", "*:*"); + } + // buckets, required - comma separated Bucket[] buckets = null; if(null != bucketExpression){ @@ -166,12 +171,31 @@ public class FacetStream extends TupleStream implements Expressible { throw new IOException(String.format(Locale.ROOT,"invalid expression %s - at least one bucket expected. eg. 'buckets=\"name\"'",expression,collectionName)); } + + // Construct the metrics + Metric[] metrics = new Metric[metricExpressions.size()]; + for(int idx = 0; idx < metricExpressions.size(); ++idx) { + metrics[idx] = factory.constructMetric(metricExpressions.get(idx)); + } + + if(metrics.length == 0) { + metrics = new Metric[1]; + metrics[0] = new CountMetric(); + } + String bucketSortString = null; if(bucketSortExpression == null) { - throw new IOException("The bucketSorts parameter is required for the facet function."); + bucketSortString = metrics[0].getIdentifier()+" desc"; } else { bucketSortString = ((StreamExpressionValue)bucketSortExpression.getParameter()).getValue(); + if(bucketSortString.contains("(") && + metricExpressions.size() == 0 && + (!bucketSortExpression.equals("count(*) desc") && + !bucketSortExpression.equals("count(*) asc"))) { + //Attempting bucket sort on a metric that is not going to be calculated. + throw new IOException(String.format(Locale.ROOT,"invalid expression %s - the bucketSort is being performed on a metric that is not being calculated.",expression,collectionName)); + } } FieldComparator[] bucketSorts = parseBucketSorts(bucketSortString, buckets); @@ -180,15 +204,7 @@ public class FacetStream extends TupleStream implements Expressible { throw new IOException(String.format(Locale.ROOT,"invalid expression %s - at least one bucket sort expected. eg. 'bucketSorts=\"name asc\"'",expression,collectionName)); } - // Construct the metrics - Metric[] metrics = new Metric[metricExpressions.size()]; - for(int idx = 0; idx < metricExpressions.size(); ++idx) { - metrics[idx] = factory.constructMetric(metricExpressions.get(idx)); - } - if(0 == metrics.length) { - throw new IOException(String.format(Locale.ROOT,"invalid expression %s - at least one metric expected.",expression,collectionName)); - } boolean refine = false; @@ -210,7 +226,7 @@ public class FacetStream extends TupleStream implements Expressible { methodStr = ((StreamExpressionValue) methodExpression.getParameter()).getValue(); } - int overfetchInt = 150; + int overfetchInt = 250; if(overfetchExpression != null) { String overfetchStr = ((StreamExpressionValue) overfetchExpression.getParameter()).getValue(); overfetchInt = Integer.parseInt(overfetchStr); diff --git a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/RandomFacadeStream.java b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/RandomFacadeStream.java index f9735cef9c4..0af858cf981 100644 --- a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/RandomFacadeStream.java +++ b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/RandomFacadeStream.java @@ -53,11 +53,6 @@ public class RandomFacadeStream extends TupleStream implements Expressible { throw new IOException(String.format(Locale.ROOT,"invalid expression %s - collectionName expected as first operand",expression)); } - // Named parameters - passed directly to solr as solrparams - if(0 == namedParams.size()){ - throw new IOException(String.format(Locale.ROOT,"invalid expression %s - at least one named parameter expected. eg. 'q=*:*'",expression)); - } - // pull out known named params Map params = new HashMap(); for(StreamExpressionNamedParameter namedParam : namedParams){ @@ -66,6 +61,20 @@ public class RandomFacadeStream extends TupleStream implements Expressible { } } + //Add sensible defaults + + if(!params.containsKey("q")) { + params.put("q", "*:*"); + } + + if(!params.containsKey("fl")) { + params.put("fl", "*"); + } + + if(!params.containsKey("rows")) { + params.put("rows", "500"); + } + // zkHost, optional - if not provided then will look into factory list to get String zkHost = null; if(null == zkHostExpression){ diff --git a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/RandomStream.java b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/RandomStream.java index 1a6083b8d9b..8f065000d65 100644 --- a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/RandomStream.java +++ b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/RandomStream.java @@ -88,10 +88,6 @@ public class RandomStream extends TupleStream implements Expressible { throw new IOException(String.format(Locale.ROOT,"invalid expression %s - collectionName expected as first operand",expression)); } - // Named parameters - passed directly to solr as solrparams - if(0 == namedParams.size()){ - throw new IOException(String.format(Locale.ROOT,"invalid expression %s - at least one named parameter expected. eg. 'q=*:*'",expression)); - } // pull out known named params Map params = new HashMap(); @@ -101,6 +97,7 @@ public class RandomStream extends TupleStream implements Expressible { } } + // zkHost, optional - if not provided then will look into factory list to get String zkHost = null; if(null == zkHostExpression){ diff --git a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/StatsStream.java b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/StatsStream.java index 81ffaa8d6ba..c497290d585 100644 --- a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/StatsStream.java +++ b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/StatsStream.java @@ -91,21 +91,12 @@ public class StatsStream extends TupleStream implements Expressible { List metricExpressions = factory.getExpressionOperandsRepresentingTypes(expression, Metric.class); StreamExpressionNamedParameter zkHostExpression = factory.getNamedOperand(expression, "zkHost"); - // Validate there are no unknown parameters - zkHost is namedParameter so we don't need to count it twice - if(expression.getParameters().size() != 1 + namedParams.size() + metricExpressions.size()){ - throw new IOException(String.format(Locale.ROOT,"invalid expression %s - unknown operands found",expression)); - } // Collection Name if(null == collectionName){ throw new IOException(String.format(Locale.ROOT,"invalid expression %s - collectionName expected as first operand",expression)); } - // Named parameters - passed directly to solr as solrparams - if(0 == namedParams.size()){ - throw new IOException(String.format(Locale.ROOT,"invalid expression %s - at least one named parameter expected. eg. 'q=*:*'",expression)); - } - ModifiableSolrParams params = new ModifiableSolrParams(); for(StreamExpressionNamedParameter namedParam : namedParams){ if(!namedParam.getName().equals("zkHost")){ @@ -113,6 +104,10 @@ public class StatsStream extends TupleStream implements Expressible { } } + if(params.get("q") == null) { + params.set("q", "*:*"); + } + // zkHost, optional - if not provided then will look into factory list to get String zkHost = null; if(null == zkHostExpression){ diff --git a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/TimeSeriesStream.java b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/TimeSeriesStream.java index 19c886aec5c..bccc4388b6d 100644 --- a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/TimeSeriesStream.java +++ b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/TimeSeriesStream.java @@ -45,6 +45,7 @@ import org.apache.solr.client.solrj.io.stream.expr.StreamExpressionNamedParamete import org.apache.solr.client.solrj.io.stream.expr.StreamExpressionParameter; import org.apache.solr.client.solrj.io.stream.expr.StreamExpressionValue; import org.apache.solr.client.solrj.io.stream.expr.StreamFactory; +import org.apache.solr.client.solrj.io.stream.metrics.CountMetric; import org.apache.solr.client.solrj.io.stream.metrics.Metric; import org.apache.solr.client.solrj.request.QueryRequest; import org.apache.solr.common.params.ModifiableSolrParams; @@ -100,34 +101,36 @@ public class TimeSeriesStream extends TupleStream implements Expressible { StreamExpressionNamedParameter fieldExpression = factory.getNamedOperand(expression, "field"); StreamExpressionNamedParameter gapExpression = factory.getNamedOperand(expression, "gap"); StreamExpressionNamedParameter formatExpression = factory.getNamedOperand(expression, "format"); - StreamExpressionNamedParameter qExpression = factory.getNamedOperand(expression, "q"); StreamExpressionNamedParameter zkHostExpression = factory.getNamedOperand(expression, "zkHost"); List metricExpressions = factory.getExpressionOperandsRepresentingTypes(expression, Expressible.class, Metric.class); - - if(qExpression == null) { - throw new IOException("The timeseries expression requires the q parameter"); - } - String start = null; if(startExpression != null) { start = ((StreamExpressionValue)startExpression.getParameter()).getValue(); + } else { + throw new IOException(String.format(Locale.ROOT,"invalid expression %s - start parameter is required",expression)); } String end = null; if(endExpression != null) { end = ((StreamExpressionValue)endExpression.getParameter()).getValue(); + } else { + throw new IOException(String.format(Locale.ROOT,"invalid expression %s - end parameter is required",expression)); } String gap = null; if(gapExpression != null) { gap = ((StreamExpressionValue)gapExpression.getParameter()).getValue(); - } + } else { + throw new IOException(String.format(Locale.ROOT,"invalid expression %s - gap parameter is required",expression)); + } String field = null; if(fieldExpression != null) { field = ((StreamExpressionValue)fieldExpression.getParameter()).getValue(); + } else { + throw new IOException(String.format(Locale.ROOT,"invalid expression %s - field parameter is required",expression)); } String format = null; @@ -146,13 +149,15 @@ public class TimeSeriesStream extends TupleStream implements Expressible { } // Construct the metrics - Metric[] metrics = new Metric[metricExpressions.size()]; - for(int idx = 0; idx < metricExpressions.size(); ++idx){ - metrics[idx] = factory.constructMetric(metricExpressions.get(idx)); - } - - if(0 == metrics.length){ - throw new IOException(String.format(Locale.ROOT,"invalid expression %s - at least one metric expected.",expression,collectionName)); + Metric[] metrics = null; + if(metricExpressions.size() > 0) { + metrics = new Metric[metricExpressions.size()]; + for(int idx = 0; idx < metricExpressions.size(); ++idx){ + metrics[idx] = factory.constructMetric(metricExpressions.get(idx)); + } + } else { + metrics = new Metric[1]; + metrics[0] = new CountMetric(); } // pull out known named params @@ -163,6 +168,10 @@ public class TimeSeriesStream extends TupleStream implements Expressible { } } + if(params.get("q") == null) { + params.set("q", "*:*"); + } + // zkHost, optional - if not provided then will look into factory list to get String zkHost = null; if(null == zkHostExpression){ diff --git a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/UpdateStream.java b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/UpdateStream.java index c00de1020c5..7ea88085940 100644 --- a/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/UpdateStream.java +++ b/solr/solrj/src/java/org/apache/solr/client/solrj/io/stream/UpdateStream.java @@ -237,10 +237,10 @@ public class UpdateStream extends TupleStream implements Expressible { private int extractBatchSize(StreamExpression expression, StreamFactory factory) throws IOException { StreamExpressionNamedParameter batchSizeParam = factory.getNamedOperand(expression, "batchSize"); - if(null == batchSizeParam || null == batchSizeParam.getParameter() || !(batchSizeParam.getParameter() instanceof StreamExpressionValue)){ - throw new IOException(String.format(Locale.ROOT,"Invalid expression %s - expecting a 'batchSize' parameter of type positive integer but didn't find one",expression)); + if(batchSizeParam == null) { + // Sensible default batch size + return 250; } - String batchSizeStr = ((StreamExpressionValue)batchSizeParam.getParameter()).getValue(); return parseBatchSize(batchSizeStr, expression); } diff --git a/solr/solrj/src/test/org/apache/solr/client/solrj/io/stream/StreamExpressionTest.java b/solr/solrj/src/test/org/apache/solr/client/solrj/io/stream/StreamExpressionTest.java index 9c6e345fc9c..7bb0584f8bb 100644 --- a/solr/solrj/src/test/org/apache/solr/client/solrj/io/stream/StreamExpressionTest.java +++ b/solr/solrj/src/test/org/apache/solr/client/solrj/io/stream/StreamExpressionTest.java @@ -664,12 +664,16 @@ public class StreamExpressionTest extends SolrCloudTestCase { assert (tuples4.size() == 1); sParams = new ModifiableSolrParams(StreamingTest.mapParams(CommonParams.QT, "/stream")); - sParams.add("expr", "random(" + COLLECTIONORALIAS + ", q=\"*:*\", rows=\"10001\", fl=\"id, a_i\")"); + sParams.add("expr", "random(" + COLLECTIONORALIAS + ")"); jetty = cluster.getJettySolrRunner(0); solrStream = new SolrStream(jetty.getBaseUrl().toString() + "/collection1", sParams); tuples4 = getTuples(solrStream); - assert (tuples4.size() == 1000); - + assert(tuples4.size() == 500); + Map fields = tuples4.get(0).fields; + assert(fields.containsKey("id")); + assert(fields.containsKey("a_f")); + assert(fields.containsKey("a_i")); + assert(fields.containsKey("a_s")); } finally { cache.close(); } @@ -792,6 +796,41 @@ public class StreamExpressionTest extends SolrCloudTestCase { assertTrue(avgf.doubleValue() == 5.5D); assertTrue(count.doubleValue() == 10); + //Test without query + + expr = "stats(" + COLLECTIONORALIAS + ", sum(a_i), sum(a_f), min(a_i), min(a_f), max(a_i), max(a_f), avg(a_i), avg(a_f), count(*))"; + expression = StreamExpressionParser.parse(expr); + stream = factory.constructStream(expression); + stream.setStreamContext(streamContext); + + tuples = getTuples(stream); + + assert (tuples.size() == 1); + + //Test Long and Double Sums + + tuple = tuples.get(0); + + sumi = tuple.getDouble("sum(a_i)"); + sumf = tuple.getDouble("sum(a_f)"); + mini = tuple.getDouble("min(a_i)"); + minf = tuple.getDouble("min(a_f)"); + maxi = tuple.getDouble("max(a_i)"); + maxf = tuple.getDouble("max(a_f)"); + avgi = tuple.getDouble("avg(a_i)"); + avgf = tuple.getDouble("avg(a_f)"); + count = tuple.getDouble("count(*)"); + + assertTrue(sumi.longValue() == 70); + assertTrue(sumf.doubleValue() == 55.0D); + assertTrue(mini.doubleValue() == 0.0D); + assertTrue(minf.doubleValue() == 1.0D); + assertTrue(maxi.doubleValue() == 14.0D); + assertTrue(maxf.doubleValue() == 10.0D); + assertTrue(avgi.doubleValue() == 7.0D); + assertTrue(avgf.doubleValue() == 5.5D); + assertTrue(count.doubleValue() == 10); + //Test with shards parameter List shardUrls = TupleStream.getShards(cluster.getZkServer().getZkAddress(), COLLECTIONORALIAS, streamContext); @@ -939,7 +978,7 @@ public class StreamExpressionTest extends SolrCloudTestCase { paramsLoc = new ModifiableSolrParams(); - expr = "facet2D(collection1, q=\"*:*\", x=\"diseases_s\", y=\"symptoms_s\", dimensions=\"3,1\")"; + expr = "facet2D(collection1, x=\"diseases_s\", y=\"symptoms_s\", dimensions=\"3,1\")"; paramsLoc.set("expr", expr); paramsLoc.set("qt", "/stream"); @@ -2780,7 +2819,7 @@ public class StreamExpressionTest extends SolrCloudTestCase { assertTrue(tuples.get(3).get("term_s").equals("f")); // update - expression = StreamExpressionParser.parse("update(destinationCollection, batchSize=5, " + featuresExpression + ")"); + expression = StreamExpressionParser.parse("update(destinationCollection, " + featuresExpression + ")"); stream = new UpdateStream(expression, factory); stream.setStreamContext(streamContext); getTuples(stream); diff --git a/solr/solrj/src/test/org/apache/solr/client/solrj/io/stream/StreamExpressionToExpessionTest.java b/solr/solrj/src/test/org/apache/solr/client/solrj/io/stream/StreamExpressionToExpessionTest.java index e71c769208a..d69047caf6a 100644 --- a/solr/solrj/src/test/org/apache/solr/client/solrj/io/stream/StreamExpressionToExpessionTest.java +++ b/solr/solrj/src/test/org/apache/solr/client/solrj/io/stream/StreamExpressionToExpessionTest.java @@ -296,7 +296,7 @@ public class StreamExpressionToExpessionTest extends SolrTestCase { assertTrue(expressionString.contains("bucketSorts=\"sum(a_i) asc\"")); assertTrue(expressionString.contains("rows=10")); assertTrue(expressionString.contains("offset=0")); - assertTrue(expressionString.contains("overfetch=150")); + assertTrue(expressionString.contains("overfetch=250")); assertTrue(expressionString.contains("sum(a_i)")); assertTrue(expressionString.contains("sum(a_f)")); assertTrue(expressionString.contains("min(a_i)")); @@ -306,8 +306,8 @@ public class StreamExpressionToExpessionTest extends SolrTestCase { assertTrue(expressionString.contains("avg(a_i,false)")); assertTrue(expressionString.contains("avg(a_f,false)")); assertTrue(expressionString.contains("count(*)")); - assertEquals(stream.getOverfetch(), 150); - assertEquals(stream.getBucketSizeLimit(), 160); + assertEquals(stream.getOverfetch(), 250); + assertEquals(stream.getBucketSizeLimit(), 260); assertEquals(stream.getRows(), 10); assertEquals(stream.getOffset(), 0); } @@ -332,7 +332,7 @@ public class StreamExpressionToExpessionTest extends SolrTestCase { assertTrue(!expressionString.contains("bucketSizeLimit")); assertTrue(expressionString.contains("rows=10")); assertTrue(expressionString.contains("offset=0")); - assertTrue(expressionString.contains("overfetch=150")); + assertTrue(expressionString.contains("overfetch=250")); assertTrue(expressionString.contains("method=dvhash")); assertTrue(expressionString.contains("sum(a_i)")); assertTrue(expressionString.contains("sum(a_f)")); @@ -343,10 +343,10 @@ public class StreamExpressionToExpessionTest extends SolrTestCase { assertTrue(expressionString.contains("avg(a_i,false)")); assertTrue(expressionString.contains("avg(a_f,false)")); assertTrue(expressionString.contains("count(*)")); - assertEquals(stream.getBucketSizeLimit(), 160); + assertEquals(stream.getBucketSizeLimit(), 260); assertEquals(stream.getRows(), 10); assertEquals(stream.getOffset(), 0); - assertEquals(stream.getOverfetch(), 150); + assertEquals(stream.getOverfetch(), 250); }