fix backwards compatibility issues

Fangjin Yang 2012-11-08 15:09:00 -08:00
parent 17fb93d049
commit 6da047b5fa
2 changed files with 146 additions and 0 deletions

com/metamx/druid/indexer/HadoopDruidIndexer.java

@@ -0,0 +1,133 @@
/*
* Druid - a distributed column store.
* Copyright (C) 2012 Metamarkets Group Inc.
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation; either version 2
* of the License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
*/
package com.metamx.druid.indexer;

import com.google.common.collect.ImmutableList;
import com.metamx.common.Pair;
import com.metamx.common.lifecycle.Lifecycle;
import com.metamx.druid.jackson.DefaultObjectMapper;
import org.codehaus.jackson.map.ObjectMapper;

import java.util.List;
/**
 * Deprecated command-line entry point for the Hadoop indexer, retained for backwards compatibility;
 * it delegates to {@link HadoopDruidIndexerNode}.
 */
@Deprecated
public class HadoopDruidIndexer
{
public static void main(String[] args) throws Exception
{
if (args.length < 1 || args.length > 2) {
printHelp();
System.exit(2);
}
HadoopDruidIndexerNode node = HadoopDruidIndexerNode.builder().build();
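// With two arguments, the first is the interval spec; the last argument is always the config spec.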
if (args.length == 2) {
node.setIntervalSpec(args[0]);
}
node.setArgumentSpec(args[args.length == 1 ? 0 : 1]);
Lifecycle lifecycle = new Lifecycle();
lifecycle.addManagedInstance(node);
try {
lifecycle.start();
}
catch (Exception e) {
e.printStackTrace();
Thread.sleep(500); // brief pause so the stack trace can flush before the help text prints
printHelp();
System.exit(1);
}
}
private static final List<Pair<String, String>> expectedFields =
ImmutableList.<Pair<String, String>>builder()
.add(Pair.of("dataSource", "Name of dataSource"))
.add(Pair.of("timestampColumn", "Column name of the timestamp column"))
.add(Pair.of("timestampFormat", "Format name of the timestamp column (posix or iso)"))
.add(
Pair.of(
"dataSpec",
"A JSON object with fields "
+
"format=(json, csv, tsv), "
+
"columns=JSON array of column names for the delimited text input file (only for csv and tsv formats),"
+
"dimensions=JSON array of dimensionn names (must match names in columns),"
+
"delimiter=delimiter of the data (only for tsv format)"
)
)
.add(
Pair.of(
"granularitySpec",
"A JSON object indicating the Granularity that segments should be created at."
)
)
.add(
Pair.of(
"pathSpec",
"A JSON object with fields type=granularity, inputPath, filePattern, dataGranularity"
)
)
.add(
Pair.of(
"rollupSpec",
"JSON object with fields rollupGranularity, aggs=JSON Array of Aggregator specs"
)
)
.add(Pair.of("workingPath", "Path to store intermediate output data. Deleted when finished."))
.add(Pair.of("segmentOutputPath", "Path to store output segments."))
.add(
Pair.of(
"updaterJobSpec",
"JSON object with fields type=db, connectURI of the database, username, password, and segment table name"
)
)
.add(Pair.of("cleanupOnFailure", "Clean up intermediate files on failure? (default: true)"))
.add(Pair.of("leaveIntermediate", "Leave intermediate files. (default: false)"))
.add(Pair.of("partitionDimension", "Dimension to partition by (optional)"))
.add(
Pair.of(
"targetPartitionSize",
"Integer representing the target number of rows in a partition (required if partitionDimension != null)"
)
)
.build();
private static void printHelp()
{
System.out.println("Usage: <java invocation> <time_interval> <config_spec>");
System.out.println("<time_interval> is the ISO8601 interval of data to run over.");
System.out.println("<config_spec> is either a JSON object or the path to a file that contains a JSON object.");
System.out.println();
System.out.println("JSON object description:");
System.out.println("{");
for (Pair<String, String> expectedField : expectedFields) {
System.out.printf(" \"%s\": %s%n", expectedField.lhs, expectedField.rhs);
}
System.out.println("}");
}
}
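For illustration, a <config_spec> that satisfies the help output above might look like the sketch below. Only the top-level keys are taken from expectedFields; all values, and the nested key names (gran, intervals, user, segmentTable, and the aggregator fields), are assumptions, since the config classes are not part of this diff:

{
  "dataSource": "example_datasource",
  "timestampColumn": "ts",
  "timestampFormat": "iso",
  "dataSpec": {
    "format": "tsv",
    "columns": ["ts", "page", "count"],
    "dimensions": ["page"],
    "delimiter": "\t"
  },
  "granularitySpec": {"gran": "DAY", "intervals": ["2012-01-01/2012-02-01"]},
  "pathSpec": {"type": "granularity", "inputPath": "/example/input", "filePattern": ".*\\.tsv", "dataGranularity": "hour"},
  "rollupSpec": {"rollupGranularity": "minute", "aggs": [{"type": "longSum", "name": "count", "fieldName": "count"}]},
  "workingPath": "/tmp/example/working",
  "segmentOutputPath": "/example/segments",
  "updaterJobSpec": {"type": "db", "connectURI": "jdbc:mysql://localhost:3306/druid", "user": "druid", "password": "diurd", "segmentTable": "segments"},
  "cleanupOnFailure": true,
  "partitionDimension": "page",
  "targetPartitionSize": 5000000
}

Such a spec can be passed by path in either invocation form from the usage text, with or without a leading <time_interval> argument.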

com/metamx/druid/indexer/HadoopDruidIndexerNode.java

@@ -1,11 +1,15 @@
package com.metamx.druid.indexer;

import com.google.common.base.Preconditions;
import com.google.common.collect.Lists;
import com.metamx.common.lifecycle.LifecycleStart;
import com.metamx.common.lifecycle.LifecycleStop;
import org.codehaus.jackson.map.jsontype.NamedType;
import org.joda.time.Interval;

import java.io.File;
import java.util.Arrays;
import java.util.List;
/**
*/
@@ -67,6 +71,15 @@ public class HadoopDruidIndexerNode
config = HadoopDruidIndexerConfig.fromFile(new File(argumentSpec));
}
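// An interval spec given on the command line overrides the intervals in the config spec.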
if (intervalSpec != null) {
final List<Interval> dataInterval = Lists.transform(
Arrays.asList(intervalSpec.split(",")),
new StringIntervalFunction()
);
config.setIntervals(dataInterval);
}
new HadoopDruidIndexerJob(config).run();
}
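StringIntervalFunction is referenced here but not shown in this diff. Assuming it simply parses each ISO8601 string with Joda-Time, a minimal stand-in (the name IsoIntervalFunction is hypothetical) would be:

import com.google.common.base.Function;
import org.joda.time.Interval;

// Hypothetical equivalent of StringIntervalFunction (not shown in this diff):
// parses one ISO8601 interval string, e.g. "2012-01-01/2012-02-01",
// into a Joda-Time Interval.
class IsoIntervalFunction implements Function<String, Interval>
{
  @Override
  public Interval apply(String input)
  {
    return new Interval(input);
  }
}

With an interval spec such as "2012-01-01/2012-02-01,2012-03-01/2012-04-01", the Lists.transform call above would then produce a list of two Interval objects.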