allow legacy index generator

2014-09-09 17:04:35 -07:00 · 2014-09-09 17:04:35 -07:00 · 351afb8be7
parent 197c80a694
commit 351afb8be7
7 changed files with 1995 additions and 11 deletions
--- a/indexing-hadoop/src/main/java/io/druid/indexer/HadoopDruidIndexerConfig.java
+++ b/indexing-hadoop/src/main/java/io/druid/indexer/HadoopDruidIndexerConfig.java
@ -207,6 +207,12 @@ public class HadoopDruidIndexerConfig
    }
  }

+  // TODO: remove this
+  public boolean isLegacy()
+  {
+    return schema.isLegacy();
+  }
+
  @JsonProperty
  public HadoopIngestionSpec getSchema()
  {
--- a/indexing-hadoop/src/main/java/io/druid/indexer/HadoopDruidIndexerJob.java
+++ b/indexing-hadoop/src/main/java/io/druid/indexer/HadoopDruidIndexerJob.java
@ -57,7 +57,11 @@ public class HadoopDruidIndexerJob implements Jobby
    List<Jobby> jobs = Lists.newArrayList();
    JobHelper.ensurePaths(config);

+    if (config.isLegacy()) {
+      indexJob = new LegacyIndexGeneratorJob(config);
+    } else {
      indexJob = new IndexGeneratorJob(config);
+    }
    jobs.add(indexJob);

    if (dbUpdaterJob != null) {
@ -66,7 +70,8 @@ public class HadoopDruidIndexerJob implements Jobby
      log.info("No updaterJobSpec set, not uploading to database");
    }

-    jobs.add(new Jobby()
+    jobs.add(
+        new Jobby()
        {
          @Override
          public boolean run()
@ -74,7 +79,8 @@ public class HadoopDruidIndexerJob implements Jobby
            publishedSegments = IndexGeneratorJob.getPublishedSegments(config);
            return true;
          }
-    });
+        }
+    );


    JobHelper.runJobs(jobs, config);
--- a/indexing-hadoop/src/main/java/io/druid/indexer/HadoopIngestionSpec.java
+++ b/indexing-hadoop/src/main/java/io/druid/indexer/HadoopIngestionSpec.java
@ -50,11 +50,14 @@ public class HadoopIngestionSpec extends IngestionSpec<HadoopIOConfig, HadoopTun
  private final HadoopIOConfig ioConfig;
  private final HadoopTuningConfig tuningConfig;

+  private final boolean legacy; // TODO: remove
+
  @JsonCreator
  public HadoopIngestionSpec(
      @JsonProperty("dataSchema") DataSchema dataSchema,
      @JsonProperty("ioConfig") HadoopIOConfig ioConfig,
      @JsonProperty("tuningConfig") HadoopTuningConfig tuningConfig,
+      @JsonProperty("legacy") boolean legacy, // TODO: remove
      // All deprecated
      final @JsonProperty("dataSource") String dataSource,
      final @JsonProperty("timestampSpec") TimestampSpec timestampSpec,
@ -84,6 +87,7 @@ public class HadoopIngestionSpec extends IngestionSpec<HadoopIOConfig, HadoopTun
  )
  {
    super(dataSchema, ioConfig, tuningConfig);
+    this.legacy = legacy;

    if (dataSchema != null) {
      this.dataSchema = dataSchema;
@ -197,6 +201,7 @@ public class HadoopIngestionSpec extends IngestionSpec<HadoopIOConfig, HadoopTun
        schema,
        ioConfig,
        tuningConfig,
+        legacy,
        null,
        null,
        null,
@ -230,6 +235,7 @@ public class HadoopIngestionSpec extends IngestionSpec<HadoopIOConfig, HadoopTun
        dataSchema,
        config,
        tuningConfig,
+        legacy,
        null,
        null,
        null,
@ -263,6 +269,7 @@ public class HadoopIngestionSpec extends IngestionSpec<HadoopIOConfig, HadoopTun
        dataSchema,
        ioConfig,
        config,
+        legacy,
        null,
        null,
        null,
@ -289,4 +296,11 @@ public class HadoopIngestionSpec extends IngestionSpec<HadoopIOConfig, HadoopTun
        null
    );
  }
+
+  // TODO: remove
+  @JsonProperty
+  public boolean isLegacy()
+  {
+    return legacy;
+  }
 }
--- a/indexing-hadoop/src/main/java/io/druid/indexer/LegacyIndexGeneratorJob.java
+++ b/indexing-hadoop/src/main/java/io/druid/indexer/LegacyIndexGeneratorJob.java
@ -0,0 +1,609 @@
+/*
+ * Druid - a distributed column store.
+ * Copyright (C) 2012, 2013  Metamarkets Group Inc.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
+ */
+
+package io.druid.indexer;
+
+import com.google.common.base.Optional;
+import com.google.common.base.Throwables;
+import com.google.common.collect.ImmutableMap;
+import com.google.common.collect.Iterables;
+import com.google.common.collect.Lists;
+import com.google.common.collect.Sets;
+import com.google.common.io.Closeables;
+import com.google.common.primitives.Longs;
+import com.metamx.common.IAE;
+import com.metamx.common.ISE;
+import com.metamx.common.guava.CloseQuietly;
+import com.metamx.common.logger.Logger;
+import io.druid.data.input.InputRow;
+import io.druid.data.input.impl.StringInputRowParser;
+import io.druid.offheap.OffheapBufferPool;
+import io.druid.query.aggregation.AggregatorFactory;
+import io.druid.segment.IndexIO;
+import io.druid.segment.IndexMerger;
+import io.druid.segment.QueryableIndex;
+import io.druid.segment.SegmentUtils;
+import io.druid.segment.incremental.IncrementalIndex;
+import io.druid.segment.incremental.IncrementalIndexSchema;
+import io.druid.timeline.DataSegment;
+import org.apache.commons.io.FileUtils;
+import org.apache.hadoop.conf.Configurable;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FSDataOutputStream;
+import org.apache.hadoop.fs.FileStatus;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.LocalFileSystem;
+import org.apache.hadoop.fs.Path;
+import org.apache.hadoop.fs.s3native.NativeS3FileSystem;
+import org.apache.hadoop.hdfs.DistributedFileSystem;
+import org.apache.hadoop.io.BytesWritable;
+import org.apache.hadoop.io.Text;
+import org.apache.hadoop.mapred.InvalidJobConfException;
+import org.apache.hadoop.mapreduce.Counter;
+import org.apache.hadoop.mapreduce.Job;
+import org.apache.hadoop.mapreduce.JobContext;
+import org.apache.hadoop.mapreduce.Partitioner;
+import org.apache.hadoop.mapreduce.Reducer;
+import org.apache.hadoop.mapreduce.lib.input.CombineTextInputFormat;
+import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
+import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
+import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;
+import org.joda.time.DateTime;
+import org.joda.time.Interval;
+
+import java.io.BufferedOutputStream;
+import java.io.File;
+import java.io.FileInputStream;
+import java.io.IOException;
+import java.io.InputStream;
+import java.net.URI;
+import java.nio.ByteBuffer;
+import java.util.Arrays;
+import java.util.List;
+import java.util.Set;
+import java.util.zip.ZipEntry;
+import java.util.zip.ZipOutputStream;
+
+/**
+ */
+public class LegacyIndexGeneratorJob extends IndexGeneratorJob
+{
+  private static final Logger log = new Logger(IndexGeneratorJob.class);
+  private final HadoopDruidIndexerConfig config;
+  private IndexGeneratorStats jobStats;
+
+  public LegacyIndexGeneratorJob(
+      HadoopDruidIndexerConfig config
+  )
+  {
+    super(config);
+    this.config = config;
+    this.jobStats = new IndexGeneratorStats();
+  }
+
+  public boolean run()
+  {
+    try {
+      Job job = new Job(
+          new Configuration(),
+          String.format("%s-index-generator-%s", config.getDataSource(), config.getIntervals())
+      );
+
+      job.getConfiguration().set("io.sort.record.percent", "0.23");
+
+      JobHelper.injectSystemProperties(job);
+
+      if (config.isCombineText()) {
+        job.setInputFormatClass(CombineTextInputFormat.class);
+      } else {
+        job.setInputFormatClass(TextInputFormat.class);
+      }
+
+      job.setMapperClass(IndexGeneratorMapper.class);
+      job.setMapOutputValueClass(Text.class);
+
+      SortableBytes.useSortableBytesAsMapOutputKey(job);
+
+      job.setNumReduceTasks(Iterables.size(config.getAllBuckets().get()));
+      job.setPartitionerClass(IndexGeneratorPartitioner.class);
+
+      job.setReducerClass(IndexGeneratorReducer.class);
+      job.setOutputKeyClass(BytesWritable.class);
+      job.setOutputValueClass(Text.class);
+      job.setOutputFormatClass(IndexGeneratorOutputFormat.class);
+      FileOutputFormat.setOutputPath(job, config.makeIntermediatePath());
+
+      config.addInputPaths(job);
+      config.addJobProperties(job);
+      config.intoConfiguration(job);
+
+      JobHelper.setupClasspath(config, job);
+
+      job.submit();
+      log.info("Job %s submitted, status available at %s", job.getJobName(), job.getTrackingURL());
+
+      boolean success = job.waitForCompletion(true);
+
+      Counter invalidRowCount = job.getCounters()
+                                   .findCounter(HadoopDruidIndexerConfig.IndexJobCounters.INVALID_ROW_COUNTER);
+      jobStats.setInvalidRowCount(invalidRowCount.getValue());
+
+      return success;
+    }
+    catch (Exception e) {
+      throw new RuntimeException(e);
+    }
+  }
+
+  public static class IndexGeneratorMapper extends HadoopDruidIndexerMapper<BytesWritable, Text>
+
+  {
+    @Override
+    protected void innerMap(
+        InputRow inputRow,
+        Text text,
+        Context context
+    ) throws IOException, InterruptedException
+    {
+      // Group by bucket, sort by timestamp
+      final Optional<Bucket> bucket = getConfig().getBucket(inputRow);
+
+      if (!bucket.isPresent()) {
+        throw new ISE("WTF?! No bucket found for row: %s", inputRow);
+      }
+
+      context.write(
+          new SortableBytes(
+              bucket.get().toGroupKey(),
+              Longs.toByteArray(inputRow.getTimestampFromEpoch())
+          ).toBytesWritable(),
+          text
+      );
+    }
+  }
+
+  public static class IndexGeneratorPartitioner extends Partitioner<BytesWritable, Text> implements Configurable
+  {
+    private Configuration config;
+
+    @Override
+    public int getPartition(BytesWritable bytesWritable, Text text, int numPartitions)
+    {
+      final ByteBuffer bytes = ByteBuffer.wrap(bytesWritable.getBytes());
+      bytes.position(4); // Skip length added by SortableBytes
+      int shardNum = bytes.getInt();
+      if (config.get("mapred.job.tracker").equals("local")) {
+        return shardNum % numPartitions;
+      } else {
+        if (shardNum >= numPartitions) {
+          throw new ISE("Not enough partitions, shard[%,d] >= numPartitions[%,d]", shardNum, numPartitions);
+        }
+        return shardNum;
+
+      }
+    }
+
+    @Override
+    public Configuration getConf()
+    {
+      return config;
+    }
+
+    @Override
+    public void setConf(Configuration config)
+    {
+      this.config = config;
+    }
+  }
+
+  public static class IndexGeneratorReducer extends Reducer<BytesWritable, Text, BytesWritable, Text>
+  {
+    private HadoopDruidIndexerConfig config;
+    private List<String> metricNames = Lists.newArrayList();
+    private StringInputRowParser parser;
+
+    @Override
+    protected void setup(Context context)
+        throws IOException, InterruptedException
+    {
+      config = HadoopDruidIndexerConfig.fromConfiguration(context.getConfiguration());
+
+      for (AggregatorFactory factory : config.getSchema().getDataSchema().getAggregators()) {
+        metricNames.add(factory.getName().toLowerCase());
+      }
+
+      parser = config.getParser();
+    }
+
+    @Override
+    protected void reduce(
+        BytesWritable key, Iterable<Text> values, final Context context
+    ) throws IOException, InterruptedException
+    {
+      SortableBytes keyBytes = SortableBytes.fromBytesWritable(key);
+      Bucket bucket = Bucket.fromGroupKey(keyBytes.getGroupKey()).lhs;
+
+      final Interval interval = config.getGranularitySpec().bucketInterval(bucket.time).get();
+      //final DataRollupSpec rollupSpec = config.getRollupSpec();
+      final AggregatorFactory[] aggs = config.getSchema().getDataSchema().getAggregators();
+
+      IncrementalIndex index = makeIncrementalIndex(bucket, aggs);
+      try {
+        File baseFlushFile = File.createTempFile("base", "flush");
+        baseFlushFile.delete();
+        baseFlushFile.mkdirs();
+
+        Set<File> toMerge = Sets.newTreeSet();
+        int indexCount = 0;
+        int lineCount = 0;
+        int runningTotalLineCount = 0;
+        long startTime = System.currentTimeMillis();
+
+        Set<String> allDimensionNames = Sets.newHashSet();
+        final IndexMerger.ProgressIndicator progressIndicator = new IndexMerger.ProgressIndicator()
+        {
+          @Override
+          public void progress()
+          {
+            context.progress();
+          }
+        };
+
+        for (final Text value : values) {
+          context.progress();
+          final InputRow inputRow = index.formatRow(parser.parse(value.toString()));
+          allDimensionNames.addAll(inputRow.getDimensions());
+
+          int numRows = index.add(inputRow);
+          ++lineCount;
+
+          if (index.isFull()) {
+            log.info(
+                "%,d lines to %,d rows in %,d millis",
+                lineCount - runningTotalLineCount,
+                numRows,
+                System.currentTimeMillis() - startTime
+            );
+            runningTotalLineCount = lineCount;
+
+            final File file = new File(baseFlushFile, String.format("index%,05d", indexCount));
+            toMerge.add(file);
+
+            context.progress();
+            IndexMerger.persist(
+                index, interval, file, progressIndicator
+            );
+            // close this index and make a new one
+            index.close();
+            index = makeIncrementalIndex(bucket, aggs);
+
+            startTime = System.currentTimeMillis();
+            ++indexCount;
+          }
+        }
+
+        log.info("%,d lines completed.", lineCount);
+
+        List<QueryableIndex> indexes = Lists.newArrayListWithCapacity(indexCount);
+        final File mergedBase;
+
+        if (toMerge.size() == 0) {
+          if (index.isEmpty()) {
+            throw new IAE("If you try to persist empty indexes you are going to have a bad time");
+          }
+
+          mergedBase = new File(baseFlushFile, "merged");
+          IndexMerger.persist(
+              index, interval, mergedBase, progressIndicator
+          );
+        } else {
+          if (!index.isEmpty()) {
+            final File finalFile = new File(baseFlushFile, "final");
+            IndexMerger.persist(
+                index, interval, finalFile, progressIndicator
+            );
+            toMerge.add(finalFile);
+          }
+
+          for (File file : toMerge) {
+            indexes.add(IndexIO.loadIndex(file));
+          }
+          mergedBase = IndexMerger.mergeQueryableIndex(
+              indexes, aggs, new File(baseFlushFile, "merged"), progressIndicator
+          );
+        }
+        serializeOutIndex(context, bucket, mergedBase, Lists.newArrayList(allDimensionNames));
+        for (File file : toMerge) {
+          FileUtils.deleteDirectory(file);
+        }
+      }
+      finally {
+        index.close();
+      }
+    }
+
+    private void serializeOutIndex(Context context, Bucket bucket, File mergedBase, List<String> dimensionNames)
+        throws IOException
+    {
+      Interval interval = config.getGranularitySpec().bucketInterval(bucket.time).get();
+
+      int attemptNumber = context.getTaskAttemptID().getId();
+
+      FileSystem fileSystem = FileSystem.get(context.getConfiguration());
+      Path indexBasePath = config.makeSegmentOutputPath(fileSystem, bucket);
+      Path indexZipFilePath = new Path(indexBasePath, String.format("index.zip.%s", attemptNumber));
+      final FileSystem infoFS = config.makeDescriptorInfoDir().getFileSystem(context.getConfiguration());
+      final FileSystem outputFS = indexBasePath.getFileSystem(context.getConfiguration());
+
+      outputFS.mkdirs(indexBasePath);
+
+      Exception caughtException = null;
+      ZipOutputStream out = null;
+      long size = 0;
+      try {
+        out = new ZipOutputStream(new BufferedOutputStream(outputFS.create(indexZipFilePath), 256 * 1024));
+
+        List<String> filesToCopy = Arrays.asList(mergedBase.list());
+
+        for (String file : filesToCopy) {
+          size += copyFile(context, out, mergedBase, file);
+        }
+      }
+      catch (Exception e) {
+        caughtException = e;
+      }
+      finally {
+        if (caughtException == null) {
+          Closeables.close(out, false);
+        } else {
+          CloseQuietly.close(out);
+          throw Throwables.propagate(caughtException);
+        }
+      }
+
+      Path finalIndexZipFilePath = new Path(indexBasePath, "index.zip");
+      final URI indexOutURI = finalIndexZipFilePath.toUri();
+      ImmutableMap<String, Object> loadSpec;
+      if (outputFS instanceof NativeS3FileSystem) {
+        loadSpec = ImmutableMap.<String, Object>of(
+            "type", "s3_zip",
+            "bucket", indexOutURI.getHost(),
+            "key", indexOutURI.getPath().substring(1) // remove the leading "/"
+        );
+      } else if (outputFS instanceof LocalFileSystem) {
+        loadSpec = ImmutableMap.<String, Object>of(
+            "type", "local",
+            "path", indexOutURI.getPath()
+        );
+      } else if (outputFS instanceof DistributedFileSystem) {
+        loadSpec = ImmutableMap.<String, Object>of(
+            "type", "hdfs",
+            "path", indexOutURI.getPath()
+        );
+      } else {
+        throw new ISE("Unknown file system[%s]", outputFS.getClass());
+      }
+
+      DataSegment segment = new DataSegment(
+          config.getDataSource(),
+          interval,
+          config.getSchema().getTuningConfig().getVersion(),
+          loadSpec,
+          dimensionNames,
+          metricNames,
+          config.getShardSpec(bucket).getActualSpec(),
+          SegmentUtils.getVersionFromDir(mergedBase),
+          size
+      );
+
+      // retry 1 minute
+      boolean success = false;
+      for (int i = 0; i < 6; i++) {
+        if (renameIndexFiles(infoFS, outputFS, indexBasePath, indexZipFilePath, finalIndexZipFilePath, segment)) {
+          log.info("Successfully renamed [%s] to [%s]", indexZipFilePath, finalIndexZipFilePath);
+          success = true;
+          break;
+        } else {
+          log.info("Failed to rename [%s] to [%s]", indexZipFilePath, finalIndexZipFilePath);
+          try {
+            Thread.sleep(10000);
+            context.progress();
+          }
+          catch (InterruptedException e) {
+            throw new ISE(
+                "Thread error in retry loop for renaming [%s] to [%s]",
+                indexZipFilePath.toUri().getPath(),
+                finalIndexZipFilePath.toUri().getPath()
+            );
+          }
+        }
+      }
+
+      if (!success) {
+        if (!outputFS.exists(indexZipFilePath)) {
+          throw new ISE("File [%s] does not exist after retry loop.", indexZipFilePath.toUri().getPath());
+        }
+
+        if (outputFS.getFileStatus(indexZipFilePath).getLen() == outputFS.getFileStatus(finalIndexZipFilePath)
+                                                                         .getLen()) {
+          outputFS.delete(indexZipFilePath, true);
+        } else {
+          outputFS.delete(finalIndexZipFilePath, true);
+          if (!renameIndexFiles(infoFS, outputFS, indexBasePath, indexZipFilePath, finalIndexZipFilePath, segment)) {
+            throw new ISE(
+                "Files [%s] and [%s] are different, but still cannot rename after retry loop",
+                indexZipFilePath.toUri().getPath(),
+                finalIndexZipFilePath.toUri().getPath()
+            );
+          }
+        }
+      }
+    }
+
+    private boolean renameIndexFiles(
+        FileSystem intermediateFS,
+        FileSystem outputFS,
+        Path indexBasePath,
+        Path indexZipFilePath,
+        Path finalIndexZipFilePath,
+        DataSegment segment
+    )
+        throws IOException
+    {
+      final boolean needRename;
+
+      if (outputFS.exists(finalIndexZipFilePath)) {
+        // NativeS3FileSystem.rename won't overwrite, so we might need to delete the old index first
+        final FileStatus zipFile = outputFS.getFileStatus(indexZipFilePath);
+        final FileStatus finalIndexZipFile = outputFS.getFileStatus(finalIndexZipFilePath);
+
+        if (zipFile.getModificationTime() >= finalIndexZipFile.getModificationTime()
+            || zipFile.getLen() != finalIndexZipFile.getLen()) {
+          log.info(
+              "File[%s / %s / %sB] existed, but wasn't the same as [%s / %s / %sB]",
+              finalIndexZipFile.getPath(),
+              new DateTime(finalIndexZipFile.getModificationTime()),
+              finalIndexZipFile.getLen(),
+              zipFile.getPath(),
+              new DateTime(zipFile.getModificationTime()),
+              zipFile.getLen()
+          );
+          outputFS.delete(finalIndexZipFilePath, false);
+          needRename = true;
+        } else {
+          log.info(
+              "File[%s / %s / %sB] existed and will be kept",
+              finalIndexZipFile.getPath(),
+              new DateTime(finalIndexZipFile.getModificationTime()),
+              finalIndexZipFile.getLen()
+          );
+          needRename = false;
+        }
+      } else {
+        needRename = true;
+      }
+
+      if (needRename && !outputFS.rename(indexZipFilePath, finalIndexZipFilePath)) {
+        return false;
+      }
+
+      writeSegmentDescriptor(outputFS, segment, new Path(indexBasePath, "descriptor.json"));
+      final Path descriptorPath = config.makeDescriptorInfoPath(segment);
+      log.info("Writing descriptor to path[%s]", descriptorPath);
+      intermediateFS.mkdirs(descriptorPath.getParent());
+      writeSegmentDescriptor(intermediateFS, segment, descriptorPath);
+
+      return true;
+    }
+
+    private void writeSegmentDescriptor(FileSystem outputFS, DataSegment segment, Path descriptorPath)
+        throws IOException
+    {
+      if (outputFS.exists(descriptorPath)) {
+        outputFS.delete(descriptorPath, false);
+      }
+
+      final FSDataOutputStream descriptorOut = outputFS.create(descriptorPath);
+      try {
+        HadoopDruidIndexerConfig.jsonMapper.writeValue(descriptorOut, segment);
+      }
+      finally {
+        descriptorOut.close();
+      }
+    }
+
+    private long copyFile(
+        Context context, ZipOutputStream out, File mergedBase, final String filename
+    ) throws IOException
+    {
+      createNewZipEntry(out, filename);
+      long numRead = 0;
+
+      InputStream in = null;
+      try {
+        in = new FileInputStream(new File(mergedBase, filename));
+        byte[] buf = new byte[0x10000];
+        int read;
+        while (true) {
+          read = in.read(buf);
+          if (read == -1) {
+            break;
+          }
+
+          out.write(buf, 0, read);
+          numRead += read;
+          context.progress();
+        }
+      }
+      finally {
+        CloseQuietly.close(in);
+      }
+      out.closeEntry();
+      context.progress();
+
+      return numRead;
+    }
+
+    private IncrementalIndex makeIncrementalIndex(Bucket theBucket, AggregatorFactory[] aggs)
+    {
+      return new IncrementalIndex(
+          new IncrementalIndexSchema.Builder()
+              .withMinTimestamp(theBucket.time.getMillis())
+              .withDimensionsSpec(config.getSchema().getDataSchema().getParser())
+              .withQueryGranularity(config.getSchema().getDataSchema().getGranularitySpec().getQueryGranularity())
+              .withMetrics(aggs)
+              .build(),
+          new OffheapBufferPool(config.getSchema().getTuningConfig().getBufferSize())
+      );
+    }
+
+    private void createNewZipEntry(ZipOutputStream out, String name) throws IOException
+    {
+      log.info("Creating new ZipEntry[%s]", name);
+      out.putNextEntry(new ZipEntry(name));
+    }
+  }
+
+  public static class IndexGeneratorOutputFormat extends TextOutputFormat
+  {
+    @Override
+    public void checkOutputSpecs(JobContext job) throws IOException
+    {
+      Path outDir = getOutputPath(job);
+      if (outDir == null) {
+        throw new InvalidJobConfException("Output directory not set.");
+      }
+    }
+  }
+
+  public static class IndexGeneratorStats
+  {
+    private long invalidRowCount = 0;
+
+    public long getInvalidRowCount()
+    {
+      return invalidRowCount;
+    }
+
+    public void setInvalidRowCount(long invalidRowCount)
+    {
+      this.invalidRowCount = invalidRowCount;
+    }
+  }
+}
--- a/indexing-service/src/test/java/io/druid/indexing/common/task/TaskSerdeTest.java
+++ b/indexing-service/src/test/java/io/druid/indexing/common/task/TaskSerdeTest.java
@ -350,7 +350,7 @@ public class TaskSerdeTest
        null,
        null,
        new HadoopIngestionSpec(
-            null, null, null,
+            null, null, null, false, // TODO
            "foo",
            new TimestampSpec("timestamp", "auto"),
            new JSONDataSpec(ImmutableList.of("foo"), null),
--- a/processing/src/main/java/io/druid/segment/IndexMerger.java
+++ b/processing/src/main/java/io/druid/segment/IndexMerger.java
--- a/processing/src/main/java/io/druid/segment/data/VSizeIndexedWriter.java
+++ b/processing/src/main/java/io/druid/segment/data/VSizeIndexedWriter.java
@ -0,0 +1,145 @@
+/*
+ * Druid - a distributed column store.
+ * Copyright (C) 2012, 2013  Metamarkets Group Inc.
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
+ */
+
+package io.druid.segment.data;
+
+import com.google.common.base.Function;
+import com.google.common.base.Preconditions;
+import com.google.common.collect.Iterables;
+import com.google.common.io.ByteStreams;
+import com.google.common.io.Closeables;
+import com.google.common.io.CountingOutputStream;
+import com.google.common.io.InputSupplier;
+import com.google.common.primitives.Ints;
+
+import java.io.Closeable;
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.OutputStream;
+import java.util.Arrays;
+import java.util.List;
+
+/**
+ * Streams arrays of objects out in the binary format described by VSizeIndexed
+ */
+public class VSizeIndexedWriter implements Closeable
+{
+  private static final byte version = 0x1;
+  private static final byte[] EMPTY_ARRAY = new byte[]{};
+
+  private final int maxId;
+
+  private CountingOutputStream headerOut = null;
+  private CountingOutputStream valuesOut = null;
+  int numWritten = 0;
+  private final IOPeon ioPeon;
+  private final String filenameBase;
+
+  public VSizeIndexedWriter(
+      IOPeon ioPeon,
+      String filenameBase,
+      int maxId
+  )
+  {
+    this.ioPeon = ioPeon;
+    this.filenameBase = filenameBase;
+    this.maxId = maxId;
+  }
+
+  public void open() throws IOException
+  {
+    headerOut = new CountingOutputStream(ioPeon.makeOutputStream(makeFilename("header")));
+    valuesOut = new CountingOutputStream(ioPeon.makeOutputStream(makeFilename("values")));
+  }
+
+  public void write(List<Integer> ints) throws IOException
+  {
+    byte[] bytesToWrite = ints == null ? EMPTY_ARRAY : VSizeIndexedInts.fromList(ints, maxId).getBytesNoPadding();
+
+    valuesOut.write(bytesToWrite);
+
+    headerOut.write(Ints.toByteArray((int) valuesOut.getCount()));
+
+    ++numWritten;
+  }
+
+  private String makeFilename(String suffix)
+  {
+    return String.format("%s.%s", filenameBase, suffix);
+  }
+
+  @Override
+  public void close() throws IOException
+  {
+    final byte numBytesForMax = VSizeIndexedInts.getNumBytesForMax(maxId);
+
+    valuesOut.write(new byte[4 - numBytesForMax]);
+
+    Closeables.close(headerOut, false);
+    Closeables.close(valuesOut, false);
+
+    final long numBytesWritten = headerOut.getCount() + valuesOut.getCount();
+
+    Preconditions.checkState(
+        headerOut.getCount() == (numWritten * 4),
+        "numWritten[%s] number of rows should have [%s] bytes written to headerOut, had[%s]",
+        numWritten,
+        numWritten * 4,
+        headerOut.getCount()
+    );
+    Preconditions.checkState(
+        numBytesWritten < Integer.MAX_VALUE, "Wrote[%s] bytes, which is too many.", numBytesWritten
+    );
+
+    OutputStream metaOut = ioPeon.makeOutputStream(makeFilename("meta"));
+
+    try {
+      metaOut.write(new byte[]{version, numBytesForMax});
+      metaOut.write(Ints.toByteArray((int) numBytesWritten + 4));
+      metaOut.write(Ints.toByteArray(numWritten));
+    }
+    finally {
+      metaOut.close();
+    }
+  }
+
+  public InputSupplier<InputStream> combineStreams()
+  {
+    return ByteStreams.join(
+        Iterables.transform(
+            Arrays.asList("meta", "header", "values"),
+            new Function<String,InputSupplier<InputStream>>() {
+
+              @Override
+              public InputSupplier<InputStream> apply(final String input)
+              {
+                return new InputSupplier<InputStream>()
+                {
+                  @Override
+                  public InputStream getInput() throws IOException
+                  {
+                    return ioPeon.makeInputStream(makeFilename(input));
+                  }
+                };
+              }
+            }
+        )
+    );
+  }
+}