diff --git a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/pom.xml b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/pom.xml
index 1e5b0fd31a..9ef6fc431e 100644
--- a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/pom.xml
+++ b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/pom.xml
@@ -26,8 +26,7 @@
     <packaging>jar</packaging>

     <properties>
-        <hive.version>2.0.1</hive.version>
-        <orc.version>1.1.2</orc.version>
+        <hive.version>1.2.1</hive.version>
     </properties>
@@ -139,11 +138,6 @@
-        <dependency>
-            <groupId>org.apache.orc</groupId>
-            <artifactId>orc-core</artifactId>
-            <version>${orc.version}</version>
-        </dependency>
         <dependency>
             <groupId>org.apache.hive.hcatalog</groupId>
             <artifactId>hive-hcatalog-streaming</artifactId>
@@ -168,6 +162,10 @@
             <artifactId>hive-hcatalog-core</artifactId>
             <version>${hive.version}</version>
         </dependency>
+        <dependency>
+            <groupId>org.apache.hadoop</groupId>
+            <artifactId>hadoop-mapreduce-client-core</artifactId>
+        </dependency>
         <dependency>
             <groupId>org.apache.hadoop</groupId>
             <artifactId>hadoop-common</artifactId>
diff --git a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/processors/hive/ConvertAvroToORC.java b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/processors/hive/ConvertAvroToORC.java
deleted file mode 100644
index 2cec1d0d31..0000000000
--- a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/processors/hive/ConvertAvroToORC.java
+++ /dev/null
@@ -1,310 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-package org.apache.nifi.processors.hive;
-
-import org.apache.avro.Schema;
-import org.apache.avro.file.DataFileStream;
-import org.apache.avro.generic.GenericDatumReader;
-import org.apache.avro.generic.GenericRecord;
-import org.apache.commons.lang3.mutable.MutableInt;
-import org.apache.hadoop.conf.Configuration;
-import org.apache.hadoop.fs.Path;
-import org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch;
-import org.apache.nifi.annotation.behavior.InputRequirement;
-import org.apache.nifi.annotation.behavior.SideEffectFree;
-import org.apache.nifi.annotation.behavior.SupportsBatching;
-import org.apache.nifi.annotation.behavior.WritesAttribute;
-import org.apache.nifi.annotation.behavior.WritesAttributes;
-import org.apache.nifi.annotation.documentation.CapabilityDescription;
-import org.apache.nifi.annotation.documentation.Tags;
-import org.apache.nifi.annotation.lifecycle.OnScheduled;
-import org.apache.nifi.components.PropertyDescriptor;
-import org.apache.nifi.flowfile.FlowFile;
-import org.apache.nifi.flowfile.attributes.CoreAttributes;
-import org.apache.nifi.processor.AbstractProcessor;
-import org.apache.nifi.processor.DataUnit;
-import org.apache.nifi.processor.ProcessContext;
-import org.apache.nifi.processor.ProcessSession;
-import org.apache.nifi.processor.Relationship;
-import org.apache.nifi.processor.exception.ProcessException;
-import org.apache.nifi.processor.io.StreamCallback;
-import org.apache.nifi.processor.util.StandardValidators;
-import org.apache.nifi.util.hive.HiveJdbcCommon;
-import org.apache.nifi.util.hive.HiveUtils;
-import org.apache.nifi.util.orc.OrcFlowFileWriter;
-import org.apache.nifi.util.orc.OrcUtils;
-import org.apache.orc.CompressionKind;
-import org.apache.orc.OrcFile;
-import org.apache.orc.TypeDescription;
-
-import java.io.BufferedInputStream;
-import java.io.BufferedOutputStream;
-import java.io.IOException;
-import java.io.InputStream;
-import java.io.OutputStream;
-import java.util.ArrayList;
-import java.util.Collections;
-import java.util.HashSet;
-import java.util.List;
-import java.util.Set;
-import java.util.concurrent.atomic.AtomicInteger;
-import java.util.concurrent.atomic.AtomicReference;
-
-/**
- * The ConvertAvroToORC processor takes an Avro-formatted flow file as input and converts it into ORC format.
- */
-@SideEffectFree
-@SupportsBatching
-@Tags({"avro", "orc", "hive", "convert"})
-@InputRequirement(InputRequirement.Requirement.INPUT_REQUIRED)
-@CapabilityDescription("Converts an Avro record into ORC file format. This processor provides a direct mapping of an Avro record to an ORC record, such "
-        + "that the resulting ORC file will have the same hierarchical structure as the Avro document. If an incoming FlowFile contains a stream of "
-        + "multiple Avro records, the resultant FlowFile will contain an ORC file containing all of the Avro records. If an incoming FlowFile does "
-        + "not contain any records, an empty ORC file is the output.")
-@WritesAttributes({
-        @WritesAttribute(attribute = "mime.type", description = "Sets the mime type to application/octet-stream"),
-        @WritesAttribute(attribute = "filename", description = "Sets the filename to the existing filename with its extension replaced by .orc (or with .orc appended if there is no extension)"),
-        @WritesAttribute(attribute = "record.count", description = "Sets the number of records in the ORC file."),
-        @WritesAttribute(attribute = "hive.ddl", description = "Creates a partial Hive DDL statement for creating a table in Hive from this ORC file. "
" - + "This can be used in ReplaceText for setting the content to the DDL. To make it valid DDL, add \"LOCATION ''\", where " - + "the path is the directory that contains this ORC file on HDFS. For example, ConvertAvroToORC can send flow files to a PutHDFS processor to send the file to " - + "HDFS, then to a ReplaceText to set the content to this DDL (plus the LOCATION clause as described), then to PutHiveQL processor to create the table " - + "if it doesn't exist.") -}) -public class ConvertAvroToORC extends AbstractProcessor { - - // Attributes - public static final String ORC_MIME_TYPE = "application/octet-stream"; - public static final String HIVE_DDL_ATTRIBUTE = "hive.ddl"; - public static final String RECORD_COUNT_ATTRIBUTE = "record.count"; - - - // Properties - public static final PropertyDescriptor ORC_CONFIGURATION_RESOURCES = new PropertyDescriptor.Builder() - .name("orc-config-resources") - .displayName("ORC Configuration Resources") - .description("A file or comma separated list of files which contains the ORC configuration (hive-site.xml, e.g.). Without this, Hadoop " - + "will search the classpath for a 'hive-site.xml' file or will revert to a default configuration. Please see the ORC documentation for more details.") - .required(false).addValidator(HiveUtils.createMultipleFilesExistValidator()).build(); - - public static final PropertyDescriptor STRIPE_SIZE = new PropertyDescriptor.Builder() - .name("orc-stripe-size") - .displayName("Stripe Size") - .description("The size of the memory buffer (in bytes) for writing stripes to an ORC file") - .required(true) - .addValidator(StandardValidators.DATA_SIZE_VALIDATOR) - .defaultValue("100 KB") - .build(); - - public static final PropertyDescriptor BUFFER_SIZE = new PropertyDescriptor.Builder() - .name("orc-buffer-size") - .displayName("Buffer Size") - .description("The maximum size of the memory buffers (in bytes) used for compressing and storing a stripe in memory. This is a hint to the ORC writer, " - + "which may choose to use a smaller buffer size based on stripe size and number of columns for efficient stripe writing and memory utilization.") - .required(true) - .addValidator(StandardValidators.DATA_SIZE_VALIDATOR) - .defaultValue("10 KB") - .build(); - - public static final PropertyDescriptor COMPRESSION_TYPE = new PropertyDescriptor.Builder() - .name("orc-compression-type") - .displayName("Compression Type") - .required(true) - .allowableValues("NONE", "ZLIB", "SNAPPY", "LZO") - .defaultValue("NONE") - .build(); - - public static final PropertyDescriptor HIVE_TABLE_NAME = new PropertyDescriptor.Builder() - .name("orc-hive-table-name") - .displayName("Hive Table Name") - .description("An optional table name to insert into the hive.ddl attribute. The generated DDL can be used by " - + "a PutHiveQL processor (presumably after a PutHDFS processor) to create a table backed by the converted ORC file. 
" - + "If this property is not provided, the full name (including namespace) of the incoming Avro record will be normalized " - + "and used as the table name.") - .required(false) - .expressionLanguageSupported(true) - .addValidator(StandardValidators.NON_BLANK_VALIDATOR) - .build(); - - // Relationships - static final Relationship REL_SUCCESS = new Relationship.Builder() - .name("success") - .description("A FlowFile is routed to this relationship after it has been converted to ORC format.") - .build(); - static final Relationship REL_FAILURE = new Relationship.Builder() - .name("failure") - .description("A FlowFile is routed to this relationship if it cannot be parsed as Avro or cannot be converted to ORC for any reason") - .build(); - - private final static List propertyDescriptors; - private final static Set relationships; - - private volatile Configuration orcConfig; - - /* - * Will ensure that the list of property descriptors is built only once. - * Will also create a Set of relationships - */ - static { - List _propertyDescriptors = new ArrayList<>(); - _propertyDescriptors.add(ORC_CONFIGURATION_RESOURCES); - _propertyDescriptors.add(STRIPE_SIZE); - _propertyDescriptors.add(BUFFER_SIZE); - _propertyDescriptors.add(COMPRESSION_TYPE); - _propertyDescriptors.add(HIVE_TABLE_NAME); - propertyDescriptors = Collections.unmodifiableList(_propertyDescriptors); - - Set _relationships = new HashSet<>(); - _relationships.add(REL_SUCCESS); - _relationships.add(REL_FAILURE); - relationships = Collections.unmodifiableSet(_relationships); - } - - @Override - protected List getSupportedPropertyDescriptors() { - return propertyDescriptors; - } - - @Override - public Set getRelationships() { - return relationships; - } - - @OnScheduled - public void setup(ProcessContext context) { - boolean confFileProvided = context.getProperty(ORC_CONFIGURATION_RESOURCES).isSet(); - if (confFileProvided) { - final String configFiles = context.getProperty(ORC_CONFIGURATION_RESOURCES).getValue(); - orcConfig = HiveJdbcCommon.getConfigurationFromFiles(configFiles); - } - } - - @Override - public void onTrigger(final ProcessContext context, final ProcessSession session) throws ProcessException { - FlowFile flowFile = session.get(); - if (flowFile == null) { - return; - } - - try { - long startTime = System.currentTimeMillis(); - final long stripeSize = context.getProperty(STRIPE_SIZE).asDataSize(DataUnit.B).longValue(); - final int bufferSize = context.getProperty(BUFFER_SIZE).asDataSize(DataUnit.B).intValue(); - final CompressionKind compressionType = CompressionKind.valueOf(context.getProperty(COMPRESSION_TYPE).getValue()); - final AtomicReference hiveAvroSchema = new AtomicReference<>(null); - final AtomicInteger totalRecordCount = new AtomicInteger(0); - final String fileName = flowFile.getAttribute(CoreAttributes.FILENAME.key()); - flowFile = session.write(flowFile, new StreamCallback() { - @Override - public void process(final InputStream rawIn, final OutputStream rawOut) throws IOException { - try (final InputStream in = new BufferedInputStream(rawIn); - final OutputStream out = new BufferedOutputStream(rawOut); - final DataFileStream reader = new DataFileStream<>(in, new GenericDatumReader<>())) { - - // Create ORC schema from Avro schema - Schema avroSchema = reader.getSchema(); - TypeDescription orcSchema = OrcUtils.getOrcField(avroSchema); - - if (orcConfig == null) { - orcConfig = new Configuration(); - } - OrcFile.WriterOptions options = OrcFile.writerOptions(orcConfig) - .setSchema(orcSchema) - 
-                                .stripeSize(stripeSize)
-                                .bufferSize(bufferSize)
-                                .compress(compressionType)
-                                .version(OrcFile.Version.CURRENT);
-
-                        OrcFlowFileWriter orcWriter = new OrcFlowFileWriter(out, new Path(fileName), options);
-                        try {
-                            VectorizedRowBatch batch = orcSchema.createRowBatch();
-                            int recordCount = 0;
-                            int recordsInBatch = 0;
-                            GenericRecord currRecord = null;
-                            while (reader.hasNext()) {
-                                currRecord = reader.next(currRecord);
-                                List<Schema.Field> fields = currRecord.getSchema().getFields();
-                                if (fields != null) {
-                                    MutableInt[] vectorOffsets = new MutableInt[fields.size()];
-                                    for (int i = 0; i < fields.size(); i++) {
-                                        vectorOffsets[i] = new MutableInt(0);
-                                        Schema.Field field = fields.get(i);
-                                        Schema fieldSchema = field.schema();
-                                        Object o = currRecord.get(field.name());
-                                        try {
-                                            OrcUtils.putToRowBatch(batch.cols[i], vectorOffsets[i], recordsInBatch, fieldSchema, o);
-                                        } catch (ArrayIndexOutOfBoundsException aioobe) {
-                                            getLogger().error("Index out of bounds at record {} for column {}, type {}, and object {}",
-                                                    new Object[]{recordsInBatch, i, fieldSchema.getType().getName(), o.toString()},
-                                                    aioobe);
-                                            throw new IOException(aioobe);
-                                        }
-                                    }
-                                }
-                                recordCount++;
-                                recordsInBatch++;
-
-                                if (recordsInBatch == batch.getMaxSize()) {
-                                    // add batch and start a new one
-                                    batch.size = recordsInBatch;
-                                    orcWriter.addRowBatch(batch);
-                                    batch = orcSchema.createRowBatch();
-                                    recordsInBatch = 0;
-                                }
-                            }
-
-                            // If there are records in the batch, add the batch
-                            if (recordsInBatch > 0) {
-                                batch.size = recordsInBatch;
-                                orcWriter.addRowBatch(batch);
-                            }
-
-                            hiveAvroSchema.set(avroSchema);
-                            totalRecordCount.set(recordCount);
-                        } finally {
-                            // finished writing this record set, close the writer (which will flush to the flow file)
-                            orcWriter.close();
-                        }
-                    }
-                }
-            });
-
-            final String hiveTableName = context.getProperty(HIVE_TABLE_NAME).isSet()
-                    ? context.getProperty(HIVE_TABLE_NAME).evaluateAttributeExpressions(flowFile).getValue()
-                    : OrcUtils.normalizeHiveTableName(hiveAvroSchema.get().getFullName());
-            String hiveDDL = OrcUtils.generateHiveDDL(hiveAvroSchema.get(), hiveTableName);
-            // Add attributes and transfer to success
-            flowFile = session.putAttribute(flowFile, RECORD_COUNT_ATTRIBUTE, Integer.toString(totalRecordCount.get()));
-            flowFile = session.putAttribute(flowFile, HIVE_DDL_ATTRIBUTE, hiveDDL);
-            StringBuilder newFilename = new StringBuilder();
-            int extensionIndex = fileName.lastIndexOf(".");
-            if (extensionIndex != -1) {
-                newFilename.append(fileName.substring(0, extensionIndex));
-            } else {
-                newFilename.append(fileName);
-            }
-            newFilename.append(".orc");
-            flowFile = session.putAttribute(flowFile, CoreAttributes.MIME_TYPE.key(), ORC_MIME_TYPE);
-            flowFile = session.putAttribute(flowFile, CoreAttributes.FILENAME.key(), newFilename.toString());
-            session.transfer(flowFile, REL_SUCCESS);
-            session.getProvenanceReporter().modifyContent(flowFile, "Converted " + totalRecordCount.get() + " records", System.currentTimeMillis() - startTime);
-        } catch (final ProcessException pe) {
-            getLogger().error("Failed to convert {} from Avro to ORC due to {}; transferring to failure", new Object[]{flowFile, pe});
-            session.transfer(flowFile, REL_FAILURE);
-        }
-    }
-}
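To make the hive.ddl workflow from the capability description concrete, here is a minimal sketch of what the downstream ReplaceText and PutHiveQL steps work with. The table name, column list, and HDFS path are hypothetical, and the exact shape of the partial DDL is an assumption based on the attribute description above (a CREATE statement that becomes valid once a LOCATION clause is appended):

public class HiveDdlExample {
    public static void main(String[] args) {
        // Hypothetical value of the hive.ddl attribute written by ConvertAvroToORC
        String hiveDdl = "CREATE EXTERNAL TABLE IF NOT EXISTS my_table (name STRING, age INT) STORED AS ORC";
        // Directory on HDFS where PutHDFS placed the .orc file (hypothetical)
        String orcDir = "/data/my_table";
        // ReplaceText sets the FlowFile content to the completed statement,
        // which PutHiveQL then executes to create the table if needed
        String completeDdl = hiveDdl + " LOCATION '" + orcDir + "'";
        System.out.println(completeDdl);
    }
}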
diff --git a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/util/orc/OrcFlowFileWriter.java b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/util/orc/OrcFlowFileWriter.java
deleted file mode 100644
index 7055fcbd5e..0000000000
--- a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/util/orc/OrcFlowFileWriter.java
+++ /dev/null
@@ -1,2944 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */ -package org.apache.nifi.util.orc; - -import static com.google.common.base.Preconditions.checkArgument; - -import java.io.IOException; -import java.io.OutputStream; -import java.nio.ByteBuffer; -import java.sql.Timestamp; -import java.util.ArrayList; -import java.util.Arrays; -import java.util.EnumSet; -import java.util.List; -import java.util.Map; -import java.util.TimeZone; -import java.util.TreeMap; - -import org.apache.hadoop.conf.Configuration; -import org.apache.hadoop.fs.Path; -import org.apache.hadoop.hive.ql.util.JavaDataModel; -import org.apache.nifi.stream.io.ByteCountingOutputStream; -import org.apache.orc.BinaryColumnStatistics; -import org.apache.orc.BloomFilterIO; -import org.apache.orc.CompressionCodec; -import org.apache.orc.CompressionKind; -import org.apache.orc.OrcConf; -import org.apache.orc.OrcFile; -import org.apache.orc.OrcProto; -import org.apache.orc.OrcUtils; -import org.apache.orc.StringColumnStatistics; -import org.apache.orc.StripeInformation; -import org.apache.orc.TypeDescription; -import org.apache.orc.Writer; -import org.apache.orc.impl.BitFieldWriter; -import org.apache.orc.impl.ColumnStatisticsImpl; -import org.apache.orc.impl.DynamicIntArray; -import org.apache.orc.impl.IntegerWriter; -import org.apache.orc.impl.MemoryManager; -import org.apache.orc.impl.OutStream; -import org.apache.orc.impl.PositionRecorder; -import org.apache.orc.impl.PositionedOutputStream; -import org.apache.orc.impl.RunLengthByteWriter; -import org.apache.orc.impl.RunLengthIntegerWriter; -import org.apache.orc.impl.RunLengthIntegerWriterV2; -import org.apache.orc.impl.SerializationUtils; -import org.apache.orc.impl.SnappyCodec; -import org.apache.orc.impl.StreamName; -import org.apache.orc.impl.StringRedBlackTree; -import org.apache.orc.impl.ZlibCodec; -import org.slf4j.Logger; -import org.slf4j.LoggerFactory; -import org.apache.hadoop.hive.common.type.HiveDecimal; -import org.apache.hadoop.hive.ql.exec.vector.BytesColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.ColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.DecimalColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.DoubleColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.ListColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.LongColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.MapColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.StructColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.TimestampColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.UnionColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch; -import org.apache.hadoop.io.Text; - -import com.google.common.annotations.VisibleForTesting; -import com.google.common.collect.Lists; -import com.google.common.primitives.Longs; -import com.google.protobuf.ByteString; -import com.google.protobuf.CodedOutputStream; - -/** - * An ORC file writer. The file is divided into stripes, which is the natural - * unit of work when reading. Each stripe is buffered in memory until the - * memory reaches the stripe size and then it is written out broken down by - * columns. Each column is written by a TreeWriter that is specific to that - * type of column. TreeWriters may have children TreeWriters that handle the - * sub-types. Each of the TreeWriters writes the column's data as a set of - * streams. - *
- * This class is unsynchronized, like most Stream objects, so the creation of
- * an OrcFile and all access to a single instance must be confined to a single
- * thread.
- *
- * There are no known cases today where a single instance is accessed from
- * different threads.
- *
- * Caveat: the MemoryManager is created during WriterOptions create, that has - * to be confined to a single thread as well. - */ -public class OrcFlowFileWriter implements Writer, MemoryManager.Callback { - - private static final Logger LOG = LoggerFactory.getLogger(OrcFlowFileWriter.class); - - private static final int HDFS_BUFFER_SIZE = 256 * 1024; - private static final int MIN_ROW_INDEX_STRIDE = 1000; - - // threshold above which buffer size will be automatically resized - private static final int COLUMN_COUNT_THRESHOLD = 1000; - - private final Path path; - private final long defaultStripeSize; - private long adjustedStripeSize; - private final int rowIndexStride; - private final CompressionKind compress; - private final CompressionCodec codec; - private final boolean addBlockPadding; - private final int bufferSize; - private final long blockSize; - private final double paddingTolerance; - private final TypeDescription schema; - - private final OutputStream flowFileOutputStream; - - // the streams that make up the current stripe - private final Map streams = new TreeMap<>(); - - private ByteCountingOutputStream rawWriter = null; - // the compressed metadata information outStream - private OutStream writer = null; - // a protobuf outStream around streamFactory - private CodedOutputStream protobufWriter = null; - private long headerLength; - private int columnCount; - private long rowCount = 0; - private long rowsInStripe = 0; - private long rawDataSize = 0; - private int rowsInIndex = 0; - private int stripesAtLastFlush = -1; - private final List stripes = new ArrayList<>(); - private final Map userMetadata = new TreeMap<>(); - private final StreamFactory streamFactory = new StreamFactory(); - private final TreeWriter treeWriter; - private final boolean buildIndex; - private final MemoryManager memoryManager; - private final OrcFile.Version version; - private final Configuration conf; - private final OrcFile.WriterCallback callback; - private final OrcFile.WriterContext callbackContext; - private final OrcFile.EncodingStrategy encodingStrategy; - private final OrcFile.CompressionStrategy compressionStrategy; - private final boolean[] bloomFilterColumns; - private final double bloomFilterFpp; - private boolean writeTimeZone; - - public OrcFlowFileWriter(OutputStream flowFileOutputStream, Path path, OrcFile.WriterOptions opts) throws IOException { - this.flowFileOutputStream = flowFileOutputStream; - this.path = path; - this.conf = opts.getConfiguration(); - this.callback = opts.getCallback(); - this.schema = opts.getSchema(); - if (callback != null) { - callbackContext = new OrcFile.WriterContext() { - - @Override - public Writer getWriter() { - return OrcFlowFileWriter.this; - } - }; - } else { - callbackContext = null; - } - this.adjustedStripeSize = opts.getStripeSize(); - this.defaultStripeSize = opts.getStripeSize(); - this.version = opts.getVersion(); - this.encodingStrategy = opts.getEncodingStrategy(); - this.compressionStrategy = opts.getCompressionStrategy(); - this.addBlockPadding = opts.getBlockPadding(); - this.blockSize = opts.getBlockSize(); - this.paddingTolerance = opts.getPaddingTolerance(); - this.compress = opts.getCompress(); - this.rowIndexStride = opts.getRowIndexStride(); - this.memoryManager = opts.getMemoryManager(); - buildIndex = rowIndexStride > 0; - codec = createCodec(compress); - int numColumns = schema.getMaximumId() + 1; - if (opts.isEnforceBufferSize()) { - this.bufferSize = opts.getBufferSize(); - } else { - this.bufferSize = 
getEstimatedBufferSize(defaultStripeSize, - numColumns, opts.getBufferSize()); - } - if (version == OrcFile.Version.V_0_11) { - /* do not write bloom filters for ORC v11 */ - this.bloomFilterColumns = new boolean[schema.getMaximumId() + 1]; - } else { - this.bloomFilterColumns = - OrcUtils.includeColumns(opts.getBloomFilterColumns(), schema); - } - this.bloomFilterFpp = opts.getBloomFilterFpp(); - treeWriter = createTreeWriter(schema, streamFactory, false); - if (buildIndex && rowIndexStride < MIN_ROW_INDEX_STRIDE) { - throw new IllegalArgumentException("Row stride must be at least " + - MIN_ROW_INDEX_STRIDE); - } - - // ensure that we are able to handle callbacks before we register ourselves - memoryManager.addWriter(path, opts.getStripeSize(), this); - LOG.info("ORC writer created for path: {} with stripeSize: {} blockSize: {}" + - " compression: {} bufferSize: {}", path, defaultStripeSize, blockSize, - compress, bufferSize); - } - - @VisibleForTesting - public static int getEstimatedBufferSize(long stripeSize, int numColumns, - int bs) { - // The worst case is that there are 2 big streams per a column and - // we want to guarantee that each stream gets ~10 buffers. - // This keeps buffers small enough that we don't get really small stripe - // sizes. - int estBufferSize = (int) (stripeSize / (20 * numColumns)); - estBufferSize = getClosestBufferSize(estBufferSize); - return estBufferSize > bs ? bs : estBufferSize; - } - - private static int getClosestBufferSize(int estBufferSize) { - final int kb4 = 4 * 1024; - final int kb8 = 8 * 1024; - final int kb16 = 16 * 1024; - final int kb32 = 32 * 1024; - final int kb64 = 64 * 1024; - final int kb128 = 128 * 1024; - final int kb256 = 256 * 1024; - if (estBufferSize <= kb4) { - return kb4; - } else if (estBufferSize > kb4 && estBufferSize <= kb8) { - return kb8; - } else if (estBufferSize > kb8 && estBufferSize <= kb16) { - return kb16; - } else if (estBufferSize > kb16 && estBufferSize <= kb32) { - return kb32; - } else if (estBufferSize > kb32 && estBufferSize <= kb64) { - return kb64; - } else if (estBufferSize > kb64 && estBufferSize <= kb128) { - return kb128; - } else { - return kb256; - } - } - - public static CompressionCodec createCodec(CompressionKind kind) { - switch (kind) { - case NONE: - return null; - case ZLIB: - return new ZlibCodec(); - case SNAPPY: - return new SnappyCodec(); - case LZO: - try { - ClassLoader loader = Thread.currentThread().getContextClassLoader(); - if (loader == null) { - loader = OrcFlowFileWriter.class.getClassLoader(); - } - @SuppressWarnings("unchecked") - Class lzo = - (Class) - loader.loadClass("org.apache.hadoop.hive.ql.io.orc.LzoCodec"); - return lzo.newInstance(); - } catch (ClassNotFoundException e) { - throw new IllegalArgumentException("LZO is not available.", e); - } catch (InstantiationException e) { - throw new IllegalArgumentException("Problem initializing LZO", e); - } catch (IllegalAccessException e) { - throw new IllegalArgumentException("Insufficient access to LZO", e); - } - default: - throw new IllegalArgumentException("Unknown compression codec: " + - kind); - } - } - - @Override - public boolean checkMemory(double newScale) throws IOException { - long limit = (long) Math.round(adjustedStripeSize * newScale); - long size = estimateStripeSize(); - if (LOG.isDebugEnabled()) { - LOG.debug("ORC writer " + path + " size = " + size + " limit = " + - limit); - } - if (size > limit) { - flushStripe(); - return true; - } - return false; - } - - /** - * This class is used to hold the contents of 
streams as they are buffered. - * The TreeWriters write to the outStream and the codec compresses the - * data as buffers fill up and stores them in the output list. When the - * stripe is being written, the whole stream is written to the file. - */ - private class BufferedStream implements OutStream.OutputReceiver { - private final OutStream outStream; - private final List output = new ArrayList(); - - BufferedStream(String name, int bufferSize, - CompressionCodec codec) throws IOException { - outStream = new OutStream(name, bufferSize, codec, this); - } - - /** - * Receive a buffer from the compression codec. - * - * @param buffer the buffer to save - */ - @Override - public void output(ByteBuffer buffer) { - output.add(buffer); - } - - /** - * Get the number of bytes in buffers that are allocated to this stream. - * - * @return number of bytes in buffers - */ - public long getBufferSize() { - long result = 0; - for (ByteBuffer buf : output) { - result += buf.capacity(); - } - return outStream.getBufferSize() + result; - } - - /** - * Flush the stream to the codec. - * - * @throws IOException if an error occurs during flush - */ - public void flush() throws IOException { - outStream.flush(); - } - - /** - * Clear all of the buffers. - * - * @throws IOException if an error occurs during clear - */ - public void clear() throws IOException { - outStream.clear(); - output.clear(); - } - - /** - * Check the state of suppress flag in output stream - * - * @return value of suppress flag - */ - public boolean isSuppressed() { - return outStream.isSuppressed(); - } - - /** - * Get the number of bytes that will be written to the output. Assumes - * the stream has already been flushed. - * - * @return the number of bytes - */ - public long getOutputSize() { - long result = 0; - for (ByteBuffer buffer : output) { - result += buffer.remaining(); - } - return result; - } - - /** - * Write the saved compressed buffers to the OutputStream. - * - * @param out the stream to write to - * @throws IOException if an error occurs while writing to the output stream - */ - void spillTo(OutputStream out) throws IOException { - for (ByteBuffer buffer : output) { - out.write(buffer.array(), buffer.arrayOffset() + buffer.position(), - buffer.remaining()); - } - } - - @Override - public String toString() { - return outStream.toString(); - } - } - - /** - * An output receiver that writes the ByteBuffers to the output stream - * as they are received. - */ - private class DirectStream implements OutStream.OutputReceiver { - private final OutputStream output; - - DirectStream(OutputStream output) { - this.output = output; - } - - @Override - public void output(ByteBuffer buffer) throws IOException { - output.write(buffer.array(), buffer.arrayOffset() + buffer.position(), - buffer.remaining()); - } - } - - private static class RowIndexPositionRecorder implements PositionRecorder { - private final OrcProto.RowIndexEntry.Builder builder; - - RowIndexPositionRecorder(OrcProto.RowIndexEntry.Builder builder) { - this.builder = builder; - } - - @Override - public void addPosition(long position) { - builder.addPositions(position); - } - } - - /** - * Interface from the Writer to the TreeWriters. This limits the visibility - * that the TreeWriters have into the Writer. - */ - private class StreamFactory { - /** - * Create a stream to store part of a column. - * - * @param column the column id for the stream - * @param kind the kind of stream - * @return The output outStream that the section needs to be written to. 
- * @throws IOException if an error occurs while creating the stream - */ - public OutStream createStream(int column, OrcProto.Stream.Kind kind) throws IOException { - final StreamName name = new StreamName(column, kind); - final EnumSet modifiers; - - switch (kind) { - case BLOOM_FILTER: - case DATA: - case DICTIONARY_DATA: - if (getCompressionStrategy() == OrcFile.CompressionStrategy.SPEED) { - modifiers = EnumSet.of(CompressionCodec.Modifier.FAST, - CompressionCodec.Modifier.TEXT); - } else { - modifiers = EnumSet.of(CompressionCodec.Modifier.DEFAULT, - CompressionCodec.Modifier.TEXT); - } - break; - case LENGTH: - case DICTIONARY_COUNT: - case PRESENT: - case ROW_INDEX: - case SECONDARY: - // easily compressed using the fastest modes - modifiers = EnumSet.of(CompressionCodec.Modifier.FASTEST, - CompressionCodec.Modifier.BINARY); - break; - default: - LOG.warn("Missing ORC compression modifiers for " + kind); - modifiers = null; - break; - } - - BufferedStream result = streams.get(name); - if (result == null) { - result = new BufferedStream(name.toString(), bufferSize, - codec == null ? codec : codec.modify(modifiers)); - streams.put(name, result); - } - return result.outStream; - } - - /** - * Get the next column id. - * - * @return a number from 0 to the number of columns - 1 - */ - public int getNextColumnId() { - return columnCount++; - } - - /** - * Get the stride rate of the row index. - */ - public int getRowIndexStride() { - return rowIndexStride; - } - - /** - * Should be building the row index. - * - * @return true if we are building the index - */ - public boolean buildIndex() { - return buildIndex; - } - - /** - * Is the ORC file compressed? - * - * @return are the streams compressed - */ - public boolean isCompressed() { - return codec != null; - } - - /** - * Get the encoding strategy to use. - * - * @return encoding strategy - */ - public OrcFile.EncodingStrategy getEncodingStrategy() { - return encodingStrategy; - } - - /** - * Get the compression strategy to use. - * - * @return compression strategy - */ - public OrcFile.CompressionStrategy getCompressionStrategy() { - return compressionStrategy; - } - - /** - * Get the bloom filter columns - * - * @return bloom filter columns - */ - public boolean[] getBloomFilterColumns() { - return bloomFilterColumns; - } - - /** - * Get bloom filter false positive percentage. - * - * @return fpp - */ - public double getBloomFilterFPP() { - return bloomFilterFpp; - } - - /** - * Get the writer's configuration. - * - * @return configuration - */ - public Configuration getConfiguration() { - return conf; - } - - /** - * Get the version of the file to write. - */ - public OrcFile.Version getVersion() { - return version; - } - - public void useWriterTimeZone(boolean val) { - writeTimeZone = val; - } - - public boolean hasWriterTimeZone() { - return writeTimeZone; - } - } - - /** - * The parent class of all of the writers for each column. Each column - * is written by an instance of this class. The compound types (struct, - * list, map, and union) have children tree writers that write the children - * types. 
- */ - private abstract static class TreeWriter { - protected final int id; - protected final BitFieldWriter isPresent; - private final boolean isCompressed; - protected final ColumnStatisticsImpl indexStatistics; - protected final ColumnStatisticsImpl stripeColStatistics; - private final ColumnStatisticsImpl fileStatistics; - protected TreeWriter[] childrenWriters; - protected final RowIndexPositionRecorder rowIndexPosition; - private final OrcProto.RowIndex.Builder rowIndex; - private final OrcProto.RowIndexEntry.Builder rowIndexEntry; - private final PositionedOutputStream rowIndexStream; - private final PositionedOutputStream bloomFilterStream; - protected final BloomFilterIO bloomFilter; - protected final boolean createBloomFilter; - private final OrcProto.BloomFilterIndex.Builder bloomFilterIndex; - private final OrcProto.BloomFilter.Builder bloomFilterEntry; - private boolean foundNulls; - private OutStream isPresentOutStream; - private final List stripeStatsBuilders; - private final StreamFactory streamFactory; - - /** - * Create a tree writer. - * - * @param columnId the column id of the column to write - * @param schema the row schema - * @param streamFactory limited access to the Writer's data. - * @param nullable can the value be null? - * @throws IOException if an error occurs while creating the tree writer - */ - TreeWriter(int columnId, - TypeDescription schema, - StreamFactory streamFactory, - boolean nullable) throws IOException { - this.streamFactory = streamFactory; - this.isCompressed = streamFactory.isCompressed(); - this.id = columnId; - if (nullable) { - isPresentOutStream = streamFactory.createStream(id, - OrcProto.Stream.Kind.PRESENT); - isPresent = new BitFieldWriter(isPresentOutStream, 1); - } else { - isPresent = null; - } - this.foundNulls = false; - createBloomFilter = streamFactory.getBloomFilterColumns()[columnId]; - indexStatistics = ColumnStatisticsImpl.create(schema); - stripeColStatistics = ColumnStatisticsImpl.create(schema); - fileStatistics = ColumnStatisticsImpl.create(schema); - childrenWriters = new TreeWriter[0]; - rowIndex = OrcProto.RowIndex.newBuilder(); - rowIndexEntry = OrcProto.RowIndexEntry.newBuilder(); - rowIndexPosition = new RowIndexPositionRecorder(rowIndexEntry); - stripeStatsBuilders = Lists.newArrayList(); - if (streamFactory.buildIndex()) { - rowIndexStream = streamFactory.createStream(id, OrcProto.Stream.Kind.ROW_INDEX); - } else { - rowIndexStream = null; - } - if (createBloomFilter) { - bloomFilterEntry = OrcProto.BloomFilter.newBuilder(); - bloomFilterIndex = OrcProto.BloomFilterIndex.newBuilder(); - bloomFilterStream = streamFactory.createStream(id, OrcProto.Stream.Kind.BLOOM_FILTER); - bloomFilter = new BloomFilterIO(streamFactory.getRowIndexStride(), - streamFactory.getBloomFilterFPP()); - } else { - bloomFilterEntry = null; - bloomFilterIndex = null; - bloomFilterStream = null; - bloomFilter = null; - } - } - - protected OrcProto.RowIndex.Builder getRowIndex() { - return rowIndex; - } - - protected ColumnStatisticsImpl getStripeStatistics() { - return stripeColStatistics; - } - - protected OrcProto.RowIndexEntry.Builder getRowIndexEntry() { - return rowIndexEntry; - } - - IntegerWriter createIntegerWriter(PositionedOutputStream output, - boolean signed, boolean isDirectV2, - StreamFactory writer) { - if (isDirectV2) { - boolean alignedBitpacking = false; - if (writer.getEncodingStrategy().equals(OrcFile.EncodingStrategy.SPEED)) { - alignedBitpacking = true; - } - return new RunLengthIntegerWriterV2(output, signed, 
alignedBitpacking); - } else { - return new RunLengthIntegerWriter(output, signed); - } - } - - boolean isNewWriteFormat(StreamFactory writer) { - return writer.getVersion() != OrcFile.Version.V_0_11; - } - - /** - * Handle the top level object write. - *
- * This default method is used for all types except structs, which are the - * typical case. VectorizedRowBatch assumes the top level object is a - * struct, so we use the first column for all other types. - * - * @param batch the batch to write from - * @param offset the row to start on - * @param length the number of rows to write - * @throws IOException if an error occurs while writing the batch - */ - void writeRootBatch(VectorizedRowBatch batch, int offset, - int length) throws IOException { - writeBatch(batch.cols[0], offset, length); - } - - /** - * Write the values from the given vector from offset for length elements. - * - * @param vector the vector to write from - * @param offset the first value from the vector to write - * @param length the number of values from the vector to write - * @throws IOException if an error occurs while writing the batch - */ - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - if (vector.noNulls) { - indexStatistics.increment(length); - if (isPresent != null) { - for (int i = 0; i < length; ++i) { - isPresent.write(1); - } - } - } else { - if (vector.isRepeating) { - boolean isNull = vector.isNull[0]; - if (isPresent != null) { - for (int i = 0; i < length; ++i) { - isPresent.write(isNull ? 0 : 1); - } - } - if (isNull) { - foundNulls = true; - indexStatistics.setNull(); - } else { - indexStatistics.increment(length); - } - } else { - // count the number of non-null values - int nonNullCount = 0; - for (int i = 0; i < length; ++i) { - boolean isNull = vector.isNull[i + offset]; - if (!isNull) { - nonNullCount += 1; - } - if (isPresent != null) { - isPresent.write(isNull ? 0 : 1); - } - } - indexStatistics.increment(nonNullCount); - if (nonNullCount != length) { - foundNulls = true; - indexStatistics.setNull(); - } - } - } - } - - private void removeIsPresentPositions() { - for (int i = 0; i < rowIndex.getEntryCount(); ++i) { - OrcProto.RowIndexEntry.Builder entry = rowIndex.getEntryBuilder(i); - List positions = entry.getPositionsList(); - // bit streams use 3 positions if uncompressed, 4 if compressed - positions = positions.subList(isCompressed ? 4 : 3, positions.size()); - entry.clearPositions(); - entry.addAllPositions(positions); - } - } - - /** - * Write the stripe out to the file. - * - * @param builder the stripe footer that contains the information about the - * layout of the stripe. The TreeWriter is required to update - * the footer with its information. - * @param requiredIndexEntries the number of index entries that are - * required. this is to check to make sure the - * row index is well formed. 
- * @throws IOException if an error occurs while writing the stripe - */ - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - if (isPresent != null) { - isPresent.flush(); - - // if no nulls are found in a stream, then suppress the stream - if (!foundNulls) { - isPresentOutStream.suppress(); - // since isPresent bitstream is suppressed, update the index to - // remove the positions of the isPresent stream - if (rowIndexStream != null) { - removeIsPresentPositions(); - } - } - } - - // merge stripe-level column statistics to file statistics and write it to - // stripe statistics - OrcProto.StripeStatistics.Builder stripeStatsBuilder = OrcProto.StripeStatistics.newBuilder(); - writeStripeStatistics(stripeStatsBuilder, this); - stripeStatsBuilders.add(stripeStatsBuilder); - - // reset the flag for next stripe - foundNulls = false; - - builder.addColumns(getEncoding()); - if (streamFactory.hasWriterTimeZone()) { - builder.setWriterTimezone(TimeZone.getDefault().getID()); - } - if (rowIndexStream != null) { - if (rowIndex.getEntryCount() != requiredIndexEntries) { - throw new IllegalArgumentException("Column has wrong number of " + - "index entries found: " + rowIndex.getEntryCount() + " expected: " + - requiredIndexEntries); - } - rowIndex.build().writeTo(rowIndexStream); - rowIndexStream.flush(); - } - rowIndex.clear(); - rowIndexEntry.clear(); - - // write the bloom filter to out stream - if (bloomFilterStream != null) { - bloomFilterIndex.build().writeTo(bloomFilterStream); - bloomFilterStream.flush(); - bloomFilterIndex.clear(); - bloomFilterEntry.clear(); - } - } - - private void writeStripeStatistics(OrcProto.StripeStatistics.Builder builder, - TreeWriter treeWriter) { - treeWriter.fileStatistics.merge(treeWriter.stripeColStatistics); - builder.addColStats(treeWriter.stripeColStatistics.serialize().build()); - treeWriter.stripeColStatistics.reset(); - for (TreeWriter child : treeWriter.getChildrenWriters()) { - writeStripeStatistics(builder, child); - } - } - - TreeWriter[] getChildrenWriters() { - return childrenWriters; - } - - /** - * Get the encoding for this column. - * - * @return the information about the encoding of this column - */ - OrcProto.ColumnEncoding getEncoding() { - return OrcProto.ColumnEncoding.newBuilder().setKind( - OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - - /** - * Create a row index entry with the previous location and the current - * index statistics. Also merges the index statistics into the file - * statistics before they are cleared. Finally, it records the start of the - * next index and ensures all of the children columns also create an entry. 
- * - * @throws IOException if an error occurs while creating the row index entry - */ - void createRowIndexEntry() throws IOException { - stripeColStatistics.merge(indexStatistics); - rowIndexEntry.setStatistics(indexStatistics.serialize()); - indexStatistics.reset(); - rowIndex.addEntry(rowIndexEntry); - rowIndexEntry.clear(); - addBloomFilterEntry(); - recordPosition(rowIndexPosition); - for (TreeWriter child : childrenWriters) { - child.createRowIndexEntry(); - } - } - - void addBloomFilterEntry() { - if (createBloomFilter) { - bloomFilterEntry.setNumHashFunctions(bloomFilter.getNumHashFunctions()); - bloomFilterEntry.addAllBitset(Longs.asList(bloomFilter.getBitSet())); - bloomFilterIndex.addBloomFilter(bloomFilterEntry.build()); - bloomFilter.reset(); - bloomFilterEntry.clear(); - } - } - - /** - * Record the current position in each of this column's streams. - * - * @param recorder where should the locations be recorded - * @throws IOException if an error occurs while recording the position - */ - void recordPosition(PositionRecorder recorder) throws IOException { - if (isPresent != null) { - isPresent.getPosition(recorder); - } - } - - /** - * Estimate how much memory the writer is consuming excluding the streams. - * - * @return the number of bytes. - */ - long estimateMemory() { - long result = 0; - for (TreeWriter child : childrenWriters) { - result += child.estimateMemory(); - } - return result; - } - } - - private static class BooleanTreeWriter extends TreeWriter { - private final BitFieldWriter writer; - - BooleanTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - PositionedOutputStream out = writer.createStream(id, - OrcProto.Stream.Kind.DATA); - this.writer = new BitFieldWriter(out, 1); - recordPosition(rowIndexPosition); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - LongColumnVector vec = (LongColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - int value = vec.vector[0] == 0 ? 0 : 1; - indexStatistics.updateBoolean(value != 0, length); - for (int i = 0; i < length; ++i) { - writer.write(value); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - int value = vec.vector[i + offset] == 0 ? 
0 : 1; - writer.write(value); - indexStatistics.updateBoolean(value != 0, 1); - } - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - writer.flush(); - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - writer.getPosition(recorder); - } - } - - private static class ByteTreeWriter extends TreeWriter { - private final RunLengthByteWriter writer; - - ByteTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.writer = new RunLengthByteWriter(writer.createStream(id, - OrcProto.Stream.Kind.DATA)); - recordPosition(rowIndexPosition); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - LongColumnVector vec = (LongColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - byte value = (byte) vec.vector[0]; - indexStatistics.updateInteger(value, length); - if (createBloomFilter) { - bloomFilter.addLong(value); - } - for (int i = 0; i < length; ++i) { - writer.write(value); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - byte value = (byte) vec.vector[i + offset]; - writer.write(value); - indexStatistics.updateInteger(value, 1); - if (createBloomFilter) { - bloomFilter.addLong(value); - } - } - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - writer.flush(); - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - writer.getPosition(recorder); - } - } - - private static class IntegerTreeWriter extends TreeWriter { - private final IntegerWriter writer; - private boolean isDirectV2 = true; - - IntegerTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - OutStream out = writer.createStream(id, - OrcProto.Stream.Kind.DATA); - this.isDirectV2 = isNewWriteFormat(writer); - this.writer = createIntegerWriter(out, true, isDirectV2, writer); - recordPosition(rowIndexPosition); - } - - @Override - OrcProto.ColumnEncoding getEncoding() { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT_V2).build(); - } - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - LongColumnVector vec = (LongColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - long value = vec.vector[0]; - indexStatistics.updateInteger(value, length); - if (createBloomFilter) { - bloomFilter.addLong(value); - } - for (int i = 0; i < length; ++i) { - writer.write(value); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - long value = vec.vector[i + offset]; - writer.write(value); - indexStatistics.updateInteger(value, 
1); - if (createBloomFilter) { - bloomFilter.addLong(value); - } - } - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - writer.flush(); - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - writer.getPosition(recorder); - } - } - - private static class FloatTreeWriter extends TreeWriter { - private final PositionedOutputStream stream; - private final SerializationUtils utils; - - FloatTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.stream = writer.createStream(id, - OrcProto.Stream.Kind.DATA); - this.utils = new SerializationUtils(); - recordPosition(rowIndexPosition); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - DoubleColumnVector vec = (DoubleColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - float value = (float) vec.vector[0]; - indexStatistics.updateDouble(value); - if (createBloomFilter) { - bloomFilter.addDouble(value); - } - for (int i = 0; i < length; ++i) { - utils.writeFloat(stream, value); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - float value = (float) vec.vector[i + offset]; - utils.writeFloat(stream, value); - indexStatistics.updateDouble(value); - if (createBloomFilter) { - bloomFilter.addDouble(value); - } - } - } - } - } - - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - stream.flush(); - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - stream.getPosition(recorder); - } - } - - private static class DoubleTreeWriter extends TreeWriter { - private final PositionedOutputStream stream; - private final SerializationUtils utils; - - DoubleTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.stream = writer.createStream(id, - OrcProto.Stream.Kind.DATA); - this.utils = new SerializationUtils(); - recordPosition(rowIndexPosition); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - DoubleColumnVector vec = (DoubleColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - double value = vec.vector[0]; - indexStatistics.updateDouble(value); - if (createBloomFilter) { - bloomFilter.addDouble(value); - } - for (int i = 0; i < length; ++i) { - utils.writeDouble(stream, value); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - double value = vec.vector[i + offset]; - utils.writeDouble(stream, value); - indexStatistics.updateDouble(value); - if (createBloomFilter) { - bloomFilter.addDouble(value); - } - } - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - 
stream.flush(); - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - stream.getPosition(recorder); - } - } - - private static abstract class StringBaseTreeWriter extends TreeWriter { - private static final int INITIAL_DICTIONARY_SIZE = 4096; - private final OutStream stringOutput; - private final IntegerWriter lengthOutput; - private final IntegerWriter rowOutput; - protected final StringRedBlackTree dictionary = - new StringRedBlackTree(INITIAL_DICTIONARY_SIZE); - protected final DynamicIntArray rows = new DynamicIntArray(); - protected final PositionedOutputStream directStreamOutput; - protected final IntegerWriter directLengthOutput; - private final List savedRowIndex = - new ArrayList(); - private final boolean buildIndex; - private final List rowIndexValueCount = new ArrayList(); - // If the number of keys in a dictionary is greater than this fraction of - //the total number of non-null rows, turn off dictionary encoding - private final double dictionaryKeySizeThreshold; - protected boolean useDictionaryEncoding = true; - private boolean isDirectV2 = true; - private boolean doneDictionaryCheck; - private final boolean strideDictionaryCheck; - - StringBaseTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.isDirectV2 = isNewWriteFormat(writer); - stringOutput = writer.createStream(id, - OrcProto.Stream.Kind.DICTIONARY_DATA); - lengthOutput = createIntegerWriter(writer.createStream(id, - OrcProto.Stream.Kind.LENGTH), false, isDirectV2, writer); - rowOutput = createIntegerWriter(writer.createStream(id, - OrcProto.Stream.Kind.DATA), false, isDirectV2, writer); - recordPosition(rowIndexPosition); - rowIndexValueCount.add(0L); - buildIndex = writer.buildIndex(); - directStreamOutput = writer.createStream(id, OrcProto.Stream.Kind.DATA); - directLengthOutput = createIntegerWriter(writer.createStream(id, - OrcProto.Stream.Kind.LENGTH), false, isDirectV2, writer); - Configuration conf = writer.getConfiguration(); - dictionaryKeySizeThreshold = - OrcConf.DICTIONARY_KEY_SIZE_THRESHOLD.getDouble(conf); - strideDictionaryCheck = - OrcConf.ROW_INDEX_STRIDE_DICTIONARY_CHECK.getBoolean(conf); - doneDictionaryCheck = false; - } - - private boolean checkDictionaryEncoding() { - if (!doneDictionaryCheck) { - // Set the flag indicating whether or not to use dictionary encoding - // based on whether or not the fraction of distinct keys over number of - // non-null rows is less than the configured threshold - float ratio = rows.size() > 0 ? (float) (dictionary.size()) / rows.size() : 0.0f; - useDictionaryEncoding = !isDirectV2 || ratio <= dictionaryKeySizeThreshold; - doneDictionaryCheck = true; - } - return useDictionaryEncoding; - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - // if rows in stripe is less than dictionaryCheckAfterRows, dictionary - // checking would not have happened. So do it again here. - checkDictionaryEncoding(); - - if (useDictionaryEncoding) { - flushDictionary(); - } else { - // flushout any left over entries from dictionary - if (rows.size() > 0) { - flushDictionary(); - } - - // suppress the stream for every stripe if dictionary is disabled - stringOutput.suppress(); - } - - // we need to build the rowindex before calling super, since it - // writes it out. 
- super.writeStripe(builder, requiredIndexEntries); - stringOutput.flush(); - lengthOutput.flush(); - rowOutput.flush(); - directStreamOutput.flush(); - directLengthOutput.flush(); - // reset all of the fields to be ready for the next stripe. - dictionary.clear(); - savedRowIndex.clear(); - rowIndexValueCount.clear(); - recordPosition(rowIndexPosition); - rowIndexValueCount.add(0L); - - if (!useDictionaryEncoding) { - // record the start positions of first index stride of next stripe i.e - // beginning of the direct streams when dictionary is disabled - recordDirectStreamPosition(); - } - } - - private void flushDictionary() throws IOException { - final int[] dumpOrder = new int[dictionary.size()]; - - if (useDictionaryEncoding) { - // Write the dictionary by traversing the red-black tree writing out - // the bytes and lengths; and creating the map from the original order - // to the final sorted order. - - dictionary.visit(new StringRedBlackTree.Visitor() { - private int currentId = 0; - - @Override - public void visit(StringRedBlackTree.VisitorContext context - ) throws IOException { - context.writeBytes(stringOutput); - lengthOutput.write(context.getLength()); - dumpOrder[context.getOriginalPosition()] = currentId++; - } - }); - } else { - // for direct encoding, we don't want the dictionary data stream - stringOutput.suppress(); - } - int length = rows.size(); - int rowIndexEntry = 0; - OrcProto.RowIndex.Builder rowIndex = getRowIndex(); - Text text = new Text(); - // write the values translated into the dump order. - for (int i = 0; i <= length; ++i) { - // now that we are writing out the row values, we can finalize the - // row index - if (buildIndex) { - while (i == rowIndexValueCount.get(rowIndexEntry) && rowIndexEntry < savedRowIndex.size()) { - OrcProto.RowIndexEntry.Builder base = - savedRowIndex.get(rowIndexEntry++).toBuilder(); - if (useDictionaryEncoding) { - rowOutput.getPosition(new RowIndexPositionRecorder(base)); - } else { - PositionRecorder posn = new RowIndexPositionRecorder(base); - directStreamOutput.getPosition(posn); - directLengthOutput.getPosition(posn); - } - rowIndex.addEntry(base.build()); - } - } - if (i != length) { - if (useDictionaryEncoding) { - rowOutput.write(dumpOrder[rows.get(i)]); - } else { - dictionary.getText(text, rows.get(i)); - directStreamOutput.write(text.getBytes(), 0, text.getLength()); - directLengthOutput.write(text.getLength()); - } - } - } - rows.clear(); - } - - @Override - OrcProto.ColumnEncoding getEncoding() { - // Returns the encoding used for the last call to writeStripe - if (useDictionaryEncoding) { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder().setKind( - OrcProto.ColumnEncoding.Kind.DICTIONARY_V2).setDictionarySize(dictionary.size()).build(); - } - return OrcProto.ColumnEncoding.newBuilder().setKind( - OrcProto.ColumnEncoding.Kind.DICTIONARY).setDictionarySize(dictionary.size()).build(); - } else { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder().setKind(OrcProto.ColumnEncoding.Kind.DIRECT_V2).build(); - } - return OrcProto.ColumnEncoding.newBuilder().setKind(OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - } - - /** - * This method doesn't call the super method, because unlike most of the - * other TreeWriters, this one can't record the position in the streams - * until the stripe is being flushed. Therefore it saves all of the entries - * and augments them with the final information as the stripe is written. 
- * - * @throws IOException if an error occurs while creating a row index entry - */ - @Override - void createRowIndexEntry() throws IOException { - getStripeStatistics().merge(indexStatistics); - OrcProto.RowIndexEntry.Builder rowIndexEntry = getRowIndexEntry(); - rowIndexEntry.setStatistics(indexStatistics.serialize()); - indexStatistics.reset(); - OrcProto.RowIndexEntry base = rowIndexEntry.build(); - savedRowIndex.add(base); - rowIndexEntry.clear(); - addBloomFilterEntry(); - recordPosition(rowIndexPosition); - rowIndexValueCount.add(Long.valueOf(rows.size())); - if (strideDictionaryCheck) { - checkDictionaryEncoding(); - } - if (!useDictionaryEncoding) { - if (rows.size() > 0) { - flushDictionary(); - // just record the start positions of next index stride - recordDirectStreamPosition(); - } else { - // record the start positions of next index stride - recordDirectStreamPosition(); - getRowIndex().addEntry(base); - } - } - } - - private void recordDirectStreamPosition() throws IOException { - directStreamOutput.getPosition(rowIndexPosition); - directLengthOutput.getPosition(rowIndexPosition); - } - - @Override - long estimateMemory() { - return rows.getSizeInBytes() + dictionary.getSizeInBytes(); - } - } - - private static class StringTreeWriter extends StringBaseTreeWriter { - StringTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - BytesColumnVector vec = (BytesColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - if (useDictionaryEncoding) { - int id = dictionary.add(vec.vector[0], vec.start[0], vec.length[0]); - for (int i = 0; i < length; ++i) { - rows.add(id); - } - } else { - for (int i = 0; i < length; ++i) { - directStreamOutput.write(vec.vector[0], vec.start[0], - vec.length[0]); - directLengthOutput.write(vec.length[0]); - } - } - indexStatistics.updateString(vec.vector[0], vec.start[0], - vec.length[0], length); - if (createBloomFilter) { - bloomFilter.addBytes(vec.vector[0], vec.start[0], vec.length[0]); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - if (useDictionaryEncoding) { - rows.add(dictionary.add(vec.vector[offset + i], - vec.start[offset + i], vec.length[offset + i])); - } else { - directStreamOutput.write(vec.vector[offset + i], - vec.start[offset + i], vec.length[offset + i]); - directLengthOutput.write(vec.length[offset + i]); - } - indexStatistics.updateString(vec.vector[offset + i], - vec.start[offset + i], vec.length[offset + i], 1); - if (createBloomFilter) { - bloomFilter.addBytes(vec.vector[offset + i], - vec.start[offset + i], vec.length[offset + i]); - } - } - } - } - } - } - - /** - * Under the covers, char is written to ORC the same way as string. 
- */ - private static class CharTreeWriter extends StringBaseTreeWriter { - private final int itemLength; - private final byte[] padding; - - CharTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - itemLength = schema.getMaxLength(); - padding = new byte[itemLength]; - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - BytesColumnVector vec = (BytesColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - byte[] ptr; - int ptrOffset; - if (vec.length[0] >= itemLength) { - ptr = vec.vector[0]; - ptrOffset = vec.start[0]; - } else { - ptr = padding; - ptrOffset = 0; - System.arraycopy(vec.vector[0], vec.start[0], ptr, 0, - vec.length[0]); - Arrays.fill(ptr, vec.length[0], itemLength, (byte) ' '); - } - if (useDictionaryEncoding) { - int id = dictionary.add(ptr, ptrOffset, itemLength); - for (int i = 0; i < length; ++i) { - rows.add(id); - } - } else { - for (int i = 0; i < length; ++i) { - directStreamOutput.write(ptr, ptrOffset, itemLength); - directLengthOutput.write(itemLength); - } - } - indexStatistics.updateString(ptr, ptrOffset, itemLength, length); - if (createBloomFilter) { - bloomFilter.addBytes(ptr, ptrOffset, itemLength); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - byte[] ptr; - int ptrOffset; - if (vec.length[offset + i] >= itemLength) { - ptr = vec.vector[offset + i]; - ptrOffset = vec.start[offset + i]; - } else { - // it is the wrong length, so copy it - ptr = padding; - ptrOffset = 0; - System.arraycopy(vec.vector[offset + i], vec.start[offset + i], - ptr, 0, vec.length[offset + i]); - Arrays.fill(ptr, vec.length[offset + i], itemLength, (byte) ' '); - } - if (useDictionaryEncoding) { - rows.add(dictionary.add(ptr, ptrOffset, itemLength)); - } else { - directStreamOutput.write(ptr, ptrOffset, itemLength); - directLengthOutput.write(itemLength); - } - indexStatistics.updateString(ptr, ptrOffset, itemLength, 1); - if (createBloomFilter) { - bloomFilter.addBytes(ptr, ptrOffset, itemLength); - } - } - } - } - } - } - - /** - * Under the covers, varchar is written to ORC the same way as string. 
- */ - private static class VarcharTreeWriter extends StringBaseTreeWriter { - private final int maxLength; - - VarcharTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - maxLength = schema.getMaxLength(); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - BytesColumnVector vec = (BytesColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - int itemLength = Math.min(vec.length[0], maxLength); - if (useDictionaryEncoding) { - int id = dictionary.add(vec.vector[0], vec.start[0], itemLength); - for (int i = 0; i < length; ++i) { - rows.add(id); - } - } else { - for (int i = 0; i < length; ++i) { - directStreamOutput.write(vec.vector[0], vec.start[0], - itemLength); - directLengthOutput.write(itemLength); - } - } - indexStatistics.updateString(vec.vector[0], vec.start[0], - itemLength, length); - if (createBloomFilter) { - bloomFilter.addBytes(vec.vector[0], vec.start[0], itemLength); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - int itemLength = Math.min(vec.length[offset + i], maxLength); - if (useDictionaryEncoding) { - rows.add(dictionary.add(vec.vector[offset + i], - vec.start[offset + i], itemLength)); - } else { - directStreamOutput.write(vec.vector[offset + i], - vec.start[offset + i], itemLength); - directLengthOutput.write(itemLength); - } - indexStatistics.updateString(vec.vector[offset + i], - vec.start[offset + i], itemLength, 1); - if (createBloomFilter) { - bloomFilter.addBytes(vec.vector[offset + i], - vec.start[offset + i], itemLength); - } - } - } - } - } - } - - private static class BinaryTreeWriter extends TreeWriter { - private final PositionedOutputStream stream; - private final IntegerWriter length; - private boolean isDirectV2 = true; - - BinaryTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.stream = writer.createStream(id, - OrcProto.Stream.Kind.DATA); - this.isDirectV2 = isNewWriteFormat(writer); - this.length = createIntegerWriter(writer.createStream(id, - OrcProto.Stream.Kind.LENGTH), false, isDirectV2, writer); - recordPosition(rowIndexPosition); - } - - @Override - OrcProto.ColumnEncoding getEncoding() { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT_V2).build(); - } - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - BytesColumnVector vec = (BytesColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - for (int i = 0; i < length; ++i) { - stream.write(vec.vector[0], vec.start[0], - vec.length[0]); - this.length.write(vec.length[0]); - } - indexStatistics.updateBinary(vec.vector[0], vec.start[0], - vec.length[0], length); - if (createBloomFilter) { - bloomFilter.addBytes(vec.vector[0], vec.start[0], vec.length[0]); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - stream.write(vec.vector[offset + i], - vec.start[offset + i], vec.length[offset + i]); - 
this.length.write(vec.length[offset + i]); - indexStatistics.updateBinary(vec.vector[offset + i], - vec.start[offset + i], vec.length[offset + i], 1); - if (createBloomFilter) { - bloomFilter.addBytes(vec.vector[offset + i], - vec.start[offset + i], vec.length[offset + i]); - } - } - } - } - } - - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - stream.flush(); - length.flush(); - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - stream.getPosition(recorder); - length.getPosition(recorder); - } - } - - public static long MILLIS_PER_DAY = 24 * 60 * 60 * 1000; - public static long NANOS_PER_MILLI = 1000000; - public static final int MILLIS_PER_SECOND = 1000; - static final int NANOS_PER_SECOND = 1000000000; - public static final String BASE_TIMESTAMP_STRING = "2015-01-01 00:00:00"; - - private static class TimestampTreeWriter extends TreeWriter { - private final IntegerWriter seconds; - private final IntegerWriter nanos; - private final boolean isDirectV2; - private final long base_timestamp; - - TimestampTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.isDirectV2 = isNewWriteFormat(writer); - this.seconds = createIntegerWriter(writer.createStream(id, - OrcProto.Stream.Kind.DATA), true, isDirectV2, writer); - this.nanos = createIntegerWriter(writer.createStream(id, - OrcProto.Stream.Kind.SECONDARY), false, isDirectV2, writer); - recordPosition(rowIndexPosition); - // for unit tests to set different time zones - this.base_timestamp = Timestamp.valueOf(BASE_TIMESTAMP_STRING).getTime() / MILLIS_PER_SECOND; - writer.useWriterTimeZone(true); - } - - @Override - OrcProto.ColumnEncoding getEncoding() { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT_V2).build(); - } - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - TimestampColumnVector vec = (TimestampColumnVector) vector; - Timestamp val; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - val = vec.asScratchTimestamp(0); - long millis = val.getTime(); - indexStatistics.updateTimestamp(millis); - if (createBloomFilter) { - bloomFilter.addLong(millis); - } - final long secs = millis / MILLIS_PER_SECOND - base_timestamp; - final long nano = formatNanos(val.getNanos()); - for (int i = 0; i < length; ++i) { - seconds.write(secs); - nanos.write(nano); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - val = vec.asScratchTimestamp(i + offset); - long millis = val.getTime(); - long secs = millis / MILLIS_PER_SECOND - base_timestamp; - seconds.write(secs); - nanos.write(formatNanos(val.getNanos())); - indexStatistics.updateTimestamp(millis); - if (createBloomFilter) { - bloomFilter.addLong(millis); - } - } - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - seconds.flush(); - nanos.flush(); - recordPosition(rowIndexPosition); - } - - 
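// formatNanos(), below, compresses common nanosecond values by packing the
// count of removed trailing decimal zeros into the low three bits of the
// encoded long. Two traces of the code as written: 500_000_000 reduces to
// 5 with a stored zero-count of 7, i.e. (5 << 3) | 7 = 47, which a reader
// expands back as 5 * 10^(7+1); 123_456_789 is not divisible by 100, so it
// is stored as 123_456_789 << 3 with the low bits left at 0, meaning no
// zeros were removed.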
private static long formatNanos(int nanos) { - if (nanos == 0) { - return 0; - } else if (nanos % 100 != 0) { - return ((long) nanos) << 3; - } else { - nanos /= 100; - int trailingZeros = 1; - while (nanos % 10 == 0 && trailingZeros < 7) { - nanos /= 10; - trailingZeros += 1; - } - return ((long) nanos) << 3 | trailingZeros; - } - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - seconds.getPosition(recorder); - nanos.getPosition(recorder); - } - } - - private static class DateTreeWriter extends TreeWriter { - private final IntegerWriter writer; - private final boolean isDirectV2; - - DateTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - OutStream out = writer.createStream(id, - OrcProto.Stream.Kind.DATA); - this.isDirectV2 = isNewWriteFormat(writer); - this.writer = createIntegerWriter(out, true, isDirectV2, writer); - recordPosition(rowIndexPosition); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - LongColumnVector vec = (LongColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - int value = (int) vec.vector[0]; - indexStatistics.updateDate(value); - if (createBloomFilter) { - bloomFilter.addLong(value); - } - for (int i = 0; i < length; ++i) { - writer.write(value); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - int value = (int) vec.vector[i + offset]; - writer.write(value); - indexStatistics.updateDate(value); - if (createBloomFilter) { - bloomFilter.addLong(value); - } - } - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - writer.flush(); - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - writer.getPosition(recorder); - } - - @Override - OrcProto.ColumnEncoding getEncoding() { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT_V2).build(); - } - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - } - - private static class DecimalTreeWriter extends TreeWriter { - private final PositionedOutputStream valueStream; - private final IntegerWriter scaleStream; - private final boolean isDirectV2; - - DecimalTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.isDirectV2 = isNewWriteFormat(writer); - valueStream = writer.createStream(id, OrcProto.Stream.Kind.DATA); - this.scaleStream = createIntegerWriter(writer.createStream(id, - OrcProto.Stream.Kind.SECONDARY), true, isDirectV2, writer); - recordPosition(rowIndexPosition); - } - - @Override - OrcProto.ColumnEncoding getEncoding() { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT_V2).build(); - } - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, 
offset, length); - DecimalColumnVector vec = (DecimalColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - HiveDecimal value = vec.vector[0].getHiveDecimal(); - indexStatistics.updateDecimal(value); - if (createBloomFilter) { - bloomFilter.addString(value.toString()); - } - for (int i = 0; i < length; ++i) { - SerializationUtils.writeBigInteger(valueStream, - value.unscaledValue()); - scaleStream.write(value.scale()); - } - } - } else { - for (int i = 0; i < length; ++i) { - if (vec.noNulls || !vec.isNull[i + offset]) { - HiveDecimal value = vec.vector[i + offset].getHiveDecimal(); - SerializationUtils.writeBigInteger(valueStream, - value.unscaledValue()); - scaleStream.write(value.scale()); - indexStatistics.updateDecimal(value); - if (createBloomFilter) { - bloomFilter.addString(value.toString()); - } - } - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - valueStream.flush(); - scaleStream.flush(); - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - valueStream.getPosition(recorder); - scaleStream.getPosition(recorder); - } - } - - private static class StructTreeWriter extends TreeWriter { - StructTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - List children = schema.getChildren(); - childrenWriters = new TreeWriter[children.size()]; - for (int i = 0; i < childrenWriters.length; ++i) { - childrenWriters[i] = createTreeWriter( - children.get(i), writer, - true); - } - recordPosition(rowIndexPosition); - } - - @Override - void writeRootBatch(VectorizedRowBatch batch, int offset, - int length) throws IOException { - // update the statistics for the root column - indexStatistics.increment(length); - // I'm assuming that the root column isn't nullable so that I don't need - // to update isPresent. 
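// Illustration with a hypothetical schema: for struct<name:string,age:int>,
// batch.cols[0] is a BytesColumnVector consumed by a StringTreeWriter and
// batch.cols[1] is a LongColumnVector consumed by an IntegerTreeWriter; the
// loop below simply fans the root batch out column-by-column to the
// matching child writer.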
- for (int i = 0; i < childrenWriters.length; ++i) { - childrenWriters[i].writeBatch(batch.cols[i], offset, length); - } - } - - private static void writeFields(StructColumnVector vector, - TreeWriter[] childrenWriters, - int offset, int length) throws IOException { - for (int field = 0; field < childrenWriters.length; ++field) { - childrenWriters[field].writeBatch(vector.fields[field], offset, length); - } - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - StructColumnVector vec = (StructColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - writeFields(vec, childrenWriters, offset, length); - } - } else if (vector.noNulls) { - writeFields(vec, childrenWriters, offset, length); - } else { - // write the records in runs - int currentRun = 0; - boolean started = false; - for (int i = 0; i < length; ++i) { - if (!vec.isNull[i + offset]) { - if (!started) { - started = true; - currentRun = i; - } - } else if (started) { - started = false; - writeFields(vec, childrenWriters, offset + currentRun, - i - currentRun); - } - } - if (started) { - writeFields(vec, childrenWriters, offset + currentRun, - length - currentRun); - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - for (TreeWriter child : childrenWriters) { - child.writeStripe(builder, requiredIndexEntries); - } - recordPosition(rowIndexPosition); - } - } - - private static class ListTreeWriter extends TreeWriter { - private final IntegerWriter lengths; - private final boolean isDirectV2; - - ListTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.isDirectV2 = isNewWriteFormat(writer); - childrenWriters = new TreeWriter[1]; - childrenWriters[0] = - createTreeWriter(schema.getChildren().get(0), writer, true); - lengths = createIntegerWriter(writer.createStream(columnId, - OrcProto.Stream.Kind.LENGTH), false, isDirectV2, writer); - recordPosition(rowIndexPosition); - } - - @Override - OrcProto.ColumnEncoding getEncoding() { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT_V2).build(); - } - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - ListColumnVector vec = (ListColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - int childOffset = (int) vec.offsets[0]; - int childLength = (int) vec.lengths[0]; - for (int i = 0; i < length; ++i) { - lengths.write(childLength); - childrenWriters[0].writeBatch(vec.child, childOffset, childLength); - } - if (createBloomFilter) { - bloomFilter.addLong(childLength); - } - } - } else { - // write the elements in runs - int currentOffset = 0; - int currentLength = 0; - for (int i = 0; i < length; ++i) { - if (!vec.isNull[i + offset]) { - int nextLength = (int) vec.lengths[offset + i]; - int nextOffset = (int) vec.offsets[offset + i]; - lengths.write(nextLength); - if (currentLength == 0) { - currentOffset = nextOffset; - currentLength = nextLength; - } else if (currentOffset + currentLength != nextOffset) { - 
childrenWriters[0].writeBatch(vec.child, currentOffset, - currentLength); - currentOffset = nextOffset; - currentLength = nextLength; - } else { - currentLength += nextLength; - } - } - } - if (currentLength != 0) { - childrenWriters[0].writeBatch(vec.child, currentOffset, - currentLength); - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - lengths.flush(); - for (TreeWriter child : childrenWriters) { - child.writeStripe(builder, requiredIndexEntries); - } - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - lengths.getPosition(recorder); - } - } - - private static class MapTreeWriter extends TreeWriter { - private final IntegerWriter lengths; - private final boolean isDirectV2; - - MapTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - this.isDirectV2 = isNewWriteFormat(writer); - childrenWriters = new TreeWriter[2]; - List children = schema.getChildren(); - childrenWriters[0] = - createTreeWriter(children.get(0), writer, true); - childrenWriters[1] = - createTreeWriter(children.get(1), writer, true); - lengths = createIntegerWriter(writer.createStream(columnId, - OrcProto.Stream.Kind.LENGTH), false, isDirectV2, writer); - recordPosition(rowIndexPosition); - } - - @Override - OrcProto.ColumnEncoding getEncoding() { - if (isDirectV2) { - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT_V2).build(); - } - return OrcProto.ColumnEncoding.newBuilder() - .setKind(OrcProto.ColumnEncoding.Kind.DIRECT).build(); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - MapColumnVector vec = (MapColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - int childOffset = (int) vec.offsets[0]; - int childLength = (int) vec.lengths[0]; - for (int i = 0; i < length; ++i) { - lengths.write(childLength); - childrenWriters[0].writeBatch(vec.keys, childOffset, childLength); - childrenWriters[1].writeBatch(vec.values, childOffset, childLength); - } - if (createBloomFilter) { - bloomFilter.addLong(childLength); - } - } - } else { - // write the elements in runs - int currentOffset = 0; - int currentLength = 0; - for (int i = 0; i < length; ++i) { - if (!vec.isNull[i + offset]) { - int nextLength = (int) vec.lengths[offset + i]; - int nextOffset = (int) vec.offsets[offset + i]; - lengths.write(nextLength); - if (currentLength == 0) { - currentOffset = nextOffset; - currentLength = nextLength; - } else if (currentOffset + currentLength != nextOffset) { - childrenWriters[0].writeBatch(vec.keys, currentOffset, - currentLength); - childrenWriters[1].writeBatch(vec.values, currentOffset, - currentLength); - currentOffset = nextOffset; - currentLength = nextLength; - } else { - currentLength += nextLength; - } - } - } - if (currentLength != 0) { - childrenWriters[0].writeBatch(vec.keys, currentOffset, - currentLength); - childrenWriters[1].writeBatch(vec.values, currentOffset, - currentLength); - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - lengths.flush(); - 
for (TreeWriter child : childrenWriters) { - child.writeStripe(builder, requiredIndexEntries); - } - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - lengths.getPosition(recorder); - } - } - - private static class UnionTreeWriter extends TreeWriter { - private final RunLengthByteWriter tags; - - UnionTreeWriter(int columnId, - TypeDescription schema, - StreamFactory writer, - boolean nullable) throws IOException { - super(columnId, schema, writer, nullable); - List children = schema.getChildren(); - childrenWriters = new TreeWriter[children.size()]; - for (int i = 0; i < childrenWriters.length; ++i) { - childrenWriters[i] = - createTreeWriter(children.get(i), writer, true); - } - tags = - new RunLengthByteWriter(writer.createStream(columnId, - OrcProto.Stream.Kind.DATA)); - recordPosition(rowIndexPosition); - } - - @Override - void writeBatch(ColumnVector vector, int offset, - int length) throws IOException { - super.writeBatch(vector, offset, length); - UnionColumnVector vec = (UnionColumnVector) vector; - if (vector.isRepeating) { - if (vector.noNulls || !vector.isNull[0]) { - byte tag = (byte) vec.tags[0]; - for (int i = 0; i < length; ++i) { - tags.write(tag); - } - if (createBloomFilter) { - bloomFilter.addLong(tag); - } - childrenWriters[tag].writeBatch(vec.fields[tag], offset, length); - } - } else { - // write the records in runs of the same tag - int[] currentStart = new int[vec.fields.length]; - int[] currentLength = new int[vec.fields.length]; - for (int i = 0; i < length; ++i) { - // only need to deal with the non-nulls, since the nulls were dealt - // with in the super method. - if (vec.noNulls || !vec.isNull[i + offset]) { - byte tag = (byte) vec.tags[offset + i]; - tags.write(tag); - if (currentLength[tag] == 0) { - // start a new sequence - currentStart[tag] = i + offset; - currentLength[tag] = 1; - } else if (currentStart[tag] + currentLength[tag] == i + offset) { - // ok, we are extending the current run for that tag. 
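// e.g. with tags {0, 0, 1, 0}: row 1 arrives here and grows the tag-0 run
// to length 2; row 3 cannot extend it (the tag-1 row broke contiguity), so
// the branch below flushes rows 0-1 to childrenWriters[0] and starts a
// fresh tag-0 run at row 3.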
- currentLength[tag] += 1; - } else { - // otherwise, we need to close off the old run and start a new one - childrenWriters[tag].writeBatch(vec.fields[tag], - currentStart[tag], currentLength[tag]); - currentStart[tag] = i + offset; - currentLength[tag] = 1; - } - } - } - // write out any left over sequences - for (int tag = 0; tag < currentStart.length; ++tag) { - if (currentLength[tag] != 0) { - childrenWriters[tag].writeBatch(vec.fields[tag], currentStart[tag], - currentLength[tag]); - } - } - } - } - - @Override - void writeStripe(OrcProto.StripeFooter.Builder builder, - int requiredIndexEntries) throws IOException { - super.writeStripe(builder, requiredIndexEntries); - tags.flush(); - for (TreeWriter child : childrenWriters) { - child.writeStripe(builder, requiredIndexEntries); - } - recordPosition(rowIndexPosition); - } - - @Override - void recordPosition(PositionRecorder recorder) throws IOException { - super.recordPosition(recorder); - tags.getPosition(recorder); - } - } - - private static TreeWriter createTreeWriter(TypeDescription schema, - StreamFactory streamFactory, - boolean nullable) throws IOException { - switch (schema.getCategory()) { - case BOOLEAN: - return new BooleanTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case BYTE: - return new ByteTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case SHORT: - case INT: - case LONG: - return new IntegerTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case FLOAT: - return new FloatTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case DOUBLE: - return new DoubleTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case STRING: - return new StringTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case CHAR: - return new CharTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case VARCHAR: - return new VarcharTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case BINARY: - return new BinaryTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case TIMESTAMP: - return new TimestampTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case DATE: - return new DateTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case DECIMAL: - return new DecimalTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case STRUCT: - return new StructTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case MAP: - return new MapTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case LIST: - return new ListTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - case UNION: - return new UnionTreeWriter(streamFactory.getNextColumnId(), - schema, streamFactory, nullable); - default: - throw new IllegalArgumentException("Bad category: " + - schema.getCategory()); - } - } - - private static void writeTypes(OrcProto.Footer.Builder builder, - TypeDescription schema) { - OrcProto.Type.Builder type = OrcProto.Type.newBuilder(); - List children = schema.getChildren(); - switch (schema.getCategory()) { - case BOOLEAN: - type.setKind(OrcProto.Type.Kind.BOOLEAN); - break; - case BYTE: - type.setKind(OrcProto.Type.Kind.BYTE); - break; - case SHORT: - type.setKind(OrcProto.Type.Kind.SHORT); - break; - case INT: - 
type.setKind(OrcProto.Type.Kind.INT); - break; - case LONG: - type.setKind(OrcProto.Type.Kind.LONG); - break; - case FLOAT: - type.setKind(OrcProto.Type.Kind.FLOAT); - break; - case DOUBLE: - type.setKind(OrcProto.Type.Kind.DOUBLE); - break; - case STRING: - type.setKind(OrcProto.Type.Kind.STRING); - break; - case CHAR: - type.setKind(OrcProto.Type.Kind.CHAR); - type.setMaximumLength(schema.getMaxLength()); - break; - case VARCHAR: - type.setKind(OrcProto.Type.Kind.VARCHAR); - type.setMaximumLength(schema.getMaxLength()); - break; - case BINARY: - type.setKind(OrcProto.Type.Kind.BINARY); - break; - case TIMESTAMP: - type.setKind(OrcProto.Type.Kind.TIMESTAMP); - break; - case DATE: - type.setKind(OrcProto.Type.Kind.DATE); - break; - case DECIMAL: - type.setKind(OrcProto.Type.Kind.DECIMAL); - type.setPrecision(schema.getPrecision()); - type.setScale(schema.getScale()); - break; - case LIST: - type.setKind(OrcProto.Type.Kind.LIST); - type.addSubtypes(children.get(0).getId()); - break; - case MAP: - type.setKind(OrcProto.Type.Kind.MAP); - for (TypeDescription t : children) { - type.addSubtypes(t.getId()); - } - break; - case STRUCT: - type.setKind(OrcProto.Type.Kind.STRUCT); - for (TypeDescription t : children) { - type.addSubtypes(t.getId()); - } - for (String field : schema.getFieldNames()) { - type.addFieldNames(field); - } - break; - case UNION: - type.setKind(OrcProto.Type.Kind.UNION); - for (TypeDescription t : children) { - type.addSubtypes(t.getId()); - } - break; - default: - throw new IllegalArgumentException("Unknown category: " + - schema.getCategory()); - } - builder.addTypes(type); - if (children != null) { - for (TypeDescription child : children) { - writeTypes(builder, child); - } - } - } - - @VisibleForTesting - public OutputStream getStream() throws IOException { - if (rawWriter == null) { - rawWriter = new ByteCountingOutputStream(flowFileOutputStream); - rawWriter.write(OrcFile.MAGIC.getBytes()); - headerLength = rawWriter.getBytesWritten(); - writer = new OutStream("metadata", bufferSize, codec, - new DirectStream(rawWriter)); - protobufWriter = CodedOutputStream.newInstance(writer); - } - return rawWriter; - } - - private void createRowIndexEntry() throws IOException { - treeWriter.createRowIndexEntry(); - rowsInIndex = 0; - } - - private void flushStripe() throws IOException { - getStream(); - if (buildIndex && rowsInIndex != 0) { - createRowIndexEntry(); - } - if (rowsInStripe != 0) { - if (callback != null) { - callback.preStripeWrite(callbackContext); - } - // finalize the data for the stripe - int requiredIndexEntries = rowIndexStride == 0 ? 0 : - (int) ((rowsInStripe + rowIndexStride - 1) / rowIndexStride); - OrcProto.StripeFooter.Builder builder = - OrcProto.StripeFooter.newBuilder(); - treeWriter.writeStripe(builder, requiredIndexEntries); - long indexSize = 0; - long dataSize = 0; - for (Map.Entry pair : streams.entrySet()) { - BufferedStream stream = pair.getValue(); - if (!stream.isSuppressed()) { - stream.flush(); - StreamName name = pair.getKey(); - long streamSize = pair.getValue().getOutputSize(); - builder.addStreams(OrcProto.Stream.newBuilder() - .setColumn(name.getColumn()) - .setKind(name.getKind()) - .setLength(streamSize)); - if (StreamName.Area.INDEX == name.getArea()) { - indexSize += streamSize; - } else { - dataSize += streamSize; - } - } - } - OrcProto.StripeFooter footer = builder.build(); - - // Do we need to pad the file so the stripe doesn't straddle a block - // boundary? 
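// A sketch of the arithmetic below, assuming a 256 MB HDFS block and the
// common Hive default padding tolerance of 0.05: if this stripe starts
// 246 MB into the block, available = 10 MB and, with a 64 MB default
// stripe size, availRatio ~= 0.156; that is above the tolerance, so the
// next stripe target shrinks toward the 10 MB that remain rather than
// letting the stripe straddle the block boundary. Only when availRatio
// falls below the tolerance (and block padding is enabled) is the gap
// filled with zero bytes instead.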
- long start = rawWriter.getBytesWritten(); - final long currentStripeSize = indexSize + dataSize + footer.getSerializedSize(); - final long available = blockSize - (start % blockSize); - final long overflow = currentStripeSize - adjustedStripeSize; - final float availRatio = (float) available / (float) defaultStripeSize; - - if (availRatio > 0.0f && availRatio < 1.0f - && availRatio > paddingTolerance) { - // adjust default stripe size to fit into remaining space, also adjust - // the next stripe for correction based on the current stripe size - // and user specified padding tolerance. Since stripe size can overflow - // the default stripe size we should apply this correction to avoid - // writing portion of last stripe to next hdfs block. - double correction = overflow > 0 ? (double) overflow - / (double) adjustedStripeSize : 0.0; - - // correction should not be greater than user specified padding - // tolerance - correction = correction > paddingTolerance ? paddingTolerance - : correction; - - // adjust next stripe size based on current stripe estimate correction - adjustedStripeSize = (long) ((1.0f - correction) * (availRatio * defaultStripeSize)); - } else if (availRatio >= 1.0) { - adjustedStripeSize = defaultStripeSize; - } - - if (availRatio < paddingTolerance && addBlockPadding) { - long padding = blockSize - (start % blockSize); - byte[] pad = new byte[(int) Math.min(HDFS_BUFFER_SIZE, padding)]; - LOG.info(String.format("Padding ORC by %d bytes (<= %.2f * %d)", - padding, availRatio, defaultStripeSize)); - start += padding; - while (padding > 0) { - int writeLen = (int) Math.min(padding, pad.length); - rawWriter.write(pad, 0, writeLen); - padding -= writeLen; - } - adjustedStripeSize = defaultStripeSize; - } else if (currentStripeSize < blockSize - && (start % blockSize) + currentStripeSize > blockSize) { - // even if you don't pad, reset the default stripe size when crossing a - // block boundary - adjustedStripeSize = defaultStripeSize; - } - - // write out the data streams - for (Map.Entry pair : streams.entrySet()) { - BufferedStream stream = pair.getValue(); - if (!stream.isSuppressed()) { - stream.spillTo(rawWriter); - } - stream.clear(); - } - footer.writeTo(protobufWriter); - protobufWriter.flush(); - writer.flush(); - long footerLength = rawWriter.getBytesWritten() - start - dataSize - indexSize; - OrcProto.StripeInformation dirEntry = - OrcProto.StripeInformation.newBuilder() - .setOffset(start) - .setNumberOfRows(rowsInStripe) - .setIndexLength(indexSize) - .setDataLength(dataSize) - .setFooterLength(footerLength).build(); - stripes.add(dirEntry); - rowCount += rowsInStripe; - rowsInStripe = 0; - } - } - - private long computeRawDataSize() { - return getRawDataSize(treeWriter, schema); - } - - private long getRawDataSize(TreeWriter child, - TypeDescription schema) { - long total = 0; - long numVals = child.fileStatistics.getNumberOfValues(); - switch (schema.getCategory()) { - case BOOLEAN: - case BYTE: - case SHORT: - case INT: - case FLOAT: - return numVals * JavaDataModel.get().primitive1(); - case LONG: - case DOUBLE: - return numVals * JavaDataModel.get().primitive2(); - case STRING: - case VARCHAR: - case CHAR: - // ORC strings are converted to java Strings. so use JavaDataModel to - // compute the overall size of strings - StringColumnStatistics scs = (StringColumnStatistics) child.fileStatistics; - numVals = numVals == 0 ? 
1 : numVals; - int avgStringLen = (int) (scs.getSum() / numVals); - return numVals * JavaDataModel.get().lengthForStringOfLength(avgStringLen); - case DECIMAL: - return numVals * JavaDataModel.get().lengthOfDecimal(); - case DATE: - return numVals * JavaDataModel.get().lengthOfDate(); - case BINARY: - // get total length of binary blob - BinaryColumnStatistics bcs = (BinaryColumnStatistics) child.fileStatistics; - return bcs.getSum(); - case TIMESTAMP: - return numVals * JavaDataModel.get().lengthOfTimestamp(); - case LIST: - case MAP: - case UNION: - case STRUCT: { - TreeWriter[] childWriters = child.getChildrenWriters(); - List childTypes = schema.getChildren(); - for (int i = 0; i < childWriters.length; ++i) { - total += getRawDataSize(childWriters[i], childTypes.get(i)); - } - break; - } - default: - LOG.debug("Unknown object inspector category."); - break; - } - return total; - } - - private OrcProto.CompressionKind writeCompressionKind(CompressionKind kind) { - switch (kind) { - case NONE: - return OrcProto.CompressionKind.NONE; - case ZLIB: - return OrcProto.CompressionKind.ZLIB; - case SNAPPY: - return OrcProto.CompressionKind.SNAPPY; - case LZO: - return OrcProto.CompressionKind.LZO; - default: - throw new IllegalArgumentException("Unknown compression " + kind); - } - } - - private void writeFileStatistics(OrcProto.Footer.Builder builder, - TreeWriter writer) throws IOException { - builder.addStatistics(writer.fileStatistics.serialize()); - for (TreeWriter child : writer.getChildrenWriters()) { - writeFileStatistics(builder, child); - } - } - - private int writeMetadata() throws IOException { - getStream(); - OrcProto.Metadata.Builder builder = OrcProto.Metadata.newBuilder(); - for (OrcProto.StripeStatistics.Builder ssb : treeWriter.stripeStatsBuilders) { - builder.addStripeStats(ssb.build()); - } - - long startPosn = rawWriter.getBytesWritten(); - OrcProto.Metadata metadata = builder.build(); - metadata.writeTo(protobufWriter); - protobufWriter.flush(); - writer.flush(); - return (int) (rawWriter.getBytesWritten() - startPosn); - } - - private int writeFooter(long bodyLength) throws IOException { - getStream(); - OrcProto.Footer.Builder builder = OrcProto.Footer.newBuilder(); - builder.setContentLength(bodyLength); - builder.setHeaderLength(headerLength); - builder.setNumberOfRows(rowCount); - builder.setRowIndexStride(rowIndexStride); - // populate raw data size - rawDataSize = computeRawDataSize(); - // serialize the types - writeTypes(builder, schema); - // add the stripe information - for (OrcProto.StripeInformation stripe : stripes) { - builder.addStripes(stripe); - } - // add the column statistics - writeFileStatistics(builder, treeWriter); - // add all of the user metadata - for (Map.Entry entry : userMetadata.entrySet()) { - builder.addMetadata(OrcProto.UserMetadataItem.newBuilder() - .setName(entry.getKey()).setValue(entry.getValue())); - } - long startPosn = rawWriter.getBytesWritten(); - OrcProto.Footer footer = builder.build(); - footer.writeTo(protobufWriter); - protobufWriter.flush(); - writer.flush(); - return (int) (rawWriter.getBytesWritten() - startPosn); - } - - private int writePostScript(int footerLength, int metadataLength) throws IOException { - OrcProto.PostScript.Builder builder = - OrcProto.PostScript.newBuilder() - .setCompression(writeCompressionKind(compress)) - .setFooterLength(footerLength) - .setMetadataLength(metadataLength) - .setMagic(OrcFile.MAGIC) - .addVersion(version.getMajor()) - .addVersion(version.getMinor()) - 
.setWriterVersion(OrcFile.CURRENT_WRITER.getId()); - if (compress != CompressionKind.NONE) { - builder.setCompressionBlockSize(bufferSize); - } - OrcProto.PostScript ps = builder.build(); - // need to write this uncompressed - long startPosn = rawWriter.getBytesWritten(); - ps.writeTo(rawWriter); - long length = rawWriter.getBytesWritten() - startPosn; - if (length > 255) { - throw new IllegalArgumentException("PostScript too large at " + length); - } - return (int) length; - } - - private long estimateStripeSize() { - long result = 0; - for (BufferedStream stream : streams.values()) { - result += stream.getBufferSize(); - } - result += treeWriter.estimateMemory(); - return result; - } - - @Override - public TypeDescription getSchema() { - return schema; - } - - @Override - public void addUserMetadata(String name, ByteBuffer value) { - userMetadata.put(name, ByteString.copyFrom(value)); - } - - @Override - public void addRowBatch(VectorizedRowBatch batch) throws IOException { - if (buildIndex) { - // Batch the writes up to the rowIndexStride so that we can get the - // right size indexes. - int posn = 0; - while (posn < batch.size) { - int chunkSize = Math.min(batch.size - posn, - rowIndexStride - rowsInIndex); - treeWriter.writeRootBatch(batch, posn, chunkSize); - posn += chunkSize; - rowsInIndex += chunkSize; - rowsInStripe += chunkSize; - if (rowsInIndex >= rowIndexStride) { - createRowIndexEntry(); - } - } - } else { - rowsInStripe += batch.size; - treeWriter.writeRootBatch(batch, 0, batch.size); - } - memoryManager.addedRow(batch.size); - } - - @Override - public void close() throws IOException { - if (callback != null) { - callback.preFooterWrite(callbackContext); - } - // remove us from the memory manager so that we don't get any callbacks - memoryManager.removeWriter(path); - // actually close the file - flushStripe(); - int metadataLength = writeMetadata(); - int footerLength = writeFooter(rawWriter.getBytesWritten() - metadataLength); - rawWriter.write(writePostScript(footerLength, metadataLength)); - rawWriter.close(); - - } - - /** - * Raw data size will be compute when writing the file footer. Hence raw data - * size value will be available only after closing the writer. - */ - @Override - public long getRawDataSize() { - return rawDataSize; - } - - /** - * Row count gets updated when flushing the stripes. To get accurate row - * count call this method after writer is closed. 
- */ - @Override - public long getNumberOfRows() { - return rowCount; - } - - @Override - public long writeIntermediateFooter() throws IOException { - // flush any buffered rows - flushStripe(); - // write a footer - if (stripesAtLastFlush != stripes.size()) { - if (callback != null) { - callback.preFooterWrite(callbackContext); - } - int metaLength = writeMetadata(); - int footLength = writeFooter(rawWriter.getBytesWritten() - metaLength); - rawWriter.write(writePostScript(footLength, metaLength)); - stripesAtLastFlush = stripes.size(); - rawWriter.flush(); - } - return rawWriter.getBytesWritten(); - } - - @Override - public void appendStripe(byte[] stripe, int offset, int length, - StripeInformation stripeInfo, - OrcProto.StripeStatistics stripeStatistics) throws IOException { - checkArgument(stripe != null, "Stripe must not be null"); - checkArgument(length <= stripe.length, - "Specified length must not be greater specified array length"); - checkArgument(stripeInfo != null, "Stripe information must not be null"); - checkArgument(stripeStatistics != null, - "Stripe statistics must not be null"); - - getStream(); - long start = rawWriter.getBytesWritten(); - long availBlockSpace = blockSize - (start % blockSize); - - // see if stripe can fit in the current hdfs block, else pad the remaining - // space in the block - if (length < blockSize && length > availBlockSpace && addBlockPadding) { - byte[] pad = new byte[(int) Math.min(HDFS_BUFFER_SIZE, availBlockSpace)]; - LOG.info(String.format("Padding ORC by %d bytes while merging..", availBlockSpace)); - start += availBlockSpace; - while (availBlockSpace > 0) { - int writeLen = (int) Math.min(availBlockSpace, pad.length); - rawWriter.write(pad, 0, writeLen); - availBlockSpace -= writeLen; - } - } - - rawWriter.write(stripe); - rowsInStripe = stripeStatistics.getColStats(0).getNumberOfValues(); - rowCount += rowsInStripe; - - // since we have already written the stripe, just update stripe statistics - treeWriter.stripeStatsBuilders.add(stripeStatistics.toBuilder()); - - // update file level statistics - updateFileStatistics(stripeStatistics); - - // update stripe information - OrcProto.StripeInformation dirEntry = OrcProto.StripeInformation - .newBuilder() - .setOffset(start) - .setNumberOfRows(rowsInStripe) - .setIndexLength(stripeInfo.getIndexLength()) - .setDataLength(stripeInfo.getDataLength()) - .setFooterLength(stripeInfo.getFooterLength()) - .build(); - stripes.add(dirEntry); - - // reset it after writing the stripe - rowsInStripe = 0; - } - - private void updateFileStatistics(OrcProto.StripeStatistics stripeStatistics) { - List cs = stripeStatistics.getColStatsList(); - List allWriters = getAllColumnTreeWriters(treeWriter); - for (int i = 0; i < allWriters.size(); i++) { - allWriters.get(i).fileStatistics.merge(ColumnStatisticsImpl.deserialize(cs.get(i))); - } - } - - private List getAllColumnTreeWriters(TreeWriter rootTreeWriter) { - List result = Lists.newArrayList(); - getAllColumnTreeWritersImpl(rootTreeWriter, result); - return result; - } - - private void getAllColumnTreeWritersImpl(TreeWriter tw, - List result) { - result.add(tw); - for (TreeWriter child : tw.childrenWriters) { - getAllColumnTreeWritersImpl(child, result); - } - } - - @Override - public void appendUserMetadata(List userMetadata) { - if (userMetadata != null) { - for (OrcProto.UserMetadataItem item : userMetadata) { - this.userMetadata.put(item.getName(), item.getValue()); - } - } - } -} diff --git 
a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/util/orc/OrcUtils.java b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/util/orc/OrcUtils.java deleted file mode 100644 index e3f6db5893..0000000000 --- a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/java/org/apache/nifi/util/orc/OrcUtils.java +++ /dev/null @@ -1,408 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one or more - * contributor license agreements. See the NOTICE file distributed with - * this work for additional information regarding copyright ownership. - * The ASF licenses this file to You under the Apache License, Version 2.0 - * (the "License"); you may not use this file except in compliance with - * the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -package org.apache.nifi.util.orc; - -import org.apache.avro.Schema; -import org.apache.commons.lang3.StringUtils; -import org.apache.commons.lang3.mutable.MutableInt; -import org.apache.hadoop.hive.ql.exec.vector.BytesColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.ColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.DoubleColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.ListColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.LongColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.MapColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.UnionColumnVector; -import org.apache.orc.TypeDescription; - -import java.nio.ByteBuffer; -import java.util.ArrayList; -import java.util.List; -import java.util.Map; -import java.util.stream.Collectors; - -/** - * Utility methods for ORC support (conversion from Avro, conversion to Hive types, e.g. - */ -public class OrcUtils { - - public static void putToRowBatch(ColumnVector col, MutableInt vectorOffset, int rowNumber, Schema fieldSchema, Object o) { - Schema.Type fieldType = fieldSchema.getType(); - - if (fieldType == null) { - throw new IllegalArgumentException("Field type is null"); - } - - if (o == null) { - col.isNull[rowNumber] = true; - } else { - - switch (fieldType) { - case INT: - ((LongColumnVector) col).vector[rowNumber] = (int) o; - break; - case LONG: - ((LongColumnVector) col).vector[rowNumber] = (long) o; - break; - case BOOLEAN: - ((LongColumnVector) col).vector[rowNumber] = ((boolean) o) ? 
1 : 0; - break; - case BYTES: - ByteBuffer byteBuffer = ((ByteBuffer) o); - int size = byteBuffer.remaining(); - byte[] buf = new byte[size]; - byteBuffer.get(buf, 0, size); - ((BytesColumnVector) col).setVal(rowNumber, buf); - break; - case DOUBLE: - ((DoubleColumnVector) col).vector[rowNumber] = (double) o; - break; - case FLOAT: - ((DoubleColumnVector) col).vector[rowNumber] = (float) o; - break; - case STRING: - case ENUM: - ((BytesColumnVector) col).setVal(rowNumber, o.toString().getBytes()); - break; - case UNION: - // If the union only has one non-null type in it, it was flattened in the ORC schema - if (col instanceof UnionColumnVector) { - UnionColumnVector union = ((UnionColumnVector) col); - Schema.Type avroType = OrcUtils.getAvroSchemaTypeOfObject(o); - // Find the index in the union with the matching Avro type - int unionIndex = -1; - List types = fieldSchema.getTypes(); - final int numFields = types.size(); - for (int i = 0; i < numFields && unionIndex == -1; i++) { - if (avroType.equals(types.get(i).getType())) { - unionIndex = i; - } - } - if (unionIndex == -1) { - throw new IllegalArgumentException("Object type " + avroType.getName() + " not found in union '" + fieldSchema.getName() + "'"); - } - - // Need nested vector offsets - MutableInt unionVectorOffset = new MutableInt(0); - putToRowBatch(union.fields[unionIndex], unionVectorOffset, rowNumber, fieldSchema.getTypes().get(unionIndex), o); - } else { - // Find and use the non-null type from the union - List types = fieldSchema.getTypes(); - Schema effectiveType = null; - for (Schema type : types) { - if (!Schema.Type.NULL.equals(type.getType())) { - effectiveType = type; - break; - } - } - putToRowBatch(col, vectorOffset, rowNumber, effectiveType, o); - } - break; - case ARRAY: - Schema arrayType = fieldSchema.getElementType(); - ListColumnVector array = ((ListColumnVector) col); - if (o instanceof int[] || o instanceof long[]) { - int length = (o instanceof int[]) ? ((int[]) o).length : ((long[]) o).length; - for (int i = 0; i < length; i++) { - ((LongColumnVector) array.child).vector[vectorOffset.getValue() + i] = - (o instanceof int[]) ? 
((int[]) o)[i] : ((long[]) o)[i]; - } - array.offsets[rowNumber] = vectorOffset.longValue(); - array.lengths[rowNumber] = length; - vectorOffset.add(length); - } else if (o instanceof float[]) { - float[] floatArray = (float[]) o; - for (int i = 0; i < floatArray.length; i++) { - ((DoubleColumnVector) array.child).vector[vectorOffset.getValue() + i] = floatArray[i]; - } - array.offsets[rowNumber] = vectorOffset.longValue(); - array.lengths[rowNumber] = floatArray.length; - vectorOffset.add(floatArray.length); - } else if (o instanceof double[]) { - double[] doubleArray = (double[]) o; - for (int i = 0; i < doubleArray.length; i++) { - ((DoubleColumnVector) array.child).vector[vectorOffset.getValue() + i] = doubleArray[i]; - } - array.offsets[rowNumber] = vectorOffset.longValue(); - array.lengths[rowNumber] = doubleArray.length; - vectorOffset.add(doubleArray.length); - } else if (o instanceof String[]) { - String[] stringArray = (String[]) o; - BytesColumnVector byteCol = ((BytesColumnVector) array.child); - for (int i = 0; i < stringArray.length; i++) { - if (stringArray[i] == null) { - byteCol.isNull[rowNumber] = true; - } else { - byteCol.setVal(vectorOffset.getValue() + i, stringArray[i].getBytes()); - } - } - array.offsets[rowNumber] = vectorOffset.longValue(); - array.lengths[rowNumber] = stringArray.length; - vectorOffset.add(stringArray.length); - } else if (o instanceof Map[]) { - Map[] mapArray = (Map[]) o; - MutableInt mapVectorOffset = new MutableInt(0); - for (int i = 0; i < mapArray.length; i++) { - if (mapArray[i] == null) { - array.child.isNull[rowNumber] = true; - } else { - putToRowBatch(array.child, mapVectorOffset, vectorOffset.getValue() + i, arrayType, mapArray[i]); - } - } - array.offsets[rowNumber] = vectorOffset.longValue(); - array.lengths[rowNumber] = mapArray.length; - vectorOffset.add(mapArray.length); - } else if (o instanceof List) { - List listArray = (List) o; - MutableInt listVectorOffset = new MutableInt(0); - int numElements = listArray.size(); - for (int i = 0; i < numElements; i++) { - if (listArray.get(i) == null) { - array.child.isNull[rowNumber] = true; - } else { - putToRowBatch(array.child, listVectorOffset, vectorOffset.getValue() + i, arrayType, listArray.get(i)); - } - } - array.offsets[rowNumber] = vectorOffset.longValue(); - array.lengths[rowNumber] = numElements; - vectorOffset.add(numElements); - - } else { - throw new IllegalArgumentException("Object class " + o.getClass().getName() + " not supported as an ORC list/array"); - } - break; - case MAP: - MapColumnVector map = ((MapColumnVector) col); - - // Avro maps require String keys - @SuppressWarnings("unchecked") - Map mapObj = (Map) o; - int effectiveRowNumber = vectorOffset.getValue(); - for (Map.Entry entry : mapObj.entrySet()) { - putToRowBatch(map.keys, vectorOffset, effectiveRowNumber, Schema.create(Schema.Type.STRING), entry.getKey()); - putToRowBatch(map.values, vectorOffset, effectiveRowNumber, fieldSchema.getValueType(), entry.getValue()); - effectiveRowNumber++; - } - map.offsets[rowNumber] = vectorOffset.longValue(); - map.lengths[rowNumber] = mapObj.size(); - vectorOffset.add(mapObj.size()); - - break; - default: - throw new IllegalArgumentException("Field type " + fieldType.getName() + " not recognized"); - } - } - } - - public static String normalizeHiveTableName(String name) { - return name.replaceAll("[\\. 
]", "_"); - } - - public static String generateHiveDDL(Schema avroSchema, String tableName) { - Schema.Type schemaType = avroSchema.getType(); - StringBuilder sb = new StringBuilder("CREATE EXTERNAL TABLE IF NOT EXISTS "); - sb.append(tableName); - sb.append(" ("); - if (Schema.Type.RECORD.equals(schemaType)) { - List hiveColumns = new ArrayList<>(); - List fields = avroSchema.getFields(); - if (fields != null) { - hiveColumns.addAll( - fields.stream().map(field -> field.name() + " " + getHiveTypeFromAvroType(field.schema())).collect(Collectors.toList())); - } - sb.append(StringUtils.join(hiveColumns, ", ")); - sb.append(") STORED AS ORC"); - return sb.toString(); - } else { - throw new IllegalArgumentException("Avro schema is of type " + schemaType.getName() + ", not RECORD"); - } - } - - - public static void addOrcField(TypeDescription orcSchema, Schema.Field avroField) { - Schema fieldSchema = avroField.schema(); - String fieldName = avroField.name(); - - orcSchema.addField(fieldName, getOrcField(fieldSchema)); - } - - public static TypeDescription getOrcField(Schema fieldSchema) throws IllegalArgumentException { - Schema.Type fieldType = fieldSchema.getType(); - - switch (fieldType) { - case INT: - case LONG: - case BOOLEAN: - case BYTES: - case DOUBLE: - case FLOAT: - case STRING: - return getPrimitiveOrcTypeFromPrimitiveAvroType(fieldType); - - case UNION: - List unionFieldSchemas = fieldSchema.getTypes(); - TypeDescription unionSchema = TypeDescription.createUnion(); - if (unionFieldSchemas != null) { - // Ignore null types in union - List orcFields = unionFieldSchemas.stream().filter( - unionFieldSchema -> !Schema.Type.NULL.equals(unionFieldSchema.getType())).map(OrcUtils::getOrcField).collect(Collectors.toList()); - - - // Flatten the field if the union only has one non-null element - if (orcFields.size() == 1) { - return orcFields.get(0); - } else { - orcFields.forEach(unionSchema::addUnionChild); - } - } - return unionSchema; - - case ARRAY: - return TypeDescription.createList(getOrcField(fieldSchema.getElementType())); - - case MAP: - return TypeDescription.createMap(TypeDescription.createString(), getOrcField(fieldSchema.getValueType())); - - case RECORD: - TypeDescription record = TypeDescription.createStruct(); - List avroFields = fieldSchema.getFields(); - if (avroFields != null) { - avroFields.forEach(avroField -> addOrcField(record, avroField)); - } - return record; - - case ENUM: - // An enum value is just a String for ORC/Hive - return TypeDescription.createString(); - - default: - throw new IllegalArgumentException("Did not recognize Avro type " + fieldType.getName()); - } - - } - - public static Schema.Type getAvroSchemaTypeOfObject(Object o) { - if (o == null) { - return Schema.Type.NULL; - } else if (o instanceof Integer) { - return Schema.Type.INT; - } else if (o instanceof Long) { - return Schema.Type.LONG; - } else if (o instanceof Boolean) { - return Schema.Type.BOOLEAN; - } else if (o instanceof byte[]) { - return Schema.Type.BYTES; - } else if (o instanceof Float) { - return Schema.Type.FLOAT; - } else if (o instanceof Double) { - return Schema.Type.DOUBLE; - } else if (o instanceof Enum) { - return Schema.Type.ENUM; - } else if (o instanceof Object[]) { - return Schema.Type.ARRAY; - } else if (o instanceof List) { - return Schema.Type.ARRAY; - } else if (o instanceof Map) { - return Schema.Type.MAP; - } else { - throw new IllegalArgumentException("Object of class " + o.getClass() + " is not a supported Avro Type"); - } - } - - public static TypeDescription 
getPrimitiveOrcTypeFromPrimitiveAvroType(Schema.Type avroType) throws IllegalArgumentException { - if (avroType == null) { - throw new IllegalArgumentException("Avro type is null"); - } - switch (avroType) { - case INT: - return TypeDescription.createInt(); - case LONG: - return TypeDescription.createLong(); - case BOOLEAN: - return TypeDescription.createBoolean(); - case BYTES: - return TypeDescription.createBinary(); - case DOUBLE: - return TypeDescription.createDouble(); - case FLOAT: - return TypeDescription.createFloat(); - case STRING: - return TypeDescription.createString(); - default: - throw new IllegalArgumentException("Avro type " + avroType.getName() + " is not a primitive type"); - } - } - - public static String getHiveTypeFromAvroType(Schema avroSchema) { - if (avroSchema == null) { - throw new IllegalArgumentException("Avro schema is null"); - } - - Schema.Type avroType = avroSchema.getType(); - - switch (avroType) { - case INT: - return "INT"; - case LONG: - return "BIGINT"; - case BOOLEAN: - return "BOOLEAN"; - case BYTES: - return "BINARY"; - case DOUBLE: - return "DOUBLE"; - case FLOAT: - return "FLOAT"; - case STRING: - case ENUM: - return "STRING"; - case UNION: - List<Schema> unionFieldSchemas = avroSchema.getTypes(); - if (unionFieldSchemas != null) { - List<String> hiveFields = new ArrayList<>(); - for (Schema unionFieldSchema : unionFieldSchemas) { - Schema.Type unionFieldSchemaType = unionFieldSchema.getType(); - // Ignore null types in union - if (!Schema.Type.NULL.equals(unionFieldSchemaType)) { - hiveFields.add(getHiveTypeFromAvroType(unionFieldSchema)); - } - } - // Flatten the field if the union only has one non-null element - return (hiveFields.size() == 1) - ? hiveFields.get(0) - : "UNIONTYPE<" + StringUtils.join(hiveFields, ", ") + ">"; - - } - break; - case MAP: - return "MAP<STRING, " + getHiveTypeFromAvroType(avroSchema.getValueType()) + ">"; - case ARRAY: - return "ARRAY<" + getHiveTypeFromAvroType(avroSchema.getElementType()) + ">"; - case RECORD: - List<Schema.Field> recordFields = avroSchema.getFields(); - if (recordFields != null) { - List<String> hiveFields = recordFields.stream().map( - recordField -> recordField.name() + ":" + getHiveTypeFromAvroType(recordField.schema())).collect(Collectors.toList()); - return "STRUCT<" + StringUtils.join(hiveFields, ", ") + ">"; - } - break; - default: - break; - } - - throw new IllegalArgumentException("Error converting Avro type " + avroType.getName() + " to Hive type"); - } -} diff --git a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/resources/META-INF/services/org.apache.nifi.processor.Processor b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/resources/META-INF/services/org.apache.nifi.processor.Processor index 45e1f29e7e..55ee005f71 100644 --- a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/resources/META-INF/services/org.apache.nifi.processor.Processor +++ b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/main/resources/META-INF/services/org.apache.nifi.processor.Processor @@ -14,5 +14,4 @@ # limitations under the License. 
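For reference, the union rule that `getHiveTypeFromAvroType` (removed above) applied: null branches are dropped, a union with a single remaining branch collapses to that branch's plain Hive type, and only unions with two or more non-null branches become Hive `UNIONTYPE`s. A minimal re-creation of that rule; `hiveTypeOf` is a hypothetical stand-in for illustration, not the deleted method:

```java
import org.apache.avro.Schema;

import java.util.Arrays;
import java.util.List;
import java.util.stream.Collectors;

public class UnionFlatteningSketch {

    // Hypothetical helper mirroring the removed rule: drop null branches,
    // collapse a lone survivor, otherwise emit UNIONTYPE<...>.
    static String hiveTypeOf(Schema schema) {
        if (schema.getType() == Schema.Type.UNION) {
            List<String> branches = schema.getTypes().stream()
                    .filter(s -> s.getType() != Schema.Type.NULL)
                    .map(UnionFlatteningSketch::hiveTypeOf)
                    .collect(Collectors.toList());
            return branches.size() == 1
                    ? branches.get(0)
                    : "UNIONTYPE<" + String.join(", ", branches) + ">";
        }
        switch (schema.getType()) {
            case LONG:  return "BIGINT";
            case BYTES: return "BINARY";
            default:    return schema.getType().getName().toUpperCase(); // INT, FLOAT, STRING, ...
        }
    }

    public static void main(String[] args) {
        Schema optional = Schema.createUnion(Arrays.asList(
                Schema.create(Schema.Type.NULL), Schema.create(Schema.Type.STRING)));
        Schema twoWay = Schema.createUnion(Arrays.asList(
                Schema.create(Schema.Type.LONG), Schema.create(Schema.Type.FLOAT)));
        System.out.println(hiveTypeOf(optional)); // STRING (flattened, no UNIONTYPE wrapper)
        System.out.println(hiveTypeOf(twoWay));   // UNIONTYPE<BIGINT, FLOAT>
    }
}
```

The deleted TestOrcUtils assertions further below exercise exactly these two cases.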
org.apache.nifi.processors.hive.SelectHiveQL org.apache.nifi.processors.hive.PutHiveQL -org.apache.nifi.processors.hive.ConvertAvroToORC org.apache.nifi.processors.hive.PutHiveStreaming diff --git a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/test/java/org/apache/nifi/processors/hive/TestConvertAvroToORC.java b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/test/java/org/apache/nifi/processors/hive/TestConvertAvroToORC.java deleted file mode 100644 index 9afcf7f0af..0000000000 --- a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/test/java/org/apache/nifi/processors/hive/TestConvertAvroToORC.java +++ /dev/null @@ -1,260 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one or more - * contributor license agreements. See the NOTICE file distributed with - * this work for additional information regarding copyright ownership. - * The ASF licenses this file to You under the Apache License, Version 2.0 - * (the "License"); you may not use this file except in compliance with - * the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -package org.apache.nifi.processors.hive; - -import org.apache.avro.Schema; -import org.apache.avro.file.DataFileWriter; -import org.apache.avro.generic.GenericData; -import org.apache.avro.generic.GenericDatumWriter; -import org.apache.avro.io.DatumWriter; -import org.apache.hadoop.conf.Configuration; -import org.apache.hadoop.fs.FileSystem; -import org.apache.hadoop.fs.Path; -import org.apache.hadoop.hive.ql.exec.vector.BytesColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.DoubleColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.ListColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.LongColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.MapColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.UnionColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch; -import org.apache.nifi.flowfile.attributes.CoreAttributes; -import org.apache.nifi.util.MockFlowFile; -import org.apache.nifi.util.TestRunner; -import org.apache.nifi.util.TestRunners; -import org.apache.nifi.util.orc.TestOrcUtils; -import org.apache.orc.OrcFile; -import org.apache.orc.Reader; -import org.apache.orc.RecordReader; -import org.junit.Before; -import org.junit.Test; - -import java.io.ByteArrayOutputStream; -import java.io.FileOutputStream; -import java.nio.charset.StandardCharsets; -import java.util.Arrays; -import java.util.HashMap; -import java.util.Map; -import java.util.TreeMap; - -import static org.junit.Assert.assertEquals; -import static org.junit.Assert.assertTrue; - - -/** - * Unit tests for ConvertAvroToORC processor - */ -public class TestConvertAvroToORC { - - private ConvertAvroToORC processor; - private TestRunner runner; - - @Before - public void setUp() throws Exception { - processor = new ConvertAvroToORC(); - runner = TestRunners.newTestRunner(processor); - } - - @Test - public void test_Setup() throws Exception { - - } - - @Test - public void test_onTrigger_primitive_record() throws Exception { - GenericData.Record record = TestOrcUtils.buildPrimitiveAvroRecord(10, 20L, true, 30.0f, 
40, StandardCharsets.UTF_8.encode("Hello"), "World"); - - DatumWriter writer = new GenericDatumWriter<>(record.getSchema()); - DataFileWriter fileWriter = new DataFileWriter<>(writer); - ByteArrayOutputStream out = new ByteArrayOutputStream(); - fileWriter.create(record.getSchema(), out); - fileWriter.append(record); - // Put another record in - record = TestOrcUtils.buildPrimitiveAvroRecord(1, 2L, false, 3.0f, 4L, StandardCharsets.UTF_8.encode("I am"), "another record"); - fileWriter.append(record); - // And one more - record = TestOrcUtils.buildPrimitiveAvroRecord(100, 200L, true, 300.0f, 400L, StandardCharsets.UTF_8.encode("Me"), "too!"); - fileWriter.append(record); - fileWriter.flush(); - fileWriter.close(); - out.close(); - Map attributes = new HashMap(){{ - put(CoreAttributes.FILENAME.key(), "test.avro"); - }}; - runner.enqueue(out.toByteArray(), attributes); - runner.run(); - - runner.assertAllFlowFilesTransferred(ConvertAvroToORC.REL_SUCCESS, 1); - - // Write the flow file out to disk, since the ORC Reader needs a path - MockFlowFile resultFlowFile = runner.getFlowFilesForRelationship(ConvertAvroToORC.REL_SUCCESS).get(0); - assertEquals("CREATE EXTERNAL TABLE IF NOT EXISTS test_record (int INT, long BIGINT, boolean BOOLEAN, float FLOAT, double DOUBLE, bytes BINARY, string STRING)" - + " STORED AS ORC", resultFlowFile.getAttribute(ConvertAvroToORC.HIVE_DDL_ATTRIBUTE)); - assertEquals("3", resultFlowFile.getAttribute(ConvertAvroToORC.RECORD_COUNT_ATTRIBUTE)); - assertEquals("test.orc", resultFlowFile.getAttribute(CoreAttributes.FILENAME.key())); - byte[] resultContents = runner.getContentAsByteArray(resultFlowFile); - FileOutputStream fos = new FileOutputStream("target/test1.orc"); - fos.write(resultContents); - fos.flush(); - fos.close(); - - Configuration conf = new Configuration(); - FileSystem fs = FileSystem.getLocal(conf); - Reader reader = OrcFile.createReader(new Path("target/test1.orc"), OrcFile.readerOptions(conf).filesystem(fs)); - RecordReader rows = reader.rows(); - VectorizedRowBatch batch = reader.getSchema().createRowBatch(); - assertTrue(rows.nextBatch(batch)); - assertTrue(batch.cols[0] instanceof LongColumnVector); - assertEquals(10, ((LongColumnVector) batch.cols[0]).vector[0]); - assertEquals(1, ((LongColumnVector) batch.cols[0]).vector[1]); - assertEquals(100, ((LongColumnVector) batch.cols[0]).vector[2]); - assertTrue(batch.cols[1] instanceof LongColumnVector); - assertEquals(20, ((LongColumnVector) batch.cols[1]).vector[0]); - assertEquals(2, ((LongColumnVector) batch.cols[1]).vector[1]); - assertEquals(200, ((LongColumnVector) batch.cols[1]).vector[2]); - assertTrue(batch.cols[2] instanceof LongColumnVector); - assertEquals(1, ((LongColumnVector) batch.cols[2]).vector[0]); - assertEquals(0, ((LongColumnVector) batch.cols[2]).vector[1]); - assertEquals(1, ((LongColumnVector) batch.cols[2]).vector[2]); - assertTrue(batch.cols[3] instanceof DoubleColumnVector); - assertEquals(30.0f, ((DoubleColumnVector) batch.cols[3]).vector[0], Double.MIN_NORMAL); - assertEquals(3.0f, ((DoubleColumnVector) batch.cols[3]).vector[1], Double.MIN_NORMAL); - assertEquals(300.0f, ((DoubleColumnVector) batch.cols[3]).vector[2], Double.MIN_NORMAL); - assertTrue(batch.cols[4] instanceof DoubleColumnVector); - assertEquals(40.0f, ((DoubleColumnVector) batch.cols[4]).vector[0], Double.MIN_NORMAL); - assertEquals(4.0f, ((DoubleColumnVector) batch.cols[4]).vector[1], Double.MIN_NORMAL); - assertEquals(400.0f, ((DoubleColumnVector) batch.cols[4]).vector[2], Double.MIN_NORMAL); - 
assertTrue(batch.cols[5] instanceof BytesColumnVector); - assertEquals("Hello", ((BytesColumnVector) batch.cols[5]).toString(0)); - assertEquals("I am", ((BytesColumnVector) batch.cols[5]).toString(1)); - assertEquals("Me", ((BytesColumnVector) batch.cols[5]).toString(2)); - assertTrue(batch.cols[6] instanceof BytesColumnVector); - assertEquals("World", ((BytesColumnVector) batch.cols[6]).toString(0)); - assertEquals("another record", ((BytesColumnVector) batch.cols[6]).toString(1)); - assertEquals("too!", ((BytesColumnVector) batch.cols[6]).toString(2)); - } - - @Test - public void test_onTrigger_complex_record() throws Exception { - - Map<String, Double> mapData1 = new TreeMap<String, Double>() {{ - put("key1", 1.0); - put("key2", 2.0); - }}; - - GenericData.Record record = TestOrcUtils.buildComplexAvroRecord(10, mapData1, "DEF", 3.0f, Arrays.asList(10, 20)); - - DatumWriter<GenericData.Record> writer = new GenericDatumWriter<>(record.getSchema()); - DataFileWriter<GenericData.Record> fileWriter = new DataFileWriter<>(writer); - ByteArrayOutputStream out = new ByteArrayOutputStream(); - fileWriter.create(record.getSchema(), out); - fileWriter.append(record); - - // Put another record in - Map<String, Double> mapData2 = new TreeMap<String, Double>() {{ - put("key1", 3.0); - put("key2", 4.0); - }}; - - record = TestOrcUtils.buildComplexAvroRecord(null, mapData2, "XYZ", 4L, Arrays.asList(100, 200)); - fileWriter.append(record); - - fileWriter.flush(); - fileWriter.close(); - out.close(); - - Map<String, String> attributes = new HashMap<String, String>() {{ - put(CoreAttributes.FILENAME.key(), "test"); - }}; - runner.enqueue(out.toByteArray(), attributes); - runner.run(); - - runner.assertAllFlowFilesTransferred(ConvertAvroToORC.REL_SUCCESS, 1); - - // Write the flow file out to disk, since the ORC Reader needs a path - MockFlowFile resultFlowFile = runner.getFlowFilesForRelationship(ConvertAvroToORC.REL_SUCCESS).get(0); - assertEquals("CREATE EXTERNAL TABLE IF NOT EXISTS complex_record " + - "(myInt INT, myMap MAP<STRING, DOUBLE>, myEnum STRING, myLongOrFloat UNIONTYPE<BIGINT, FLOAT>, myIntList ARRAY<INT>)" - + " STORED AS ORC", resultFlowFile.getAttribute(ConvertAvroToORC.HIVE_DDL_ATTRIBUTE)); - assertEquals("2", resultFlowFile.getAttribute(ConvertAvroToORC.RECORD_COUNT_ATTRIBUTE)); - assertEquals("test.orc", resultFlowFile.getAttribute(CoreAttributes.FILENAME.key())); - byte[] resultContents = runner.getContentAsByteArray(resultFlowFile); - FileOutputStream fos = new FileOutputStream("target/test1.orc"); - fos.write(resultContents); - fos.flush(); - fos.close(); - - Configuration conf = new Configuration(); - FileSystem fs = FileSystem.getLocal(conf); - Reader reader = OrcFile.createReader(new Path("target/test1.orc"), OrcFile.readerOptions(conf).filesystem(fs)); - RecordReader rows = reader.rows(); - VectorizedRowBatch batch = reader.getSchema().createRowBatch(); - assertTrue(rows.nextBatch(batch)); - assertTrue(batch.cols[0] instanceof LongColumnVector); - assertEquals(10, ((LongColumnVector) batch.cols[0]).vector[0]); - assertTrue(batch.cols[1] instanceof MapColumnVector); - assertTrue(batch.cols[2] instanceof BytesColumnVector); - assertTrue(batch.cols[3] instanceof UnionColumnVector); - StringBuilder buffer = new StringBuilder(); - batch.cols[3].stringifyValue(buffer, 1); - assertEquals("{\"tag\": 0, \"value\": 4}", buffer.toString()); - assertTrue(batch.cols[4] instanceof ListColumnVector); - } - - @Test - public void test_onTrigger_multiple_batches() throws Exception { - - Schema recordSchema = TestOrcUtils.buildPrimitiveAvroSchema(); - DatumWriter<GenericData.Record> writer = new GenericDatumWriter<>(recordSchema); - DataFileWriter<GenericData.Record> fileWriter = new 
DataFileWriter<>(writer); - ByteArrayOutputStream out = new ByteArrayOutputStream(); - fileWriter.create(recordSchema, out); - - GenericData.Record record; - for (int i = 1;i<=2000;i++) { - record = TestOrcUtils.buildPrimitiveAvroRecord(i, 2L * i, true, 30.0f * i, 40L * i, StandardCharsets.UTF_8.encode("Hello"), "World"); - - - fileWriter.append(record); - } - - fileWriter.flush(); - fileWriter.close(); - out.close(); - runner.enqueue(out.toByteArray()); - runner.run(); - - runner.assertAllFlowFilesTransferred(ConvertAvroToORC.REL_SUCCESS, 1); - - // Write the flow file out to disk, since the ORC Reader needs a path - MockFlowFile resultFlowFile = runner.getFlowFilesForRelationship(ConvertAvroToORC.REL_SUCCESS).get(0); - assertEquals("2000", resultFlowFile.getAttribute(ConvertAvroToORC.RECORD_COUNT_ATTRIBUTE)); - byte[] resultContents = runner.getContentAsByteArray(resultFlowFile); - FileOutputStream fos = new FileOutputStream("target/test1.orc"); - fos.write(resultContents); - fos.flush(); - fos.close(); - - Configuration conf = new Configuration(); - FileSystem fs = FileSystem.getLocal(conf); - Reader reader = OrcFile.createReader(new Path("target/test1.orc"), OrcFile.readerOptions(conf).filesystem(fs)); - RecordReader rows = reader.rows(); - VectorizedRowBatch batch = reader.getSchema().createRowBatch(); - assertTrue(rows.nextBatch(batch)); - // At least 2 batches were created - assertTrue(rows.nextBatch(batch)); - } -} \ No newline at end of file diff --git a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/test/java/org/apache/nifi/util/orc/TestOrcUtils.java b/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/test/java/org/apache/nifi/util/orc/TestOrcUtils.java deleted file mode 100644 index 539fddba74..0000000000 --- a/nifi-nar-bundles/nifi-hive-bundle/nifi-hive-processors/src/test/java/org/apache/nifi/util/orc/TestOrcUtils.java +++ /dev/null @@ -1,555 +0,0 @@ -/* - * Licensed to the Apache Software Foundation (ASF) under one or more - * contributor license agreements. See the NOTICE file distributed with - * this work for additional information regarding copyright ownership. - * The ASF licenses this file to You under the Apache License, Version 2.0 - * (the "License"); you may not use this file except in compliance with - * the License. You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. 
- */ -package org.apache.nifi.util.orc; - - -import org.apache.avro.Schema; -import org.apache.avro.SchemaBuilder; -import org.apache.avro.generic.GenericData; -import org.apache.commons.lang3.mutable.MutableInt; -import org.apache.hadoop.hive.ql.exec.vector.BytesColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.DoubleColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.ListColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.LongColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.MapColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.UnionColumnVector; -import org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch; -import org.apache.orc.TypeDescription; -import org.junit.Test; - -import java.nio.ByteBuffer; -import java.util.Arrays; -import java.util.List; -import java.util.Map; -import java.util.TreeMap; - -import static org.junit.Assert.assertEquals; -import static org.junit.Assert.assertTrue; - -/** - * Unit tests for the OrcUtils helper class - */ -public class TestOrcUtils { - - @Test - public void test_getOrcField_primitive() throws Exception { - // Expected ORC types - TypeDescription[] expectedTypes = { - TypeDescription.createInt(), - TypeDescription.createLong(), - TypeDescription.createBoolean(), - TypeDescription.createFloat(), - TypeDescription.createDouble(), - TypeDescription.createBinary(), - TypeDescription.createString(), - }; - - // Build a fake Avro record with all types - Schema testSchema = buildPrimitiveAvroSchema(); - List fields = testSchema.getFields(); - for (int i = 0; i < fields.size(); i++) { - assertEquals(expectedTypes[i], OrcUtils.getOrcField(fields.get(i).schema())); - } - - } - - @Test - public void test_getOrcField_union_optional_type() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("union").type().unionOf().nullBuilder().endNull().and().booleanType().endUnion().noDefault(); - Schema testSchema = builder.endRecord(); - TypeDescription orcType = OrcUtils.getOrcField(testSchema.getField("union").schema()); - assertEquals(TypeDescription.createBoolean(), orcType); - } - - @Test - public void test_getOrcField_union() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("union").type().unionOf().intType().and().booleanType().endUnion().noDefault(); - Schema testSchema = builder.endRecord(); - TypeDescription orcType = OrcUtils.getOrcField(testSchema.getField("union").schema()); - assertEquals( - TypeDescription.createUnion() - .addUnionChild(TypeDescription.createInt()) - .addUnionChild(TypeDescription.createBoolean()), - orcType); - } - - @Test - public void test_getOrcField_map() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("map").type().map().values().doubleType().noDefault(); - Schema testSchema = builder.endRecord(); - TypeDescription orcType = OrcUtils.getOrcField(testSchema.getField("map").schema()); - assertEquals( - TypeDescription.createMap(TypeDescription.createString(), TypeDescription.createDouble()), - orcType); - } - - @Test - public void test_getOrcField_nested_map() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("map").type().map().values().map().values().doubleType().noDefault(); - Schema testSchema = 
builder.endRecord(); - TypeDescription orcType = OrcUtils.getOrcField(testSchema.getField("map").schema()); - assertEquals( - TypeDescription.createMap(TypeDescription.createString(), - TypeDescription.createMap(TypeDescription.createString(), TypeDescription.createDouble())), - orcType); - } - - @Test - public void test_getOrcField_array() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("array").type().array().items().longType().noDefault(); - Schema testSchema = builder.endRecord(); - TypeDescription orcType = OrcUtils.getOrcField(testSchema.getField("array").schema()); - assertEquals( - TypeDescription.createList(TypeDescription.createLong()), - orcType); - } - - @Test - public void test_getOrcField_complex_array() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("array").type().array().items().map().values().floatType().noDefault(); - Schema testSchema = builder.endRecord(); - TypeDescription orcType = OrcUtils.getOrcField(testSchema.getField("array").schema()); - assertEquals( - TypeDescription.createList(TypeDescription.createMap(TypeDescription.createString(), TypeDescription.createFloat())), - orcType); - } - - @Test - public void test_getOrcField_record() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("int").type().intType().noDefault(); - builder.name("long").type().longType().longDefault(1L); - builder.name("array").type().array().items().stringType().noDefault(); - Schema testSchema = builder.endRecord(); - TypeDescription orcType = OrcUtils.getOrcField(testSchema); - assertEquals( - TypeDescription.createStruct() - .addField("int", TypeDescription.createInt()) - .addField("long", TypeDescription.createLong()) - .addField("array", TypeDescription.createList(TypeDescription.createString())), - orcType); - } - - @Test - public void test_getOrcField_enum() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("enumField").type().enumeration("enum").symbols("a", "b", "c").enumDefault("a"); - Schema testSchema = builder.endRecord(); - TypeDescription orcType = OrcUtils.getOrcField(testSchema.getField("enumField").schema()); - assertEquals(TypeDescription.createString(), orcType); - } - - @Test - public void test_getPrimitiveOrcTypeFromPrimitiveAvroType() throws Exception { - // Expected ORC types - TypeDescription[] expectedTypes = { - TypeDescription.createInt(), - TypeDescription.createLong(), - TypeDescription.createBoolean(), - TypeDescription.createFloat(), - TypeDescription.createDouble(), - TypeDescription.createBinary(), - TypeDescription.createString(), - }; - - Schema testSchema = buildPrimitiveAvroSchema(); - List fields = testSchema.getFields(); - for (int i = 0; i < fields.size(); i++) { - assertEquals(expectedTypes[i], OrcUtils.getPrimitiveOrcTypeFromPrimitiveAvroType(fields.get(i).schema().getType())); - } - } - - @Test(expected = IllegalArgumentException.class) - public void test_getPrimitiveOrcTypeFromPrimitiveAvroType_badType() throws Exception { - Schema.Type nonPrimitiveType = Schema.Type.ARRAY; - OrcUtils.getPrimitiveOrcTypeFromPrimitiveAvroType(nonPrimitiveType); - } - - @Test - public void test_putRowToBatch() { - TypeDescription orcSchema = buildPrimitiveOrcSchema(); - 
VectorizedRowBatch batch = orcSchema.createRowBatch(); - Schema avroSchema = buildPrimitiveAvroSchema(); - List<Schema.Field> fields = avroSchema.getFields(); - GenericData.Record record = buildPrimitiveAvroRecord(1, 2L, false, 1.0f, 3.0, ByteBuffer.wrap("Hello".getBytes()), "World"); - for (int i = 0; i < fields.size(); i++) { - OrcUtils.putToRowBatch(batch.cols[i], new MutableInt(0), 0, fields.get(i).schema(), record.get(i)); - } - - assertEquals(1, ((LongColumnVector) batch.cols[0]).vector[0]); - assertEquals(2, ((LongColumnVector) batch.cols[1]).vector[0]); - assertEquals(0, ((LongColumnVector) batch.cols[2]).vector[0]); - assertEquals(1.0, ((DoubleColumnVector) batch.cols[3]).vector[0], Double.MIN_NORMAL); - assertEquals(3.0, ((DoubleColumnVector) batch.cols[4]).vector[0], Double.MIN_NORMAL); - assertEquals("Hello", ((BytesColumnVector) batch.cols[5]).toString(0)); - assertEquals("World", ((BytesColumnVector) batch.cols[6]).toString(0)); - - } - - @Test - public void test_putRowToBatch_union() { - final SchemaBuilder.FieldAssembler<Schema> builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("union").type().unionOf().intType().and().floatType().endUnion().noDefault(); - Schema testSchema = builder.endRecord(); - - GenericData.Record row = new GenericData.Record(testSchema); - row.put("union", 2); - - TypeDescription orcSchema = TypeDescription.createUnion() - .addUnionChild(TypeDescription.createInt()) - .addUnionChild(TypeDescription.createFloat()); - - VectorizedRowBatch batch = orcSchema.createRowBatch(); - batch.ensureSize(2); - OrcUtils.putToRowBatch(batch.cols[0], new MutableInt(0), 0, testSchema.getField("union").schema(), row.get("union")); - - UnionColumnVector union = ((UnionColumnVector) batch.cols[0]); - // verify the value is in the union field of type 'int' - assertEquals(2, ((LongColumnVector) union.fields[0]).vector[0]); - assertEquals(0.0, ((DoubleColumnVector) union.fields[1]).vector[0], Double.MIN_NORMAL); - - row.put("union", 2.0f); - OrcUtils.putToRowBatch(batch.cols[0], new MutableInt(0), 1, testSchema.getField("union").schema(), row.get("union")); - - union = ((UnionColumnVector) batch.cols[0]); - // verify the value is in the union field of type 'float' - assertEquals(0, ((LongColumnVector) union.fields[0]).vector[1]); - assertEquals(2.0, ((DoubleColumnVector) union.fields[1]).vector[1], Double.MIN_NORMAL); - } - - @Test - public void test_putRowToBatch_optional_union() { - final SchemaBuilder.FieldAssembler<Schema> builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("union").type().unionOf().nullType().and().floatType().endUnion().noDefault(); - Schema testSchema = builder.endRecord(); - - GenericData.Record row = new GenericData.Record(testSchema); - row.put("union", 2.0f); - - TypeDescription orcSchema = TypeDescription.createFloat(); - - VectorizedRowBatch batch = orcSchema.createRowBatch(); - batch.ensureSize(2); - OrcUtils.putToRowBatch(batch.cols[0], new MutableInt(0), 0, testSchema.getField("union").schema(), row.get("union")); - - assertTrue(batch.cols[0] instanceof DoubleColumnVector); - - DoubleColumnVector union = ((DoubleColumnVector) batch.cols[0]); - // verify the value landed in the flattened 'float' column (the optional union has no union wrapper) - assertEquals(2.0, union.vector[0], Double.MIN_NORMAL); - - } - - @Test - public void test_putRowToBatch_array_ints() throws Exception { - final SchemaBuilder.FieldAssembler<Schema> builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - 
builder.name("array").type().array().items().intType().noDefault(); - Schema testSchema = builder.endRecord(); - - GenericData.Record row = new GenericData.Record(testSchema); - int[] data1 = {1, 2, 3, 4, 5}; - row.put("array", data1); - - TypeDescription orcSchema = OrcUtils.getOrcField(testSchema.getField("array").schema()); - VectorizedRowBatch batch = orcSchema.createRowBatch(); - batch.ensureSize(2); - MutableInt vectorOffset = new MutableInt(0); - OrcUtils.putToRowBatch(batch.cols[0], vectorOffset, 0, testSchema.getField("array").schema(), row.get("array")); - - int[] data2 = {10, 20, 30, 40}; - row.put("array", data2); - OrcUtils.putToRowBatch(batch.cols[0], vectorOffset, 1, testSchema.getField("array").schema(), row.get("array")); - - ListColumnVector array = ((ListColumnVector) batch.cols[0]); - LongColumnVector dataColumn = ((LongColumnVector) array.child); - // Check the first row, entries 0..4 should have values 1..5 - for (int i = 0; i < 5; i++) { - assertEquals(i + 1, dataColumn.vector[i]); - } - // Check the second row, entries 5..8 should have values 10..40 (by tens) - for (int i = 0; i < 4; i++) { - assertEquals((i + 1) * 10, dataColumn.vector[(int) array.offsets[1] + i]); - } - assertEquals(0, dataColumn.vector[9]); - } - - @Test - public void test_putRowToBatch_array_floats() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("array").type().array().items().floatType().noDefault(); - Schema testSchema = builder.endRecord(); - - GenericData.Record row = new GenericData.Record(testSchema); - float[] data1 = {1.0f, 2.0f, 3.0f}; - row.put("array", data1); - - TypeDescription orcSchema = OrcUtils.getOrcField(testSchema.getField("array").schema()); - VectorizedRowBatch batch = orcSchema.createRowBatch(); - batch.ensureSize(2); - MutableInt vectorOffset = new MutableInt(0); - OrcUtils.putToRowBatch(batch.cols[0], vectorOffset, 0, testSchema.getField("array").schema(), row.get("array")); - - float[] data2 = {40.0f, 41.0f, 42.0f, 43.0f}; - row.put("array", data2); - OrcUtils.putToRowBatch(batch.cols[0], vectorOffset, 1, testSchema.getField("array").schema(), row.get("array")); - - ListColumnVector array = ((ListColumnVector) batch.cols[0]); - DoubleColumnVector dataColumn = ((DoubleColumnVector) array.child); - // Check the first row, entries 0..4 should have values 1..5 - for (int i = 0; i < 3; i++) { - assertEquals(i + 1.0f, dataColumn.vector[i], Float.MIN_NORMAL); - } - // Check the second row, entries 5..8 should have values 10..40 (by tens) - for (int i = 0; i < 4; i++) { - assertEquals((i + 40.0f), dataColumn.vector[(int) array.offsets[1] + i], Float.MIN_NORMAL); - } - assertEquals(0.0f, dataColumn.vector[9], Float.MIN_NORMAL); - } - - @Test - public void test_putRowToBatch_list_doubles() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("array").type().array().items().doubleType().noDefault(); - Schema testSchema = builder.endRecord(); - - GenericData.Record row = new GenericData.Record(testSchema); - List data1 = Arrays.asList(1.0, 2.0, 3.0); - row.put("array", data1); - - TypeDescription orcSchema = OrcUtils.getOrcField(testSchema.getField("array").schema()); - VectorizedRowBatch batch = orcSchema.createRowBatch(); - batch.ensureSize(2); - MutableInt vectorOffset = new MutableInt(0); - OrcUtils.putToRowBatch(batch.cols[0], vectorOffset, 0, testSchema.getField("array").schema(), 
row.get("array")); - - List data2 = Arrays.asList(40.0, 41.0, 42.0, 43.0); - row.put("array", data2); - OrcUtils.putToRowBatch(batch.cols[0], vectorOffset, 1, testSchema.getField("array").schema(), row.get("array")); - - ListColumnVector array = ((ListColumnVector) batch.cols[0]); - DoubleColumnVector dataColumn = ((DoubleColumnVector) array.child); - // Check the first row, entries 0..4 should have values 1..5 - for (int i = 0; i < 3; i++) { - assertEquals(i + 1.0f, dataColumn.vector[i], Float.MIN_NORMAL); - } - // Check the second row, entries 5..8 should have values 10..40 (by tens) - for (int i = 0; i < 4; i++) { - assertEquals((i + 40.0), dataColumn.vector[(int) array.offsets[1] + i], Float.MIN_NORMAL); - } - assertEquals(0.0, dataColumn.vector[9], Float.MIN_NORMAL); - } - - @Test - public void test_putRowToBatch_array_of_maps() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("array").type().array().items().map().values().floatType().noDefault(); - Schema testSchema = builder.endRecord(); - - Map map1 = new TreeMap() {{ - put("key10", 10.0f); - put("key20", 20.0f); - }}; - - Map map2 = new TreeMap() {{ - put("key101", 101.0f); - put("key202", 202.0f); - }}; - - Map[] maps = new Map[]{map1, map2, null}; - GenericData.Record row = new GenericData.Record(testSchema); - row.put("array", maps); - - TypeDescription orcSchema = OrcUtils.getOrcField(testSchema.getField("array").schema()); - VectorizedRowBatch batch = orcSchema.createRowBatch(); - OrcUtils.putToRowBatch(batch.cols[0], new MutableInt(0), 0, testSchema.getField("array").schema(), row.get("array")); - - ListColumnVector array = ((ListColumnVector) batch.cols[0]); - MapColumnVector map = ((MapColumnVector) array.child); - StringBuilder buffer = new StringBuilder(); - map.stringifyValue(buffer, 0); - assertEquals("[{\"key\": \"key10\", \"value\": 10.0}, {\"key\": \"key20\", \"value\": 20.0}]", buffer.toString()); - buffer = new StringBuilder(); - map.stringifyValue(buffer, 1); - assertEquals("[{\"key\": \"key101\", \"value\": 101.0}, {\"key\": \"key202\", \"value\": 202.0}]", buffer.toString()); - - } - - @Test - public void test_putRowToBatch_primitive_map() throws Exception { - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("testRecord").namespace("any.data").fields(); - builder.name("map").type().map().values().longType().noDefault(); - Schema testSchema = builder.endRecord(); - - Map mapData1 = new TreeMap() {{ - put("key10", 100L); - put("key20", 200L); - }}; - - GenericData.Record row = new GenericData.Record(testSchema); - row.put("map", mapData1); - - TypeDescription orcSchema = OrcUtils.getOrcField(testSchema.getField("map").schema()); - VectorizedRowBatch batch = orcSchema.createRowBatch(); - batch.ensureSize(2); - MutableInt vectorOffset = new MutableInt(0); - OrcUtils.putToRowBatch(batch.cols[0], vectorOffset, 0, testSchema.getField("map").schema(), row.get("map")); - - Map mapData2 = new TreeMap() {{ - put("key1000", 1000L); - put("key2000", 2000L); - }}; - - OrcUtils.putToRowBatch(batch.cols[0], vectorOffset, 1, testSchema.getField("map").schema(), mapData2); - - MapColumnVector map = ((MapColumnVector) batch.cols[0]); - StringBuilder buffer = new StringBuilder(); - map.stringifyValue(buffer, 0); - assertEquals("[{\"key\": \"key10\", \"value\": 100}, {\"key\": \"key20\", \"value\": 200}]", buffer.toString()); - buffer = new StringBuilder(); - map.stringifyValue(buffer, 1); - assertEquals("[{\"key\": 
\"key1000\", \"value\": 1000}, {\"key\": \"key2000\", \"value\": 2000}]", buffer.toString()); - - } - - @Test - public void test_getHiveTypeFromAvroType_primitive() throws Exception { - // Expected ORC types - String[] expectedTypes = { - "INT", - "BIGINT", - "BOOLEAN", - "FLOAT", - "DOUBLE", - "BINARY", - "STRING", - }; - - Schema testSchema = buildPrimitiveAvroSchema(); - List fields = testSchema.getFields(); - for (int i = 0; i < fields.size(); i++) { - assertEquals(expectedTypes[i], OrcUtils.getHiveTypeFromAvroType(fields.get(i).schema())); - } - } - - @Test - public void test_getHiveTypeFromAvroType_complex() throws Exception { - // Expected ORC types - String[] expectedTypes = { - "INT", - "MAP", - "STRING", - "UNIONTYPE", - "ARRAY" - }; - - Schema testSchema = buildComplexAvroSchema(); - List fields = testSchema.getFields(); - for (int i = 0; i < fields.size(); i++) { - assertEquals(expectedTypes[i], OrcUtils.getHiveTypeFromAvroType(fields.get(i).schema())); - } - - assertEquals("STRUCT, myEnum:STRING, myLongOrFloat:UNIONTYPE, myIntList:ARRAY>", - OrcUtils.getHiveTypeFromAvroType(testSchema)); - } - - @Test - public void test_generateHiveDDL_primitive() throws Exception { - Schema avroSchema = buildPrimitiveAvroSchema(); - String ddl = OrcUtils.generateHiveDDL(avroSchema, "myHiveTable"); - assertEquals("CREATE EXTERNAL TABLE IF NOT EXISTS myHiveTable (int INT, long BIGINT, boolean BOOLEAN, float FLOAT, double DOUBLE, bytes BINARY, string STRING)" - + " STORED AS ORC", ddl); - } - - @Test - public void test_generateHiveDDL_complex() throws Exception { - Schema avroSchema = buildComplexAvroSchema(); - String ddl = OrcUtils.generateHiveDDL(avroSchema, "myHiveTable"); - assertEquals("CREATE EXTERNAL TABLE IF NOT EXISTS myHiveTable " - + "(myInt INT, myMap MAP, myEnum STRING, myLongOrFloat UNIONTYPE, myIntList ARRAY)" - + " STORED AS ORC", ddl); - } - - - ////////////////// - // Helper methods - ////////////////// - - public static Schema buildPrimitiveAvroSchema() { - // Build a fake Avro record with all primitive types - final SchemaBuilder.FieldAssembler builder = SchemaBuilder.record("test.record").namespace("any.data").fields(); - builder.name("int").type().intType().noDefault(); - builder.name("long").type().longType().longDefault(1L); - builder.name("boolean").type().booleanType().booleanDefault(true); - builder.name("float").type().floatType().floatDefault(0.0f); - builder.name("double").type().doubleType().doubleDefault(0.0); - builder.name("bytes").type().bytesType().noDefault(); - builder.name("string").type().stringType().stringDefault("default"); - return builder.endRecord(); - } - - public static GenericData.Record buildPrimitiveAvroRecord(int i, long l, boolean b, float f, double d, ByteBuffer bytes, String string) { - Schema schema = buildPrimitiveAvroSchema(); - GenericData.Record row = new GenericData.Record(schema); - row.put("int", i); - row.put("long", l); - row.put("boolean", b); - row.put("float", f); - row.put("double", d); - row.put("bytes", bytes); - row.put("string", string); - return row; - } - - public static TypeDescription buildPrimitiveOrcSchema() { - return TypeDescription.createStruct() - .addField("int", TypeDescription.createInt()) - .addField("long", TypeDescription.createLong()) - .addField("boolean", TypeDescription.createBoolean()) - .addField("float", TypeDescription.createFloat()) - .addField("double", TypeDescription.createDouble()) - .addField("bytes", TypeDescription.createBinary()) - .addField("string", TypeDescription.createString()); - } - 
- public static Schema buildComplexAvroSchema() { - // Build a fake Avro record with nested types - final SchemaBuilder.FieldAssembler<Schema> builder = SchemaBuilder.record("complex.record").namespace("any.data").fields(); - builder.name("myInt").type().unionOf().nullType().and().intType().endUnion().nullDefault(); - builder.name("myMap").type().map().values().doubleType().noDefault(); - builder.name("myEnum").type().enumeration("myEnum").symbols("ABC", "DEF", "XYZ").enumDefault("ABC"); - builder.name("myLongOrFloat").type().unionOf().longType().and().floatType().endUnion().noDefault(); - builder.name("myIntList").type().array().items().intType().noDefault(); - return builder.endRecord(); - } - - public static GenericData.Record buildComplexAvroRecord(Integer i, Map<String, Double> m, String e, Object unionVal, List<Integer> intArray) { - Schema schema = buildComplexAvroSchema(); - GenericData.Record row = new GenericData.Record(schema); - row.put("myInt", i); - row.put("myMap", m); - row.put("myEnum", e); - row.put("myLongOrFloat", unionVal); - row.put("myIntList", intArray); - return row; - } -} \ No newline at end of file
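With ConvertAvroToORC and its tests removed, the flow they exercised is worth recording. A condensed sketch of the Avro-to-ORC loop, with the per-field column-vector population elided (the deleted `OrcUtils.putToRowBatch` handled those per-type details); `convert` and its signature are illustrative only, not the deleted processor code:

```java
import org.apache.avro.file.DataFileStream;
import org.apache.avro.generic.GenericDatumReader;
import org.apache.avro.generic.GenericRecord;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch;
import org.apache.orc.OrcFile;
import org.apache.orc.TypeDescription;
import org.apache.orc.Writer;

import java.io.InputStream;

public class AvroToOrcSketch {

    public static long convert(InputStream avroIn, Path orcPath, TypeDescription orcSchema) throws Exception {
        Configuration conf = new Configuration();
        long rowCount = 0;
        try (DataFileStream<GenericRecord> records =
                     new DataFileStream<>(avroIn, new GenericDatumReader<>())) {
            Writer writer = OrcFile.createWriter(orcPath,
                    OrcFile.writerOptions(conf).setSchema(orcSchema));
            VectorizedRowBatch batch = orcSchema.createRowBatch();
            for (GenericRecord record : records) {
                int row = batch.size++;
                // ...copy each Avro field of 'record' into batch.cols[*] at index 'row'...
                rowCount++;
                if (batch.size == batch.getMaxSize()) { // flush a full batch (1024 rows by default)
                    writer.addRowBatch(batch);
                    batch.reset();
                }
            }
            if (batch.size != 0) {
                writer.addRowBatch(batch); // flush the final partial batch
            }
            writer.close();
        }
        return rowCount;
    }
}
```

The deleted test_onTrigger_multiple_batches asserts exactly this batching behavior: 2000 input records must span at least two 1024-row batches in the resulting file.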