NIFI-6318: Support EL in CSV formatting properties

CSVReader and CSVRecordSetWriter controller services and also ConvertExcelToCSVProcessor
support EL for Value Separator, Quote Character and Escape Character properties.

NIFI-6318: Fixed null checks and compound OR expression.

NIFI-6318: RecordSetWriterFactory.createWriter() changes.

NIFI-6318: Initialize CSVFormat in onEnabled() if there are no dynamic formatting properties.

NIFI-6318: Comment Marker supports EL.

NIFI-6318: Various review changes.

This closes #3504.

Signed-off-by: Koji Kawamura <ijokarumawak@apache.org>
This commit is contained in:
Peter Turcsanyi 2019-05-28 00:22:25 +02:00 committed by Koji Kawamura
parent 6d5acf1cb2
commit c6e6a418aa
No known key found for this signature in database
GPG Key ID: 36136B0EC89E4758
65 changed files with 1876 additions and 1330 deletions

View File

@ -294,7 +294,7 @@ public class MockPropertyValue implements PropertyValue {
@Override @Override
public boolean isExpressionLanguagePresent() { public boolean isExpressionLanguagePresent() {
if (!Boolean.TRUE.equals(expectExpressions)) { if (rawValue == null) {
return false; return false;
} }

View File

@ -465,7 +465,7 @@ public class ConsumeAzureEventHub extends AbstractSessionFactoryProcessor {
// Initialize the writer when the first record is read. // Initialize the writer when the first record is read.
final RecordSchema readerSchema = record.getSchema(); final RecordSchema readerSchema = record.getSchema();
final RecordSchema writeSchema = writerFactory.getSchema(schemaRetrievalVariables, readerSchema); final RecordSchema writeSchema = writerFactory.getSchema(schemaRetrievalVariables, readerSchema);
writer = writerFactory.createWriter(logger, writeSchema, out); writer = writerFactory.createWriter(logger, writeSchema, out, flowFile);
writer.beginRecordSet(); writer.beginRecordSet();
} }

View File

@ -18,6 +18,7 @@ package org.apache.nifi.processors.azure.eventhub;
import com.microsoft.azure.eventhubs.EventData; import com.microsoft.azure.eventhubs.EventData;
import com.microsoft.azure.eventprocessorhost.PartitionContext; import com.microsoft.azure.eventprocessorhost.PartitionContext;
import org.apache.nifi.flowfile.FlowFile;
import org.apache.nifi.processor.ProcessSessionFactory; import org.apache.nifi.processor.ProcessSessionFactory;
import org.apache.nifi.processor.ProcessorInitializationContext; import org.apache.nifi.processor.ProcessorInitializationContext;
import org.apache.nifi.provenance.ProvenanceEventRecord; import org.apache.nifi.provenance.ProvenanceEventRecord;
@ -180,7 +181,7 @@ public class TestConsumeAzureEventHub {
processor.setWriterFactory(writerFactory); processor.setWriterFactory(writerFactory);
final RecordSetWriter writer = mock(RecordSetWriter.class); final RecordSetWriter writer = mock(RecordSetWriter.class);
final AtomicReference<OutputStream> outRef = new AtomicReference<>(); final AtomicReference<OutputStream> outRef = new AtomicReference<>();
when(writerFactory.createWriter(any(), any(), any())).thenAnswer(invocation -> { when(writerFactory.createWriter(any(), any(), any(), any(FlowFile.class))).thenAnswer(invocation -> {
outRef.set(invocation.getArgument(2)); outRef.set(invocation.getArgument(2));
return writer; return writer;
}); });

View File

@ -187,11 +187,11 @@ public class PutDruidRecord extends AbstractSessionFactoryProcessor {
final RecordReader reader = recordParserFactory.createRecordReader(flowFile, in, getLogger()); final RecordReader reader = recordParserFactory.createRecordReader(flowFile, in, getLogger());
final RecordSchema outSchema = writerFactory.getSchema(attributes, reader.getSchema()); final RecordSchema outSchema = writerFactory.getSchema(attributes, reader.getSchema());
droppedRecordWriter = writerFactory.createWriter(log, outSchema, droppedOutputStream); droppedRecordWriter = writerFactory.createWriter(log, outSchema, droppedOutputStream, flowFile);
droppedRecordWriter.beginRecordSet(); droppedRecordWriter.beginRecordSet();
failedRecordWriter = writerFactory.createWriter(log, outSchema, failedOutputStream); failedRecordWriter = writerFactory.createWriter(log, outSchema, failedOutputStream, flowFile);
failedRecordWriter.beginRecordSet(); failedRecordWriter.beginRecordSet();
successfulRecordWriter = writerFactory.createWriter(log, outSchema, successfulOutputStream); successfulRecordWriter = writerFactory.createWriter(log, outSchema, successfulOutputStream, flowFile);
successfulRecordWriter.beginRecordSet(); successfulRecordWriter.beginRecordSet();
Record r; Record r;

View File

@ -558,8 +558,8 @@ public class PutElasticsearchHttpRecord extends AbstractElasticsearchHttpProcess
final RecordSchema schema = writerFactory.getSchema(inputFlowFile.getAttributes(), reader.getSchema()); final RecordSchema schema = writerFactory.getSchema(inputFlowFile.getAttributes(), reader.getSchema());
try (final RecordSetWriter successWriter = writerFactory.createWriter(getLogger(), schema, successOut); try (final RecordSetWriter successWriter = writerFactory.createWriter(getLogger(), schema, successOut, successFlowFile);
final RecordSetWriter failedWriter = writerFactory.createWriter(getLogger(), schema, failedOut)) { final RecordSetWriter failedWriter = writerFactory.createWriter(getLogger(), schema, failedOut, failedFlowFile)) {
successWriter.beginRecordSet(); successWriter.beginRecordSet();
failedWriter.beginRecordSet(); failedWriter.beginRecordSet();

View File

@ -199,7 +199,7 @@ public abstract class AbstractFetchHDFSRecord extends AbstractHadoopProcessor {
final RecordSchema schema = recordSetWriterFactory.getSchema(originalFlowFile.getAttributes(), final RecordSchema schema = recordSetWriterFactory.getSchema(originalFlowFile.getAttributes(),
record == null ? null : record.getSchema()); record == null ? null : record.getSchema());
try (final RecordSetWriter recordSetWriter = recordSetWriterFactory.createWriter(getLogger(), schema, out)) { try (final RecordSetWriter recordSetWriter = recordSetWriterFactory.createWriter(getLogger(), schema, out, originalFlowFile)) {
recordSetWriter.beginRecordSet(); recordSetWriter.beginRecordSet();
if (record != null) { if (record != null) {
recordSetWriter.write(record); recordSetWriter.write(record);

View File

@ -30,8 +30,8 @@ import java.util.List;
import java.util.Map; import java.util.Map;
/** /**
* An implementation that is suitable for testing that does not serialize the data to an Output Stream but insted just buffers the data into an * An implementation that is suitable for testing that does not serialize the data to an Output Stream but instead just buffers the data into an
* ArrayList and then provides that List of written records to the user * ArrayList and then provides that List of written records to the user.
*/ */
public class ArrayListRecordWriter extends AbstractControllerService implements RecordSetWriterFactory { public class ArrayListRecordWriter extends AbstractControllerService implements RecordSetWriterFactory {
private final List<Record> records = new ArrayList<>(); private final List<Record> records = new ArrayList<>();
@ -48,7 +48,7 @@ public class ArrayListRecordWriter extends AbstractControllerService implements
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) {
return new ArrayListRecordSetWriter(records); return new ArrayListRecordSetWriter(records);
} }

View File

@ -70,7 +70,7 @@ public class MockRecordWriter extends AbstractControllerService implements Recor
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream rawOut) { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream rawOut, Map<String, String> variables) {
final OutputStream out = bufferOutput ? new BufferedOutputStream(rawOut) : rawOut; final OutputStream out = bufferOutput ? new BufferedOutputStream(rawOut) : rawOut;
return new RecordSetWriter() { return new RecordSetWriter() {

View File

@ -26,9 +26,15 @@ import org.apache.nifi.components.PropertyValue;
import org.apache.nifi.context.PropertyContext; import org.apache.nifi.context.PropertyContext;
import org.apache.nifi.expression.ExpressionLanguageScope; import org.apache.nifi.expression.ExpressionLanguageScope;
import org.apache.nifi.processor.util.StandardValidators; import org.apache.nifi.processor.util.StandardValidators;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import java.util.Map;
public class CSVUtils { public class CSVUtils {
private static Logger LOG = LoggerFactory.getLogger(CSVUtils.class);
public static final AllowableValue CUSTOM = new AllowableValue("custom", "Custom Format", public static final AllowableValue CUSTOM = new AllowableValue("custom", "Custom Format",
"The format of the CSV is configured by using the properties of this Controller Service, such as Value Separator"); "The format of the CSV is configured by using the properties of this Controller Service, such as Value Separator");
public static final AllowableValue RFC_4180 = new AllowableValue("rfc-4180", "RFC 4180", "CSV data follows the RFC 4180 Specification defined at https://tools.ietf.org/html/rfc4180"); public static final AllowableValue RFC_4180 = new AllowableValue("rfc-4180", "RFC 4180", "CSV data follows the RFC 4180 Specification defined at https://tools.ietf.org/html/rfc4180");
@ -49,17 +55,19 @@ public class CSVUtils {
.build(); .build();
public static final PropertyDescriptor VALUE_SEPARATOR = new PropertyDescriptor.Builder() public static final PropertyDescriptor VALUE_SEPARATOR = new PropertyDescriptor.Builder()
.name("Value Separator") .name("Value Separator")
.description("The character that is used to separate values/fields in a CSV Record") .description("The character that is used to separate values/fields in a CSV Record. If the property has been specified via Expression Language " +
"but the expression gets evaluated to an invalid Value Separator at runtime, then it will be skipped and the default Value Separator will be used.")
.addValidator(CSVValidators.UNESCAPED_SINGLE_CHAR_VALIDATOR) .addValidator(CSVValidators.UNESCAPED_SINGLE_CHAR_VALIDATOR)
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES)
.defaultValue(",") .defaultValue(",")
.required(true) .required(true)
.build(); .build();
public static final PropertyDescriptor QUOTE_CHAR = new PropertyDescriptor.Builder() public static final PropertyDescriptor QUOTE_CHAR = new PropertyDescriptor.Builder()
.name("Quote Character") .name("Quote Character")
.description("The character that is used to quote values so that escape characters do not have to be used") .description("The character that is used to quote values so that escape characters do not have to be used. If the property has been specified via Expression Language " +
"but the expression gets evaluated to an invalid Quote Character at runtime, then it will be skipped and the default Quote Character will be used.")
.addValidator(new CSVValidators.SingleCharacterValidator()) .addValidator(new CSVValidators.SingleCharacterValidator())
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES)
.defaultValue("\"") .defaultValue("\"")
.required(true) .required(true)
.build(); .build();
@ -92,14 +100,15 @@ public class CSVUtils {
.name("Comment Marker") .name("Comment Marker")
.description("The character that is used to denote the start of a comment. Any line that begins with this comment will be ignored.") .description("The character that is used to denote the start of a comment. Any line that begins with this comment will be ignored.")
.addValidator(new CSVValidators.SingleCharacterValidator()) .addValidator(new CSVValidators.SingleCharacterValidator())
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES)
.required(false) .required(false)
.build(); .build();
public static final PropertyDescriptor ESCAPE_CHAR = new PropertyDescriptor.Builder() public static final PropertyDescriptor ESCAPE_CHAR = new PropertyDescriptor.Builder()
.name("Escape Character") .name("Escape Character")
.description("The character that is used to escape characters that would otherwise have a specific meaning to the CSV Parser.") .description("The character that is used to escape characters that would otherwise have a specific meaning to the CSV Parser. If the property has been specified via Expression Language " +
"but the expression gets evaluated to an invalid Escape Character at runtime, then it will be skipped and the default Escape Character will be used.")
.addValidator(new CSVValidators.SingleCharacterValidator()) .addValidator(new CSVValidators.SingleCharacterValidator())
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES)
.defaultValue("\\") .defaultValue("\\")
.required(true) .required(true)
.build(); .build();
@ -168,10 +177,19 @@ public class CSVUtils {
.required(true) .required(true)
.build(); .build();
public static CSVFormat createCSVFormat(final PropertyContext context) { public static boolean isDynamicCSVFormat(final PropertyContext context) {
final String formatName = context.getProperty(CSV_FORMAT).getValue();
return formatName.equalsIgnoreCase(CUSTOM.getValue())
&& (context.getProperty(VALUE_SEPARATOR).isExpressionLanguagePresent()
|| context.getProperty(QUOTE_CHAR).isExpressionLanguagePresent()
|| context.getProperty(ESCAPE_CHAR).isExpressionLanguagePresent()
|| context.getProperty(COMMENT_MARKER).isExpressionLanguagePresent());
}
public static CSVFormat createCSVFormat(final PropertyContext context, final Map<String, String> variables) {
final String formatName = context.getProperty(CSV_FORMAT).getValue(); final String formatName = context.getProperty(CSV_FORMAT).getValue();
if (formatName.equalsIgnoreCase(CUSTOM.getValue())) { if (formatName.equalsIgnoreCase(CUSTOM.getValue())) {
return buildCustomFormat(context); return buildCustomFormat(context, variables);
} }
if (formatName.equalsIgnoreCase(RFC_4180.getValue())) { if (formatName.equalsIgnoreCase(RFC_4180.getValue())) {
return CSVFormat.RFC4180; return CSVFormat.RFC4180;
@ -190,50 +208,87 @@ public class CSVUtils {
} }
} }
private static char getUnescapedChar(final PropertyContext context, final PropertyDescriptor property) { private static Character getCharUnescapedJava(final PropertyContext context, final PropertyDescriptor property, final Map<String, String> variables) {
return StringEscapeUtils.unescapeJava(context.getProperty(property).getValue()).charAt(0); String value = context.getProperty(property).evaluateAttributeExpressions(variables).getValue();
if (value != null) {
String unescaped = unescapeJava(value);
if (unescaped.length() == 1) {
return unescaped.charAt(0);
}
}
LOG.warn("'{}' property evaluated to an invalid value: \"{}\". It must be a single character. The property value will be ignored.", property.getName(), value);
if (property.getDefaultValue() != null) {
return property.getDefaultValue().charAt(0);
} else {
return null;
}
} }
private static char getChar(final PropertyContext context, final PropertyDescriptor property) { private static Character getCharUnescaped(final PropertyContext context, final PropertyDescriptor property, final Map<String, String> variables) {
return CSVUtils.unescape(context.getProperty(property).getValue()).charAt(0); String value = context.getProperty(property).evaluateAttributeExpressions(variables).getValue();
if (value != null) {
String unescaped = unescape(value);
if (unescaped.length() == 1) {
return unescaped.charAt(0);
}
}
LOG.warn("'{}' property evaluated to an invalid value: \"{}\". It must be a single character. The property value will be ignored.", property.getName(), value);
if (property.getDefaultValue() != null) {
return property.getDefaultValue().charAt(0);
} else {
return null;
}
} }
private static CSVFormat buildCustomFormat(final PropertyContext context) { private static CSVFormat buildCustomFormat(final PropertyContext context, final Map<String, String> variables) {
final char valueSeparator = getUnescapedChar(context, VALUE_SEPARATOR); final Character valueSeparator = getCharUnescapedJava(context, VALUE_SEPARATOR, variables);
CSVFormat format = CSVFormat.newFormat(valueSeparator) CSVFormat format = CSVFormat.newFormat(valueSeparator)
.withAllowMissingColumnNames() .withAllowMissingColumnNames()
.withIgnoreEmptyLines(); .withIgnoreEmptyLines();
final PropertyValue skipHeaderPropertyValue = context.getProperty(FIRST_LINE_IS_HEADER); final PropertyValue firstLineIsHeaderPropertyValue = context.getProperty(FIRST_LINE_IS_HEADER);
if (skipHeaderPropertyValue.getValue() != null && skipHeaderPropertyValue.asBoolean()) { if (firstLineIsHeaderPropertyValue.getValue() != null && firstLineIsHeaderPropertyValue.asBoolean()) {
format = format.withFirstRecordAsHeader(); format = format.withFirstRecordAsHeader();
} }
format = format.withQuote(getChar(context, QUOTE_CHAR)); final Character quoteChar = getCharUnescaped(context, QUOTE_CHAR, variables);
format = format.withEscape(getChar(context, ESCAPE_CHAR)); format = format.withQuote(quoteChar);
final Character escapeChar = getCharUnescaped(context, ESCAPE_CHAR, variables);
format = format.withEscape(escapeChar);
format = format.withTrim(context.getProperty(TRIM_FIELDS).asBoolean()); format = format.withTrim(context.getProperty(TRIM_FIELDS).asBoolean());
if (context.getProperty(COMMENT_MARKER).isSet()) { if (context.getProperty(COMMENT_MARKER).isSet()) {
format = format.withCommentMarker(getChar(context, COMMENT_MARKER)); final Character commentMarker = getCharUnescaped(context, COMMENT_MARKER, variables);
if (commentMarker != null) {
format = format.withCommentMarker(commentMarker);
}
} }
if (context.getProperty(NULL_STRING).isSet()) { if (context.getProperty(NULL_STRING).isSet()) {
format = format.withNullString(CSVUtils.unescape(context.getProperty(NULL_STRING).getValue())); format = format.withNullString(unescape(context.getProperty(NULL_STRING).getValue()));
} }
final PropertyValue quoteValue = context.getProperty(QUOTE_MODE); final PropertyValue quoteValue = context.getProperty(QUOTE_MODE);
if (quoteValue != null) { if (quoteValue != null && quoteValue.isSet()) {
final QuoteMode quoteMode = QuoteMode.valueOf(quoteValue.getValue()); final QuoteMode quoteMode = QuoteMode.valueOf(quoteValue.getValue());
format = format.withQuoteMode(quoteMode); format = format.withQuoteMode(quoteMode);
} }
final PropertyValue trailingDelimiterValue = context.getProperty(TRAILING_DELIMITER); final PropertyValue trailingDelimiterValue = context.getProperty(TRAILING_DELIMITER);
if (trailingDelimiterValue != null) { if (trailingDelimiterValue != null && trailingDelimiterValue.isSet()) {
final boolean trailingDelimiter = trailingDelimiterValue.asBoolean(); final boolean trailingDelimiter = trailingDelimiterValue.asBoolean();
format = format.withTrailingDelimiter(trailingDelimiter); format = format.withTrailingDelimiter(trailingDelimiter);
} }
final PropertyValue recordSeparator = context.getProperty(RECORD_SEPARATOR); final PropertyValue recordSeparator = context.getProperty(RECORD_SEPARATOR);
if (recordSeparator != null) { if (recordSeparator != null && recordSeparator.isSet()) {
final String separator = unescape(recordSeparator.getValue()); final String separator = unescape(recordSeparator.getValue());
format = format.withRecordSeparator(separator); format = format.withRecordSeparator(separator);
} }
@ -241,6 +296,13 @@ public class CSVUtils {
return format; return format;
} }
public static String unescapeJava(String input) {
if (input != null && input.length() > 1) {
input = StringEscapeUtils.unescapeJava(input);
}
return input;
}
public static String unescape(final String input) { public static String unescape(final String input) {
if (input == null) { if (input == null) {

View File

@ -17,7 +17,6 @@
package org.apache.nifi.csv; package org.apache.nifi.csv;
import org.apache.commons.text.StringEscapeUtils;
import org.apache.nifi.components.ValidationContext; import org.apache.nifi.components.ValidationContext;
import org.apache.nifi.components.ValidationResult; import org.apache.nifi.components.ValidationResult;
import org.apache.nifi.components.Validator; import org.apache.nifi.components.Validator;
@ -47,23 +46,25 @@ public class CSVValidators {
.build(); .build();
} }
final String unescaped = CSVUtils.unescape(input); if (!context.isExpressionLanguageSupported(subject) || !context.isExpressionLanguagePresent(input)) {
if (unescaped.length() != 1) { final String unescaped = CSVUtils.unescape(input);
return new ValidationResult.Builder() if (unescaped.length() != 1) {
.input(input) return new ValidationResult.Builder()
.subject(subject) .input(input)
.valid(false) .subject(subject)
.explanation("Value must be exactly 1 character but was " + input.length() + " in length") .valid(false)
.build(); .explanation("Value must be exactly 1 character but was " + input.length() + " in length")
} .build();
}
if (illegalChars.contains(unescaped)) { if (illegalChars.contains(unescaped)) {
return new ValidationResult.Builder() return new ValidationResult.Builder()
.input(input) .input(input)
.subject(subject) .subject(subject)
.valid(false) .valid(false)
.explanation(input + " is not a valid character for this property") .explanation(input + " is not a valid character for this property")
.build(); .build();
}
} }
return new ValidationResult.Builder() return new ValidationResult.Builder()
@ -88,22 +89,16 @@ public class CSVValidators {
.build(); .build();
} }
String unescapeString = unescapeString(input); String unescaped = CSVUtils.unescapeJava(input);
return new ValidationResult.Builder() return new ValidationResult.Builder()
.subject(subject) .subject(subject)
.input(unescapeString) .input(unescaped)
.explanation("Only non-null single characters are supported") .explanation("Only non-null single characters are supported")
.valid((unescapeString.length() == 1 && unescapeString.charAt(0) != 0) || context.isExpressionLanguagePresent(input)) .valid((unescaped.length() == 1 && unescaped.charAt(0) != 0)
|| (context.isExpressionLanguageSupported(subject) && context.isExpressionLanguagePresent(input)))
.build(); .build();
} }
private String unescapeString(String input) {
if (input != null && input.length() > 1) {
input = StringEscapeUtils.unescapeJava(input);
}
return input;
}
}; };
} }

View File

@ -0,0 +1,152 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.nifi.csv;
import org.apache.commons.csv.CSVFormat;
import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.context.PropertyContext;
import org.apache.nifi.util.MockConfigurationContext;
import org.junit.Test;
import java.util.Collections;
import java.util.HashMap;
import java.util.Map;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertNull;
import static org.junit.Assert.assertTrue;
public class CSVUtilsTest {
@Test
public void testIsDynamicCSVFormatWithStaticProperties() {
PropertyContext context = createContext("|", "'", "^", "~");
boolean isDynamicCSVFormat = CSVUtils.isDynamicCSVFormat(context);
assertFalse(isDynamicCSVFormat);
}
@Test
public void testIsDynamicCSVFormatWithDynamicValueSeparator() {
PropertyContext context = createContext("${csv.delimiter}", "'", "^", "~");
boolean isDynamicCSVFormat = CSVUtils.isDynamicCSVFormat(context);
assertTrue(isDynamicCSVFormat);
}
@Test
public void testIsDynamicCSVFormatWithDynamicQuoteCharacter() {
PropertyContext context = createContext("|", "${csv.quote}", "^", "~");
boolean isDynamicCSVFormat = CSVUtils.isDynamicCSVFormat(context);
assertTrue(isDynamicCSVFormat);
}
@Test
public void testIsDynamicCSVFormatWithDynamicEscapeCharacter() {
PropertyContext context = createContext("|", "'", "${csv.escape}", "~");
boolean isDynamicCSVFormat = CSVUtils.isDynamicCSVFormat(context);
assertTrue(isDynamicCSVFormat);
}
@Test
public void testIsDynamicCSVFormatWithDynamicCommentMarker() {
PropertyContext context = createContext("|", "'", "^", "${csv.comment}");
boolean isDynamicCSVFormat = CSVUtils.isDynamicCSVFormat(context);
assertTrue(isDynamicCSVFormat);
}
@Test
public void testCustomFormat() {
PropertyContext context = createContext("|", "'", "^", "~");
CSVFormat csvFormat = CSVUtils.createCSVFormat(context, Collections.emptyMap());
assertEquals('|', csvFormat.getDelimiter());
assertEquals('\'', (char) csvFormat.getQuoteCharacter());
assertEquals('^', (char) csvFormat.getEscapeCharacter());
assertEquals('~', (char) csvFormat.getCommentMarker());
}
@Test
public void testCustomFormatWithEL() {
PropertyContext context = createContext("${csv.delimiter}", "${csv.quote}", "${csv.escape}", "${csv.comment}");
Map<String, String> attributes = new HashMap<>();
attributes.put("csv.delimiter", "|");
attributes.put("csv.quote", "'");
attributes.put("csv.escape", "^");
attributes.put("csv.comment", "~");
CSVFormat csvFormat = CSVUtils.createCSVFormat(context, attributes);
assertEquals('|', csvFormat.getDelimiter());
assertEquals('\'', (char) csvFormat.getQuoteCharacter());
assertEquals('^', (char) csvFormat.getEscapeCharacter());
assertEquals('~', (char) csvFormat.getCommentMarker());
}
@Test
public void testCustomFormatWithELEmptyValues() {
PropertyContext context = createContext("${csv.delimiter}", "${csv.quote}", "${csv.escape}", "${csv.comment}");
CSVFormat csvFormat = CSVUtils.createCSVFormat(context, Collections.emptyMap());
assertEquals(',', csvFormat.getDelimiter());
assertEquals('"', (char) csvFormat.getQuoteCharacter());
assertEquals('\\', (char) csvFormat.getEscapeCharacter());
assertNull(csvFormat.getCommentMarker());
}
@Test
public void testCustomFormatWithELInvalidValues() {
PropertyContext context = createContext("${csv.delimiter}", "${csv.quote}", "${csv.escape}", "${csv.comment}");
Map<String, String> attributes = new HashMap<>();
attributes.put("csv.delimiter", "invalid");
attributes.put("csv.quote", "invalid");
attributes.put("csv.escape", "invalid");
attributes.put("csv.comment", "invalid");
CSVFormat csvFormat = CSVUtils.createCSVFormat(context, attributes);
assertEquals(',', csvFormat.getDelimiter());
assertEquals('"', (char) csvFormat.getQuoteCharacter());
assertEquals('\\', (char) csvFormat.getEscapeCharacter());
assertNull(csvFormat.getCommentMarker());
}
private PropertyContext createContext(String valueSeparator, String quoteChar, String escapeChar, String commentMarker) {
Map<PropertyDescriptor, String> properties = new HashMap<>();
properties.put(CSVUtils.VALUE_SEPARATOR, valueSeparator);
properties.put(CSVUtils.QUOTE_CHAR, quoteChar);
properties.put(CSVUtils.ESCAPE_CHAR, escapeChar);
properties.put(CSVUtils.COMMENT_MARKER, commentMarker);
return new MockConfigurationContext(properties, null);
}
}

View File

@ -312,7 +312,7 @@ public class JoltTransformRecord extends AbstractProcessor {
final Record firstRecord = reader.nextRecord(); final Record firstRecord = reader.nextRecord();
if (firstRecord == null) { if (firstRecord == null) {
try (final OutputStream out = session.write(transformed); try (final OutputStream out = session.write(transformed);
final RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out)) { final RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out, transformed)) {
writer.beginRecordSet(); writer.beginRecordSet();
writeResult = writer.finishRecordSet(); writeResult = writer.finishRecordSet();
@ -339,7 +339,7 @@ public class JoltTransformRecord extends AbstractProcessor {
// and instead use a Map<RecordSchema, RecordSetWriter>. This way, even if many different output schemas are possible, // and instead use a Map<RecordSchema, RecordSetWriter>. This way, even if many different output schemas are possible,
// the output FlowFiles will each only contain records that have the same schema. // the output FlowFiles will each only contain records that have the same schema.
try (final OutputStream out = session.write(transformed); try (final OutputStream out = session.write(transformed);
final RecordSetWriter writer = writerFactory.createWriter(getLogger(), writeSchema, out)) { final RecordSetWriter writer = writerFactory.createWriter(getLogger(), writeSchema, out, transformed)) {
writer.beginRecordSet(); writer.beginRecordSet();

View File

@ -508,7 +508,7 @@ public abstract class ConsumerLease implements Closeable, ConsumerRebalanceListe
throw new ProcessException(e); throw new ProcessException(e);
} }
writer = writerFactory.createWriter(logger, writeSchema, rawOut); writer = writerFactory.createWriter(logger, writeSchema, rawOut, flowFile);
writer.beginRecordSet(); writer.beginRecordSet();
tracker = new BundleTracker(consumerRecord, topicPartition, keyEncoding, writer); tracker = new BundleTracker(consumerRecord, topicPartition, keyEncoding, writer);

View File

@ -122,7 +122,7 @@ public class PublisherLease implements Closeable {
recordCount++; recordCount++;
baos.reset(); baos.reset();
try (final RecordSetWriter writer = writerFactory.createWriter(logger, schema, baos)) { try (final RecordSetWriter writer = writerFactory.createWriter(logger, schema, baos, flowFile)) {
writer.write(record); writer.write(record);
writer.flush(); writer.flush();
} }

View File

@ -282,11 +282,11 @@ public class TestPublisherLease {
final RecordSetWriterFactory writerFactory = Mockito.mock(RecordSetWriterFactory.class); final RecordSetWriterFactory writerFactory = Mockito.mock(RecordSetWriterFactory.class);
final RecordSetWriter writer = Mockito.mock(RecordSetWriter.class); final RecordSetWriter writer = Mockito.mock(RecordSetWriter.class);
Mockito.when(writerFactory.createWriter(eq(logger), eq(schema), any())).thenReturn(writer); Mockito.when(writerFactory.createWriter(eq(logger), eq(schema), any(), eq(flowFile))).thenReturn(writer);
lease.publish(flowFile, recordSet, writerFactory, schema, keyField, topic); lease.publish(flowFile, recordSet, writerFactory, schema, keyField, topic);
verify(writerFactory, times(2)).createWriter(eq(logger), eq(schema), any()); verify(writerFactory, times(2)).createWriter(eq(logger), eq(schema), any(), eq(flowFile));
verify(writer, times(2)).write(any(Record.class)); verify(writer, times(2)).write(any(Record.class));
verify(producer, times(2)).send(any(), any()); verify(producer, times(2)).send(any(), any());
} }

View File

@ -57,7 +57,7 @@ public class MockRecordWriter extends AbstractControllerService implements Recor
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) {
return new RecordSetWriter() { return new RecordSetWriter() {
@Override @Override

View File

@ -558,7 +558,7 @@ public abstract class ConsumerLease implements Closeable, ConsumerRebalanceListe
throw new ProcessException(e); throw new ProcessException(e);
} }
writer = writerFactory.createWriter(logger, writeSchema, rawOut); writer = writerFactory.createWriter(logger, writeSchema, rawOut, flowFile);
writer.beginRecordSet(); writer.beginRecordSet();
tracker = new BundleTracker(consumerRecord, topicPartition, keyEncoding, writer); tracker = new BundleTracker(consumerRecord, topicPartition, keyEncoding, writer);

View File

@ -167,7 +167,7 @@ public class PublisherLease implements Closeable {
baos.reset(); baos.reset();
Map<String, String> additionalAttributes = Collections.emptyMap(); Map<String, String> additionalAttributes = Collections.emptyMap();
try (final RecordSetWriter writer = writerFactory.createWriter(logger, schema, baos)) { try (final RecordSetWriter writer = writerFactory.createWriter(logger, schema, baos, flowFile)) {
final WriteResult writeResult = writer.write(record); final WriteResult writeResult = writer.write(record);
additionalAttributes = writeResult.getAttributes(); additionalAttributes = writeResult.getAttributes();
writer.flush(); writer.flush();

View File

@ -277,11 +277,11 @@ public class TestPublisherLease {
final RecordSetWriter writer = Mockito.mock(RecordSetWriter.class); final RecordSetWriter writer = Mockito.mock(RecordSetWriter.class);
Mockito.when(writer.write(Mockito.any(Record.class))).thenReturn(WriteResult.of(1, Collections.emptyMap())); Mockito.when(writer.write(Mockito.any(Record.class))).thenReturn(WriteResult.of(1, Collections.emptyMap()));
Mockito.when(writerFactory.createWriter(eq(logger), eq(schema), any())).thenReturn(writer); Mockito.when(writerFactory.createWriter(eq(logger), eq(schema), any(), eq(flowFile))).thenReturn(writer);
lease.publish(flowFile, recordSet, writerFactory, schema, keyField, topic); lease.publish(flowFile, recordSet, writerFactory, schema, keyField, topic);
verify(writerFactory, times(2)).createWriter(eq(logger), eq(schema), any()); verify(writerFactory, times(2)).createWriter(eq(logger), eq(schema), any(), eq(flowFile));
verify(writer, times(2)).write(any(Record.class)); verify(writer, times(2)).write(any(Record.class));
verify(producer, times(2)).send(any(), any()); verify(producer, times(2)).send(any(), any());
} }

View File

@ -57,7 +57,7 @@ public class MockRecordWriter extends AbstractControllerService implements Recor
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) {
return new RecordSetWriter() { return new RecordSetWriter() {
@Override @Override

View File

@ -558,7 +558,7 @@ public abstract class ConsumerLease implements Closeable, ConsumerRebalanceListe
throw new ProcessException(e); throw new ProcessException(e);
} }
writer = writerFactory.createWriter(logger, writeSchema, rawOut); writer = writerFactory.createWriter(logger, writeSchema, rawOut, flowFile);
writer.beginRecordSet(); writer.beginRecordSet();
tracker = new BundleTracker(consumerRecord, topicPartition, keyEncoding, writer); tracker = new BundleTracker(consumerRecord, topicPartition, keyEncoding, writer);

View File

@ -166,7 +166,7 @@ public class PublisherLease implements Closeable {
baos.reset(); baos.reset();
Map<String, String> additionalAttributes = Collections.emptyMap(); Map<String, String> additionalAttributes = Collections.emptyMap();
try (final RecordSetWriter writer = writerFactory.createWriter(logger, schema, baos)) { try (final RecordSetWriter writer = writerFactory.createWriter(logger, schema, baos, flowFile)) {
final WriteResult writeResult = writer.write(record); final WriteResult writeResult = writer.write(record);
additionalAttributes = writeResult.getAttributes(); additionalAttributes = writeResult.getAttributes();
writer.flush(); writer.flush();

View File

@ -277,11 +277,11 @@ public class TestPublisherLease {
final RecordSetWriter writer = Mockito.mock(RecordSetWriter.class); final RecordSetWriter writer = Mockito.mock(RecordSetWriter.class);
Mockito.when(writer.write(Mockito.any(Record.class))).thenReturn(WriteResult.of(1, Collections.emptyMap())); Mockito.when(writer.write(Mockito.any(Record.class))).thenReturn(WriteResult.of(1, Collections.emptyMap()));
Mockito.when(writerFactory.createWriter(eq(logger), eq(schema), any())).thenReturn(writer); Mockito.when(writerFactory.createWriter(eq(logger), eq(schema), any(), eq(flowFile))).thenReturn(writer);
lease.publish(flowFile, recordSet, writerFactory, schema, keyField, topic); lease.publish(flowFile, recordSet, writerFactory, schema, keyField, topic);
verify(writerFactory, times(2)).createWriter(eq(logger), eq(schema), any()); verify(writerFactory, times(2)).createWriter(eq(logger), eq(schema), any(), eq(flowFile));
verify(writer, times(2)).write(any(Record.class)); verify(writer, times(2)).write(any(Record.class));
verify(producer, times(2)).send(any(), any()); verify(producer, times(2)).send(any(), any());
} }

View File

@ -57,7 +57,7 @@ public class MockRecordWriter extends AbstractControllerService implements Recor
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) {
return new RecordSetWriter() { return new RecordSetWriter() {
@Override @Override

View File

@ -558,7 +558,7 @@ public abstract class ConsumerLease implements Closeable, ConsumerRebalanceListe
throw new ProcessException(e); throw new ProcessException(e);
} }
writer = writerFactory.createWriter(logger, writeSchema, rawOut); writer = writerFactory.createWriter(logger, writeSchema, rawOut, flowFile);
writer.beginRecordSet(); writer.beginRecordSet();
tracker = new BundleTracker(consumerRecord, topicPartition, keyEncoding, writer); tracker = new BundleTracker(consumerRecord, topicPartition, keyEncoding, writer);

View File

@ -166,7 +166,7 @@ public class PublisherLease implements Closeable {
baos.reset(); baos.reset();
Map<String, String> additionalAttributes = Collections.emptyMap(); Map<String, String> additionalAttributes = Collections.emptyMap();
try (final RecordSetWriter writer = writerFactory.createWriter(logger, schema, baos)) { try (final RecordSetWriter writer = writerFactory.createWriter(logger, schema, baos, flowFile)) {
final WriteResult writeResult = writer.write(record); final WriteResult writeResult = writer.write(record);
additionalAttributes = writeResult.getAttributes(); additionalAttributes = writeResult.getAttributes();
writer.flush(); writer.flush();

View File

@ -278,11 +278,11 @@ public class TestPublisherLease {
final RecordSetWriter writer = Mockito.mock(RecordSetWriter.class); final RecordSetWriter writer = Mockito.mock(RecordSetWriter.class);
Mockito.when(writer.write(Mockito.any(Record.class))).thenReturn(WriteResult.of(1, Collections.emptyMap())); Mockito.when(writer.write(Mockito.any(Record.class))).thenReturn(WriteResult.of(1, Collections.emptyMap()));
Mockito.when(writerFactory.createWriter(eq(logger), eq(schema), any())).thenReturn(writer); Mockito.when(writerFactory.createWriter(eq(logger), eq(schema), any(), eq(flowFile))).thenReturn(writer);
lease.publish(flowFile, recordSet, writerFactory, schema, keyField, topic); lease.publish(flowFile, recordSet, writerFactory, schema, keyField, topic);
verify(writerFactory, times(2)).createWriter(eq(logger), eq(schema), any()); verify(writerFactory, times(2)).createWriter(eq(logger), eq(schema), any(), eq(flowFile));
verify(writer, times(2)).write(any(Record.class)); verify(writer, times(2)).write(any(Record.class));
verify(producer, times(2)).send(any(), any()); verify(producer, times(2)).send(any(), any());
} }

View File

@ -57,7 +57,7 @@ public class MockRecordWriter extends AbstractControllerService implements Recor
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) {
return new RecordSetWriter() { return new RecordSetWriter() {
@Override @Override

View File

@ -165,7 +165,7 @@ public class GetMongoRecord extends AbstractMongoQueryProcessor {
put("schema.name", schemaName); put("schema.name", schemaName);
}}; }};
RecordSchema schema = writerFactory.getSchema(attrs, null); RecordSchema schema = writerFactory.getSchema(attrs, null);
RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out); RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out, attrs);
long count = 0L; long count = 0L;
writer.beginRecordSet(); writer.beginRecordSet();
while (cursor.hasNext()) { while (cursor.hasNext()) {

View File

@ -230,7 +230,8 @@ public class FetchParquetTest {
final RecordSetWriterFactory recordSetWriterFactory = Mockito.mock(RecordSetWriterFactory.class); final RecordSetWriterFactory recordSetWriterFactory = Mockito.mock(RecordSetWriterFactory.class);
when(recordSetWriterFactory.getIdentifier()).thenReturn("mock-writer-factory"); when(recordSetWriterFactory.getIdentifier()).thenReturn("mock-writer-factory");
when(recordSetWriterFactory.createWriter(any(ComponentLog.class), AdditionalMatchers.or(any(RecordSchema.class), isNull()), any(OutputStream.class))).thenReturn(recordSetWriter); when(recordSetWriterFactory.createWriter(any(ComponentLog.class), AdditionalMatchers.or(any(RecordSchema.class), isNull()), any(OutputStream.class), any(FlowFile.class)))
.thenReturn(recordSetWriter);
testRunner.addControllerService("mock-writer-factory", recordSetWriterFactory); testRunner.addControllerService("mock-writer-factory", recordSetWriterFactory);
testRunner.enableControllerService(recordSetWriterFactory); testRunner.enableControllerService(recordSetWriterFactory);

View File

@ -202,7 +202,7 @@ public class ConvertExcelToCSVProcessor
final String desiredSheetsDelimited = context.getProperty(DESIRED_SHEETS).evaluateAttributeExpressions(flowFile).getValue(); final String desiredSheetsDelimited = context.getProperty(DESIRED_SHEETS).evaluateAttributeExpressions(flowFile).getValue();
final boolean formatValues = context.getProperty(FORMAT_VALUES).asBoolean(); final boolean formatValues = context.getProperty(FORMAT_VALUES).asBoolean();
final CSVFormat csvFormat = CSVUtils.createCSVFormat(context); final CSVFormat csvFormat = CSVUtils.createCSVFormat(context, flowFile.getAttributes());
//Switch to 0 based index //Switch to 0 based index
final int firstRow = context.getProperty(ROWS_TO_SKIP).evaluateAttributeExpressions(flowFile).asInteger() - 1; final int firstRow = context.getProperty(ROWS_TO_SKIP).evaluateAttributeExpressions(flowFile).asInteger() - 1;

View File

@ -167,7 +167,7 @@ public class ConvertExcelToCSVProcessorTest {
public void testSkipRowsWithEL() throws Exception { public void testSkipRowsWithEL() throws Exception {
Map<String, String> attributes = new HashMap<String, String>(); Map<String, String> attributes = new HashMap<String, String>();
attributes.put("rowsToSkip", "2"); attributes.put("rowsToSkip", "2");
testRunner.enqueue(new File("src/test/resources/dataformatting.xlsx").toPath(),attributes); testRunner.enqueue(new File("src/test/resources/dataformatting.xlsx").toPath(), attributes);
testRunner.setProperty(ConvertExcelToCSVProcessor.ROWS_TO_SKIP, "${rowsToSkip}"); testRunner.setProperty(ConvertExcelToCSVProcessor.ROWS_TO_SKIP, "${rowsToSkip}");
testRunner.setProperty(ConvertExcelToCSVProcessor.FORMAT_VALUES, "true"); testRunner.setProperty(ConvertExcelToCSVProcessor.FORMAT_VALUES, "true");
@ -224,7 +224,7 @@ public class ConvertExcelToCSVProcessorTest {
public void testSkipColumnsWithEL() throws Exception { public void testSkipColumnsWithEL() throws Exception {
Map<String, String> attributes = new HashMap<String, String>(); Map<String, String> attributes = new HashMap<String, String>();
attributes.put("columnsToSkip", "2"); attributes.put("columnsToSkip", "2");
testRunner.enqueue(new File("src/test/resources/dataformatting.xlsx").toPath(),attributes); testRunner.enqueue(new File("src/test/resources/dataformatting.xlsx").toPath(), attributes);
testRunner.setProperty(ConvertExcelToCSVProcessor.COLUMNS_TO_SKIP, "${columnsToSkip}"); testRunner.setProperty(ConvertExcelToCSVProcessor.COLUMNS_TO_SKIP, "${columnsToSkip}");
testRunner.setProperty(ConvertExcelToCSVProcessor.FORMAT_VALUES, "true"); testRunner.setProperty(ConvertExcelToCSVProcessor.FORMAT_VALUES, "true");
@ -280,6 +280,100 @@ public class ConvertExcelToCSVProcessorTest {
"9.8765E+08||\r\n"); "9.8765E+08||\r\n");
} }
@Test
public void testCustomValueSeparatorWithEL() throws Exception {
Map<String, String> attributes = new HashMap<String, String>();
attributes.put("csv.delimiter", "|");
testRunner.enqueue(new File("src/test/resources/dataformatting.xlsx").toPath(), attributes);
testRunner.setProperty(CSVUtils.VALUE_SEPARATOR, "${csv.delimiter}");
testRunner.setProperty(ConvertExcelToCSVProcessor.FORMAT_VALUES, "true");
testRunner.run();
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.SUCCESS, 1);
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.ORIGINAL, 1);
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.FAILURE, 0);
MockFlowFile ff = testRunner.getFlowFilesForRelationship(ConvertExcelToCSVProcessor.SUCCESS).get(0);
Long rowsSheet = new Long(ff.getAttribute(ConvertExcelToCSVProcessor.ROW_NUM));
assertTrue(rowsSheet == 9);
LocalDateTime localDt = LocalDateTime.of(2017, 1, 1, 12, 0, 0);
ff.assertContentEquals("Numbers|Timestamps|Money\n" +
"1234.456|" + DateTimeFormatter.ofPattern("d/M/yy").format(localDt) + "|$ 123.45\n" +
"1234.46|" + DateTimeFormatter.ofPattern("hh:mm:ss a").format(localDt) + "|£ 123.45\n" +
"1234.5|" + DateTimeFormatter.ofPattern("EEEE, MMMM dd, yyyy").format(localDt) + "|¥ 123.45\n" +
"1,234.46|" + DateTimeFormatter.ofPattern("d/M/yy HH:mm").format(localDt) + "|$ 1,023.45\n" +
"1,234.4560|" + DateTimeFormatter.ofPattern("hh:mm a").format(localDt) + "|£ 1,023.45\n" +
"9.88E+08|" + DateTimeFormatter.ofPattern("yyyy/MM/dd/ HH:mm").format(localDt) + "|¥ 1,023.45\n" +
"9.877E+08||\n" +
"9.8765E+08||\n");
}
@Test
public void testCustomQuoteCharWithEL() throws Exception {
Map<String, String> attributes = new HashMap<String, String>();
attributes.put("csv.quote", "'");
testRunner.enqueue(new File("src/test/resources/dataformatting.xlsx").toPath(), attributes);
testRunner.setProperty(CSVUtils.QUOTE_CHAR, "${csv.quote}");
testRunner.setProperty(ConvertExcelToCSVProcessor.FORMAT_VALUES, "true");
testRunner.setProperty(CSVUtils.QUOTE_MODE, CSVUtils.QUOTE_ALL);
testRunner.run();
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.SUCCESS, 1);
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.ORIGINAL, 1);
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.FAILURE, 0);
MockFlowFile ff = testRunner.getFlowFilesForRelationship(ConvertExcelToCSVProcessor.SUCCESS).get(0);
Long rowsSheet = new Long(ff.getAttribute(ConvertExcelToCSVProcessor.ROW_NUM));
assertTrue(rowsSheet == 9);
LocalDateTime localDt = LocalDateTime.of(2017, 1, 1, 12, 0, 0);
ff.assertContentEquals("'Numbers','Timestamps','Money'\n" +
"'1234.456','" + DateTimeFormatter.ofPattern("d/M/yy").format(localDt) + "','$ 123.45'\n" +
"'1234.46','" + DateTimeFormatter.ofPattern("hh:mm:ss a").format(localDt) + "','£ 123.45'\n" +
"'1234.5','" + DateTimeFormatter.ofPattern("EEEE, MMMM dd, yyyy").format(localDt) + "','¥ 123.45'\n" +
"'1,234.46','" + DateTimeFormatter.ofPattern("d/M/yy HH:mm").format(localDt) + "','$ 1,023.45'\n" +
"'1,234.4560','" + DateTimeFormatter.ofPattern("hh:mm a").format(localDt) + "','£ 1,023.45'\n" +
"'9.88E+08','" + DateTimeFormatter.ofPattern("yyyy/MM/dd/ HH:mm").format(localDt) + "','¥ 1,023.45'\n" +
"'9.877E+08',,\n" +
"'9.8765E+08',,\n");
}
@Test
public void testCustomEscapeCharWithEL() throws Exception {
Map<String, String> attributes = new HashMap<String, String>();
attributes.put("csv.escape", "^");
testRunner.enqueue(new File("src/test/resources/dataformatting.xlsx").toPath(), attributes);
testRunner.setProperty(CSVUtils.ESCAPE_CHAR, "${csv.escape}");
testRunner.setProperty(ConvertExcelToCSVProcessor.FORMAT_VALUES, "true");
testRunner.run();
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.SUCCESS, 1);
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.ORIGINAL, 1);
testRunner.assertTransferCount(ConvertExcelToCSVProcessor.FAILURE, 0);
MockFlowFile ff = testRunner.getFlowFilesForRelationship(ConvertExcelToCSVProcessor.SUCCESS).get(0);
Long rowsSheet = new Long(ff.getAttribute(ConvertExcelToCSVProcessor.ROW_NUM));
assertTrue(rowsSheet == 9);
LocalDateTime localDt = LocalDateTime.of(2017, 1, 1, 12, 0, 0);
ff.assertContentEquals("Numbers,Timestamps,Money\n" +
"1234.456," + DateTimeFormatter.ofPattern("d/M/yy").format(localDt) + ",$ 123.45\n" +
"1234.46," + DateTimeFormatter.ofPattern("hh:mm:ss a").format(localDt) + ",£ 123.45\n" +
"1234.5," + DateTimeFormatter.ofPattern("EEEE^, MMMM dd^, yyyy").format(localDt) + ",¥ 123.45\n" +
"1^,234.46," + DateTimeFormatter.ofPattern("d/M/yy HH:mm").format(localDt) + ",$ 1^,023.45\n" +
"1^,234.4560," + DateTimeFormatter.ofPattern("hh:mm a").format(localDt) + ",£ 1^,023.45\n" +
"9.88E+08," + DateTimeFormatter.ofPattern("yyyy/MM/dd/ HH:mm").format(localDt) + ",¥ 1^,023.45\n" +
"9.877E+08,,\n" +
"9.8765E+08,,\n");
}
/** /**
* Validates that all sheets in the Excel document are exported. * Validates that all sheets in the Excel document are exported.
* *

View File

@ -62,10 +62,10 @@ public class ScriptedRecordSetWriter extends AbstractScriptedRecordFactory<Recor
@Override @Override
public RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out) throws SchemaNotFoundException, IOException { public RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out, Map<String, String> variables) throws SchemaNotFoundException, IOException {
if (recordFactory.get() != null) { if (recordFactory.get() != null) {
try { try {
return recordFactory.get().createWriter(logger, schema, out); return recordFactory.get().createWriter(logger, schema, out, variables);
} catch (UndeclaredThrowableException ute) { } catch (UndeclaredThrowableException ute) {
throw new IOException(ute.getCause()); throw new IOException(ute.getCause());
} }

View File

@ -102,7 +102,7 @@ class ScriptedRecordSetWriterTest {
def schema = recordSetWriterFactory.getSchema(Collections.emptyMap(), null) def schema = recordSetWriterFactory.getSchema(Collections.emptyMap(), null)
ByteArrayOutputStream outputStream = new ByteArrayOutputStream() ByteArrayOutputStream outputStream = new ByteArrayOutputStream()
RecordSetWriter recordSetWriter = recordSetWriterFactory.createWriter(logger, schema, outputStream) RecordSetWriter recordSetWriter = recordSetWriterFactory.createWriter(logger, schema, outputStream, Collections.emptyMap())
assertNotNull(recordSetWriter) assertNotNull(recordSetWriter)
def recordSchema = new SimpleRecordSchema( def recordSchema = new SimpleRecordSchema(

View File

@ -104,7 +104,7 @@ class GroovyRecordSetWriterFactory extends AbstractControllerService implements
} }
@Override @Override
RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out) throws SchemaNotFoundException, IOException { RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out, Map<String, String> variables) throws SchemaNotFoundException, IOException {
return new GroovyRecordSetWriter(out) return new GroovyRecordSetWriter(out)
} }

View File

@ -285,7 +285,7 @@ public abstract class AbstractSiteToSiteReportingTask extends AbstractReportingT
final RecordSchema writeSchema = writerFactory.getSchema(null, recordSchema); final RecordSchema writeSchema = writerFactory.getSchema(null, recordSchema);
final ByteArrayOutputStream out = new ByteArrayOutputStream(); final ByteArrayOutputStream out = new ByteArrayOutputStream();
try (final RecordSetWriter writer = writerFactory.createWriter(getLogger(), writeSchema, out)) { try (final RecordSetWriter writer = writerFactory.createWriter(getLogger(), writeSchema, out, attributes)) {
writer.beginRecordSet(); writer.beginRecordSet();
Record record; Record record;

View File

@ -376,11 +376,12 @@ public class GetSolr extends SolrProcessor {
final RecordSchema schema = writerFactory.getSchema(null, null); final RecordSchema schema = writerFactory.getSchema(null, null);
final RecordSet recordSet = SolrUtils.solrDocumentsToRecordSet(response.getResults(), schema); final RecordSet recordSet = SolrUtils.solrDocumentsToRecordSet(response.getResults(), schema);
final StringBuffer mimeType = new StringBuffer(); final StringBuffer mimeType = new StringBuffer();
final FlowFile flowFileRef = flowFile;
flowFile = session.write(flowFile, new OutputStreamCallback() { flowFile = session.write(flowFile, new OutputStreamCallback() {
@Override @Override
public void process(final OutputStream out) throws IOException { public void process(final OutputStream out) throws IOException {
try { try {
final RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out); final RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out, flowFileRef);
writer.write(recordSet); writer.write(recordSet);
writer.flush(); writer.flush();
mimeType.append(writer.getMimeType()); mimeType.append(writer.getMimeType());

View File

@ -131,7 +131,7 @@ public abstract class AbstractRecordProcessor extends AbstractProcessor {
Record firstRecord = reader.nextRecord(); Record firstRecord = reader.nextRecord();
if (firstRecord == null) { if (firstRecord == null) {
final RecordSchema writeSchema = writerFactory.getSchema(originalAttributes, reader.getSchema()); final RecordSchema writeSchema = writerFactory.getSchema(originalAttributes, reader.getSchema());
try (final RecordSetWriter writer = writerFactory.createWriter(getLogger(), writeSchema, out)) { try (final RecordSetWriter writer = writerFactory.createWriter(getLogger(), writeSchema, out, originalAttributes)) {
writer.beginRecordSet(); writer.beginRecordSet();
final WriteResult writeResult = writer.finishRecordSet(); final WriteResult writeResult = writer.finishRecordSet();
@ -147,7 +147,7 @@ public abstract class AbstractRecordProcessor extends AbstractProcessor {
firstRecord = AbstractRecordProcessor.this.process(firstRecord, original, context); firstRecord = AbstractRecordProcessor.this.process(firstRecord, original, context);
final RecordSchema writeSchema = writerFactory.getSchema(originalAttributes, firstRecord.getSchema()); final RecordSchema writeSchema = writerFactory.getSchema(originalAttributes, firstRecord.getSchema());
try (final RecordSetWriter writer = writerFactory.createWriter(getLogger(), writeSchema, out)) { try (final RecordSetWriter writer = writerFactory.createWriter(getLogger(), writeSchema, out, originalAttributes)) {
writer.beginRecordSet(); writer.beginRecordSet();
writer.write(firstRecord); writer.write(firstRecord);

View File

@ -219,11 +219,11 @@ public abstract class AbstractRouteRecord<T> extends AbstractProcessor {
Tuple<FlowFile, RecordSetWriter> tuple = writers.get(relationship); Tuple<FlowFile, RecordSetWriter> tuple = writers.get(relationship);
if (tuple == null) { if (tuple == null) {
FlowFile outFlowFile = session.create(original); final FlowFile outFlowFile = session.create(original);
final OutputStream out = session.write(outFlowFile); final OutputStream out = session.write(outFlowFile);
final RecordSchema recordWriteSchema = writerFactory.getSchema(originalAttributes, record.getSchema()); final RecordSchema recordWriteSchema = writerFactory.getSchema(originalAttributes, record.getSchema());
recordSetWriter = writerFactory.createWriter(getLogger(), recordWriteSchema, out); recordSetWriter = writerFactory.createWriter(getLogger(), recordWriteSchema, out, outFlowFile);
recordSetWriter.beginRecordSet(); recordSetWriter.beginRecordSet();
tuple = new Tuple<>(outFlowFile, recordSetWriter); tuple = new Tuple<>(outFlowFile, recordSetWriter);

View File

@ -243,7 +243,7 @@ public class ForkRecord extends AbstractProcessor {
final RecordSchema writeSchema = writerFactory.getSchema(originalAttributes, reader.getSchema()); final RecordSchema writeSchema = writerFactory.getSchema(originalAttributes, reader.getSchema());
final OutputStream out = session.write(outFlowFile); final OutputStream out = session.write(outFlowFile);
try (final RecordSetWriter recordSetWriter = writerFactory.createWriter(getLogger(), writeSchema, out)) { try (final RecordSetWriter recordSetWriter = writerFactory.createWriter(getLogger(), writeSchema, out, outFlowFile)) {
recordSetWriter.beginRecordSet(); recordSetWriter.beginRecordSet();

View File

@ -379,7 +379,7 @@ public class ListenTCPRecord extends AbstractProcessor {
final RecordSchema recordSchema = recordSetWriterFactory.getSchema(Collections.EMPTY_MAP, record.getSchema()); final RecordSchema recordSchema = recordSetWriterFactory.getSchema(Collections.EMPTY_MAP, record.getSchema());
try (final OutputStream out = session.write(flowFile); try (final OutputStream out = session.write(flowFile);
final RecordSetWriter recordWriter = recordSetWriterFactory.createWriter(getLogger(), recordSchema, out)) { final RecordSetWriter recordWriter = recordSetWriterFactory.createWriter(getLogger(), recordSchema, out, flowFile)) {
// start the record set and write the first record from above // start the record set and write the first record from above
recordWriter.beginRecordSet(); recordWriter.beginRecordSet();

View File

@ -274,7 +274,7 @@ public class ListenUDPRecord extends AbstractListenEventProcessor<StandardEvent>
final RecordSchema recordSchema = firstRecord.getSchema(); final RecordSchema recordSchema = firstRecord.getSchema();
final RecordSchema writeSchema = writerFactory.getSchema(Collections.emptyMap(), recordSchema); final RecordSchema writeSchema = writerFactory.getSchema(Collections.emptyMap(), recordSchema);
writer = writerFactory.createWriter(getLogger(), writeSchema, rawOut); writer = writerFactory.createWriter(getLogger(), writeSchema, rawOut, flowFile);
writer.beginRecordSet(); writer.beginRecordSet();
flowFileRecordWriter = new FlowFileRecordWriter(flowFile, writer); flowFileRecordWriter = new FlowFileRecordWriter(flowFile, writer);

View File

@ -230,7 +230,7 @@ public class PartitionRecord extends AbstractProcessor {
final OutputStream out = session.write(childFlowFile); final OutputStream out = session.write(childFlowFile);
writer = writerFactory.createWriter(getLogger(), writeSchema, out); writer = writerFactory.createWriter(getLogger(), writeSchema, out, childFlowFile);
writer.beginRecordSet(); writer.beginRecordSet();
writerMap.put(recordValueMap, writer); writerMap.put(recordValueMap, writer);
} }

View File

@ -336,7 +336,7 @@ public class QueryRecord extends AbstractProcessor {
throw new ProcessException(e); throw new ProcessException(e);
} }
try (final RecordSetWriter resultSetWriter = recordSetWriterFactory.createWriter(getLogger(), writeSchema, out)) { try (final RecordSetWriter resultSetWriter = recordSetWriterFactory.createWriter(getLogger(), writeSchema, out, original)) {
writeResultRef.set(resultSetWriter.write(recordSet)); writeResultRef.set(resultSetWriter.write(recordSet));
mimeTypeRef.set(resultSetWriter.getMimeType()); mimeTypeRef.set(resultSetWriter.getMimeType());
} catch (final Exception e) { } catch (final Exception e) {

View File

@ -169,7 +169,7 @@ public class SplitRecord extends AbstractProcessor {
final WriteResult writeResult; final WriteResult writeResult;
try (final OutputStream out = session.write(split); try (final OutputStream out = session.write(split);
final RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out)) { final RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out, split)) {
if (maxRecords == 1) { if (maxRecords == 1) {
final Record record = pushbackSet.next(); final Record record = pushbackSet.next();
writeResult = writer.write(record); writeResult = writer.write(record);

View File

@ -445,7 +445,7 @@ public class ValidateRecord extends AbstractProcessor {
} }
final OutputStream out = session.write(flowFile); final OutputStream out = session.write(flowFile);
final RecordSetWriter created = factory.createWriter(getLogger(), outputSchema, out); final RecordSetWriter created = factory.createWriter(getLogger(), outputSchema, out, flowFile);
created.beginRecordSet(); created.beginRecordSet();
return created; return created;
} }

View File

@ -132,7 +132,7 @@ public class RecordBin {
this.out = new ByteCountingOutputStream(rawOut); this.out = new ByteCountingOutputStream(rawOut);
recordWriter = writerFactory.createWriter(logger, record.getSchema(), out); recordWriter = writerFactory.createWriter(logger, record.getSchema(), out, flowFile);
recordWriter.beginRecordSet(); recordWriter.beginRecordSet();
} }

View File

@ -36,6 +36,7 @@ import java.io.IOException;
import java.io.OutputStream; import java.io.OutputStream;
import java.sql.ResultSet; import java.sql.ResultSet;
import java.sql.SQLException; import java.sql.SQLException;
import java.util.Collections;
import java.util.HashMap; import java.util.HashMap;
import java.util.Map; import java.util.Map;
import java.util.concurrent.atomic.AtomicReference; import java.util.concurrent.atomic.AtomicReference;
@ -77,7 +78,7 @@ public class RecordSqlWriter implements SqlWriter {
} catch (final SQLException | SchemaNotFoundException | IOException e) { } catch (final SQLException | SchemaNotFoundException | IOException e) {
throw new ProcessException(e); throw new ProcessException(e);
} }
try (final RecordSetWriter resultSetWriter = recordSetWriterFactory.createWriter(logger, writeSchema, outputStream)) { try (final RecordSetWriter resultSetWriter = recordSetWriterFactory.createWriter(logger, writeSchema, outputStream, Collections.emptyMap())) {
writeResultRef.set(resultSetWriter.write(recordSet)); writeResultRef.set(resultSetWriter.write(recordSet));
if (mimeType == null) { if (mimeType == null) {
mimeType = resultSetWriter.getMimeType(); mimeType = resultSetWriter.getMimeType();
@ -115,7 +116,7 @@ public class RecordSqlWriter implements SqlWriter {
@Override @Override
public void writeEmptyResultSet(OutputStream outputStream, ComponentLog logger) throws IOException { public void writeEmptyResultSet(OutputStream outputStream, ComponentLog logger) throws IOException {
try (final RecordSetWriter resultSetWriter = recordSetWriterFactory.createWriter(logger, writeSchema, outputStream)) { try (final RecordSetWriter resultSetWriter = recordSetWriterFactory.createWriter(logger, writeSchema, outputStream, Collections.emptyMap())) {
mimeType = resultSetWriter.getMimeType(); mimeType = resultSetWriter.getMimeType();
resultSetWriter.beginRecordSet(); resultSetWriter.beginRecordSet();
resultSetWriter.finishRecordSet(); resultSetWriter.finishRecordSet();

View File

@ -27,7 +27,12 @@ import java.io.OutputStream;
import java.nio.charset.StandardCharsets; import java.nio.charset.StandardCharsets;
import java.nio.file.Files; import java.nio.file.Files;
import java.nio.file.Paths; import java.nio.file.Paths;
import java.util.HashMap;
import java.util.Map;
import org.apache.nifi.csv.CSVReader;
import org.apache.nifi.csv.CSVRecordSetWriter;
import org.apache.nifi.csv.CSVUtils;
import org.apache.nifi.json.JsonRecordSetWriter; import org.apache.nifi.json.JsonRecordSetWriter;
import org.apache.nifi.json.JsonTreeReader; import org.apache.nifi.json.JsonTreeReader;
import org.apache.nifi.reporting.InitializationException; import org.apache.nifi.reporting.InitializationException;
@ -203,9 +208,9 @@ public class TestConvertRecord {
runner.setProperty(ConvertRecord.RECORD_WRITER, "writer"); runner.setProperty(ConvertRecord.RECORD_WRITER, "writer");
runner.run(); runner.run();
runner.assertAllFlowFilesTransferred(UpdateRecord.REL_SUCCESS, 1); runner.assertAllFlowFilesTransferred(ConvertRecord.REL_SUCCESS, 1);
MockFlowFile flowFile = runner.getFlowFilesForRelationship(ExecuteSQL.REL_SUCCESS).get(0); MockFlowFile flowFile = runner.getFlowFilesForRelationship(ConvertRecord.REL_SUCCESS).get(0);
final ByteArrayOutputStream baos = new ByteArrayOutputStream(); final ByteArrayOutputStream baos = new ByteArrayOutputStream();
try (final SnappyInputStream sis = new SnappyInputStream(new ByteArrayInputStream(flowFile.toByteArray())); final OutputStream out = baos) { try (final SnappyInputStream sis = new SnappyInputStream(new ByteArrayInputStream(flowFile.toByteArray())); final OutputStream out = baos) {
@ -218,4 +223,50 @@ public class TestConvertRecord {
assertEquals(new String(Files.readAllBytes(Paths.get("src/test/resources/TestConvertRecord/input/person.json"))), baos.toString(StandardCharsets.UTF_8.name())); assertEquals(new String(Files.readAllBytes(Paths.get("src/test/resources/TestConvertRecord/input/person.json"))), baos.toString(StandardCharsets.UTF_8.name()));
} }
@Test
public void testCSVFormattingWithEL() throws InitializationException {
TestRunner runner = TestRunners.newTestRunner(ConvertRecord.class);
CSVReader csvReader = new CSVReader();
runner.addControllerService("csv-reader", csvReader);
runner.setProperty(csvReader, CSVUtils.VALUE_SEPARATOR, "${csv.in.delimiter}");
runner.setProperty(csvReader, CSVUtils.QUOTE_CHAR, "${csv.in.quote}");
runner.setProperty(csvReader, CSVUtils.ESCAPE_CHAR, "${csv.in.escape}");
runner.setProperty(csvReader, CSVUtils.COMMENT_MARKER, "${csv.in.comment}");
runner.enableControllerService(csvReader);
CSVRecordSetWriter csvWriter = new CSVRecordSetWriter();
runner.addControllerService("csv-writer", csvWriter);
runner.setProperty(csvWriter, CSVUtils.VALUE_SEPARATOR, "${csv.out.delimiter}");
runner.setProperty(csvWriter, CSVUtils.QUOTE_CHAR, "${csv.out.quote}");
runner.setProperty(csvWriter, CSVUtils.QUOTE_MODE, CSVUtils.QUOTE_ALL);
runner.enableControllerService(csvWriter);
runner.setProperty(ConvertRecord.RECORD_READER, "csv-reader");
runner.setProperty(ConvertRecord.RECORD_WRITER, "csv-writer");
String ffContent = "~ comment\n" +
"id|username|password\n" +
"123|'John'|^|^'^^\n";
Map<String, String> ffAttributes = new HashMap<>();
ffAttributes.put("csv.in.delimiter", "|");
ffAttributes.put("csv.in.quote", "'");
ffAttributes.put("csv.in.escape", "^");
ffAttributes.put("csv.in.comment", "~");
ffAttributes.put("csv.out.delimiter", "\t");
ffAttributes.put("csv.out.quote", "`");
runner.enqueue(ffContent, ffAttributes);
runner.run();
runner.assertAllFlowFilesTransferred(ConvertRecord.REL_SUCCESS, 1);
MockFlowFile flowFile = runner.getFlowFilesForRelationship(ConvertRecord.REL_SUCCESS).get(0);
String expected = "`id`\t`username`\t`password`\n" +
"`123`\t`John`\t`|'^`\n";
assertEquals(expected, new String(flowFile.toByteArray()));
}
} }

View File

@ -824,7 +824,7 @@ public class TestQueryRecord {
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) {
return new RecordSetWriter() { return new RecordSetWriter() {
@Override @Override

View File

@ -19,9 +19,11 @@ package org.apache.nifi.serialization;
import java.io.IOException; import java.io.IOException;
import java.io.OutputStream; import java.io.OutputStream;
import java.util.Collections;
import java.util.Map; import java.util.Map;
import org.apache.nifi.controller.ControllerService; import org.apache.nifi.controller.ControllerService;
import org.apache.nifi.flowfile.FlowFile;
import org.apache.nifi.logging.ComponentLog; import org.apache.nifi.logging.ComponentLog;
import org.apache.nifi.schema.access.SchemaNotFoundException; import org.apache.nifi.schema.access.SchemaNotFoundException;
import org.apache.nifi.serialization.record.RecordSchema; import org.apache.nifi.serialization.record.RecordSchema;
@ -75,6 +77,47 @@ public interface RecordSetWriterFactory extends ControllerService {
* *
* @return a RecordSetWriter that can write record sets to an OutputStream * @return a RecordSetWriter that can write record sets to an OutputStream
* @throws IOException if unable to read from the given InputStream * @throws IOException if unable to read from the given InputStream
*
* @deprecated Use {@link #createWriter(ComponentLog, RecordSchema, OutputStream, FlowFile)} or {@link #createWriter(ComponentLog, RecordSchema, OutputStream, Map)} instead.
*/ */
RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out) throws SchemaNotFoundException, IOException; @Deprecated
default RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out) throws SchemaNotFoundException, IOException {
return createWriter(logger, schema, out, Collections.emptyMap());
}
/**
* <p>
* Creates a new RecordSetWriter that is capable of writing record contents to an OutputStream.
* The method accepts a FlowFile whose attributes can be used to resolve properties specified via Expression Language.
* </p>
*
* @param logger the logger to use when logging information. This is passed in, rather than using the logger of the Controller Service
* because it allows messages to be logged for the component that is calling this Controller Service.
* @param schema the schema that will be used for writing records
* @param out the OutputStream to write to
* @param flowFile the FlowFile whose attributes are used to resolve properties specified via Expression Language
*
* @return a RecordSetWriter that can write record sets to an OutputStream
* @throws IOException if unable to read from the given InputStream
*/
default RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out, FlowFile flowFile) throws SchemaNotFoundException, IOException {
return createWriter(logger, schema, out, flowFile.getAttributes());
}
/**
* <p>
* Creates a new RecordSetWriter that is capable of writing record contents to an OutputStream.
* The method accepts a variables map that can be used to resolve properties specified via Expression Language.
* </p>
*
* @param logger the logger to use when logging information. This is passed in, rather than using the logger of the Controller Service
* because it allows messages to be logged for the component that is calling this Controller Service.
* @param schema the schema that will be used for writing records
* @param out the OutputStream to write to
* @param variables the variables which are used to resolve properties specified via Expression Language
*
* @return a RecordSetWriter that can write record sets to an OutputStream
* @throws IOException if unable to read from the given InputStream
*/
RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out, Map<String, String> variables) throws SchemaNotFoundException, IOException;
} }

View File

@ -49,6 +49,7 @@ import java.util.ArrayList;
import java.util.Collection; import java.util.Collection;
import java.util.EnumSet; import java.util.EnumSet;
import java.util.List; import java.util.List;
import java.util.Map;
import java.util.Optional; import java.util.Optional;
import java.util.Set; import java.util.Set;
import java.util.concurrent.BlockingQueue; import java.util.concurrent.BlockingQueue;
@ -123,7 +124,7 @@ public class AvroRecordSetWriter extends SchemaRegistryRecordSetWriter implement
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema recordSchema, final OutputStream out) throws IOException { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema recordSchema, final OutputStream out, final Map<String, String> variables) throws IOException {
final String strategyValue = getConfigurationContext().getProperty(getSchemaWriteStrategyDescriptor()).getValue(); final String strategyValue = getConfigurationContext().getProperty(getSchemaWriteStrategyDescriptor()).getValue();
final String compressionFormat = getConfigurationContext().getProperty(COMPRESSION_FORMAT).getValue(); final String compressionFormat = getConfigurationContext().getProperty(COMPRESSION_FORMAT).getValue();

View File

@ -54,7 +54,7 @@ public class CSVHeaderSchemaStrategy implements SchemaAccessStrategy {
} }
try { try {
final CSVFormat csvFormat = CSVUtils.createCSVFormat(context).withFirstRecordAsHeader(); final CSVFormat csvFormat = CSVUtils.createCSVFormat(context, variables).withFirstRecordAsHeader();
try (final Reader reader = new InputStreamReader(new BOMInputStream(contentStream)); try (final Reader reader = new InputStreamReader(new BOMInputStream(contentStream));
final CSVParser csvParser = new CSVParser(reader, csvFormat)) { final CSVParser csvParser = new CSVParser(reader, csvFormat)) {

View File

@ -46,6 +46,7 @@ import org.apache.nifi.stream.io.NonCloseableInputStream;
import java.io.IOException; import java.io.IOException;
import java.io.InputStream; import java.io.InputStream;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Collections;
import java.util.List; import java.util.List;
import java.util.Map; import java.util.Map;
@ -55,7 +56,7 @@ import java.util.Map;
+ "the values. See Controller Service's Usage for further documentation.") + "the values. See Controller Service's Usage for further documentation.")
public class CSVReader extends SchemaRegistryService implements RecordReaderFactory { public class CSVReader extends SchemaRegistryService implements RecordReaderFactory {
private final AllowableValue headerDerivedAllowableValue = new AllowableValue("csv-header-derived", "Use String Fields From Header", private static final AllowableValue HEADER_DERIVED = new AllowableValue("csv-header-derived", "Use String Fields From Header",
"The first non-comment line of the CSV file is a header line that contains the names of the columns. The schema will be derived by using the " "The first non-comment line of the CSV file is a header line that contains the names of the columns. The schema will be derived by using the "
+ "column names in the header and assuming that all columns are of type String."); + "column names in the header and assuming that all columns are of type String.");
@ -78,8 +79,9 @@ public class CSVReader extends SchemaRegistryService implements RecordReaderFact
.required(true) .required(true)
.build(); .build();
private volatile ConfigurationContext context;
private volatile String csvParser; private volatile String csvParser;
private volatile CSVFormat csvFormat;
private volatile String dateFormat; private volatile String dateFormat;
private volatile String timeFormat; private volatile String timeFormat;
private volatile String timestampFormat; private volatile String timestampFormat;
@ -87,6 +89,9 @@ public class CSVReader extends SchemaRegistryService implements RecordReaderFact
private volatile boolean ignoreHeader; private volatile boolean ignoreHeader;
private volatile String charSet; private volatile String charSet;
// it will be initialized only if there are no dynamic csv formatting properties
private volatile CSVFormat csvFormat;
@Override @Override
protected List<PropertyDescriptor> getSupportedPropertyDescriptors() { protected List<PropertyDescriptor> getSupportedPropertyDescriptors() {
final List<PropertyDescriptor> properties = new ArrayList<>(super.getSupportedPropertyDescriptors()); final List<PropertyDescriptor> properties = new ArrayList<>(super.getSupportedPropertyDescriptors());
@ -108,9 +113,10 @@ public class CSVReader extends SchemaRegistryService implements RecordReaderFact
} }
@OnEnabled @OnEnabled
public void storeCsvFormat(final ConfigurationContext context) { public void storeStaticProperties(final ConfigurationContext context) {
this.context = context;
this.csvParser = context.getProperty(CSV_PARSER).getValue(); this.csvParser = context.getProperty(CSV_PARSER).getValue();
this.csvFormat = CSVUtils.createCSVFormat(context);
this.dateFormat = context.getProperty(DateTimeUtils.DATE_FORMAT).getValue(); this.dateFormat = context.getProperty(DateTimeUtils.DATE_FORMAT).getValue();
this.timeFormat = context.getProperty(DateTimeUtils.TIME_FORMAT).getValue(); this.timeFormat = context.getProperty(DateTimeUtils.TIME_FORMAT).getValue();
this.timestampFormat = context.getProperty(DateTimeUtils.TIMESTAMP_FORMAT).getValue(); this.timestampFormat = context.getProperty(DateTimeUtils.TIMESTAMP_FORMAT).getValue();
@ -121,10 +127,15 @@ public class CSVReader extends SchemaRegistryService implements RecordReaderFact
// Ensure that if we are deriving schema from header that we always treat the first line as a header, // Ensure that if we are deriving schema from header that we always treat the first line as a header,
// regardless of the 'First Line is Header' property // regardless of the 'First Line is Header' property
final String accessStrategy = context.getProperty(SchemaAccessUtils.SCHEMA_ACCESS_STRATEGY).getValue(); final String accessStrategy = context.getProperty(SchemaAccessUtils.SCHEMA_ACCESS_STRATEGY).getValue();
if (headerDerivedAllowableValue.getValue().equals(accessStrategy) || SchemaInferenceUtil.INFER_SCHEMA.getValue().equals(accessStrategy)) { if (HEADER_DERIVED.getValue().equals(accessStrategy) || SchemaInferenceUtil.INFER_SCHEMA.getValue().equals(accessStrategy)) {
this.csvFormat = this.csvFormat.withFirstRecordAsHeader();
this.firstLineIsHeader = true; this.firstLineIsHeader = true;
} }
if (!CSVUtils.isDynamicCSVFormat(context)) {
this.csvFormat = CSVUtils.createCSVFormat(context, Collections.emptyMap());
} else {
this.csvFormat = null;
}
} }
@Override @Override
@ -134,6 +145,13 @@ public class CSVReader extends SchemaRegistryService implements RecordReaderFact
final RecordSchema schema = getSchema(variables, new NonCloseableInputStream(in), null); final RecordSchema schema = getSchema(variables, new NonCloseableInputStream(in), null);
in.reset(); in.reset();
CSVFormat csvFormat;
if (this.csvFormat != null) {
csvFormat = this.csvFormat;
} else {
csvFormat = CSVUtils.createCSVFormat(context, variables);
}
if(APACHE_COMMONS_CSV.getValue().equals(csvParser)) { if(APACHE_COMMONS_CSV.getValue().equals(csvParser)) {
return new CSVRecordReader(in, logger, schema, csvFormat, firstLineIsHeader, ignoreHeader, dateFormat, timeFormat, timestampFormat, charSet); return new CSVRecordReader(in, logger, schema, csvFormat, firstLineIsHeader, ignoreHeader, dateFormat, timeFormat, timestampFormat, charSet);
} else if(JACKSON_CSV.getValue().equals(csvParser)) { } else if(JACKSON_CSV.getValue().equals(csvParser)) {
@ -145,10 +163,10 @@ public class CSVReader extends SchemaRegistryService implements RecordReaderFact
@Override @Override
protected SchemaAccessStrategy getSchemaAccessStrategy(final String allowableValue, final SchemaRegistry schemaRegistry, final PropertyContext context) { protected SchemaAccessStrategy getSchemaAccessStrategy(final String allowableValue, final SchemaRegistry schemaRegistry, final PropertyContext context) {
if (allowableValue.equalsIgnoreCase(headerDerivedAllowableValue.getValue())) { if (allowableValue.equalsIgnoreCase(HEADER_DERIVED.getValue())) {
return new CSVHeaderSchemaStrategy(context); return new CSVHeaderSchemaStrategy(context);
} else if (allowableValue.equalsIgnoreCase(SchemaInferenceUtil.INFER_SCHEMA.getValue())) { } else if (allowableValue.equalsIgnoreCase(SchemaInferenceUtil.INFER_SCHEMA.getValue())) {
final RecordSourceFactory<CSVRecordAndFieldNames> sourceFactory = (var, in) -> new CSVRecordSource(in, context); final RecordSourceFactory<CSVRecordAndFieldNames> sourceFactory = (variables, in) -> new CSVRecordSource(in, context, variables);
final SchemaInferenceEngine<CSVRecordAndFieldNames> inference = new CSVSchemaInference(new TimeValueInference(dateFormat, timeFormat, timestampFormat)); final SchemaInferenceEngine<CSVRecordAndFieldNames> inference = new CSVSchemaInference(new TimeValueInference(dateFormat, timeFormat, timestampFormat));
return new InferSchemaAccessStrategy<>(sourceFactory, inference, getLogger()); return new InferSchemaAccessStrategy<>(sourceFactory, inference, getLogger());
} }
@ -159,7 +177,7 @@ public class CSVReader extends SchemaRegistryService implements RecordReaderFact
@Override @Override
protected List<AllowableValue> getSchemaAccessStrategyValues() { protected List<AllowableValue> getSchemaAccessStrategyValues() {
final List<AllowableValue> allowableValues = new ArrayList<>(super.getSchemaAccessStrategyValues()); final List<AllowableValue> allowableValues = new ArrayList<>(super.getSchemaAccessStrategyValues());
allowableValues.add(headerDerivedAllowableValue); allowableValues.add(HEADER_DERIVED);
allowableValues.add(SchemaInferenceUtil.INFER_SCHEMA); allowableValues.add(SchemaInferenceUtil.INFER_SCHEMA);
return allowableValues; return allowableValues;
} }

View File

@ -20,7 +20,9 @@ package org.apache.nifi.csv;
import java.io.IOException; import java.io.IOException;
import java.io.OutputStream; import java.io.OutputStream;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Collections;
import java.util.List; import java.util.List;
import java.util.Map;
import org.apache.commons.csv.CSVFormat; import org.apache.commons.csv.CSVFormat;
import org.apache.nifi.annotation.documentation.CapabilityDescription; import org.apache.nifi.annotation.documentation.CapabilityDescription;
@ -41,10 +43,14 @@ import org.apache.nifi.serialization.record.RecordSchema;
+ "corresponding to the record fields.") + "corresponding to the record fields.")
public class CSVRecordSetWriter extends DateTimeTextRecordSetWriter implements RecordSetWriterFactory { public class CSVRecordSetWriter extends DateTimeTextRecordSetWriter implements RecordSetWriterFactory {
private volatile CSVFormat csvFormat; private volatile ConfigurationContext context;
private volatile boolean includeHeader; private volatile boolean includeHeader;
private volatile String charSet; private volatile String charSet;
// it will be initialized only if there are no dynamic csv formatting properties
private volatile CSVFormat csvFormat;
@Override @Override
protected List<PropertyDescriptor> getSupportedPropertyDescriptors() { protected List<PropertyDescriptor> getSupportedPropertyDescriptors() {
final List<PropertyDescriptor> properties = new ArrayList<>(super.getSupportedPropertyDescriptors()); final List<PropertyDescriptor> properties = new ArrayList<>(super.getSupportedPropertyDescriptors());
@ -64,14 +70,28 @@ public class CSVRecordSetWriter extends DateTimeTextRecordSetWriter implements R
} }
@OnEnabled @OnEnabled
public void storeCsvFormat(final ConfigurationContext context) { public void storeStaticProperties(final ConfigurationContext context) {
this.csvFormat = CSVUtils.createCSVFormat(context); this.context = context;
this.includeHeader = context.getProperty(CSVUtils.INCLUDE_HEADER_LINE).asBoolean(); this.includeHeader = context.getProperty(CSVUtils.INCLUDE_HEADER_LINE).asBoolean();
this.charSet = context.getProperty(CSVUtils.CHARSET).getValue(); this.charSet = context.getProperty(CSVUtils.CHARSET).getValue();
if (!CSVUtils.isDynamicCSVFormat(context)) {
this.csvFormat = CSVUtils.createCSVFormat(context, Collections.emptyMap());
} else {
this.csvFormat = null;
}
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) throws SchemaNotFoundException, IOException { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) throws SchemaNotFoundException, IOException {
CSVFormat csvFormat;
if (this.csvFormat != null) {
csvFormat = this.csvFormat;
} else {
csvFormat = CSVUtils.createCSVFormat(context, variables);
}
return new WriteCSVResult(csvFormat, schema, getSchemaAccessWriter(schema), out, return new WriteCSVResult(csvFormat, schema, getSchemaAccessWriter(schema), out,
getDateFormat().orElse(null), getTimeFormat().orElse(null), getTimestampFormat().orElse(null), includeHeader, charSet); getDateFormat().orElse(null), getTimeFormat().orElse(null), getTimestampFormat().orElse(null), includeHeader, charSet);
} }

View File

@ -33,12 +33,13 @@ import java.util.ArrayList;
import java.util.Collections; import java.util.Collections;
import java.util.Iterator; import java.util.Iterator;
import java.util.List; import java.util.List;
import java.util.Map;
public class CSVRecordSource implements RecordSource<CSVRecordAndFieldNames> { public class CSVRecordSource implements RecordSource<CSVRecordAndFieldNames> {
private final Iterator<CSVRecord> csvRecordIterator; private final Iterator<CSVRecord> csvRecordIterator;
private final List<String> fieldNames; private final List<String> fieldNames;
public CSVRecordSource(final InputStream in, final PropertyContext context) throws IOException { public CSVRecordSource(final InputStream in, final PropertyContext context, final Map<String, String> variables) throws IOException {
final String charset = context.getProperty(CSVUtils.CHARSET).getValue(); final String charset = context.getProperty(CSVUtils.CHARSET).getValue();
final Reader reader; final Reader reader;
@ -48,7 +49,7 @@ public class CSVRecordSource implements RecordSource<CSVRecordAndFieldNames> {
throw new ProcessException(e); throw new ProcessException(e);
} }
final CSVFormat csvFormat = CSVUtils.createCSVFormat(context).withFirstRecordAsHeader().withTrim(); final CSVFormat csvFormat = CSVUtils.createCSVFormat(context, variables).withFirstRecordAsHeader().withTrim();
final CSVParser csvParser = new CSVParser(reader, csvFormat); final CSVParser csvParser = new CSVParser(reader, csvFormat);
fieldNames = Collections.unmodifiableList(new ArrayList<>(csvParser.getHeaderMap().keySet())); fieldNames = Collections.unmodifiableList(new ArrayList<>(csvParser.getHeaderMap().keySet()));

View File

@ -23,6 +23,7 @@ import java.io.OutputStream;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Collection; import java.util.Collection;
import java.util.List; import java.util.List;
import java.util.Map;
import org.apache.commons.compress.compressors.CompressorException; import org.apache.commons.compress.compressors.CompressorException;
import org.apache.commons.compress.compressors.CompressorStreamFactory; import org.apache.commons.compress.compressors.CompressorStreamFactory;
@ -173,7 +174,7 @@ public class JsonRecordSetWriter extends DateTimeTextRecordSetWriter implements
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) throws SchemaNotFoundException, IOException { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) throws SchemaNotFoundException, IOException {
final OutputStream bufferedOut = new BufferedOutputStream(out, 65536); final OutputStream bufferedOut = new BufferedOutputStream(out, 65536);
final OutputStream compressionOut; final OutputStream compressionOut;

View File

@ -39,6 +39,7 @@ import java.io.OutputStream;
import java.nio.charset.Charset; import java.nio.charset.Charset;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.List; import java.util.List;
import java.util.Map;
@Tags({"text", "freeform", "expression", "language", "el", "record", "recordset", "resultset", "writer", "serialize"}) @Tags({"text", "freeform", "expression", "language", "el", "record", "recordset", "resultset", "writer", "serialize"})
@CapabilityDescription("Writes the contents of a RecordSet as free-form text. The configured " @CapabilityDescription("Writes the contents of a RecordSet as free-form text. The configured "
@ -79,7 +80,7 @@ public class FreeFormTextRecordSetWriter extends SchemaRegistryRecordSetWriter i
} }
@Override @Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) { public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) {
return new FreeFormTextWriter(textValue, characterSet, out); return new FreeFormTextWriter(textValue, characterSet, out);
} }

View File

@ -1,209 +1,210 @@
/* /*
* Licensed to the Apache Software Foundation (ASF) under one or more * Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with * contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership. * this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0 * The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with * (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at * the License. You may obtain a copy of the License at
* *
* http://www.apache.org/licenses/LICENSE-2.0 * http://www.apache.org/licenses/LICENSE-2.0
* *
* Unless required by applicable law or agreed to in writing, software * Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, * distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and * See the License for the specific language governing permissions and
* limitations under the License. * limitations under the License.
*/ */
package org.apache.nifi.xml; package org.apache.nifi.xml;
import org.apache.nifi.record.NullSuppression; import org.apache.nifi.record.NullSuppression;
import org.apache.nifi.annotation.documentation.CapabilityDescription; import org.apache.nifi.annotation.documentation.CapabilityDescription;
import org.apache.nifi.annotation.documentation.Tags; import org.apache.nifi.annotation.documentation.Tags;
import org.apache.nifi.components.AllowableValue; import org.apache.nifi.components.AllowableValue;
import org.apache.nifi.components.PropertyDescriptor; import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.components.ValidationContext; import org.apache.nifi.components.ValidationContext;
import org.apache.nifi.components.ValidationResult; import org.apache.nifi.components.ValidationResult;
import org.apache.nifi.expression.ExpressionLanguageScope; import org.apache.nifi.expression.ExpressionLanguageScope;
import org.apache.nifi.logging.ComponentLog; import org.apache.nifi.logging.ComponentLog;
import org.apache.nifi.processor.util.StandardValidators; import org.apache.nifi.processor.util.StandardValidators;
import org.apache.nifi.schema.access.SchemaNotFoundException; import org.apache.nifi.schema.access.SchemaNotFoundException;
import org.apache.nifi.serialization.DateTimeTextRecordSetWriter; import org.apache.nifi.serialization.DateTimeTextRecordSetWriter;
import org.apache.nifi.serialization.RecordSetWriter; import org.apache.nifi.serialization.RecordSetWriter;
import org.apache.nifi.serialization.RecordSetWriterFactory; import org.apache.nifi.serialization.RecordSetWriterFactory;
import org.apache.nifi.serialization.record.RecordSchema; import org.apache.nifi.serialization.record.RecordSchema;
import java.io.IOException; import java.io.IOException;
import java.io.OutputStream; import java.io.OutputStream;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Collection; import java.util.Collection;
import java.util.Collections; import java.util.Collections;
import java.util.List; import java.util.List;
import java.util.Map;
@Tags({"xml", "resultset", "writer", "serialize", "record", "recordset", "row"})
@CapabilityDescription("Writes a RecordSet to XML. The records are wrapped by a root tag.") @Tags({"xml", "resultset", "writer", "serialize", "record", "recordset", "row"})
public class XMLRecordSetWriter extends DateTimeTextRecordSetWriter implements RecordSetWriterFactory { @CapabilityDescription("Writes a RecordSet to XML. The records are wrapped by a root tag.")
public class XMLRecordSetWriter extends DateTimeTextRecordSetWriter implements RecordSetWriterFactory {
public static final AllowableValue ALWAYS_SUPPRESS = new AllowableValue("always-suppress", "Always Suppress",
"Fields that are missing (present in the schema but not in the record), or that have a value of null, will not be written out"); public static final AllowableValue ALWAYS_SUPPRESS = new AllowableValue("always-suppress", "Always Suppress",
public static final AllowableValue NEVER_SUPPRESS = new AllowableValue("never-suppress", "Never Suppress", "Fields that are missing (present in the schema but not in the record), or that have a value of null, will not be written out");
"Fields that are missing (present in the schema but not in the record), or that have a value of null, will be written out as a null value"); public static final AllowableValue NEVER_SUPPRESS = new AllowableValue("never-suppress", "Never Suppress",
public static final AllowableValue SUPPRESS_MISSING = new AllowableValue("suppress-missing", "Suppress Missing Values", "Fields that are missing (present in the schema but not in the record), or that have a value of null, will be written out as a null value");
"When a field has a value of null, it will be written out. However, if a field is defined in the schema and not present in the record, the field will not be written out."); public static final AllowableValue SUPPRESS_MISSING = new AllowableValue("suppress-missing", "Suppress Missing Values",
"When a field has a value of null, it will be written out. However, if a field is defined in the schema and not present in the record, the field will not be written out.");
public static final AllowableValue USE_PROPERTY_AS_WRAPPER = new AllowableValue("use-property-as-wrapper", "Use Property as Wrapper",
"The value of the property \"Array Tag Name\" will be used as the tag name to wrap elements of an array. The field name of the array field will be used for the tag name " + public static final AllowableValue USE_PROPERTY_AS_WRAPPER = new AllowableValue("use-property-as-wrapper", "Use Property as Wrapper",
"of the elements."); "The value of the property \"Array Tag Name\" will be used as the tag name to wrap elements of an array. The field name of the array field will be used for the tag name " +
public static final AllowableValue USE_PROPERTY_FOR_ELEMENTS = new AllowableValue("use-property-for-elements", "Use Property for Elements", "of the elements.");
"The value of the property \"Array Tag Name\" will be used for the tag name of the elements of an array. The field name of the array field will be used as the tag name " + public static final AllowableValue USE_PROPERTY_FOR_ELEMENTS = new AllowableValue("use-property-for-elements", "Use Property for Elements",
"to wrap elements."); "The value of the property \"Array Tag Name\" will be used for the tag name of the elements of an array. The field name of the array field will be used as the tag name " +
public static final AllowableValue NO_WRAPPING = new AllowableValue("no-wrapping", "No Wrapping", "to wrap elements.");
"The elements of an array will not be wrapped"); public static final AllowableValue NO_WRAPPING = new AllowableValue("no-wrapping", "No Wrapping",
"The elements of an array will not be wrapped");
public static final PropertyDescriptor SUPPRESS_NULLS = new PropertyDescriptor.Builder()
.name("suppress_nulls") public static final PropertyDescriptor SUPPRESS_NULLS = new PropertyDescriptor.Builder()
.displayName("Suppress Null Values") .name("suppress_nulls")
.description("Specifies how the writer should handle a null field") .displayName("Suppress Null Values")
.allowableValues(NEVER_SUPPRESS, ALWAYS_SUPPRESS, SUPPRESS_MISSING) .description("Specifies how the writer should handle a null field")
.defaultValue(NEVER_SUPPRESS.getValue()) .allowableValues(NEVER_SUPPRESS, ALWAYS_SUPPRESS, SUPPRESS_MISSING)
.required(true) .defaultValue(NEVER_SUPPRESS.getValue())
.build(); .required(true)
.build();
public static final PropertyDescriptor PRETTY_PRINT_XML = new PropertyDescriptor.Builder()
.name("pretty_print_xml") public static final PropertyDescriptor PRETTY_PRINT_XML = new PropertyDescriptor.Builder()
.displayName("Pretty Print XML") .name("pretty_print_xml")
.description("Specifies whether or not the XML should be pretty printed") .displayName("Pretty Print XML")
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .description("Specifies whether or not the XML should be pretty printed")
.allowableValues("true", "false") .expressionLanguageSupported(ExpressionLanguageScope.NONE)
.defaultValue("false") .allowableValues("true", "false")
.required(true) .defaultValue("false")
.build(); .required(true)
.build();
public static final PropertyDescriptor ROOT_TAG_NAME = new PropertyDescriptor.Builder()
.name("root_tag_name") public static final PropertyDescriptor ROOT_TAG_NAME = new PropertyDescriptor.Builder()
.displayName("Name of Root Tag") .name("root_tag_name")
.description("Specifies the name of the XML root tag wrapping the record set. This property has to be defined if " + .displayName("Name of Root Tag")
"the writer is supposed to write multiple records in a single FlowFile.") .description("Specifies the name of the XML root tag wrapping the record set. This property has to be defined if " +
.addValidator(StandardValidators.NON_EMPTY_VALIDATOR) "the writer is supposed to write multiple records in a single FlowFile.")
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .addValidator(StandardValidators.NON_EMPTY_VALIDATOR)
.required(false) .expressionLanguageSupported(ExpressionLanguageScope.NONE)
.build(); .required(false)
.build();
public static final PropertyDescriptor RECORD_TAG_NAME = new PropertyDescriptor.Builder()
.name("record_tag_name") public static final PropertyDescriptor RECORD_TAG_NAME = new PropertyDescriptor.Builder()
.displayName("Name of Record Tag") .name("record_tag_name")
.description("Specifies the name of the XML record tag wrapping the record fields. If this is not set, the writer " + .displayName("Name of Record Tag")
"will use the record name in the schema.") .description("Specifies the name of the XML record tag wrapping the record fields. If this is not set, the writer " +
.addValidator(StandardValidators.NON_EMPTY_VALIDATOR) "will use the record name in the schema.")
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .addValidator(StandardValidators.NON_EMPTY_VALIDATOR)
.required(false) .expressionLanguageSupported(ExpressionLanguageScope.NONE)
.build(); .required(false)
.build();
public static final PropertyDescriptor ARRAY_WRAPPING = new PropertyDescriptor.Builder()
.name("array_wrapping") public static final PropertyDescriptor ARRAY_WRAPPING = new PropertyDescriptor.Builder()
.displayName("Wrap Elements of Arrays") .name("array_wrapping")
.description("Specifies how the writer wraps elements of fields of type array") .displayName("Wrap Elements of Arrays")
.allowableValues(USE_PROPERTY_AS_WRAPPER, USE_PROPERTY_FOR_ELEMENTS, NO_WRAPPING) .description("Specifies how the writer wraps elements of fields of type array")
.defaultValue(NO_WRAPPING.getValue()) .allowableValues(USE_PROPERTY_AS_WRAPPER, USE_PROPERTY_FOR_ELEMENTS, NO_WRAPPING)
.required(true) .defaultValue(NO_WRAPPING.getValue())
.build(); .required(true)
.build();
public static final PropertyDescriptor ARRAY_TAG_NAME = new PropertyDescriptor.Builder()
.name("array_tag_name") public static final PropertyDescriptor ARRAY_TAG_NAME = new PropertyDescriptor.Builder()
.displayName("Array Tag Name") .name("array_tag_name")
.description("Name of the tag used by property \"Wrap Elements of Arrays\" to write arrays") .displayName("Array Tag Name")
.addValidator(StandardValidators.NON_EMPTY_VALIDATOR) .description("Name of the tag used by property \"Wrap Elements of Arrays\" to write arrays")
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .addValidator(StandardValidators.NON_EMPTY_VALIDATOR)
.required(false) .expressionLanguageSupported(ExpressionLanguageScope.NONE)
.build(); .required(false)
.build();
public static final PropertyDescriptor CHARACTER_SET = new PropertyDescriptor.Builder()
.name("Character Set") public static final PropertyDescriptor CHARACTER_SET = new PropertyDescriptor.Builder()
.description("The Character set to use when writing the data to the FlowFile") .name("Character Set")
.addValidator(StandardValidators.CHARACTER_SET_VALIDATOR) .description("The Character set to use when writing the data to the FlowFile")
.defaultValue("UTF-8") .addValidator(StandardValidators.CHARACTER_SET_VALIDATOR)
.expressionLanguageSupported(ExpressionLanguageScope.NONE) .defaultValue("UTF-8")
.required(true) .expressionLanguageSupported(ExpressionLanguageScope.NONE)
.build(); .required(true)
.build();
@Override
protected List<PropertyDescriptor> getSupportedPropertyDescriptors() { @Override
final List<PropertyDescriptor> properties = new ArrayList<>(super.getSupportedPropertyDescriptors()); protected List<PropertyDescriptor> getSupportedPropertyDescriptors() {
properties.add(SUPPRESS_NULLS); final List<PropertyDescriptor> properties = new ArrayList<>(super.getSupportedPropertyDescriptors());
properties.add(PRETTY_PRINT_XML); properties.add(SUPPRESS_NULLS);
properties.add(ROOT_TAG_NAME); properties.add(PRETTY_PRINT_XML);
properties.add(RECORD_TAG_NAME); properties.add(ROOT_TAG_NAME);
properties.add(ARRAY_WRAPPING); properties.add(RECORD_TAG_NAME);
properties.add(ARRAY_TAG_NAME); properties.add(ARRAY_WRAPPING);
properties.add(CHARACTER_SET); properties.add(ARRAY_TAG_NAME);
return properties; properties.add(CHARACTER_SET);
} return properties;
}
@Override
protected Collection<ValidationResult> customValidate(final ValidationContext validationContext) { @Override
if (!validationContext.getProperty(ARRAY_WRAPPING).getValue().equals(NO_WRAPPING.getValue())) { protected Collection<ValidationResult> customValidate(final ValidationContext validationContext) {
if (!validationContext.getProperty(ARRAY_TAG_NAME).isSet()) { if (!validationContext.getProperty(ARRAY_WRAPPING).getValue().equals(NO_WRAPPING.getValue())) {
StringBuilder explanation = new StringBuilder() if (!validationContext.getProperty(ARRAY_TAG_NAME).isSet()) {
.append("if property \'") StringBuilder explanation = new StringBuilder()
.append(ARRAY_WRAPPING.getName()) .append("if property \'")
.append("\' is defined as \'") .append(ARRAY_WRAPPING.getName())
.append(USE_PROPERTY_AS_WRAPPER.getDisplayName()) .append("\' is defined as \'")
.append("\' or \'") .append(USE_PROPERTY_AS_WRAPPER.getDisplayName())
.append(USE_PROPERTY_FOR_ELEMENTS.getDisplayName()) .append("\' or \'")
.append("\' the property \'") .append(USE_PROPERTY_FOR_ELEMENTS.getDisplayName())
.append(ARRAY_TAG_NAME.getDisplayName()) .append("\' the property \'")
.append("\' has to be set."); .append(ARRAY_TAG_NAME.getDisplayName())
.append("\' has to be set.");
return Collections.singleton(new ValidationResult.Builder()
.subject(ARRAY_TAG_NAME.getName()) return Collections.singleton(new ValidationResult.Builder()
.valid(false) .subject(ARRAY_TAG_NAME.getName())
.explanation(explanation.toString()) .valid(false)
.build()); .explanation(explanation.toString())
} .build());
} }
return Collections.emptyList(); }
} return Collections.emptyList();
}
@Override
public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out) throws SchemaNotFoundException, IOException { @Override
final String nullSuppression = getConfigurationContext().getProperty(SUPPRESS_NULLS).getValue(); public RecordSetWriter createWriter(final ComponentLog logger, final RecordSchema schema, final OutputStream out, final Map<String, String> variables) throws SchemaNotFoundException, IOException {
final NullSuppression nullSuppressionEnum; final String nullSuppression = getConfigurationContext().getProperty(SUPPRESS_NULLS).getValue();
if (nullSuppression.equals(ALWAYS_SUPPRESS.getValue())) { final NullSuppression nullSuppressionEnum;
nullSuppressionEnum = NullSuppression.ALWAYS_SUPPRESS; if (nullSuppression.equals(ALWAYS_SUPPRESS.getValue())) {
} else if (nullSuppression.equals(NEVER_SUPPRESS.getValue())) { nullSuppressionEnum = NullSuppression.ALWAYS_SUPPRESS;
nullSuppressionEnum = NullSuppression.NEVER_SUPPRESS; } else if (nullSuppression.equals(NEVER_SUPPRESS.getValue())) {
} else { nullSuppressionEnum = NullSuppression.NEVER_SUPPRESS;
nullSuppressionEnum = NullSuppression.SUPPRESS_MISSING; } else {
} nullSuppressionEnum = NullSuppression.SUPPRESS_MISSING;
}
final boolean prettyPrint = getConfigurationContext().getProperty(PRETTY_PRINT_XML).getValue().equals("true");
final boolean prettyPrint = getConfigurationContext().getProperty(PRETTY_PRINT_XML).getValue().equals("true");
final String rootTagName = getConfigurationContext().getProperty(ROOT_TAG_NAME).isSet()
? getConfigurationContext().getProperty(ROOT_TAG_NAME).getValue() : null; final String rootTagName = getConfigurationContext().getProperty(ROOT_TAG_NAME).isSet()
final String recordTagName = getConfigurationContext().getProperty(RECORD_TAG_NAME).isSet() ? getConfigurationContext().getProperty(ROOT_TAG_NAME).getValue() : null;
? getConfigurationContext().getProperty(RECORD_TAG_NAME).getValue() : null; final String recordTagName = getConfigurationContext().getProperty(RECORD_TAG_NAME).isSet()
? getConfigurationContext().getProperty(RECORD_TAG_NAME).getValue() : null;
final String arrayWrapping = getConfigurationContext().getProperty(ARRAY_WRAPPING).getValue();
final ArrayWrapping arrayWrappingEnum; final String arrayWrapping = getConfigurationContext().getProperty(ARRAY_WRAPPING).getValue();
if (arrayWrapping.equals(NO_WRAPPING.getValue())) { final ArrayWrapping arrayWrappingEnum;
arrayWrappingEnum = ArrayWrapping.NO_WRAPPING; if (arrayWrapping.equals(NO_WRAPPING.getValue())) {
} else if (arrayWrapping.equals(USE_PROPERTY_AS_WRAPPER.getValue())) { arrayWrappingEnum = ArrayWrapping.NO_WRAPPING;
arrayWrappingEnum = ArrayWrapping.USE_PROPERTY_AS_WRAPPER; } else if (arrayWrapping.equals(USE_PROPERTY_AS_WRAPPER.getValue())) {
} else { arrayWrappingEnum = ArrayWrapping.USE_PROPERTY_AS_WRAPPER;
arrayWrappingEnum = ArrayWrapping.USE_PROPERTY_FOR_ELEMENTS; } else {
} arrayWrappingEnum = ArrayWrapping.USE_PROPERTY_FOR_ELEMENTS;
}
final String arrayTagName;
if (getConfigurationContext().getProperty(ARRAY_TAG_NAME).isSet()) { final String arrayTagName;
arrayTagName = getConfigurationContext().getProperty(ARRAY_TAG_NAME).getValue(); if (getConfigurationContext().getProperty(ARRAY_TAG_NAME).isSet()) {
} else { arrayTagName = getConfigurationContext().getProperty(ARRAY_TAG_NAME).getValue();
arrayTagName = null; } else {
} arrayTagName = null;
}
final String charSet = getConfigurationContext().getProperty(CHARACTER_SET).getValue();
final String charSet = getConfigurationContext().getProperty(CHARACTER_SET).getValue();
return new WriteXMLResult(schema, getSchemaAccessWriter(schema),
out, prettyPrint, nullSuppressionEnum, arrayWrappingEnum, arrayTagName, rootTagName, recordTagName, charSet, return new WriteXMLResult(schema, getSchemaAccessWriter(schema),
getDateFormat().orElse(null), getTimeFormat().orElse(null), getTimestampFormat().orElse(null)); out, prettyPrint, nullSuppressionEnum, arrayWrappingEnum, arrayTagName, rootTagName, recordTagName, charSet,
} getDateFormat().orElse(null), getTimeFormat().orElse(null), getTimestampFormat().orElse(null));
} }
}

View File

@ -40,7 +40,7 @@ public class TestCSVHeaderSchemaStrategy {
@Test @Test
public void testSimple() throws SchemaNotFoundException, IOException { public void testSimple() throws SchemaNotFoundException, IOException {
final String headerLine = "a, b, c, d, e\\,z, f"; final String headerLine = "\"a\", b, c, d, e\\,z, f";
final byte[] headerBytes = headerLine.getBytes(); final byte[] headerBytes = headerLine.getBytes();
final Map<PropertyDescriptor, String> properties = new HashMap<>(); final Map<PropertyDescriptor, String> properties = new HashMap<>();
@ -66,4 +66,37 @@ public class TestCSVHeaderSchemaStrategy {
.allMatch(field -> field.getDataType().equals(RecordFieldType.STRING.getDataType()))); .allMatch(field -> field.getDataType().equals(RecordFieldType.STRING.getDataType())));
} }
@Test
public void testWithEL() throws SchemaNotFoundException, IOException {
final String headerLine = "\'a\'; b; c; d; e^;z; f";
final byte[] headerBytes = headerLine.getBytes();
final Map<PropertyDescriptor, String> properties = new HashMap<>();
properties.put(CSVUtils.CSV_FORMAT, CSVUtils.CUSTOM.getValue());
properties.put(CSVUtils.COMMENT_MARKER, "#");
properties.put(CSVUtils.VALUE_SEPARATOR, "${csv.delimiter}");
properties.put(CSVUtils.TRIM_FIELDS, "true");
properties.put(CSVUtils.QUOTE_CHAR, "${csv.quote}");
properties.put(CSVUtils.ESCAPE_CHAR, "${csv.escape}");
final Map<String, String> variables = new HashMap<>();
variables.put("csv.delimiter", ";");
variables.put("csv.quote", "'");
variables.put("csv.escape", "^");
final ConfigurationContext context = new MockConfigurationContext(properties, null);
final CSVHeaderSchemaStrategy strategy = new CSVHeaderSchemaStrategy(context);
final RecordSchema schema;
try (final InputStream bais = new ByteArrayInputStream(headerBytes)) {
schema = strategy.getSchema(variables, bais, null);
}
final List<String> expectedFieldNames = Arrays.asList("a", "b", "c", "d", "e;z", "f");
assertEquals(expectedFieldNames, schema.getFieldNames());
assertTrue(schema.getFields().stream()
.allMatch(field -> field.getDataType().equals(RecordFieldType.STRING.getDataType())));
}
} }

View File

@ -58,7 +58,7 @@ public class TestCSVSchemaInference {
final InputStream bufferedIn = new BufferedInputStream(in)) { final InputStream bufferedIn = new BufferedInputStream(in)) {
final InferSchemaAccessStrategy<?> accessStrategy = new InferSchemaAccessStrategy<>( final InferSchemaAccessStrategy<?> accessStrategy = new InferSchemaAccessStrategy<>(
(var, content) -> new CSVRecordSource(content, context), (variables, content) -> new CSVRecordSource(content, context, variables),
new CSVSchemaInference(timestampInference), Mockito.mock(ComponentLog.class)); new CSVSchemaInference(timestampInference), Mockito.mock(ComponentLog.class));
schema = accessStrategy.getSchema(null, bufferedIn, null); schema = accessStrategy.getSchema(null, bufferedIn, null);
} }
@ -82,4 +82,51 @@ public class TestCSVSchemaInference {
"componentId", "componentType", "componentName", "processGroupId", "processGroupName", "entityId", "entityType", "entitySize", "previousEntitySize", "updatedAttributes", "actorHostname", "componentId", "componentType", "componentName", "processGroupId", "processGroupName", "entityId", "entityType", "entitySize", "previousEntitySize", "updatedAttributes", "actorHostname",
"contentURI", "previousContentURI", "parentIds", "childIds", "platform", "application", "extra field", "numeric string"), fieldNames); "contentURI", "previousContentURI", "parentIds", "childIds", "platform", "application", "extra field", "numeric string"), fieldNames);
} }
@Test
public void testInferenceIncludesAllRecordsWithEL() throws IOException {
final File file = new File("src/test/resources/csv/prov-events.csv");
final Map<PropertyDescriptor, String> properties = new HashMap<>();
new CSVReader().getSupportedPropertyDescriptors().forEach(prop -> properties.put(prop, prop.getDefaultValue()));
properties.put(CSVUtils.TRIM_FIELDS, "true");
properties.put(CSVUtils.VALUE_SEPARATOR, "${csv.delimiter}");
properties.put(CSVUtils.QUOTE_CHAR, "${csv.quote}");
properties.put(CSVUtils.ESCAPE_CHAR, "${csv.escape}");
final PropertyContext context = new MockConfigurationContext(properties, null);
final Map<String, String> attributes = new HashMap<>();
attributes.put("csv.delimiter", ",");
attributes.put("csv.quote", "\"");
attributes.put("csv.escape", "\\");
final RecordSchema schema;
try (final InputStream in = new FileInputStream(file);
final InputStream bufferedIn = new BufferedInputStream(in)) {
final InferSchemaAccessStrategy<?> accessStrategy = new InferSchemaAccessStrategy<>(
(variables, content) -> new CSVRecordSource(content, context, variables),
new CSVSchemaInference(timestampInference), Mockito.mock(ComponentLog.class));
schema = accessStrategy.getSchema(attributes, bufferedIn, null);
}
assertSame(RecordFieldType.STRING, schema.getDataType("eventId").get().getFieldType());
assertSame(RecordFieldType.INT, schema.getDataType("eventOrdinal").get().getFieldType());
assertSame(RecordFieldType.STRING, schema.getDataType("eventType").get().getFieldType());
assertSame(RecordFieldType.LONG, schema.getDataType("timestampMillis").get().getFieldType());
assertEquals(RecordFieldType.TIMESTAMP.getDataType("yyyy-MM-dd'T'HH:mm:ss.SSS'Z'"), schema.getDataType("timestamp").get());
assertEquals(RecordFieldType.TIME.getDataType("HH:mm:ss"), schema.getDataType("eventTime").get());
assertEquals(RecordFieldType.DATE.getDataType("yyyy-MM-dd"), schema.getDataType("eventDate").get());
assertEquals(RecordFieldType.STRING.getDataType(), schema.getDataType("maybeTime").get());
assertEquals(RecordFieldType.DATE.getDataType("yyyy-MM-dd"), schema.getDataType("maybeDate").get());
assertSame(RecordFieldType.INT, schema.getDataType("parentIds").get().getFieldType());
assertSame(RecordFieldType.STRING, schema.getDataType("numeric string").get().getFieldType());
final List<String> fieldNames = schema.getFieldNames();
assertEquals(Arrays.asList("eventId", "eventOrdinal", "eventType", "timestampMillis", "timestamp", "eventDate", "eventTime", "maybeTime", "maybeDate", "durationMillis", "lineageStart",
"componentId", "componentType", "componentName", "processGroupId", "processGroupName", "entityId", "entityType", "entitySize", "previousEntitySize", "updatedAttributes", "actorHostname",
"contentURI", "previousContentURI", "parentIds", "childIds", "platform", "application", "extra field", "numeric string"), fieldNames);
}
} }

View File

@ -33,7 +33,6 @@ public class TestCSVValidators {
/*** SingleCharValidator **/ /*** SingleCharValidator **/
@Test @Test
public void testSingleCharNullValue() { public void testSingleCharNullValue() {
CSVValidators.SingleCharacterValidator validator = new CSVValidators.SingleCharacterValidator(); CSVValidators.SingleCharacterValidator validator = new CSVValidators.SingleCharacterValidator();
ValidationContext mockContext = Mockito.mock(ValidationContext.class); ValidationContext mockContext = Mockito.mock(ValidationContext.class);
ValidationResult result = validator.validate("EscapeChar", null, mockContext); ValidationResult result = validator.validate("EscapeChar", null, mockContext);
@ -66,6 +65,16 @@ public class TestCSVValidators {
assertTrue(result.isValid()); assertTrue(result.isValid());
} }
@Test
public void testSingleCharExpressionLanguage() {
CSVValidators.SingleCharacterValidator validator = new CSVValidators.SingleCharacterValidator();
ValidationContext mockContext = Mockito.mock(ValidationContext.class);
Mockito.when(mockContext.isExpressionLanguageSupported(Mockito.any())).thenReturn(true);
Mockito.when(mockContext.isExpressionLanguagePresent(Mockito.any())).thenReturn(true);
ValidationResult result = validator.validate("EscapeChar", "${csv.escape}", mockContext);
assertTrue(result.isValid());
}
/*** Unescaped SingleCharValidator **/ /*** Unescaped SingleCharValidator **/
@ -95,4 +104,14 @@ public class TestCSVValidators {
assertTrue(result.isValid()); assertTrue(result.isValid());
} }
@Test
public void testUnescapedSingleCharExpressionLanguage() {
Validator validator = CSVValidators.UNESCAPED_SINGLE_CHAR_VALIDATOR;
ValidationContext mockContext = Mockito.mock(ValidationContext.class);
Mockito.when(mockContext.isExpressionLanguageSupported(Mockito.any())).thenReturn(true);
Mockito.when(mockContext.isExpressionLanguagePresent(Mockito.any())).thenReturn(true);
ValidationResult result = validator.validate("Delimiter", "${csv.delimiter}", mockContext);
assertTrue(result.isValid());
}
} }

View File

@ -1,247 +1,248 @@
/* /*
* Licensed to the Apache Software Foundation (ASF) under one or more * Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with * contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership. * this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0 * The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with * (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at * the License. You may obtain a copy of the License at
* *
* http://www.apache.org/licenses/LICENSE-2.0 * http://www.apache.org/licenses/LICENSE-2.0
* *
* Unless required by applicable law or agreed to in writing, software * Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, * distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and * See the License for the specific language governing permissions and
* limitations under the License. * limitations under the License.
*/ */
package org.apache.nifi.xml; package org.apache.nifi.xml;
import org.apache.avro.Schema; import org.apache.avro.Schema;
import org.apache.nifi.avro.AvroTypeUtil; import org.apache.nifi.avro.AvroTypeUtil;
import org.apache.nifi.components.AllowableValue; import org.apache.nifi.components.AllowableValue;
import org.apache.nifi.logging.ComponentLog; import org.apache.nifi.logging.ComponentLog;
import org.apache.nifi.reporting.InitializationException; import org.apache.nifi.reporting.InitializationException;
import org.apache.nifi.schema.access.SchemaAccessUtils; import org.apache.nifi.schema.access.SchemaAccessUtils;
import org.apache.nifi.schema.access.SchemaNotFoundException; import org.apache.nifi.schema.access.SchemaNotFoundException;
import org.apache.nifi.serialization.RecordSetWriter; import org.apache.nifi.serialization.RecordSetWriter;
import org.apache.nifi.serialization.record.RecordSchema; import org.apache.nifi.serialization.record.RecordSchema;
import org.apache.nifi.serialization.record.SchemaIdentifier; import org.apache.nifi.serialization.record.SchemaIdentifier;
import org.apache.nifi.util.TestRunner; import org.apache.nifi.util.TestRunner;
import org.apache.nifi.util.TestRunners; import org.apache.nifi.util.TestRunners;
import org.junit.Assert; import org.junit.Assert;
import org.junit.Test; import org.junit.Test;
import org.xmlunit.diff.DefaultNodeMatcher; import org.xmlunit.diff.DefaultNodeMatcher;
import org.xmlunit.diff.ElementSelectors; import org.xmlunit.diff.ElementSelectors;
import org.xmlunit.matchers.CompareMatcher; import org.xmlunit.matchers.CompareMatcher;
import java.io.IOException; import java.io.IOException;
import java.io.OutputStream; import java.io.OutputStream;
import java.nio.file.Files; import java.nio.file.Files;
import java.nio.file.Paths; import java.nio.file.Paths;
import java.util.Collections;
import static org.junit.Assert.assertThat;
import static org.junit.Assert.assertThat;
public class TestXMLRecordSetWriter {
public class TestXMLRecordSetWriter {
private TestRunner setup(XMLRecordSetWriter writer) throws InitializationException, IOException {
TestRunner runner = TestRunners.newTestRunner(TestXMLRecordSetWriterProcessor.class); private TestRunner setup(XMLRecordSetWriter writer) throws InitializationException, IOException {
TestRunner runner = TestRunners.newTestRunner(TestXMLRecordSetWriterProcessor.class);
final String outputSchemaText = new String(Files.readAllBytes(Paths.get("src/test/resources/xml/testschema3")));
final String outputSchemaText = new String(Files.readAllBytes(Paths.get("src/test/resources/xml/testschema3")));
runner.addControllerService("xml_writer", writer);
runner.setProperty(TestXMLRecordSetWriterProcessor.XML_WRITER, "xml_writer"); runner.addControllerService("xml_writer", writer);
runner.setProperty(TestXMLRecordSetWriterProcessor.XML_WRITER, "xml_writer");
runner.setProperty(writer, SchemaAccessUtils.SCHEMA_ACCESS_STRATEGY, SchemaAccessUtils.SCHEMA_TEXT_PROPERTY);
runner.setProperty(writer, SchemaAccessUtils.SCHEMA_TEXT, outputSchemaText); runner.setProperty(writer, SchemaAccessUtils.SCHEMA_ACCESS_STRATEGY, SchemaAccessUtils.SCHEMA_TEXT_PROPERTY);
runner.setProperty(writer, XMLRecordSetWriter.PRETTY_PRINT_XML, new AllowableValue("true")); runner.setProperty(writer, SchemaAccessUtils.SCHEMA_TEXT, outputSchemaText);
runner.setProperty(writer, XMLRecordSetWriter.PRETTY_PRINT_XML, new AllowableValue("true"));
runner.setProperty(writer, "Schema Write Strategy", "no-schema");
runner.setProperty(writer, "Schema Write Strategy", "no-schema");
return runner;
} return runner;
}
@Test
public void testDefault() throws IOException, InitializationException { @Test
XMLRecordSetWriter writer = new XMLRecordSetWriter(); public void testDefault() throws IOException, InitializationException {
TestRunner runner = setup(writer); XMLRecordSetWriter writer = new XMLRecordSetWriter();
TestRunner runner = setup(writer);
runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "root");
runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "root");
runner.enableControllerService(writer);
runner.enqueue(""); runner.enableControllerService(writer);
runner.run(); runner.enqueue("");
runner.assertQueueEmpty(); runner.run();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1); runner.assertQueueEmpty();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1);
String expected = "<root><array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
"<name1>val1</name1><name2></name2></array_record>" + String expected = "<root><array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
"<array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" + "<name1>val1</name1><name2></name2></array_record>" +
"<name1>val1</name1><name2></name2></array_record></root>"; "<array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0))); "<name1>val1</name1><name2></name2></array_record></root>";
assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText))); String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0)));
} assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText)));
}
@Test
public void testDefaultSingleRecord() throws IOException, InitializationException { @Test
XMLRecordSetWriter writer = new XMLRecordSetWriter(); public void testDefaultSingleRecord() throws IOException, InitializationException {
TestRunner runner = setup(writer); XMLRecordSetWriter writer = new XMLRecordSetWriter();
TestRunner runner = setup(writer);
runner.setProperty(TestXMLRecordSetWriterProcessor.MULTIPLE_RECORDS, "false");
runner.setProperty(TestXMLRecordSetWriterProcessor.MULTIPLE_RECORDS, "false");
runner.enableControllerService(writer);
runner.enqueue(""); runner.enableControllerService(writer);
runner.run(); runner.enqueue("");
runner.assertQueueEmpty(); runner.run();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1); runner.assertQueueEmpty();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1);
String expected = "<array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
"<name1>val1</name1><name2></name2></array_record>"; String expected = "<array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
"<name1>val1</name1><name2></name2></array_record>";
String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0)));
assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText))); String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0)));
} assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText)));
}
@Test
public void testRootAndRecordNaming() throws IOException, InitializationException { @Test
XMLRecordSetWriter writer = new XMLRecordSetWriter(); public void testRootAndRecordNaming() throws IOException, InitializationException {
TestRunner runner = setup(writer); XMLRecordSetWriter writer = new XMLRecordSetWriter();
TestRunner runner = setup(writer);
runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "ROOT_NODE");
runner.setProperty(writer, XMLRecordSetWriter.RECORD_TAG_NAME, "RECORD_NODE"); runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "ROOT_NODE");
runner.setProperty(writer, XMLRecordSetWriter.RECORD_TAG_NAME, "RECORD_NODE");
runner.enableControllerService(writer);
runner.enqueue(""); runner.enableControllerService(writer);
runner.run(); runner.enqueue("");
runner.assertQueueEmpty(); runner.run();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1); runner.assertQueueEmpty();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1);
String expected = "<ROOT_NODE><RECORD_NODE><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
"<name1>val1</name1><name2></name2></RECORD_NODE>" + String expected = "<ROOT_NODE><RECORD_NODE><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
"<RECORD_NODE><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" + "<name1>val1</name1><name2></name2></RECORD_NODE>" +
"<name1>val1</name1><name2></name2></RECORD_NODE></ROOT_NODE>"; "<RECORD_NODE><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0))); "<name1>val1</name1><name2></name2></RECORD_NODE></ROOT_NODE>";
assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText))); String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0)));
} assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText)));
}
@Test
public void testSchemaRootRecordNaming() throws IOException, InitializationException { @Test
String avroSchemaText = new String(Files.readAllBytes(Paths.get("src/test/resources/xml/testschema3")));; public void testSchemaRootRecordNaming() throws IOException, InitializationException {
Schema avroSchema = new Schema.Parser().parse(avroSchemaText); String avroSchemaText = new String(Files.readAllBytes(Paths.get("src/test/resources/xml/testschema3")));;
Schema avroSchema = new Schema.Parser().parse(avroSchemaText);
SchemaIdentifier schemaId = SchemaIdentifier.builder().name("schemaName").build();
RecordSchema recordSchema = AvroTypeUtil.createSchema(avroSchema, avroSchemaText, schemaId); SchemaIdentifier schemaId = SchemaIdentifier.builder().name("schemaName").build();
RecordSchema recordSchema = AvroTypeUtil.createSchema(avroSchema, avroSchemaText, schemaId);
XMLRecordSetWriter writer = new _XMLRecordSetWriter(recordSchema);
TestRunner runner = setup(writer); XMLRecordSetWriter writer = new _XMLRecordSetWriter(recordSchema);
TestRunner runner = setup(writer);
runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "ROOT_NODE");
runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "ROOT_NODE");
runner.enableControllerService(writer);
runner.enqueue(""); runner.enableControllerService(writer);
runner.run(); runner.enqueue("");
runner.assertQueueEmpty(); runner.run();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1); runner.assertQueueEmpty();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1);
String expected = "<ROOT_NODE><array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
"<name1>val1</name1><name2></name2></array_record>" + String expected = "<ROOT_NODE><array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
"<array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" + "<name1>val1</name1><name2></name2></array_record>" +
"<name1>val1</name1><name2></name2></array_record></ROOT_NODE>"; "<array_record><array_field>1</array_field><array_field></array_field><array_field>3</array_field>" +
String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0))); "<name1>val1</name1><name2></name2></array_record></ROOT_NODE>";
assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText))); String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0)));
} assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText)));
}
@Test
public void testNullSuppression() throws IOException, InitializationException { @Test
XMLRecordSetWriter writer = new XMLRecordSetWriter(); public void testNullSuppression() throws IOException, InitializationException {
TestRunner runner = setup(writer); XMLRecordSetWriter writer = new XMLRecordSetWriter();
TestRunner runner = setup(writer);
runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "root");
runner.setProperty(writer, XMLRecordSetWriter.RECORD_TAG_NAME, "record"); runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "root");
runner.setProperty(writer, XMLRecordSetWriter.RECORD_TAG_NAME, "record");
runner.setProperty(writer, XMLRecordSetWriter.SUPPRESS_NULLS, XMLRecordSetWriter.ALWAYS_SUPPRESS);
runner.setProperty(writer, XMLRecordSetWriter.SUPPRESS_NULLS, XMLRecordSetWriter.ALWAYS_SUPPRESS);
runner.enableControllerService(writer);
runner.enqueue(""); runner.enableControllerService(writer);
runner.run(); runner.enqueue("");
runner.assertQueueEmpty(); runner.run();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1); runner.assertQueueEmpty();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1);
String expected = "<root><record><array_field>1</array_field><array_field>3</array_field>" +
"<name1>val1</name1></record>" + String expected = "<root><record><array_field>1</array_field><array_field>3</array_field>" +
"<record><array_field>1</array_field><array_field>3</array_field>" + "<name1>val1</name1></record>" +
"<name1>val1</name1></record></root>"; "<record><array_field>1</array_field><array_field>3</array_field>" +
String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0))); "<name1>val1</name1></record></root>";
assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText))); String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0)));
} assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText)));
}
@Test
public void testArrayWrapping() throws IOException, InitializationException { @Test
XMLRecordSetWriter writer = new XMLRecordSetWriter(); public void testArrayWrapping() throws IOException, InitializationException {
TestRunner runner = setup(writer); XMLRecordSetWriter writer = new XMLRecordSetWriter();
TestRunner runner = setup(writer);
runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "root");
runner.setProperty(writer, XMLRecordSetWriter.RECORD_TAG_NAME, "record"); runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "root");
runner.setProperty(writer, XMLRecordSetWriter.RECORD_TAG_NAME, "record");
runner.setProperty(writer, XMLRecordSetWriter.ARRAY_WRAPPING, XMLRecordSetWriter.USE_PROPERTY_AS_WRAPPER);
runner.setProperty(writer, XMLRecordSetWriter.ARRAY_TAG_NAME, "wrap"); runner.setProperty(writer, XMLRecordSetWriter.ARRAY_WRAPPING, XMLRecordSetWriter.USE_PROPERTY_AS_WRAPPER);
runner.setProperty(writer, XMLRecordSetWriter.ARRAY_TAG_NAME, "wrap");
runner.enableControllerService(writer);
runner.enqueue(""); runner.enableControllerService(writer);
runner.run(); runner.enqueue("");
runner.assertQueueEmpty(); runner.run();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1); runner.assertQueueEmpty();
runner.assertAllFlowFilesTransferred(TestXMLRecordSetWriterProcessor.SUCCESS, 1);
String expected = "<root><record><wrap><array_field>1</array_field><array_field></array_field><array_field>3</array_field></wrap>" +
"<name1>val1</name1><name2></name2></record>" + String expected = "<root><record><wrap><array_field>1</array_field><array_field></array_field><array_field>3</array_field></wrap>" +
"<record><wrap><array_field>1</array_field><array_field></array_field><array_field>3</array_field></wrap>" + "<name1>val1</name1><name2></name2></record>" +
"<name1>val1</name1><name2></name2></record></root>"; "<record><wrap><array_field>1</array_field><array_field></array_field><array_field>3</array_field></wrap>" +
String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0))); "<name1>val1</name1><name2></name2></record></root>";
assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText))); String actual = new String(runner.getContentAsByteArray(runner.getFlowFilesForRelationship(TestXMLRecordSetWriterProcessor.SUCCESS).get(0)));
} assertThat(expected, CompareMatcher.isSimilarTo(actual).ignoreWhitespace().withNodeMatcher(new DefaultNodeMatcher(ElementSelectors.byNameAndText)));
}
@Test
public void testValidation() throws IOException, InitializationException { @Test
XMLRecordSetWriter writer = new XMLRecordSetWriter(); public void testValidation() throws IOException, InitializationException {
TestRunner runner = setup(writer); XMLRecordSetWriter writer = new XMLRecordSetWriter();
TestRunner runner = setup(writer);
runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "root");
runner.setProperty(writer, XMLRecordSetWriter.RECORD_TAG_NAME, "record"); runner.setProperty(writer, XMLRecordSetWriter.ROOT_TAG_NAME, "root");
runner.setProperty(writer, XMLRecordSetWriter.RECORD_TAG_NAME, "record");
runner.setProperty(writer, XMLRecordSetWriter.ARRAY_WRAPPING, XMLRecordSetWriter.USE_PROPERTY_AS_WRAPPER);
runner.assertNotValid(writer); runner.setProperty(writer, XMLRecordSetWriter.ARRAY_WRAPPING, XMLRecordSetWriter.USE_PROPERTY_AS_WRAPPER);
runner.assertNotValid(writer);
runner.setProperty(writer, XMLRecordSetWriter.ARRAY_TAG_NAME, "array-tag-name");
runner.assertValid(writer); runner.setProperty(writer, XMLRecordSetWriter.ARRAY_TAG_NAME, "array-tag-name");
runner.assertValid(writer);
runner.enableControllerService(writer);
runner.enqueue(""); runner.enableControllerService(writer);
runner.enqueue("");
String message = "Processor has 1 validation failures:\n" +
"'xml_writer' validated against 'xml_writer' is invalid because Controller Service is not valid: " + String message = "Processor has 1 validation failures:\n" +
"'array_tag_name' is invalid because if property 'array_wrapping' is defined as 'Use Property as Wrapper' " + "'xml_writer' validated against 'xml_writer' is invalid because Controller Service is not valid: " +
"or 'Use Property for Elements' the property 'Array Tag Name' has to be set.\n"; "'array_tag_name' is invalid because if property 'array_wrapping' is defined as 'Use Property as Wrapper' " +
"or 'Use Property for Elements' the property 'Array Tag Name' has to be set.\n";
try {
runner.run(); try {
} catch (AssertionError e) { runner.run();
Assert.assertEquals(message, e.getMessage()); } catch (AssertionError e) {
} Assert.assertEquals(message, e.getMessage());
} }
}
static class _XMLRecordSetWriter extends XMLRecordSetWriter{
static class _XMLRecordSetWriter extends XMLRecordSetWriter{
RecordSchema recordSchema;
RecordSchema recordSchema;
_XMLRecordSetWriter(RecordSchema recordSchema){
this.recordSchema = recordSchema; _XMLRecordSetWriter(RecordSchema recordSchema){
} this.recordSchema = recordSchema;
}
@Override
public RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out) @Override
throws SchemaNotFoundException, IOException { public RecordSetWriter createWriter(ComponentLog logger, RecordSchema schema, OutputStream out)
return super.createWriter(logger, this.recordSchema, out); throws SchemaNotFoundException, IOException {
} return super.createWriter(logger, this.recordSchema, out, Collections.emptyMap());
} }
}
}
}

View File

@ -1,122 +1,123 @@
/* /*
* Licensed to the Apache Software Foundation (ASF) under one or more * Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with * contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership. * this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0 * The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with * (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at * the License. You may obtain a copy of the License at
* *
* http://www.apache.org/licenses/LICENSE-2.0 * http://www.apache.org/licenses/LICENSE-2.0
* *
* Unless required by applicable law or agreed to in writing, software * Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, * distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and * See the License for the specific language governing permissions and
* limitations under the License. * limitations under the License.
*/ */
package org.apache.nifi.xml; package org.apache.nifi.xml;
import org.apache.nifi.components.PropertyDescriptor; import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.flowfile.FlowFile; import org.apache.nifi.flowfile.FlowFile;
import org.apache.nifi.processor.AbstractProcessor; import org.apache.nifi.processor.AbstractProcessor;
import org.apache.nifi.processor.ProcessContext; import org.apache.nifi.processor.ProcessContext;
import org.apache.nifi.processor.ProcessSession; import org.apache.nifi.processor.ProcessSession;
import org.apache.nifi.processor.Relationship; import org.apache.nifi.processor.Relationship;
import org.apache.nifi.processor.exception.ProcessException; import org.apache.nifi.processor.exception.ProcessException;
import org.apache.nifi.processor.util.StandardValidators; import org.apache.nifi.processor.util.StandardValidators;
import org.apache.nifi.serialization.RecordSetWriter; import org.apache.nifi.serialization.RecordSetWriter;
import org.apache.nifi.serialization.RecordSetWriterFactory; import org.apache.nifi.serialization.RecordSetWriterFactory;
import org.apache.nifi.serialization.SimpleRecordSchema; import org.apache.nifi.serialization.SimpleRecordSchema;
import org.apache.nifi.serialization.record.ListRecordSet; import org.apache.nifi.serialization.record.ListRecordSet;
import org.apache.nifi.serialization.record.MapRecord; import org.apache.nifi.serialization.record.MapRecord;
import org.apache.nifi.serialization.record.Record; import org.apache.nifi.serialization.record.Record;
import org.apache.nifi.serialization.record.RecordSchema; import org.apache.nifi.serialization.record.RecordSchema;
import org.apache.nifi.serialization.record.RecordSet; import org.apache.nifi.serialization.record.RecordSet;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Collections; import java.util.Collections;
import java.util.HashMap; import java.util.HashMap;
import java.util.HashSet; import java.util.HashSet;
import java.util.List; import java.util.List;
import java.util.Map; import java.util.Map;
import java.util.Set; import java.util.Set;
public class TestXMLRecordSetWriterProcessor extends AbstractProcessor { public class TestXMLRecordSetWriterProcessor extends AbstractProcessor {
static final PropertyDescriptor XML_WRITER = new PropertyDescriptor.Builder() static final PropertyDescriptor XML_WRITER = new PropertyDescriptor.Builder()
.name("xml_writer") .name("xml_writer")
.identifiesControllerService(XMLRecordSetWriter.class) .identifiesControllerService(XMLRecordSetWriter.class)
.required(true) .required(true)
.build(); .build();
static final PropertyDescriptor MULTIPLE_RECORDS = new PropertyDescriptor.Builder() static final PropertyDescriptor MULTIPLE_RECORDS = new PropertyDescriptor.Builder()
.name("multiple_records") .name("multiple_records")
.allowableValues("true", "false") .allowableValues("true", "false")
.defaultValue("true") .defaultValue("true")
.addValidator(StandardValidators.NON_EMPTY_VALIDATOR) .addValidator(StandardValidators.NON_EMPTY_VALIDATOR)
.build(); .build();
public static final Relationship SUCCESS = new Relationship.Builder().name("success").description("success").build(); public static final Relationship SUCCESS = new Relationship.Builder().name("success").description("success").build();
@Override @Override
public void onTrigger(ProcessContext context, ProcessSession session) throws ProcessException { public void onTrigger(ProcessContext context, ProcessSession session) throws ProcessException {
FlowFile flowFile = session.get(); FlowFile flowFile = session.get();
final RecordSetWriterFactory writerFactory = context.getProperty(XML_WRITER).asControllerService(RecordSetWriterFactory.class); final RecordSetWriterFactory writerFactory = context.getProperty(XML_WRITER).asControllerService(RecordSetWriterFactory.class);
flowFile = session.write(flowFile, out -> { final FlowFile flowFileRef = flowFile;
try { flowFile = session.write(flowFile, out -> {
try {
final RecordSchema schema = writerFactory.getSchema(null, null);
final RecordSchema schema = writerFactory.getSchema(null, null);
boolean multipleRecords = Boolean.parseBoolean(context.getProperty(MULTIPLE_RECORDS).getValue());
RecordSet recordSet = getRecordSet(multipleRecords); boolean multipleRecords = Boolean.parseBoolean(context.getProperty(MULTIPLE_RECORDS).getValue());
RecordSet recordSet = getRecordSet(multipleRecords);
final RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out);
final RecordSetWriter writer = writerFactory.createWriter(getLogger(), schema, out, flowFileRef);
writer.write(recordSet);
writer.flush(); writer.write(recordSet);
writer.flush();
} catch (Exception e) {
throw new ProcessException(e.getMessage()); } catch (Exception e) {
} throw new ProcessException(e.getMessage());
}
});
session.transfer(flowFile, SUCCESS); });
} session.transfer(flowFile, SUCCESS);
}
@Override
protected List<PropertyDescriptor> getSupportedPropertyDescriptors() { @Override
return new ArrayList<PropertyDescriptor>() {{ add(XML_WRITER); add(MULTIPLE_RECORDS); }}; protected List<PropertyDescriptor> getSupportedPropertyDescriptors() {
} return new ArrayList<PropertyDescriptor>() {{ add(XML_WRITER); add(MULTIPLE_RECORDS); }};
}
@Override
public Set<Relationship> getRelationships() { @Override
return new HashSet<Relationship>() {{ add(SUCCESS); }}; public Set<Relationship> getRelationships() {
} return new HashSet<Relationship>() {{ add(SUCCESS); }};
}
protected static RecordSet getRecordSet(boolean multipleRecords) {
Object[] arrayVals = {1, null, 3}; protected static RecordSet getRecordSet(boolean multipleRecords) {
Object[] arrayVals = {1, null, 3};
Map<String,Object> recordFields = new HashMap<>();
recordFields.put("name1", "val1"); Map<String,Object> recordFields = new HashMap<>();
recordFields.put("name2", null); recordFields.put("name1", "val1");
recordFields.put("array_field", arrayVals); recordFields.put("name2", null);
recordFields.put("array_field", arrayVals);
RecordSchema emptySchema = new SimpleRecordSchema(Collections.emptyList());
RecordSchema emptySchema = new SimpleRecordSchema(Collections.emptyList());
List<Record> records = new ArrayList<>();
records.add(new MapRecord(emptySchema, recordFields)); List<Record> records = new ArrayList<>();
records.add(new MapRecord(emptySchema, recordFields));
if (multipleRecords) {
records.add(new MapRecord(emptySchema, recordFields)); if (multipleRecords) {
} records.add(new MapRecord(emptySchema, recordFields));
}
return new ListRecordSet(emptySchema, records);
} return new ListRecordSet(emptySchema, records);
}
}
}