NIFI-4957 Add Resource File Support for Jolt Specifications

This closes #4044

Signed-off-by: David Handermann <exceptionfactory@apache.org>
This commit is contained in:
Matthew Burgess 2020-02-10 13:02:49 -05:00 committed by exceptionfactory
parent 63452da617
commit 991e5e24de
No known key found for this signature in database
GPG Key ID: 29B6A52D2AAE8DBA
4 changed files with 277 additions and 115 deletions

View File

@ -34,9 +34,11 @@ import org.apache.nifi.annotation.documentation.Tags;
import org.apache.nifi.annotation.lifecycle.OnScheduled; import org.apache.nifi.annotation.lifecycle.OnScheduled;
import org.apache.nifi.components.AllowableValue; import org.apache.nifi.components.AllowableValue;
import org.apache.nifi.components.PropertyDescriptor; import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.components.PropertyValue;
import org.apache.nifi.components.ValidationContext; import org.apache.nifi.components.ValidationContext;
import org.apache.nifi.components.ValidationResult; import org.apache.nifi.components.ValidationResult;
import org.apache.nifi.components.resource.ResourceCardinality; import org.apache.nifi.components.resource.ResourceCardinality;
import org.apache.nifi.components.resource.ResourceReference;
import org.apache.nifi.components.resource.ResourceType; import org.apache.nifi.components.resource.ResourceType;
import org.apache.nifi.expression.ExpressionLanguageScope; import org.apache.nifi.expression.ExpressionLanguageScope;
import org.apache.nifi.flowfile.FlowFile; import org.apache.nifi.flowfile.FlowFile;
@ -60,10 +62,15 @@ import org.apache.nifi.serialization.record.RecordSchema;
import org.apache.nifi.serialization.record.util.DataTypeUtils; import org.apache.nifi.serialization.record.util.DataTypeUtils;
import org.apache.nifi.util.StopWatch; import org.apache.nifi.util.StopWatch;
import org.apache.nifi.util.StringUtils; import org.apache.nifi.util.StringUtils;
import org.apache.nifi.util.file.classloader.ClassLoaderUtils;
import java.io.BufferedReader;
import java.io.FilenameFilter;
import java.io.IOException; import java.io.IOException;
import java.io.InputStream; import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.OutputStream; import java.io.OutputStream;
import java.io.UncheckedIOException;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Arrays; import java.util.Arrays;
import java.util.Collection; import java.util.Collection;
@ -86,7 +93,7 @@ import java.util.stream.Collectors;
@WritesAttribute(attribute = "record.count", description = "The number of records in an outgoing FlowFile"), @WritesAttribute(attribute = "record.count", description = "The number of records in an outgoing FlowFile"),
@WritesAttribute(attribute = "mime.type", description = "The MIME Type that the configured Record Writer indicates is appropriate"), @WritesAttribute(attribute = "mime.type", description = "The MIME Type that the configured Record Writer indicates is appropriate"),
}) })
@CapabilityDescription("Applies a list of Jolt specifications to the FlowFile payload. A new FlowFile is created " @CapabilityDescription("Applies a JOLT specification to each record in the FlowFile payload. A new FlowFile is created "
+ "with transformed content and is routed to the 'success' relationship. If the transform " + "with transformed content and is routed to the 'success' relationship. If the transform "
+ "fails, the original FlowFile is routed to the 'failure' relationship.") + "fails, the original FlowFile is routed to the 'failure' relationship.")
@RequiresInstanceClassLoading @RequiresInstanceClassLoading
@ -141,9 +148,11 @@ public class JoltTransformRecord extends AbstractProcessor {
static final PropertyDescriptor JOLT_SPEC = new PropertyDescriptor.Builder() static final PropertyDescriptor JOLT_SPEC = new PropertyDescriptor.Builder()
.name("jolt-record-spec") .name("jolt-record-spec")
.displayName("Jolt Specification") .displayName("Jolt Specification")
.description("Jolt Specification for transform of record data. This value is ignored if the Jolt Sort Transformation is selected.") .description("Jolt Specification for transform of record data. The value for this property may be the text of a JOLT specification "
+ "or the path to a file containing a JOLT specification. This value is ignored if the Jolt Sort Transformation is selected.")
.expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES) .expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES)
.addValidator(StandardValidators.NON_EMPTY_VALIDATOR) .addValidator(StandardValidators.NON_EMPTY_VALIDATOR)
.identifiesExternalResource(ResourceCardinality.SINGLE, ResourceType.FILE, ResourceType.TEXT)
.required(false) .required(false)
.build(); .build();
@ -238,19 +247,26 @@ public class JoltTransformRecord extends AbstractProcessor {
final List<ValidationResult> results = new ArrayList<>(super.customValidate(validationContext)); final List<ValidationResult> results = new ArrayList<>(super.customValidate(validationContext));
final String transform = validationContext.getProperty(JOLT_TRANSFORM).getValue(); final String transform = validationContext.getProperty(JOLT_TRANSFORM).getValue();
final String customTransform = validationContext.getProperty(CUSTOM_CLASS).getValue(); final String customTransform = validationContext.getProperty(CUSTOM_CLASS).getValue();
if (!validationContext.getProperty(JOLT_SPEC).isSet() || StringUtils.isEmpty(validationContext.getProperty(JOLT_SPEC).getValue())) { final String modulePath = validationContext.getProperty(MODULES).isSet()? validationContext.getProperty(MODULES).getValue() : null;
if (!SORTR.getValue().equals(transform)) { final String joltSpecValue = validationContext.getProperty(JOLT_SPEC).getValue();
final String message = "A specification is required for this transformation";
results.add(new ValidationResult.Builder().valid(false)
.explanation(message)
.build());
}
} else {
try {
final String specValue = validationContext.getProperty(JOLT_SPEC).getValue();
if (validationContext.isExpressionLanguagePresent(specValue) ) { if (StringUtils.isEmpty(joltSpecValue) && !SORTR.getValue().equals(transform)) {
final String invalidExpressionMsg = validationContext.newExpressionLanguageCompiler().validateExpression(specValue, true); results.add(new ValidationResult.Builder().subject(JOLT_SPEC.getDisplayName()).valid(false).explanation(
"'Jolt Specification' must be set, or the Transformation must be 'Sort'").build());
} else {
final ClassLoader customClassLoader;
try {
if (modulePath != null) {
customClassLoader = ClassLoaderUtils.getCustomClassLoader(modulePath, this.getClass().getClassLoader(), getJarFilenameFilter());
} else {
customClassLoader = this.getClass().getClassLoader();
}
final boolean elPresent = validationContext.isExpressionLanguagePresent(joltSpecValue);
if (elPresent) {
final String invalidExpressionMsg = validationContext.newExpressionLanguageCompiler().validateExpression(joltSpecValue, true);
if (!StringUtils.isEmpty(invalidExpressionMsg)) { if (!StringUtils.isEmpty(invalidExpressionMsg)) {
results.add(new ValidationResult.Builder().valid(false) results.add(new ValidationResult.Builder().valid(false)
.subject(JOLT_SPEC.getDisplayName()) .subject(JOLT_SPEC.getDisplayName())
@ -258,8 +274,11 @@ public class JoltTransformRecord extends AbstractProcessor {
.build()); .build());
} }
} else { } else {
if (!SORTR.getValue().equals(transform)) {
//for validation we want to be able to ensure the spec is syntactically correct and not try to resolve variables since they may not exist yet //for validation we want to be able to ensure the spec is syntactically correct and not try to resolve variables since they may not exist yet
Object specJson = SORTR.getValue().equals(transform) ? null : JsonUtils.jsonToObject(specValue.replaceAll("\\$\\{", "\\\\\\\\\\$\\{"), DEFAULT_CHARSET); final String content = readTransform(validationContext.getProperty(JOLT_SPEC));
final Object specJson = JsonUtils.jsonToObject(content.replaceAll("\\$\\{", "\\\\\\\\\\$\\{"), DEFAULT_CHARSET);
if (CUSTOMR.getValue().equals(transform)) { if (CUSTOMR.getValue().equals(transform)) {
if (StringUtils.isEmpty(customTransform)) { if (StringUtils.isEmpty(customTransform)) {
@ -267,19 +286,12 @@ public class JoltTransformRecord extends AbstractProcessor {
results.add(new ValidationResult.Builder().valid(false) results.add(new ValidationResult.Builder().valid(false)
.explanation(customMessage) .explanation(customMessage)
.build()); .build());
} else if (validationContext.isExpressionLanguagePresent(customTransform)) { } else {
final String invalidExpressionMsg = validationContext.newExpressionLanguageCompiler().validateExpression(customTransform, true); TransformFactory.getCustomTransform(customClassLoader, customTransform, specJson);
if (!StringUtils.isEmpty(invalidExpressionMsg)) {
results.add(new ValidationResult.Builder().valid(false)
.subject(CUSTOM_CLASS.getDisplayName())
.explanation("Invalid Expression Language: " + invalidExpressionMsg)
.build());
} }
} else { } else {
TransformFactory.getCustomTransform(Thread.currentThread().getContextClassLoader(), customTransform, specJson); TransformFactory.getTransform(customClassLoader, transform, specJson);
} }
} else {
TransformFactory.getTransform(Thread.currentThread().getContextClassLoader(), transform, specJson);
} }
} }
} catch (final Exception e) { } catch (final Exception e) {
@ -294,7 +306,6 @@ public class JoltTransformRecord extends AbstractProcessor {
return results; return results;
} }
@SuppressWarnings("unchecked")
@Override @Override
public void onTrigger(final ProcessContext context, ProcessSession session) throws ProcessException { public void onTrigger(final ProcessContext context, ProcessSession session) throws ProcessException {
final FlowFile original = session.get(); final FlowFile original = session.get();
@ -337,7 +348,7 @@ public class JoltTransformRecord extends AbstractProcessor {
} }
transformed = session.putAllAttributes(transformed, attributes); transformed = session.putAllAttributes(transformed, attributes);
logger.info("{} had no Records to transform", new Object[]{original}); logger.info("{} had no Records to transform", original);
} else { } else {
final JoltTransform transform = getTransform(context, original); final JoltTransform transform = getTransform(context, original);
@ -375,9 +386,6 @@ public class JoltTransformRecord extends AbstractProcessor {
while ((record = reader.nextRecord()) != null) { while ((record = reader.nextRecord()) != null) {
final List<Record> transformedRecords = transform(record, transform); final List<Record> transformedRecords = transform(record, transform);
if (transformedRecords == null) {
throw new ProcessException("Error transforming the record");
}
for (Record transformedRecord : transformedRecords) { for (Record transformedRecord : transformedRecords) {
writer.write(transformedRecord); writer.write(transformedRecord);
} }
@ -388,7 +396,7 @@ public class JoltTransformRecord extends AbstractProcessor {
try { try {
writer.close(); writer.close();
} catch (final IOException ioe) { } catch (final IOException ioe) {
getLogger().warn("Failed to close Writer for {}", new Object[]{transformed}); getLogger().warn("Failed to close Writer for {}", transformed);
} }
attributes.put("record.count", String.valueOf(writeResult.getRecordCount())); attributes.put("record.count", String.valueOf(writeResult.getRecordCount()));
@ -399,10 +407,10 @@ public class JoltTransformRecord extends AbstractProcessor {
final String transformType = context.getProperty(JOLT_TRANSFORM).getValue(); final String transformType = context.getProperty(JOLT_TRANSFORM).getValue();
transformed = session.putAllAttributes(transformed, attributes); transformed = session.putAllAttributes(transformed, attributes);
session.getProvenanceReporter().modifyContent(transformed, "Modified With " + transformType, stopWatch.getElapsed(TimeUnit.MILLISECONDS)); session.getProvenanceReporter().modifyContent(transformed, "Modified With " + transformType, stopWatch.getElapsed(TimeUnit.MILLISECONDS));
logger.debug("Transformed {}", new Object[]{original}); logger.debug("Transform completed {}", original);
} }
} catch (final Exception ex) { } catch (final Exception e) {
logger.error("Unable to transform {} due to {}", new Object[]{original, ex.toString(), ex}); logger.error("Transform failed for {}", original, e);
session.transfer(original, REL_FAILURE); session.transfer(original, REL_FAILURE);
if (transformed != null) { if (transformed != null) {
session.remove(transformed); session.remove(transformed);
@ -449,13 +457,15 @@ public class JoltTransformRecord extends AbstractProcessor {
final Optional<String> specString; final Optional<String> specString;
if (context.getProperty(JOLT_SPEC).isSet()) { if (context.getProperty(JOLT_SPEC).isSet()) {
specString = Optional.of(context.getProperty(JOLT_SPEC).evaluateAttributeExpressions(flowFile).getValue()); specString = Optional.of(context.getProperty(JOLT_SPEC).evaluateAttributeExpressions(flowFile).getValue());
} else { } else if (SORTR.getValue().equals(context.getProperty(JOLT_TRANSFORM).getValue())) {
specString = Optional.empty(); specString = Optional.empty();
} else {
throw new IllegalArgumentException("'Jolt Specification' must be set, or the Transformation must be Sort.");
} }
return transformCache.get(specString, currString -> { return transformCache.get(specString, currString -> {
try { try {
return createTransform(context, currString.orElse(null), flowFile); return createTransform(context, flowFile);
} catch (Exception e) { } catch (Exception e) {
getLogger().error("Problem getting transform", e); getLogger().error("Problem getting transform", e);
} }
@ -463,6 +473,27 @@ public class JoltTransformRecord extends AbstractProcessor {
}); });
} }
private String readTransform(final PropertyValue propertyValue, final FlowFile flowFile) {
final String transform;
if (propertyValue.isExpressionLanguagePresent()) {
transform = propertyValue.evaluateAttributeExpressions(flowFile).getValue();
} else {
transform = readTransform(propertyValue);
}
return transform;
}
private String readTransform(final PropertyValue propertyValue) {
final ResourceReference resourceReference = propertyValue.asResource();
try (final BufferedReader reader = new BufferedReader(new InputStreamReader(resourceReference.read()))) {
return reader.lines().collect(Collectors.joining());
} catch (final IOException e) {
throw new UncheckedIOException("Read JOLT Transform failed", e);
}
}
@OnScheduled @OnScheduled
public void setup(final ProcessContext context) { public void setup(final ProcessContext context) {
int maxTransformsToCache = context.getProperty(TRANSFORM_CACHE_SIZE).asInteger(); int maxTransformsToCache = context.getProperty(TRANSFORM_CACHE_SIZE).asInteger();
@ -471,10 +502,11 @@ public class JoltTransformRecord extends AbstractProcessor {
.build(); .build();
} }
private JoltTransform createTransform(final ProcessContext context, final String specString, final FlowFile flowFile) throws Exception { private JoltTransform createTransform(final ProcessContext context, final FlowFile flowFile) throws Exception {
final Object specJson; final Object specJson;
if (context.getProperty(JOLT_SPEC).isSet() && !SORTR.getValue().equals(context.getProperty(JOLT_TRANSFORM).getValue())) { if ((context.getProperty(JOLT_SPEC).isSet() && !SORTR.getValue().equals(context.getProperty(JOLT_TRANSFORM).getValue()))) {
specJson = JsonUtils.jsonToObject(specString, DEFAULT_CHARSET); final String resolvedSpec = readTransform(context.getProperty(JOLT_SPEC), flowFile);
specJson = JsonUtils.jsonToObject(resolvedSpec, DEFAULT_CHARSET);
} else { } else {
specJson = null; specJson = null;
} }
@ -491,6 +523,10 @@ public class JoltTransformRecord extends AbstractProcessor {
? ((ContextualTransform) joltTransform).transform(input, Collections.emptyMap()) : ((Transform) joltTransform).transform(input); ? ((ContextualTransform) joltTransform).transform(input, Collections.emptyMap()) : ((Transform) joltTransform).transform(input);
} }
protected FilenameFilter getJarFilenameFilter(){
return (dir, name) -> (name != null && name.endsWith(".jar"));
}
/** /**
* Recursively replace List objects with Object[]. JOLT expects arrays to be of type List where our Record code uses Object[]. * Recursively replace List objects with Object[]. JOLT expects arrays to be of type List where our Record code uses Object[].
* *

View File

@ -102,6 +102,24 @@ public class TestJoltTransformRecord {
assertEquals(3, relationships.size()); assertEquals(3, relationships.size());
} }
@Test
public void testRelationshipsCreatedFromFile() throws IOException {
generateTestData(1, null);
final String outputSchemaText = new String(Files.readAllBytes(Paths.get("src/test/resources/TestJoltTransformRecord/chainrOutputSchema.avsc")));
runner.setProperty(writer, SchemaAccessUtils.SCHEMA_ACCESS_STRATEGY, SchemaAccessUtils.SCHEMA_TEXT_PROPERTY);
runner.setProperty(writer, SchemaAccessUtils.SCHEMA_TEXT, outputSchemaText);
runner.setProperty(writer, "Pretty Print JSON", "true");
runner.enableControllerService(writer);
final String spec = "./src/test/resources/TestJoltTransformRecord/chainrSpec.json";
runner.setProperty(JoltTransformRecord.JOLT_SPEC, spec);
runner.enqueue(new byte[0]);
Set<Relationship> relationships = processor.getRelationships();
assertTrue(relationships.contains(JoltTransformRecord.REL_FAILURE));
assertTrue(relationships.contains(JoltTransformRecord.REL_SUCCESS));
assertTrue(relationships.contains(JoltTransformRecord.REL_ORIGINAL));
assertEquals(3, relationships.size());
}
@Test @Test
public void testInvalidJOLTSpec() throws IOException { public void testInvalidJOLTSpec() throws IOException {
generateTestData(1, null); generateTestData(1, null);
@ -110,9 +128,14 @@ public class TestJoltTransformRecord {
runner.setProperty(writer, SchemaAccessUtils.SCHEMA_TEXT, outputSchemaText); runner.setProperty(writer, SchemaAccessUtils.SCHEMA_TEXT, outputSchemaText);
runner.setProperty(writer, "Pretty Print JSON", "true"); runner.setProperty(writer, "Pretty Print JSON", "true");
runner.enableControllerService(writer); runner.enableControllerService(writer);
final String spec = "[{}]"; String spec = "[{}]";
runner.setProperty(JoltTransformRecord.JOLT_SPEC, spec); runner.setProperty(JoltTransformRecord.JOLT_SPEC, spec);
runner.assertNotValid(); runner.assertNotValid();
final String specLocation = "src/test/resources/TestJoltTransformRecord/chainrSpec.json";
spec = new String(Files.readAllBytes(Paths.get(specLocation)));
runner.setProperty(JoltTransformRecord.JOLT_SPEC, spec);
runner.assertValid();
} }
@Test @Test
@ -365,7 +388,28 @@ runner.assertTransferCount(JoltTransformRecord.REL_ORIGINAL, 1);
transformed.assertAttributeEquals(CoreAttributes.MIME_TYPE.key(), "application/json"); transformed.assertAttributeEquals(CoreAttributes.MIME_TYPE.key(), "application/json");
assertEquals(new String(Files.readAllBytes(Paths.get("src/test/resources/TestJoltTransformRecord/shiftrOutputMultipleOutputRecords.json"))), assertEquals(new String(Files.readAllBytes(Paths.get("src/test/resources/TestJoltTransformRecord/shiftrOutputMultipleOutputRecords.json"))),
new String(transformed.toByteArray())); new String(transformed.toByteArray()));
}
@Test
public void testTransformInputWithShiftrFromFile() throws IOException {
generateTestData(1, null);
final String outputSchemaText = new String(Files.readAllBytes(Paths.get("src/test/resources/TestJoltTransformRecord/shiftrOutputSchema.avsc")));
runner.setProperty(writer, SchemaAccessUtils.SCHEMA_ACCESS_STRATEGY, SchemaAccessUtils.SCHEMA_TEXT_PROPERTY);
runner.setProperty(writer, SchemaAccessUtils.SCHEMA_TEXT, outputSchemaText);
runner.setProperty(writer, "Pretty Print JSON", "true");
runner.enableControllerService(writer);
final String spec = "./src/test/resources/TestJoltTransformRecord/shiftrSpec.json";
runner.setProperty(JoltTransformRecord.JOLT_SPEC, spec);
runner.setProperty(JoltTransformRecord.JOLT_TRANSFORM, JoltTransformRecord.SHIFTR);
runner.enqueue(new byte[0]);
runner.run();
runner.assertTransferCount(JoltTransformRecord.REL_SUCCESS, 1);
runner.assertTransferCount(JoltTransformRecord.REL_ORIGINAL, 1);
final MockFlowFile transformed = runner.getFlowFilesForRelationship(JoltTransformRecord.REL_SUCCESS).get(0);
transformed.assertAttributeExists(CoreAttributes.MIME_TYPE.key());
transformed.assertAttributeEquals(CoreAttributes.MIME_TYPE.key(), "application/json");
assertEquals(new String(Files.readAllBytes(Paths.get("src/test/resources/TestJoltTransformRecord/shiftrOutput.json"))),
new String(transformed.toByteArray()));
} }
@Test @Test
@ -684,5 +728,4 @@ runner.assertTransferCount(JoltTransformRecord.REL_ORIGINAL, 1);
recordGenerator.apply(numRecords, parser); recordGenerator.apply(numRecords, parser);
} }
} }
} }

View File

@ -31,9 +31,11 @@ import org.apache.nifi.annotation.documentation.Tags;
import org.apache.nifi.annotation.lifecycle.OnScheduled; import org.apache.nifi.annotation.lifecycle.OnScheduled;
import org.apache.nifi.components.AllowableValue; import org.apache.nifi.components.AllowableValue;
import org.apache.nifi.components.PropertyDescriptor; import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.components.PropertyValue;
import org.apache.nifi.components.ValidationContext; import org.apache.nifi.components.ValidationContext;
import org.apache.nifi.components.ValidationResult; import org.apache.nifi.components.ValidationResult;
import org.apache.nifi.components.resource.ResourceCardinality; import org.apache.nifi.components.resource.ResourceCardinality;
import org.apache.nifi.components.resource.ResourceReference;
import org.apache.nifi.components.resource.ResourceType; import org.apache.nifi.components.resource.ResourceType;
import org.apache.nifi.expression.ExpressionLanguageScope; import org.apache.nifi.expression.ExpressionLanguageScope;
import org.apache.nifi.flowfile.FlowFile; import org.apache.nifi.flowfile.FlowFile;
@ -44,7 +46,6 @@ import org.apache.nifi.processor.ProcessContext;
import org.apache.nifi.processor.ProcessSession; import org.apache.nifi.processor.ProcessSession;
import org.apache.nifi.processor.Relationship; import org.apache.nifi.processor.Relationship;
import org.apache.nifi.processor.exception.ProcessException; import org.apache.nifi.processor.exception.ProcessException;
import org.apache.nifi.processor.io.OutputStreamCallback;
import org.apache.nifi.processor.util.StandardValidators; import org.apache.nifi.processor.util.StandardValidators;
import org.apache.nifi.processors.standard.util.jolt.TransformFactory; import org.apache.nifi.processors.standard.util.jolt.TransformFactory;
import org.apache.nifi.processors.standard.util.jolt.TransformUtils; import org.apache.nifi.processors.standard.util.jolt.TransformUtils;
@ -52,10 +53,12 @@ import org.apache.nifi.util.StopWatch;
import org.apache.nifi.util.StringUtils; import org.apache.nifi.util.StringUtils;
import org.apache.nifi.util.file.classloader.ClassLoaderUtils; import org.apache.nifi.util.file.classloader.ClassLoaderUtils;
import java.io.BufferedReader;
import java.io.FilenameFilter; import java.io.FilenameFilter;
import java.io.IOException; import java.io.IOException;
import java.io.InputStream; import java.io.InputStream;
import java.io.OutputStream; import java.io.InputStreamReader;
import java.io.UncheckedIOException;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Collection; import java.util.Collection;
import java.util.Collections; import java.util.Collections;
@ -64,6 +67,7 @@ import java.util.List;
import java.util.Optional; import java.util.Optional;
import java.util.Set; import java.util.Set;
import java.util.concurrent.TimeUnit; import java.util.concurrent.TimeUnit;
import java.util.stream.Collectors;
@EventDriven @EventDriven
@SideEffectFree @SideEffectFree
@ -100,9 +104,12 @@ public class JoltTransformJSON extends AbstractProcessor {
public static final PropertyDescriptor JOLT_SPEC = new PropertyDescriptor.Builder() public static final PropertyDescriptor JOLT_SPEC = new PropertyDescriptor.Builder()
.name("jolt-spec") .name("jolt-spec")
.displayName("Jolt Specification") .displayName("Jolt Specification")
.description("Jolt Specification for transform of JSON data. This value is ignored if the Jolt Sort Transformation is selected.") .description("Jolt Specification for transformation of JSON data. The value for this property may be the text of a Jolt specification "
+ "or the path to a file containing a Jolt specification. 'Jolt Specification' must be set, or "
+ "the value is ignored if the Jolt Sort Transformation is selected.")
.expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES) .expressionLanguageSupported(ExpressionLanguageScope.FLOWFILE_ATTRIBUTES)
.addValidator(StandardValidators.NON_EMPTY_VALIDATOR) .addValidator(StandardValidators.NON_EMPTY_VALIDATOR)
.identifiesExternalResource(ResourceCardinality.SINGLE, ResourceType.FILE, ResourceType.TEXT)
.required(false) .required(false)
.build(); .build();
@ -199,14 +206,11 @@ public class JoltTransformJSON extends AbstractProcessor {
final String transform = validationContext.getProperty(JOLT_TRANSFORM).getValue(); final String transform = validationContext.getProperty(JOLT_TRANSFORM).getValue();
final String customTransform = validationContext.getProperty(CUSTOM_CLASS).getValue(); final String customTransform = validationContext.getProperty(CUSTOM_CLASS).getValue();
final String modulePath = validationContext.getProperty(MODULES).isSet() ? validationContext.getProperty(MODULES).getValue() : null; final String modulePath = validationContext.getProperty(MODULES).isSet() ? validationContext.getProperty(MODULES).getValue() : null;
final String joltSpecBody = validationContext.getProperty(JOLT_SPEC).getValue();
if(!validationContext.getProperty(JOLT_SPEC).isSet() || StringUtils.isEmpty(validationContext.getProperty(JOLT_SPEC).getValue())){ if (StringUtils.isEmpty(joltSpecBody) && !SORTR.getValue().equals(transform)) {
if(!SORTR.getValue().equals(transform)) { results.add(new ValidationResult.Builder().subject(JOLT_SPEC.getDisplayName()).valid(false).explanation(
final String message = "A specification is required for this transformation"; "'Jolt Specification' must be set, or the Transformation must be 'Sort'").build());
results.add(new ValidationResult.Builder().valid(false)
.explanation(message)
.build());
}
} else { } else {
final ClassLoader customClassLoader; final ClassLoader customClassLoader;
@ -217,9 +221,11 @@ public class JoltTransformJSON extends AbstractProcessor {
customClassLoader = this.getClass().getClassLoader(); customClassLoader = this.getClass().getClassLoader();
} }
final String specValue = validationContext.getProperty(JOLT_SPEC).getValue(); String specValue = validationContext.getProperty(JOLT_SPEC).getValue();
if (validationContext.isExpressionLanguagePresent(specValue)) { final boolean elPresent = validationContext.isExpressionLanguagePresent(specValue);
if (elPresent) {
final String invalidExpressionMsg = validationContext.newExpressionLanguageCompiler().validateExpression(specValue, true); final String invalidExpressionMsg = validationContext.newExpressionLanguageCompiler().validateExpression(specValue, true);
if (!StringUtils.isEmpty(invalidExpressionMsg)) { if (!StringUtils.isEmpty(invalidExpressionMsg)) {
results.add(new ValidationResult.Builder().valid(false) results.add(new ValidationResult.Builder().valid(false)
@ -236,8 +242,11 @@ public class JoltTransformJSON extends AbstractProcessor {
.build()); .build());
} }
} else { } else {
//for validation we want to be able to ensure the spec is syntactically correct and not try to resolve variables since they may not exist yet if (!SORTR.getValue().equals(transform)) {
Object specJson = SORTR.getValue().equals(transform) ? null : JsonUtils.jsonToObject(specValue.replaceAll("\\$\\{","\\\\\\\\\\$\\{"), DEFAULT_CHARSET);
///for validation we want to be able to ensure the spec is syntactically correct and not try to resolve variables since they may not exist yet
final String content = readTransform(validationContext.getProperty(JOLT_SPEC));
final Object specJson = JsonUtils.jsonToObject(content.replaceAll("\\$\\{", "\\\\\\\\\\$\\{"), DEFAULT_CHARSET);
if (CUSTOMR.getValue().equals(transform)) { if (CUSTOMR.getValue().equals(transform)) {
if (StringUtils.isEmpty(customTransform)) { if (StringUtils.isEmpty(customTransform)) {
@ -252,10 +261,12 @@ public class JoltTransformJSON extends AbstractProcessor {
TransformFactory.getTransform(customClassLoader, transform, specJson); TransformFactory.getTransform(customClassLoader, transform, specJson);
} }
} }
}
} catch (final Exception e) { } catch (final Exception e) {
getLogger().error("processor is not valid: ", e); String message = String.format("Specification not valid for the selected transformation: %s", e);
String message = "Specification not valid for the selected transformation." ; results.add(new ValidationResult.Builder()
results.add(new ValidationResult.Builder().valid(false) .valid(false)
.subject(JOLT_SPEC.getDisplayName())
.explanation(message) .explanation(message)
.build()); .build());
} }
@ -278,7 +289,7 @@ public class JoltTransformJSON extends AbstractProcessor {
try (final InputStream in = session.read(original)) { try (final InputStream in = session.read(original)) {
inputJson = JsonUtils.jsonToObject(in); inputJson = JsonUtils.jsonToObject(in);
} catch (final Exception e) { } catch (final Exception e) {
logger.error("Failed to transform {}; routing to failure", new Object[] {original, e}); logger.error("JSON parsing failed for {}", original, e);
session.transfer(original, REL_FAILURE); session.transfer(original, REL_FAILURE);
return; return;
} }
@ -293,8 +304,8 @@ public class JoltTransformJSON extends AbstractProcessor {
final Object transformedJson = TransformUtils.transform(transform, inputJson); final Object transformedJson = TransformUtils.transform(transform, inputJson);
jsonString = context.getProperty(PRETTY_PRINT).asBoolean() ? JsonUtils.toPrettyJsonString(transformedJson) : JsonUtils.toJsonString(transformedJson); jsonString = context.getProperty(PRETTY_PRINT).asBoolean() ? JsonUtils.toPrettyJsonString(transformedJson) : JsonUtils.toJsonString(transformedJson);
} catch (final Exception ex) { } catch (final Exception e) {
logger.error("Unable to transform {} due to {}", new Object[] {original, ex.toString(), ex}); logger.error("Transform failed for {}", original, e);
session.transfer(original, REL_FAILURE); session.transfer(original, REL_FAILURE);
return; return;
} finally { } finally {
@ -303,33 +314,30 @@ public class JoltTransformJSON extends AbstractProcessor {
} }
} }
FlowFile transformed = session.write(original, new OutputStreamCallback() { FlowFile transformed = session.write(original, out -> out.write(jsonString.getBytes(DEFAULT_CHARSET)));
@Override
public void process(OutputStream out) throws IOException {
out.write(jsonString.getBytes(DEFAULT_CHARSET));
}
});
final String transformType = context.getProperty(JOLT_TRANSFORM).getValue(); final String transformType = context.getProperty(JOLT_TRANSFORM).getValue();
transformed = session.putAttribute(transformed, CoreAttributes.MIME_TYPE.key(), "application/json"); transformed = session.putAttribute(transformed, CoreAttributes.MIME_TYPE.key(), "application/json");
session.transfer(transformed, REL_SUCCESS); session.transfer(transformed, REL_SUCCESS);
session.getProvenanceReporter().modifyContent(transformed, "Modified With " + transformType, stopWatch.getElapsed(TimeUnit.MILLISECONDS)); session.getProvenanceReporter().modifyContent(transformed, "Modified With " + transformType, stopWatch.getElapsed(TimeUnit.MILLISECONDS));
logger.info("Transformed {}", new Object[]{original}); logger.info("Transform completed for {}", original);
} }
private JoltTransform getTransform(final ProcessContext context, final FlowFile flowFile) { private JoltTransform getTransform(final ProcessContext context, final FlowFile flowFile) {
final Optional<String> specString; final Optional<String> specString;
if (context.getProperty(JOLT_SPEC).isSet()) { if (context.getProperty(JOLT_SPEC).isSet()) {
specString = Optional.of(context.getProperty(JOLT_SPEC).evaluateAttributeExpressions(flowFile).getValue()); specString = Optional.of(context.getProperty(JOLT_SPEC).evaluateAttributeExpressions(flowFile).getValue());
} else { } else if (SORTR.getValue().equals(context.getProperty(JOLT_TRANSFORM).getValue())) {
specString = Optional.empty(); specString = Optional.empty();
} else {
throw new IllegalArgumentException("'Jolt Specification' must be set, or the Transformation must be Sort.");
} }
return transformCache.get(specString, currString -> { return transformCache.get(specString, currString -> {
try { try {
return createTransform(context, currString.orElse(null), flowFile); return createTransform(context, flowFile);
} catch (Exception e) { } catch (Exception e) {
getLogger().error("Problem getting transform", e); getLogger().error("Transform creation failed", e);
} }
return null; return null;
}); });
@ -352,15 +360,16 @@ public class JoltTransformJSON extends AbstractProcessor {
} else { } else {
customClassLoader = this.getClass().getClassLoader(); customClassLoader = this.getClass().getClassLoader();
} }
} catch (final Exception ex) { } catch (final Exception e) {
getLogger().error("Unable to setup processor", ex); getLogger().error("ClassLoader configuration failed", e);
} }
} }
private JoltTransform createTransform(final ProcessContext context, final String specString, final FlowFile flowFile) throws Exception { private JoltTransform createTransform(final ProcessContext context, final FlowFile flowFile) throws Exception {
final Object specJson; final Object specJson;
if (context.getProperty(JOLT_SPEC).isSet() && !SORTR.getValue().equals(context.getProperty(JOLT_TRANSFORM).getValue())) { if ((context.getProperty(JOLT_SPEC).isSet() && !SORTR.getValue().equals(context.getProperty(JOLT_TRANSFORM).getValue()))) {
specJson = JsonUtils.jsonToObject(specString, DEFAULT_CHARSET); final String resolvedSpec = readTransform(context.getProperty(JOLT_SPEC), flowFile);
specJson = JsonUtils.jsonToObject(resolvedSpec, DEFAULT_CHARSET);
} else { } else {
specJson = null; specJson = null;
} }
@ -372,8 +381,28 @@ public class JoltTransformJSON extends AbstractProcessor {
} }
} }
private String readTransform(final PropertyValue propertyValue, final FlowFile flowFile) {
final String transform;
if (propertyValue.isExpressionLanguagePresent()) {
transform = propertyValue.evaluateAttributeExpressions(flowFile).getValue();
} else {
transform = readTransform(propertyValue);
}
return transform;
}
private String readTransform(final PropertyValue propertyValue) {
final ResourceReference resourceReference = propertyValue.asResource();
try (final BufferedReader reader = new BufferedReader(new InputStreamReader(resourceReference.read()))) {
return reader.lines().collect(Collectors.joining());
} catch (final IOException e) {
throw new UncheckedIOException("Read JOLT Transform failed", e);
}
}
protected FilenameFilter getJarFilenameFilter() { protected FilenameFilter getJarFilenameFilter() {
return (dir, name) -> (name != null && name.endsWith(".jar")); return (dir, name) -> (name != null && name.endsWith(".jar"));
} }
} }

View File

@ -59,11 +59,29 @@ public class TestJoltTransformJSON {
} }
@Test @Test
public void testInvalidJOLTSpec() { public void testRelationshipsCreatedFromFile() throws IOException{
Processor processor= new JoltTransformJSON();
final TestRunner runner = TestRunners.newTestRunner(processor);
final String spec = "./src/test/resources/TestJoltTransformJson/chainrSpec.json";
runner.setProperty(JoltTransformJSON.JOLT_SPEC, spec);
runner.enqueue(JSON_INPUT);
Set<Relationship> relationships = processor.getRelationships();
assertTrue(relationships.contains(JoltTransformJSON.REL_FAILURE));
assertTrue(relationships.contains(JoltTransformJSON.REL_SUCCESS));
assertEquals(2, relationships.size());
}
@Test
public void testInvalidJOLTSpec() throws IOException {
final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON()); final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON());
final String spec = "[{}]"; String spec = "[{}]";
runner.setProperty(JoltTransformJSON.JOLT_SPEC, spec); runner.setProperty(JoltTransformJSON.JOLT_SPEC, spec);
runner.assertNotValid(); runner.assertNotValid();
final String specLocation = "src/test/resources/TestJoltTransformJson/chainrSpec.json";
spec = new String(Files.readAllBytes(Paths.get(specLocation)));
runner.setProperty(JoltTransformJSON.JOLT_SPEC, spec);
runner.assertValid();
} }
@Test @Test
@ -76,7 +94,16 @@ public class TestJoltTransformJSON {
} }
@Test @Test
public void testSpecIsNotSet() { public void testIncorrectJOLTSpecFromFile() throws IOException {
final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON());
final String chainrSpec = "./src/test/resources/TestJoltTransformJson/chainrSpec.json";
runner.setProperty(JoltTransformJSON.JOLT_SPEC, chainrSpec);
runner.setProperty(JoltTransformJSON.JOLT_TRANSFORM, JoltTransformJSON.SHIFTR);
runner.assertNotValid();
}
@Test
public void testSpecIsNotSet() throws IOException {
final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON()); final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON());
runner.setProperty(JoltTransformJSON.JOLT_TRANSFORM, JoltTransformJSON.SHIFTR); runner.setProperty(JoltTransformJSON.JOLT_TRANSFORM, JoltTransformJSON.SHIFTR);
runner.assertNotValid(); runner.assertNotValid();
@ -118,6 +145,16 @@ public class TestJoltTransformJSON {
runner.assertAllFlowFilesTransferred(JoltTransformJSON.REL_FAILURE); runner.assertAllFlowFilesTransferred(JoltTransformJSON.REL_FAILURE);
} }
@Test
public void testInvalidFlowFileContentJsonFromFile() throws IOException {
final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON());
final String spec = "./src/test/resources/TestJoltTransformJson/chainrSpec.json";
runner.setProperty(JoltTransformJSON.JOLT_SPEC, spec);
runner.enqueue("invalid json");
runner.run();
runner.assertAllFlowFilesTransferred(JoltTransformJSON.REL_FAILURE);
}
@Test @Test
public void testCustomTransformationWithNoModule() throws IOException { public void testCustomTransformationWithNoModule() throws IOException {
final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON()); final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON());
@ -201,6 +238,23 @@ public class TestJoltTransformJSON {
assertTrue(DIFFY.diff(compareJson, transformedJson).isEmpty()); assertTrue(DIFFY.diff(compareJson, transformedJson).isEmpty());
} }
@Test
public void testTransformInputWithShiftrFromFile() throws IOException {
final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON());
final String spec = "./src/test/resources/TestJoltTransformJson/shiftrSpec.json";
runner.setProperty(JoltTransformJSON.JOLT_SPEC, spec);
runner.setProperty(JoltTransformJSON.JOLT_TRANSFORM, JoltTransformJSON.SHIFTR);
runner.enqueue(JSON_INPUT);
runner.run();
runner.assertAllFlowFilesTransferred(JoltTransformJSON.REL_SUCCESS);
final MockFlowFile transformed = runner.getFlowFilesForRelationship(JoltTransformJSON.REL_SUCCESS).get(0);
transformed.assertAttributeExists(CoreAttributes.MIME_TYPE.key());
transformed.assertAttributeEquals(CoreAttributes.MIME_TYPE.key(),"application/json");
Object transformedJson = JsonUtils.jsonToObject(new ByteArrayInputStream(transformed.toByteArray()));
Object compareJson = JsonUtils.jsonToObject(Files.newInputStream(Paths.get("src/test/resources/TestJoltTransformJson/shiftrOutput.json")));
assertTrue(DIFFY.diff(compareJson, transformedJson).isEmpty());
}
@Test @Test
public void testTransformInputWithDefaultr() throws IOException { public void testTransformInputWithDefaultr() throws IOException {
final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON()); final TestRunner runner = TestRunners.newTestRunner(new JoltTransformJSON());