mirror of https://github.com/apache/nifi.git
NIFI-6741: Add RecordPath support to scripting components
This closes #3790. Signed-off-by: Andy LoPresto <alopresto@apache.org>
This commit is contained in:
parent
ba141690c5
commit
b588073cbb
|
@ -51,6 +51,11 @@
|
|||
<groupId>org.apache.nifi</groupId>
|
||||
<artifactId>nifi-record</artifactId>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>org.apache.nifi</groupId>
|
||||
<artifactId>nifi-record-path</artifactId>
|
||||
<version>1.10.0-SNAPSHOT</version>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>org.apache.nifi</groupId>
|
||||
<artifactId>nifi-lookup-service-api</artifactId>
|
||||
|
@ -107,6 +112,12 @@
|
|||
<version>1.10.0-SNAPSHOT</version>
|
||||
<scope>test</scope>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>org.apache.nifi</groupId>
|
||||
<artifactId>nifi-mock-record-utils</artifactId>
|
||||
<version>1.10.0-SNAPSHOT</version>
|
||||
<scope>test</scope>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>org.codehaus.groovy</groupId>
|
||||
<artifactId>groovy-json</artifactId>
|
||||
|
|
|
@ -21,6 +21,8 @@ import org.apache.commons.codec.binary.Hex;
|
|||
import org.apache.nifi.components.PropertyDescriptor;
|
||||
import org.apache.nifi.processor.Relationship;
|
||||
import org.apache.nifi.script.ScriptingComponentUtils;
|
||||
import org.apache.nifi.serialization.record.MockRecordParser;
|
||||
import org.apache.nifi.serialization.record.RecordFieldType;
|
||||
import org.apache.nifi.util.MockFlowFile;
|
||||
import org.apache.nifi.util.MockProcessContext;
|
||||
import org.apache.nifi.util.MockProcessorInitializationContext;
|
||||
|
@ -35,6 +37,7 @@ import java.security.MessageDigest;
|
|||
import java.util.List;
|
||||
import java.util.Set;
|
||||
|
||||
import static org.junit.Assert.assertEquals;
|
||||
import static org.junit.Assert.assertFalse;
|
||||
import static org.junit.Assert.assertNotNull;
|
||||
import static org.junit.Assert.assertTrue;
|
||||
|
@ -209,4 +212,38 @@ public class TestInvokeGroovy extends BaseScriptTest {
|
|||
outputFlowFile.assertContentEquals(expectedOutput);
|
||||
outputFlowFile.assertAttributeEquals("outAttr", expectedOutput);
|
||||
}
|
||||
|
||||
/**
|
||||
* Tests a script that has a Groovy Processor that reads records and outputs a comma-delimited list of fields selected by a given RecordPath expression
|
||||
*
|
||||
* @throws Exception Any error encountered while testing
|
||||
*/
|
||||
@Test
|
||||
public void testReadRecordsWithRecordPath() throws Exception {
|
||||
runner.setProperty(scriptingComponent.getScriptingComponentHelper().SCRIPT_ENGINE, "Groovy");
|
||||
runner.setProperty(ScriptingComponentUtils.SCRIPT_FILE, "target/test/resources/groovy/test_record_path.groovy");
|
||||
runner.setProperty(ScriptingComponentUtils.MODULES, "target/test/resources/groovy");
|
||||
|
||||
final MockRecordParser readerService = new MockRecordParser();
|
||||
runner.addControllerService("reader", readerService);
|
||||
runner.enableControllerService(readerService);
|
||||
runner.setProperty("record-reader", "reader");
|
||||
runner.setProperty("record-path", "/age");
|
||||
readerService.addSchemaField("name", RecordFieldType.STRING);
|
||||
readerService.addSchemaField("age", RecordFieldType.INT);
|
||||
|
||||
readerService.addRecord("John Doe", 48);
|
||||
readerService.addRecord("Jane Doe", 47);
|
||||
readerService.addRecord("Jimmy Doe", 14);
|
||||
|
||||
runner.assertValid();
|
||||
runner.enqueue("".getBytes(StandardCharsets.UTF_8));
|
||||
runner.run();
|
||||
|
||||
runner.assertAllFlowFilesTransferred("success", 1);
|
||||
final List<MockFlowFile> result = runner.getFlowFilesForRelationship("success");
|
||||
assertEquals(1, result.size());
|
||||
MockFlowFile ff = result.get(0);
|
||||
ff.assertContentEquals("48\n47\n14\n");
|
||||
}
|
||||
}
|
||||
|
|
|
@ -0,0 +1,110 @@
|
|||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||
* contributor license agreements. See the NOTICE file distributed with
|
||||
* this work for additional information regarding copyright ownership.
|
||||
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||
* (the "License"); you may not use this file except in compliance with
|
||||
* the License. You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
import org.apache.nifi.flowfile.FlowFile
|
||||
import org.apache.nifi.processor.AbstractProcessor
|
||||
import org.apache.nifi.processor.ProcessContext
|
||||
import org.apache.nifi.processor.ProcessSession
|
||||
import org.apache.nifi.processor.Relationship
|
||||
import org.apache.nifi.processor.io.StreamCallback
|
||||
import org.apache.nifi.processor.util.StandardValidators
|
||||
import org.apache.nifi.record.path.RecordPath
|
||||
import org.apache.nifi.record.path.RecordPathResult
|
||||
import org.apache.nifi.serialization.*
|
||||
import org.apache.nifi.serialization.record.*
|
||||
import org.apache.nifi.schema.access.SchemaNotFoundException
|
||||
import java.util.concurrent.atomic.AtomicInteger
|
||||
import java.util.stream.Collectors
|
||||
|
||||
class MyRecordProcessor extends AbstractProcessor {
|
||||
|
||||
// Properties
|
||||
static final PropertyDescriptor RECORD_READER = new PropertyDescriptor.Builder()
|
||||
.name("record-reader")
|
||||
.displayName("Record Reader")
|
||||
.description("Specifies the Controller Service to use for reading incoming data")
|
||||
.identifiesControllerService(RecordReaderFactory.class)
|
||||
.required(true)
|
||||
.build()
|
||||
|
||||
static final PropertyDescriptor RECORD_PATH = new PropertyDescriptor.Builder()
|
||||
.name("record-path")
|
||||
.displayName("Record Path")
|
||||
.description("Specifies the Record Path expression to evaluate against each record")
|
||||
.addValidator(StandardValidators.NON_EMPTY_VALIDATOR)
|
||||
.required(true)
|
||||
.build()
|
||||
|
||||
def REL_SUCCESS = new Relationship.Builder().name("success").description('FlowFiles that were successfully processed are routed here').build()
|
||||
def REL_FAILURE = new Relationship.Builder().name("failure").description('FlowFiles are routed here if an error occurs during processing').build()
|
||||
|
||||
@Override
|
||||
protected List<PropertyDescriptor> getSupportedPropertyDescriptors() {
|
||||
def properties = [] as ArrayList
|
||||
properties.add(RECORD_READER)
|
||||
properties.add(RECORD_PATH)
|
||||
properties
|
||||
}
|
||||
|
||||
@Override
|
||||
Set<Relationship> getRelationships() {
|
||||
[REL_SUCCESS, REL_FAILURE] as Set<Relationship>
|
||||
}
|
||||
|
||||
@Override
|
||||
void onTrigger(ProcessContext context, ProcessSession session) {
|
||||
def flowFile = session.get()
|
||||
if (!flowFile) return
|
||||
|
||||
def readerFactory = context.getProperty(RECORD_READER).asControllerService(RecordReaderFactory)
|
||||
|
||||
final Map<String, String> attributes = new HashMap<>()
|
||||
final FlowFile original = flowFile
|
||||
final Map<String, String> originalAttributes = flowFile.attributes
|
||||
final String recordPathExpression = context.getProperty(RECORD_PATH).getValue()
|
||||
final RecordPath recordPath = RecordPath.compile(recordPathExpression)
|
||||
try {
|
||||
flowFile = session.write(flowFile, { inStream, outStream ->
|
||||
def reader = readerFactory.createRecordReader(originalAttributes, inStream, 100, getLogger())
|
||||
try {
|
||||
Record record
|
||||
while (record = reader.nextRecord()) {
|
||||
RecordPathResult result = recordPath.evaluate(record)
|
||||
def line = result.selectedFields.map({f -> record.getAsString(f.field.fieldName).toString()}).collect(Collectors.joining(',')) + '\n'
|
||||
outStream.write(line.bytes)
|
||||
}
|
||||
|
||||
} catch (final SchemaNotFoundException e) {
|
||||
throw new ProcessException(e.localizedMessage, e)
|
||||
} catch (final MalformedRecordException e) {
|
||||
throw new ProcessException('Could not parse incoming data', e)
|
||||
} finally {
|
||||
reader.close()
|
||||
}
|
||||
} as StreamCallback)
|
||||
|
||||
} catch (final Exception e) {
|
||||
getLogger().error('Failed to process {}; will route to failure', [flowFile, e] as Object[])
|
||||
session.transfer(flowFile, REL_FAILURE);
|
||||
return;
|
||||
}
|
||||
flowFile = session.putAllAttributes(flowFile, attributes)
|
||||
session.transfer(flowFile, REL_SUCCESS)
|
||||
}
|
||||
}
|
||||
|
||||
processor = new MyRecordProcessor()
|
Loading…
Reference in New Issue