NIFI-9276: Adding config verification to AbstractListProcessor subclasses (#5453)

This commit is contained in:
Joe Gresock 2021-10-21 12:22:50 -04:00 committed by GitHub
parent 1bec905890
commit d2f8f97b10
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
17 changed files with 582 additions and 255 deletions

View File

@ -35,7 +35,6 @@ import com.microsoft.azure.storage.blob.CloudBlobClient;
import com.microsoft.azure.storage.blob.CloudBlobContainer; import com.microsoft.azure.storage.blob.CloudBlobContainer;
import com.microsoft.azure.storage.blob.CloudBlockBlob; import com.microsoft.azure.storage.blob.CloudBlockBlob;
import com.microsoft.azure.storage.blob.ListBlobItem; import com.microsoft.azure.storage.blob.ListBlobItem;
import org.apache.commons.lang3.exception.ExceptionUtils; import org.apache.commons.lang3.exception.ExceptionUtils;
import org.apache.nifi.annotation.behavior.InputRequirement; import org.apache.nifi.annotation.behavior.InputRequirement;
import org.apache.nifi.annotation.behavior.InputRequirement.Requirement; import org.apache.nifi.annotation.behavior.InputRequirement.Requirement;
@ -62,6 +61,8 @@ import org.apache.nifi.processors.azure.storage.utils.BlobInfo;
import org.apache.nifi.processors.azure.storage.utils.BlobInfo.Builder; import org.apache.nifi.processors.azure.storage.utils.BlobInfo.Builder;
import org.apache.nifi.serialization.record.RecordSchema; import org.apache.nifi.serialization.record.RecordSchema;
import java.util.Optional;
@PrimaryNodeOnly @PrimaryNodeOnly
@TriggerSerially @TriggerSerially
@Tags({ "azure", "microsoft", "cloud", "storage", "blob" }) @Tags({ "azure", "microsoft", "cloud", "storage", "blob" })
@ -140,6 +141,11 @@ public class ListAzureBlobStorage extends AbstractListProcessor<BlobInfo> {
return attributes; return attributes;
} }
@Override
protected String getListingContainerName(final ProcessContext context) {
return String.format("Azure Blob Storage Container [%s]", getPath(context));
}
@Override @Override
protected String getPath(final ProcessContext context) { protected String getPath(final ProcessContext context) {
return context.getProperty(AzureStorageUtils.CONTAINER).evaluateAttributeExpressions().getValue(); return context.getProperty(AzureStorageUtils.CONTAINER).evaluateAttributeExpressions().getValue();
@ -173,27 +179,24 @@ public class ListAzureBlobStorage extends AbstractListProcessor<BlobInfo> {
} }
@Override @Override
protected List<BlobInfo> performListing(final ProcessContext context, final Long minTimestamp) throws IOException { protected List<BlobInfo> performListing(final ProcessContext context, final Long minTimestamp, final ListingMode listingMode) throws IOException {
String containerName = context.getProperty(AzureStorageUtils.CONTAINER).evaluateAttributeExpressions().getValue(); final String containerName = context.getProperty(AzureStorageUtils.CONTAINER).evaluateAttributeExpressions().getValue();
String prefix = context.getProperty(PROP_PREFIX).evaluateAttributeExpressions().getValue(); final String prefix = Optional.ofNullable(context.getProperty(PROP_PREFIX).evaluateAttributeExpressions().getValue()).orElse("");
if (prefix == null) {
prefix = "";
}
final List<BlobInfo> listing = new ArrayList<>(); final List<BlobInfo> listing = new ArrayList<>();
try { try {
CloudBlobClient blobClient = AzureStorageUtils.createCloudBlobClient(context, getLogger(), null); final CloudBlobClient blobClient = AzureStorageUtils.createCloudBlobClient(context, getLogger(), null);
CloudBlobContainer container = blobClient.getContainerReference(containerName); final CloudBlobContainer container = blobClient.getContainerReference(containerName);
final OperationContext operationContext = new OperationContext(); final OperationContext operationContext = new OperationContext();
AzureStorageUtils.setProxy(operationContext, context); AzureStorageUtils.setProxy(operationContext, context);
for (ListBlobItem blob : container.listBlobs(prefix, true, EnumSet.of(BlobListingDetails.METADATA), null, operationContext)) { for (final ListBlobItem blob : container.listBlobs(prefix, true, EnumSet.of(BlobListingDetails.METADATA), null, operationContext)) {
if (blob instanceof CloudBlob) { if (blob instanceof CloudBlob) {
CloudBlob cloudBlob = (CloudBlob) blob; final CloudBlob cloudBlob = (CloudBlob) blob;
BlobProperties properties = cloudBlob.getProperties(); final BlobProperties properties = cloudBlob.getProperties();
StorageUri uri = cloudBlob.getSnapshotQualifiedStorageUri(); final StorageUri uri = cloudBlob.getSnapshotQualifiedStorageUri();
Builder builder = new BlobInfo.Builder() final Builder builder = new BlobInfo.Builder()
.primaryUri(uri.getPrimaryUri().toString()) .primaryUri(uri.getPrimaryUri().toString())
.blobName(cloudBlob.getName()) .blobName(cloudBlob.getName())
.containerName(containerName) .containerName(containerName)
@ -215,12 +218,15 @@ public class ListAzureBlobStorage extends AbstractListProcessor<BlobInfo> {
listing.add(builder.build()); listing.add(builder.build());
} }
} }
} catch (Throwable t) { } catch (final Throwable t) {
throw new IOException(ExceptionUtils.getRootCause(t)); throw new IOException(ExceptionUtils.getRootCause(t));
} }
return listing; return listing;
} }
// Unfiltered listing is not supported - must provide a prefix
@Override
protected Integer countUnfilteredListing(final ProcessContext context) {
return null;
}
} }

View File

@ -160,12 +160,9 @@ public class ListAzureDataLakeStorage extends AbstractListProcessor<ADLSFileInfo
} }
@OnScheduled @OnScheduled
public void onScheduled(ProcessContext context) { public void onScheduled(final ProcessContext context) {
String fileFilter = context.getProperty(FILE_FILTER).evaluateAttributeExpressions().getValue(); filePattern = getPattern(context, FILE_FILTER);
filePattern = fileFilter != null ? Pattern.compile(fileFilter) : null; pathPattern = getPattern(context, PATH_FILTER);
String pathFilter = context.getProperty(PATH_FILTER).evaluateAttributeExpressions().getValue();
pathPattern = pathFilter != null ? Pattern.compile(pathFilter) : null;
} }
@OnStopped @OnStopped
@ -175,7 +172,7 @@ public class ListAzureDataLakeStorage extends AbstractListProcessor<ADLSFileInfo
} }
@Override @Override
protected void customValidate(ValidationContext context, Collection<ValidationResult> results) { protected void customValidate(final ValidationContext context, final Collection<ValidationResult> results) {
if (context.getProperty(PATH_FILTER).isSet() && !context.getProperty(RECURSE_SUBDIRECTORIES).asBoolean()) { if (context.getProperty(PATH_FILTER).isSet() && !context.getProperty(RECURSE_SUBDIRECTORIES).asBoolean()) {
results.add(new ValidationResult.Builder() results.add(new ValidationResult.Builder()
.subject(PATH_FILTER.getDisplayName()) .subject(PATH_FILTER.getDisplayName())
@ -191,7 +188,7 @@ public class ListAzureDataLakeStorage extends AbstractListProcessor<ADLSFileInfo
} }
@Override @Override
protected Scope getStateScope(PropertyContext context) { protected Scope getStateScope(final PropertyContext context) {
return Scope.CLUSTER; return Scope.CLUSTER;
} }
@ -201,55 +198,34 @@ public class ListAzureDataLakeStorage extends AbstractListProcessor<ADLSFileInfo
} }
@Override @Override
protected boolean isListingResetNecessary(PropertyDescriptor property) { protected boolean isListingResetNecessary(final PropertyDescriptor property) {
return LISTING_RESET_PROPERTIES.contains(property); return LISTING_RESET_PROPERTIES.contains(property);
} }
@Override @Override
protected String getPath(ProcessContext context) { protected String getPath(final ProcessContext context) {
String directory = context.getProperty(DIRECTORY).evaluateAttributeExpressions().getValue(); final String directory = context.getProperty(DIRECTORY).evaluateAttributeExpressions().getValue();
return directory != null ? directory : "."; return directory != null ? directory : ".";
} }
@Override @Override
protected List<ADLSFileInfo> performListing(ProcessContext context, Long minTimestamp) throws IOException { protected List<ADLSFileInfo> performListing(final ProcessContext context, final Long minTimestamp, final ListingMode listingMode) throws IOException {
try { return performListing(context, listingMode, true);
String fileSystem = evaluateFileSystemProperty(context, null);
String baseDirectory = evaluateDirectoryProperty(context, null);
boolean recurseSubdirectories = context.getProperty(RECURSE_SUBDIRECTORIES).asBoolean();
DataLakeServiceClient storageClient = getStorageClient(context, null);
DataLakeFileSystemClient fileSystemClient = storageClient.getFileSystemClient(fileSystem);
ListPathsOptions options = new ListPathsOptions();
options.setPath(baseDirectory);
options.setRecursive(recurseSubdirectories);
Pattern baseDirectoryPattern = Pattern.compile("^" + baseDirectory + "/?");
List<ADLSFileInfo> listing = fileSystemClient.listPaths(options, null).stream()
.filter(pathItem -> !pathItem.isDirectory())
.map(pathItem -> new ADLSFileInfo.Builder()
.fileSystem(fileSystem)
.filePath(pathItem.getName())
.length(pathItem.getContentLength())
.lastModified(pathItem.getLastModified().toInstant().toEpochMilli())
.etag(pathItem.getETag())
.build())
.filter(fileInfo -> filePattern == null || filePattern.matcher(fileInfo.getFilename()).matches())
.filter(fileInfo -> pathPattern == null || pathPattern.matcher(RegExUtils.removeFirst(fileInfo.getDirectory(), baseDirectoryPattern)).matches())
.collect(Collectors.toList());
return listing;
} catch (Exception e) {
getLogger().error("Failed to list directory on Azure Data Lake Storage", e);
throw new IOException(ExceptionUtils.getRootCause(e));
}
} }
@Override @Override
protected Map<String, String> createAttributes(ADLSFileInfo fileInfo, ProcessContext context) { protected Integer countUnfilteredListing(final ProcessContext context) throws IOException {
Map<String, String> attributes = new HashMap<>(); return performListing(context, ListingMode.CONFIGURATION_VERIFICATION, false).size();
}
@Override
protected String getListingContainerName(final ProcessContext context) {
return String.format("Azure Data Lake Directory [%s]", getPath(context));
}
@Override
protected Map<String, String> createAttributes(final ADLSFileInfo fileInfo, final ProcessContext context) {
final Map<String, String> attributes = new HashMap<>();
attributes.put(ATTR_NAME_FILESYSTEM, fileInfo.getFileSystem()); attributes.put(ATTR_NAME_FILESYSTEM, fileInfo.getFileSystem());
attributes.put(ATTR_NAME_FILE_PATH, fileInfo.getFilePath()); attributes.put(ATTR_NAME_FILE_PATH, fileInfo.getFilePath());
@ -261,4 +237,48 @@ public class ListAzureDataLakeStorage extends AbstractListProcessor<ADLSFileInfo
return attributes; return attributes;
} }
private List<ADLSFileInfo> performListing(final ProcessContext context, final ListingMode listingMode,
final boolean applyFilters) throws IOException {
try {
final String fileSystem = evaluateFileSystemProperty(context, null);
final String baseDirectory = evaluateDirectoryProperty(context, null);
final boolean recurseSubdirectories = context.getProperty(RECURSE_SUBDIRECTORIES).asBoolean();
final Pattern filePattern = listingMode == ListingMode.EXECUTION ? this.filePattern : getPattern(context, FILE_FILTER);
final Pattern pathPattern = listingMode == ListingMode.EXECUTION ? this.pathPattern : getPattern(context, PATH_FILTER);
final DataLakeServiceClient storageClient = getStorageClient(context, null);
final DataLakeFileSystemClient fileSystemClient = storageClient.getFileSystemClient(fileSystem);
final ListPathsOptions options = new ListPathsOptions();
options.setPath(baseDirectory);
options.setRecursive(recurseSubdirectories);
final Pattern baseDirectoryPattern = Pattern.compile("^" + baseDirectory + "/?");
final List<ADLSFileInfo> listing = fileSystemClient.listPaths(options, null).stream()
.filter(pathItem -> !pathItem.isDirectory())
.map(pathItem -> new ADLSFileInfo.Builder()
.fileSystem(fileSystem)
.filePath(pathItem.getName())
.length(pathItem.getContentLength())
.lastModified(pathItem.getLastModified().toInstant().toEpochMilli())
.etag(pathItem.getETag())
.build())
.filter(fileInfo -> applyFilters && (filePattern == null || filePattern.matcher(fileInfo.getFilename()).matches()))
.filter(fileInfo -> applyFilters && (pathPattern == null || pathPattern.matcher(RegExUtils.removeFirst(fileInfo.getDirectory(), baseDirectoryPattern)).matches()))
.collect(Collectors.toList());
return listing;
} catch (final Exception e) {
getLogger().error("Failed to list directory on Azure Data Lake Storage", e);
throw new IOException(ExceptionUtils.getRootCause(e));
}
}
private Pattern getPattern(final ProcessContext context, final PropertyDescriptor filterDescriptor) {
String value = context.getProperty(filterDescriptor).evaluateAttributeExpressions().getValue();
return value != null ? Pattern.compile(value) : null;
}
} }

View File

@ -26,6 +26,8 @@ import org.apache.nifi.annotation.lifecycle.OnScheduled;
import org.apache.nifi.annotation.notification.OnPrimaryNodeStateChange; import org.apache.nifi.annotation.notification.OnPrimaryNodeStateChange;
import org.apache.nifi.annotation.notification.PrimaryNodeState; import org.apache.nifi.annotation.notification.PrimaryNodeState;
import org.apache.nifi.components.AllowableValue; import org.apache.nifi.components.AllowableValue;
import org.apache.nifi.components.ConfigVerificationResult;
import org.apache.nifi.components.ConfigVerificationResult.Outcome;
import org.apache.nifi.components.PropertyDescriptor; import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.components.PropertyDescriptor.Builder; import org.apache.nifi.components.PropertyDescriptor.Builder;
import org.apache.nifi.components.ValidationContext; import org.apache.nifi.components.ValidationContext;
@ -40,10 +42,12 @@ import org.apache.nifi.distributed.cache.client.Serializer;
import org.apache.nifi.distributed.cache.client.exception.DeserializationException; import org.apache.nifi.distributed.cache.client.exception.DeserializationException;
import org.apache.nifi.distributed.cache.client.exception.SerializationException; import org.apache.nifi.distributed.cache.client.exception.SerializationException;
import org.apache.nifi.flowfile.FlowFile; import org.apache.nifi.flowfile.FlowFile;
import org.apache.nifi.logging.ComponentLog;
import org.apache.nifi.processor.AbstractProcessor; import org.apache.nifi.processor.AbstractProcessor;
import org.apache.nifi.processor.ProcessContext; import org.apache.nifi.processor.ProcessContext;
import org.apache.nifi.processor.ProcessSession; import org.apache.nifi.processor.ProcessSession;
import org.apache.nifi.processor.Relationship; import org.apache.nifi.processor.Relationship;
import org.apache.nifi.processor.VerifiableProcessor;
import org.apache.nifi.processor.exception.ProcessException; import org.apache.nifi.processor.exception.ProcessException;
import org.apache.nifi.schema.access.SchemaNotFoundException; import org.apache.nifi.schema.access.SchemaNotFoundException;
import org.apache.nifi.serialization.RecordSetWriter; import org.apache.nifi.serialization.RecordSetWriter;
@ -121,7 +125,7 @@ import java.util.stream.Collectors;
* </p> * </p>
* <ul> * <ul>
* <li> * <li>
* Perform a listing of resources. The subclass will implement the {@link #performListing(ProcessContext, Long)} method, which creates a listing of all * Perform a listing of resources. The subclass will implement the {@link #performListing(ProcessContext, Long, ListingMode)} method, which creates a listing of all
* entities on the target system that have timestamps later than the provided timestamp. If the entities returned have a timestamp before the provided one, those * entities on the target system that have timestamps later than the provided timestamp. If the entities returned have a timestamp before the provided one, those
* entities will be filtered out. It is therefore not necessary to perform the filtering of timestamps but is provided in order to give the implementation the ability * entities will be filtered out. It is therefore not necessary to perform the filtering of timestamps but is provided in order to give the implementation the ability
* to filter those resources on the server side rather than pulling back all of the information, if it makes sense to do so in the concrete implementation. * to filter those resources on the server side rather than pulling back all of the information, if it makes sense to do so in the concrete implementation.
@ -149,42 +153,61 @@ import java.util.stream.Collectors;
@TriggerSerially @TriggerSerially
@Stateful(scopes = {Scope.LOCAL, Scope.CLUSTER}, description = "After a listing of resources is performed, the latest timestamp of any of the resources is stored in the component's state. " @Stateful(scopes = {Scope.LOCAL, Scope.CLUSTER}, description = "After a listing of resources is performed, the latest timestamp of any of the resources is stored in the component's state. "
+ "The scope used depends on the implementation.") + "The scope used depends on the implementation.")
public abstract class AbstractListProcessor<T extends ListableEntity> extends AbstractProcessor { public abstract class AbstractListProcessor<T extends ListableEntity> extends AbstractProcessor implements VerifiableProcessor {
/**
* Indicates the mode when performing a listing.
*/
protected enum ListingMode {
/**
* Indicates the listing is being performed during normal processor execution. May use configuration cached in the Processor object.
*/
EXECUTION,
/**
* Indicates the listing is being performed during configuration verification. Only use configuration provided in the ProcessContext argument, since the configuration may not
* have been applied to the processor yet.
*/
CONFIGURATION_VERIFICATION
}
private static final Long IGNORE_MIN_TIMESTAMP_VALUE = 0L;
public static final PropertyDescriptor DISTRIBUTED_CACHE_SERVICE = new Builder() public static final PropertyDescriptor DISTRIBUTED_CACHE_SERVICE = new Builder()
.name("Distributed Cache Service") .name("Distributed Cache Service")
.description("NOTE: This property is used merely for migration from old NiFi version before state management was introduced at version 0.5.0. " .description("NOTE: This property is used merely for migration from old NiFi version before state management was introduced at version 0.5.0. "
+ "The stored value in the cache service will be migrated into the state when this processor is started at the first time. " + "The stored value in the cache service will be migrated into the state when this processor is started at the first time. "
+ "The specified Controller Service was used to maintain state about what had been pulled from the remote server so that if a new node " + "The specified Controller Service was used to maintain state about what had been pulled from the remote server so that if a new node "
+ "begins pulling data, it won't duplicate all of the work that has been done. If not specified, the information was not shared across the cluster. " + "begins pulling data, it won't duplicate all of the work that has been done. If not specified, the information was not shared across the cluster. "
+ "This property did not need to be set for standalone instances of NiFi but was supposed to be configured if NiFi had been running within a cluster.") + "This property did not need to be set for standalone instances of NiFi but was supposed to be configured if NiFi had been running within a cluster.")
.required(false) .required(false)
.identifiesControllerService(DistributedMapCacheClient.class) .identifiesControllerService(DistributedMapCacheClient.class)
.build(); .build();
public static final AllowableValue PRECISION_AUTO_DETECT = new AllowableValue("auto-detect", "Auto Detect", public static final AllowableValue PRECISION_AUTO_DETECT = new AllowableValue("auto-detect", "Auto Detect",
"Automatically detect time unit deterministically based on candidate entries timestamp." "Automatically detect time unit deterministically based on candidate entries timestamp."
+ " Please note that this option may take longer to list entities unnecessarily, if none of entries has a precise precision timestamp." + " Please note that this option may take longer to list entities unnecessarily, if none of entries has a precise precision timestamp."
+ " E.g. even if a target system supports millis, if all entries only have timestamps without millis, such as '2017-06-16 09:06:34.000', then its precision is determined as 'seconds'."); + " E.g. even if a target system supports millis, if all entries only have timestamps without millis, such as '2017-06-16 09:06:34.000', "
+ "then its precision is determined as 'seconds'.");
public static final AllowableValue PRECISION_MILLIS = new AllowableValue("millis", "Milliseconds", public static final AllowableValue PRECISION_MILLIS = new AllowableValue("millis", "Milliseconds",
"This option provides the minimum latency for an entry from being available to being listed if target system supports millis, if not, use other options."); "This option provides the minimum latency for an entry from being available to being listed if target system supports millis, if not, use other options.");
public static final AllowableValue PRECISION_SECONDS = new AllowableValue("seconds", "Seconds","For a target system that does not have millis precision, but has in seconds."); public static final AllowableValue PRECISION_SECONDS = new AllowableValue("seconds", "Seconds",
"For a target system that does not have millis precision, but has in seconds.");
public static final AllowableValue PRECISION_MINUTES = new AllowableValue("minutes", "Minutes", "For a target system that only supports precision in minutes."); public static final AllowableValue PRECISION_MINUTES = new AllowableValue("minutes", "Minutes", "For a target system that only supports precision in minutes.");
public static final PropertyDescriptor TARGET_SYSTEM_TIMESTAMP_PRECISION = new Builder() public static final PropertyDescriptor TARGET_SYSTEM_TIMESTAMP_PRECISION = new Builder()
.name("target-system-timestamp-precision") .name("target-system-timestamp-precision")
.displayName("Target System Timestamp Precision") .displayName("Target System Timestamp Precision")
.description("Specify timestamp precision at the target system." .description("Specify timestamp precision at the target system."
+ " Since this processor uses timestamp of entities to decide which should be listed, it is crucial to use the right timestamp precision.") + " Since this processor uses timestamp of entities to decide which should be listed, it is crucial to use the right timestamp precision.")
.required(true) .required(true)
.allowableValues(PRECISION_AUTO_DETECT, PRECISION_MILLIS, PRECISION_SECONDS, PRECISION_MINUTES) .allowableValues(PRECISION_AUTO_DETECT, PRECISION_MILLIS, PRECISION_SECONDS, PRECISION_MINUTES)
.defaultValue(PRECISION_AUTO_DETECT.getValue()) .defaultValue(PRECISION_AUTO_DETECT.getValue())
.build(); .build();
public static final Relationship REL_SUCCESS = new Relationship.Builder() public static final Relationship REL_SUCCESS = new Relationship.Builder()
.name("success") .name("success")
.description("All FlowFiles that are received are routed to success") .description("All FlowFiles that are received are routed to success")
.build(); .build();
public static final AllowableValue BY_TIMESTAMPS = new AllowableValue("timestamps", "Tracking Timestamps", public static final AllowableValue BY_TIMESTAMPS = new AllowableValue("timestamps", "Tracking Timestamps",
"This strategy tracks the latest timestamp of listed entity to determine new/updated entities." + "This strategy tracks the latest timestamp of listed entity to determine new/updated entities." +
@ -214,22 +237,22 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
" are accurate."); " are accurate.");
public static final PropertyDescriptor LISTING_STRATEGY = new Builder() public static final PropertyDescriptor LISTING_STRATEGY = new Builder()
.name("listing-strategy") .name("listing-strategy")
.displayName("Listing Strategy") .displayName("Listing Strategy")
.description("Specify how to determine new/updated entities. See each strategy descriptions for detail.") .description("Specify how to determine new/updated entities. See each strategy descriptions for detail.")
.required(true) .required(true)
.allowableValues(BY_TIMESTAMPS, BY_ENTITIES, NO_TRACKING) .allowableValues(BY_TIMESTAMPS, BY_ENTITIES, NO_TRACKING)
.defaultValue(BY_TIMESTAMPS.getValue()) .defaultValue(BY_TIMESTAMPS.getValue())
.build(); .build();
public static final PropertyDescriptor RECORD_WRITER = new Builder() public static final PropertyDescriptor RECORD_WRITER = new Builder()
.name("record-writer") .name("record-writer")
.displayName("Record Writer") .displayName("Record Writer")
.description("Specifies the Record Writer to use for creating the listing. If not specified, one FlowFile will be created for each entity that is listed. If the Record Writer is specified, " + .description("Specifies the Record Writer to use for creating the listing. If not specified, one FlowFile will be created for each entity that is listed. " +
"all entities will be written to a single FlowFile instead of adding attributes to individual FlowFiles.") "If the Record Writer is specified, all entities will be written to a single FlowFile instead of adding attributes to individual FlowFiles.")
.required(false) .required(false)
.identifiesControllerService(RecordSetWriterFactory.class) .identifiesControllerService(RecordSetWriterFactory.class)
.build(); .build();
/** /**
* Represents the timestamp of an entity which was the latest one within those listed at the previous cycle. * Represents the timestamp of an entity which was the latest one within those listed at the previous cycle.
@ -255,6 +278,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
* near instantaneously after the prior iteration effectively voiding the built in buffer * near instantaneously after the prior iteration effectively voiding the built in buffer
*/ */
public static final Map<TimeUnit, Long> LISTING_LAG_MILLIS; public static final Map<TimeUnit, Long> LISTING_LAG_MILLIS;
static { static {
final Map<TimeUnit, Long> nanos = new HashMap<>(); final Map<TimeUnit, Long> nanos = new HashMap<>();
nanos.put(TimeUnit.MILLISECONDS, 100L); nanos.put(TimeUnit.MILLISECONDS, 100L);
@ -262,6 +286,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
nanos.put(TimeUnit.MINUTES, 60_000L); nanos.put(TimeUnit.MINUTES, 60_000L);
LISTING_LAG_MILLIS = Collections.unmodifiableMap(nanos); LISTING_LAG_MILLIS = Collections.unmodifiableMap(nanos);
} }
static final String LATEST_LISTED_ENTRY_TIMESTAMP_KEY = "listing.timestamp"; static final String LATEST_LISTED_ENTRY_TIMESTAMP_KEY = "listing.timestamp";
static final String LAST_PROCESSED_LATEST_ENTRY_TIMESTAMP_KEY = "processed.timestamp"; static final String LAST_PROCESSED_LATEST_ENTRY_TIMESTAMP_KEY = "processed.timestamp";
static final String IDENTIFIER_PREFIX = "id"; static final String IDENTIFIER_PREFIX = "id";
@ -279,7 +304,6 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
} }
} }
@Override @Override
public Set<Relationship> getRelationships() { public Set<Relationship> getRelationships() {
final Set<Relationship> relationships = new HashSet<>(); final Set<Relationship> relationships = new HashSet<>();
@ -291,7 +315,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
* In order to add custom validation at sub-classes, implement {@link #customValidate(ValidationContext, Collection)} method. * In order to add custom validation at sub-classes, implement {@link #customValidate(ValidationContext, Collection)} method.
*/ */
@Override @Override
protected final Collection<ValidationResult> customValidate(ValidationContext context) { protected final Collection<ValidationResult> customValidate(final ValidationContext context) {
final Collection<ValidationResult> results = new ArrayList<>(); final Collection<ValidationResult> results = new ArrayList<>();
final String listingStrategy = context.getProperty(LISTING_STRATEGY).getValue(); final String listingStrategy = context.getProperty(LISTING_STRATEGY).getValue();
@ -303,9 +327,9 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
return results; return results;
} }
/** /**
* Sub-classes can add custom validation by implementing this method. * Sub-classes can add custom validation by implementing this method.
*
* @param validationContext the validation context * @param validationContext the validation context
* @param validationResults add custom validation result to this collection * @param validationResults add custom validation result to this collection
*/ */
@ -313,6 +337,54 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
} }
@Override
public List<ConfigVerificationResult> verify(final ProcessContext context, final ComponentLog logger, final Map<String, String> attributes) {
final List<ConfigVerificationResult> results = new ArrayList<>();
final String containerName = getListingContainerName(context);
try {
final Integer unfilteredListingCount = countUnfilteredListing(context);
final int matchingCount = performListing(context, IGNORE_MIN_TIMESTAMP_VALUE, ListingMode.CONFIGURATION_VERIFICATION).size();
final String countExplanation;
if (unfilteredListingCount == null) {
if (matchingCount == 0) {
countExplanation = "Found no objects matching the filter.";
} else {
final String matchingCountText = matchingCount == 1 ? matchingCount + " object" : matchingCount + " objects";
countExplanation = String.format("Found %s matching the filter.", matchingCountText);
}
} else if (unfilteredListingCount == 0) {
countExplanation = "Found no objects.";
} else {
final String unfilteredListingCountText = unfilteredListingCount == 1 ? unfilteredListingCount + " object" : unfilteredListingCount + " objects";
final String unfilteredDemonstrativePronoun = unfilteredListingCount == 1 ? "that" : "those";
final String matchingCountText = matchingCount == 1 ? matchingCount + " matches" : matchingCount + " match";
countExplanation = String.format("Found %s. Of %s, %s the filter.",
unfilteredListingCountText, unfilteredDemonstrativePronoun, matchingCountText);
}
results.add(new ConfigVerificationResult.Builder()
.verificationStepName("Perform Listing")
.outcome(Outcome.SUCCESSFUL)
.explanation(String.format("Successfully listed contents of %s. %s", containerName, countExplanation))
.build());
logger.info("Successfully verified configuration");
} catch (final IOException e) {
logger.warn("Failed to verify configuration. Could not list contents of {}", containerName, e);
results.add(new ConfigVerificationResult.Builder()
.verificationStepName("Perform Listing")
.outcome(Outcome.FAILED)
.explanation(String.format("Failed to list contents of %s: %s", containerName, e.getMessage()))
.build());
}
return results;
}
@OnPrimaryNodeStateChange @OnPrimaryNodeStateChange
public void onPrimaryNodeChange(final PrimaryNodeState newState) { public void onPrimaryNodeChange(final PrimaryNodeState newState) {
justElectedPrimaryNode = (newState == PrimaryNodeState.ELECTED_PRIMARY_NODE); justElectedPrimaryNode = (newState == PrimaryNodeState.ELECTED_PRIMARY_NODE);
@ -376,7 +448,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
client.remove(path, new StringSerDe()); client.remove(path, new StringSerDe());
} catch (final IOException ioe) { } catch (final IOException ioe) {
getLogger().warn("Failed to remove entry from Distributed Cache Service. However, the state has already been migrated to use the new " getLogger().warn("Failed to remove entry from Distributed Cache Service. However, the state has already been migrated to use the new "
+ "State Management service, so the Distributed Cache Service is no longer needed."); + "State Management service, so the Distributed Cache Service is no longer needed.");
} }
} }
} }
@ -415,8 +487,8 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
} }
private Map<String, String> createStateMap(final long latestListedEntryTimestampThisCycleMillis, private Map<String, String> createStateMap(final long latestListedEntryTimestampThisCycleMillis,
final long lastProcessedLatestEntryTimestampMillis, final long lastProcessedLatestEntryTimestampMillis,
final List<String> processedIdentifiesWithLatestTimestamp) throws IOException { final List<String> processedIdentifiesWithLatestTimestamp) throws IOException {
final Map<String, String> updatedState = new HashMap<>(processedIdentifiesWithLatestTimestamp.size() + 2); final Map<String, String> updatedState = new HashMap<>(processedIdentifiesWithLatestTimestamp.size() + 2);
updatedState.put(LATEST_LISTED_ENTRY_TIMESTAMP_KEY, String.valueOf(latestListedEntryTimestampThisCycleMillis)); updatedState.put(LATEST_LISTED_ENTRY_TIMESTAMP_KEY, String.valueOf(latestListedEntryTimestampThisCycleMillis));
@ -428,7 +500,6 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
return updatedState; return updatedState;
} }
private void persist(final long latestListedEntryTimestampThisCycleMillis, private void persist(final long latestListedEntryTimestampThisCycleMillis,
final long lastProcessedLatestEntryTimestampMillis, final long lastProcessedLatestEntryTimestampMillis,
final List<String> processedIdentifiesWithLatestTimestamp, final List<String> processedIdentifiesWithLatestTimestamp,
@ -467,6 +538,10 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
} }
} }
protected long getCurrentTime() {
return System.currentTimeMillis();
}
public void listByNoTracking(final ProcessContext context, final ProcessSession session) { public void listByNoTracking(final ProcessContext context, final ProcessSession session) {
final List<T> entityList; final List<T> entityList;
@ -483,7 +558,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
try { try {
// minTimestamp = 0L by default on this strategy to ignore any future // minTimestamp = 0L by default on this strategy to ignore any future
// comparision in lastModifiedMap to the same entity. // comparision in lastModifiedMap to the same entity.
entityList = performListing(context, 0L); entityList = performListing(context, IGNORE_MIN_TIMESTAMP_VALUE, ListingMode.EXECUTION);
} catch (final IOException pe) { } catch (final IOException pe) {
getLogger().error("Failed to perform listing on remote host due to {}", new Object[]{pe.getMessage()}, pe); getLogger().error("Failed to perform listing on remote host due to {}", new Object[]{pe.getMessage()}, pe);
context.yield(); context.yield();
@ -516,12 +591,12 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
} }
public void listByTimeWindow(final ProcessContext context, final ProcessSession session) throws ProcessException { public void listByTimeWindow(final ProcessContext context, final ProcessSession session) throws ProcessException {
if (this.lastListedLatestEntryTimestampMillis == null || justElectedPrimaryNode) { if (lastListedLatestEntryTimestampMillis == null || justElectedPrimaryNode) {
try { try {
final StateMap stateMap = context.getStateManager().getState(getStateScope(context)); final StateMap stateMap = context.getStateManager().getState(getStateScope(context));
Optional.ofNullable(stateMap.get(LATEST_LISTED_ENTRY_TIMESTAMP_KEY)) Optional.ofNullable(stateMap.get(LATEST_LISTED_ENTRY_TIMESTAMP_KEY))
.map(Long::parseLong) .map(Long::parseLong)
.ifPresent(lastTimestamp -> this.lastListedLatestEntryTimestampMillis = lastTimestamp); .ifPresent(lastTimestamp -> lastListedLatestEntryTimestampMillis = lastTimestamp);
justElectedPrimaryNode = false; justElectedPrimaryNode = false;
} catch (final IOException ioe) { } catch (final IOException ioe) {
@ -531,14 +606,14 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
} }
} }
long lowerBoundInclusiveTimestamp = Optional.ofNullable(this.lastListedLatestEntryTimestampMillis).orElse(0L); long lowerBoundInclusiveTimestamp = Optional.ofNullable(lastListedLatestEntryTimestampMillis).orElse(IGNORE_MIN_TIMESTAMP_VALUE);
long upperBoundExclusiveTimestamp; long upperBoundExclusiveTimestamp;
long currentTime = getCurrentTime(); long currentTime = getCurrentTime();
final TreeMap<Long, List<T>> orderedEntries = new TreeMap<>(); final TreeMap<Long, List<T>> orderedEntries = new TreeMap<>();
try { try {
List<T> entityList = performListing(context, lowerBoundInclusiveTimestamp); List<T> entityList = performListing(context, lowerBoundInclusiveTimestamp, ListingMode.EXECUTION);
boolean targetSystemHasMilliseconds = false; boolean targetSystemHasMilliseconds = false;
boolean targetSystemHasSeconds = false; boolean targetSystemHasSeconds = false;
@ -560,7 +635,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
} }
final TimeUnit targetSystemTimePrecision final TimeUnit targetSystemTimePrecision
= PRECISION_AUTO_DETECT.getValue().equals(specifiedPrecision) = PRECISION_AUTO_DETECT.getValue().equals(specifiedPrecision)
? targetSystemHasMilliseconds ? TimeUnit.MILLISECONDS : targetSystemHasSeconds ? TimeUnit.SECONDS : TimeUnit.MINUTES ? targetSystemHasMilliseconds ? TimeUnit.MILLISECONDS : targetSystemHasSeconds ? TimeUnit.SECONDS : TimeUnit.MINUTES
: PRECISION_MILLIS.getValue().equals(specifiedPrecision) ? TimeUnit.MILLISECONDS : PRECISION_MILLIS.getValue().equals(specifiedPrecision) ? TimeUnit.MILLISECONDS
: PRECISION_SECONDS.getValue().equals(specifiedPrecision) ? TimeUnit.SECONDS : TimeUnit.MINUTES; : PRECISION_SECONDS.getValue().equals(specifiedPrecision) ? TimeUnit.SECONDS : TimeUnit.MINUTES;
final Long listingLagMillis = LISTING_LAG_MILLIS.get(targetSystemTimePrecision); final Long listingLagMillis = LISTING_LAG_MILLIS.get(targetSystemTimePrecision);
@ -572,19 +647,19 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
getLogger().trace("entityList: " + entityList.stream().map(entity -> entity.getName() + "_" + entity.getTimestamp()).collect(Collectors.joining(", "))); getLogger().trace("entityList: " + entityList.stream().map(entity -> entity.getName() + "_" + entity.getTimestamp()).collect(Collectors.joining(", ")));
} }
entityList entityList
.stream() .stream()
.filter(entity -> entity.getTimestamp() >= lowerBoundInclusiveTimestamp) .filter(entity -> entity.getTimestamp() >= lowerBoundInclusiveTimestamp)
.filter(entity -> entity.getTimestamp() < upperBoundExclusiveTimestamp) .filter(entity -> entity.getTimestamp() < upperBoundExclusiveTimestamp)
.forEach(entity -> orderedEntries .forEach(entity -> orderedEntries
.computeIfAbsent(entity.getTimestamp(), __ -> new ArrayList<>()) .computeIfAbsent(entity.getTimestamp(), __ -> new ArrayList<>())
.add(entity) .add(entity)
); );
if (getLogger().isTraceEnabled()) { if (getLogger().isTraceEnabled()) {
getLogger().trace("orderedEntries: " + getLogger().trace("orderedEntries: " +
orderedEntries.values().stream() orderedEntries.values().stream()
.flatMap(List::stream) .flatMap(List::stream)
.map(entity -> entity.getName() + "_" + entity.getTimestamp()) .map(entity -> entity.getName() + "_" + entity.getTimestamp())
.collect(Collectors.joining(", ")) .collect(Collectors.joining(", "))
); );
} }
} catch (final IOException e) { } catch (final IOException e) {
@ -614,31 +689,27 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
try { try {
if (getLogger().isTraceEnabled()) { if (getLogger().isTraceEnabled()) {
getLogger().info("this.lastListedLatestEntryTimestampMillis = upperBoundExclusiveTimestamp: " + this.lastListedLatestEntryTimestampMillis + " = " + upperBoundExclusiveTimestamp); getLogger().info("this.lastListedLatestEntryTimestampMillis = upperBoundExclusiveTimestamp: " + lastListedLatestEntryTimestampMillis + " = " + upperBoundExclusiveTimestamp);
} }
this.lastListedLatestEntryTimestampMillis = upperBoundExclusiveTimestamp; lastListedLatestEntryTimestampMillis = upperBoundExclusiveTimestamp;
persist(upperBoundExclusiveTimestamp, upperBoundExclusiveTimestamp, latestIdentifiersProcessed, session, getStateScope(context)); persist(upperBoundExclusiveTimestamp, upperBoundExclusiveTimestamp, latestIdentifiersProcessed, session, getStateScope(context));
} catch (final IOException ioe) { } catch (final IOException ioe) {
getLogger().warn("Unable to save state due to {}. If NiFi is restarted before state is saved, or " getLogger().warn("Unable to save state due to {}. If NiFi is restarted before state is saved, or "
+ "if another node begins executing this Processor, data duplication may occur.", ioe); + "if another node begins executing this Processor, data duplication may occur.", ioe);
} }
} }
protected long getCurrentTime() {
return System.currentTimeMillis();
}
public void listByTrackingTimestamps(final ProcessContext context, final ProcessSession session) throws ProcessException { public void listByTrackingTimestamps(final ProcessContext context, final ProcessSession session) throws ProcessException {
Long minTimestampToListMillis = lastListedLatestEntryTimestampMillis; Long minTimestampToListMillis = lastListedLatestEntryTimestampMillis;
if (this.lastListedLatestEntryTimestampMillis == null || this.lastProcessedLatestEntryTimestampMillis == null || justElectedPrimaryNode) { if (lastListedLatestEntryTimestampMillis == null || lastProcessedLatestEntryTimestampMillis == null || justElectedPrimaryNode) {
try { try {
boolean noUpdateRequired = false; boolean noUpdateRequired = false;
// Attempt to retrieve state from the state manager if a last listing was not yet established or // Attempt to retrieve state from the state manager if a last listing was not yet established or
// if just elected the primary node // if just elected the primary node
final StateMap stateMap = session.getState(getStateScope(context)); final StateMap stateMap = session.getState(getStateScope(context));
latestIdentifiersProcessed.clear(); latestIdentifiersProcessed.clear();
for (Map.Entry<String, String> state : stateMap.toMap().entrySet()) { for (final Map.Entry<String, String> state : stateMap.toMap().entrySet()) {
final String k = state.getKey(); final String k = state.getKey();
final String v = state.getValue(); final String v = state.getValue();
if (v == null || v.isEmpty()) { if (v == null || v.isEmpty()) {
@ -648,13 +719,13 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
if (LATEST_LISTED_ENTRY_TIMESTAMP_KEY.equals(k)) { if (LATEST_LISTED_ENTRY_TIMESTAMP_KEY.equals(k)) {
minTimestampToListMillis = Long.parseLong(v); minTimestampToListMillis = Long.parseLong(v);
// If our determined timestamp is the same as that of our last listing, skip this execution as there are no updates // If our determined timestamp is the same as that of our last listing, skip this execution as there are no updates
if (minTimestampToListMillis.equals(this.lastListedLatestEntryTimestampMillis)) { if (minTimestampToListMillis.equals(lastListedLatestEntryTimestampMillis)) {
noUpdateRequired = true; noUpdateRequired = true;
} else { } else {
this.lastListedLatestEntryTimestampMillis = minTimestampToListMillis; lastListedLatestEntryTimestampMillis = minTimestampToListMillis;
} }
} else if (LAST_PROCESSED_LATEST_ENTRY_TIMESTAMP_KEY.equals(k)) { } else if (LAST_PROCESSED_LATEST_ENTRY_TIMESTAMP_KEY.equals(k)) {
this.lastProcessedLatestEntryTimestampMillis = Long.parseLong(v); lastProcessedLatestEntryTimestampMillis = Long.parseLong(v);
} else if (k.startsWith(IDENTIFIER_PREFIX)) { } else if (k.startsWith(IDENTIFIER_PREFIX)) {
latestIdentifiersProcessed.add(v); latestIdentifiersProcessed.add(v);
} }
@ -676,7 +747,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
final long currentRunTimeMillis = System.currentTimeMillis(); final long currentRunTimeMillis = System.currentTimeMillis();
try { try {
// track of when this last executed for consideration of the lag nanos // track of when this last executed for consideration of the lag nanos
entityList = performListing(context, minTimestampToListMillis); entityList = performListing(context, minTimestampToListMillis, ListingMode.EXECUTION);
} catch (final IOException e) { } catch (final IOException e) {
getLogger().error("Failed to perform listing on remote host due to {}", new Object[]{e.getMessage()}, e); getLogger().error("Failed to perform listing on remote host due to {}", new Object[]{e.getMessage()}, e);
context.yield(); context.yield();
@ -728,7 +799,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
} }
final TimeUnit targetSystemTimePrecision final TimeUnit targetSystemTimePrecision
= PRECISION_AUTO_DETECT.getValue().equals(specifiedPrecision) = PRECISION_AUTO_DETECT.getValue().equals(specifiedPrecision)
? targetSystemHasMilliseconds ? TimeUnit.MILLISECONDS : targetSystemHasSeconds ? TimeUnit.SECONDS : TimeUnit.MINUTES ? targetSystemHasMilliseconds ? TimeUnit.MILLISECONDS : targetSystemHasSeconds ? TimeUnit.SECONDS : TimeUnit.MINUTES
: PRECISION_MILLIS.getValue().equals(specifiedPrecision) ? TimeUnit.MILLISECONDS : PRECISION_MILLIS.getValue().equals(specifiedPrecision) ? TimeUnit.MILLISECONDS
: PRECISION_SECONDS.getValue().equals(specifiedPrecision) ? TimeUnit.SECONDS : TimeUnit.MINUTES; : PRECISION_SECONDS.getValue().equals(specifiedPrecision) ? TimeUnit.SECONDS : TimeUnit.MINUTES;
final Long listingLagMillis = LISTING_LAG_MILLIS.get(targetSystemTimePrecision); final Long listingLagMillis = LISTING_LAG_MILLIS.get(targetSystemTimePrecision);
@ -743,8 +814,8 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
final long listingLagNanos = TimeUnit.MILLISECONDS.toNanos(listingLagMillis); final long listingLagNanos = TimeUnit.MILLISECONDS.toNanos(listingLagMillis);
if (currentRunTimeNanos - lastRunTimeNanos < listingLagNanos if (currentRunTimeNanos - lastRunTimeNanos < listingLagNanos
|| (latestListedEntryTimestampThisCycleMillis.equals(lastProcessedLatestEntryTimestampMillis) || (latestListedEntryTimestampThisCycleMillis.equals(lastProcessedLatestEntryTimestampMillis)
&& orderedEntries.get(latestListedEntryTimestampThisCycleMillis).stream() && orderedEntries.get(latestListedEntryTimestampThisCycleMillis).stream()
.allMatch(entity -> latestIdentifiersProcessed.contains(entity.getIdentifier())))) { .allMatch(entity -> latestIdentifiersProcessed.contains(entity.getIdentifier())))) {
context.yield(); context.yield();
return; return;
} }
@ -778,7 +849,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
// As long as we have a listing timestamp, there is meaningful state to capture regardless of any outputs generated // As long as we have a listing timestamp, there is meaningful state to capture regardless of any outputs generated
if (latestListedEntryTimestampThisCycleMillis != null) { if (latestListedEntryTimestampThisCycleMillis != null) {
boolean processedNewFiles = entitiesListed > 0; final boolean processedNewFiles = entitiesListed > 0;
if (!latestListedEntryTimestampThisCycleMillis.equals(lastListedLatestEntryTimestampMillis) || processedNewFiles) { if (!latestListedEntryTimestampThisCycleMillis.equals(lastListedLatestEntryTimestampMillis) || processedNewFiles) {
// We have performed a listing and pushed any FlowFiles out that may have been generated // We have performed a listing and pushed any FlowFiles out that may have been generated
@ -794,7 +865,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
persist(latestListedEntryTimestampThisCycleMillis, lastProcessedLatestEntryTimestampMillis, latestIdentifiersProcessed, session, getStateScope(context)); persist(latestListedEntryTimestampThisCycleMillis, lastProcessedLatestEntryTimestampMillis, latestIdentifiersProcessed, session, getStateScope(context));
} catch (final IOException ioe) { } catch (final IOException ioe) {
getLogger().warn("Unable to save state due to {}. If NiFi is restarted before state is saved, or " getLogger().warn("Unable to save state due to {}. If NiFi is restarted before state is saved, or "
+ "if another node begins executing this Processor, data duplication may occur.", ioe); + "if another node begins executing this Processor, data duplication may occur.", ioe);
} }
} }
@ -834,17 +905,17 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
final WriteResult writeResult; final WriteResult writeResult;
try (final OutputStream out = session.write(flowFile); try (final OutputStream out = session.write(flowFile);
final RecordSetWriter recordSetWriter = writerFactory.createWriter(getLogger(), getRecordSchema(), out, Collections.emptyMap())) { final RecordSetWriter recordSetWriter = writerFactory.createWriter(getLogger(), getRecordSchema(), out, Collections.emptyMap())) {
recordSetWriter.beginRecordSet(); recordSetWriter.beginRecordSet();
for (Map.Entry<Long, List<T>> timestampEntities : orderedEntries.entrySet()) { for (final Map.Entry<Long, List<T>> timestampEntities : orderedEntries.entrySet()) {
List<T> entities = timestampEntities.getValue(); List<T> entities = timestampEntities.getValue();
if (timestampEntities.getKey().equals(lastProcessedLatestEntryTimestampMillis)) { if (timestampEntities.getKey().equals(lastProcessedLatestEntryTimestampMillis)) {
// Filter out previously processed entities. // Filter out previously processed entities.
entities = entities.stream().filter(entity -> !latestIdentifiersProcessed.contains(entity.getIdentifier())).collect(Collectors.toList()); entities = entities.stream().filter(entity -> !latestIdentifiersProcessed.contains(entity.getIdentifier())).collect(Collectors.toList());
} }
for (T entity : entities) { for (final T entity : entities) {
entitiesListed++; entitiesListed++;
recordSetWriter.write(entity.toRecord()); recordSetWriter.write(entity.toRecord());
} }
@ -868,14 +939,14 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
private int createFlowFilesForEntities(final ProcessContext context, final ProcessSession session, final Map<Long, List<T>> orderedEntries) { private int createFlowFilesForEntities(final ProcessContext context, final ProcessSession session, final Map<Long, List<T>> orderedEntries) {
int entitiesListed = 0; int entitiesListed = 0;
for (Map.Entry<Long, List<T>> timestampEntities : orderedEntries.entrySet()) { for (final Map.Entry<Long, List<T>> timestampEntities : orderedEntries.entrySet()) {
List<T> entities = timestampEntities.getValue(); List<T> entities = timestampEntities.getValue();
if (timestampEntities.getKey().equals(lastProcessedLatestEntryTimestampMillis)) { if (timestampEntities.getKey().equals(lastProcessedLatestEntryTimestampMillis)) {
// Filter out previously processed entities. // Filter out previously processed entities.
entities = entities.stream().filter(entity -> !latestIdentifiersProcessed.contains(entity.getIdentifier())).collect(Collectors.toList()); entities = entities.stream().filter(entity -> !latestIdentifiersProcessed.contains(entity.getIdentifier())).collect(Collectors.toList());
} }
for (T entity : entities) { for (final T entity : entities) {
entitiesListed++; entitiesListed++;
// Create the FlowFile for this path. // Create the FlowFile for this path.
@ -894,6 +965,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
* So that it use return different precisions than PRECISION_AUTO_DETECT. * So that it use return different precisions than PRECISION_AUTO_DETECT.
* If TARGET_SYSTEM_TIMESTAMP_PRECISION is supported as a valid Processor property, * If TARGET_SYSTEM_TIMESTAMP_PRECISION is supported as a valid Processor property,
* then PRECISION_AUTO_DETECT will be the default value when not specified by a user. * then PRECISION_AUTO_DETECT will be the default value when not specified by a user.
*
* @return * @return
*/ */
protected String getDefaultTimePrecision() { protected String getDefaultTimePrecision() {
@ -936,11 +1008,13 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
* will be filtered out by the Processor. Therefore, it is not necessary that implementations perform this filtering but can be more efficient * will be filtered out by the Processor. Therefore, it is not necessary that implementations perform this filtering but can be more efficient
* if the filtering can be performed on the server side prior to retrieving the information. * if the filtering can be performed on the server side prior to retrieving the information.
* *
* @param context the ProcessContex to use in order to pull the appropriate entities * @param context the ProcessContext to use in order to pull the appropriate entities
* @param minTimestamp the minimum timestamp of entities that should be returned. * @param minTimestamp the minimum timestamp of entities that should be returned
* @param listingMode the listing mode, indicating whether the listing is being performed during configuration verification or normal processor execution
* @return a Listing of entities that have a timestamp >= minTimestamp * @return a Listing of entities that have a timestamp >= minTimestamp
*/ */
protected abstract List<T> performListing(final ProcessContext context, final Long minTimestamp) throws IOException; protected abstract List<T> performListing(final ProcessContext context, final Long minTimestamp, final ListingMode listingMode)
throws IOException;
/** /**
* Determines whether or not the listing must be reset if the value of the given property is changed * Determines whether or not the listing must be reset if the value of the given property is changed
@ -963,7 +1037,25 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
*/ */
protected abstract RecordSchema getRecordSchema(); protected abstract RecordSchema getRecordSchema();
/**
* Performs an unfiltered listing and returns the count, or null if this operation is not supported.
*
* @param context the ProcessContext to use in order to pull the appropriate entities
* @return The number of unfiltered entities in the listing, or null if this processor does not support an unfiltered listing
*/
protected abstract Integer countUnfilteredListing(final ProcessContext context)
throws IOException;
/**
* Provides a human-readable name for the container being listed, for the purpose of displaying readable verification messages during processor configuration verification.
*
* @param context The process context
* @return The user-friendly name for the container
*/
protected abstract String getListingContainerName(final ProcessContext context);
private static class StringSerDe implements Serializer<String>, Deserializer<String> { private static class StringSerDe implements Serializer<String>, Deserializer<String> {
@Override @Override
public String deserialize(final byte[] value) throws DeserializationException, IOException { public String deserialize(final byte[] value) throws DeserializationException, IOException {
if (value == null) { if (value == null) {
@ -972,11 +1064,11 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
return new String(value, StandardCharsets.UTF_8); return new String(value, StandardCharsets.UTF_8);
} }
@Override @Override
public void serialize(final String value, final OutputStream out) throws SerializationException, IOException { public void serialize(final String value, final OutputStream out) throws SerializationException, IOException {
out.write(value.getBytes(StandardCharsets.UTF_8)); out.write(value.getBytes(StandardCharsets.UTF_8));
} }
} }
@OnScheduled @OnScheduled
@ -1007,7 +1099,7 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
private void listByTrackingEntities(ProcessContext context, ProcessSession session) throws ProcessException { private void listByTrackingEntities(ProcessContext context, ProcessSession session) throws ProcessException {
listedEntityTracker.trackEntities(context, session, justElectedPrimaryNode, getStateScope(context), minTimestampToList -> { listedEntityTracker.trackEntities(context, session, justElectedPrimaryNode, getStateScope(context), minTimestampToList -> {
try { try {
return performListing(context, minTimestampToList); return performListing(context, minTimestampToList, ListingMode.EXECUTION);
} catch (final IOException e) { } catch (final IOException e) {
getLogger().error("Failed to perform listing on remote host due to {}", new Object[]{e.getMessage()}, e); getLogger().error("Failed to perform listing on remote host due to {}", new Object[]{e.getMessage()}, e);
return Collections.emptyList(); return Collections.emptyList();
@ -1015,5 +1107,4 @@ public abstract class AbstractListProcessor<T extends ListableEntity> extends Ab
}, entity -> createAttributes(entity, context)); }, entity -> createAttributes(entity, context));
justElectedPrimaryNode = false; justElectedPrimaryNode = false;
} }
} }

View File

@ -257,7 +257,7 @@ public class ListedEntityTracker<T extends ListableEntity> {
} else { } else {
this.alreadyListedEntities = new ConcurrentHashMap<>(fetchedListedEntities); this.alreadyListedEntities = new ConcurrentHashMap<>(fetchedListedEntities);
} }
} catch (IOException e) { } catch (final IOException e) {
throw new ProcessException("Failed to restore already-listed entities due to " + e, e); throw new ProcessException("Failed to restore already-listed entities due to " + e, e);
} }
} }

View File

@ -17,6 +17,7 @@
package org.apache.nifi.processor.util.list; package org.apache.nifi.processor.util.list;
import org.apache.nifi.annotation.notification.PrimaryNodeState; import org.apache.nifi.annotation.notification.PrimaryNodeState;
import org.apache.nifi.components.ConfigVerificationResult;
import org.apache.nifi.components.state.Scope; import org.apache.nifi.components.state.Scope;
import org.apache.nifi.components.state.StateMap; import org.apache.nifi.components.state.StateMap;
import org.apache.nifi.flowfile.FlowFile; import org.apache.nifi.flowfile.FlowFile;
@ -30,7 +31,9 @@ import org.junit.rules.TemporaryFolder;
import org.junit.rules.TestWatcher; import org.junit.rules.TestWatcher;
import java.io.IOException; import java.io.IOException;
import java.util.Collections;
import java.util.HashMap; import java.util.HashMap;
import java.util.List;
import java.util.Map; import java.util.Map;
import java.util.concurrent.TimeUnit; import java.util.concurrent.TimeUnit;
import java.util.stream.Collectors; import java.util.stream.Collectors;
@ -225,6 +228,10 @@ public class ITAbstractListProcessor {
runner.run(); runner.run();
runner.assertAllFlowFilesTransferred(ConcreteListProcessor.REL_SUCCESS, 1); runner.assertAllFlowFilesTransferred(ConcreteListProcessor.REL_SUCCESS, 1);
runner.clearTransferState(); runner.clearTransferState();
final List<ConfigVerificationResult> results = proc.verify(runner.getProcessContext(), runner.getLogger(), Collections.emptyMap());
assertEquals(1, results.size());
assertEquals(ConfigVerificationResult.Outcome.SUCCESSFUL, results.get(0).getOutcome());
} }
private void setTargetSystemTimestampPrecision(TimeUnit targetPrecision) { private void setTargetSystemTimestampPrecision(TimeUnit targetPrecision) {

View File

@ -17,7 +17,10 @@
package org.apache.nifi.processor.util.list; package org.apache.nifi.processor.util.list;
import org.apache.nifi.components.ConfigVerificationResult;
import org.apache.nifi.components.ConfigVerificationResult.Outcome;
import org.apache.nifi.components.PropertyDescriptor; import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.components.PropertyValue;
import org.apache.nifi.components.Validator; import org.apache.nifi.components.Validator;
import org.apache.nifi.components.state.Scope; import org.apache.nifi.components.state.Scope;
import org.apache.nifi.components.state.StateManager; import org.apache.nifi.components.state.StateManager;
@ -30,6 +33,7 @@ import org.apache.nifi.flowfile.FlowFile;
import org.apache.nifi.flowfile.attributes.CoreAttributes; import org.apache.nifi.flowfile.attributes.CoreAttributes;
import org.apache.nifi.processor.ProcessContext; import org.apache.nifi.processor.ProcessContext;
import org.apache.nifi.processor.ProcessSession; import org.apache.nifi.processor.ProcessSession;
import org.apache.nifi.processor.util.StandardValidators;
import org.apache.nifi.reporting.InitializationException; import org.apache.nifi.reporting.InitializationException;
import org.apache.nifi.serialization.RecordSetWriterFactory; import org.apache.nifi.serialization.RecordSetWriterFactory;
import org.apache.nifi.serialization.SimpleRecordSchema; import org.apache.nifi.serialization.SimpleRecordSchema;
@ -43,6 +47,7 @@ import org.apache.nifi.state.MockStateManager;
import org.apache.nifi.util.MockFlowFile; import org.apache.nifi.util.MockFlowFile;
import org.apache.nifi.util.TestRunner; import org.apache.nifi.util.TestRunner;
import org.apache.nifi.util.TestRunners; import org.apache.nifi.util.TestRunners;
import org.glassfish.jersey.internal.guava.Predicates;
import org.junit.Assert; import org.junit.Assert;
import org.junit.Before; import org.junit.Before;
import org.junit.Rule; import org.junit.Rule;
@ -55,6 +60,7 @@ import java.io.FileOutputStream;
import java.io.IOException; import java.io.IOException;
import java.nio.charset.StandardCharsets; import java.nio.charset.StandardCharsets;
import java.util.ArrayList; import java.util.ArrayList;
import java.util.Collections;
import java.util.Comparator; import java.util.Comparator;
import java.util.HashMap; import java.util.HashMap;
import java.util.List; import java.util.List;
@ -62,11 +68,13 @@ import java.util.Map;
import java.util.UUID; import java.util.UUID;
import java.util.concurrent.TimeUnit; import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicReference; import java.util.concurrent.atomic.AtomicReference;
import java.util.function.Predicate;
import java.util.regex.Matcher; import java.util.regex.Matcher;
import java.util.regex.Pattern; import java.util.regex.Pattern;
import java.util.stream.Collectors; import java.util.stream.Collectors;
import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertTrue;
public class TestAbstractListProcessor { public class TestAbstractListProcessor {
@ -224,9 +232,12 @@ public class TestAbstractListProcessor {
proc.addEntity("one","firstFile",1585344381476L); proc.addEntity("one","firstFile",1585344381476L);
proc.addEntity("two","secondFile",1585344381475L); proc.addEntity("two","secondFile",1585344381475L);
assertVerificationOutcome(Outcome.SUCCESSFUL, ".* Found 2 objects. Of those, 2 match the filter.");
runner.run(); runner.run();
assertEquals(2, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size()); assertEquals(2, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size());
assertEquals(2, proc.entities.size()); assertEquals(2, proc.entities.size());
assertVerificationOutcome(Outcome.SUCCESSFUL, ".* Found 2 objects. Of those, 2 match the filter.");
final MockStateManager stateManager = runner.getStateManager(); final MockStateManager stateManager = runner.getStateManager();
final Map<String, String> expectedState = new HashMap<>(); final Map<String, String> expectedState = new HashMap<>();
@ -252,14 +263,16 @@ public class TestAbstractListProcessor {
// Clear any listed entities after choose No Tracking Strategy // Clear any listed entities after choose No Tracking Strategy
proc.entities.clear(); proc.entities.clear();
assertVerificationOutcome(Outcome.SUCCESSFUL, ".* Found no objects.");
// Add new entity // Add new entity
proc.addEntity("one","firstFile",1585344381476L); proc.addEntity("one","firstFile",1585344381476L);
proc.listByNoTracking(context, session); proc.listByTrackingTimestamps(context, session);
// Test if state cleared or not // Test if state cleared or not
runner.getStateManager().assertStateNotEquals(expectedState, Scope.CLUSTER); runner.getStateManager().assertStateNotEquals(expectedState, Scope.CLUSTER);
assertEquals(1, proc.entities.size()); assertEquals(1, proc.entities.size());
assertVerificationOutcome(Outcome.SUCCESSFUL, ".* Found 1 object. Of that, 1 matches the filter.");
} }
@Test @Test
@ -285,14 +298,22 @@ public class TestAbstractListProcessor {
proc.addEntity("one", "one", 1, 1); proc.addEntity("one", "one", 1, 1);
proc.currentTimestamp.set(1L); proc.currentTimestamp.set(1L);
runner.clearTransferState(); runner.clearTransferState();
// Prior to running the processor, we should expect 3 objects during verification
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 1 object. Of that, 1 matches the filter.");
runner.run(); runner.run();
assertEquals(1, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size()); assertEquals(1, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size());
runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0) runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0)
.assertAttributeEquals(CoreAttributes.FILENAME.key(), "one"); .assertAttributeEquals(CoreAttributes.FILENAME.key(), "one");
// The object is now tracked, so it's no longer considered new
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 1 object. Of that, 1 matches the filter.");
// Should not list any entity. // Should not list any entity.
proc.currentTimestamp.set(2L); proc.currentTimestamp.set(2L);
runner.clearTransferState(); runner.clearTransferState();
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 1 object. Of that, 1 matches the filter.");
runner.run(); runner.run();
assertEquals(0, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size()); assertEquals(0, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size());
@ -301,6 +322,8 @@ public class TestAbstractListProcessor {
proc.addEntity("five", "five", 5, 5); proc.addEntity("five", "five", 5, 5);
proc.addEntity("six", "six", 6, 6); proc.addEntity("six", "six", 6, 6);
runner.clearTransferState(); runner.clearTransferState();
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 3 objects. Of those, 3 match the filter.");
runner.run(); runner.run();
assertEquals(2, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size()); assertEquals(2, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size());
runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0) runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0)
@ -316,6 +339,8 @@ public class TestAbstractListProcessor {
proc.addEntity("three", "three", 3, 3); proc.addEntity("three", "three", 3, 3);
proc.addEntity("four", "four", 4, 4); proc.addEntity("four", "four", 4, 4);
runner.clearTransferState(); runner.clearTransferState();
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 6 objects. Of those, 6 match the filter.");
runner.run(); runner.run();
assertEquals(2, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size()); assertEquals(2, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size());
runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0) runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0)
@ -329,6 +354,8 @@ public class TestAbstractListProcessor {
proc.addEntity("five", "five", 7, 5); proc.addEntity("five", "five", 7, 5);
proc.addEntity("six", "six", 6, 16); proc.addEntity("six", "six", 6, 16);
runner.clearTransferState(); runner.clearTransferState();
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 6 objects. Of those, 6 match the filter.");
runner.run(); runner.run();
assertEquals(2, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size()); assertEquals(2, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size());
runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0) runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0)
@ -344,7 +371,12 @@ public class TestAbstractListProcessor {
runner.setProperty(ConcreteListProcessor.RESET_STATE, "1"); runner.setProperty(ConcreteListProcessor.RESET_STATE, "1");
runner.setProperty(ListedEntityTracker.INITIAL_LISTING_TARGET, "window"); runner.setProperty(ListedEntityTracker.INITIAL_LISTING_TARGET, "window");
runner.clearTransferState(); runner.clearTransferState();
// Prior to running the processor, we should expect 3 objects during verification
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 6 objects. Of those, 6 match the filter.");
runner.run(); runner.run();
assertEquals(3, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size()); assertEquals(3, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size());
runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0) runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(0)
.assertAttributeEquals(CoreAttributes.FILENAME.key(), "four"); .assertAttributeEquals(CoreAttributes.FILENAME.key(), "four");
@ -353,16 +385,44 @@ public class TestAbstractListProcessor {
runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(2) runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).get(2)
.assertAttributeEquals(CoreAttributes.FILENAME.key(), "five"); .assertAttributeEquals(CoreAttributes.FILENAME.key(), "five");
// Reset state again. // Reset state again.
proc.currentTimestamp.set(20L); proc.currentTimestamp.set(20L);
// ConcreteListProcessor can reset state with any property. // ConcreteListProcessor can reset state with any property.
runner.setProperty(ListedEntityTracker.INITIAL_LISTING_TARGET, "all"); runner.setProperty(ListedEntityTracker.INITIAL_LISTING_TARGET, "all");
runner.setProperty(ConcreteListProcessor.RESET_STATE, "2"); runner.setProperty(ConcreteListProcessor.RESET_STATE, "2");
runner.clearTransferState(); runner.clearTransferState();
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 6 objects. Of those, 6 match the filter.");
runner.run(); runner.run();
// All entities should be picked, one to six. // All entities should be picked, one to six.
assertEquals(6, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size()); assertEquals(6, runner.getFlowFilesForRelationship(AbstractListProcessor.REL_SUCCESS).size());
// Now all are tracked, so none are new
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 6 objects. Of those, 6 match the filter.");
// Reset state again.
proc.currentTimestamp.set(25L);
runner.setProperty(ListedEntityTracker.INITIAL_LISTING_TARGET, "window");
runner.setProperty(ListedEntityTracker.TRACKING_TIME_WINDOW, "20ms");
runner.setProperty(ConcreteListProcessor.LISTING_FILTER, "f[a-z]+"); // Match only four and five
runner.setProperty(ConcreteListProcessor.RESET_STATE, "3");
runner.clearTransferState();
// Time window is now 5ms - 25ms, so only 5 and 6 fall in the window, so only 1 of the 2 filtered entities are considered 'new'
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed contents of .*.json.*" +
"Found 6 objects. Of those, 2 match the filter.");
}
private void assertVerificationOutcome(final Outcome expectedOutcome, final String expectedExplanationRegex) {
final List<ConfigVerificationResult> results = proc.verify(runner.getProcessContext(), runner.getLogger(), Collections.emptyMap());
assertEquals(1, results.size());
final ConfigVerificationResult result = results.get(0);
assertEquals(expectedOutcome, result.getOutcome());
assertTrue(String.format("Expected verification result to match pattern [%s]. Actual explanation was: %s", expectedExplanationRegex, result.getExplanation()),
result.getExplanation().matches(expectedExplanationRegex));
} }
static class DistributedCache extends AbstractControllerService implements DistributedMapCacheClient { static class DistributedCache extends AbstractControllerService implements DistributedMapCacheClient {
@ -434,6 +494,12 @@ public class TestAbstractListProcessor {
.name("reset-state") .name("reset-state")
.addValidator(Validator.VALID) .addValidator(Validator.VALID)
.build(); .build();
private static final PropertyDescriptor LISTING_FILTER = new PropertyDescriptor.Builder()
.name("listing-filter")
.displayName("Listing Filter")
.description("Filters listed entities by name.")
.addValidator(StandardValidators.REGULAR_EXPRESSION_VALIDATOR)
.build();
final AtomicReference<Long> currentTimestamp = new AtomicReference<>(); final AtomicReference<Long> currentTimestamp = new AtomicReference<>();
@ -453,6 +519,7 @@ public class TestAbstractListProcessor {
properties.add(ListedEntityTracker.TRACKING_TIME_WINDOW); properties.add(ListedEntityTracker.TRACKING_TIME_WINDOW);
properties.add(ListedEntityTracker.INITIAL_LISTING_TARGET); properties.add(ListedEntityTracker.INITIAL_LISTING_TARGET);
properties.add(RESET_STATE); properties.add(RESET_STATE);
properties.add(LISTING_FILTER);
return properties; return properties;
} }
@ -514,8 +581,17 @@ public class TestAbstractListProcessor {
} }
@Override @Override
protected List<ListableEntity> performListing(final ProcessContext context, final Long minTimestamp) throws IOException { protected List<ListableEntity> performListing(final ProcessContext context, final Long minTimestamp, ListingMode listingMode) throws IOException {
return getEntityList(); final PropertyValue listingFilter = context.getProperty(LISTING_FILTER);
Predicate<ListableEntity> filter = listingFilter.isSet()
? entity -> entity.getName().matches(listingFilter.getValue())
: Predicates.alwaysTrue();
return getEntityList().stream().filter(filter).collect(Collectors.toList());
}
@Override
protected Integer countUnfilteredListing(final ProcessContext context) throws IOException {
return entities.size();
} }
List<ListableEntity> getEntityList() { List<ListableEntity> getEntityList() {
@ -527,6 +603,11 @@ public class TestAbstractListProcessor {
return RESET_STATE.equals(property); return RESET_STATE.equals(property);
} }
@Override
protected String getListingContainerName(final ProcessContext context) {
return persistenceFilename;
}
@Override @Override
protected Scope getStateScope(final PropertyContext context) { protected Scope getStateScope(final PropertyContext context) {
return Scope.CLUSTER; return Scope.CLUSTER;

View File

@ -296,7 +296,7 @@ public abstract class GetFileTransfer extends AbstractProcessor {
} }
final StopWatch stopWatch = new StopWatch(true); final StopWatch stopWatch = new StopWatch(true);
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
final long millis = stopWatch.getElapsed(TimeUnit.MILLISECONDS); final long millis = stopWatch.getElapsed(TimeUnit.MILLISECONDS);
int newItems = 0; int newItems = 0;

View File

@ -126,4 +126,5 @@ public class ListFTP extends ListFileTransfer {
protected void customValidate(ValidationContext validationContext, Collection<ValidationResult> results) { protected void customValidate(ValidationContext validationContext, Collection<ValidationResult> results) {
FTPTransfer.validateProxySpec(validationContext, results); FTPTransfer.validateProxySpec(validationContext, results);
} }
} }

View File

@ -338,7 +338,6 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
@OnScheduled @OnScheduled
public void onScheduled(final ProcessContext context) { public void onScheduled(final ProcessContext context) {
fileFilterRef.set(createFileFilter(context));
includeFileAttributes = context.getProperty(INCLUDE_FILE_ATTRIBUTES).asBoolean(); includeFileAttributes = context.getProperty(INCLUDE_FILE_ATTRIBUTES).asBoolean();
final long maxDiskOperationMillis = context.getProperty(MAX_DISK_OPERATION_TIME).evaluateAttributeExpressions().asTimePeriod(TimeUnit.MILLISECONDS); final long maxDiskOperationMillis = context.getProperty(MAX_DISK_OPERATION_TIME).evaluateAttributeExpressions().asTimePeriod(TimeUnit.MILLISECONDS);
@ -351,6 +350,7 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
} else { } else {
performanceTracker = new UntrackedPerformanceTracker(getLogger(), maxDiskOperationMillis); performanceTracker = new UntrackedPerformanceTracker(getLogger(), maxDiskOperationMillis);
} }
fileFilterRef.set(createFileFilter(context, performanceTracker, true));
final long millisToKeepStats = TimeUnit.MINUTES.toMillis(15); final long millisToKeepStats = TimeUnit.MINUTES.toMillis(15);
final MonitorActiveTasks monitorTask = new MonitorActiveTasks(performanceTracker, getLogger(), maxDiskOperationMillis, maxListingMillis, millisToKeepStats); final MonitorActiveTasks monitorTask = new MonitorActiveTasks(performanceTracker, getLogger(), maxDiskOperationMillis, maxListingMillis, millisToKeepStats);
@ -502,12 +502,31 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
} }
@Override @Override
protected List<FileInfo> performListing(final ProcessContext context, final Long minTimestamp) throws IOException { protected Integer countUnfilteredListing(final ProcessContext context) throws IOException {
return performListing(context, 0L, ListingMode.CONFIGURATION_VERIFICATION, false).size();
}
@Override
protected List<FileInfo> performListing(final ProcessContext context, final Long minTimestamp, final ListingMode listingMode)
throws IOException {
return performListing(context, minTimestamp, listingMode, true);
}
private List<FileInfo> performListing(final ProcessContext context, final Long minTimestamp, final ListingMode listingMode, final boolean applyFilters)
throws IOException {
final Path basePath = new File(getPath(context)).toPath(); final Path basePath = new File(getPath(context)).toPath();
final Boolean recurse = context.getProperty(RECURSE).asBoolean(); final Boolean recurse = context.getProperty(RECURSE).asBoolean();
final Map<Path, BasicFileAttributes> lastModifiedMap = new HashMap<>(); final Map<Path, BasicFileAttributes> lastModifiedMap = new HashMap<>();
final BiPredicate<Path, BasicFileAttributes> fileFilter = fileFilterRef.get(); final BiPredicate<Path, BasicFileAttributes> fileFilter;
final PerformanceTracker performanceTracker;
if (listingMode == ListingMode.EXECUTION) {
fileFilter = fileFilterRef.get();
performanceTracker = this.performanceTracker;
} else {
final long maxDiskOperationMillis = context.getProperty(MAX_DISK_OPERATION_TIME).evaluateAttributeExpressions().asTimePeriod(TimeUnit.MILLISECONDS);
performanceTracker = new UntrackedPerformanceTracker(getLogger(), maxDiskOperationMillis);
fileFilter = createFileFilter(context, performanceTracker, applyFilters);
}
int maxDepth = recurse ? Integer.MAX_VALUE : 1; int maxDepth = recurse ? Integer.MAX_VALUE : 1;
final BiPredicate<Path, BasicFileAttributes> matcher = new BiPredicate<Path, BasicFileAttributes>() { final BiPredicate<Path, BasicFileAttributes> matcher = new BiPredicate<Path, BasicFileAttributes>() {
@ -515,7 +534,7 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
@Override @Override
public boolean test(final Path path, final BasicFileAttributes attributes) { public boolean test(final Path path, final BasicFileAttributes attributes) {
if (!isScheduled()) { if (!isScheduled() && listingMode == ListingMode.EXECUTION) {
throw new ProcessorStoppedException(); throw new ProcessorStoppedException();
} }
@ -536,10 +555,11 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
final TimedOperationKey operationKey = performanceTracker.beginOperation(DiskOperation.FILTER, relativePath, filename); final TimedOperationKey operationKey = performanceTracker.beginOperation(DiskOperation.FILTER, relativePath, filename);
try { try {
if (!isDirectory && (minTimestamp == null || attributes.lastModifiedTime().toMillis() >= minTimestamp) final boolean matchesFilters = (minTimestamp == null || attributes.lastModifiedTime().toMillis() >= minTimestamp)
&& fileFilter.test(path, attributes)) { && fileFilter.test(path, attributes);
// We store the attributes for each Path we are returning in order to avoid to if (!isDirectory && (!applyFilters || matchesFilters)) {
// retrieve them again later when creating the FileInfo // We store the attributes for each Path we are returning in order to avoid
// retrieving them again later when creating the FileInfo
lastModifiedMap.put(path, attributes); lastModifiedMap.put(path, attributes);
return true; return true;
@ -562,17 +582,17 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
Files.walkFileTree(basePath, Collections.singleton(FileVisitOption.FOLLOW_LINKS), maxDepth, new FileVisitor<Path>() { Files.walkFileTree(basePath, Collections.singleton(FileVisitOption.FOLLOW_LINKS), maxDepth, new FileVisitor<Path>() {
@Override @Override
public FileVisitResult preVisitDirectory(final Path dir, final BasicFileAttributes attributes) throws IOException { public FileVisitResult preVisitDirectory(final Path dir, final BasicFileAttributes attributes) {
if (Files.isReadable(dir)) { if (Files.isReadable(dir)) {
return FileVisitResult.CONTINUE; return FileVisitResult.CONTINUE;
} else { } else {
getLogger().debug("The following directory is not readable: {}", new Object[] {dir.toString()}); getLogger().debug("The following directory is not readable: {}", new Object[]{dir.toString()});
return FileVisitResult.SKIP_SUBTREE; return FileVisitResult.SKIP_SUBTREE;
} }
} }
@Override @Override
public FileVisitResult visitFile(final Path path, final BasicFileAttributes attributes) throws IOException { public FileVisitResult visitFile(final Path path, final BasicFileAttributes attributes) {
if (matcher.test(path, attributes)) { if (matcher.test(path, attributes)) {
final File file = path.toFile(); final File file = path.toFile();
final BasicFileAttributes fileAttributes = lastModifiedMap.get(path); final BasicFileAttributes fileAttributes = lastModifiedMap.get(path);
@ -591,20 +611,20 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
} }
@Override @Override
public FileVisitResult visitFileFailed(final Path path, final IOException e) throws IOException { public FileVisitResult visitFileFailed(final Path path, final IOException e) {
if (e instanceof AccessDeniedException) { if (e instanceof AccessDeniedException) {
getLogger().debug("The following file is not readable: {}", new Object[] {path.toString()}); getLogger().debug("The following file is not readable: {}", new Object[]{path.toString()});
return FileVisitResult.SKIP_SUBTREE; return FileVisitResult.SKIP_SUBTREE;
} else { } else {
getLogger().error("Error during visiting file {}: {}", new Object[] {path.toString(), e.getMessage()}, e); getLogger().error("Error during visiting file {}: {}", new Object[]{path.toString(), e.getMessage()}, e);
return FileVisitResult.TERMINATE; return FileVisitResult.TERMINATE;
} }
} }
@Override @Override
public FileVisitResult postVisitDirectory(final Path dir, final IOException e) throws IOException { public FileVisitResult postVisitDirectory(final Path dir, final IOException e) {
if (e != null) { if (e != null) {
getLogger().error("Error during visiting directory {}: {}", new Object[] {dir.toString(), e.getMessage()}, e); getLogger().error("Error during visiting directory {}: {}", new Object[]{dir.toString(), e.getMessage()}, e);
} }
return FileVisitResult.CONTINUE; return FileVisitResult.CONTINUE;
@ -619,10 +639,17 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
getLogger().info("Processor was stopped so will not complete listing of Files"); getLogger().info("Processor was stopped so will not complete listing of Files");
return Collections.emptyList(); return Collections.emptyList();
} finally { } finally {
performanceTracker.completeActiveDirectory(); if (performanceTracker != null) {
performanceTracker.completeActiveDirectory();
}
} }
} }
@Override
protected String getListingContainerName(final ProcessContext context) {
return String.format("%s Directory [%s]", context.getProperty(DIRECTORY_LOCATION).getValue(), getPath(context));
}
@Override @Override
protected boolean isListingResetNecessary(final PropertyDescriptor property) { protected boolean isListingResetNecessary(final PropertyDescriptor property) {
return DIRECTORY.equals(property) return DIRECTORY.equals(property)
@ -636,7 +663,8 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
|| IGNORE_HIDDEN_FILES.equals(property); || IGNORE_HIDDEN_FILES.equals(property);
} }
private BiPredicate<Path, BasicFileAttributes> createFileFilter(final ProcessContext context) { private BiPredicate<Path, BasicFileAttributes> createFileFilter(final ProcessContext context, final PerformanceTracker performanceTracker,
final boolean applyFilters) {
final long minSize = context.getProperty(MIN_SIZE).asDataSize(DataUnit.B).longValue(); final long minSize = context.getProperty(MIN_SIZE).asDataSize(DataUnit.B).longValue();
final Double maxSize = context.getProperty(MAX_SIZE).asDataSize(DataUnit.B); final Double maxSize = context.getProperty(MAX_SIZE).asDataSize(DataUnit.B);
final long minAge = context.getProperty(MIN_AGE).asTimePeriod(TimeUnit.MILLISECONDS); final long minAge = context.getProperty(MIN_AGE).asTimePeriod(TimeUnit.MILLISECONDS);
@ -652,6 +680,10 @@ public class ListFile extends AbstractListProcessor<FileInfo> {
final Path basePath = Paths.get(indir); final Path basePath = Paths.get(indir);
return (path, attributes) -> { return (path, attributes) -> {
if (!applyFilters) {
return true;
}
if (minSize > attributes.size()) { if (minSize > attributes.size()) {
return false; return false;
} }

View File

@ -17,10 +17,6 @@
package org.apache.nifi.processors.standard; package org.apache.nifi.processors.standard;
import java.io.IOException;
import java.text.DateFormat;
import java.text.SimpleDateFormat;
import org.apache.commons.io.IOUtils; import org.apache.commons.io.IOUtils;
import org.apache.nifi.components.PropertyDescriptor; import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.expression.ExpressionLanguageScope; import org.apache.nifi.expression.ExpressionLanguageScope;
@ -32,12 +28,15 @@ import org.apache.nifi.processors.standard.util.FileInfo;
import org.apache.nifi.processors.standard.util.FileTransfer; import org.apache.nifi.processors.standard.util.FileTransfer;
import org.apache.nifi.serialization.record.RecordSchema; import org.apache.nifi.serialization.record.RecordSchema;
import java.util.Map; import java.io.IOException;
import java.util.HashMap; import java.text.DateFormat;
import java.util.List; import java.text.SimpleDateFormat;
import java.util.Iterator;
import java.util.Date; import java.util.Date;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Locale; import java.util.Locale;
import java.util.Map;
public abstract class ListFileTransfer extends AbstractListProcessor<FileInfo> { public abstract class ListFileTransfer extends AbstractListProcessor<FileInfo> {
public static final PropertyDescriptor HOSTNAME = new PropertyDescriptor.Builder() public static final PropertyDescriptor HOSTNAME = new PropertyDescriptor.Builder()
@ -104,11 +103,21 @@ public abstract class ListFileTransfer extends AbstractListProcessor<FileInfo> {
} }
@Override @Override
protected List<FileInfo> performListing(final ProcessContext context, final Long minTimestamp) throws IOException { protected Integer countUnfilteredListing(final ProcessContext context) throws IOException {
return performListing(context, 0L, ListingMode.CONFIGURATION_VERIFICATION, false).size();
}
@Override
protected List<FileInfo> performListing(final ProcessContext context, final Long minTimestamp, final ListingMode listingMode) throws IOException {
return performListing(context, minTimestamp, listingMode, true);
}
protected List<FileInfo> performListing(final ProcessContext context, final Long minTimestamp, final ListingMode listingMode,
final boolean applyFilters) throws IOException {
final FileTransfer transfer = getFileTransfer(context); final FileTransfer transfer = getFileTransfer(context);
final List<FileInfo> listing; final List<FileInfo> listing;
try { try {
listing = transfer.getListing(); listing = transfer.getListing(applyFilters);
} finally { } finally {
IOUtils.closeQuietly(transfer); IOUtils.closeQuietly(transfer);
} }
@ -128,6 +137,12 @@ public abstract class ListFileTransfer extends AbstractListProcessor<FileInfo> {
return listing; return listing;
} }
@Override
protected String getListingContainerName(final ProcessContext context) {
return String.format("Remote Directory [%s] on [%s:%s]", getPath(context), context.getProperty(HOSTNAME).evaluateAttributeExpressions().getValue(),
context.getProperty(UNDEFAULTED_PORT).evaluateAttributeExpressions().getValue());
}
@Override @Override
protected RecordSchema getRecordSchema() { protected RecordSchema getRecordSchema() {
return FileInfo.getRecordSchema(); return FileInfo.getRecordSchema();

View File

@ -146,11 +146,17 @@ public class ListSFTP extends ListFileTransfer {
} }
@Override @Override
protected List<FileInfo> performListing(final ProcessContext context, final Long minTimestamp) throws IOException { protected List<FileInfo> performListing(final ProcessContext context, final Long minTimestamp, final ListingMode listingMode,
final List<FileInfo> listing = super.performListing(context, minTimestamp); final boolean applyFilters) throws IOException {
final List<FileInfo> listing = super.performListing(context, minTimestamp, listingMode, applyFilters);
if (!applyFilters) {
return listing;
}
final Predicate<FileInfo> filePredicate = listingMode == ListingMode.EXECUTION ? this.fileFilter : createFileFilter(context);
return listing.stream() return listing.stream()
.filter(fileFilter) .filter(filePredicate)
.collect(Collectors.toList()); .collect(Collectors.toList());
} }

View File

@ -190,14 +190,14 @@ public class FTPTransfer implements FileTransfer {
} }
@Override @Override
public List<FileInfo> getListing() throws IOException { public List<FileInfo> getListing(final boolean applyFilters) throws IOException {
final String path = ctx.getProperty(FileTransfer.REMOTE_PATH).evaluateAttributeExpressions().getValue(); final String path = ctx.getProperty(FileTransfer.REMOTE_PATH).evaluateAttributeExpressions().getValue();
final int depth = 0; final int depth = 0;
final int maxResults = ctx.getProperty(FileTransfer.REMOTE_POLL_BATCH_SIZE).asInteger(); final int maxResults = ctx.getProperty(FileTransfer.REMOTE_POLL_BATCH_SIZE).asInteger();
return getListing(path, depth, maxResults); return getListing(path, depth, maxResults, applyFilters);
} }
private List<FileInfo> getListing(final String path, final int depth, final int maxResults) throws IOException { private List<FileInfo> getListing(final String path, final int depth, final int maxResults, final boolean applyFilters) throws IOException {
final List<FileInfo> listing = new ArrayList<>(); final List<FileInfo> listing = new ArrayList<>();
if (maxResults < 1) { if (maxResults < 1) {
return listing; return listing;
@ -266,7 +266,7 @@ public class FTPTransfer implements FileTransfer {
// OR if is a link and we're supposed to follow symlink // OR if is a link and we're supposed to follow symlink
if ((recurse && file.isDirectory()) || (symlink && file.isSymbolicLink())) { if ((recurse && file.isDirectory()) || (symlink && file.isSymbolicLink())) {
try { try {
listing.addAll(getListing(newFullForwardPath, depth + 1, maxResults - count)); listing.addAll(getListing(newFullForwardPath, depth + 1, maxResults - count, applyFilters));
} catch (final IOException e) { } catch (final IOException e) {
logger.error("Unable to get listing from " + newFullForwardPath + "; skipping", e); logger.error("Unable to get listing from " + newFullForwardPath + "; skipping", e);
} }
@ -274,8 +274,8 @@ public class FTPTransfer implements FileTransfer {
// if is not a directory and is not a link and it matches // if is not a directory and is not a link and it matches
// FILE_FILTER_REGEX - then let's add it // FILE_FILTER_REGEX - then let's add it
if (!file.isDirectory() && !file.isSymbolicLink() && pathFilterMatches) { if (!file.isDirectory() && !file.isSymbolicLink() && (pathFilterMatches || !applyFilters)) {
if (pattern == null || pattern.matcher(filename).matches()) { if (pattern == null || !applyFilters || pattern.matcher(filename).matches()) {
listing.add(newFileInfo(file, path)); listing.add(newFileInfo(file, path));
count++; count++;
} }

View File

@ -34,7 +34,7 @@ public interface FileTransfer extends Closeable {
String getHomeDirectory(FlowFile flowFile) throws IOException; String getHomeDirectory(FlowFile flowFile) throws IOException;
List<FileInfo> getListing() throws IOException; List<FileInfo> getListing(boolean applyFilters) throws IOException;
FlowFile getRemoteFile(String remoteFileName, FlowFile flowFile, ProcessSession session) throws ProcessException, IOException; FlowFile getRemoteFile(String remoteFileName, FlowFile flowFile, ProcessSession session) throws ProcessException, IOException;

View File

@ -263,7 +263,7 @@ public class SFTPTransfer implements FileTransfer {
} }
@Override @Override
public List<FileInfo> getListing() throws IOException { public List<FileInfo> getListing(final boolean applyFilters) throws IOException {
final String path = ctx.getProperty(FileTransfer.REMOTE_PATH).evaluateAttributeExpressions().getValue(); final String path = ctx.getProperty(FileTransfer.REMOTE_PATH).evaluateAttributeExpressions().getValue();
final int depth = 0; final int depth = 0;
@ -277,11 +277,12 @@ public class SFTPTransfer implements FileTransfer {
} }
final List<FileInfo> listing = new ArrayList<>(1000); final List<FileInfo> listing = new ArrayList<>(1000);
getListing(path, depth, maxResults, listing); getListing(path, depth, maxResults, listing, applyFilters);
return listing; return listing;
} }
protected void getListing(final String path, final int depth, final int maxResults, final List<FileInfo> listing) throws IOException { protected void getListing(final String path, final int depth, final int maxResults, final List<FileInfo> listing,
final boolean applyFilters) throws IOException {
if (maxResults < 1 || listing.size() >= maxResults) { if (maxResults < 1 || listing.size() >= maxResults) {
return; return;
} }
@ -346,8 +347,8 @@ public class SFTPTransfer implements FileTransfer {
} }
// if is not a directory and is not a link and it matches FILE_FILTER_REGEX - then let's add it // if is not a directory and is not a link and it matches FILE_FILTER_REGEX - then let's add it
if (!entry.isDirectory() && !(entry.getAttributes().getType() == FileMode.Type.SYMLINK) && isPathMatch) { if (!entry.isDirectory() && !(entry.getAttributes().getType() == FileMode.Type.SYMLINK) && (!applyFilters || isPathMatch)) {
if (pattern == null || pattern.matcher(entryFilename).matches()) { if (pattern == null || !applyFilters || pattern.matcher(entryFilename).matches()) {
listing.add(newFileInfo(entry, path)); listing.add(newFileInfo(entry, path));
} }
} }
@ -379,7 +380,7 @@ public class SFTPTransfer implements FileTransfer {
final String newFullForwardPath = newFullPath.getPath().replace("\\", "/"); final String newFullForwardPath = newFullPath.getPath().replace("\\", "/");
try { try {
getListing(newFullForwardPath, depth + 1, maxResults, listing); getListing(newFullForwardPath, depth + 1, maxResults, listing, applyFilters);
} catch (final IOException e) { } catch (final IOException e) {
logger.error("Unable to get listing from " + newFullForwardPath + "; skipping", e); logger.error("Unable to get listing from " + newFullForwardPath + "; skipping", e);
} }

View File

@ -18,6 +18,8 @@
package org.apache.nifi.processors.standard; package org.apache.nifi.processors.standard;
import org.apache.commons.lang3.SystemUtils; import org.apache.commons.lang3.SystemUtils;
import org.apache.nifi.components.ConfigVerificationResult;
import org.apache.nifi.components.ConfigVerificationResult.Outcome;
import org.apache.nifi.components.PropertyDescriptor; import org.apache.nifi.components.PropertyDescriptor;
import org.apache.nifi.components.state.Scope; import org.apache.nifi.components.state.Scope;
import org.apache.nifi.flowfile.FlowFile; import org.apache.nifi.flowfile.FlowFile;
@ -233,27 +235,34 @@ public class TestListFile {
assertTrue(file1.createNewFile()); assertTrue(file1.createNewFile());
assertTrue(file1.setLastModified(time4millis)); assertTrue(file1.setLastModified(time4millis));
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 1 object. Of that, 1 matches the filter.");
// process first file and set new timestamp // process first file and set new timestamp
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
assertEquals(1, successFiles1.size()); assertEquals(1, successFiles1.size());
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 1 object. Of that, 1 matches the filter.");
// create second file // create second file
final File file2 = new File(TESTDIR + "/listing2.txt"); final File file2 = new File(TESTDIR + "/listing2.txt");
assertTrue(file2.createNewFile()); assertTrue(file2.createNewFile());
assertTrue(file2.setLastModified(time2millis)); assertTrue(file2.setLastModified(time2millis));
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 2 objects. Of those, 2 match the filter.");
// process second file after timestamp // process second file after timestamp
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
assertEquals(1, successFiles2.size()); assertEquals(1, successFiles2.size());
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 2 objects. Of those, 2 match the filter.");
// create third file // create third file
final File file3 = new File(TESTDIR + "/listing3.txt"); final File file3 = new File(TESTDIR + "/listing3.txt");
assertTrue(file3.createNewFile()); assertTrue(file3.createNewFile());
assertTrue(file3.setLastModified(time4millis)); assertTrue(file3.setLastModified(time4millis));
// 0 are new because the timestamp is before the min listed timestamp
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
// process third file before timestamp // process third file before timestamp
runNext(); runNext();
@ -264,6 +273,7 @@ public class TestListFile {
// force state to reset and process all files // force state to reset and process all files
runner.removeProperty(ListFile.DIRECTORY); runner.removeProperty(ListFile.DIRECTORY);
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles4 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles4 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -271,6 +281,7 @@ public class TestListFile {
runNext(); runNext();
runner.assertTransferCount(ListFile.REL_SUCCESS, 0); runner.assertTransferCount(ListFile.REL_SUCCESS, 0);
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
} }
@Test @Test
@ -309,6 +320,7 @@ public class TestListFile {
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
runNext.apply(true); runNext.apply(true);
runner.assertTransferCount(ListFile.REL_SUCCESS, 3); runner.assertTransferCount(ListFile.REL_SUCCESS, 3);
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
// processor updates internal state, it shouldn't pick the same ones. // processor updates internal state, it shouldn't pick the same ones.
runNext.apply(false); runNext.apply(false);
@ -323,6 +335,7 @@ public class TestListFile {
assertEquals(2, successFiles2.size()); assertEquals(2, successFiles2.size());
assertEquals(file2.getName(), successFiles2.get(0).getAttribute("filename")); assertEquals(file2.getName(), successFiles2.get(0).getAttribute("filename"));
assertEquals(file1.getName(), successFiles2.get(1).getAttribute("filename")); assertEquals(file1.getName(), successFiles2.get(1).getAttribute("filename"));
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 2 match the filter.");
// exclude newest // exclude newest
runner.setProperty(ListFile.MIN_AGE, age1); runner.setProperty(ListFile.MIN_AGE, age1);
@ -333,6 +346,7 @@ public class TestListFile {
assertEquals(2, successFiles3.size()); assertEquals(2, successFiles3.size());
assertEquals(file3.getName(), successFiles3.get(0).getAttribute("filename")); assertEquals(file3.getName(), successFiles3.get(0).getAttribute("filename"));
assertEquals(file2.getName(), successFiles3.get(1).getAttribute("filename")); assertEquals(file2.getName(), successFiles3.get(1).getAttribute("filename"));
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 2 match the filter.");
// exclude oldest and newest // exclude oldest and newest
runner.setProperty(ListFile.MIN_AGE, age1); runner.setProperty(ListFile.MIN_AGE, age1);
@ -342,6 +356,7 @@ public class TestListFile {
final List<MockFlowFile> successFiles4 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles4 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
assertEquals(1, successFiles4.size()); assertEquals(1, successFiles4.size());
assertEquals(file2.getName(), successFiles4.get(0).getAttribute("filename")); assertEquals(file2.getName(), successFiles4.get(0).getAttribute("filename"));
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 1 matches the filter.");
} }
@ -377,26 +392,31 @@ public class TestListFile {
// check all files // check all files
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
assertEquals(3, successFiles1.size()); assertEquals(3, successFiles1.size());
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
// exclude largest // exclude largest
runner.removeProperty(ListFile.MIN_AGE); runner.removeProperty(ListFile.MIN_AGE);
runner.removeProperty(ListFile.MAX_AGE); runner.removeProperty(ListFile.MAX_AGE);
runner.setProperty(ListFile.MIN_SIZE, "0 b"); runner.setProperty(ListFile.MIN_SIZE, "0 b");
runner.setProperty(ListFile.MAX_SIZE, "7500 b"); runner.setProperty(ListFile.MAX_SIZE, "7500 b");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 2 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
assertEquals(2, successFiles2.size()); assertEquals(2, successFiles2.size());
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 2 match the filter.");
// exclude smallest // exclude smallest
runner.removeProperty(ListFile.MIN_AGE); runner.removeProperty(ListFile.MIN_AGE);
runner.removeProperty(ListFile.MAX_AGE); runner.removeProperty(ListFile.MAX_AGE);
runner.setProperty(ListFile.MIN_SIZE, "2500 b"); runner.setProperty(ListFile.MIN_SIZE, "2500 b");
runner.removeProperty(ListFile.MAX_SIZE); runner.removeProperty(ListFile.MAX_SIZE);
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 2 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles3 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles3 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -407,6 +427,7 @@ public class TestListFile {
runner.removeProperty(ListFile.MAX_AGE); runner.removeProperty(ListFile.MAX_AGE);
runner.setProperty(ListFile.MIN_SIZE, "2500 b"); runner.setProperty(ListFile.MIN_SIZE, "2500 b");
runner.setProperty(ListFile.MAX_SIZE, "7500 b"); runner.setProperty(ListFile.MAX_SIZE, "7500 b");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 1 matches the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles4 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles4 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -444,6 +465,7 @@ public class TestListFile {
runner.removeProperty(ListFile.MIN_SIZE); runner.removeProperty(ListFile.MIN_SIZE);
runner.removeProperty(ListFile.MAX_SIZE); runner.removeProperty(ListFile.MAX_SIZE);
runner.setProperty(ListFile.IGNORE_HIDDEN_FILES, "false"); runner.setProperty(ListFile.IGNORE_HIDDEN_FILES, "false");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 2 objects. Of those, 2 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -451,6 +473,7 @@ public class TestListFile {
// exclude hidden // exclude hidden
runner.setProperty(ListFile.IGNORE_HIDDEN_FILES, "true"); runner.setProperty(ListFile.IGNORE_HIDDEN_FILES, "true");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 2 objects. Of those, 1 matches the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -472,6 +495,7 @@ public class TestListFile {
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
runner.setProperty(ListFile.FILE_FILTER, ".*"); runner.setProperty(ListFile.FILE_FILTER, ".*");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 2 objects. Of those, 1 matches the filter.");
runNext(); runNext();
final List<MockFlowFile> successFiles = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -484,30 +508,33 @@ public class TestListFile {
assertTrue(subdir.mkdir()); assertTrue(subdir.mkdir());
assertTrue(subdir.setReadable(false)); assertTrue(subdir.setReadable(false));
final File file1 = new File(TESTDIR + "/subdir/unreadable.txt"); try {
assertTrue(file1.createNewFile()); final File file1 = new File(TESTDIR + "/subdir/unreadable.txt");
assertTrue(file1.setReadable(false)); assertTrue(file1.createNewFile());
assertTrue(file1.setReadable(false));
final File file2 = new File(TESTDIR + "/subdir/readable.txt"); final File file2 = new File(TESTDIR + "/subdir/readable.txt");
assertTrue(file2.createNewFile()); assertTrue(file2.createNewFile());
final File file3 = new File(TESTDIR + "/secondReadable.txt"); final File file3 = new File(TESTDIR + "/secondReadable.txt");
assertTrue(file3.createNewFile()); assertTrue(file3.createNewFile());
final long now = getTestModifiedTime(); final long now = getTestModifiedTime();
assertTrue(file1.setLastModified(now)); assertTrue(file1.setLastModified(now));
assertTrue(file2.setLastModified(now)); assertTrue(file2.setLastModified(now));
assertTrue(file3.setLastModified(now)); assertTrue(file3.setLastModified(now));
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
runner.setProperty(ListFile.FILE_FILTER, ".*"); runner.setProperty(ListFile.FILE_FILTER, ".*");
runNext(); assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 1 object. Of that, 1 matches the filter.");
runNext();
final List<MockFlowFile> successFiles = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
assertEquals(1, successFiles.size()); assertEquals(1, successFiles.size());
assertEquals("secondReadable.txt", successFiles.get(0).getAttribute("filename")); assertEquals("secondReadable.txt", successFiles.get(0).getAttribute("filename"));
} finally {
subdir.setReadable(true); subdir.setReadable(true);
}
} }
@Test @Test
@ -527,6 +554,7 @@ public class TestListFile {
// Run with privileges and with fitting filter // Run with privileges and with fitting filter
runner.setProperty(ListFile.FILE_FILTER, "file.*"); runner.setProperty(ListFile.FILE_FILTER, "file.*");
assertTrue(file.setLastModified(getTestModifiedTime())); assertTrue(file.setLastModified(getTestModifiedTime()));
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 1 object. Of that, 1 matches the filter.");
runNext(); runNext();
final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -535,6 +563,7 @@ public class TestListFile {
// Run without privileges and with fitting filter // Run without privileges and with fitting filter
assertTrue(file.setReadable(false)); assertTrue(file.setReadable(false));
assertTrue(file.setLastModified(getTestModifiedTime())); assertTrue(file.setLastModified(getTestModifiedTime()));
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 1 object. Of that, 0 match the filter.");
runNext(); runNext();
final List<MockFlowFile> successFiles3 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles3 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -566,6 +595,7 @@ public class TestListFile {
// check all files // check all files
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
runner.setProperty(ListFile.FILE_FILTER, ListFile.FILE_FILTER.getDefaultValue()); runner.setProperty(ListFile.FILE_FILTER, ListFile.FILE_FILTER.getDefaultValue());
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 4 objects. Of those, 4 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -574,9 +604,11 @@ public class TestListFile {
// filter file on pattern // filter file on pattern
// Modifying FILE_FILTER property reset listing status, so these files will be listed again. // Modifying FILE_FILTER property reset listing status, so these files will be listed again.
runner.setProperty(ListFile.FILE_FILTER, ".*-xyz-.*"); runner.setProperty(ListFile.FILE_FILTER, ".*-xyz-.*");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 4 objects. Of those, 2 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS, 2); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS, 2);
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 4 objects. Of those, 2 match the filter.");
runNext(); runNext();
runner.assertTransferCount(ListFile.REL_SUCCESS, 0); runner.assertTransferCount(ListFile.REL_SUCCESS, 0);
} }
@ -611,6 +643,7 @@ public class TestListFile {
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
runner.setProperty(ListFile.FILE_FILTER, ListFile.FILE_FILTER.getDefaultValue()); runner.setProperty(ListFile.FILE_FILTER, ListFile.FILE_FILTER.getDefaultValue());
runner.setProperty(ListFile.RECURSE, "true"); runner.setProperty(ListFile.RECURSE, "true");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 4 objects. Of those, 4 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
@ -620,6 +653,7 @@ public class TestListFile {
// filter path on pattern subdir1 // filter path on pattern subdir1
runner.setProperty(ListFile.PATH_FILTER, "subdir1"); runner.setProperty(ListFile.PATH_FILTER, "subdir1");
runner.setProperty(ListFile.RECURSE, "true"); runner.setProperty(ListFile.RECURSE, "true");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 4 objects. Of those, 3 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -628,6 +662,7 @@ public class TestListFile {
// filter path on pattern subdir2 // filter path on pattern subdir2
runner.setProperty(ListFile.PATH_FILTER, "subdir2"); runner.setProperty(ListFile.PATH_FILTER, "subdir2");
runner.setProperty(ListFile.RECURSE, "true"); runner.setProperty(ListFile.RECURSE, "true");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 4 objects. Of those, 1 matches the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles3 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles3 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -659,6 +694,7 @@ public class TestListFile {
// check all files // check all files
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
runner.setProperty(ListFile.RECURSE, "true"); runner.setProperty(ListFile.RECURSE, "true");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS, 3); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS, 3);
final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles1 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -683,8 +719,9 @@ public class TestListFile {
} }
assertEquals(3, successFiles1.size()); assertEquals(3, successFiles1.size());
// exclude hidden // don't recurse
runner.setProperty(ListFile.RECURSE, "false"); runner.setProperty(ListFile.RECURSE, "false");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 1 object. Of that, 1 matches the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS); final List<MockFlowFile> successFiles2 = runner.getFlowFilesForRelationship(ListFile.REL_SUCCESS);
@ -710,6 +747,7 @@ public class TestListFile {
// check all files // check all files
runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath()); runner.setProperty(ListFile.DIRECTORY, testDir.getAbsolutePath());
runner.setProperty(ListFile.RECURSE, "true"); runner.setProperty(ListFile.RECURSE, "true");
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
runner.assertTransferCount(ListFile.REL_SUCCESS, 3); runner.assertTransferCount(ListFile.REL_SUCCESS, 3);
@ -802,6 +840,7 @@ public class TestListFile {
makeTestFile("/batch1-age5.txt", time5millis, fileTimes); makeTestFile("/batch1-age5.txt", time5millis, fileTimes);
// check files // check files
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 3 objects. Of those, 3 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
@ -815,6 +854,7 @@ public class TestListFile {
// should be ignored since it's older than age3 // should be ignored since it's older than age3
makeTestFile("/batch2-age4.txt", time4millis, fileTimes); makeTestFile("/batch2-age4.txt", time4millis, fileTimes);
assertVerificationOutcome(Outcome.SUCCESSFUL, "Successfully listed .* Found 6 objects. Of those, 6 match the filter.");
runNext(); runNext();
runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS); runner.assertAllFlowFilesTransferred(ListFile.REL_SUCCESS);
@ -880,4 +920,14 @@ public class TestListFile {
} }
} }
} }
private void assertVerificationOutcome(final Outcome expectedOutcome, final String expectedExplanationRegex) {
final List<ConfigVerificationResult> results = processor.verify(runner.getProcessContext(), runner.getLogger(), Collections.emptyMap());
assertEquals(1, results.size());
final ConfigVerificationResult result = results.get(0);
assertEquals(expectedOutcome, result.getOutcome());
assertTrue(String.format("Expected verification result to match pattern [%s]. Actual explanation was: %s", expectedExplanationRegex, result.getExplanation()),
result.getExplanation().matches(expectedExplanationRegex));
}
} }

View File

@ -29,7 +29,10 @@ import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors; import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit; import java.util.concurrent.TimeUnit;
import org.apache.nifi.components.ConfigVerificationResult;
import org.apache.nifi.components.ConfigVerificationResult.Outcome;
import org.apache.nifi.processor.ProcessContext; import org.apache.nifi.processor.ProcessContext;
import org.apache.nifi.processor.VerifiableProcessor;
import org.apache.nifi.processor.util.list.AbstractListProcessor; import org.apache.nifi.processor.util.list.AbstractListProcessor;
import org.apache.nifi.processors.standard.util.FTPTransfer; import org.apache.nifi.processors.standard.util.FTPTransfer;
import org.apache.nifi.processors.standard.util.FileInfo; import org.apache.nifi.processors.standard.util.FileInfo;
@ -47,6 +50,7 @@ import java.util.concurrent.atomic.AtomicInteger;
import java.util.stream.Collectors; import java.util.stream.Collectors;
import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertTrue;
public class TestListSFTP { public class TestListSFTP {
@Rule @Rule
@ -95,7 +99,7 @@ public class TestListSFTP {
protected FileTransfer getFileTransfer(ProcessContext context) { protected FileTransfer getFileTransfer(ProcessContext context) {
return new SFTPTransfer(context, getLogger()){ return new SFTPTransfer(context, getLogger()){
@Override @Override
protected void getListing(String path, int depth, int maxResults, List<FileInfo> listing) throws IOException { protected void getListing(String path, int depth, int maxResults, List<FileInfo> listing, boolean applyFilters) throws IOException {
if (path.contains("subdir")) { if (path.contains("subdir")) {
reachScanningSubDir.countDown(); reachScanningSubDir.countDown();
try { try {
@ -105,7 +109,7 @@ public class TestListSFTP {
} }
} }
super.getListing(path, depth, maxResults, listing); super.getListing(path, depth, maxResults, listing, applyFilters);
} }
}; };
} }
@ -193,6 +197,7 @@ public class TestListSFTP {
Thread.sleep(AbstractListProcessor.LISTING_LAG_MILLIS.get(TimeUnit.MILLISECONDS) * 2); Thread.sleep(AbstractListProcessor.LISTING_LAG_MILLIS.get(TimeUnit.MILLISECONDS) * 2);
runner.run(); runner.run();
assertVerificationOutcome(runner, Outcome.SUCCESSFUL, ".* Found 3 objects. Of those, 3 match the filter.");
runner.assertTransferCount(ListSFTP.REL_SUCCESS, 3); runner.assertTransferCount(ListSFTP.REL_SUCCESS, 3);
@ -231,10 +236,22 @@ public class TestListSFTP {
runner.run(); runner.run();
assertVerificationOutcome(runner, Outcome.SUCCESSFUL, ".* Found 3 objects. Of those, 1 matches the filter.");
runner.assertTransferCount(ListSFTP.REL_SUCCESS, 1); runner.assertTransferCount(ListSFTP.REL_SUCCESS, 1);
final MockFlowFile retrievedFile = runner.getFlowFilesForRelationship(ListSFTP.REL_SUCCESS).get(0); final MockFlowFile retrievedFile = runner.getFlowFilesForRelationship(ListSFTP.REL_SUCCESS).get(0);
//the only file between the limits //the only file between the limits
retrievedFile.assertAttributeEquals("filename", "file.txt"); retrievedFile.assertAttributeEquals("filename", "file.txt");
} }
private void assertVerificationOutcome(final TestRunner runner, final Outcome expectedOutcome, final String expectedExplanationRegex) {
final List<ConfigVerificationResult> results = ((VerifiableProcessor) runner.getProcessor())
.verify(runner.getProcessContext(), runner.getLogger(), Collections.emptyMap());
assertEquals(1, results.size());
final ConfigVerificationResult result = results.get(0);
assertEquals(expectedOutcome, result.getOutcome());
assertTrue(String.format("Expected verification result to match pattern [%s]. Actual explanation was: %s", expectedExplanationRegex, result.getExplanation()),
result.getExplanation().matches(expectedExplanationRegex));
}
} }

View File

@ -144,7 +144,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.REMOTE_PATH, DIR_2); properties.put(SFTPTransfer.REMOTE_PATH, DIR_2);
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(2, listing.size()); assertEquals(2, listing.size());
@ -167,7 +167,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.IGNORE_DOTTED_FILES, "false"); properties.put(SFTPTransfer.IGNORE_DOTTED_FILES, "false");
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(3, listing.size()); assertEquals(3, listing.size());
@ -183,7 +183,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.RECURSIVE_SEARCH, "false"); properties.put(SFTPTransfer.RECURSIVE_SEARCH, "false");
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(0, listing.size()); assertEquals(0, listing.size());
} }
@ -196,7 +196,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.RECURSIVE_SEARCH, "true"); properties.put(SFTPTransfer.RECURSIVE_SEARCH, "true");
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(4, listing.size()); assertEquals(4, listing.size());
} }
@ -210,7 +210,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.FOLLOW_SYMLINK, "false"); properties.put(SFTPTransfer.FOLLOW_SYMLINK, "false");
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(0, listing.size()); assertEquals(0, listing.size());
} }
@ -224,7 +224,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.FOLLOW_SYMLINK, "true"); properties.put(SFTPTransfer.FOLLOW_SYMLINK, "true");
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(4, listing.size()); assertEquals(4, listing.size());
} }
@ -238,7 +238,7 @@ public class ITestSFTPTransferWithSSHTestServer {
// first listing is without batch size and shows 4 results // first listing is without batch size and shows 4 results
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(4, listing.size()); assertEquals(4, listing.size());
} }
@ -247,7 +247,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.REMOTE_POLL_BATCH_SIZE, "2"); properties.put(SFTPTransfer.REMOTE_POLL_BATCH_SIZE, "2");
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(2, listing.size()); assertEquals(2, listing.size());
} }
@ -263,7 +263,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.FILE_FILTER_REGEX, fileFilterRegex); properties.put(SFTPTransfer.FILE_FILTER_REGEX, fileFilterRegex);
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(2, listing.size()); assertEquals(2, listing.size());
@ -282,7 +282,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.PATH_FILTER_REGEX, pathFilterRegex); properties.put(SFTPTransfer.PATH_FILTER_REGEX, pathFilterRegex);
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(2, listing.size()); assertEquals(2, listing.size());
@ -306,7 +306,7 @@ public class ITestSFTPTransferWithSSHTestServer {
properties.put(SFTPTransfer.RECURSIVE_SEARCH, "true"); properties.put(SFTPTransfer.RECURSIVE_SEARCH, "true");
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
transfer.getListing(); transfer.getListing(true);
} }
} }
@ -317,7 +317,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory has two files // verify the directory has two files
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(2, listing.size()); assertEquals(2, listing.size());
@ -327,7 +327,7 @@ public class ITestSFTPTransferWithSSHTestServer {
} }
// verify there are now zero files // verify there are now zero files
final List<FileInfo> listingAfterDelete = transfer.getListing(); final List<FileInfo> listingAfterDelete = transfer.getListing(true);
assertNotNull(listingAfterDelete); assertNotNull(listingAfterDelete);
assertEquals(0, listingAfterDelete.size()); assertEquals(0, listingAfterDelete.size());
} }
@ -340,7 +340,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory has two files // verify the directory has two files
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(2, listing.size()); assertEquals(2, listing.size());
@ -352,7 +352,7 @@ public class ITestSFTPTransferWithSSHTestServer {
} }
// verify there are now zero files // verify there are now zero files
final List<FileInfo> listingAfterDelete = transfer.getListing(); final List<FileInfo> listingAfterDelete = transfer.getListing(true);
assertNotNull(listingAfterDelete); assertNotNull(listingAfterDelete);
assertEquals(0, listingAfterDelete.size()); assertEquals(0, listingAfterDelete.size());
} }
@ -374,7 +374,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory exists // verify the directory exists
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(0, listing.size()); assertEquals(0, listing.size());
@ -382,7 +382,7 @@ public class ITestSFTPTransferWithSSHTestServer {
// verify the directory no longer exists // verify the directory no longer exists
try { try {
transfer.getListing(); transfer.getListing(true);
Assert.fail("Should have thrown exception"); Assert.fail("Should have thrown exception");
} catch (FileNotFoundException e) { } catch (FileNotFoundException e) {
// nothing to do, expected // nothing to do, expected
@ -408,7 +408,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory does not exist // verify the directory does not exist
try { try {
transfer.getListing(); transfer.getListing(true);
Assert.fail("Should have failed"); Assert.fail("Should have failed");
} catch (FileNotFoundException e) { } catch (FileNotFoundException e) {
// Nothing to do, expected // Nothing to do, expected
@ -418,7 +418,7 @@ public class ITestSFTPTransferWithSSHTestServer {
transfer.ensureDirectoryExists(null, new File(absolutePath)); transfer.ensureDirectoryExists(null, new File(absolutePath));
// verify the directory now exists // verify the directory now exists
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(0, listing.size()); assertEquals(0, listing.size());
} }
@ -433,7 +433,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory does not exist // verify the directory does not exist
try { try {
transfer.getListing(); transfer.getListing(true);
Assert.fail("Should have failed"); Assert.fail("Should have failed");
} catch (FileNotFoundException e) { } catch (FileNotFoundException e) {
// Nothing to do, expected // Nothing to do, expected
@ -443,7 +443,7 @@ public class ITestSFTPTransferWithSSHTestServer {
transfer.ensureDirectoryExists(null, new File(absolutePath)); transfer.ensureDirectoryExists(null, new File(absolutePath));
// verify the directory now exists // verify the directory now exists
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(0, listing.size()); assertEquals(0, listing.size());
} }
@ -456,7 +456,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory already exists // verify the directory already exists
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(2, listing.size()); assertEquals(2, listing.size());
@ -475,7 +475,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory does not exist // verify the directory does not exist
try { try {
transfer.getListing(); transfer.getListing(true);
Assert.fail("Should have failed"); Assert.fail("Should have failed");
} catch (FileNotFoundException e) { } catch (FileNotFoundException e) {
// Nothing to do, expected // Nothing to do, expected
@ -485,7 +485,7 @@ public class ITestSFTPTransferWithSSHTestServer {
transfer.ensureDirectoryExists(null, new File(absolutePath)); transfer.ensureDirectoryExists(null, new File(absolutePath));
// verify the directory now exists // verify the directory now exists
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(0, listing.size()); assertEquals(0, listing.size());
} }
@ -499,7 +499,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory already exists // verify the directory already exists
final List<FileInfo> listing = transfer.getListing(); final List<FileInfo> listing = transfer.getListing(true);
assertNotNull(listing); assertNotNull(listing);
assertEquals(2, listing.size()); assertEquals(2, listing.size());
@ -519,7 +519,7 @@ public class ITestSFTPTransferWithSSHTestServer {
try(final SFTPTransfer transfer = createSFTPTransfer(properties)) { try(final SFTPTransfer transfer = createSFTPTransfer(properties)) {
// verify the directory does not exist // verify the directory does not exist
try { try {
transfer.getListing(); transfer.getListing(true);
Assert.fail("Should have failed"); Assert.fail("Should have failed");
} catch (FileNotFoundException e) { } catch (FileNotFoundException e) {
// Nothing to do, expected // Nothing to do, expected