NIFI-6735 - validate components before restarting processors following parameter context update.

This closes #3782.

Signed-off-by: Mark Payne <markap14@hotmail.com>
This commit is contained in:
Rob Fellows 2019-10-01 15:38:53 -04:00 committed by Mark Payne
parent 555004cdde
commit df90c65246
3 changed files with 259 additions and 41 deletions

View File

@ -865,6 +865,7 @@ public class ParameterContextResource extends ApplicationResource {
final ParameterContextEntity updatedEntity;
try {
updatedEntity = performParameterContextUpdate(asyncRequest, uri, replicateRequest, revision, updatedContextEntity);
asyncRequest.markStepComplete();
logger.info("Successfully updated Parameter Context with ID {}", updatedContextEntity.getId());
} finally {
// TODO: can almost certainly be refactored so that the same code is shared between VersionsResource and ParameterContextResource.
@ -968,8 +969,6 @@ public class ParameterContextResource extends ApplicationResource {
logger.info("Restarting {} Processors after having updated Parameter Context", processors.size());
}
asyncRequest.markStepComplete();
// Step 14. Restart all components
final Set<AffectedComponentEntity> componentsToStart = getUpdatedEntities(processors);
@ -978,6 +977,7 @@ public class ParameterContextResource extends ApplicationResource {
try {
componentLifecycle.scheduleComponents(uri, "root", componentsToStart, ScheduledState.RUNNING, startComponentsPause, InvalidComponentAction.SKIP);
asyncRequest.markStepComplete();
} catch (final IllegalStateException ise) {
// Component Lifecycle will restart the Processors only if they are valid. If IllegalStateException gets thrown, we need to provide
// a more intelligent error message as to exactly what happened, rather than indicate that the flow could not be updated.
@ -1003,8 +1003,6 @@ public class ParameterContextResource extends ApplicationResource {
logger.info("Re-Enabling {} Controller Services after having updated Parameter Context", controllerServices.size());
}
asyncRequest.markStepComplete();
// Step 13. Re-enable all disabled controller services
final CancellableTimedPause enableServicesPause = new CancellableTimedPause(250, Long.MAX_VALUE, TimeUnit.MILLISECONDS);
asyncRequest.setCancelCallback(enableServicesPause::cancel);
@ -1012,6 +1010,7 @@ public class ParameterContextResource extends ApplicationResource {
try {
componentLifecycle.activateControllerServices(uri, "root", servicesToEnable, ControllerServiceState.ENABLED, enableServicesPause, InvalidComponentAction.SKIP);
asyncRequest.markStepComplete();
} catch (final IllegalStateException ise) {
// Component Lifecycle will re-enable the Controller Services only if they are valid. If IllegalStateException gets thrown, we need to provide
// a more intelligent error message as to exactly what happened, rather than indicate that the Parameter Context could not be updated.

View File

@ -101,6 +101,16 @@ public class ClusterReplicationComponentLifecycle implements ComponentLifecycle
final NiFiUser user = NiFiUserUtils.getNiFiUser();
// If attempting to run the processors, validation must complete first
if (desiredState == ScheduledState.RUNNING) {
try {
waitForProcessorValidation(user, exampleUri, groupId, componentMap, pause);
} catch (InterruptedException e) {
Thread.currentThread().interrupt();
throw new LifecycleManagementException("Interrupted while waiting for processors to complete validation");
}
}
// Determine whether we should replicate only to the cluster coordinator, or if we should replicate directly to the cluster nodes themselves.
try {
final NodeResponse clusterResponse;
@ -156,6 +166,64 @@ public class ClusterReplicationComponentLifecycle implements ComponentLifecycle
return processorRevisions.stream().collect(Collectors.toMap(Revision::getComponentId, Function.identity()));
}
private boolean waitForProcessorValidation(final NiFiUser user, final URI originalUri, final String groupId,
final Map<String, AffectedComponentEntity> processors, final Pause pause) throws InterruptedException {
URI groupUri;
try {
groupUri = new URI(originalUri.getScheme(), originalUri.getUserInfo(), originalUri.getHost(),
originalUri.getPort(), "/nifi-api/process-groups/" + groupId + "/processors", "includeDescendantGroups=true", originalUri.getFragment());
} catch (URISyntaxException e) {
throw new RuntimeException(e);
}
final Map<String, String> headers = new HashMap<>();
final MultivaluedMap<String, String> requestEntity = new MultivaluedHashMap<>();
boolean continuePolling = true;
while (continuePolling) {
// Determine whether we should replicate only to the cluster coordinator, or if we should replicate directly to the cluster nodes themselves.
final NodeResponse clusterResponse;
if (getReplicationTarget() == ReplicationTarget.CLUSTER_NODES) {
clusterResponse = getRequestReplicator().replicate(user, HttpMethod.GET, groupUri, requestEntity, headers).awaitMergedResponse();
} else {
clusterResponse = getRequestReplicator().forwardToCoordinator(
getClusterCoordinatorNode(), user, HttpMethod.GET, groupUri, requestEntity, headers).awaitMergedResponse();
}
if (clusterResponse.getStatus() != Status.OK.getStatusCode()) {
return false;
}
final ProcessorsEntity processorsEntity = getResponseEntity(clusterResponse, ProcessorsEntity.class);
final Set<ProcessorEntity> processorEntities = processorsEntity.getProcessors();
if (isProcessorValidationComplete(processorEntities, processors)) {
logger.debug("All {} processors of interest now have been validated", processors.size());
return true;
}
// Not all of the processors are done validating. Pause for a bit and poll again.
continuePolling = pause.pause();
}
return false;
}
private boolean isProcessorValidationComplete(Set<ProcessorEntity> processorEntities, Map<String, AffectedComponentEntity> affectedComponents) {
updateAffectedProcessors(processorEntities, affectedComponents);
for (final ProcessorEntity entity : processorEntities) {
if (!affectedComponents.containsKey(entity.getId())) {
continue;
}
if (ProcessorDTO.VALIDATING.equals(entity.getComponent().getValidationStatus())) {
return false;
}
}
return true;
}
/**
* Periodically polls the process group with the given ID, waiting for all processors whose ID's are given to have the given Scheduled State.
*
@ -230,30 +298,32 @@ public class ClusterReplicationComponentLifecycle implements ComponentLifecycle
return entity;
}
private void updateAffectedProcessors(final Set<ProcessorEntity> processorEntities, final Map<String, AffectedComponentEntity> affectedComponents) {
// update the affected processors
processorEntities.stream()
.filter(entity -> affectedComponents.containsKey(entity.getId()))
.forEach(entity -> {
final AffectedComponentEntity affectedComponentEntity = affectedComponents.get(entity.getId());
affectedComponentEntity.setRevision(entity.getRevision());
// only consider update this component if the user had permissions to it
if (Boolean.TRUE.equals(affectedComponentEntity.getPermissions().getCanRead())) {
final AffectedComponentDTO affectedComponent = affectedComponentEntity.getComponent();
affectedComponent.setState(entity.getStatus().getAggregateSnapshot().getRunStatus());
affectedComponent.setActiveThreadCount(entity.getStatus().getAggregateSnapshot().getActiveThreadCount());
if (Boolean.TRUE.equals(entity.getPermissions().getCanRead())) {
affectedComponent.setValidationErrors(entity.getComponent().getValidationErrors());
}
}
});
}
private boolean isProcessorActionComplete(final Set<ProcessorEntity> processorEntities, final Map<String, AffectedComponentEntity> affectedComponents, final ScheduledState desiredState,
final InvalidComponentAction invalidComponentAction) throws LifecycleManagementException {
final String desiredStateName = desiredState.name();
// update the affected processors
processorEntities.stream()
.filter(entity -> affectedComponents.containsKey(entity.getId()))
.forEach(entity -> {
final AffectedComponentEntity affectedComponentEntity = affectedComponents.get(entity.getId());
affectedComponentEntity.setRevision(entity.getRevision());
// only consider update this component if the user had permissions to it
if (Boolean.TRUE.equals(affectedComponentEntity.getPermissions().getCanRead())) {
final AffectedComponentDTO affectedComponent = affectedComponentEntity.getComponent();
affectedComponent.setState(entity.getStatus().getAggregateSnapshot().getRunStatus());
affectedComponent.setActiveThreadCount(entity.getStatus().getAggregateSnapshot().getActiveThreadCount());
if (Boolean.TRUE.equals(entity.getPermissions().getCanRead())) {
affectedComponent.setValidationErrors(entity.getComponent().getValidationErrors());
}
}
});
updateAffectedProcessors(processorEntities, affectedComponents);
for (final ProcessorEntity entity : processorEntities) {
if (!affectedComponents.containsKey(entity.getId())) {
@ -320,6 +390,16 @@ public class ClusterReplicationComponentLifecycle implements ComponentLifecycle
final NiFiUser user = NiFiUserUtils.getNiFiUser();
// If enabling services, validation must complete first
if (desiredState == ControllerServiceState.ENABLED) {
try {
waitForControllerServiceValidation(user, originalUri, groupId, affectedServiceIds, pause);
} catch (InterruptedException e) {
Thread.currentThread().interrupt();
throw new LifecycleManagementException("Interrupted while waiting for Controller Services to complete validation");
}
}
// Determine whether we should replicate only to the cluster coordinator, or if we should replicate directly to the cluster nodes themselves.
try {
final NodeResponse clusterResponse;
@ -352,6 +432,67 @@ public class ClusterReplicationComponentLifecycle implements ComponentLifecycle
.collect(Collectors.toSet());
}
private boolean waitForControllerServiceValidation(final NiFiUser user, final URI originalUri, final String groupId,
final Set<String> serviceIds, final Pause pause)
throws InterruptedException {
URI groupUri;
try {
groupUri = new URI(originalUri.getScheme(), originalUri.getUserInfo(), originalUri.getHost(),
originalUri.getPort(), "/nifi-api/flow/process-groups/" + groupId + "/controller-services", "includeAncestorGroups=false,includeDescendantGroups=true", originalUri.getFragment());
} catch (URISyntaxException e) {
throw new RuntimeException(e);
}
final Map<String, String> headers = new HashMap<>();
final MultivaluedMap<String, String> requestEntity = new MultivaluedHashMap<>();
boolean continuePolling = true;
while (continuePolling) {
// Determine whether we should replicate only to the cluster coordinator, or if we should replicate directly to the cluster nodes themselves.
final NodeResponse clusterResponse;
if (getReplicationTarget() == ReplicationTarget.CLUSTER_NODES) {
clusterResponse = getRequestReplicator().replicate(user, HttpMethod.GET, groupUri, requestEntity, headers).awaitMergedResponse();
} else {
clusterResponse = getRequestReplicator().forwardToCoordinator(
getClusterCoordinatorNode(), user, HttpMethod.GET, groupUri, requestEntity, headers).awaitMergedResponse();
}
if (clusterResponse.getStatus() != Status.OK.getStatusCode()) {
return false;
}
final ControllerServicesEntity controllerServicesEntity = getResponseEntity(clusterResponse, ControllerServicesEntity.class);
final Set<ControllerServiceEntity> serviceEntities = controllerServicesEntity.getControllerServices();
final Map<String, AffectedComponentEntity> affectedServices = serviceEntities.stream()
.collect(Collectors.toMap(ControllerServiceEntity::getId, dtoFactory::createAffectedComponentEntity));
if (isControllerServiceValidationComplete(serviceEntities, affectedServices)) {
logger.debug("All {} controller services of interest have completed validation", affectedServices.size());
return true;
}
continuePolling = pause.pause();
}
return false;
}
private boolean isControllerServiceValidationComplete(final Set<ControllerServiceEntity> controllerServiceEntities, final Map<String, AffectedComponentEntity> affectedComponents) {
updateAffectedControllerServices(controllerServiceEntities, affectedComponents);
for (final ControllerServiceEntity entity : controllerServiceEntities) {
if (!affectedComponents.containsKey(entity.getId())) {
continue;
}
if (ControllerServiceDTO.VALIDATING.equals(entity.getComponent().getValidationStatus())) {
return false;
}
}
return true;
}
/**
* Periodically polls the process group with the given ID, waiting for all controller services whose ID's are given to have the given Controller Service State.
*

View File

@ -105,6 +105,9 @@ public class LocalComponentLifecycle implements ComponentLifecycle {
logger.debug("Starting components with ID's {} from Process Group {}", componentRevisions.keySet(), processGroupId);
// Wait for all affected processors to be either VALID or INVALID
waitForProcessorValidation(processGroupId, affectedComponents, pause);
serviceFacade.verifyScheduleComponents(processGroupId, ScheduledState.RUNNING, componentRevisions.keySet());
serviceFacade.scheduleComponents(processGroupId, ScheduledState.RUNNING, componentRevisions);
@ -130,6 +133,42 @@ public class LocalComponentLifecycle implements ComponentLifecycle {
waitForProcessorState(processGroupId, affectedComponents, ScheduledState.STOPPED, pause, invalidComponentAction);
}
/**
* Waits for all given Processors to complete validation
*
* @return <code>true</code> if all processors have completed validation, <code>false</code> if the given {@link Pause}
* indicated to give up before all of the processors have completed validation
*/
private boolean waitForProcessorValidation(final String groupId, final Map<String, AffectedComponentEntity> affectedComponents, final Pause pause) {
logger.debug("Waiting for {} processors to complete validation", affectedComponents.size());
boolean continuePolling = true;
while (continuePolling) {
final Set<ProcessorEntity> processorEntities = serviceFacade.getProcessors(groupId, true);
if (isProcessorValidationComplete(processorEntities, affectedComponents)) {
logger.debug("All {} processors of interest have completed validation", affectedComponents.size());
return true;
}
continuePolling = pause.pause();
}
return false;
}
private boolean isProcessorValidationComplete(final Set<ProcessorEntity> processorEntities, final Map<String, AffectedComponentEntity> affectedComponents) {
updateAffectedProcessors(processorEntities, affectedComponents);
for (final ProcessorEntity entity : processorEntities) {
if (!affectedComponents.containsKey(entity.getId())) {
continue;
}
if (ProcessorDTO.VALIDATING.equals(entity.getComponent().getValidationStatus())) {
return false;
}
}
return true;
}
/**
* Waits for all of the given Processors to reach the given Scheduled State.
*
@ -157,29 +196,33 @@ public class LocalComponentLifecycle implements ComponentLifecycle {
return false;
}
private void updateAffectedProcessors(final Set<ProcessorEntity> processorEntities, final Map<String, AffectedComponentEntity> affectedComponents) {
// update the affected processors
processorEntities.stream()
.filter(entity -> affectedComponents.containsKey(entity.getId()))
.forEach(entity -> {
final AffectedComponentEntity affectedComponentEntity = affectedComponents.get(entity.getId());
affectedComponentEntity.setRevision(entity.getRevision());
// only consider updating this component if the user has permissions to it
if (Boolean.TRUE.equals(affectedComponentEntity.getPermissions().getCanRead())) {
final AffectedComponentDTO affectedComponent = affectedComponentEntity.getComponent();
affectedComponent.setState(entity.getStatus().getAggregateSnapshot().getRunStatus());
affectedComponent.setActiveThreadCount(entity.getStatus().getAggregateSnapshot().getActiveThreadCount());
if (Boolean.TRUE.equals(entity.getPermissions().getCanRead())) {
affectedComponent.setValidationErrors(entity.getComponent().getValidationErrors());
}
}
});
}
private boolean isProcessorActionComplete(final Set<ProcessorEntity> processorEntities, final Map<String, AffectedComponentEntity> affectedComponents, final ScheduledState desiredState,
final InvalidComponentAction invalidComponentAction) throws LifecycleManagementException {
final String desiredStateName = desiredState.name();
// update the affected processors
processorEntities.stream()
.filter(entity -> affectedComponents.containsKey(entity.getId()))
.forEach(entity -> {
final AffectedComponentEntity affectedComponentEntity = affectedComponents.get(entity.getId());
affectedComponentEntity.setRevision(entity.getRevision());
// only consider updating this component if the user has permissions to it
if (Boolean.TRUE.equals(affectedComponentEntity.getPermissions().getCanRead())) {
final AffectedComponentDTO affectedComponent = affectedComponentEntity.getComponent();
affectedComponent.setState(entity.getStatus().getAggregateSnapshot().getRunStatus());
affectedComponent.setActiveThreadCount(entity.getStatus().getAggregateSnapshot().getActiveThreadCount());
if (Boolean.TRUE.equals(entity.getPermissions().getCanRead())) {
affectedComponent.setValidationErrors(entity.getComponent().getValidationErrors());
}
}
});
updateAffectedProcessors(processorEntities, affectedComponents);
for (final ProcessorEntity entity : processorEntities) {
if (!affectedComponents.containsKey(entity.getId())) {
@ -224,6 +267,8 @@ public class LocalComponentLifecycle implements ComponentLifecycle {
logger.debug("Enabling Controller Services with ID's {} from Process Group {}", serviceRevisions.keySet(), processGroupId);
waitForControllerServiceValidation(processGroupId, affectedServices, pause);
serviceFacade.verifyActivateControllerServices(processGroupId, ControllerServiceState.ENABLED, affectedServices.keySet());
serviceFacade.activateControllerServices(processGroupId, ControllerServiceState.ENABLED, serviceRevisions);
waitForControllerServiceState(processGroupId, affectedServices, ControllerServiceState.ENABLED, pause, invalidComponentAction);
@ -282,6 +327,39 @@ public class LocalComponentLifecycle implements ComponentLifecycle {
}
}
/**
* Waits for all given Controller Services to complete validation
*
* @return <code>true</code> if all processors have completed validation, <code>false</code> if the given {@link Pause}
* indicated to give up before all of the controller services have completed validation
*/
private boolean waitForControllerServiceValidation(final String groupId, final Map<String, AffectedComponentEntity> affectedComponents, final Pause pause) {
logger.debug("Waiting for {} controller services to complete validation", affectedComponents.size());
boolean continuePolling = true;
while (continuePolling) {
final Set<ControllerServiceEntity> serviceEntities = serviceFacade.getControllerServices(groupId, false, true);
if (isControllerServiceValidationComplete(serviceEntities, affectedComponents)) {
logger.debug("All {} controller services of interest have completed validation", affectedComponents.size());
return true;
}
continuePolling = pause.pause();
}
return false;
}
private boolean isControllerServiceValidationComplete(final Set<ControllerServiceEntity> controllerServiceEntities, final Map<String, AffectedComponentEntity> affectedComponents) {
updateAffectedControllerServices(controllerServiceEntities, affectedComponents);
for (final ControllerServiceEntity entity : controllerServiceEntities) {
if (!affectedComponents.containsKey(entity.getId())) {
continue;
}
if (ControllerServiceDTO.VALIDATING.equals(entity.getComponent().getValidationStatus())) {
return false;
}
}
return true;
}
/**
* Periodically polls the process group with the given ID, waiting for all controller services whose ID's are given to have the given Controller Service State.