YARN-9848. Revert YARN-4946. Contributed by Steven Rand.

This commit is contained in:
Akira Ajisaka 2020-10-16 01:04:45 +09:00
parent 392b26c23b
commit a2c1fb7c8c
No known key found for this signature in database
GPG Key ID: C1EDBB9CA400FD50
7 changed files with 25 additions and 254 deletions

View File

@ -93,7 +93,7 @@ public class RMAppManager implements EventHandler<RMAppManagerEvent>,
private int maxCompletedAppsInMemory;
private int maxCompletedAppsInStateStore;
protected int completedAppsInStateStore = 0;
protected LinkedList<ApplicationId> completedApps = new LinkedList<>();
private LinkedList<ApplicationId> completedApps = new LinkedList<>();
private final RMContext rmContext;
private final ApplicationMasterService masterService;
@ -323,72 +323,31 @@ public class RMAppManager implements EventHandler<RMAppManagerEvent>,
* check to see if hit the limit for max # completed apps kept
*/
protected synchronized void checkAppNumCompletedLimit() {
if (completedAppsInStateStore > maxCompletedAppsInStateStore) {
removeCompletedAppsFromStateStore();
}
if (completedApps.size() > maxCompletedAppsInMemory) {
removeCompletedAppsFromMemory();
}
}
private void removeCompletedAppsFromStateStore() {
int numDelete = completedAppsInStateStore - maxCompletedAppsInStateStore;
for (int i = 0; i < numDelete; i++) {
ApplicationId removeId = completedApps.get(i);
// check apps kept in state store.
while (completedAppsInStateStore > this.maxCompletedAppsInStateStore) {
ApplicationId removeId =
completedApps.get(completedApps.size() - completedAppsInStateStore);
RMApp removeApp = rmContext.getRMApps().get(removeId);
boolean deleteApp = shouldDeleteApp(removeApp);
if (deleteApp) {
LOG.info("Max number of completed apps kept in state store met:"
+ " maxCompletedAppsInStateStore = "
+ maxCompletedAppsInStateStore + ", removing app " + removeId
+ " from state store.");
rmContext.getStateStore().removeApplication(removeApp);
completedAppsInStateStore--;
} else {
LOG.info("Max number of completed apps kept in state store met:"
+ " maxCompletedAppsInStateStore = "
+ maxCompletedAppsInStateStore + ", but not removing app "
+ removeId
+ " from state store as log aggregation have not finished yet.");
}
LOG.info("Max number of completed apps kept in state store met:"
+ " maxCompletedAppsInStateStore = " + maxCompletedAppsInStateStore
+ ", removing app " + removeApp.getApplicationId()
+ " from state store.");
rmContext.getStateStore().removeApplication(removeApp);
completedAppsInStateStore--;
}
}
private void removeCompletedAppsFromMemory() {
int numDelete = completedApps.size() - maxCompletedAppsInMemory;
int offset = 0;
for (int i = 0; i < numDelete; i++) {
int deletionIdx = i - offset;
ApplicationId removeId = completedApps.get(deletionIdx);
RMApp removeApp = rmContext.getRMApps().get(removeId);
boolean deleteApp = shouldDeleteApp(removeApp);
if (deleteApp) {
++offset;
LOG.info("Application should be expired, max number of completed apps"
+ " kept in memory met: maxCompletedAppsInMemory = "
+ this.maxCompletedAppsInMemory + ", removing app " + removeId
+ " from memory: ");
completedApps.remove(deletionIdx);
rmContext.getRMApps().remove(removeId);
this.applicationACLsManager.removeApplication(removeId);
} else {
LOG.info("Application should be expired, max number of completed apps"
+ " kept in memory met: maxCompletedAppsInMemory = "
+ this.maxCompletedAppsInMemory + ", but not removing app "
+ removeId
+ " from memory as log aggregation have not finished yet.");
}
// check apps kept in memory.
while (completedApps.size() > this.maxCompletedAppsInMemory) {
ApplicationId removeId = completedApps.remove();
LOG.info("Application should be expired, max number of completed apps"
+ " kept in memory met: maxCompletedAppsInMemory = "
+ this.maxCompletedAppsInMemory + ", removing app " + removeId
+ " from memory: ");
rmContext.getRMApps().remove(removeId);
this.applicationACLsManager.removeApplication(removeId);
}
}
/**
 * Decides whether a completed application may be removed.
 *
 * @param app the application to inspect
 * @return {@code true} when log aggregation is not enabled for the app, or
 *         when it is enabled and has already finished
 */
private boolean shouldDeleteApp(RMApp app) {
  if (!app.isLogAggregationEnabled()) {
    // No aggregation to wait for, so the app can go right away.
    return true;
  }
  return app.isLogAggregationFinished();
}
@SuppressWarnings("unchecked")
protected void submitApplication(
ApplicationSubmissionContext submissionContext, long submitTime,

View File

@ -243,10 +243,6 @@ public interface RMApp extends EventHandler<RMAppEvent> {
*/
int getMaxAppAttempts();
/**
 * Tells whether log aggregation is enabled for this application.
 * @return true if log aggregation is enabled, false otherwise.
 */
boolean isLogAggregationEnabled();
/**
 * Tells whether log aggregation has finished for this application.
 * @return true if log aggregation has finished, false otherwise.
 */
boolean isLogAggregationFinished();
/**
* Returns the application type
* @return the application type.

View File

@ -1755,16 +1755,6 @@ public class RMAppImpl implements RMApp, Recoverable {
logAggregation.aggregateLogReport(nodeId, report, this);
}
/**
 * Reports the finished state of log aggregation by delegating to
 * {@code logAggregation.isFinished()}.
 */
@Override
public boolean isLogAggregationFinished() {
return logAggregation.isFinished();
}
/**
 * Reports whether log aggregation is enabled by delegating to
 * {@code logAggregation.isEnabled()}.
 */
@Override
public boolean isLogAggregationEnabled() {
return logAggregation.isEnabled();
}
/**
 * Returns the log aggregation failure messages for the given node, as
 * provided by {@code logAggregation}.
 *
 * @param nodeId the node whose failure messages are requested
 * @return the value returned by
 *         {@code logAggregation.getLogAggregationFailureMessagesForNM}
 */
public String getLogAggregationFailureMessagesForNM(NodeId nodeId) {
return logAggregation.getLogAggregationFailureMessagesForNM(nodeId);
}

View File

@ -18,23 +18,14 @@
package org.apache.hadoop.yarn.server.resourcemanager;
import static java.util.stream.Collectors.toSet;
import static org.mockito.Mockito.times;
import static org.mockito.Mockito.verify;
import java.util.List;
import java.util.Set;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.yarn.api.records.ApplicationId;
import org.apache.hadoop.yarn.api.records.ApplicationSubmissionContext;
import org.apache.hadoop.yarn.exceptions.YarnException;
import org.apache.hadoop.yarn.server.resourcemanager.recovery.RMStateStore;
import org.apache.hadoop.yarn.server.resourcemanager.rmapp.RMApp;
import org.apache.hadoop.yarn.server.resourcemanager.scheduler.YarnScheduler;
import org.apache.hadoop.yarn.server.resourcemanager.security.ClientToAMTokenSecretManagerInRM;
import org.apache.hadoop.yarn.server.security.ApplicationACLsManager;
import org.mockito.ArgumentCaptor;
/**
* Base class for AppManager related test.
@ -75,28 +66,6 @@ public class AppManagerTestBase {
return this.completedAppsInStateStore;
}
/**
 * Exposes the completed-apps list for test assertions.
 * Note that the {@code completedApps} field itself is returned, not a copy.
 *
 * @return the {@code completedApps} list
 */
public List<ApplicationId> getCompletedApps() {
return completedApps;
}
/**
 * Collects the first {@code n} entries of the completed-apps list into a set.
 *
 * @param n maximum number of leading entries to take
 * @return a set holding at most {@code n} application IDs
 */
public Set<ApplicationId> getFirstNCompletedApps(int n) {
return getCompletedApps().stream().limit(n).collect(toSet());
}
/**
 * Collects, from the first {@code n} entries of the completed-apps list,
 * those whose {@code getId()} is even.
 *
 * @param n number of leading entries to consider
 * @return the even-ID application IDs found among those entries
 */
public Set<ApplicationId> getCompletedAppsWithEvenIdsInRange(int n) {
// limit() is applied before filter(), so n bounds the range that is
// inspected, not the size of the result.
return getCompletedApps().stream().limit(n)
.filter(app -> app.getId() % 2 == 0).collect(toSet());
}
/**
 * Verifies that {@code removeApplication} was invoked on the state store
 * exactly {@code numRemoves} times and returns the IDs of the apps that
 * were passed to those invocations.
 *
 * @param numRemoves the expected number of {@code removeApplication} calls
 * @return the application IDs of the captured apps
 */
public Set<ApplicationId> getRemovedAppsFromStateStore(int numRemoves) {
  ArgumentCaptor<RMApp> removedApps = ArgumentCaptor.forClass(RMApp.class);
  // The verification fails if the call count differs from numRemoves.
  verify(stateStore, times(numRemoves))
      .removeApplication(removedApps.capture());
  List<RMApp> capturedApps = removedApps.getAllValues();
  return capturedApps.stream()
      .map(RMApp::getApplicationId)
      .collect(toSet());
}
public void submitApplication(
ApplicationSubmissionContext submissionContext, String user)
throws YarnException {

View File

@ -91,12 +91,10 @@ import java.io.IOException;
import java.nio.ByteBuffer;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Comparator;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.concurrent.ConcurrentMap;
import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity.CapacitySchedulerConfiguration.PREFIX;
@ -141,52 +139,12 @@ public class TestAppManager extends AppManagerTestBase{
return list;
}
/**
 * Creates {@code n} mock apps with IDs {@code 0..n-1}. Log aggregation is
 * enabled on every app, but it is marked finished only on apps with an
 * even ID.
 *
 * @param n number of apps to create
 * @param time passed to each {@code MockRMApp} constructor
 * @param state passed to each {@code MockRMApp} constructor
 * @return the created apps, in ascending ID order
 */
private static List<RMApp> newRMAppsMixedLogAggregationStatus(int n,
    long time, RMAppState state) {
  List<RMApp> apps = Lists.newArrayList();
  int id = 0;
  while (id < n) {
    MockRMApp app = new MockRMApp(id, time, state);
    app.setLogAggregationEnabled(true);
    boolean evenId = (id % 2 == 0);
    app.setLogAggregationFinished(evenId);
    apps.add(app);
    id++;
  }
  return apps;
}
/**
 * Builds a mock RM context over the app map produced by
 * {@code createRMAppsMap(n, time)}.
 *
 * @param n number of apps to create
 * @param time forwarded to the app factory
 * @return the context built by {@code createMockRMContextInternal}
 */
public RMContext mockRMContext(int n, long time) {
  return createMockRMContextInternal(createRMAppsMap(n, time));
}
/**
 * Builds a mock RM context over the app map produced by
 * {@code createRMAppsMapMixedLogAggStatus(n, time)}.
 *
 * @param n number of apps to create
 * @param time forwarded to the app factory
 * @return the context built by {@code createMockRMContextInternal}
 */
public RMContext mockRMContextWithMixedLogAggregationStatus(int n,
    long time) {
  return createMockRMContextInternal(
      createRMAppsMapMixedLogAggStatus(n, time));
}
/**
 * Creates {@code n} apps in {@code FINISHED} state via {@code newRMApps}
 * and indexes them by application ID.
 *
 * @param n number of apps to create
 * @param time forwarded to {@code newRMApps}
 * @return a concurrent map from application ID to app
 */
private ConcurrentMap<ApplicationId, RMApp> createRMAppsMap(int n,
    long time) {
  final List<RMApp> finishedApps = newRMApps(n, time, RMAppState.FINISHED);
  final ConcurrentMap<ApplicationId, RMApp> appsById =
      Maps.newConcurrentMap();
  finishedApps.forEach(
      finished -> appsById.put(finished.getApplicationId(), finished));
  return appsById;
}
/**
 * Creates {@code n} apps in {@code FINISHED} state via
 * {@code newRMAppsMixedLogAggregationStatus} and indexes them by
 * application ID.
 *
 * @param n number of apps to create
 * @param time forwarded to the app factory
 * @return a concurrent map from application ID to app
 */
private ConcurrentMap<ApplicationId, RMApp> createRMAppsMapMixedLogAggStatus(
    int n, long time) {
  final List<RMApp> mixedApps =
      newRMAppsMixedLogAggregationStatus(n, time, RMAppState.FINISHED);
  final ConcurrentMap<ApplicationId, RMApp> appsById =
      Maps.newConcurrentMap();
  mixedApps.forEach(
      mixed -> appsById.put(mixed.getApplicationId(), mixed));
  return appsById;
}
private RMContext createMockRMContextInternal(ConcurrentMap<ApplicationId, RMApp> map) {
Dispatcher rmDispatcher = new AsyncDispatcher();
ContainerAllocationExpirer containerAllocationExpirer = new ContainerAllocationExpirer(
rmDispatcher);
@ -238,12 +196,9 @@ public class TestAppManager extends AppManagerTestBase{
}
}
private void addToCompletedApps(TestRMAppManager appMonitor,
RMContext rmContext) {
// ensure applications are finished in order by their IDs
List<RMApp> sortedApps = new ArrayList<>(rmContext.getRMApps().values());
sortedApps.sort(Comparator.comparingInt(o -> o.getApplicationId().getId()));
for (RMApp app : sortedApps) {
protected void addToCompletedApps(
TestRMAppManager appMonitor, RMContext rmContext) {
for (RMApp app : rmContext.getRMApps().values()) {
if (app.getState() == RMAppState.FINISHED
|| app.getState() == RMAppState.KILLED
|| app.getState() == RMAppState.FAILED) {
@ -652,32 +607,18 @@ public class TestAppManager extends AppManagerTestBase{
addToCompletedApps(appMonitor, rmContext);
Assert.assertEquals("Number of completed apps incorrect", allApps,
appMonitor.getCompletedAppsListSize());
int numRemoveAppsFromStateStore = allApps - maxAppsInStateStore;
Set<ApplicationId> appsShouldBeRemovedFromStateStore = appMonitor
.getFirstNCompletedApps(numRemoveAppsFromStateStore);
appMonitor.checkAppNumCompletedLimit();
Set<ApplicationId> removedAppsFromStateStore = appMonitor
.getRemovedAppsFromStateStore(numRemoveAppsFromStateStore);
Assert.assertEquals("Number of apps incorrect after # completed check",
maxAppsInMemory, rmContext.getRMApps().size());
Assert.assertEquals("Number of completed apps incorrect after check",
maxAppsInMemory, appMonitor.getCompletedAppsListSize());
int numRemoveAppsFromStateStore = 10 - maxAppsInStateStore;
verify(rmContext.getStateStore(), times(numRemoveAppsFromStateStore))
.removeApplication(isA(RMApp.class));
Assert.assertEquals(maxAppsInStateStore,
appMonitor.getNumberOfCompletedAppsInStateStore());
List<ApplicationId> completedApps = appMonitor.getCompletedApps();
Assert.assertEquals(maxAppsInMemory, completedApps.size());
Assert.assertEquals(numRemoveAppsFromStateStore,
removedAppsFromStateStore.size());
Assert.assertEquals(numRemoveAppsFromStateStore,
Sets.intersection(appsShouldBeRemovedFromStateStore,
removedAppsFromStateStore).size());
}
@Test
@ -695,12 +636,9 @@ public class TestAppManager extends AppManagerTestBase{
addToCompletedApps(appMonitor, rmContext);
Assert.assertEquals("Number of completed apps incorrect", allApps,
appMonitor.getCompletedAppsListSize());
int numRemoveApps = allApps - maxAppsInMemory;
Set<ApplicationId> appsShouldBeRemoved = appMonitor
.getFirstNCompletedApps(numRemoveApps);
appMonitor.checkAppNumCompletedLimit();
int numRemoveApps = allApps - maxAppsInMemory;
Assert.assertEquals("Number of apps incorrect after # completed check",
maxAppsInMemory, rmContext.getRMApps().size());
Assert.assertEquals("Number of completed apps incorrect after check",
@ -709,56 +647,6 @@ public class TestAppManager extends AppManagerTestBase{
isA(RMApp.class));
Assert.assertEquals(maxAppsInMemory,
appMonitor.getNumberOfCompletedAppsInStateStore());
List<ApplicationId> completedApps = appMonitor.getCompletedApps();
Assert.assertEquals(maxAppsInMemory, completedApps.size());
Assert.assertEquals(numRemoveApps, appsShouldBeRemoved.size());
assertTrue(Collections.disjoint(completedApps, appsShouldBeRemoved));
}
/**
 * Exercises the completed-app limit check when log aggregation is enabled
 * on every app but has finished only on some of them.
 *
 * Ten finished apps are registered against an in-memory limit of two, so
 * eight apps exceed the limit. The test expects only half of those eight
 * to be removed, leaving six apps in memory and in the state-store count.
 */
@Test
public void testStateStoreAppLimitSomeAppsHaveNotFinishedLogAggregation() {
long now = System.currentTimeMillis();
final int allApps = 10;
RMContext rmContext =
mockRMContextWithMixedLogAggregationStatus(allApps, now - 20000);
Configuration conf = new YarnConfiguration();
int maxAppsInMemory = 2;
conf.setInt(YarnConfiguration.RM_MAX_COMPLETED_APPLICATIONS,
maxAppsInMemory);
// greater than maxCompletedAppsInMemory, reset to
// RM_MAX_COMPLETED_APPLICATIONS.
conf.setInt(YarnConfiguration.RM_STATE_STORE_MAX_COMPLETED_APPLICATIONS,
1000);
TestRMAppManager appMonitor = new TestRMAppManager(rmContext, conf);
addToCompletedApps(appMonitor, rmContext);
// Precondition: every app is tracked as completed before the check runs.
Assert.assertEquals("Number of completed apps incorrect", allApps,
appMonitor.getCompletedAppsListSize());
// numRemoveApps is how many apps exceed the in-memory limit (10 - 2 = 8).
int numRemoveApps = allApps - maxAppsInMemory;
int effectiveNumRemoveApps = numRemoveApps / 2;
// Only apps with an even ID are expected to be deleted, because of their
// log aggregation status; the rest stay in memory.
int expectedNumberOfAppsInMemory = maxAppsInMemory + effectiveNumRemoveApps;
// Capture the expected removals before the check mutates the list.
Set<ApplicationId> appsShouldBeRemoved = appMonitor
.getCompletedAppsWithEvenIdsInRange(numRemoveApps);
appMonitor.checkAppNumCompletedLimit();
Assert.assertEquals("Number of apps incorrect after # completed check",
expectedNumberOfAppsInMemory, rmContext.getRMApps().size());
Assert.assertEquals("Number of completed apps incorrect after check",
expectedNumberOfAppsInMemory, appMonitor.getCompletedAppsListSize());
// The state store must see exactly one removal per deleted app.
verify(rmContext.getStateStore(), times(effectiveNumRemoveApps))
.removeApplication(isA(RMApp.class));
Assert.assertEquals(expectedNumberOfAppsInMemory,
appMonitor.getNumberOfCompletedAppsInStateStore());
List<ApplicationId> completedApps = appMonitor.getCompletedApps();
Assert.assertEquals(expectedNumberOfAppsInMemory, completedApps.size());
Assert.assertEquals(effectiveNumRemoveApps, appsShouldBeRemoved.size());
// None of the apps expected to be removed may still be tracked.
assertTrue(Collections.disjoint(completedApps, appsShouldBeRemoved));
}
protected void setupDispatcher(RMContext rmContext, Configuration conf) {

View File

@ -146,17 +146,6 @@ public abstract class MockAsm extends MockApps {
public int getMaxAppAttempts() {
throw new UnsupportedOperationException("Not supported yet.");
}
/**
 * Not implemented; always throws {@link UnsupportedOperationException}.
 */
@Override
public boolean isLogAggregationEnabled() {
throw new UnsupportedOperationException("Not supported yet.");
}
/**
 * Not implemented; always throws {@link UnsupportedOperationException}.
 */
@Override
public boolean isLogAggregationFinished() {
throw new UnsupportedOperationException("Not supported yet.");
}
@Override
public ApplicationReport createAndGetApplicationReport(
String clientUserName,boolean allowAccess) {

View File

@ -70,8 +70,6 @@ public class MockRMApp implements RMApp {
int maxAppAttempts = 1;
List<ResourceRequest> amReqs;
private Set<String> applicationTags = null;
private boolean logAggregationEnabled;
private boolean logAggregationFinished;
public MockRMApp(int newid, long time, RMAppState newState) {
finish = time;
@ -238,24 +236,6 @@ public class MockRMApp implements RMApp {
return maxAppAttempts;
}
/**
 * Returns the {@code logAggregationEnabled} flag held by this mock.
 */
@Override
public boolean isLogAggregationEnabled() {
return logAggregationEnabled;
}
/**
 * Returns the {@code logAggregationFinished} flag held by this mock.
 */
@Override
public boolean isLogAggregationFinished() {
return logAggregationFinished;
}
/**
 * Sets the value that {@code isLogAggregationEnabled()} returns.
 *
 * @param enabled the new value of the enabled flag
 */
public void setLogAggregationEnabled(boolean enabled) {
this.logAggregationEnabled = enabled;
}
/**
 * Sets the value that {@code isLogAggregationFinished()} returns.
 *
 * @param finished the new value of the finished flag
 */
public void setLogAggregationFinished(boolean finished) {
this.logAggregationFinished = finished;
}
/**
 * Sets the {@code maxAppAttempts} field. Despite the method name, the
 * value is stored as the maximum number of app attempts.
 *
 * @param maxAppAttempts the new value of {@code maxAppAttempts}
 */
public void setNumMaxRetries(int maxAppAttempts) {
this.maxAppAttempts = maxAppAttempts;
}