YARN-11250. Capture the Performance Metrics of ZookeeperFederationStateStore. (#4738)

This commit is contained in:
slfan1989 2022-08-23 05:09:20 +08:00 committed by GitHub
parent 17daad34d4
commit eda4bb5dcd
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
6 changed files with 286 additions and 19 deletions

View File

@ -249,8 +249,7 @@ public class MemoryFederationStateStore implements FederationStateStore {
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
return GetApplicationHomeSubClusterResponse.newInstance( return GetApplicationHomeSubClusterResponse.newInstance(appId, applications.get(appId));
ApplicationHomeSubCluster.newInstance(appId, applications.get(appId)));
} }
@Override @Override

View File

@ -720,8 +720,7 @@ public class SQLFederationStateStore implements FederationStateStore {
FederationStateStoreUtils.returnToPool(LOG, cstmt); FederationStateStoreUtils.returnToPool(LOG, cstmt);
} }
return GetApplicationHomeSubClusterResponse return GetApplicationHomeSubClusterResponse
.newInstance(ApplicationHomeSubCluster .newInstance(request.getApplicationId(), homeRM);
.newInstance(request.getApplicationId(), homeRM));
} }
@Override @Override

View File

@ -0,0 +1,155 @@
/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with this
* work for additional information regarding copyright ownership. The ASF
* licenses this file to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
* <p>
* http://www.apache.org/licenses/LICENSE-2.0
* <p>
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations under
* the License.
*/
package org.apache.hadoop.yarn.server.federation.store.impl;
import org.apache.hadoop.classification.InterfaceAudience;
import org.apache.hadoop.classification.InterfaceStability;
import org.apache.hadoop.metrics2.MetricsCollector;
import org.apache.hadoop.metrics2.MetricsInfo;
import org.apache.hadoop.metrics2.MetricsSource;
import org.apache.hadoop.metrics2.MetricsSystem;
import org.apache.hadoop.metrics2.annotation.Metric;
import org.apache.hadoop.metrics2.annotation.Metrics;
import org.apache.hadoop.metrics2.lib.DefaultMetricsSystem;
import org.apache.hadoop.metrics2.lib.MetricsRegistry;
import org.apache.hadoop.metrics2.lib.MutableRate;
import static org.apache.hadoop.metrics2.lib.Interns.info;
@InterfaceAudience.Private
@InterfaceStability.Unstable
@Metrics(context="ZKFederationStateStore-op-durations")
public final class ZKFederationStateStoreOpDurations implements MetricsSource {
@Metric("Duration for a add application homeSubcluster call")
private MutableRate addAppHomeSubCluster;
@Metric("Duration for a update application homeSubcluster call")
private MutableRate updateAppHomeSubCluster;
@Metric("Duration for a get application homeSubcluster call")
private MutableRate getAppHomeSubCluster;
@Metric("Duration for a get applications homeSubcluster call")
private MutableRate getAppsHomeSubCluster;
@Metric("Duration for a delete applications homeSubcluster call")
private MutableRate deleteAppHomeSubCluster;
@Metric("Duration for a register subCluster call")
private MutableRate registerSubCluster;
@Metric("Duration for a deregister subCluster call")
private MutableRate deregisterSubCluster;
@Metric("Duration for a subCluster Heartbeat call")
private MutableRate subClusterHeartbeat;
@Metric("Duration for a get SubCluster call")
private MutableRate getSubCluster;
@Metric("Duration for a get SubClusters call")
private MutableRate getSubClusters;
@Metric("Duration for a get PolicyConfiguration call")
private MutableRate getPolicyConfiguration;
@Metric("Duration for a set PolicyConfiguration call")
private MutableRate setPolicyConfiguration;
@Metric("Duration for a get PolicyConfigurations call")
private MutableRate getPoliciesConfigurations;
protected static final MetricsInfo RECORD_INFO =
info("ZKFederationStateStoreOpDurations", "Durations of ZKFederationStateStore calls");
private final MetricsRegistry registry;
private static final ZKFederationStateStoreOpDurations INSTANCE =
new ZKFederationStateStoreOpDurations();
public static ZKFederationStateStoreOpDurations getInstance() {
return INSTANCE;
}
private ZKFederationStateStoreOpDurations() {
registry = new MetricsRegistry(RECORD_INFO);
registry.tag(RECORD_INFO, "ZKFederationStateStoreOpDurations");
MetricsSystem ms = DefaultMetricsSystem.instance();
if (ms != null) {
ms.register(RECORD_INFO.name(), RECORD_INFO.description(), this);
}
}
@Override
public synchronized void getMetrics(MetricsCollector collector, boolean all) {
registry.snapshot(collector.addRecord(registry.info()), all);
}
public void addAppHomeSubClusterDuration(long startTime, long endTime) {
addAppHomeSubCluster.add(endTime - startTime);
}
public void addUpdateAppHomeSubClusterDuration(long startTime, long endTime) {
updateAppHomeSubCluster.add(endTime - startTime);
}
public void addGetAppHomeSubClusterDuration(long startTime, long endTime) {
getAppHomeSubCluster.add(endTime - startTime);
}
public void addGetAppsHomeSubClusterDuration(long startTime, long endTime) {
getAppsHomeSubCluster.add(endTime - startTime);
}
public void addDeleteAppHomeSubClusterDuration(long startTime, long endTime) {
deleteAppHomeSubCluster.add(endTime - startTime);
}
public void addRegisterSubClusterDuration(long startTime, long endTime) {
registerSubCluster.add(endTime - startTime);
}
public void addDeregisterSubClusterDuration(long startTime, long endTime) {
deregisterSubCluster.add(endTime - startTime);
}
public void addSubClusterHeartbeatDuration(long startTime, long endTime) {
subClusterHeartbeat.add(endTime - startTime);
}
public void addGetSubClusterDuration(long startTime, long endTime) {
getSubCluster.add(endTime - startTime);
}
public void addGetSubClustersDuration(long startTime, long endTime) {
getSubClusters.add(endTime - startTime);
}
public void addGetPolicyConfigurationDuration(long startTime, long endTime) {
getPolicyConfiguration.add(endTime - startTime);
}
public void addSetPolicyConfigurationDuration(long startTime, long endTime) {
setPolicyConfiguration.add(endTime - startTime);
}
public void addGetPoliciesConfigurationsDuration(long startTime, long endTime) {
getPoliciesConfigurations.add(endTime - startTime);
}
}

View File

@ -25,6 +25,7 @@ import java.util.Calendar;
import java.util.List; import java.util.List;
import java.util.TimeZone; import java.util.TimeZone;
import org.apache.hadoop.classification.VisibleForTesting;
import org.apache.commons.lang3.NotImplementedException; import org.apache.commons.lang3.NotImplementedException;
import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.util.curator.ZKCuratorManager; import org.apache.hadoop.util.curator.ZKCuratorManager;
@ -84,6 +85,8 @@ import org.apache.hadoop.yarn.server.federation.store.utils.FederationMembership
import org.apache.hadoop.yarn.server.federation.store.utils.FederationPolicyStoreInputValidator; import org.apache.hadoop.yarn.server.federation.store.utils.FederationPolicyStoreInputValidator;
import org.apache.hadoop.yarn.server.federation.store.utils.FederationStateStoreUtils; import org.apache.hadoop.yarn.server.federation.store.utils.FederationStateStoreUtils;
import org.apache.hadoop.yarn.server.records.Version; import org.apache.hadoop.yarn.server.records.Version;
import org.apache.hadoop.yarn.util.Clock;
import org.apache.hadoop.yarn.util.SystemClock;
import org.apache.zookeeper.data.ACL; import org.apache.zookeeper.data.ACL;
import org.slf4j.Logger; import org.slf4j.Logger;
import org.slf4j.LoggerFactory; import org.slf4j.LoggerFactory;
@ -124,6 +127,12 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
private String membershipZNode; private String membershipZNode;
private String policiesZNode; private String policiesZNode;
private volatile Clock clock = SystemClock.getInstance();
@VisibleForTesting
private ZKFederationStateStoreOpDurations opDurations =
ZKFederationStateStoreOpDurations.getInstance();
@Override @Override
public void init(Configuration conf) throws YarnException { public void init(Configuration conf) throws YarnException {
LOG.info("Initializing ZooKeeper connection"); LOG.info("Initializing ZooKeeper connection");
@ -153,7 +162,6 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot create base directories: " + e.getMessage(); String errMsg = "Cannot create base directories: " + e.getMessage();
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
} }
@Override @Override
@ -167,6 +175,7 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
public AddApplicationHomeSubClusterResponse addApplicationHomeSubCluster( public AddApplicationHomeSubClusterResponse addApplicationHomeSubCluster(
AddApplicationHomeSubClusterRequest request) throws YarnException { AddApplicationHomeSubClusterRequest request) throws YarnException {
long start = clock.getTime();
FederationApplicationHomeSubClusterStoreInputValidator.validate(request); FederationApplicationHomeSubClusterStoreInputValidator.validate(request);
ApplicationHomeSubCluster app = request.getApplicationHomeSubCluster(); ApplicationHomeSubCluster app = request.getApplicationHomeSubCluster();
ApplicationId appId = app.getApplicationId(); ApplicationId appId = app.getApplicationId();
@ -187,7 +196,8 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot check app home subcluster for " + appId; String errMsg = "Cannot check app home subcluster for " + appId;
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
long end = clock.getTime();
opDurations.addAppHomeSubClusterDuration(start, end);
return AddApplicationHomeSubClusterResponse return AddApplicationHomeSubClusterResponse
.newInstance(homeSubCluster); .newInstance(homeSubCluster);
} }
@ -198,6 +208,7 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
UpdateApplicationHomeSubClusterRequest request) UpdateApplicationHomeSubClusterRequest request)
throws YarnException { throws YarnException {
long start = clock.getTime();
FederationApplicationHomeSubClusterStoreInputValidator.validate(request); FederationApplicationHomeSubClusterStoreInputValidator.validate(request);
ApplicationHomeSubCluster app = request.getApplicationHomeSubCluster(); ApplicationHomeSubCluster app = request.getApplicationHomeSubCluster();
ApplicationId appId = app.getApplicationId(); ApplicationId appId = app.getApplicationId();
@ -209,6 +220,9 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
SubClusterId newSubClusterId = SubClusterId newSubClusterId =
request.getApplicationHomeSubCluster().getHomeSubCluster(); request.getApplicationHomeSubCluster().getHomeSubCluster();
putApp(appId, newSubClusterId, true); putApp(appId, newSubClusterId, true);
long end = clock.getTime();
opDurations.addUpdateAppHomeSubClusterDuration(start, end);
return UpdateApplicationHomeSubClusterResponse.newInstance(); return UpdateApplicationHomeSubClusterResponse.newInstance();
} }
@ -216,6 +230,7 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
public GetApplicationHomeSubClusterResponse getApplicationHomeSubCluster( public GetApplicationHomeSubClusterResponse getApplicationHomeSubCluster(
GetApplicationHomeSubClusterRequest request) throws YarnException { GetApplicationHomeSubClusterRequest request) throws YarnException {
long start = clock.getTime();
FederationApplicationHomeSubClusterStoreInputValidator.validate(request); FederationApplicationHomeSubClusterStoreInputValidator.validate(request);
ApplicationId appId = request.getApplicationId(); ApplicationId appId = request.getApplicationId();
SubClusterId homeSubCluster = getApp(appId); SubClusterId homeSubCluster = getApp(appId);
@ -223,13 +238,15 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Application " + appId + " does not exist"; String errMsg = "Application " + appId + " does not exist";
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
return GetApplicationHomeSubClusterResponse.newInstance( long end = clock.getTime();
ApplicationHomeSubCluster.newInstance(appId, homeSubCluster)); opDurations.addGetAppHomeSubClusterDuration(start, end);
return GetApplicationHomeSubClusterResponse.newInstance(appId, homeSubCluster);
} }
@Override @Override
public GetApplicationsHomeSubClusterResponse getApplicationsHomeSubCluster( public GetApplicationsHomeSubClusterResponse getApplicationsHomeSubCluster(
GetApplicationsHomeSubClusterRequest request) throws YarnException { GetApplicationsHomeSubClusterRequest request) throws YarnException {
long start = clock.getTime();
List<ApplicationHomeSubCluster> result = new ArrayList<>(); List<ApplicationHomeSubCluster> result = new ArrayList<>();
try { try {
@ -244,7 +261,8 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot get apps: " + e.getMessage(); String errMsg = "Cannot get apps: " + e.getMessage();
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
long end = clock.getTime();
opDurations.addGetAppsHomeSubClusterDuration(start, end);
return GetApplicationsHomeSubClusterResponse.newInstance(result); return GetApplicationsHomeSubClusterResponse.newInstance(result);
} }
@ -253,7 +271,7 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
deleteApplicationHomeSubCluster( deleteApplicationHomeSubCluster(
DeleteApplicationHomeSubClusterRequest request) DeleteApplicationHomeSubClusterRequest request)
throws YarnException { throws YarnException {
long start = clock.getTime();
FederationApplicationHomeSubClusterStoreInputValidator.validate(request); FederationApplicationHomeSubClusterStoreInputValidator.validate(request);
ApplicationId appId = request.getApplicationId(); ApplicationId appId = request.getApplicationId();
String appZNode = getNodePath(appsZNode, appId.toString()); String appZNode = getNodePath(appsZNode, appId.toString());
@ -276,13 +294,15 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot delete app: " + e.getMessage(); String errMsg = "Cannot delete app: " + e.getMessage();
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
long end = clock.getTime();
opDurations.addDeleteAppHomeSubClusterDuration(start, end);
return DeleteApplicationHomeSubClusterResponse.newInstance(); return DeleteApplicationHomeSubClusterResponse.newInstance();
} }
@Override @Override
public SubClusterRegisterResponse registerSubCluster( public SubClusterRegisterResponse registerSubCluster(
SubClusterRegisterRequest request) throws YarnException { SubClusterRegisterRequest request) throws YarnException {
long start = clock.getTime();
FederationMembershipStateStoreInputValidator.validate(request); FederationMembershipStateStoreInputValidator.validate(request);
SubClusterInfo subClusterInfo = request.getSubClusterInfo(); SubClusterInfo subClusterInfo = request.getSubClusterInfo();
SubClusterId subclusterId = subClusterInfo.getSubClusterId(); SubClusterId subclusterId = subClusterInfo.getSubClusterId();
@ -297,12 +317,15 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot register subcluster: " + e.getMessage(); String errMsg = "Cannot register subcluster: " + e.getMessage();
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
long end = clock.getTime();
opDurations.addRegisterSubClusterDuration(start, end);
return SubClusterRegisterResponse.newInstance(); return SubClusterRegisterResponse.newInstance();
} }
@Override @Override
public SubClusterDeregisterResponse deregisterSubCluster( public SubClusterDeregisterResponse deregisterSubCluster(
SubClusterDeregisterRequest request) throws YarnException { SubClusterDeregisterRequest request) throws YarnException {
long start = clock.getTime();
FederationMembershipStateStoreInputValidator.validate(request); FederationMembershipStateStoreInputValidator.validate(request);
SubClusterId subClusterId = request.getSubClusterId(); SubClusterId subClusterId = request.getSubClusterId();
SubClusterState state = request.getState(); SubClusterState state = request.getState();
@ -316,14 +339,15 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
subClusterInfo.setState(state); subClusterInfo.setState(state);
putSubclusterInfo(subClusterId, subClusterInfo, true); putSubclusterInfo(subClusterId, subClusterInfo, true);
} }
long end = clock.getTime();
opDurations.addDeregisterSubClusterDuration(start, end);
return SubClusterDeregisterResponse.newInstance(); return SubClusterDeregisterResponse.newInstance();
} }
@Override @Override
public SubClusterHeartbeatResponse subClusterHeartbeat( public SubClusterHeartbeatResponse subClusterHeartbeat(
SubClusterHeartbeatRequest request) throws YarnException { SubClusterHeartbeatRequest request) throws YarnException {
long start = clock.getTime();
FederationMembershipStateStoreInputValidator.validate(request); FederationMembershipStateStoreInputValidator.validate(request);
SubClusterId subClusterId = request.getSubClusterId(); SubClusterId subClusterId = request.getSubClusterId();
@ -340,14 +364,15 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
subClusterInfo.setCapability(request.getCapability()); subClusterInfo.setCapability(request.getCapability());
putSubclusterInfo(subClusterId, subClusterInfo, true); putSubclusterInfo(subClusterId, subClusterInfo, true);
long end = clock.getTime();
opDurations.addSubClusterHeartbeatDuration(start, end);
return SubClusterHeartbeatResponse.newInstance(); return SubClusterHeartbeatResponse.newInstance();
} }
@Override @Override
public GetSubClusterInfoResponse getSubCluster( public GetSubClusterInfoResponse getSubCluster(
GetSubClusterInfoRequest request) throws YarnException { GetSubClusterInfoRequest request) throws YarnException {
long start = clock.getTime();
FederationMembershipStateStoreInputValidator.validate(request); FederationMembershipStateStoreInputValidator.validate(request);
SubClusterId subClusterId = request.getSubClusterId(); SubClusterId subClusterId = request.getSubClusterId();
SubClusterInfo subClusterInfo = null; SubClusterInfo subClusterInfo = null;
@ -361,12 +386,15 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot get subcluster: " + e.getMessage(); String errMsg = "Cannot get subcluster: " + e.getMessage();
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
long end = clock.getTime();
opDurations.addGetSubClusterDuration(start, end);
return GetSubClusterInfoResponse.newInstance(subClusterInfo); return GetSubClusterInfoResponse.newInstance(subClusterInfo);
} }
@Override @Override
public GetSubClustersInfoResponse getSubClusters( public GetSubClustersInfoResponse getSubClusters(
GetSubClustersInfoRequest request) throws YarnException { GetSubClustersInfoRequest request) throws YarnException {
long start = clock.getTime();
List<SubClusterInfo> result = new ArrayList<>(); List<SubClusterInfo> result = new ArrayList<>();
try { try {
@ -382,6 +410,8 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot get subclusters: " + e.getMessage(); String errMsg = "Cannot get subclusters: " + e.getMessage();
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
long end = clock.getTime();
opDurations.addGetSubClustersDuration(start, end);
return GetSubClustersInfoResponse.newInstance(result); return GetSubClustersInfoResponse.newInstance(result);
} }
@ -389,7 +419,7 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
@Override @Override
public GetSubClusterPolicyConfigurationResponse getPolicyConfiguration( public GetSubClusterPolicyConfigurationResponse getPolicyConfiguration(
GetSubClusterPolicyConfigurationRequest request) throws YarnException { GetSubClusterPolicyConfigurationRequest request) throws YarnException {
long start = clock.getTime();
FederationPolicyStoreInputValidator.validate(request); FederationPolicyStoreInputValidator.validate(request);
String queue = request.getQueue(); String queue = request.getQueue();
SubClusterPolicyConfiguration policy = null; SubClusterPolicyConfiguration policy = null;
@ -404,6 +434,8 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
LOG.warn("Policy for queue: {} does not exist.", queue); LOG.warn("Policy for queue: {} does not exist.", queue);
return null; return null;
} }
long end = clock.getTime();
opDurations.addGetPolicyConfigurationDuration(start, end);
return GetSubClusterPolicyConfigurationResponse return GetSubClusterPolicyConfigurationResponse
.newInstance(policy); .newInstance(policy);
} }
@ -411,7 +443,7 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
@Override @Override
public SetSubClusterPolicyConfigurationResponse setPolicyConfiguration( public SetSubClusterPolicyConfigurationResponse setPolicyConfiguration(
SetSubClusterPolicyConfigurationRequest request) throws YarnException { SetSubClusterPolicyConfigurationRequest request) throws YarnException {
long start = clock.getTime();
FederationPolicyStoreInputValidator.validate(request); FederationPolicyStoreInputValidator.validate(request);
SubClusterPolicyConfiguration policy = SubClusterPolicyConfiguration policy =
request.getPolicyConfiguration(); request.getPolicyConfiguration();
@ -422,12 +454,15 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot set policy: " + e.getMessage(); String errMsg = "Cannot set policy: " + e.getMessage();
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
long end = clock.getTime();
opDurations.addSetPolicyConfigurationDuration(start, end);
return SetSubClusterPolicyConfigurationResponse.newInstance(); return SetSubClusterPolicyConfigurationResponse.newInstance();
} }
@Override @Override
public GetSubClusterPoliciesConfigurationsResponse getPoliciesConfigurations( public GetSubClusterPoliciesConfigurationsResponse getPoliciesConfigurations(
GetSubClusterPoliciesConfigurationsRequest request) throws YarnException { GetSubClusterPoliciesConfigurationsRequest request) throws YarnException {
long start = clock.getTime();
List<SubClusterPolicyConfiguration> result = new ArrayList<>(); List<SubClusterPolicyConfiguration> result = new ArrayList<>();
try { try {
@ -443,6 +478,8 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
String errMsg = "Cannot get policies: " + e.getMessage(); String errMsg = "Cannot get policies: " + e.getMessage();
FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg); FederationStateStoreUtils.logAndThrowStoreException(LOG, errMsg);
} }
long end = clock.getTime();
opDurations.addGetPoliciesConfigurationsDuration(start, end);
return GetSubClusterPoliciesConfigurationsResponse.newInstance(result); return GetSubClusterPoliciesConfigurationsResponse.newInstance(result);
} }
@ -649,6 +686,11 @@ public class ZookeeperFederationStateStore implements FederationStateStore {
return cal.getTimeInMillis(); return cal.getTimeInMillis();
} }
@VisibleForTesting
public ZKFederationStateStoreOpDurations getOpDurations() {
return opDurations;
}
@Override @Override
public AddReservationHomeSubClusterResponse addReservationHomeSubCluster( public AddReservationHomeSubClusterResponse addReservationHomeSubCluster(
AddReservationHomeSubClusterRequest request) throws YarnException { AddReservationHomeSubClusterRequest request) throws YarnException {

View File

@ -20,6 +20,7 @@ package org.apache.hadoop.yarn.server.federation.store.records;
import org.apache.hadoop.classification.InterfaceAudience.Private; import org.apache.hadoop.classification.InterfaceAudience.Private;
import org.apache.hadoop.classification.InterfaceAudience.Public; import org.apache.hadoop.classification.InterfaceAudience.Public;
import org.apache.hadoop.classification.InterfaceStability.Unstable; import org.apache.hadoop.classification.InterfaceStability.Unstable;
import org.apache.hadoop.yarn.api.records.ApplicationId;
import org.apache.hadoop.yarn.util.Records; import org.apache.hadoop.yarn.util.Records;
/** /**
@ -42,7 +43,9 @@ public abstract class GetApplicationHomeSubClusterResponse {
@Private @Private
@Unstable @Unstable
public static GetApplicationHomeSubClusterResponse newInstance( public static GetApplicationHomeSubClusterResponse newInstance(
ApplicationHomeSubCluster applicationHomeSubCluster) { ApplicationId appId, SubClusterId homeSubCluster) {
ApplicationHomeSubCluster applicationHomeSubCluster =
ApplicationHomeSubCluster.newInstance(appId, homeSubCluster);
GetApplicationHomeSubClusterResponse mapResponse = GetApplicationHomeSubClusterResponse mapResponse =
Records.newRecord(GetApplicationHomeSubClusterResponse.class); Records.newRecord(GetApplicationHomeSubClusterResponse.class);
mapResponse.setApplicationHomeSubCluster(applicationHomeSubCluster); mapResponse.setApplicationHomeSubCluster(applicationHomeSubCluster);

View File

@ -25,14 +25,21 @@ import org.apache.curator.retry.RetryNTimes;
import org.apache.curator.test.TestingServer; import org.apache.curator.test.TestingServer;
import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.CommonConfigurationKeys; import org.apache.hadoop.fs.CommonConfigurationKeys;
import org.apache.hadoop.metrics2.MetricsRecord;
import org.apache.hadoop.metrics2.impl.MetricsCollectorImpl;
import org.apache.hadoop.metrics2.impl.MetricsRecords;
import org.apache.hadoop.util.Time;
import org.apache.hadoop.yarn.conf.YarnConfiguration; import org.apache.hadoop.yarn.conf.YarnConfiguration;
import org.apache.hadoop.yarn.exceptions.YarnException; import org.apache.hadoop.yarn.exceptions.YarnException;
import org.apache.hadoop.yarn.server.federation.store.FederationStateStore; import org.apache.hadoop.yarn.server.federation.store.FederationStateStore;
import org.junit.After; import org.junit.After;
import org.junit.Before; import org.junit.Before;
import org.junit.Test;
import org.slf4j.Logger; import org.slf4j.Logger;
import org.slf4j.LoggerFactory; import org.slf4j.LoggerFactory;
import static org.junit.Assert.assertEquals;
/** /**
* Unit tests for ZookeeperFederationStateStore. * Unit tests for ZookeeperFederationStateStore.
*/ */
@ -84,4 +91,66 @@ public class TestZookeeperFederationStateStore
super.setConf(getConf()); super.setConf(getConf());
return new ZookeeperFederationStateStore(); return new ZookeeperFederationStateStore();
} }
@Test
public void testMetricsInited() throws Exception {
ZookeeperFederationStateStore zkStateStore = (ZookeeperFederationStateStore) createStateStore();
ZKFederationStateStoreOpDurations zkStateStoreOpDurations = zkStateStore.getOpDurations();
MetricsCollectorImpl collector = new MetricsCollectorImpl();
long anyDuration = 10;
long start = Time.now();
long end = start + anyDuration;
zkStateStoreOpDurations.addAppHomeSubClusterDuration(start, end);
zkStateStoreOpDurations.addUpdateAppHomeSubClusterDuration(start, end);
zkStateStoreOpDurations.addGetAppHomeSubClusterDuration(start, end);
zkStateStoreOpDurations.addGetAppsHomeSubClusterDuration(start, end);
zkStateStoreOpDurations.addDeleteAppHomeSubClusterDuration(start, end);
zkStateStoreOpDurations.addRegisterSubClusterDuration(start, end);
zkStateStoreOpDurations.addDeregisterSubClusterDuration(start, end);
zkStateStoreOpDurations.addSubClusterHeartbeatDuration(start, end);
zkStateStoreOpDurations.addGetSubClusterDuration(start, end);
zkStateStoreOpDurations.addGetSubClustersDuration(start, end);
zkStateStoreOpDurations.addGetPolicyConfigurationDuration(start, end);
zkStateStoreOpDurations.addSetPolicyConfigurationDuration(start, end);
zkStateStoreOpDurations.addGetPoliciesConfigurationsDuration(start, end);
zkStateStoreOpDurations.getMetrics(collector, true);
assertEquals("Incorrect number of perf metrics", 1, collector.getRecords().size());
MetricsRecord record = collector.getRecords().get(0);
MetricsRecords.assertTag(record, ZKFederationStateStoreOpDurations.RECORD_INFO.name(),
"ZKFederationStateStoreOpDurations");
double expectAvgTime = anyDuration;
MetricsRecords.assertMetric(record, "AddAppHomeSubClusterAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "UpdateAppHomeSubClusterAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "GetAppHomeSubClusterAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "GetAppsHomeSubClusterAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "DeleteAppHomeSubClusterAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "RegisterSubClusterAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "DeregisterSubClusterAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "SubClusterHeartbeatAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "GetSubClusterAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "GetSubClustersAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "GetPolicyConfigurationAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "SetPolicyConfigurationAvgTime", expectAvgTime);
MetricsRecords.assertMetric(record, "GetPoliciesConfigurationsAvgTime", expectAvgTime);
long expectOps = 1;
MetricsRecords.assertMetric(record, "AddAppHomeSubClusterNumOps", expectOps);
MetricsRecords.assertMetric(record, "UpdateAppHomeSubClusterNumOps", expectOps);
MetricsRecords.assertMetric(record, "GetAppHomeSubClusterNumOps", expectOps);
MetricsRecords.assertMetric(record, "GetAppsHomeSubClusterNumOps", expectOps);
MetricsRecords.assertMetric(record, "DeleteAppHomeSubClusterNumOps", expectOps);
MetricsRecords.assertMetric(record, "RegisterSubClusterNumOps", expectOps);
MetricsRecords.assertMetric(record, "DeregisterSubClusterNumOps", expectOps);
MetricsRecords.assertMetric(record, "SubClusterHeartbeatNumOps", expectOps);
MetricsRecords.assertMetric(record, "GetSubClusterNumOps", expectOps);
MetricsRecords.assertMetric(record, "GetSubClustersNumOps", expectOps);
MetricsRecords.assertMetric(record, "GetPolicyConfigurationNumOps", expectOps);
MetricsRecords.assertMetric(record, "SetPolicyConfigurationNumOps", expectOps);
MetricsRecords.assertMetric(record, "GetPoliciesConfigurationsNumOps", expectOps);
}
} }