HADOOP-17165. Implement service-user feature in DecayRPCScheduler. (#2240)
This commit is contained in:
parent
85119267be
commit
e5fe326270
|
@ -20,11 +20,14 @@ package org.apache.hadoop.ipc;
|
||||||
|
|
||||||
import java.lang.ref.WeakReference;
|
import java.lang.ref.WeakReference;
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
|
import java.util.Collection;
|
||||||
import java.util.Collections;
|
import java.util.Collections;
|
||||||
import java.util.HashMap;
|
import java.util.HashMap;
|
||||||
|
import java.util.HashSet;
|
||||||
import java.util.Iterator;
|
import java.util.Iterator;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
|
import java.util.Set;
|
||||||
import java.util.Timer;
|
import java.util.Timer;
|
||||||
import java.util.TimerTask;
|
import java.util.TimerTask;
|
||||||
import java.util.concurrent.ConcurrentHashMap;
|
import java.util.concurrent.ConcurrentHashMap;
|
||||||
|
@ -108,6 +111,13 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
public static final String IPC_FCQ_DECAYSCHEDULER_THRESHOLDS_KEY =
|
public static final String IPC_FCQ_DECAYSCHEDULER_THRESHOLDS_KEY =
|
||||||
"faircallqueue.decay-scheduler.thresholds";
|
"faircallqueue.decay-scheduler.thresholds";
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Service users will always be scheduled into the highest-priority queue.
|
||||||
|
* They are specified as a comma-separated list.
|
||||||
|
*/
|
||||||
|
public static final String IPC_DECAYSCHEDULER_SERVICE_USERS_KEY =
|
||||||
|
"decay-scheduler.service-users";
|
||||||
|
|
||||||
// Specifies the identity to use when the IdentityProvider cannot handle
|
// Specifies the identity to use when the IdentityProvider cannot handle
|
||||||
// a schedulable.
|
// a schedulable.
|
||||||
public static final String DECAYSCHEDULER_UNKNOWN_IDENTITY =
|
public static final String DECAYSCHEDULER_UNKNOWN_IDENTITY =
|
||||||
|
@ -178,6 +188,7 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
private static final double PRECISION = 0.0001;
|
private static final double PRECISION = 0.0001;
|
||||||
private MetricsProxy metricsProxy;
|
private MetricsProxy metricsProxy;
|
||||||
private final CostProvider costProvider;
|
private final CostProvider costProvider;
|
||||||
|
private Set<String> serviceUserNames;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* This TimerTask will call decayCurrentCosts until
|
* This TimerTask will call decayCurrentCosts until
|
||||||
|
@ -229,6 +240,7 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
conf);
|
conf);
|
||||||
this.backOffResponseTimeThresholds =
|
this.backOffResponseTimeThresholds =
|
||||||
parseBackOffResponseTimeThreshold(ns, conf, numLevels);
|
parseBackOffResponseTimeThreshold(ns, conf, numLevels);
|
||||||
|
this.serviceUserNames = this.parseServiceUserNames(ns, conf);
|
||||||
|
|
||||||
// Setup response time metrics
|
// Setup response time metrics
|
||||||
responseTimeTotalInCurrWindow = new AtomicLongArray(numLevels);
|
responseTimeTotalInCurrWindow = new AtomicLongArray(numLevels);
|
||||||
|
@ -359,6 +371,12 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
return decimals;
|
return decimals;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
private Set<String> parseServiceUserNames(String ns, Configuration conf) {
|
||||||
|
Collection<String> collection = conf.getStringCollection(
|
||||||
|
ns + "." + IPC_DECAYSCHEDULER_SERVICE_USERS_KEY);
|
||||||
|
return new HashSet<>(collection);
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Generate default thresholds if user did not specify. Strategy is
|
* Generate default thresholds if user did not specify. Strategy is
|
||||||
* to halve each time, since queue usage tends to be exponential.
|
* to halve each time, since queue usage tends to be exponential.
|
||||||
|
@ -486,7 +504,7 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
AtomicLong value = entry.getValue().get(0);
|
AtomicLong value = entry.getValue().get(0);
|
||||||
|
|
||||||
long snapshot = value.get();
|
long snapshot = value.get();
|
||||||
int computedLevel = computePriorityLevel(snapshot);
|
int computedLevel = computePriorityLevel(snapshot, id);
|
||||||
|
|
||||||
nextCache.put(id, computedLevel);
|
nextCache.put(id, computedLevel);
|
||||||
}
|
}
|
||||||
|
@ -534,9 +552,15 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
* Given the cost for an identity, compute a scheduling decision.
|
* Given the cost for an identity, compute a scheduling decision.
|
||||||
*
|
*
|
||||||
* @param cost the cost for an identity
|
* @param cost the cost for an identity
|
||||||
|
* @param identity the identity of the user
|
||||||
* @return scheduling decision from 0 to numLevels - 1
|
* @return scheduling decision from 0 to numLevels - 1
|
||||||
*/
|
*/
|
||||||
private int computePriorityLevel(long cost) {
|
private int computePriorityLevel(long cost, Object identity) {
|
||||||
|
// The priority for service users is always 0
|
||||||
|
if (isServiceUser((String)identity)) {
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
long totalCallSnapshot = totalDecayedCallCost.get();
|
long totalCallSnapshot = totalDecayedCallCost.get();
|
||||||
|
|
||||||
double proportion = 0;
|
double proportion = 0;
|
||||||
|
@ -576,7 +600,7 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
// Cache was no good, compute it
|
// Cache was no good, compute it
|
||||||
List<AtomicLong> costList = callCosts.get(identity);
|
List<AtomicLong> costList = callCosts.get(identity);
|
||||||
long currentCost = costList == null ? 0 : costList.get(0).get();
|
long currentCost = costList == null ? 0 : costList.get(0).get();
|
||||||
int priority = computePriorityLevel(currentCost);
|
int priority = computePriorityLevel(currentCost, identity);
|
||||||
LOG.debug("compute priority for {} priority {}", identity, priority);
|
LOG.debug("compute priority for {} priority {}", identity, priority);
|
||||||
return priority;
|
return priority;
|
||||||
}
|
}
|
||||||
|
@ -598,6 +622,10 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
return cachedOrComputedPriorityLevel(identity);
|
return cachedOrComputedPriorityLevel(identity);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
private boolean isServiceUser(String userName) {
|
||||||
|
return this.serviceUserNames.contains(userName);
|
||||||
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
public boolean shouldBackOff(Schedulable obj) {
|
public boolean shouldBackOff(Schedulable obj) {
|
||||||
Boolean backOff = false;
|
Boolean backOff = false;
|
||||||
|
@ -698,6 +726,11 @@ public class DecayRpcScheduler implements RpcScheduler,
|
||||||
return thresholds;
|
return thresholds;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@VisibleForTesting
|
||||||
|
Set<String> getServiceUserNames() {
|
||||||
|
return serviceUserNames;
|
||||||
|
}
|
||||||
|
|
||||||
@VisibleForTesting
|
@VisibleForTesting
|
||||||
void forceDecay() {
|
void forceDecay() {
|
||||||
decayCurrentCosts();
|
decayCurrentCosts();
|
||||||
|
|
|
@ -2584,6 +2584,14 @@
|
||||||
</description>
|
</description>
|
||||||
</property>
|
</property>
|
||||||
|
|
||||||
|
<property>
|
||||||
|
<name>ipc.[port_number].decay-scheduler.service-users</name>
|
||||||
|
<value></value>
|
||||||
|
<description>Service users will always be scheduled into the highest-priority
|
||||||
|
queue. They are specified as a comma-separated list.
|
||||||
|
</description>
|
||||||
|
</property>
|
||||||
|
|
||||||
<property>
|
<property>
|
||||||
<name>ipc.[port_number].weighted-cost.lockshared</name>
|
<name>ipc.[port_number].weighted-cost.lockshared</name>
|
||||||
<value>10</value>
|
<value>10</value>
|
||||||
|
|
|
@ -91,6 +91,9 @@ This is configurable via the **identity provider**, which defaults to the **User
|
||||||
provider simply uses the username of the client submitting the request. However, a custom identity provider can be used
|
provider simply uses the username of the client submitting the request. However, a custom identity provider can be used
|
||||||
to performing throttling based on other groupings, or using an external identity provider.
|
to performing throttling based on other groupings, or using an external identity provider.
|
||||||
|
|
||||||
|
If particular users submit important requests and you don't want to limit them, you can set them up as the
|
||||||
|
**service-users**. They are always scheduled into the high-priority queue.
|
||||||
|
|
||||||
### Cost-based Fair Call Queue
|
### Cost-based Fair Call Queue
|
||||||
|
|
||||||
Though the fair call queue itself does a good job of mitigating the impact from users who submit a very high _number_
|
Though the fair call queue itself does a good job of mitigating the impact from users who submit a very high _number_
|
||||||
|
@ -138,6 +141,7 @@ omitted.
|
||||||
| decay-scheduler.backoff.responsetime.enable | DecayRpcScheduler | Whether or not to enable the backoff by response time feature. | false |
|
| decay-scheduler.backoff.responsetime.enable | DecayRpcScheduler | Whether or not to enable the backoff by response time feature. | false |
|
||||||
| decay-scheduler.backoff.responsetime.thresholds | DecayRpcScheduler | The response time thresholds, as time durations, for each priority queue. If the average response time for a queue is above this threshold, backoff will occur in lower priority queues. This should be a comma-separated list of length equal to the number of priority levels. | Threshold increases by 10s per level (e.g., for 4 levels: `10s,20s,30s,40s`) |
|
| decay-scheduler.backoff.responsetime.thresholds | DecayRpcScheduler | The response time thresholds, as time durations, for each priority queue. If the average response time for a queue is above this threshold, backoff will occur in lower priority queues. This should be a comma-separated list of length equal to the number of priority levels. | Threshold increases by 10s per level (e.g., for 4 levels: `10s,20s,30s,40s`) |
|
||||||
| decay-scheduler.metrics.top.user.count | DecayRpcScheduler | The number of top (i.e., heaviest) users to emit metric information about. | 10 |
|
| decay-scheduler.metrics.top.user.count | DecayRpcScheduler | The number of top (i.e., heaviest) users to emit metric information about. | 10 |
|
||||||
|
| decay-scheduler.service-users | DecayRpcScheduler | Service users will always be scheduled into the highest-priority queue. They are specified as a comma-separated list. | |
|
||||||
| weighted-cost.lockshared | WeightedTimeCostProvider | The weight multiplier to apply to the time spent in the processing phase which holds a shared (read) lock. | 10 |
|
| weighted-cost.lockshared | WeightedTimeCostProvider | The weight multiplier to apply to the time spent in the processing phase which holds a shared (read) lock. | 10 |
|
||||||
| weighted-cost.lockexclusive | WeightedTimeCostProvider | The weight multiplier to apply to the time spent in the processing phase which holds an exclusive (write) lock. | 100 |
|
| weighted-cost.lockexclusive | WeightedTimeCostProvider | The weight multiplier to apply to the time spent in the processing phase which holds an exclusive (write) lock. | 100 |
|
||||||
| weighted-cost.{handler,lockfree,response} | WeightedTimeCostProvider | The weight multiplier to apply to the time spent in the processing phases which do not involve holding a lock. See `org.apache.hadoop.ipc.ProcessingDetails.Timing` for more details on each phase. | 1 |
|
| weighted-cost.{handler,lockfree,response} | WeightedTimeCostProvider | The weight multiplier to apply to the time spent in the processing phases which do not involve holding a lock. See `org.apache.hadoop.ipc.ProcessingDetails.Timing` for more details on each phase. | 1 |
|
||||||
|
|
|
@ -172,6 +172,8 @@ public class TestCommonConfigurationFields extends TestConfigurationFieldsBase {
|
||||||
"ipc.[port_number].decay-scheduler.backoff.responsetime.thresholds");
|
"ipc.[port_number].decay-scheduler.backoff.responsetime.thresholds");
|
||||||
xmlPropsToSkipCompare.add(
|
xmlPropsToSkipCompare.add(
|
||||||
"ipc.[port_number].decay-scheduler.metrics.top.user.count");
|
"ipc.[port_number].decay-scheduler.metrics.top.user.count");
|
||||||
|
xmlPropsToSkipCompare.add(
|
||||||
|
"ipc.[port_number].decay-scheduler.service-users");
|
||||||
xmlPropsToSkipCompare.add("ipc.[port_number].weighted-cost.lockshared");
|
xmlPropsToSkipCompare.add("ipc.[port_number].weighted-cost.lockshared");
|
||||||
xmlPropsToSkipCompare.add("ipc.[port_number].weighted-cost.lockexclusive");
|
xmlPropsToSkipCompare.add("ipc.[port_number].weighted-cost.lockexclusive");
|
||||||
xmlPropsToSkipCompare.add("ipc.[port_number].weighted-cost.handler");
|
xmlPropsToSkipCompare.add("ipc.[port_number].weighted-cost.handler");
|
||||||
|
|
|
@ -20,9 +20,14 @@ package org.apache.hadoop.ipc;
|
||||||
|
|
||||||
import static java.lang.Thread.sleep;
|
import static java.lang.Thread.sleep;
|
||||||
|
|
||||||
|
import java.util.Map;
|
||||||
|
import org.eclipse.jetty.util.ajax.JSON;
|
||||||
import org.junit.Test;
|
import org.junit.Test;
|
||||||
|
|
||||||
import static org.junit.Assert.*;
|
import static org.junit.Assert.assertEquals;
|
||||||
|
import static org.junit.Assert.assertFalse;
|
||||||
|
import static org.junit.Assert.assertNotEquals;
|
||||||
|
import static org.junit.Assert.assertTrue;
|
||||||
import static org.mockito.Mockito.mock;
|
import static org.mockito.Mockito.mock;
|
||||||
import static org.mockito.Mockito.when;
|
import static org.mockito.Mockito.when;
|
||||||
|
|
||||||
|
@ -383,4 +388,37 @@ public class TestDecayRpcScheduler {
|
||||||
scheduler.addResponseTime("ignored", mockCall, emptyProcessingDetails);
|
scheduler.addResponseTime("ignored", mockCall, emptyProcessingDetails);
|
||||||
return priority;
|
return priority;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testServiceUsers() {
|
||||||
|
Configuration conf = new Configuration();
|
||||||
|
conf.setLong("ipc.19."
|
||||||
|
+ DecayRpcScheduler.IPC_SCHEDULER_DECAYSCHEDULER_PERIOD_KEY, 999999);
|
||||||
|
conf.set("ipc.19." + DecayRpcScheduler.IPC_DECAYSCHEDULER_SERVICE_USERS_KEY,
|
||||||
|
"service1,service2");
|
||||||
|
scheduler = new DecayRpcScheduler(4, "ipc.19", conf);
|
||||||
|
|
||||||
|
assertTrue(scheduler.getServiceUserNames().contains("service1"));
|
||||||
|
assertTrue(scheduler.getServiceUserNames().contains("service2"));
|
||||||
|
|
||||||
|
for (int i = 0; i < 10; i++) {
|
||||||
|
getPriorityIncrementCallCount("user1");
|
||||||
|
getPriorityIncrementCallCount("service1");
|
||||||
|
getPriorityIncrementCallCount("service2");
|
||||||
|
}
|
||||||
|
|
||||||
|
assertNotEquals(0, scheduler.getPriorityLevel(mockCall("user1")));
|
||||||
|
// The priorities of service users should be always 0.
|
||||||
|
assertEquals(0, scheduler.getPriorityLevel(mockCall("service1")));
|
||||||
|
assertEquals(0, scheduler.getPriorityLevel(mockCall("service2")));
|
||||||
|
|
||||||
|
// DecayRpcScheduler caches priorities after decay
|
||||||
|
scheduler.forceDecay();
|
||||||
|
// Check priorities on cache
|
||||||
|
String summary = scheduler.getSchedulingDecisionSummary();
|
||||||
|
Map<String, Object> summaryMap = (Map<String, Object>) JSON.parse(summary);
|
||||||
|
assertNotEquals(0L, summaryMap.get("user1"));
|
||||||
|
assertEquals(0L, summaryMap.get("service1"));
|
||||||
|
assertEquals(0L, summaryMap.get("service2"));
|
||||||
|
}
|
||||||
}
|
}
|
Loading…
Reference in New Issue