YARN-4225. Add preemption status to yarn queue -status for capacity scheduler. (Eric Payne via wangda)
This commit is contained in:
parent
79c41b1d83
commit
7faa406f27
@ -1145,6 +1145,9 @@ Release 2.8.0 - UNRELEASED
|
|||||||
YARN-4452. NPE when submit Unmanaged application. (Naganarasimha G R
|
YARN-4452. NPE when submit Unmanaged application. (Naganarasimha G R
|
||||||
via junping_du)
|
via junping_du)
|
||||||
|
|
||||||
|
YARN-4225. Add preemption status to yarn queue -status for capacity scheduler.
|
||||||
|
(Eric Payne via wangda)
|
||||||
|
|
||||||
Release 2.7.3 - UNRELEASED
|
Release 2.7.3 - UNRELEASED
|
||||||
|
|
||||||
INCOMPATIBLE CHANGES
|
INCOMPATIBLE CHANGES
|
||||||
|
@ -500,4 +500,9 @@
|
|||||||
</Or>
|
</Or>
|
||||||
<Bug pattern="URF_UNREAD_PUBLIC_OR_PROTECTED_FIELD" />
|
<Bug pattern="URF_UNREAD_PUBLIC_OR_PROTECTED_FIELD" />
|
||||||
</Match>
|
</Match>
|
||||||
|
|
||||||
|
<Match>
|
||||||
|
<Package name="org.apache.hadoop.yarn.api.records.impl.pb" />
|
||||||
|
<Bug pattern="NP_BOOLEAN_RETURN_NULL" />
|
||||||
|
</Match>
|
||||||
</FindBugsFilter>
|
</FindBugsFilter>
|
||||||
|
@ -55,7 +55,8 @@ public static QueueInfo newInstance(String queueName, float capacity,
|
|||||||
float maximumCapacity, float currentCapacity,
|
float maximumCapacity, float currentCapacity,
|
||||||
List<QueueInfo> childQueues, List<ApplicationReport> applications,
|
List<QueueInfo> childQueues, List<ApplicationReport> applications,
|
||||||
QueueState queueState, Set<String> accessibleNodeLabels,
|
QueueState queueState, Set<String> accessibleNodeLabels,
|
||||||
String defaultNodeLabelExpression, QueueStatistics queueStatistics) {
|
String defaultNodeLabelExpression, QueueStatistics queueStatistics,
|
||||||
|
boolean preemptionDisabled) {
|
||||||
QueueInfo queueInfo = Records.newRecord(QueueInfo.class);
|
QueueInfo queueInfo = Records.newRecord(QueueInfo.class);
|
||||||
queueInfo.setQueueName(queueName);
|
queueInfo.setQueueName(queueName);
|
||||||
queueInfo.setCapacity(capacity);
|
queueInfo.setCapacity(capacity);
|
||||||
@ -67,6 +68,7 @@ public static QueueInfo newInstance(String queueName, float capacity,
|
|||||||
queueInfo.setAccessibleNodeLabels(accessibleNodeLabels);
|
queueInfo.setAccessibleNodeLabels(accessibleNodeLabels);
|
||||||
queueInfo.setDefaultNodeLabelExpression(defaultNodeLabelExpression);
|
queueInfo.setDefaultNodeLabelExpression(defaultNodeLabelExpression);
|
||||||
queueInfo.setQueueStatistics(queueStatistics);
|
queueInfo.setQueueStatistics(queueStatistics);
|
||||||
|
queueInfo.setPreemptionDisabled(preemptionDisabled);
|
||||||
return queueInfo;
|
return queueInfo;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -205,4 +207,16 @@ public abstract void setDefaultNodeLabelExpression(
|
|||||||
@Unstable
|
@Unstable
|
||||||
public abstract void setQueueStatistics(QueueStatistics queueStatistics);
|
public abstract void setQueueStatistics(QueueStatistics queueStatistics);
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Get the <em>preemption status</em> of the queue.
|
||||||
|
* @return if property is not in proto, return null;
|
||||||
|
* otherwise, return <em>preemption status</em> of the queue
|
||||||
|
*/
|
||||||
|
@Public
|
||||||
|
@Stable
|
||||||
|
public abstract Boolean getPreemptionDisabled();
|
||||||
|
|
||||||
|
@Private
|
||||||
|
@Unstable
|
||||||
|
public abstract void setPreemptionDisabled(boolean preemptionDisabled);
|
||||||
}
|
}
|
||||||
|
@ -416,6 +416,7 @@ message QueueInfoProto {
|
|||||||
repeated string accessibleNodeLabels = 8;
|
repeated string accessibleNodeLabels = 8;
|
||||||
optional string defaultNodeLabelExpression = 9;
|
optional string defaultNodeLabelExpression = 9;
|
||||||
optional QueueStatisticsProto queueStatistics = 10;
|
optional QueueStatisticsProto queueStatistics = 10;
|
||||||
|
optional bool preemptionDisabled = 11;
|
||||||
}
|
}
|
||||||
|
|
||||||
enum QueueACLProto {
|
enum QueueACLProto {
|
||||||
|
@ -152,5 +152,11 @@ private void printQueueInfo(PrintWriter writer, QueueInfo queueInfo) {
|
|||||||
labelList.append(nodeLabel);
|
labelList.append(nodeLabel);
|
||||||
}
|
}
|
||||||
writer.println(labelList.toString());
|
writer.println(labelList.toString());
|
||||||
|
|
||||||
|
Boolean preemptStatus = queueInfo.getPreemptionDisabled();
|
||||||
|
if (preemptStatus != null) {
|
||||||
|
writer.print("\tPreemption : ");
|
||||||
|
writer.println(preemptStatus ? "disabled" : "enabled");
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -665,7 +665,7 @@ public List<NodeReport> createFakeNodeReports() {
|
|||||||
|
|
||||||
public QueueInfo createFakeQueueInfo() {
|
public QueueInfo createFakeQueueInfo() {
|
||||||
return QueueInfo.newInstance("root", 100f, 100f, 50f, null,
|
return QueueInfo.newInstance("root", 100f, 100f, 50f, null,
|
||||||
createFakeAppReports(), QueueState.RUNNING, null, null, null);
|
createFakeAppReports(), QueueState.RUNNING, null, null, null, false);
|
||||||
}
|
}
|
||||||
|
|
||||||
public List<QueueUserACLInfo> createFakeQueueUserACLInfoList() {
|
public List<QueueUserACLInfo> createFakeQueueUserACLInfoList() {
|
||||||
|
@ -46,6 +46,7 @@
|
|||||||
|
|
||||||
import org.apache.commons.cli.Options;
|
import org.apache.commons.cli.Options;
|
||||||
import org.apache.commons.lang.time.DateFormatUtils;
|
import org.apache.commons.lang.time.DateFormatUtils;
|
||||||
|
import org.apache.hadoop.conf.Configuration;
|
||||||
import org.apache.hadoop.yarn.api.records.ApplicationAttemptId;
|
import org.apache.hadoop.yarn.api.records.ApplicationAttemptId;
|
||||||
import org.apache.hadoop.yarn.api.records.ApplicationAttemptReport;
|
import org.apache.hadoop.yarn.api.records.ApplicationAttemptReport;
|
||||||
import org.apache.hadoop.yarn.api.records.ApplicationId;
|
import org.apache.hadoop.yarn.api.records.ApplicationId;
|
||||||
@ -69,9 +70,15 @@
|
|||||||
import org.apache.hadoop.yarn.api.records.YarnApplicationAttemptState;
|
import org.apache.hadoop.yarn.api.records.YarnApplicationAttemptState;
|
||||||
import org.apache.hadoop.yarn.api.records.YarnApplicationState;
|
import org.apache.hadoop.yarn.api.records.YarnApplicationState;
|
||||||
import org.apache.hadoop.yarn.client.api.YarnClient;
|
import org.apache.hadoop.yarn.client.api.YarnClient;
|
||||||
|
import org.apache.hadoop.yarn.conf.YarnConfiguration;
|
||||||
import org.apache.hadoop.yarn.exceptions.ApplicationAttemptNotFoundException;
|
import org.apache.hadoop.yarn.exceptions.ApplicationAttemptNotFoundException;
|
||||||
import org.apache.hadoop.yarn.exceptions.ApplicationNotFoundException;
|
import org.apache.hadoop.yarn.exceptions.ApplicationNotFoundException;
|
||||||
import org.apache.hadoop.yarn.exceptions.ContainerNotFoundException;
|
import org.apache.hadoop.yarn.exceptions.ContainerNotFoundException;
|
||||||
|
import org.apache.hadoop.yarn.server.MiniYARNCluster;
|
||||||
|
import org.apache.hadoop.yarn.server.resourcemanager.reservation.ReservationSystemTestUtil;
|
||||||
|
import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceScheduler;
|
||||||
|
import org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity.CapacityScheduler;
|
||||||
|
import org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity.CapacitySchedulerConfiguration;
|
||||||
import org.apache.hadoop.yarn.util.Records;
|
import org.apache.hadoop.yarn.util.Records;
|
||||||
import org.junit.Assert;
|
import org.junit.Assert;
|
||||||
import org.junit.Before;
|
import org.junit.Before;
|
||||||
@ -1324,7 +1331,7 @@ public void testGetQueueInfo() throws Exception {
|
|||||||
nodeLabels.add("GPU");
|
nodeLabels.add("GPU");
|
||||||
nodeLabels.add("JDK_7");
|
nodeLabels.add("JDK_7");
|
||||||
QueueInfo queueInfo = QueueInfo.newInstance("queueA", 0.4f, 0.8f, 0.5f,
|
QueueInfo queueInfo = QueueInfo.newInstance("queueA", 0.4f, 0.8f, 0.5f,
|
||||||
null, null, QueueState.RUNNING, nodeLabels, "GPU", null);
|
null, null, QueueState.RUNNING, nodeLabels, "GPU", null, false);
|
||||||
when(client.getQueueInfo(any(String.class))).thenReturn(queueInfo);
|
when(client.getQueueInfo(any(String.class))).thenReturn(queueInfo);
|
||||||
int result = cli.run(new String[] { "-status", "queueA" });
|
int result = cli.run(new String[] { "-status", "queueA" });
|
||||||
assertEquals(0, result);
|
assertEquals(0, result);
|
||||||
@ -1339,16 +1346,103 @@ public void testGetQueueInfo() throws Exception {
|
|||||||
pw.println("\tMaximum Capacity : " + "80.0%");
|
pw.println("\tMaximum Capacity : " + "80.0%");
|
||||||
pw.println("\tDefault Node Label expression : " + "GPU");
|
pw.println("\tDefault Node Label expression : " + "GPU");
|
||||||
pw.println("\tAccessible Node Labels : " + "JDK_7,GPU");
|
pw.println("\tAccessible Node Labels : " + "JDK_7,GPU");
|
||||||
|
pw.println("\tPreemption : " + "enabled");
|
||||||
pw.close();
|
pw.close();
|
||||||
String queueInfoStr = baos.toString("UTF-8");
|
String queueInfoStr = baos.toString("UTF-8");
|
||||||
Assert.assertEquals(queueInfoStr, sysOutStream.toString());
|
Assert.assertEquals(queueInfoStr, sysOutStream.toString());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testGetQueueInfoPreemptionEnabled() throws Exception {
|
||||||
|
CapacitySchedulerConfiguration conf = new CapacitySchedulerConfiguration();
|
||||||
|
ReservationSystemTestUtil.setupQueueConfiguration(conf);
|
||||||
|
conf.setClass(YarnConfiguration.RM_SCHEDULER, CapacityScheduler.class,
|
||||||
|
ResourceScheduler.class);
|
||||||
|
conf.setBoolean(YarnConfiguration.RM_SCHEDULER_ENABLE_MONITORS, true);
|
||||||
|
conf.set(YarnConfiguration.RM_SCHEDULER_MONITOR_POLICIES,
|
||||||
|
"org.apache.hadoop.yarn.server.resourcemanager.monitor.capacity."
|
||||||
|
+ "ProportionalCapacityPreemptionPolicy");
|
||||||
|
conf.setBoolean(YarnConfiguration.RM_SCHEDULER_ENABLE_MONITORS, true);
|
||||||
|
MiniYARNCluster cluster =
|
||||||
|
new MiniYARNCluster("testReservationAPIs", 2, 1, 1);
|
||||||
|
|
||||||
|
YarnClient yarnClient = null;
|
||||||
|
try {
|
||||||
|
cluster.init(conf);
|
||||||
|
cluster.start();
|
||||||
|
final Configuration yarnConf = cluster.getConfig();
|
||||||
|
yarnClient = YarnClient.createYarnClient();
|
||||||
|
yarnClient.init(yarnConf);
|
||||||
|
yarnClient.start();
|
||||||
|
|
||||||
|
QueueCLI cli = new QueueCLI();
|
||||||
|
cli.setClient(yarnClient);
|
||||||
|
cli.setSysOutPrintStream(sysOut);
|
||||||
|
cli.setSysErrPrintStream(sysErr);
|
||||||
|
sysOutStream.reset();
|
||||||
|
int result = cli.run(new String[] { "-status", "a1" });
|
||||||
|
assertEquals(0, result);
|
||||||
|
Assert.assertTrue(sysOutStream.toString()
|
||||||
|
.contains("Preemption : enabled"));
|
||||||
|
} finally {
|
||||||
|
// clean-up
|
||||||
|
if (yarnClient != null) {
|
||||||
|
yarnClient.stop();
|
||||||
|
}
|
||||||
|
cluster.stop();
|
||||||
|
cluster.close();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testGetQueueInfoPreemptionDisabled() throws Exception {
|
||||||
|
CapacitySchedulerConfiguration conf = new CapacitySchedulerConfiguration();
|
||||||
|
ReservationSystemTestUtil.setupQueueConfiguration(conf);
|
||||||
|
conf.setClass(YarnConfiguration.RM_SCHEDULER, CapacityScheduler.class,
|
||||||
|
ResourceScheduler.class);
|
||||||
|
conf.setBoolean(YarnConfiguration.RM_SCHEDULER_ENABLE_MONITORS, true);
|
||||||
|
conf.set(YarnConfiguration.RM_SCHEDULER_MONITOR_POLICIES,
|
||||||
|
"org.apache.hadoop.yarn.server.resourcemanager.monitor.capacity."
|
||||||
|
+ "ProportionalCapacityPreemptionPolicy");
|
||||||
|
conf.setBoolean(YarnConfiguration.RM_SCHEDULER_ENABLE_MONITORS, true);
|
||||||
|
conf.setBoolean(
|
||||||
|
"yarn.scheduler.capacity.root.a.a1.disable_preemption", true);
|
||||||
|
MiniYARNCluster cluster =
|
||||||
|
new MiniYARNCluster("testReservationAPIs", 2, 1, 1);
|
||||||
|
|
||||||
|
YarnClient yarnClient = null;
|
||||||
|
try {
|
||||||
|
cluster.init(conf);
|
||||||
|
cluster.start();
|
||||||
|
final Configuration yarnConf = cluster.getConfig();
|
||||||
|
yarnClient = YarnClient.createYarnClient();
|
||||||
|
yarnClient.init(yarnConf);
|
||||||
|
yarnClient.start();
|
||||||
|
|
||||||
|
QueueCLI cli = new QueueCLI();
|
||||||
|
cli.setClient(yarnClient);
|
||||||
|
cli.setSysOutPrintStream(sysOut);
|
||||||
|
cli.setSysErrPrintStream(sysErr);
|
||||||
|
sysOutStream.reset();
|
||||||
|
int result = cli.run(new String[] { "-status", "a1" });
|
||||||
|
assertEquals(0, result);
|
||||||
|
Assert.assertTrue(sysOutStream.toString()
|
||||||
|
.contains("Preemption : disabled"));
|
||||||
|
} finally {
|
||||||
|
// clean-up
|
||||||
|
if (yarnClient != null) {
|
||||||
|
yarnClient.stop();
|
||||||
|
}
|
||||||
|
cluster.stop();
|
||||||
|
cluster.close();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
@Test
|
@Test
|
||||||
public void testGetQueueInfoWithEmptyNodeLabel() throws Exception {
|
public void testGetQueueInfoWithEmptyNodeLabel() throws Exception {
|
||||||
QueueCLI cli = createAndGetQueueCLI();
|
QueueCLI cli = createAndGetQueueCLI();
|
||||||
QueueInfo queueInfo = QueueInfo.newInstance("queueA", 0.4f, 0.8f, 0.5f,
|
QueueInfo queueInfo = QueueInfo.newInstance("queueA", 0.4f, 0.8f, 0.5f,
|
||||||
null, null, QueueState.RUNNING, null, null, null);
|
null, null, QueueState.RUNNING, null, null, null, true);
|
||||||
when(client.getQueueInfo(any(String.class))).thenReturn(queueInfo);
|
when(client.getQueueInfo(any(String.class))).thenReturn(queueInfo);
|
||||||
int result = cli.run(new String[] { "-status", "queueA" });
|
int result = cli.run(new String[] { "-status", "queueA" });
|
||||||
assertEquals(0, result);
|
assertEquals(0, result);
|
||||||
@ -1364,6 +1458,7 @@ public void testGetQueueInfoWithEmptyNodeLabel() throws Exception {
|
|||||||
pw.println("\tDefault Node Label expression : "
|
pw.println("\tDefault Node Label expression : "
|
||||||
+ NodeLabel.DEFAULT_NODE_LABEL_PARTITION);
|
+ NodeLabel.DEFAULT_NODE_LABEL_PARTITION);
|
||||||
pw.println("\tAccessible Node Labels : ");
|
pw.println("\tAccessible Node Labels : ");
|
||||||
|
pw.println("\tPreemption : " + "disabled");
|
||||||
pw.close();
|
pw.close();
|
||||||
String queueInfoStr = baos.toString("UTF-8");
|
String queueInfoStr = baos.toString("UTF-8");
|
||||||
Assert.assertEquals(queueInfoStr, sysOutStream.toString());
|
Assert.assertEquals(queueInfoStr, sysOutStream.toString());
|
||||||
|
@ -395,4 +395,17 @@ public void setQueueStatistics(QueueStatistics queueStatistics) {
|
|||||||
}
|
}
|
||||||
builder.setQueueStatistics(convertToProtoFormat(queueStatistics));
|
builder.setQueueStatistics(convertToProtoFormat(queueStatistics));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public Boolean getPreemptionDisabled() {
|
||||||
|
QueueInfoProtoOrBuilder p = viaProto ? proto : builder;
|
||||||
|
return (p.hasPreemptionDisabled()) ? p
|
||||||
|
.getPreemptionDisabled() : null;
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
public void setPreemptionDisabled(boolean preemptionDisabled) {
|
||||||
|
maybeInitBuilder();
|
||||||
|
builder.setPreemptionDisabled(preemptionDisabled);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
@ -488,7 +488,7 @@ public static void setup() throws Exception {
|
|||||||
// it is recursive(has sub queues)
|
// it is recursive(has sub queues)
|
||||||
typeValueCache.put(QueueInfo.class, QueueInfo.newInstance("root", 1.0f,
|
typeValueCache.put(QueueInfo.class, QueueInfo.newInstance("root", 1.0f,
|
||||||
1.0f, 0.1f, null, null, QueueState.RUNNING, ImmutableSet.of("x", "y"),
|
1.0f, 0.1f, null, null, QueueState.RUNNING, ImmutableSet.of("x", "y"),
|
||||||
"x && y", null));
|
"x && y", null, false));
|
||||||
generateByNewInstance(QueueStatistics.class);
|
generateByNewInstance(QueueStatistics.class);
|
||||||
generateByNewInstance(QueueUserACLInfo.class);
|
generateByNewInstance(QueueUserACLInfo.class);
|
||||||
generateByNewInstance(YarnClusterMetrics.class);
|
generateByNewInstance(YarnClusterMetrics.class);
|
||||||
|
@ -303,6 +303,7 @@ protected QueueInfo getQueueInfo() {
|
|||||||
queueInfo.setDefaultNodeLabelExpression(defaultLabelExpression);
|
queueInfo.setDefaultNodeLabelExpression(defaultLabelExpression);
|
||||||
queueInfo.setCurrentCapacity(getUsedCapacity());
|
queueInfo.setCurrentCapacity(getUsedCapacity());
|
||||||
queueInfo.setQueueStatistics(getQueueStatistics());
|
queueInfo.setQueueStatistics(getQueueStatistics());
|
||||||
|
queueInfo.setPreemptionDisabled(preemptionDisabled);
|
||||||
return queueInfo;
|
return queueInfo;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -149,7 +149,8 @@ private Queue createQueue(String name, Queue parent) {
|
|||||||
|
|
||||||
private Queue createQueue(String name, Queue parent, float capacity) {
|
private Queue createQueue(String name, Queue parent, float capacity) {
|
||||||
QueueMetrics metrics = QueueMetrics.forQueue(name, parent, false, conf);
|
QueueMetrics metrics = QueueMetrics.forQueue(name, parent, false, conf);
|
||||||
QueueInfo queueInfo = QueueInfo.newInstance(name, capacity, 1.0f, 0, null, null, QueueState.RUNNING, null, "", null);
|
QueueInfo queueInfo = QueueInfo.newInstance(name, capacity, 1.0f, 0, null,
|
||||||
|
null, QueueState.RUNNING, null, "", null, false);
|
||||||
ActiveUsersManager activeUsersManager = new ActiveUsersManager(metrics);
|
ActiveUsersManager activeUsersManager = new ActiveUsersManager(metrics);
|
||||||
Queue queue = mock(Queue.class);
|
Queue queue = mock(Queue.class);
|
||||||
when(queue.getMetrics()).thenReturn(metrics);
|
when(queue.getMetrics()).thenReturn(metrics);
|
||||||
|
Loading…
Reference in New Issue
Block a user