YARN-10428. Zombie applications in the YARN queue using FAIR + sizebasedweight. Contributed by Guang Yang, Andras Gyori

(cherry picked from commit 79a46599f7)
This commit is contained in:
Szilard Nemeth 2021-02-05 17:08:16 +01:00 committed by Akira Ajisaka
parent 580b6c400b
commit 0a726250ea
No known key found for this signature in database
GPG Key ID: C1EDBB9CA400FD50
2 changed files with 46 additions and 2 deletions

View File

@ -100,10 +100,12 @@ public FairOrderingPolicy() {
private double getMagnitude(SchedulableEntity r) { private double getMagnitude(SchedulableEntity r) {
double mag = r.getSchedulingResourceUsage().getCachedUsed( double mag = r.getSchedulingResourceUsage().getCachedUsed(
CommonNodeLabelsManager.ANY).getMemorySize(); CommonNodeLabelsManager.ANY).getMemorySize();
if (sizeBasedWeight) { if (sizeBasedWeight && mag != 0) {
double weight = Math.log1p(r.getSchedulingResourceUsage().getCachedDemand( double weight = Math.log1p(r.getSchedulingResourceUsage().getCachedDemand(
CommonNodeLabelsManager.ANY).getMemorySize()) / Math.log(2); CommonNodeLabelsManager.ANY).getMemorySize()) / Math.log(2);
mag = mag / weight; if (weight != 0) {
mag = mag / weight;
}
} }
return mag; return mag;
} }

View File

@ -23,7 +23,9 @@
import java.util.*; import java.util.*;
import org.apache.hadoop.yarn.api.records.NodeId; import org.apache.hadoop.yarn.api.records.NodeId;
import org.apache.hadoop.yarn.api.records.Priority;
import org.apache.hadoop.yarn.conf.YarnConfiguration; import org.apache.hadoop.yarn.conf.YarnConfiguration;
import org.apache.hadoop.yarn.nodelabels.CommonNodeLabelsManager;
import org.apache.hadoop.yarn.server.resourcemanager.MockRM; import org.apache.hadoop.yarn.server.resourcemanager.MockRM;
import org.apache.hadoop.yarn.server.resourcemanager.MockRMAppSubmissionData; import org.apache.hadoop.yarn.server.resourcemanager.MockRMAppSubmissionData;
import org.apache.hadoop.yarn.server.resourcemanager.MockRMAppSubmitter; import org.apache.hadoop.yarn.server.resourcemanager.MockRMAppSubmitter;
@ -346,4 +348,44 @@ public void testOrderingUsingAppDemand() {
assertEquals("Comparator Output", 0, assertEquals("Comparator Output", 0,
policy.getComparator().compare(r1, r2)); policy.getComparator().compare(r1, r2));
} }
/**
 * Registers ten entities with a size-based-weight {@code FairOrderingPolicy},
 * zeroes the cached used and pending resources of the first five, reorders,
 * removes those five, and expects five entities to remain.
 */
@Test
public void testRemoveEntitiesWithSizeBasedWeightAsCompletedJobs() {
  final int totalEntities = 10;
  final int completedEntities = 5;

  FairOrderingPolicy<MockSchedulableEntity> orderingPolicy =
      new FairOrderingPolicy<>();
  orderingPolicy.setSizeBasedWeight(true);

  // Populate the policy with distinct entities: priority k, 4 * k memory
  // both used and pending.
  List<MockSchedulableEntity> tracked = new ArrayList<>(totalEntities);
  for (int rank = 1; rank <= totalEntities; rank++) {
    int memory = 4 * rank;
    MockSchedulableEntity entity = new MockSchedulableEntity();
    entity.setApplicationPriority(Priority.newInstance(rank));
    entity.setUsed(Resources.createResource(memory));
    entity.setPending(Resources.createResource(memory));
    AbstractComparatorOrderingPolicy.updateSchedulingResourceUsage(
        entity.getSchedulingResourceUsage());
    orderingPolicy.addSchedulableEntity(entity);
    tracked.add(entity);
  }

  // The leading entities play the role of completed jobs: their cached
  // used and pending resources are reset to 0 and they are flagged for
  // reordering.
  List<MockSchedulableEntity> finished =
      tracked.subList(0, completedEntities);
  for (MockSchedulableEntity done : finished) {
    done.getSchedulingResourceUsage().setCachedUsed(
        CommonNodeLabelsManager.ANY, Resources.createResource(0));
    done.getSchedulingResourceUsage().setCachedPending(
        CommonNodeLabelsManager.ANY, Resources.createResource(0));
    orderingPolicy.entityRequiresReordering(done);
  }
  orderingPolicy.reorderScheduleEntities();

  // Drop the completed entities from the policy.
  for (MockSchedulableEntity done : finished) {
    orderingPolicy.removeSchedulableEntity(done);
  }

  Assert.assertEquals(totalEntities - completedEntities,
      orderingPolicy.getNumSchedulableEntities());
}
} }