YARN-2392. Add more diagnostics about app retry limits on AM failures. Contributed by Steve Loughran.

This commit is contained in:
Jian He 2015-06-04 11:14:09 -07:00
parent 5149dc7b97
commit 1970ca7cbc
3 changed files with 18 additions and 5 deletions

View File

@@ -289,6 +289,9 @@ Release 2.8.0 - UNRELEASED
YARN-3467. Expose allocatedMB, allocatedVCores, and runningContainers metrics on
running Applications in RM Web UI. (Anubhav Dhoot via kasha)
YARN-2392. Add more diags about app retry limits on AM failures. (Steve
Loughran via jianhe)
OPTIMIZATIONS
YARN-3339. TestDockerContainerExecutor should pull a single image and not

View File

@@ -1014,9 +1014,19 @@ private String getAppAttemptFailedDiagnostics(RMAppEvent event) {
+ " failed due to " + failedEvent.getDiagnostics()
+ ". Failing the application.";
} else if (this.isNumAttemptsBeyondThreshold) {
msg = "Application " + this.getApplicationId() + " failed "
+ this.maxAppAttempts + " times due to "
+ failedEvent.getDiagnostics() + ". Failing the application.";
int globalLimit = conf.getInt(YarnConfiguration.RM_AM_MAX_ATTEMPTS,
YarnConfiguration.DEFAULT_RM_AM_MAX_ATTEMPTS);
msg = String.format(
"Application %s failed %d times%s%s due to %s. Failing the application.",
getApplicationId(),
maxAppAttempts,
(attemptFailuresValidityInterval <= 0 ? ""
: (" in previous " + attemptFailuresValidityInterval
+ " milliseconds")),
(globalLimit == maxAppAttempts) ? ""
: (" (global limit =" + globalLimit
+ "; local limit is =" + maxAppAttempts + ")"),
failedEvent.getDiagnostics());
}
return msg;
}

View File

@@ -1459,9 +1459,9 @@ private String getAMContainerCrashedDiagnostics(
.append(status.getDiagnostics());
if (this.getTrackingUrl() != null) {
diagnosticsBuilder.append("For more detailed output,").append(
" check application tracking page: ").append(
" check the application tracking page: ").append(
this.getTrackingUrl()).append(
" Then, click on links to logs of each attempt.\n");
" Then click on links to logs of each attempt.\n");
}
return diagnosticsBuilder.toString();
}