YARN-2392. Add more diags about app retry limits on AM failures. Contributed by Steve Loughran
This commit is contained in:
parent
5149dc7b97
commit
1970ca7cbc
@ -289,6 +289,9 @@ Release 2.8.0 - UNRELEASED
|
||||
YARN-3467. Expose allocatedMB, allocatedVCores, and runningContainers metrics on
|
||||
running Applications in RM Web UI. (Anubhav Dhoot via kasha)
|
||||
|
||||
YARN-2392. Add more diags about app retry limits on AM failures. (Steve
|
||||
Loughran via jianhe)
|
||||
|
||||
OPTIMIZATIONS
|
||||
|
||||
YARN-3339. TestDockerContainerExecutor should pull a single image and not
|
||||
|
@ -1014,9 +1014,19 @@ private String getAppAttemptFailedDiagnostics(RMAppEvent event) {
|
||||
+ " failed due to " + failedEvent.getDiagnostics()
|
||||
+ ". Failing the application.";
|
||||
} else if (this.isNumAttemptsBeyondThreshold) {
|
||||
msg = "Application " + this.getApplicationId() + " failed "
|
||||
+ this.maxAppAttempts + " times due to "
|
||||
+ failedEvent.getDiagnostics() + ". Failing the application.";
|
||||
int globalLimit = conf.getInt(YarnConfiguration.RM_AM_MAX_ATTEMPTS,
|
||||
YarnConfiguration.DEFAULT_RM_AM_MAX_ATTEMPTS);
|
||||
msg = String.format(
|
||||
"Application %s failed %d times%s%s due to %s. Failing the application.",
|
||||
getApplicationId(),
|
||||
maxAppAttempts,
|
||||
(attemptFailuresValidityInterval <= 0 ? ""
|
||||
: (" in previous " + attemptFailuresValidityInterval
|
||||
+ " milliseconds")),
|
||||
(globalLimit == maxAppAttempts) ? ""
|
||||
: (" (global limit =" + globalLimit
|
||||
+ "; local limit is =" + maxAppAttempts + ")"),
|
||||
failedEvent.getDiagnostics());
|
||||
}
|
||||
return msg;
|
||||
}
|
||||
|
@ -1459,9 +1459,9 @@ private String getAMContainerCrashedDiagnostics(
|
||||
.append(status.getDiagnostics());
|
||||
if (this.getTrackingUrl() != null) {
|
||||
diagnosticsBuilder.append("For more detailed output,").append(
|
||||
" check application tracking page: ").append(
|
||||
" check the application tracking page: ").append(
|
||||
this.getTrackingUrl()).append(
|
||||
" Then, click on links to logs of each attempt.\n");
|
||||
" Then click on links to logs of each attempt.\n");
|
||||
}
|
||||
return diagnosticsBuilder.toString();
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user