MAPREDUCE-2802. Ensure JobHistory filenames have jobId. Contributed by Jonathan Eagles.
git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/trunk@1180220 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
6b343adfe8
commit
047b175aac
@ -1549,6 +1549,9 @@ Release 0.23.0 - Unreleased
|
|||||||
MAPREDUCE-3033. Ensure Master interface pays attention to classic v/s yarn
|
MAPREDUCE-3033. Ensure Master interface pays attention to classic v/s yarn
|
||||||
frameworks. (Hitesh Shah via acmurthy)
|
frameworks. (Hitesh Shah via acmurthy)
|
||||||
|
|
||||||
|
MAPREDUCE-2802. Ensure JobHistory filenames have jobId. (Jonathan Eagles
|
||||||
|
via acmurthy)
|
||||||
|
|
||||||
Release 0.22.0 - Unreleased
|
Release 0.22.0 - Unreleased
|
||||||
|
|
||||||
INCOMPATIBLE CHANGES
|
INCOMPATIBLE CHANGES
|
||||||
|
@ -29,11 +29,11 @@
|
|||||||
|
|
||||||
public class FileNameIndexUtils {
|
public class FileNameIndexUtils {
|
||||||
|
|
||||||
static final String UNDERSCORE_ESCAPE = "%5F";
|
|
||||||
static final int JOB_NAME_TRIM_LENGTH = 50;
|
static final int JOB_NAME_TRIM_LENGTH = 50;
|
||||||
|
|
||||||
//This has to be underscore currently. Untill escape uses DELIMITER.
|
// Sanitize job history file for predictable parsing
|
||||||
static final String DELIMITER = "_";
|
static final String DELIMITER = "-";
|
||||||
|
static final String DELIMITER_ESCAPE = "%2D";
|
||||||
|
|
||||||
private static final int JOB_ID_INDEX = 0;
|
private static final int JOB_ID_INDEX = 0;
|
||||||
private static final int SUBMIT_TIME_INDEX = 1;
|
private static final int SUBMIT_TIME_INDEX = 1;
|
||||||
@ -54,7 +54,7 @@ public class FileNameIndexUtils {
|
|||||||
public static String getDoneFileName(JobIndexInfo indexInfo) throws IOException {
|
public static String getDoneFileName(JobIndexInfo indexInfo) throws IOException {
|
||||||
StringBuilder sb = new StringBuilder();
|
StringBuilder sb = new StringBuilder();
|
||||||
//JobId
|
//JobId
|
||||||
sb.append(escapeUnderscores(TypeConverter.fromYarn(indexInfo.getJobId()).toString()));
|
sb.append(escapeDelimiters(TypeConverter.fromYarn(indexInfo.getJobId()).toString()));
|
||||||
sb.append(DELIMITER);
|
sb.append(DELIMITER);
|
||||||
|
|
||||||
//StartTime
|
//StartTime
|
||||||
@ -62,11 +62,11 @@ public static String getDoneFileName(JobIndexInfo indexInfo) throws IOException
|
|||||||
sb.append(DELIMITER);
|
sb.append(DELIMITER);
|
||||||
|
|
||||||
//UserName
|
//UserName
|
||||||
sb.append(escapeUnderscores(getUserName(indexInfo)));
|
sb.append(escapeDelimiters(getUserName(indexInfo)));
|
||||||
sb.append(DELIMITER);
|
sb.append(DELIMITER);
|
||||||
|
|
||||||
//JobName
|
//JobName
|
||||||
sb.append(escapeUnderscores(trimJobName(getJobName(indexInfo))));
|
sb.append(escapeDelimiters(trimJobName(getJobName(indexInfo))));
|
||||||
sb.append(DELIMITER);
|
sb.append(DELIMITER);
|
||||||
|
|
||||||
//FinishTime
|
//FinishTime
|
||||||
@ -136,13 +136,13 @@ public static JobIndexInfo getIndexInfo(String jhFileName) throws IOException {
|
|||||||
*/
|
*/
|
||||||
public static String encodeJobHistoryFileName(String logFileName)
|
public static String encodeJobHistoryFileName(String logFileName)
|
||||||
throws IOException {
|
throws IOException {
|
||||||
String replacementUnderscoreEscape = null;
|
String replacementDelimiterEscape = null;
|
||||||
|
|
||||||
if (logFileName.contains(UNDERSCORE_ESCAPE)) {
|
// Temporarily protect the escape delimiters from encoding
|
||||||
replacementUnderscoreEscape = nonOccursString(logFileName);
|
if (logFileName.contains(DELIMITER_ESCAPE)) {
|
||||||
|
replacementDelimiterEscape = nonOccursString(logFileName);
|
||||||
|
|
||||||
logFileName = replaceStringInstances
|
logFileName = logFileName.replaceAll(DELIMITER_ESCAPE, replacementDelimiterEscape);
|
||||||
(logFileName, UNDERSCORE_ESCAPE, replacementUnderscoreEscape);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
String encodedFileName = null;
|
String encodedFileName = null;
|
||||||
@ -154,10 +154,10 @@ public static String encodeJobHistoryFileName(String logFileName)
|
|||||||
ioe.setStackTrace(uee.getStackTrace());
|
ioe.setStackTrace(uee.getStackTrace());
|
||||||
throw ioe;
|
throw ioe;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (replacementUnderscoreEscape != null) {
|
// Restore protected escape delimiters after encoding
|
||||||
encodedFileName = replaceStringInstances
|
if (replacementDelimiterEscape != null) {
|
||||||
(encodedFileName, replacementUnderscoreEscape, UNDERSCORE_ESCAPE);
|
encodedFileName = encodedFileName.replaceAll(replacementDelimiterEscape, DELIMITER_ESCAPE);
|
||||||
}
|
}
|
||||||
|
|
||||||
return encodedFileName;
|
return encodedFileName;
|
||||||
@ -214,29 +214,10 @@ private static String getNonEmptyString(String in) {
|
|||||||
return in;
|
return in;
|
||||||
}
|
}
|
||||||
|
|
||||||
private static String escapeUnderscores(String escapee) {
|
private static String escapeDelimiters(String escapee) {
|
||||||
return replaceStringInstances(escapee, "_", UNDERSCORE_ESCAPE);
|
return escapee.replaceAll(DELIMITER, DELIMITER_ESCAPE);
|
||||||
}
|
}
|
||||||
|
|
||||||
// I tolerate this code because I expect a low number of
|
|
||||||
// occurrences in a relatively short string
|
|
||||||
private static String replaceStringInstances
|
|
||||||
(String logFileName, String old, String replacement) {
|
|
||||||
int index = logFileName.indexOf(old);
|
|
||||||
|
|
||||||
while (index > 0) {
|
|
||||||
logFileName = (logFileName.substring(0, index)
|
|
||||||
+ replacement
|
|
||||||
+ replaceStringInstances
|
|
||||||
(logFileName.substring(index + old.length()),
|
|
||||||
old, replacement));
|
|
||||||
|
|
||||||
index = logFileName.indexOf(old);
|
|
||||||
}
|
|
||||||
|
|
||||||
return logFileName;
|
|
||||||
}
|
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Trims the job-name if required
|
* Trims the job-name if required
|
||||||
*/
|
*/
|
||||||
|
@ -0,0 +1,130 @@
|
|||||||
|
/**
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one
|
||||||
|
* or more contributor license agreements. See the NOTICE file
|
||||||
|
* distributed with this work for additional information
|
||||||
|
* regarding copyright ownership. The ASF licenses this file
|
||||||
|
* to you under the Apache License, Version 2.0 (the
|
||||||
|
* "License"); you may not use this file except in compliance
|
||||||
|
* with the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
|
||||||
|
package org.apache.hadoop.mapreduce.v2.jobhistory;
|
||||||
|
|
||||||
|
import java.io.IOException;
|
||||||
|
|
||||||
|
import org.apache.hadoop.mapreduce.JobID;
|
||||||
|
import org.apache.hadoop.mapreduce.TypeConverter;
|
||||||
|
import org.apache.hadoop.mapreduce.v2.api.records.JobId;
|
||||||
|
|
||||||
|
import org.junit.Assert;
|
||||||
|
import org.junit.Test;
|
||||||
|
|
||||||
|
public class TestFileNameIndexUtils {
|
||||||
|
|
||||||
|
private static final String JOB_HISTORY_FILE_FORMATTER = "%s"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "%s"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "%s"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "%s"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "%s"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "%s"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "%s"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "%s"
|
||||||
|
+ JobHistoryUtils.JOB_HISTORY_FILE_EXTENSION;
|
||||||
|
|
||||||
|
private static final String JOB_ID = "job_1317928501754_0001";
|
||||||
|
private static final String SUBMIT_TIME = "1317928742025";
|
||||||
|
private static final String USER_NAME = "username";
|
||||||
|
private static final String USER_NAME_WITH_DELIMITER = "user"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "name";
|
||||||
|
private static final String USER_NAME_WITH_DELIMITER_ESCAPE = "user"
|
||||||
|
+ FileNameIndexUtils.DELIMITER_ESCAPE + "name";
|
||||||
|
private static final String JOB_NAME = "mapreduce";
|
||||||
|
private static final String JOB_NAME_WITH_DELIMITER = "map"
|
||||||
|
+ FileNameIndexUtils.DELIMITER + "reduce";
|
||||||
|
private static final String JOB_NAME_WITH_DELIMITER_ESCAPE = "map"
|
||||||
|
+ FileNameIndexUtils.DELIMITER_ESCAPE + "reduce";
|
||||||
|
private static final String FINISH_TIME = "1317928754958";
|
||||||
|
private static final String NUM_MAPS = "1";
|
||||||
|
private static final String NUM_REDUCES = "1";
|
||||||
|
private static final String JOB_STATUS = "SUCCEEDED";
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testUserNamePercentEncoding() throws IOException{
|
||||||
|
JobIndexInfo info = new JobIndexInfo();
|
||||||
|
JobID oldJobId = JobID.forName(JOB_ID);
|
||||||
|
JobId jobId = TypeConverter.toYarn(oldJobId);
|
||||||
|
info.setJobId(jobId);
|
||||||
|
info.setSubmitTime(Long.parseLong(SUBMIT_TIME));
|
||||||
|
info.setUser(USER_NAME_WITH_DELIMITER);
|
||||||
|
info.setJobName(JOB_NAME);
|
||||||
|
info.setFinishTime(Long.parseLong(FINISH_TIME));
|
||||||
|
info.setNumMaps(Integer.parseInt(NUM_MAPS));
|
||||||
|
info.setNumReduces(Integer.parseInt(NUM_REDUCES));
|
||||||
|
info.setJobStatus(JOB_STATUS);
|
||||||
|
|
||||||
|
String jobHistoryFile = FileNameIndexUtils.getDoneFileName(info);
|
||||||
|
Assert.assertTrue("User name not encoded correctly into job history file",
|
||||||
|
jobHistoryFile.contains(USER_NAME_WITH_DELIMITER_ESCAPE));
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testUserNamePercentDecoding() throws IOException {
|
||||||
|
String jobHistoryFile = String.format(JOB_HISTORY_FILE_FORMATTER,
|
||||||
|
JOB_ID,
|
||||||
|
SUBMIT_TIME,
|
||||||
|
USER_NAME_WITH_DELIMITER_ESCAPE,
|
||||||
|
JOB_NAME,
|
||||||
|
FINISH_TIME,
|
||||||
|
NUM_MAPS,
|
||||||
|
NUM_REDUCES,
|
||||||
|
JOB_STATUS);
|
||||||
|
|
||||||
|
JobIndexInfo info = FileNameIndexUtils.getIndexInfo(jobHistoryFile);
|
||||||
|
Assert.assertEquals("User name doesn't match",
|
||||||
|
USER_NAME_WITH_DELIMITER, info.getUser());
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testJobNamePercentEncoding() throws IOException {
|
||||||
|
JobIndexInfo info = new JobIndexInfo();
|
||||||
|
JobID oldJobId = JobID.forName(JOB_ID);
|
||||||
|
JobId jobId = TypeConverter.toYarn(oldJobId);
|
||||||
|
info.setJobId(jobId);
|
||||||
|
info.setSubmitTime(Long.parseLong(SUBMIT_TIME));
|
||||||
|
info.setUser(USER_NAME);
|
||||||
|
info.setJobName(JOB_NAME_WITH_DELIMITER);
|
||||||
|
info.setFinishTime(Long.parseLong(FINISH_TIME));
|
||||||
|
info.setNumMaps(Integer.parseInt(NUM_MAPS));
|
||||||
|
info.setNumReduces(Integer.parseInt(NUM_REDUCES));
|
||||||
|
info.setJobStatus(JOB_STATUS);
|
||||||
|
|
||||||
|
String jobHistoryFile = FileNameIndexUtils.getDoneFileName(info);
|
||||||
|
Assert.assertTrue("Job name not encoded correctly into job history file",
|
||||||
|
jobHistoryFile.contains(JOB_NAME_WITH_DELIMITER_ESCAPE));
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void testJobNamePercentDecoding() throws IOException {
|
||||||
|
String jobHistoryFile = String.format(JOB_HISTORY_FILE_FORMATTER,
|
||||||
|
JOB_ID,
|
||||||
|
SUBMIT_TIME,
|
||||||
|
USER_NAME,
|
||||||
|
JOB_NAME_WITH_DELIMITER_ESCAPE,
|
||||||
|
FINISH_TIME,
|
||||||
|
NUM_MAPS,
|
||||||
|
NUM_REDUCES,
|
||||||
|
JOB_STATUS);
|
||||||
|
|
||||||
|
JobIndexInfo info = FileNameIndexUtils.getIndexInfo(jobHistoryFile);
|
||||||
|
Assert.assertEquals("Job name doesn't match",
|
||||||
|
JOB_NAME_WITH_DELIMITER, info.getJobName());
|
||||||
|
}
|
||||||
|
}
|
Loading…
Reference in New Issue
Block a user