HADOOP-7771. FsShell -copyToLocal, -get, etc. commands throw NPE if the destination directory does not exist. Contributed by John George and Daryn Sharp
git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/trunk@1195760 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
bb8fd6a267
commit
8f9661da48
@ -509,6 +509,10 @@ Release 0.23.0 - Unreleased
|
|||||||
HADOOP-7360. Preserve relative paths that do not contain globs in FsShell.
|
HADOOP-7360. Preserve relative paths that do not contain globs in FsShell.
|
||||||
(Daryn Sharp and Kihwal Lee via szetszwo)
|
(Daryn Sharp and Kihwal Lee via szetszwo)
|
||||||
|
|
||||||
|
HADOOP-7771. FsShell -copyToLocal, -get, etc. commands throw NPE if the
|
||||||
|
destination directory does not exist. (John George and Daryn Sharp
|
||||||
|
via szetszwo)
|
||||||
|
|
||||||
OPTIMIZATIONS
|
OPTIMIZATIONS
|
||||||
|
|
||||||
HADOOP-7333. Performance improvement in PureJavaCrc32. (Eric Caspole
|
HADOOP-7333. Performance improvement in PureJavaCrc32. (Eric Caspole
|
||||||
|
@ -55,6 +55,7 @@ abstract public class Command extends Configured {
|
|||||||
protected int exitCode = 0;
|
protected int exitCode = 0;
|
||||||
protected int numErrors = 0;
|
protected int numErrors = 0;
|
||||||
protected boolean recursive = false;
|
protected boolean recursive = false;
|
||||||
|
private int depth = 0;
|
||||||
protected ArrayList<Exception> exceptions = new ArrayList<Exception>();
|
protected ArrayList<Exception> exceptions = new ArrayList<Exception>();
|
||||||
|
|
||||||
private static final Log LOG = LogFactory.getLog(Command.class);
|
private static final Log LOG = LogFactory.getLog(Command.class);
|
||||||
@ -86,6 +87,10 @@ protected boolean isRecursive() {
|
|||||||
return recursive;
|
return recursive;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
protected int getDepth() {
|
||||||
|
return depth;
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Execute the command on the input path
|
* Execute the command on the input path
|
||||||
*
|
*
|
||||||
@ -269,6 +274,7 @@ protected void processArgument(PathData item) throws IOException {
|
|||||||
protected void processPathArgument(PathData item) throws IOException {
|
protected void processPathArgument(PathData item) throws IOException {
|
||||||
// null indicates that the call is not via recursion, ie. there is
|
// null indicates that the call is not via recursion, ie. there is
|
||||||
// no parent directory that was expanded
|
// no parent directory that was expanded
|
||||||
|
depth = 0;
|
||||||
processPaths(null, item);
|
processPaths(null, item);
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -326,7 +332,12 @@ protected void processPath(PathData item) throws IOException {
|
|||||||
* @throws IOException if anything goes wrong...
|
* @throws IOException if anything goes wrong...
|
||||||
*/
|
*/
|
||||||
protected void recursePath(PathData item) throws IOException {
|
protected void recursePath(PathData item) throws IOException {
|
||||||
|
try {
|
||||||
|
depth++;
|
||||||
processPaths(item, item.getDirectoryContents());
|
processPaths(item, item.getDirectoryContents());
|
||||||
|
} finally {
|
||||||
|
depth--;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -20,13 +20,18 @@
|
|||||||
|
|
||||||
import java.io.File;
|
import java.io.File;
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
|
import java.io.InputStream;
|
||||||
import java.util.LinkedList;
|
import java.util.LinkedList;
|
||||||
|
|
||||||
|
import org.apache.hadoop.fs.FSDataOutputStream;
|
||||||
import org.apache.hadoop.fs.Path;
|
import org.apache.hadoop.fs.Path;
|
||||||
import org.apache.hadoop.fs.shell.PathExceptions.PathExistsException;
|
import org.apache.hadoop.fs.shell.PathExceptions.PathExistsException;
|
||||||
import org.apache.hadoop.fs.shell.PathExceptions.PathIOException;
|
import org.apache.hadoop.fs.shell.PathExceptions.PathIOException;
|
||||||
|
import org.apache.hadoop.fs.shell.PathExceptions.PathIsDirectoryException;
|
||||||
import org.apache.hadoop.fs.shell.PathExceptions.PathIsNotDirectoryException;
|
import org.apache.hadoop.fs.shell.PathExceptions.PathIsNotDirectoryException;
|
||||||
import org.apache.hadoop.fs.shell.PathExceptions.PathNotFoundException;
|
import org.apache.hadoop.fs.shell.PathExceptions.PathNotFoundException;
|
||||||
|
import org.apache.hadoop.fs.shell.PathExceptions.PathOperationException;
|
||||||
|
import org.apache.hadoop.io.IOUtils;
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Provides: argument processing to ensure the destination is valid
|
* Provides: argument processing to ensure the destination is valid
|
||||||
@ -106,43 +111,31 @@ protected void processArguments(LinkedList<PathData> args)
|
|||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
protected void processPaths(PathData parent, PathData ... items)
|
protected void processPathArgument(PathData src)
|
||||||
throws IOException {
|
throws IOException {
|
||||||
PathData savedDst = dst;
|
if (src.stat.isDirectory() && src.fs.equals(dst.fs)) {
|
||||||
try {
|
PathData target = getTargetPath(src);
|
||||||
// modify dst as we descend to append the basename of the
|
String srcPath = src.fs.makeQualified(src.path).toString();
|
||||||
// current directory being processed
|
String dstPath = dst.fs.makeQualified(target.path).toString();
|
||||||
if (parent != null) dst = dst.getPathDataForChild(parent);
|
if (dstPath.equals(srcPath)) {
|
||||||
super.processPaths(parent, items);
|
PathIOException e = new PathIOException(src.toString(),
|
||||||
} finally {
|
"are identical");
|
||||||
dst = savedDst;
|
e.setTargetPath(dstPath.toString());
|
||||||
|
throw e;
|
||||||
}
|
}
|
||||||
|
if (dstPath.startsWith(srcPath+Path.SEPARATOR)) {
|
||||||
|
PathIOException e = new PathIOException(src.toString(),
|
||||||
|
"is a subdirectory of itself");
|
||||||
|
e.setTargetPath(target.toString());
|
||||||
|
throw e;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
super.processPathArgument(src);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
protected void processPath(PathData src) throws IOException {
|
protected void processPath(PathData src) throws IOException {
|
||||||
PathData target;
|
processPath(src, getTargetPath(src));
|
||||||
// if the destination is a directory, make target a child path,
|
|
||||||
// else use the destination as-is
|
|
||||||
if (dst.exists && dst.stat.isDirectory()) {
|
|
||||||
target = dst.getPathDataForChild(src);
|
|
||||||
} else {
|
|
||||||
target = dst;
|
|
||||||
}
|
|
||||||
if (target.exists && !overwrite) {
|
|
||||||
throw new PathExistsException(target.toString());
|
|
||||||
}
|
|
||||||
|
|
||||||
try {
|
|
||||||
// invoke processPath with both a source and resolved target
|
|
||||||
processPath(src, target);
|
|
||||||
} catch (PathIOException e) {
|
|
||||||
// add the target unless it already has one
|
|
||||||
if (e.getTargetPath() == null) {
|
|
||||||
e.setTargetPath(target.toString());
|
|
||||||
}
|
|
||||||
throw e;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
@ -151,6 +144,103 @@ protected void processPath(PathData src) throws IOException {
|
|||||||
* @param target for the operation
|
* @param target for the operation
|
||||||
* @throws IOException if anything goes wrong
|
* @throws IOException if anything goes wrong
|
||||||
*/
|
*/
|
||||||
protected abstract void processPath(PathData src, PathData target)
|
protected void processPath(PathData src, PathData dst) throws IOException {
|
||||||
throws IOException;
|
if (src.stat.isSymlink()) {
|
||||||
|
// TODO: remove when FileContext is supported, this needs to either
|
||||||
|
// copy the symlink or deref the symlink
|
||||||
|
throw new PathOperationException(src.toString());
|
||||||
|
} else if (src.stat.isFile()) {
|
||||||
|
copyFileToTarget(src, dst);
|
||||||
|
} else if (src.stat.isDirectory() && !isRecursive()) {
|
||||||
|
throw new PathIsDirectoryException(src.toString());
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
@Override
|
||||||
|
protected void recursePath(PathData src) throws IOException {
|
||||||
|
PathData savedDst = dst;
|
||||||
|
try {
|
||||||
|
// modify dst as we descend to append the basename of the
|
||||||
|
// current directory being processed
|
||||||
|
dst = getTargetPath(src);
|
||||||
|
if (dst.exists) {
|
||||||
|
if (!dst.stat.isDirectory()) {
|
||||||
|
throw new PathIsNotDirectoryException(dst.toString());
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
if (!dst.fs.mkdirs(dst.path)) {
|
||||||
|
// too bad we have no clue what failed
|
||||||
|
PathIOException e = new PathIOException(dst.toString());
|
||||||
|
e.setOperation("mkdir");
|
||||||
|
throw e;
|
||||||
|
}
|
||||||
|
dst.refreshStatus(); // need to update stat to know it exists now
|
||||||
|
}
|
||||||
|
super.recursePath(src);
|
||||||
|
} finally {
|
||||||
|
dst = savedDst;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
protected PathData getTargetPath(PathData src) throws IOException {
|
||||||
|
PathData target;
|
||||||
|
// on the first loop, the dst may be directory or a file, so only create
|
||||||
|
// a child path if dst is a dir; after recursion, it's always a dir
|
||||||
|
if ((getDepth() > 0) || (dst.exists && dst.stat.isDirectory())) {
|
||||||
|
target = dst.getPathDataForChild(src);
|
||||||
|
} else {
|
||||||
|
target = dst;
|
||||||
|
}
|
||||||
|
return target;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Copies the source file to the target.
|
||||||
|
* @param src item to copy
|
||||||
|
* @param target where to copy the item
|
||||||
|
* @throws IOException if copy fails
|
||||||
|
*/
|
||||||
|
protected void copyFileToTarget(PathData src, PathData target) throws IOException {
|
||||||
|
copyStreamToTarget(src.fs.open(src.path), target);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Copies the stream contents to a temporary file. If the copy is
|
||||||
|
* successful, the temporary file will be renamed to the real path,
|
||||||
|
* else the temporary file will be deleted.
|
||||||
|
* @param in the input stream for the copy
|
||||||
|
* @param target where to store the contents of the stream
|
||||||
|
* @throws IOException if copy fails
|
||||||
|
*/
|
||||||
|
protected void copyStreamToTarget(InputStream in, PathData target)
|
||||||
|
throws IOException {
|
||||||
|
if (target.exists && (target.stat.isDirectory() || !overwrite)) {
|
||||||
|
throw new PathExistsException(target.toString());
|
||||||
|
}
|
||||||
|
PathData tempFile = null;
|
||||||
|
try {
|
||||||
|
tempFile = target.createTempFile(target+"._COPYING_");
|
||||||
|
FSDataOutputStream out = target.fs.create(tempFile.path, true);
|
||||||
|
IOUtils.copyBytes(in, out, getConf(), true);
|
||||||
|
// the rename method with an option to delete the target is deprecated
|
||||||
|
if (target.exists && !target.fs.delete(target.path, false)) {
|
||||||
|
// too bad we don't know why it failed
|
||||||
|
PathIOException e = new PathIOException(target.toString());
|
||||||
|
e.setOperation("delete");
|
||||||
|
throw e;
|
||||||
|
}
|
||||||
|
if (!tempFile.fs.rename(tempFile.path, target.path)) {
|
||||||
|
// too bad we don't know why it failed
|
||||||
|
PathIOException e = new PathIOException(tempFile.toString());
|
||||||
|
e.setOperation("rename");
|
||||||
|
e.setTargetPath(target.toString());
|
||||||
|
throw e;
|
||||||
|
}
|
||||||
|
tempFile = null;
|
||||||
|
} finally {
|
||||||
|
if (tempFile != null) {
|
||||||
|
tempFile.fs.delete(tempFile.path, false);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
@ -26,13 +26,7 @@
|
|||||||
import org.apache.hadoop.classification.InterfaceAudience;
|
import org.apache.hadoop.classification.InterfaceAudience;
|
||||||
import org.apache.hadoop.classification.InterfaceStability;
|
import org.apache.hadoop.classification.InterfaceStability;
|
||||||
import org.apache.hadoop.fs.ChecksumFileSystem;
|
import org.apache.hadoop.fs.ChecksumFileSystem;
|
||||||
import org.apache.hadoop.fs.FSDataOutputStream;
|
|
||||||
import org.apache.hadoop.fs.FileUtil;
|
import org.apache.hadoop.fs.FileUtil;
|
||||||
import org.apache.hadoop.fs.LocalFileSystem;
|
|
||||||
import org.apache.hadoop.fs.shell.PathExceptions.PathExistsException;
|
|
||||||
import org.apache.hadoop.fs.shell.PathExceptions.PathIOException;
|
|
||||||
import org.apache.hadoop.fs.shell.PathExceptions.PathOperationException;
|
|
||||||
import org.apache.hadoop.io.IOUtils;
|
|
||||||
|
|
||||||
/** Various commands for copy files */
|
/** Various commands for copy files */
|
||||||
@InterfaceAudience.Private
|
@InterfaceAudience.Private
|
||||||
@ -95,18 +89,10 @@ protected void processOptions(LinkedList<String> args) throws IOException {
|
|||||||
CommandFormat cf = new CommandFormat(2, Integer.MAX_VALUE, "f");
|
CommandFormat cf = new CommandFormat(2, Integer.MAX_VALUE, "f");
|
||||||
cf.parse(args);
|
cf.parse(args);
|
||||||
setOverwrite(cf.getOpt("f"));
|
setOverwrite(cf.getOpt("f"));
|
||||||
|
// should have a -r option
|
||||||
|
setRecursive(true);
|
||||||
getRemoteDestination(args);
|
getRemoteDestination(args);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
|
||||||
protected void processPath(PathData src, PathData target)
|
|
||||||
throws IOException {
|
|
||||||
if (!FileUtil.copy(src.fs, src.path, target.fs, target.path, false, overwrite, getConf())) {
|
|
||||||
// we have no idea what the error is... FileUtils masks it and in
|
|
||||||
// some cases won't even report an error
|
|
||||||
throw new PathIOException(src.toString());
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
@ -126,7 +112,6 @@ public static class Get extends CommandWithDestination {
|
|||||||
* It must be at least three characters long, required by
|
* It must be at least three characters long, required by
|
||||||
* {@link java.io.File#createTempFile(String, String, File)}.
|
* {@link java.io.File#createTempFile(String, String, File)}.
|
||||||
*/
|
*/
|
||||||
private static final String COPYTOLOCAL_PREFIX = "_copyToLocal_";
|
|
||||||
private boolean copyCrc;
|
private boolean copyCrc;
|
||||||
private boolean verifyChecksum;
|
private boolean verifyChecksum;
|
||||||
|
|
||||||
@ -144,7 +129,7 @@ protected void processOptions(LinkedList<String> args)
|
|||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
protected void processPath(PathData src, PathData target)
|
protected void copyFileToTarget(PathData src, PathData target)
|
||||||
throws IOException {
|
throws IOException {
|
||||||
src.fs.setVerifyChecksum(verifyChecksum);
|
src.fs.setVerifyChecksum(verifyChecksum);
|
||||||
|
|
||||||
@ -153,41 +138,10 @@ protected void processPath(PathData src, PathData target)
|
|||||||
copyCrc = false;
|
copyCrc = false;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (src.stat.isFile()) {
|
super.copyFileToTarget(src, target);
|
||||||
// copy the file and maybe its crc
|
|
||||||
copyFileToLocal(src, target);
|
|
||||||
if (copyCrc) {
|
if (copyCrc) {
|
||||||
copyFileToLocal(src.getChecksumFile(), target.getChecksumFile());
|
// should we delete real file if crc copy fails?
|
||||||
}
|
super.copyFileToTarget(src.getChecksumFile(), target.getChecksumFile());
|
||||||
} else if (src.stat.isDirectory()) {
|
|
||||||
// create the remote directory structure locally
|
|
||||||
if (!target.toFile().mkdirs()) {
|
|
||||||
throw new PathIOException(target.toString());
|
|
||||||
}
|
|
||||||
} else {
|
|
||||||
throw new PathOperationException(src.toString());
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
private void copyFileToLocal(PathData src, PathData target)
|
|
||||||
throws IOException {
|
|
||||||
File targetFile = target.toFile();
|
|
||||||
File tmpFile = FileUtil.createLocalTempFile(
|
|
||||||
targetFile, COPYTOLOCAL_PREFIX, true);
|
|
||||||
// too bad we can't tell exactly why it failed...
|
|
||||||
if (!FileUtil.copy(src.fs, src.path, tmpFile, false, getConf())) {
|
|
||||||
PathIOException e = new PathIOException(src.toString());
|
|
||||||
e.setOperation("copy");
|
|
||||||
e.setTargetPath(tmpFile.toString());
|
|
||||||
throw e;
|
|
||||||
}
|
|
||||||
|
|
||||||
// too bad we can't tell exactly why it failed...
|
|
||||||
if (!tmpFile.renameTo(targetFile)) {
|
|
||||||
PathIOException e = new PathIOException(tmpFile.toString());
|
|
||||||
e.setOperation("rename");
|
|
||||||
e.setTargetPath(targetFile.toString());
|
|
||||||
throw e;
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -208,6 +162,8 @@ protected void processOptions(LinkedList<String> args) throws IOException {
|
|||||||
cf.parse(args);
|
cf.parse(args);
|
||||||
setOverwrite(cf.getOpt("f"));
|
setOverwrite(cf.getOpt("f"));
|
||||||
getRemoteDestination(args);
|
getRemoteDestination(args);
|
||||||
|
// should have a -r option
|
||||||
|
setRecursive(true);
|
||||||
}
|
}
|
||||||
|
|
||||||
// commands operating on local paths have no need for glob expansion
|
// commands operating on local paths have no need for glob expansion
|
||||||
@ -223,30 +179,11 @@ protected void processArguments(LinkedList<PathData> args)
|
|||||||
throws IOException {
|
throws IOException {
|
||||||
// NOTE: this logic should be better, mimics previous implementation
|
// NOTE: this logic should be better, mimics previous implementation
|
||||||
if (args.size() == 1 && args.get(0).toString().equals("-")) {
|
if (args.size() == 1 && args.get(0).toString().equals("-")) {
|
||||||
if (dst.exists && !overwrite) {
|
copyStreamToTarget(System.in, getTargetPath(args.get(0)));
|
||||||
throw new PathExistsException(dst.toString());
|
|
||||||
}
|
|
||||||
copyFromStdin();
|
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
super.processArguments(args);
|
super.processArguments(args);
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
|
||||||
protected void processPath(PathData src, PathData target)
|
|
||||||
throws IOException {
|
|
||||||
target.fs.copyFromLocalFile(false, overwrite, src.path, target.path);
|
|
||||||
}
|
|
||||||
|
|
||||||
/** Copies from stdin to the destination file. */
|
|
||||||
protected void copyFromStdin() throws IOException {
|
|
||||||
FSDataOutputStream out = dst.fs.create(dst.path);
|
|
||||||
try {
|
|
||||||
IOUtils.copyBytes(System.in, out, getConf(), false);
|
|
||||||
} finally {
|
|
||||||
out.close();
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
public static class CopyFromLocal extends Put {
|
public static class CopyFromLocal extends Put {
|
||||||
|
@ -182,6 +182,19 @@ public PathData getChecksumFile() throws IOException {
|
|||||||
return new PathData(srcFs.getRawFileSystem(), srcPath.toString());
|
return new PathData(srcFs.getRawFileSystem(), srcPath.toString());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Returns a temporary file for this PathData with the given extension.
|
||||||
|
* The file will be deleted on exit.
|
||||||
|
* @param extension for the temporary file
|
||||||
|
* @return PathData
|
||||||
|
* @throws IOException shouldn't happen
|
||||||
|
*/
|
||||||
|
public PathData createTempFile(String extension) throws IOException {
|
||||||
|
PathData tmpFile = new PathData(fs, uri+"._COPYING_");
|
||||||
|
fs.deleteOnExit(tmpFile.path);
|
||||||
|
return tmpFile;
|
||||||
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
* Returns a list of PathData objects of the items contained in the given
|
* Returns a list of PathData objects of the items contained in the given
|
||||||
* directory.
|
* directory.
|
||||||
|
Loading…
Reference in New Issue
Block a user