HDFS-6678. MiniDFSCluster may still be partially running after initialization fails. Contributed by Chris Nauroth.
git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/trunk@1610549 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
3d9bea277a
commit
97b5fbc281
@ -303,6 +303,9 @@ Release 2.6.0 - UNRELEASED
|
|||||||
HADOOP-8158. Interrupting hadoop fs -put from the command line
|
HADOOP-8158. Interrupting hadoop fs -put from the command line
|
||||||
causes a LeaseExpiredException. (daryn via harsh)
|
causes a LeaseExpiredException. (daryn via harsh)
|
||||||
|
|
||||||
|
HDFS-6678. MiniDFSCluster may still be partially running after initialization
|
||||||
|
fails. (cnauroth)
|
||||||
|
|
||||||
Release 2.5.0 - UNRELEASED
|
Release 2.5.0 - UNRELEASED
|
||||||
|
|
||||||
INCOMPATIBLE CHANGES
|
INCOMPATIBLE CHANGES
|
||||||
|
@ -663,73 +663,81 @@ private void initMiniDFSCluster(
|
|||||||
boolean checkDataNodeHostConfig,
|
boolean checkDataNodeHostConfig,
|
||||||
Configuration[] dnConfOverlays)
|
Configuration[] dnConfOverlays)
|
||||||
throws IOException {
|
throws IOException {
|
||||||
ExitUtil.disableSystemExit();
|
boolean success = false;
|
||||||
|
|
||||||
synchronized (MiniDFSCluster.class) {
|
|
||||||
instanceId = instanceCount++;
|
|
||||||
}
|
|
||||||
|
|
||||||
this.conf = conf;
|
|
||||||
base_dir = new File(determineDfsBaseDir());
|
|
||||||
data_dir = new File(base_dir, "data");
|
|
||||||
this.waitSafeMode = waitSafeMode;
|
|
||||||
this.checkExitOnShutdown = checkExitOnShutdown;
|
|
||||||
|
|
||||||
int replication = conf.getInt(DFS_REPLICATION_KEY, 3);
|
|
||||||
conf.setInt(DFS_REPLICATION_KEY, Math.min(replication, numDataNodes));
|
|
||||||
int safemodeExtension = conf.getInt(
|
|
||||||
DFS_NAMENODE_SAFEMODE_EXTENSION_TESTING_KEY, 0);
|
|
||||||
conf.setInt(DFS_NAMENODE_SAFEMODE_EXTENSION_KEY, safemodeExtension);
|
|
||||||
conf.setInt(DFS_NAMENODE_DECOMMISSION_INTERVAL_KEY, 3); // 3 second
|
|
||||||
conf.setClass(NET_TOPOLOGY_NODE_SWITCH_MAPPING_IMPL_KEY,
|
|
||||||
StaticMapping.class, DNSToSwitchMapping.class);
|
|
||||||
|
|
||||||
// In an HA cluster, in order for the StandbyNode to perform checkpoints,
|
|
||||||
// it needs to know the HTTP port of the Active. So, if ephemeral ports
|
|
||||||
// are chosen, disable checkpoints for the test.
|
|
||||||
if (!nnTopology.allHttpPortsSpecified() &&
|
|
||||||
nnTopology.isHA()) {
|
|
||||||
LOG.info("MiniDFSCluster disabling checkpointing in the Standby node " +
|
|
||||||
"since no HTTP ports have been specified.");
|
|
||||||
conf.setBoolean(DFS_HA_STANDBY_CHECKPOINTS_KEY, false);
|
|
||||||
}
|
|
||||||
if (!nnTopology.allIpcPortsSpecified() &&
|
|
||||||
nnTopology.isHA()) {
|
|
||||||
LOG.info("MiniDFSCluster disabling log-roll triggering in the "
|
|
||||||
+ "Standby node since no IPC ports have been specified.");
|
|
||||||
conf.setInt(DFS_HA_LOGROLL_PERIOD_KEY, -1);
|
|
||||||
}
|
|
||||||
|
|
||||||
federation = nnTopology.isFederated();
|
|
||||||
try {
|
try {
|
||||||
createNameNodesAndSetConf(
|
ExitUtil.disableSystemExit();
|
||||||
nnTopology, manageNameDfsDirs, manageNameDfsSharedDirs,
|
|
||||||
enableManagedDfsDirsRedundancy,
|
synchronized (MiniDFSCluster.class) {
|
||||||
format, startOpt, clusterId, conf);
|
instanceId = instanceCount++;
|
||||||
} catch (IOException ioe) {
|
}
|
||||||
LOG.error("IOE creating namenodes. Permissions dump:\n" +
|
|
||||||
createPermissionsDiagnosisString(data_dir));
|
this.conf = conf;
|
||||||
throw ioe;
|
base_dir = new File(determineDfsBaseDir());
|
||||||
}
|
data_dir = new File(base_dir, "data");
|
||||||
if (format) {
|
this.waitSafeMode = waitSafeMode;
|
||||||
if (data_dir.exists() && !FileUtil.fullyDelete(data_dir)) {
|
this.checkExitOnShutdown = checkExitOnShutdown;
|
||||||
throw new IOException("Cannot remove data directory: " + data_dir +
|
|
||||||
|
int replication = conf.getInt(DFS_REPLICATION_KEY, 3);
|
||||||
|
conf.setInt(DFS_REPLICATION_KEY, Math.min(replication, numDataNodes));
|
||||||
|
int safemodeExtension = conf.getInt(
|
||||||
|
DFS_NAMENODE_SAFEMODE_EXTENSION_TESTING_KEY, 0);
|
||||||
|
conf.setInt(DFS_NAMENODE_SAFEMODE_EXTENSION_KEY, safemodeExtension);
|
||||||
|
conf.setInt(DFS_NAMENODE_DECOMMISSION_INTERVAL_KEY, 3); // 3 second
|
||||||
|
conf.setClass(NET_TOPOLOGY_NODE_SWITCH_MAPPING_IMPL_KEY,
|
||||||
|
StaticMapping.class, DNSToSwitchMapping.class);
|
||||||
|
|
||||||
|
// In an HA cluster, in order for the StandbyNode to perform checkpoints,
|
||||||
|
// it needs to know the HTTP port of the Active. So, if ephemeral ports
|
||||||
|
// are chosen, disable checkpoints for the test.
|
||||||
|
if (!nnTopology.allHttpPortsSpecified() &&
|
||||||
|
nnTopology.isHA()) {
|
||||||
|
LOG.info("MiniDFSCluster disabling checkpointing in the Standby node " +
|
||||||
|
"since no HTTP ports have been specified.");
|
||||||
|
conf.setBoolean(DFS_HA_STANDBY_CHECKPOINTS_KEY, false);
|
||||||
|
}
|
||||||
|
if (!nnTopology.allIpcPortsSpecified() &&
|
||||||
|
nnTopology.isHA()) {
|
||||||
|
LOG.info("MiniDFSCluster disabling log-roll triggering in the "
|
||||||
|
+ "Standby node since no IPC ports have been specified.");
|
||||||
|
conf.setInt(DFS_HA_LOGROLL_PERIOD_KEY, -1);
|
||||||
|
}
|
||||||
|
|
||||||
|
federation = nnTopology.isFederated();
|
||||||
|
try {
|
||||||
|
createNameNodesAndSetConf(
|
||||||
|
nnTopology, manageNameDfsDirs, manageNameDfsSharedDirs,
|
||||||
|
enableManagedDfsDirsRedundancy,
|
||||||
|
format, startOpt, clusterId, conf);
|
||||||
|
} catch (IOException ioe) {
|
||||||
|
LOG.error("IOE creating namenodes. Permissions dump:\n" +
|
||||||
createPermissionsDiagnosisString(data_dir));
|
createPermissionsDiagnosisString(data_dir));
|
||||||
|
throw ioe;
|
||||||
|
}
|
||||||
|
if (format) {
|
||||||
|
if (data_dir.exists() && !FileUtil.fullyDelete(data_dir)) {
|
||||||
|
throw new IOException("Cannot remove data directory: " + data_dir +
|
||||||
|
createPermissionsDiagnosisString(data_dir));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (startOpt == StartupOption.RECOVER) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Start the DataNodes
|
||||||
|
startDataNodes(conf, numDataNodes, storageType, manageDataDfsDirs,
|
||||||
|
dnStartOpt != null ? dnStartOpt : startOpt,
|
||||||
|
racks, hosts, simulatedCapacities, setupHostsFile,
|
||||||
|
checkDataNodeAddrConfig, checkDataNodeHostConfig, dnConfOverlays);
|
||||||
|
waitClusterUp();
|
||||||
|
//make sure ProxyUsers uses the latest conf
|
||||||
|
ProxyUsers.refreshSuperUserGroupsConfiguration(conf);
|
||||||
|
success = true;
|
||||||
|
} finally {
|
||||||
|
if (!success) {
|
||||||
|
shutdown();
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if (startOpt == StartupOption.RECOVER) {
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Start the DataNodes
|
|
||||||
startDataNodes(conf, numDataNodes, storageType, manageDataDfsDirs,
|
|
||||||
dnStartOpt != null ? dnStartOpt : startOpt,
|
|
||||||
racks, hosts, simulatedCapacities, setupHostsFile,
|
|
||||||
checkDataNodeAddrConfig, checkDataNodeHostConfig, dnConfOverlays);
|
|
||||||
waitClusterUp();
|
|
||||||
//make sure ProxyUsers uses the latest conf
|
|
||||||
ProxyUsers.refreshSuperUserGroupsConfiguration(conf);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
Loading…
Reference in New Issue
Block a user