HDFS-8056. Decommissioned dead nodes should continue to be counted as dead after NN restart. (mingma)
This commit is contained in:
parent
ac1aa6c819
commit
1c4951a7a0
@ -1657,6 +1657,9 @@ Release 2.8.0 - UNRELEASED
|
||||
HDFS-9252. Change TestFileTruncate to use FsDatasetTestUtils to get block
|
||||
file size and genstamp. (Lei (Eddy) Xu via cmccabe)
|
||||
|
||||
HDFS-8056. Decommissioned dead nodes should continue to be counted as dead
|
||||
after NN restart. (mingma)
|
||||
|
||||
OPTIMIZATIONS
|
||||
|
||||
HDFS-8026. Trace FSOutputSummer#writeChecksumChunks rather than
|
||||
|
@ -1272,7 +1272,7 @@ public List<DatanodeDescriptor> getDatanodeListForReport(
|
||||
|
||||
if (listDeadNodes) {
|
||||
for (InetSocketAddress addr : includedNodes) {
|
||||
- if (foundNodes.matchedBy(addr) || excludedNodes.match(addr)) {
|
||||
+ if (foundNodes.matchedBy(addr)) {
|
||||
continue;
|
||||
}
|
||||
// The remaining nodes are ones that are referenced by the hosts
|
||||
@ -1289,6 +1289,9 @@ public List<DatanodeDescriptor> getDatanodeListForReport(
|
||||
addr.getPort() == 0 ? defaultXferPort : addr.getPort(),
|
||||
defaultInfoPort, defaultInfoSecurePort, defaultIpcPort));
|
||||
setDatanodeDead(dn);
|
||||
if (excludedNodes.match(addr)) {
|
||||
dn.setDecommissioned();
|
||||
}
|
||||
nodes.add(dn);
|
||||
}
|
||||
}
|
||||
|
@ -923,6 +923,41 @@ public void testDecommissionWithNamenodeRestart()throws IOException, Interrupted
|
||||
cluster.shutdown();
|
||||
}
|
||||
|
||||
/**
|
||||
* Tests dead node count after restart of namenode
|
||||
**/
|
||||
@Test(timeout=360000)
|
||||
public void testDeadNodeCountAfterNamenodeRestart()throws Exception {
|
||||
LOG.info("Starting test testDeadNodeCountAfterNamenodeRestart");
|
||||
int numNamenodes = 1;
|
||||
int numDatanodes = 2;
|
||||
|
||||
startCluster(numNamenodes, numDatanodes, conf);
|
||||
|
||||
DFSClient client = getDfsClient(cluster.getNameNode(), conf);
|
||||
DatanodeInfo[] info = client.datanodeReport(DatanodeReportType.LIVE);
|
||||
DatanodeInfo excludedDatanode = info[0];
|
||||
String excludedDatanodeName = info[0].getXferAddr();
|
||||
|
||||
writeConfigFile(hostsFile, new ArrayList<String>(Arrays.asList(
|
||||
excludedDatanodeName, info[1].getXferAddr())));
|
||||
decommissionNode(0, excludedDatanode.getDatanodeUuid(), null,
|
||||
AdminStates.DECOMMISSIONED);
|
||||
|
||||
cluster.stopDataNode(excludedDatanodeName);
|
||||
DFSTestUtil.waitForDatanodeState(
|
||||
cluster, excludedDatanode.getDatanodeUuid(), false, 20000);
|
||||
|
||||
//Restart the namenode
|
||||
cluster.restartNameNode();
|
||||
|
||||
assertEquals("There should be one node alive", 1,
|
||||
client.datanodeReport(DatanodeReportType.LIVE).length);
|
||||
assertEquals("There should be one node dead", 1,
|
||||
client.datanodeReport(DatanodeReportType.DEAD).length);
|
||||
cluster.shutdown();
|
||||
}
|
||||
|
||||
/**
|
||||
* Test using a "registration name" in a host include file.
|
||||
*
|
||||
|
@ -151,7 +151,7 @@ public void testIncludeExcludeLists() throws IOException {
|
||||
Assert.assertEquals(1, dm.getDatanodeListForReport(HdfsConstants
|
||||
.DatanodeReportType.DEAD).size());
|
||||
excludedNodes.add(entry("127.0.0.3"));
|
||||
- Assert.assertEquals(0, dm.getDatanodeListForReport(HdfsConstants
|
||||
+ Assert.assertEquals(1, dm.getDatanodeListForReport(HdfsConstants
|
||||
.DatanodeReportType.DEAD).size());
|
||||
}
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user