From 42863b9bafb9f77b76d9dcd26f0fcac859ea6f6a Mon Sep 17 00:00:00 2001 From: Tanping Wang Date: Thu, 23 Jun 2011 22:13:58 +0000 Subject: [PATCH] HDFS-2086. If the include hosts list contains host names, after restarting namenode, data nodes registration is denied. Contributed by Tanping Wang. git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/trunk@1139090 13f79535-47bb-0310-9956-ffa450edef68 --- hdfs/CHANGES.txt | 3 + .../hdfs/server/namenode/FSNamesystem.java | 78 +++++++++++++--- .../hdfs/server/namenode/TestStartup.java | 92 ++++++++++++++++++- 3 files changed, 158 insertions(+), 15 deletions(-) diff --git a/hdfs/CHANGES.txt b/hdfs/CHANGES.txt index fffd576edb..016ab754b8 100644 --- a/hdfs/CHANGES.txt +++ b/hdfs/CHANGES.txt @@ -766,6 +766,9 @@ Trunk (unreleased changes) HDFS-1734. 'Chunk size to view' option is not working in Name Node UI. (Uma Maheswara Rao G via jitendra) + HDFS-2086. If the include hosts list contains host names, after restarting + namenode, data nodes registration is denied. Contributed by Tanping Wang. + Release 0.22.0 - Unreleased INCOMPATIBLE CHANGES diff --git a/hdfs/src/java/org/apache/hadoop/hdfs/server/namenode/FSNamesystem.java b/hdfs/src/java/org/apache/hadoop/hdfs/server/namenode/FSNamesystem.java index 19b5002364..d1d7286406 100644 --- a/hdfs/src/java/org/apache/hadoop/hdfs/server/namenode/FSNamesystem.java +++ b/hdfs/src/java/org/apache/hadoop/hdfs/server/namenode/FSNamesystem.java @@ -31,6 +31,7 @@ import java.io.PrintWriter; import java.lang.management.ManagementFactory; import java.net.InetAddress; import java.net.URI; +import java.net.UnknownHostException; import java.util.ArrayList; import java.util.Arrays; import java.util.Collection; @@ -3784,9 +3785,19 @@ public class FSNamesystem implements FSConstants, FSNamesystemMBean, nodes.add(dn); } //Remove any form of the this datanode in include/exclude lists. - mustList.remove(dn.getName()); - mustList.remove(dn.getHost()); - mustList.remove(dn.getHostName()); + try { + InetAddress inet = InetAddress.getByName(dn.getHost()); + // compare hostname(:port) + mustList.remove(inet.getHostName()); + mustList.remove(inet.getHostName()+":"+dn.getPort()); + // compare ipaddress(:port) + mustList.remove(inet.getHostAddress().toString()); + mustList.remove(inet.getHostAddress().toString()+ ":" +dn.getPort()); + } catch ( UnknownHostException e ) { + mustList.remove(dn.getName()); + mustList.remove(dn.getHost()); + LOG.warn(e); + } } } @@ -4031,23 +4042,62 @@ public class FSNamesystem implements FSConstants, FSNamesystemMBean, */ private boolean inHostsList(DatanodeID node, String ipAddr) { Set hostsList = hostsReader.getHosts(); - return (hostsList.isEmpty() || - (ipAddr != null && hostsList.contains(ipAddr)) || - hostsList.contains(node.getHost()) || - hostsList.contains(node.getName()) || - ((node instanceof DatanodeInfo) && - hostsList.contains(((DatanodeInfo)node).getHostName()))); + return checkInList(node, ipAddr, hostsList, false); } private boolean inExcludedHostsList(DatanodeID node, String ipAddr) { Set excludeList = hostsReader.getExcludedHosts(); - return ((ipAddr != null && excludeList.contains(ipAddr)) || - excludeList.contains(node.getHost()) || - excludeList.contains(node.getName()) || - ((node instanceof DatanodeInfo) && - excludeList.contains(((DatanodeInfo)node).getHostName()))); + return checkInList(node, ipAddr, excludeList, true); } + + /** + * Check if the given node (of DatanodeID or ipAddress) is in the (include or + * exclude) list. If ipAddress in null, check only based upon the given + * DatanodeID. If ipAddress is not null, the ipAddress should refers to the + * same host that given DatanodeID refers to. + * + * @param node, DatanodeID, the host DatanodeID + * @param ipAddress, if not null, should refers to the same host + * that DatanodeID refers to + * @param hostsList, the list of hosts in the include/exclude file + * @param isExcludeList, boolean, true if this is the exclude list + * @return boolean, if in the list + */ + private boolean checkInList(DatanodeID node, String ipAddress, + Set hostsList, boolean isExcludeList) { + InetAddress iaddr = null; + try { + if (ipAddress != null) { + iaddr = InetAddress.getByName(ipAddress); + } else { + iaddr = InetAddress.getByName(node.getHost()); + } + }catch (UnknownHostException e) { + LOG.warn("Unknown host in host list: "+ipAddress); + // can't resolve the host name. + if (isExcludeList){ + return true; + } else { + return false; + } + } + + // if include list is empty, host is in include list + if ( (!isExcludeList) && (hostsList.isEmpty()) ){ + return true; + } + return // compare ipaddress(:port) + (hostsList.contains(iaddr.getHostAddress().toString())) + || (hostsList.contains(iaddr.getHostAddress().toString() + ":" + + node.getPort())) + // compare hostname(:port) + || (hostsList.contains(iaddr.getHostName())) + || (hostsList.contains(iaddr.getHostName() + ":" + node.getPort())) + || ((node instanceof DatanodeInfo) && hostsList + .contains(((DatanodeInfo) node).getHostName())); + } + /** * Rereads the config to get hosts and exclude list file names. * Rereads the files to update the hosts and exclude lists. It diff --git a/hdfs/src/test/hdfs/org/apache/hadoop/hdfs/server/namenode/TestStartup.java b/hdfs/src/test/hdfs/org/apache/hadoop/hdfs/server/namenode/TestStartup.java index f7854777e9..4d600b2ed3 100644 --- a/hdfs/src/test/hdfs/org/apache/hadoop/hdfs/server/namenode/TestStartup.java +++ b/hdfs/src/test/hdfs/org/apache/hadoop/hdfs/server/namenode/TestStartup.java @@ -25,7 +25,9 @@ import java.io.FileInputStream; import java.io.FileOutputStream; import java.io.IOException; import java.io.RandomAccessFile; +import java.net.InetAddress; import java.net.URI; +import java.util.ArrayList; import java.util.Iterator; import java.util.List; import java.util.Properties; @@ -43,18 +45,21 @@ import org.apache.hadoop.fs.Path; import org.apache.hadoop.fs.permission.FsPermission; import org.apache.hadoop.fs.permission.PermissionStatus; +import org.apache.hadoop.hdfs.DFSClient; import org.apache.hadoop.hdfs.DFSConfigKeys; import org.apache.hadoop.hdfs.DFSTestUtil; import org.apache.hadoop.hdfs.HdfsConfiguration; import org.apache.hadoop.hdfs.MiniDFSCluster; +import org.apache.hadoop.hdfs.protocol.DatanodeInfo; +import org.apache.hadoop.hdfs.protocol.FSConstants.DatanodeReportType; import org.apache.hadoop.hdfs.protocol.FSConstants.SafeModeAction; import org.apache.hadoop.hdfs.server.common.Storage.StorageDirectory; import org.apache.hadoop.hdfs.server.namenode.NNStorage.NameNodeDirType; import org.apache.hadoop.hdfs.server.namenode.NNStorage.NameNodeFile; import org.apache.hadoop.io.IOUtils; import org.apache.hadoop.io.MD5Hash; -import org.apache.hadoop.test.GenericTestUtils; import org.apache.hadoop.util.StringUtils; +import org.junit.Assert; /** * Startup and checkpoint tests @@ -491,4 +496,89 @@ public class TestStartup extends TestCase { namenode.join(); } } + + /** + * This test tests hosts include list contains host names. After namenode + * restarts, the still alive datanodes should not have any trouble in getting + * registrant again. + */ + public void testNNRestart() throws IOException, InterruptedException { + MiniDFSCluster cluster = null; + FileSystem localFileSys; + Path hostsFile; + Path excludeFile; + Configuration conf = new HdfsConfiguration(); + int HEARTBEAT_INTERVAL = 1; // heartbeat interval in seconds + // Set up the hosts/exclude files. + localFileSys = FileSystem.getLocal(conf); + Path workingDir = localFileSys.getWorkingDirectory(); + Path dir = new Path(workingDir, "build/test/data/work-dir/restartnn"); + hostsFile = new Path(dir, "hosts"); + excludeFile = new Path(dir, "exclude"); + + // Setup conf + conf.set(DFSConfigKeys.DFS_HOSTS_EXCLUDE, excludeFile.toUri().getPath()); + writeConfigFile(localFileSys, excludeFile, null); + conf.set(DFSConfigKeys.DFS_HOSTS, hostsFile.toUri().getPath()); + // write into hosts file + ArrayListlist = new ArrayList(); + byte b[] = {127, 0, 0, 1}; + InetAddress inetAddress = InetAddress.getByAddress(b); + list.add(inetAddress.getHostName()); + writeConfigFile(localFileSys, hostsFile, list); + int numNameNodes = 1; + int numDatanodes = 1; + + try { + cluster = new MiniDFSCluster.Builder(conf).numNameNodes(numNameNodes) + .numDataNodes(numDatanodes).setupHostsFile(true).build(); + cluster.waitActive(); + + cluster.restartNameNode(); + NameNode nn = cluster.getNameNode(); + assertNotNull(nn); + Assert.assertTrue(cluster.isDataNodeUp()); + + DatanodeInfo[] info = nn.getDatanodeReport(DatanodeReportType.LIVE); + for (int i = 0 ; i < 5 && info.length != numDatanodes; i++) { + Thread.sleep(HEARTBEAT_INTERVAL * 1000); + info = nn.getDatanodeReport(DatanodeReportType.LIVE); + } + assertEquals("Number of live nodes should be "+numDatanodes, numDatanodes, + info.length); + + } catch (IOException e) { + fail(StringUtils.stringifyException(e)); + throw e; + } finally { + cleanupFile(localFileSys, excludeFile.getParent()); + if (cluster != null) { + cluster.shutdown(); + } + } + } + + private void writeConfigFile(FileSystem localFileSys, Path name, + ArrayList nodes) throws IOException { + // delete if it already exists + if (localFileSys.exists(name)) { + localFileSys.delete(name, true); + } + + if (nodes != null) { + FSDataOutputStream stm = localFileSys.create(name); + for (Iterator it = nodes.iterator(); it.hasNext();) { + String node = it.next(); + stm.writeBytes(node); + stm.writeBytes("\n"); + } + stm.close(); + } + } + + private void cleanupFile(FileSystem fileSys, Path name) throws IOException { + assertTrue(fileSys.exists(name)); + fileSys.delete(name, true); + assertTrue(!fileSys.exists(name)); + } }