HDFS-16087. Fix stuck issue in rbfbalance tool (#3141). Contributed by Eric Yin.
commit de41ce8a16
parent e1d00addb5
@@ -44,6 +44,7 @@ protected void disableWrite(FedBalanceContext context) throws IOException {
     Configuration conf = context.getConf();
     String mount = context.getMount();
     MountTableProcedure.disableWrite(mount, conf);
+    updateStage(Stage.FINAL_DISTCP);
   }
 
   /**
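The added call above is the whole fix: RouterDistCpProcedure.disableWrite made the mount point read-only but never advanced the procedure's stage, so the job never moved on to FINAL_DISTCP and rbfbalance appeared stuck. Below is a self-contained sketch of that stage-driven loop; the class and method names are illustrative stand-ins, not the real fedbalance classes.

// Illustrative sketch of a stage-driven procedure (stand-in names only).
public class StuckStageSketch {

  enum Stage { PRE_CHECK, INIT_DISTCP, DIFF_DISTCP, DISABLE_WRITE, FINAL_DISTCP, FINISH }

  private Stage stage = Stage.DISABLE_WRITE;

  // The subclass hook: make the mount point read only, then hand off to the
  // next stage. Without the updateStage call (the one-line fix above), the
  // stage never changes and executeOnce() below keeps returning false forever.
  void disableWrite() {
    // ... disable writes on the mount point ...
    updateStage(Stage.FINAL_DISTCP);
  }

  void updateStage(Stage value) {
    stage = value;
  }

  // One scheduling round: returns true once the procedure is finished.
  boolean executeOnce() {
    switch (stage) {
      case DISABLE_WRITE:
        disableWrite();
        return false;
      case FINAL_DISTCP:
        // run the final distcp round, then finish
        updateStage(Stage.FINISH);
        return true;
      default:
        return false;
    }
  }

  public static void main(String[] args) {
    StuckStageSketch procedure = new StuckStageSketch();
    // The scheduler keeps re-running the procedure until it reports done;
    // a disableWrite() that never advances the stage makes this loop spin.
    while (!procedure.executeOnce()) {
      // retry
    }
    System.out.println("finished at stage " + procedure.stage);
  }
}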
@@ -0,0 +1,120 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ * <p>
+ * http://www.apache.org/licenses/LICENSE-2.0
+ * <p>
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.hadoop.hdfs.rbfbalance;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.permission.FsPermission;
+import org.apache.hadoop.ha.HAServiceProtocol;
+import org.apache.hadoop.hdfs.DFSClient;
+import org.apache.hadoop.hdfs.server.federation.MiniRouterDFSCluster;
+import org.apache.hadoop.hdfs.server.federation.RouterConfigBuilder;
+import org.apache.hadoop.hdfs.server.federation.StateStoreDFSCluster;
+import org.apache.hadoop.hdfs.server.federation.resolver.ActiveNamenodeResolver;
+import org.apache.hadoop.hdfs.server.federation.resolver.MountTableManager;
+import org.apache.hadoop.hdfs.server.federation.router.RBFConfigKeys;
+import org.apache.hadoop.hdfs.server.federation.router.Router;
+import org.apache.hadoop.hdfs.server.federation.store.StateStoreService;
+import org.apache.hadoop.hdfs.server.federation.store.impl.MountTableStoreImpl;
+import org.apache.hadoop.hdfs.server.federation.store.protocol.AddMountTableEntryRequest;
+import org.apache.hadoop.hdfs.server.federation.store.protocol.AddMountTableEntryResponse;
+import org.apache.hadoop.hdfs.server.federation.store.records.MountTable;
+import org.apache.hadoop.ipc.RemoteException;
+import org.apache.hadoop.tools.fedbalance.DistCpProcedure.Stage;
+import org.apache.hadoop.tools.fedbalance.FedBalanceContext;
+import org.apache.hadoop.tools.fedbalance.TestDistCpProcedure;
+import org.apache.hadoop.util.Time;
+import org.junit.AfterClass;
+import org.junit.BeforeClass;
+
+import java.net.InetSocketAddress;
+import java.net.URI;
+import java.util.Collections;
+
+import static org.apache.hadoop.hdfs.server.federation.FederationTestUtils.createNamenodeReport;
+import static org.apache.hadoop.test.LambdaTestUtils.intercept;
+import static org.junit.Assert.assertTrue;
+
+
+public class TestRouterDistCpProcedure extends TestDistCpProcedure {
+  private static StateStoreDFSCluster cluster;
+  private static MiniRouterDFSCluster.RouterContext routerContext;
+  private static Configuration routerConf;
+  private static StateStoreService stateStore;
+
+  @BeforeClass
+  public static void globalSetUp() throws Exception {
+    cluster = new StateStoreDFSCluster(false, 1);
+    // Build and start a router with State Store + admin + RPC.
+    Configuration conf = new RouterConfigBuilder()
+        .stateStore()
+        .admin()
+        .rpc()
+        .build();
+    cluster.addRouterOverrides(conf);
+    cluster.startRouters();
+    routerContext = cluster.getRandomRouter();
+    Router router = routerContext.getRouter();
+    stateStore = router.getStateStore();
+
+    // Add one name service for testing.
+    ActiveNamenodeResolver membership = router.getNamenodeResolver();
+    membership.registerNamenode(createNamenodeReport("ns0", "nn1",
+        HAServiceProtocol.HAServiceState.ACTIVE));
+    stateStore.refreshCaches(true);
+
+    routerConf = new Configuration();
+    InetSocketAddress routerSocket = router.getAdminServerAddress();
+    routerConf.setSocketAddr(RBFConfigKeys.DFS_ROUTER_ADMIN_ADDRESS_KEY,
+        routerSocket);
+  }
+
+  @Override
+  public void testDisableWrite() throws Exception {
+    // First add the mount entry: /test-write -> {ns0, /test-write}.
+    String mount = "/test-write";
+    MountTable newEntry = MountTable
+        .newInstance(mount, Collections.singletonMap("ns0", mount),
+            Time.now(), Time.now());
+    MountTableManager mountTable =
+        routerContext.getAdminClient().getMountTableManager();
+    AddMountTableEntryRequest addRequest =
+        AddMountTableEntryRequest.newInstance(newEntry);
+    AddMountTableEntryResponse addResponse =
+        mountTable.addMountTableEntry(addRequest);
+    assertTrue(addResponse.getStatus());
+    stateStore.loadCache(MountTableStoreImpl.class, true); // load cache.
+
+    // Construct the client.
+    URI address = routerContext.getFileSystemURI();
+    DFSClient routerClient = new DFSClient(address, routerConf);
+
+    FedBalanceContext context = new FedBalanceContext
+        .Builder(null, null, mount, routerConf).build();
+    RouterDistCpProcedure dcProcedure = new RouterDistCpProcedure();
+    executeProcedure(dcProcedure, Stage.FINAL_DISTCP,
+        () -> dcProcedure.disableWrite(context));
+    intercept(RemoteException.class, "is in a read only mount point",
+        "Expect readonly exception.", () -> routerClient
+            .mkdirs(mount + "/dir", new FsPermission(020), false));
+  }
+
+  @AfterClass
+  public static void tearDown() {
+    cluster.stopRouter(routerContext);
+  }
+}
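The new test walks a RouterDistCpProcedure up to FINAL_DISTCP through the executeProcedure helper (widened to protected in the hunks below) and then expects any write through the router to fail, since the mount entry has become read-only. The closing assertion uses Hadoop's LambdaTestUtils.intercept; a simplified, self-contained stand-in for that expect-an-exception pattern (not the real LambdaTestUtils API) is sketched here.

import java.util.concurrent.Callable;

// Simplified stand-in for the expect-an-exception pattern the test relies on.
public final class InterceptSketch {

  static <E extends Exception> E intercept(Class<E> expected, String contained,
      Callable<?> action) throws Exception {
    try {
      action.call();
    } catch (Exception e) {
      if (expected.isInstance(e)
          && String.valueOf(e.getMessage()).contains(contained)) {
        return expected.cast(e);   // the failure we wanted to see
      }
      throw e;                     // wrong type or message: surface it
    }
    throw new AssertionError("Expected " + expected.getSimpleName()
        + " containing \"" + contained + "\", but nothing was thrown");
  }

  public static void main(String[] args) throws Exception {
    // Mimics the read-only failure the real test expects from the router.
    intercept(IllegalStateException.class, "read only mount point",
        () -> {
          throw new IllegalStateException(
              "/test-write/dir is in a read only mount point");
        });
    System.out.println("caught the expected read-only failure");
  }
}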
@@ -72,7 +72,7 @@ public class DistCpProcedure extends BalanceProcedure {
       LoggerFactory.getLogger(DistCpProcedure.class);
 
   /* Stages of this procedure. */
-  enum Stage {
+  public enum Stage {
     PRE_CHECK, INIT_DISTCP, DIFF_DISTCP, DISABLE_WRITE, FINAL_DISTCP, FINISH
   }
 
@@ -325,7 +325,7 @@ Stage getStage() {
   }
 
   @VisibleForTesting
-  void updateStage(Stage value) {
+  protected void updateStage(Stage value) {
     String oldStage = stage == null ? "null" : stage.name();
     String newStage = value == null ? "null" : value.name();
     LOG.info("Stage updated from {} to {}.", oldStage, newStage);
@@ -389,7 +389,7 @@ private FedBalanceContext buildContext(Path src, Path dst, String mount,
         .setDiffThreshold(diffThreshold).build();
   }
 
-  interface Call {
+  protected interface Call {
     void execute() throws IOException, RetryException;
   }
 
@@ -400,8 +400,8 @@ interface Call {
    * @param target the target stage.
    * @param call the function executing the procedure.
    */
-  private static void executeProcedure(DistCpProcedure procedure, Stage target,
-      Call call) throws IOException {
+  protected static void executeProcedure(DistCpProcedure procedure,
+      Stage target, Call call) throws IOException {
     Stage stage = Stage.PRE_CHECK;
     procedure.updateStage(stage);
     while (stage != target) {
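The point of the visibility changes above (Stage becomes public; updateStage, Call, and executeProcedure become protected) is that RouterDistCpProcedure and TestRouterDistCpProcedure live in a different package, org.apache.hadoop.hdfs.rbfbalance, so the old package-private access would not compile for them. A minimal two-file sketch of that access rule, using illustrative stand-in names rather than the real fedbalance classes:

// file: base/BaseProcedure.java
package base;

public class BaseProcedure {
  public enum Stage { DISABLE_WRITE, FINAL_DISTCP }    // was package-private
  private Stage stage = Stage.DISABLE_WRITE;

  protected void updateStage(Stage value) {            // was package-private
    stage = value;
  }

  public Stage getStage() {
    return stage;
  }
}

// file: sub/RouterProcedure.java
package sub;

import base.BaseProcedure;

public class RouterProcedure extends BaseProcedure {
  public void disableWrite() {
    // Compiles only because Stage is public and updateStage is protected;
    // with package-private access this line would not compile outside "base".
    updateStage(Stage.FINAL_DISTCP);
  }

  public static void main(String[] args) {
    RouterProcedure p = new RouterProcedure();
    p.disableWrite();
    System.out.println("stage is now " + p.getStage()); // FINAL_DISTCP
  }
}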