YARN-6533. Race condition in writing service record to registry in yarn native services. Contributed by Billie Rinaldi

This commit is contained in:
Jian He 2017-05-11 09:23:54 -07:00
parent ce05c6e981
commit a041373dd4
3 changed files with 11 additions and 22 deletions

View File

@ -503,7 +503,8 @@ public Iterable<String> getHostsList(Collection<ClusterNode> values,
*/
public void updateServiceRecord(StateAccessForProviders amState,
YarnRegistryViewForProviders yarnRegistry,
String containerId, String roleName, List<String> ip, String hostname) {
String containerId, String roleName, List<String> ip, String hostname)
throws IOException {
try {
RoleInstance role = null;
if(ip != null && !ip.isEmpty()){
@ -535,9 +536,6 @@ public void updateServiceRecord(StateAccessForProviders amState,
} catch (NoSuchNodeException e) {
// ignore - there is nothing to do if we don't find a container
log.warn("Owned container {} not found - {}", containerId, e);
} catch (IOException e) {
log.warn("Error updating container {} service record in registry",
containerId, e);
}
}
}

View File

@ -146,8 +146,15 @@ public boolean processContainerStatus(ContainerId containerId,
return false;
}
providerUtils.updateServiceRecord(amState, yarnRegistry,
containerId.toString(), instance.role, status.getIPs(), status.getHost());
try {
providerUtils.updateServiceRecord(amState, yarnRegistry,
containerId.toString(), instance.role, status.getIPs(), status.getHost());
} catch (IOException e) {
// could not write service record to ZK, log and retry
log.warn("Error updating container {} service record in registry, " +
"retrying", containerId, e);
return true;
}
// TODO publish ip and host
org.apache.slider.api.resource.Container container =
instance.providerRole.component.getContainer(containerId.toString());

View File

@ -1182,24 +1182,8 @@ public boolean registerComponent(ContainerId id, RoleInstance roleInstance)
return false;
}
// this is where component registrations go
String cid = RegistryPathUtils.encodeYarnID(id.toString());
ServiceRecord record = new ServiceRecord();
record.set(YarnRegistryAttributes.YARN_ID, cid);
record.description = roleInstance.getCompInstanceName();
log.info("Registering component " + roleInstance.getCompInstanceName()
+ ", containerId = " + id);
record.set(YarnRegistryAttributes.YARN_PERSISTENCE,
PersistencePolicies.CONTAINER);
setUserProvidedServiceRecordAttributes(
instance.providerRole.component.getConfiguration(), record);
try {
yarnRegistryOperations.putComponent(cid, record);
} catch (IOException e) {
log.warn("Failed to register container {}/{}: {}",
id, roleInstance.role, e, e);
return false;
}
org.apache.slider.api.resource.Container container =
new org.apache.slider.api.resource.Container();
container.setId(id.toString());