YARN-7307. Allow client/AM update supported resource types via YARN APIs. (Sunil G via wangda)
Change-Id: I14c5ea7252b7c17e86ab38f692b5f9d43196dbe0
This commit is contained in:
parent
a25b5aa0cf
commit
36e158ae98
@ -32,6 +32,7 @@
|
||||
import org.apache.hadoop.yarn.api.records.Container;
|
||||
import org.apache.hadoop.yarn.api.records.NMToken;
|
||||
import org.apache.hadoop.yarn.api.records.Resource;
|
||||
import org.apache.hadoop.yarn.api.records.ResourceTypeInfo;
|
||||
import org.apache.hadoop.yarn.proto.YarnServiceProtos.SchedulerResourceTypes;
|
||||
import org.apache.hadoop.yarn.util.Records;
|
||||
|
||||
@ -205,11 +206,41 @@ public abstract void setContainersFromPreviousAttempts(
|
||||
public abstract void setSchedulerResourceTypes(
|
||||
EnumSet<SchedulerResourceTypes> types);
|
||||
|
||||
/**
|
||||
* Get list of supported resource profiles from RM.
|
||||
*
|
||||
* @return a map of resource profiles and its capabilities.
|
||||
*/
|
||||
@Public
|
||||
@Unstable
|
||||
public abstract Map<String, Resource> getResourceProfiles();
|
||||
|
||||
/**
|
||||
* Set supported resource profiles for RM.
|
||||
*
|
||||
* @param profiles
|
||||
* a map of resource profiles with its capabilities.
|
||||
*/
|
||||
@Private
|
||||
@Unstable
|
||||
public abstract void setResourceProfiles(Map<String, Resource> profiles);
|
||||
|
||||
/**
|
||||
* Get available resource types supported by RM.
|
||||
*
|
||||
* @return a Map of RM settings
|
||||
*/
|
||||
@Public
|
||||
@Unstable
|
||||
public abstract List<ResourceTypeInfo> getResourceTypes();
|
||||
|
||||
/**
|
||||
* Set the resource types used by RM.
|
||||
*
|
||||
* @param types
|
||||
* a set of the resource types supported by RM.
|
||||
*/
|
||||
@Private
|
||||
@Unstable
|
||||
public abstract void setResourceTypes(List<ResourceTypeInfo> types);
|
||||
}
|
||||
|
@ -215,6 +215,12 @@ public static ResourceInformation newInstance(String name, String units) {
|
||||
Long.MAX_VALUE);
|
||||
}
|
||||
|
||||
public static ResourceInformation newInstance(String name, String units,
|
||||
ResourceTypes resourceType) {
|
||||
return ResourceInformation.newInstance(name, units, 0L, resourceType, 0L,
|
||||
Long.MAX_VALUE);
|
||||
}
|
||||
|
||||
public static ResourceInformation newInstance(String name, long value) {
|
||||
return ResourceInformation
|
||||
.newInstance(name, "", value, ResourceTypes.COUNTABLE, 0L,
|
||||
|
@ -975,6 +975,17 @@ public static boolean isAclEnabled(Configuration conf) {
|
||||
public static final String DEFAULT_RM_RESOURCE_PROFILES_SOURCE_FILE =
|
||||
"resource-profiles.json";
|
||||
|
||||
/**
|
||||
* Enable/disable loading resource-types.xml at client side.
|
||||
*/
|
||||
@Public
|
||||
@Unstable
|
||||
public static final String YARN_CLIENT_LOAD_RESOURCETYPES_FROM_SERVER = YARN_PREFIX
|
||||
+ "client.load.resource-types.from-server";
|
||||
@Public
|
||||
@Unstable
|
||||
public static final boolean DEFAULT_YARN_CLIENT_LOAD_RESOURCETYPES_FROM_SERVER = false;
|
||||
|
||||
/**
|
||||
* Timeout in seconds for YARN node graceful decommission.
|
||||
* This is the maximal time to wait for running containers and applications
|
||||
|
@ -44,8 +44,6 @@
|
||||
import java.util.Map;
|
||||
import java.util.concurrent.ConcurrentHashMap;
|
||||
|
||||
import static org.apache.hadoop.yarn.api.records.ResourceInformation.GPU_URI;
|
||||
|
||||
/**
|
||||
* Helper class to read the resource-types to be supported by the system.
|
||||
*/
|
||||
@ -581,4 +579,25 @@ public static List<ResourceTypeInfo> getResourcesTypeInfo() {
|
||||
}
|
||||
return array;
|
||||
}
|
||||
|
||||
/**
|
||||
* Reinitialize all resource types from external source (in case of client,
|
||||
* server will send the updated list and local resourceutils cache will be
|
||||
* updated as per server's list of resources)
|
||||
*
|
||||
* @param resourceTypeInfo
|
||||
* List of resource types
|
||||
*/
|
||||
public static void reinitializeResources(
|
||||
List<ResourceTypeInfo> resourceTypeInfo) {
|
||||
Map<String, ResourceInformation> resourceInformationMap = new HashMap<>();
|
||||
|
||||
for (ResourceTypeInfo resourceType : resourceTypeInfo) {
|
||||
resourceInformationMap.put(resourceType.getName(),
|
||||
ResourceInformation.newInstance(resourceType.getName(),
|
||||
resourceType.getDefaultUnit(), resourceType.getResourceType()));
|
||||
}
|
||||
ResourceUtils
|
||||
.initializeResourcesFromResourceInformationMap(resourceInformationMap);
|
||||
}
|
||||
}
|
||||
|
@ -49,6 +49,7 @@ message RegisterApplicationMasterResponseProto {
|
||||
repeated NMTokenProto nm_tokens_from_previous_attempts = 6;
|
||||
repeated SchedulerResourceTypes scheduler_resource_types = 7;
|
||||
optional ResourceProfilesProto resource_profiles = 8;
|
||||
repeated ResourceTypeInfoProto resource_types = 9;
|
||||
}
|
||||
|
||||
message FinishApplicationMasterRequestProto {
|
||||
|
@ -22,6 +22,7 @@
|
||||
import java.nio.ByteBuffer;
|
||||
import java.util.ArrayList;
|
||||
import java.util.EnumSet;
|
||||
import java.util.HashMap;
|
||||
import java.util.HashSet;
|
||||
import java.util.Iterator;
|
||||
import java.util.List;
|
||||
@ -105,6 +106,7 @@
|
||||
import org.apache.hadoop.yarn.api.records.QueueInfo;
|
||||
import org.apache.hadoop.yarn.api.records.QueueUserACLInfo;
|
||||
import org.apache.hadoop.yarn.api.records.Resource;
|
||||
import org.apache.hadoop.yarn.api.records.ResourceInformation;
|
||||
import org.apache.hadoop.yarn.api.records.ResourceTypeInfo;
|
||||
import org.apache.hadoop.yarn.api.records.SignalContainerCommand;
|
||||
import org.apache.hadoop.yarn.api.records.Token;
|
||||
@ -125,6 +127,7 @@
|
||||
import org.apache.hadoop.yarn.security.client.TimelineDelegationTokenIdentifier;
|
||||
import org.apache.hadoop.yarn.util.ConverterUtils;
|
||||
import org.apache.hadoop.yarn.util.Records;
|
||||
import org.apache.hadoop.yarn.util.resource.ResourceUtils;
|
||||
import org.apache.hadoop.yarn.util.timeline.TimelineUtils;
|
||||
|
||||
import com.google.common.annotations.VisibleForTesting;
|
||||
@ -148,6 +151,7 @@ public class YarnClientImpl extends YarnClient {
|
||||
String timelineDTRenewer;
|
||||
private boolean timelineV1ServiceEnabled;
|
||||
protected boolean timelineServiceBestEffort;
|
||||
private boolean loadResourceTypesFromServer;
|
||||
|
||||
private static final String ROOT = "root";
|
||||
|
||||
@ -199,6 +203,11 @@ protected void serviceInit(Configuration conf) throws Exception {
|
||||
timelineServiceBestEffort = conf.getBoolean(
|
||||
YarnConfiguration.TIMELINE_SERVICE_CLIENT_BEST_EFFORT,
|
||||
YarnConfiguration.DEFAULT_TIMELINE_SERVICE_CLIENT_BEST_EFFORT);
|
||||
|
||||
loadResourceTypesFromServer = conf.getBoolean(
|
||||
YarnConfiguration.YARN_CLIENT_LOAD_RESOURCETYPES_FROM_SERVER,
|
||||
YarnConfiguration.DEFAULT_YARN_CLIENT_LOAD_RESOURCETYPES_FROM_SERVER);
|
||||
|
||||
super.serviceInit(conf);
|
||||
}
|
||||
|
||||
@ -217,6 +226,13 @@ protected void serviceStart() throws Exception {
|
||||
} catch (IOException e) {
|
||||
throw new YarnRuntimeException(e);
|
||||
}
|
||||
|
||||
// Reinitialize local resource types cache from list of resources pulled from
|
||||
// RM.
|
||||
if (loadResourceTypesFromServer) {
|
||||
ResourceUtils.reinitializeResources(getResourceTypeInfo());
|
||||
}
|
||||
|
||||
super.serviceStart();
|
||||
}
|
||||
|
||||
|
@ -29,15 +29,18 @@
|
||||
import org.apache.hadoop.yarn.api.records.Container;
|
||||
import org.apache.hadoop.yarn.api.records.NMToken;
|
||||
import org.apache.hadoop.yarn.api.records.Resource;
|
||||
import org.apache.hadoop.yarn.api.records.ResourceTypeInfo;
|
||||
import org.apache.hadoop.yarn.api.records.impl.pb.ContainerPBImpl;
|
||||
import org.apache.hadoop.yarn.api.records.impl.pb.NMTokenPBImpl;
|
||||
import org.apache.hadoop.yarn.api.records.impl.pb.ProtoUtils;
|
||||
import org.apache.hadoop.yarn.api.records.impl.pb.ResourcePBImpl;
|
||||
import org.apache.hadoop.yarn.api.records.impl.pb.ResourceTypeInfoPBImpl;
|
||||
import org.apache.hadoop.yarn.proto.YarnProtos.ResourceProfilesProto;
|
||||
import org.apache.hadoop.yarn.proto.YarnProtos.ResourceProfileEntry;
|
||||
import org.apache.hadoop.yarn.proto.YarnProtos.ApplicationACLMapProto;
|
||||
import org.apache.hadoop.yarn.proto.YarnProtos.ContainerProto;
|
||||
import org.apache.hadoop.yarn.proto.YarnProtos.ResourceProto;
|
||||
import org.apache.hadoop.yarn.proto.YarnProtos.ResourceTypeInfoProto;
|
||||
import org.apache.hadoop.yarn.proto.YarnServiceProtos.NMTokenProto;
|
||||
import org.apache.hadoop.yarn.proto.YarnServiceProtos.RegisterApplicationMasterResponseProto;
|
||||
import org.apache.hadoop.yarn.proto.YarnServiceProtos.RegisterApplicationMasterResponseProtoOrBuilder;
|
||||
@ -62,6 +65,7 @@ public class RegisterApplicationMasterResponsePBImpl extends
|
||||
private List<NMToken> nmTokens = null;
|
||||
private EnumSet<SchedulerResourceTypes> schedulerResourceTypes = null;
|
||||
private Map<String, Resource> profiles = null;
|
||||
private List<ResourceTypeInfo> resourceTypeInfo = null;
|
||||
|
||||
public RegisterApplicationMasterResponsePBImpl() {
|
||||
builder = RegisterApplicationMasterResponseProto.newBuilder();
|
||||
@ -129,8 +133,10 @@ private void mergeLocalToBuilder() {
|
||||
if (profiles != null) {
|
||||
addResourceProfiles();
|
||||
}
|
||||
if (resourceTypeInfo != null) {
|
||||
addResourceTypeInfosToProto();
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
private void maybeInitBuilder() {
|
||||
if (viaProto || builder == null) {
|
||||
@ -514,4 +520,75 @@ private NMTokenProto convertToProtoFormat(NMToken token) {
|
||||
private NMToken convertFromProtoFormat(NMTokenProto proto) {
|
||||
return new NMTokenPBImpl(proto);
|
||||
}
|
||||
|
||||
private ResourceTypeInfoPBImpl convertFromProtoFormat(
|
||||
ResourceTypeInfoProto p) {
|
||||
return new ResourceTypeInfoPBImpl(p);
|
||||
}
|
||||
|
||||
private ResourceTypeInfoProto convertToProtoFormat(ResourceTypeInfo t) {
|
||||
return ((ResourceTypeInfoPBImpl) t).getProto();
|
||||
}
|
||||
|
||||
@Override
|
||||
public List<ResourceTypeInfo> getResourceTypes() {
|
||||
initResourceTypeInfosList();
|
||||
return this.resourceTypeInfo;
|
||||
}
|
||||
|
||||
@Override
|
||||
public void setResourceTypes(List<ResourceTypeInfo> types) {
|
||||
if (resourceTypeInfo == null) {
|
||||
builder.clearResourceTypes();
|
||||
}
|
||||
this.resourceTypeInfo = types;
|
||||
}
|
||||
|
||||
private void addResourceTypeInfosToProto() {
|
||||
maybeInitBuilder();
|
||||
builder.clearResourceTypes();
|
||||
if (resourceTypeInfo == null) {
|
||||
return;
|
||||
}
|
||||
Iterable<ResourceTypeInfoProto> iterable = new Iterable<ResourceTypeInfoProto>() {
|
||||
@Override
|
||||
public Iterator<ResourceTypeInfoProto> iterator() {
|
||||
return new Iterator<ResourceTypeInfoProto>() {
|
||||
|
||||
Iterator<ResourceTypeInfo> iter = resourceTypeInfo.iterator();
|
||||
|
||||
@Override
|
||||
public boolean hasNext() {
|
||||
return iter.hasNext();
|
||||
}
|
||||
|
||||
@Override
|
||||
public ResourceTypeInfoProto next() {
|
||||
return convertToProtoFormat(iter.next());
|
||||
}
|
||||
|
||||
@Override
|
||||
public void remove() {
|
||||
throw new UnsupportedOperationException();
|
||||
|
||||
}
|
||||
};
|
||||
|
||||
}
|
||||
};
|
||||
builder.addAllResourceTypes(iterable);
|
||||
}
|
||||
|
||||
private void initResourceTypeInfosList() {
|
||||
if (this.resourceTypeInfo != null) {
|
||||
return;
|
||||
}
|
||||
RegisterApplicationMasterResponseProtoOrBuilder p = viaProto ? proto : builder;
|
||||
List<ResourceTypeInfoProto> list = p.getResourceTypesList();
|
||||
resourceTypeInfo = new ArrayList<ResourceTypeInfo>();
|
||||
|
||||
for (ResourceTypeInfoProto a : list) {
|
||||
resourceTypeInfo.add(convertFromProtoFormat(a));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
@ -3488,5 +3488,13 @@
|
||||
<value>auto</value>
|
||||
</property>
|
||||
|
||||
<property>
|
||||
<description>
|
||||
Provides an option for client to load supported resource types from RM
|
||||
instead of depending on local resource-types.xml file.
|
||||
</description>
|
||||
<name>yarn.client.load.resource-types.from-server</name>
|
||||
<value>false</value>
|
||||
</property>
|
||||
|
||||
</configuration>
|
||||
|
@ -74,6 +74,7 @@
|
||||
.SchedulerNodeReport;
|
||||
import org.apache.hadoop.yarn.server.resourcemanager.scheduler.YarnScheduler;
|
||||
import org.apache.hadoop.yarn.server.utils.BuilderUtils;
|
||||
import org.apache.hadoop.yarn.util.resource.ResourceUtils;
|
||||
import org.apache.hadoop.yarn.util.resource.Resources;
|
||||
|
||||
import java.io.IOException;
|
||||
@ -180,6 +181,7 @@ public void registerApplicationMaster(
|
||||
|
||||
response.setSchedulerResourceTypes(getScheduler()
|
||||
.getSchedulingResourceTypes());
|
||||
response.setResourceTypes(ResourceUtils.getResourcesTypeInfo());
|
||||
if (getRmContext().getYarnConfiguration().getBoolean(
|
||||
YarnConfiguration.RM_RESOURCE_PROFILES_ENABLED,
|
||||
YarnConfiguration.DEFAULT_RM_RESOURCE_PROFILES_ENABLED)) {
|
||||
|
Loading…
Reference in New Issue
Block a user