YARN-3361. CapacityScheduler side changes to support non-exclusive node labels. Contributed by Wangda Tan
(cherry picked from commit 0fefda645bca935b87b6bb8ca63e6f18340d59f5)

Jian He, 10 years ago
parent commit 9ebbf1bfce
25 changed files with 1914 additions and 954 deletions
  1. hadoop-yarn-project/CHANGES.txt (+3, -0)
  2. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-common/src/main/java/org/apache/hadoop/yarn/server/utils/BuilderUtils.java (+1, -0)
  3. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/rmapp/attempt/RMAppAttemptImpl.java (+2, -8)
  4. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/AppSchedulingInfo.java (+18, -7)
  5. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceUsage.java (+8, -0)
  6. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/SchedulerApplicationAttempt.java (+39, -5)
  7. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/SchedulerUtils.java (+45, -42)
  8. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/AbstractCSQueue.java (+133, -110)
  9. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CSQueue.java (+4, -1)
  10. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java (+65, -26)
  11. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacitySchedulerConfiguration.java (+5, -0)
  12. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/LeafQueue.java (+206, -162)
  13. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/ParentQueue.java (+37, -22)
  14. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/SchedulingMode.java (+44, -0)
  15. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/Application.java (+4, -0)
  16. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/MockAM.java (+7, -1)
  17. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/MockRM.java (+32, -3)
  18. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestApplicationLimits.java (+4, -4)
  19. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestChildQueueOrder.java (+26, -15)
  20. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestContainerAllocation.java (+7, -383)
  21. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestLeafQueue.java (+74, -74)
  22. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestNodeLabelContainerAllocation.java (+1027, -0)
  23. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestParentQueue.java (+69, -42)
  24. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestReservations.java (+52, -49)
  25. hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestUtils.java (+2, -0)

+ 3 - 0
hadoop-yarn-project/CHANGES.txt

@@ -24,6 +24,9 @@ Release 2.8.0 - UNRELEASED
     YARN-3443. Create a 'ResourceHandler' subsystem to ease addition of support 
     for new resource types on the NM. (Sidharta Seethana via junping_du)
 
+    YARN-3361. CapacityScheduler side changes to support non-exclusive node
+    labels. (Wangda Tan via jianhe)
+
   IMPROVEMENTS
 
     YARN-1880. Cleanup TestApplicationClientProtocolOnHA

+ 1 - 0
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-common/src/main/java/org/apache/hadoop/yarn/server/utils/BuilderUtils.java

@@ -313,6 +313,7 @@ public class BuilderUtils {
     request.setResourceName(r.getResourceName());
     request.setCapability(r.getCapability());
     request.setNumContainers(r.getNumContainers());
+    request.setNodeLabelExpression(r.getNodeLabelExpression());
     return request;
   }
 

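This one-line fix matters because BuilderUtils clones ResourceRequests when forwarding them; without copying the label, a cloned request silently falls back to the default partition. A minimal sketch of a label-preserving copy, assuming only the public ResourceRequest API shown in this patch (the method name is mine):

    // Hedged sketch: clone a ResourceRequest without dropping its label.
    public static ResourceRequest cloneWithLabel(ResourceRequest r) {
      ResourceRequest copy = ResourceRequest.newInstance(
          r.getPriority(), r.getResourceName(), r.getCapability(),
          r.getNumContainers(), r.getRelaxLocality(),
          r.getNodeLabelExpression());   // the field this patch stops losing
      return copy;
    }
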
+ 2 - 8
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/rmapp/attempt/RMAppAttemptImpl.java

@@ -146,7 +146,7 @@ public class RMAppAttemptImpl implements RMAppAttempt, Recoverable {
   private ConcurrentMap<NodeId, List<ContainerStatus>>
       finishedContainersSentToAM =
       new ConcurrentHashMap<NodeId, List<ContainerStatus>>();
-  private Container masterContainer;
+  private volatile Container masterContainer;
 
   private float progress = 0;
   private String host = "N/A";
@@ -762,13 +762,7 @@ public class RMAppAttemptImpl implements RMAppAttempt, Recoverable {
 
   @Override
   public Container getMasterContainer() {
-    this.readLock.lock();
-
-    try {
-      return this.masterContainer;
-    } finally {
-      this.readLock.unlock();
-    }
+    return this.masterContainer;
   }
 
   @InterfaceAudience.Private

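Making masterContainer volatile lets getMasterContainer() drop the read lock: the field is assigned while the attempt's write lock is held, and a volatile read is enough to publish that assignment safely to other threads. A self-contained illustration of the pattern (a hypothetical class, not the RM code):

    // One writer path guarded by a lock, many lock-free readers.
    class SafePublication {
      private volatile Object masterContainer;   // stands in for YARN's Container

      synchronized void set(Object c) {          // writers remain serialized
        this.masterContainer = c;
      }

      Object get() {                             // volatile read: no lock needed
        return masterContainer;
      }
    }
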
+ 18 - 7
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/AppSchedulingInfo.java

@@ -73,10 +73,11 @@ public class AppSchedulingInfo {
   /* Allocated by scheduler */
   boolean pending = true; // for app metrics
   
+  private ResourceUsage appResourceUsage;
  
   public AppSchedulingInfo(ApplicationAttemptId appAttemptId,
       String user, Queue queue, ActiveUsersManager activeUsersManager,
-      long epoch) {
+      long epoch, ResourceUsage appResourceUsage) {
     this.applicationAttemptId = appAttemptId;
     this.applicationId = appAttemptId.getApplicationId();
     this.queue = queue;
@@ -84,6 +85,7 @@ public class AppSchedulingInfo {
     this.user = user;
     this.activeUsersManager = activeUsersManager;
     this.containerIdCounter = new AtomicLong(epoch << EPOCH_BIT_SHIFT);
+    this.appResourceUsage = appResourceUsage;
   }
 
   public ApplicationId getApplicationId() {
@@ -191,13 +193,19 @@ public class AppSchedulingInfo {
             lastRequestCapability);
         
         // update queue:
+        Resource increasedResource = Resources.multiply(request.getCapability(),
+            request.getNumContainers());
         queue.incPendingResource(
             request.getNodeLabelExpression(),
-            Resources.multiply(request.getCapability(),
-                request.getNumContainers()));
+            increasedResource);
+        appResourceUsage.incPending(request.getNodeLabelExpression(), increasedResource);
         if (lastRequest != null) {
+          Resource decreasedResource =
+              Resources.multiply(lastRequestCapability, lastRequestContainers);
           queue.decPendingResource(lastRequest.getNodeLabelExpression(),
-              Resources.multiply(lastRequestCapability, lastRequestContainers));
+              decreasedResource);
+          appResourceUsage.decPending(lastRequest.getNodeLabelExpression(),
+              decreasedResource);
         }
       }
     }
@@ -385,6 +393,8 @@ public class AppSchedulingInfo {
       checkForDeactivation();
     }
     
+    appResourceUsage.decPending(offSwitchRequest.getNodeLabelExpression(),
+        offSwitchRequest.getCapability());
     queue.decPendingResource(offSwitchRequest.getNodeLabelExpression(),
         offSwitchRequest.getCapability());
   }
@@ -492,9 +502,10 @@ public class AppSchedulingInfo {
   }
   
   public ResourceRequest cloneResourceRequest(ResourceRequest request) {
-    ResourceRequest newRequest = ResourceRequest.newInstance(
-        request.getPriority(), request.getResourceName(),
-        request.getCapability(), 1, request.getRelaxLocality());
+    ResourceRequest newRequest =
+        ResourceRequest.newInstance(request.getPriority(),
+            request.getResourceName(), request.getCapability(), 1,
+            request.getRelaxLocality(), request.getNodeLabelExpression());
     return newRequest;
   }
 }

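The net effect of this hunk is that pending resources are now tracked per label at the application level too, mirroring the queue-side bookkeeping: each request update adds capability * numContainers under the new request's label and subtracts the same product under the replaced request's label. A condensed sketch of that rule using the methods visible in this diff (the helper itself is hypothetical):

    // Hypothetical helper condensing the bookkeeping above.
    void trackPending(ResourceUsage appUsage, Queue queue,
        ResourceRequest newReq, ResourceRequest oldReq) {
      Resource inc = Resources.multiply(
          newReq.getCapability(), newReq.getNumContainers());
      queue.incPendingResource(newReq.getNodeLabelExpression(), inc);
      appUsage.incPending(newReq.getNodeLabelExpression(), inc);

      if (oldReq != null) {   // undo what the replaced request contributed
        Resource dec = Resources.multiply(
            oldReq.getCapability(), oldReq.getNumContainers());
        queue.decPendingResource(oldReq.getNodeLabelExpression(), dec);
        appUsage.decPending(oldReq.getNodeLabelExpression(), dec);
      }
    }
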
+ 8 - 0
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceUsage.java

@@ -27,6 +27,7 @@ import java.util.concurrent.locks.ReentrantReadWriteLock.WriteLock;
 
 import org.apache.hadoop.yarn.api.records.Resource;
 import org.apache.hadoop.yarn.nodelabels.CommonNodeLabelsManager;
+import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
 import org.apache.hadoop.yarn.util.resource.Resources;
 
 /**
@@ -250,6 +251,10 @@ public class ResourceUsage {
   }
 
   private Resource _get(String label, ResourceType type) {
+    if (label == null) {
+      label = RMNodeLabelsManager.NO_LABEL;
+    }
+    
     try {
       readLock.lock();
       UsageByLabel usage = usages.get(label);
@@ -263,6 +268,9 @@ public class ResourceUsage {
   }
 
   private UsageByLabel getAndAddIfMissing(String label) {
+    if (label == null) {
+      label = RMNodeLabelsManager.NO_LABEL;
+    }
     if (!usages.containsKey(label)) {
       UsageByLabel u = new UsageByLabel(label);
       usages.put(label, u);

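Normalizing a null label to NO_LABEL means callers can pass a request's raw node label expression straight through; null and the empty default partition now address the same bucket. For example, assuming the incPending/getPending accessors this class already exposes:

    ResourceUsage usage = new ResourceUsage();
    usage.incPending(null, Resources.createResource(1024, 1));

    // Both reads hit the same NO_LABEL bucket after this patch:
    Resource a = usage.getPending(null);
    Resource b = usage.getPending(RMNodeLabelsManager.NO_LABEL);
    assert a.equals(b);
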
+ 39 - 5
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/SchedulerApplicationAttempt.java

@@ -56,6 +56,8 @@ import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainerImpl
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainerReservedEvent;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainerState;
 import org.apache.hadoop.yarn.server.resourcemanager.rmnode.RMNodeCleanContainerEvent;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity.SchedulingMode;
+import org.apache.hadoop.yarn.util.resource.ResourceCalculator;
 import org.apache.hadoop.yarn.util.resource.Resources;
 
 import com.google.common.base.Preconditions;
@@ -108,14 +110,24 @@ public class SchedulerApplicationAttempt {
   private Set<ContainerId> pendingRelease = null;
 
   /**
-   * Count how many times the application has been given an opportunity
-   * to schedule a task at each priority. Each time the scheduler
-   * asks the application for a task at this priority, it is incremented,
-   * and each time the application successfully schedules a task, it
+   * Count how many times the application has been given an opportunity to
+   * schedule a task at each priority. Each time the scheduler asks the
+   * application for a task at this priority, it is incremented, and each time
+   * the application successfully schedules a task (at rack or node local), it
    * is reset to 0.
    */
   Multiset<Priority> schedulingOpportunities = HashMultiset.create();
   
+  /**
+   * Count how many times the application has been given an opportunity to
+   * schedule a non-partitioned resource request at each priority. Each time the
+   * scheduler asks the application for a task at this priority, it is
+   * incremented, and it is reset to 0 each time the application successfully
+   * schedules any task at the corresponding priority.
+   */
+  Multiset<Priority> missedNonPartitionedRequestSchedulingOpportunity =
+      HashMultiset.create();
+  
   // Time of the last container scheduled at the current allowed level
   protected Map<Priority, Long> lastScheduledContainer =
       new HashMap<Priority, Long>();
@@ -132,7 +144,7 @@ public class SchedulerApplicationAttempt {
     this.rmContext = rmContext;
     this.appSchedulingInfo = 
         new AppSchedulingInfo(applicationAttemptId, user, queue,  
-            activeUsersManager, rmContext.getEpoch());
+            activeUsersManager, rmContext.getEpoch(), attemptResourceUsage);
     this.queue = queue;
     this.pendingRelease = new HashSet<ContainerId>();
     this.attemptId = applicationAttemptId;
@@ -489,6 +501,18 @@ public class SchedulerApplicationAttempt {
     return this.appSchedulingInfo.isBlacklisted(resourceName);
   }
 
+  public synchronized int addMissedNonPartitionedRequestSchedulingOpportunity(
+      Priority priority) {
+    missedNonPartitionedRequestSchedulingOpportunity.add(priority);
+    return missedNonPartitionedRequestSchedulingOpportunity.count(priority);
+  }
+
+  public synchronized void
+      resetMissedNonPartitionedRequestSchedulingOpportunity(Priority priority) {
+    missedNonPartitionedRequestSchedulingOpportunity.setCount(priority, 0);
+  }
+
+  
   public synchronized void addSchedulingOpportunity(Priority priority) {
     schedulingOpportunities.setCount(priority,
         schedulingOpportunities.count(priority) + 1);
@@ -518,6 +542,7 @@ public class SchedulerApplicationAttempt {
   public synchronized void resetSchedulingOpportunities(Priority priority) {
     resetSchedulingOpportunities(priority, System.currentTimeMillis());
   }
+
   // used for continuous scheduling
   public synchronized void resetSchedulingOpportunities(Priority priority,
       long currentTimeMs) {
@@ -669,4 +694,13 @@ public class SchedulerApplicationAttempt {
   public Set<String> getBlacklistedNodes() {
     return this.appSchedulingInfo.getBlackListCopy();
   }
+  
+  @Private
+  public boolean hasPendingResourceRequest(ResourceCalculator rc,
+      String nodePartition, Resource cluster,
+      SchedulingMode schedulingMode) {
+    return SchedulerUtils.hasPendingResourceRequest(rc,
+        this.attemptResourceUsage, nodePartition, cluster,
+        schedulingMode);
+  }
 }

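The new counter reuses the Multiset idiom already used for schedulingOpportunities: add() increments the per-priority count, count() reads it, and setCount(p, 0) resets it once something is allocated. A standalone sketch of the idiom (Integer stands in for Priority):

    import com.google.common.collect.HashMultiset;
    import com.google.common.collect.Multiset;

    public class MissedOpportunityDemo {
      public static void main(String[] args) {
        Multiset<Integer> missed = HashMultiset.create();
        missed.add(1);                        // missed one opportunity at priority 1
        System.out.println(missed.count(1));  // 1
        missed.setCount(1, 0);                // reset after a successful allocation
        System.out.println(missed.count(1));  // 0
      }
    }
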
+ 45 - 42
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/SchedulerUtils.java

@@ -37,11 +37,10 @@ import org.apache.hadoop.yarn.factories.RecordFactory;
 import org.apache.hadoop.yarn.factory.providers.RecordFactoryProvider;
 import org.apache.hadoop.yarn.security.AccessType;
 import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity.SchedulingMode;
 import org.apache.hadoop.yarn.util.resource.ResourceCalculator;
 import org.apache.hadoop.yarn.util.resource.Resources;
 
-import com.google.common.collect.Sets;
-
 /**
  * Utilities shared by schedulers. 
  */
@@ -235,9 +234,13 @@ public class SchedulerUtils {
     if (labelExp == null && queueInfo != null
         && ResourceRequest.ANY.equals(resReq.getResourceName())) {
       labelExp = queueInfo.getDefaultNodeLabelExpression();
-      resReq.setNodeLabelExpression(labelExp);
     }
     
+    // If labelExp is still null, set it to NO_LABEL
+    resReq
+        .setNodeLabelExpression(labelExp == null ? RMNodeLabelsManager.NO_LABEL
+            : labelExp);
+    
     // we don't allow specify label expression other than resourceName=ANY now
     if (!ResourceRequest.ANY.equals(resReq.getResourceName())
         && labelExp != null && !labelExp.trim().isEmpty()) {
@@ -273,25 +276,6 @@ public class SchedulerUtils {
     }
   }
   
-  public static boolean checkQueueAccessToNode(Set<String> queueLabels,
-      Set<String> nodeLabels) {
-    // if queue's label is *, it can access any node
-    if (queueLabels != null && queueLabels.contains(RMNodeLabelsManager.ANY)) {
-      return true;
-    }
-    // any queue can access to a node without label
-    if (nodeLabels == null || nodeLabels.isEmpty()) {
-      return true;
-    }
-    // a queue can access to a node only if it contains any label of the node
-    if (queueLabels != null
-        && Sets.intersection(queueLabels, nodeLabels).size() > 0) {
-      return true;
-    }
-    // sorry, you cannot access
-    return false;
-  }
-  
   public static void checkIfLabelInClusterNodeLabels(RMNodeLabelsManager mgr,
       Set<String> labels) throws IOException {
     if (mgr == null) {
@@ -311,26 +295,6 @@ public class SchedulerUtils {
       }
     }
   }
-  
-  public static boolean checkNodeLabelExpression(Set<String> nodeLabels,
-      String labelExpression) {
-    // empty label expression can only allocate on node with empty labels
-    if (labelExpression == null || labelExpression.trim().isEmpty()) {
-      if (!nodeLabels.isEmpty()) {
-        return false;
-      }
-    }
-
-    if (labelExpression != null) {
-      for (String str : labelExpression.split("&&")) {
-        if (!str.trim().isEmpty()
-            && (nodeLabels == null || !nodeLabels.contains(str.trim()))) {
-          return false;
-        }
-      }
-    }
-    return true;
-  }
 
   public static boolean checkQueueLabelExpression(Set<String> queueLabels,
       String labelExpression) {
@@ -360,4 +324,43 @@ public class SchedulerUtils {
     }
     return null;
   }
+  
+  public static boolean checkResourceRequestMatchingNodePartition(
+      ResourceRequest offswitchResourceRequest, String nodePartition,
+      SchedulingMode schedulingMode) {
+    // We will only look at the partition chosen below (nodePartitionToLookAt),
+    // which depends on the schedulingMode and the node's partition.
+    String nodePartitionToLookAt = null;
+    if (schedulingMode == SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY) {
+      nodePartitionToLookAt = nodePartition;
+    } else {
+      nodePartitionToLookAt = RMNodeLabelsManager.NO_LABEL;
+    }
+    
+    String askedNodePartition = offswitchResourceRequest.getNodeLabelExpression();
+    if (null == askedNodePartition) {
+      askedNodePartition = RMNodeLabelsManager.NO_LABEL;
+    }
+    return askedNodePartition.equals(nodePartitionToLookAt);
+  }
+  
+  private static boolean hasPendingResourceRequest(ResourceCalculator rc,
+      ResourceUsage usage, String partitionToLookAt, Resource cluster) {
+    if (Resources.greaterThan(rc, cluster,
+        usage.getPending(partitionToLookAt), Resources.none())) {
+      return true;
+    }
+    return false;
+  }
+
+  @Private
+  public static boolean hasPendingResourceRequest(ResourceCalculator rc,
+      ResourceUsage usage, String nodePartition, Resource cluster,
+      SchedulingMode schedulingMode) {
+    String partitionToLookAt = nodePartition;
+    if (schedulingMode == SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY) {
+      partitionToLookAt = RMNodeLabelsManager.NO_LABEL;
+    }
+    return hasPendingResourceRequest(rc, usage, partitionToLookAt, cluster);
+  }
 }

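checkResourceRequestMatchingNodePartition encodes the routing rule for the two modes: under RESPECT_PARTITION_EXCLUSIVITY the request's label must equal the node's partition, while under IGNORE_PARTITION_EXCLUSIVITY only default-partition (empty-label) requests match, so they can borrow idle labeled nodes. A hedged usage sketch with illustrative values:

    // An ANY request carrying the default (empty) label expression:
    ResourceRequest any = ResourceRequest.newInstance(
        Priority.newInstance(1), ResourceRequest.ANY,
        Resources.createResource(1024, 1), 1, true,
        RMNodeLabelsManager.NO_LABEL);

    // Evaluated against a node in partition "x":
    SchedulerUtils.checkResourceRequestMatchingNodePartition(
        any, "x", SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);   // -> false
    SchedulerUtils.checkResourceRequestMatchingNodePartition(
        any, "x", SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY);    // -> true
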
+ 133 - 110
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/AbstractCSQueue.java

@@ -20,7 +20,6 @@ package org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity;
 
 import java.io.IOException;
 import java.util.HashMap;
-import java.util.HashSet;
 import java.util.Map;
 import java.util.Set;
 
@@ -38,12 +37,12 @@ import org.apache.hadoop.yarn.api.records.Resource;
 import org.apache.hadoop.yarn.conf.YarnConfiguration;
 import org.apache.hadoop.yarn.factories.RecordFactory;
 import org.apache.hadoop.yarn.factory.providers.RecordFactoryProvider;
-import org.apache.hadoop.yarn.nodelabels.CommonNodeLabelsManager;
 import org.apache.hadoop.yarn.security.AccessType;
 import org.apache.hadoop.yarn.security.PrivilegedEntity;
 import org.apache.hadoop.yarn.security.PrivilegedEntity.EntityType;
 import org.apache.hadoop.yarn.security.YarnAuthorizationProvider;
 import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.NodeType;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.QueueMetrics;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceLimits;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceUsage;
@@ -56,6 +55,11 @@ import com.google.common.collect.Sets;
 public abstract class AbstractCSQueue implements CSQueue {
   private static final Log LOG = LogFactory.getLog(AbstractCSQueue.class);
   
+  static final CSAssignment NULL_ASSIGNMENT =
+      new CSAssignment(Resources.createResource(0, 0), NodeType.NODE_LOCAL);
+  
+  static final CSAssignment SKIP_ASSIGNMENT = new CSAssignment(true);
+  
   CSQueue parent;
   final String queueName;
   volatile int numContainers;
@@ -343,16 +347,8 @@ public abstract class AbstractCSQueue implements CSQueue {
   }
   
   synchronized void allocateResource(Resource clusterResource, 
-      Resource resource, Set<String> nodeLabels) {
-    
-    // Update usedResources by labels
-    if (nodeLabels == null || nodeLabels.isEmpty()) {
-      queueUsage.incUsed(resource);
-    } else {
-      for (String label : Sets.intersection(accessibleLabels, nodeLabels)) {
-        queueUsage.incUsed(label, resource);
-      }
-    }
+      Resource resource, String nodePartition) {
+    queueUsage.incUsed(nodePartition, resource);
 
     ++numContainers;
     CSQueueUtils.updateQueueStatistics(resourceCalculator, this, getParent(),
@@ -360,15 +356,8 @@ public abstract class AbstractCSQueue implements CSQueue {
   }
   
   protected synchronized void releaseResource(Resource clusterResource,
-      Resource resource, Set<String> nodeLabels) {
-    // Update usedResources by labels
-    if (null == nodeLabels || nodeLabels.isEmpty()) {
-      queueUsage.decUsed(resource);
-    } else {
-      for (String label : Sets.intersection(accessibleLabels, nodeLabels)) {
-        queueUsage.decUsed(label, resource);
-      }
-    }
+      Resource resource, String nodePartition) {
+    queueUsage.decUsed(nodePartition, resource);
 
     CSQueueUtils.updateQueueStatistics(resourceCalculator, this, getParent(),
         clusterResource, minimumAllocation);
@@ -434,103 +423,108 @@ public abstract class AbstractCSQueue implements CSQueue {
                                         parentQ.getPreemptionDisabled());
   }
   
-  private Resource getCurrentLimitResource(String nodeLabel,
-      Resource clusterResource, ResourceLimits currentResourceLimits) {
-    /*
-     * Current limit resource: For labeled resource: limit = queue-max-resource
-     * (TODO, this part need update when we support labeled-limit) For
-     * non-labeled resource: limit = min(queue-max-resource,
-     * limit-set-by-parent)
-     */
-    Resource queueMaxResource =
-        Resources.multiplyAndNormalizeDown(resourceCalculator,
-            labelManager.getResourceByLabel(nodeLabel, clusterResource),
-            queueCapacities.getAbsoluteMaximumCapacity(nodeLabel), minimumAllocation);
-    if (nodeLabel.equals(RMNodeLabelsManager.NO_LABEL)) {
-      return Resources.min(resourceCalculator, clusterResource,
-          queueMaxResource, currentResourceLimits.getLimit());
+  private Resource getCurrentLimitResource(String nodePartition,
+      Resource clusterResource, ResourceLimits currentResourceLimits,
+      SchedulingMode schedulingMode) {
+    if (schedulingMode == SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY) {
+      /*
+       * Current limit resource: For labeled resource: limit = queue-max-resource
+       * (TODO, this part need update when we support labeled-limit) For
+       * non-labeled resource: limit = min(queue-max-resource,
+       * limit-set-by-parent)
+       */
+      Resource queueMaxResource =
+          Resources.multiplyAndNormalizeDown(resourceCalculator,
+              labelManager.getResourceByLabel(nodePartition, clusterResource),
+              queueCapacities.getAbsoluteMaximumCapacity(nodePartition), minimumAllocation);
+      if (nodePartition.equals(RMNodeLabelsManager.NO_LABEL)) {
+        return Resources.min(resourceCalculator, clusterResource,
+            queueMaxResource, currentResourceLimits.getLimit());
+      }
+      return queueMaxResource;  
+    } else if (schedulingMode == SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY) {
+      // When doing non-exclusive resource allocation, the maximum capacity of
+      // every queue on this label equals the total resource with the label.
+      return labelManager.getResourceByLabel(nodePartition, clusterResource);
     }
-    return queueMaxResource;
+    
+    return Resources.none();
   }
   
   synchronized boolean canAssignToThisQueue(Resource clusterResource,
-      Set<String> nodeLabels, ResourceLimits currentResourceLimits,
-      Resource nowRequired, Resource resourceCouldBeUnreserved) {
-    // Get label of this queue can access, it's (nodeLabel AND queueLabel)
-    Set<String> labelCanAccess;
-    if (null == nodeLabels || nodeLabels.isEmpty()) {
-      labelCanAccess = new HashSet<String>();
-      // Any queue can always access any node without label
-      labelCanAccess.add(RMNodeLabelsManager.NO_LABEL);
-    } else {
-      labelCanAccess = new HashSet<String>(
-          accessibleLabels.contains(CommonNodeLabelsManager.ANY) ? nodeLabels
-              : Sets.intersection(accessibleLabels, nodeLabels));
-    }
-    
-    for (String label : labelCanAccess) {
-      // New total resource = used + required
-      Resource newTotalResource =
-          Resources.add(queueUsage.getUsed(label), nowRequired);
-
-      Resource currentLimitResource =
-          getCurrentLimitResource(label, clusterResource, currentResourceLimits);
-
-      // if reservation continous looking enabled, check to see if could we
-      // potentially use this node instead of a reserved node if the application
-      // has reserved containers.
-      // TODO, now only consider reservation cases when the node has no label
-      if (this.reservationsContinueLooking
-          && label.equals(RMNodeLabelsManager.NO_LABEL)
-          && Resources.greaterThan(resourceCalculator, clusterResource,
-              resourceCouldBeUnreserved, Resources.none())) {
-        // resource-without-reserved = used - reserved
-        Resource newTotalWithoutReservedResource =
-            Resources.subtract(newTotalResource, resourceCouldBeUnreserved);
-        
-        // when total-used-without-reserved-resource < currentLimit, we still
-        // have chance to allocate on this node by unreserving some containers
-        if (Resources.lessThan(resourceCalculator, clusterResource,
-            newTotalWithoutReservedResource, currentLimitResource)) {
-          if (LOG.isDebugEnabled()) {
-            LOG.debug("try to use reserved: " + getQueueName()
-                + " usedResources: " + queueUsage.getUsed()
-                + ", clusterResources: " + clusterResource
-                + ", reservedResources: " + resourceCouldBeUnreserved
-                + ", capacity-without-reserved: "
-                + newTotalWithoutReservedResource + ", maxLimitCapacity: "
-                + currentLimitResource); 
-          }
-          return true;
+      String nodePartition, ResourceLimits currentResourceLimits,
+      Resource nowRequired, Resource resourceCouldBeUnreserved,
+      SchedulingMode schedulingMode) {
+    // New total resource = used + required
+    Resource newTotalResource =
+        Resources.add(queueUsage.getUsed(nodePartition), nowRequired);
+
+    // Get the current limit resource:
+    // - When doing RESPECT_PARTITION_EXCLUSIVITY allocation, we respect the
+    // queue's max capacity.
+    // - When doing IGNORE_PARTITION_EXCLUSIVITY allocation, we do not respect
+    // the queue's max capacity; the queue's max capacity on the partition is
+    // treated as 100%, i.e. the queue may use all resources in the
+    // partition.
+    // We do this because non-exclusive allocation only happens when there is
+    // idle resource on the partition; to avoid wastage, such resource is
+    // leveraged as much as possible, and the preemption policy reclaims it
+    // when a partitioned-resource-request comes back.
+    Resource currentLimitResource =
+        getCurrentLimitResource(nodePartition, clusterResource,
+            currentResourceLimits, schedulingMode);
+
+    // If reservation continuous-looking is enabled, check whether we could
+    // potentially use this node instead of a reserved node if the application
+    // has reserved containers.
+    // TODO: for now, only consider reservation cases when the node has no label
+    if (this.reservationsContinueLooking
+        && nodePartition.equals(RMNodeLabelsManager.NO_LABEL)
+        && Resources.greaterThan(resourceCalculator, clusterResource,
+            resourceCouldBeUnreserved, Resources.none())) {
+      // resource-without-reserved = used - reserved
+      Resource newTotalWithoutReservedResource =
+          Resources.subtract(newTotalResource, resourceCouldBeUnreserved);
+
+      // when total-used-without-reserved-resource < currentLimit, we still
+      // have chance to allocate on this node by unreserving some containers
+      if (Resources.lessThan(resourceCalculator, clusterResource,
+          newTotalWithoutReservedResource, currentLimitResource)) {
+        if (LOG.isDebugEnabled()) {
+          LOG.debug("try to use reserved: " + getQueueName()
+              + " usedResources: " + queueUsage.getUsed()
+              + ", clusterResources: " + clusterResource
+              + ", reservedResources: " + resourceCouldBeUnreserved
+              + ", capacity-without-reserved: "
+              + newTotalWithoutReservedResource + ", maxLimitCapacity: "
+              + currentLimitResource);
         }
+        return true;
       }
-      
-      // Otherwise, if any of the label of this node beyond queue limit, we
-      // cannot allocate on this node. Consider a small epsilon here.
-      if (Resources.greaterThan(resourceCalculator, clusterResource,
-          newTotalResource, currentLimitResource)) {
-        return false;
-      }
+    }
 
-      if (LOG.isDebugEnabled()) {
-        LOG.debug(getQueueName()
-            + "Check assign to queue, label=" + label
-            + " usedResources: " + queueUsage.getUsed(label)
-            + " clusterResources: " + clusterResource
-            + " currentUsedCapacity "
-            + Resources.divide(resourceCalculator, clusterResource,
-                queueUsage.getUsed(label),
-                labelManager.getResourceByLabel(label, clusterResource))
-            + " max-capacity: "
-            + queueCapacities.getAbsoluteMaximumCapacity(label)
-            + ")");
-      }
-      return true;
+    // Check if we exceed the computed current-resource-limit.
+    if (Resources.greaterThan(resourceCalculator, clusterResource,
+        newTotalResource, currentLimitResource)) {
+      return false;
     }
-    
-    // Actually, this will not happen, since labelCanAccess will be always
-    // non-empty
-    return false;
+
+    if (LOG.isDebugEnabled()) {
+      LOG.debug(getQueueName()
+          + "Check assign to queue, nodePartition="
+          + nodePartition
+          + " usedResources: "
+          + queueUsage.getUsed(nodePartition)
+          + " clusterResources: "
+          + clusterResource
+          + " currentUsedCapacity "
+          + Resources.divide(resourceCalculator, clusterResource,
+              queueUsage.getUsed(nodePartition),
+              labelManager.getResourceByLabel(nodePartition, clusterResource))
+          + " max-capacity: "
+          + queueCapacities.getAbsoluteMaximumCapacity(nodePartition) + ")");
+    }
+    return true;
   }
   
   @Override
@@ -556,4 +550,33 @@ public abstract class AbstractCSQueue implements CSQueue {
       parent.decPendingResource(nodeLabel, resourceToDec);
     }
   }
+  
+  /**
+   * Return whether the queue has pending resource for the given nodePartition
+   * and schedulingMode.
+   */
+  boolean hasPendingResourceRequest(String nodePartition, 
+      Resource cluster, SchedulingMode schedulingMode) {
+    return SchedulerUtils.hasPendingResourceRequest(resourceCalculator,
+        queueUsage, nodePartition, cluster, schedulingMode);
+  }
+  
+  boolean accessibleToPartition(String nodePartition) {
+    // if queue's label is *, it can access any node
+    if (accessibleLabels != null
+        && accessibleLabels.contains(RMNodeLabelsManager.ANY)) {
+      return true;
+    }
+    // any queue can access a node without a label
+    if (nodePartition == null
+        || nodePartition.equals(RMNodeLabelsManager.NO_LABEL)) {
+      return true;
+    }
+    // a queue can access a node only if its accessible labels contain the node's partition
+    if (accessibleLabels != null && accessibleLabels.contains(nodePartition)) {
+      return true;
+    }
+    // sorry, you cannot access
+    return false;
+  }
 }

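accessibleToPartition is the single-partition replacement for the deleted checkQueueAccessToNode: ANY opens every partition, the default partition is open to every queue, and otherwise the partition must appear in the queue's accessible labels. Expected outcomes, sketched for a queue configured with accessible-node-labels = x:

    // Illustrative only; accessibleToPartition is package-private in the patch.
    queue.accessibleToPartition("");    // true  - default partition, open to all
    queue.accessibleToPartition("x");   // true  - explicitly accessible
    queue.accessibleToPartition("y");   // false - not in the accessible set
    // With accessible-node-labels = *, all of the above return true.
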
+ 4 - 1
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CSQueue.java

@@ -190,10 +190,13 @@ extends org.apache.hadoop.yarn.server.resourcemanager.scheduler.Queue {
    * @param clusterResource the resource of the cluster.
    * @param node node on which resources are available
    * @param resourceLimits how much overall resource of this queue can use. 
+   * @param schedulingMode Type of exclusive check when assign container on a 
+   * NodeManager, see {@link SchedulingMode}.
    * @return the assignment
    */
   public CSAssignment assignContainers(Resource clusterResource,
-      FiCaSchedulerNode node, ResourceLimits resourceLimits);
+      FiCaSchedulerNode node, ResourceLimits resourceLimits,
+      SchedulingMode schedulingMode);
   
   /**
    * A container assigned to the queue has completed.

+ 65 - 26
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java

@@ -35,6 +35,7 @@ import java.util.concurrent.ConcurrentHashMap;
 import java.util.concurrent.atomic.AtomicBoolean;
 import java.util.concurrent.atomic.AtomicInteger;
 
+import org.apache.commons.lang.StringUtils;
 import org.apache.commons.logging.Log;
 import org.apache.commons.logging.LogFactory;
 import org.apache.hadoop.classification.InterfaceAudience.LimitedPrivate;
@@ -1114,28 +1115,30 @@ public class CapacityScheduler extends
     if (reservedContainer != null) {
       FiCaSchedulerApp reservedApplication =
           getCurrentAttemptForContainer(reservedContainer.getContainerId());
-      
+
       // Try to fulfill the reservation
-      LOG.info("Trying to fulfill reservation for application " + 
-          reservedApplication.getApplicationId() + " on node: " + 
-          node.getNodeID());
-      
-      LeafQueue queue = ((LeafQueue)reservedApplication.getQueue());
-      assignment = queue.assignContainers(
+      LOG.info("Trying to fulfill reservation for application "
+          + reservedApplication.getApplicationId() + " on node: "
+          + node.getNodeID());
+
+      LeafQueue queue = ((LeafQueue) reservedApplication.getQueue());
+      assignment =
+          queue.assignContainers(
               clusterResource,
               node,
               // TODO, now we only consider limits for parent for non-labeled
               // resources, should consider labeled resources as well.
               new ResourceLimits(labelManager.getResourceByLabel(
-                  RMNodeLabelsManager.NO_LABEL, clusterResource)));
+                  RMNodeLabelsManager.NO_LABEL, clusterResource)),
+              SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
       if (assignment.isFulfilledReservation()) {
         CSAssignment tmp =
             new CSAssignment(reservedContainer.getReservedResource(),
-              assignment.getType());
+                assignment.getType());
         Resources.addTo(assignment.getAssignmentInformation().getAllocated(),
-          reservedContainer.getReservedResource());
+            reservedContainer.getReservedResource());
         tmp.getAssignmentInformation().addAllocationDetails(
-          reservedContainer.getContainerId(), queue.getQueuePath());
+            reservedContainer.getContainerId(), queue.getQueuePath());
         tmp.getAssignmentInformation().incrAllocations();
         updateSchedulerHealth(lastNodeUpdateTime, node, tmp);
         schedulerHealth.updateSchedulerFulfilledReservationCounts(1);
@@ -1143,16 +1146,13 @@ public class CapacityScheduler extends
 
       RMContainer excessReservation = assignment.getExcessReservation();
       if (excessReservation != null) {
-      Container container = excessReservation.getContainer();
-      queue.completedContainer(
-          clusterResource, assignment.getApplication(), node, 
-          excessReservation, 
-          SchedulerUtils.createAbnormalContainerStatus(
-              container.getId(), 
-              SchedulerUtils.UNRESERVED_CONTAINER), 
-          RMContainerEventType.RELEASED, null, true);
+        Container container = excessReservation.getContainer();
+        queue.completedContainer(clusterResource, assignment.getApplication(),
+            node, excessReservation, SchedulerUtils
+                .createAbnormalContainerStatus(container.getId(),
+                    SchedulerUtils.UNRESERVED_CONTAINER),
+            RMContainerEventType.RELEASED, null, true);
       }
-
     }
 
     // Try to schedule more if there are no reservations to fulfill
@@ -1163,22 +1163,61 @@ public class CapacityScheduler extends
           LOG.debug("Trying to schedule on node: " + node.getNodeName() +
               ", available: " + node.getAvailableResource());
         }
+
         assignment = root.assignContainers(
             clusterResource,
             node,
             // TODO, now we only consider limits for parent for non-labeled
             // resources, should consider labeled resources as well.
             new ResourceLimits(labelManager.getResourceByLabel(
-                RMNodeLabelsManager.NO_LABEL, clusterResource)));
+                RMNodeLabelsManager.NO_LABEL, clusterResource)),
+            SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
+        if (Resources.greaterThan(calculator, clusterResource,
+            assignment.getResource(), Resources.none())) {
+          updateSchedulerHealth(lastNodeUpdateTime, node, assignment);
+          return;
+        }
+        
+        // Only do non-exclusive allocation when the node has node labels.
+        if (StringUtils.equals(node.getPartition(),
+            RMNodeLabelsManager.NO_LABEL)) {
+          return;
+        }
+        
+        // Only do non-exclusive allocation when the node label is non-exclusive
+        try {
+          if (rmContext.getNodeLabelManager().isExclusiveNodeLabel(
+              node.getPartition())) {
+            return;
+          }
+        } catch (IOException e) {
+          LOG.warn("Exception when trying to get exclusivity of node label="
+              + node.getPartition(), e);
+          return;
+        }
+        
+        // Try to use NON_EXCLUSIVE
+        assignment = root.assignContainers(
+            clusterResource,
+            node,
+            // TODO, now we only consider limits for parent for non-labeled
+            // resources, should consider labeled resources as well.
+            new ResourceLimits(labelManager.getResourceByLabel(
+                RMNodeLabelsManager.NO_LABEL, clusterResource)),
+            SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY);
         updateSchedulerHealth(lastNodeUpdateTime, node, assignment);
+        if (Resources.greaterThan(calculator, clusterResource,
+            assignment.getResource(), Resources.none())) {
+          return;
+        }
       }
     } else {
-      LOG.info("Skipping scheduling since node " + node.getNodeID() + 
-          " is reserved by application " + 
-          node.getReservedContainer().getContainerId().getApplicationAttemptId()
-          );
+      LOG.info("Skipping scheduling since node "
+          + node.getNodeID()
+          + " is reserved by application "
+          + node.getReservedContainer().getContainerId()
+              .getApplicationAttemptId());
     }
-  
   }
 
   @Override

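allocateContainersToNode now takes up to two passes over the queue tree: an exclusive pass first, then, only when nothing was allocated and the node's partition is marked non-exclusive, a second pass that lets unlabeled requests use the idle labeled node. A condensed control-flow sketch of the logic above (the helper isNonZero is hypothetical; IOException handling elided):

    CSAssignment a = root.assignContainers(clusterResource, node, limits,
        SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
    if (isNonZero(a.getResource())) {
      return;                                    // exclusive pass allocated something
    }
    if (node.getPartition().equals(RMNodeLabelsManager.NO_LABEL)) {
      return;                                    // default partition: nothing to borrow
    }
    if (labelManager.isExclusiveNodeLabel(node.getPartition())) {
      return;                                    // exclusive label: no sharing allowed
    }
    // Second chance: unlabeled requests may borrow the idle labeled node.
    root.assignContainers(clusterResource, node, limits,
        SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY);
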
+ 5 - 0
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacitySchedulerConfiguration.java

@@ -319,6 +319,11 @@ public class CapacitySchedulerConfiguration extends ReservationSchedulerConfigur
     		getMaximumApplicationMasterResourcePercent());
   }
   
+  public void setMaximumApplicationMasterResourcePerQueuePercent(String queue,
+      float percent) {
+    setFloat(getQueuePrefix(queue) + MAXIMUM_AM_RESOURCE_SUFFIX, percent);
+  }
+  
   public float getNonLabeledQueueCapacity(String queue) {
     float capacity = queue.equals("root") ? 100.0f : getFloat(
         getQueuePrefix(queue) + CAPACITY, UNDEFINED);

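The new per-queue setter mirrors the existing getter and is mainly for tests that need to tighten a queue's AM-resource share. Assuming the standard capacity-scheduler property naming, this writes yarn.scheduler.capacity.<queue>.maximum-am-resource-percent:

    CapacitySchedulerConfiguration conf = new CapacitySchedulerConfiguration();
    // Let AM containers use at most 50% of root.a's resources:
    conf.setMaximumApplicationMasterResourcePerQueuePercent("root.a", 0.5f);
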
+ 206 - 162
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/LeafQueue.java

@@ -24,7 +24,6 @@ import java.util.Collection;
 import java.util.Collections;
 import java.util.Comparator;
 import java.util.HashMap;
-import java.util.HashSet;
 import java.util.Iterator;
 import java.util.List;
 import java.util.Map;
@@ -58,6 +57,7 @@ import org.apache.hadoop.yarn.factory.providers.RecordFactoryProvider;
 import org.apache.hadoop.yarn.nodelabels.CommonNodeLabelsManager;
 import org.apache.hadoop.yarn.security.AccessType;
 import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
+import org.apache.hadoop.yarn.server.resourcemanager.rmapp.attempt.RMAppAttempt;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainer;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainerEventType;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainerState;
@@ -718,39 +718,11 @@ public class LeafQueue extends AbstractCSQueue {
       ApplicationAttemptId applicationAttemptId) {
     return applicationAttemptMap.get(applicationAttemptId);
   }
-
-  private static final CSAssignment NULL_ASSIGNMENT =
-      new CSAssignment(Resources.createResource(0, 0), NodeType.NODE_LOCAL);
-  
-  private static final CSAssignment SKIP_ASSIGNMENT = new CSAssignment(true);
-  
-  private static Set<String> getRequestLabelSetByExpression(
-      String labelExpression) {
-    Set<String> labels = new HashSet<String>();
-    if (null == labelExpression) {
-      return labels;
-    }
-    for (String l : labelExpression.split("&&")) {
-      if (l.trim().isEmpty()) {
-        continue;
-      }
-      labels.add(l.trim());
-    }
-    return labels;
-  }
-  
-  private boolean checkResourceRequestMatchingNodeLabel(ResourceRequest offswitchResourceRequest,
-      FiCaSchedulerNode node) {
-    String askedNodeLabel = offswitchResourceRequest.getNodeLabelExpression();
-    if (null == askedNodeLabel) {
-      askedNodeLabel = RMNodeLabelsManager.NO_LABEL;
-    }
-    return askedNodeLabel.equals(node.getPartition());
-  }
   
   @Override
   public synchronized CSAssignment assignContainers(Resource clusterResource,
-      FiCaSchedulerNode node, ResourceLimits currentResourceLimits) {
+      FiCaSchedulerNode node, ResourceLimits currentResourceLimits,
+      SchedulingMode schedulingMode) {
     updateCurrentResourceLimits(currentResourceLimits, clusterResource);
     
     if(LOG.isDebugEnabled()) {
@@ -758,12 +730,6 @@ public class LeafQueue extends AbstractCSQueue {
         + " #applications=" + activeApplications.size());
     }
     
-    // if our queue cannot access this node, just return
-    if (!SchedulerUtils.checkQueueAccessToNode(accessibleLabels,
-        node.getLabels())) {
-      return NULL_ASSIGNMENT;
-    }
-    
     // Check for reserved resources
     RMContainer reservedContainer = node.getReservedContainer();
     if (reservedContainer != null) {
@@ -771,8 +737,26 @@ public class LeafQueue extends AbstractCSQueue {
           getApplication(reservedContainer.getApplicationAttemptId());
       synchronized (application) {
         return assignReservedContainer(application, node, reservedContainer,
-            clusterResource);
+            clusterResource, schedulingMode);
+      }
+    }
+    
+    // if our queue cannot access this node, just return
+    if (schedulingMode == SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY
+        && !accessibleToPartition(node.getPartition())) {
+      return NULL_ASSIGNMENT;
+    }
+    
+    // Check if this queue needs more resources; simply skip allocation if it
+    // doesn't.
+    if (!hasPendingResourceRequest(node.getPartition(),
+        clusterResource, schedulingMode)) {
+      if (LOG.isDebugEnabled()) {
+        LOG.debug("Skip this queue=" + getQueuePath()
+            + ", because it doesn't need more resource, schedulingMode="
+            + schedulingMode.name() + " node-partition=" + node.getPartition());
       }
+      return NULL_ASSIGNMENT;
     }
     
     // Try to assign containers to applications in order
@@ -783,6 +767,17 @@ public class LeafQueue extends AbstractCSQueue {
         + application.getApplicationId());
         application.showRequests();
       }
+      
+      // Check if the application needs more resources; skip it if not.
+      if (!application.hasPendingResourceRequest(resourceCalculator,
+          node.getPartition(), clusterResource, schedulingMode)) {
+        if (LOG.isDebugEnabled()) {
+          LOG.debug("Skip app_attempt=" + application.getApplicationAttemptId()
+              + ", because it doesn't need more resource, schedulingMode="
+              + schedulingMode.name() + " node-label=" + node.getPartition());
+        }
+        continue;
+      }
 
       synchronized (application) {
         // Check if this resource is on the blacklist
@@ -806,10 +801,27 @@ public class LeafQueue extends AbstractCSQueue {
             continue;
           }
           
+          // AM container allocation doesn't support non-exclusive allocation,
+          // to avoid the pain of preempting an AM container
+          if (schedulingMode == SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY) {
+            RMAppAttempt rmAppAttempt =
+                csContext.getRMContext().getRMApps()
+                    .get(application.getApplicationId()).getCurrentAppAttempt();
+            if (null == rmAppAttempt.getMasterContainer()) {
+              if (LOG.isDebugEnabled()) {
+                LOG.debug("Skip allocating AM container to app_attempt="
+                    + application.getApplicationAttemptId()
+                    + ", allocating an AM container in non-exclusive mode is not allowed");
+              }
+              break;
+            }
+          }
+          
           // Is the node-label-expression of this offswitch resource request
           // matches the node's label?
           // If not match, jump to next priority.
-          if (!checkResourceRequestMatchingNodeLabel(anyRequest, node)) {
+          if (!SchedulerUtils.checkResourceRequestMatchingNodePartition(
+              anyRequest, node.getPartition(), schedulingMode)) {
             continue;
           }
           
@@ -822,10 +834,6 @@ public class LeafQueue extends AbstractCSQueue {
             }
           }
           
-          Set<String> requestedNodeLabels =
-              getRequestLabelSetByExpression(anyRequest
-                  .getNodeLabelExpression());
-
           // Compute user-limit & set headroom
           // Note: We compute both user-limit & headroom with the highest 
           //       priority request as the target. 
@@ -833,27 +841,61 @@ public class LeafQueue extends AbstractCSQueue {
           //       before all higher priority ones are serviced.
           Resource userLimit = 
               computeUserLimitAndSetHeadroom(application, clusterResource, 
-                  required, requestedNodeLabels);          
+                  required, node.getPartition(), schedulingMode);          
           
           // Check queue max-capacity limit
-          if (!super.canAssignToThisQueue(clusterResource, node.getLabels(),
-              this.currentResourceLimits, required, application.getCurrentReservation())) {
+          if (!super.canAssignToThisQueue(clusterResource, node.getPartition(),
+              this.currentResourceLimits, required,
+              application.getCurrentReservation(), schedulingMode)) {
             return NULL_ASSIGNMENT;
           }
 
           // Check user limit
           if (!canAssignToUser(clusterResource, application.getUser(), userLimit,
-              application, true, requestedNodeLabels)) {
+              application, true, node.getPartition())) {
             break;
           }
 
           // Inform the application it is about to get a scheduling opportunity
           application.addSchedulingOpportunity(priority);
           
+          // Increase missed-non-partitioned-resource-request-opportunity.
+          // This makes sure a non-partitioned resource request is
+          // preferentially allocated to non-partitioned nodes
+          int missedNonPartitionedRequestSchedulingOpportunity = 0;
+          if (anyRequest.getNodeLabelExpression().equals(
+              RMNodeLabelsManager.NO_LABEL)) {
+            missedNonPartitionedRequestSchedulingOpportunity =
+                application
+                    .addMissedNonPartitionedRequestSchedulingOpportunity(priority);
+          }
+          
+          if (schedulingMode == SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY) {
+            // Before doing allocation, check the scheduling opportunity to
+            // make sure a non-partitioned resource request is scheduled to
+            // the non-partitioned partition first.
+            if (missedNonPartitionedRequestSchedulingOpportunity < scheduler
+                .getNumClusterNodes()) {
+              if (LOG.isDebugEnabled()) {
+                LOG.debug("Skip app_attempt="
+                    + application.getApplicationAttemptId()
+                    + " priority="
+                    + priority
+                    + " because missed-non-partitioned-resource-request"
+                    + " opportunity under required:"
+                    + " Now=" + missedNonPartitionedRequestSchedulingOpportunity
+                    + " required="
+                    + scheduler.getNumClusterNodes());
+              }
+
+              break;
+            }
+          }
+          
           // Try to schedule
           CSAssignment assignment =  
             assignContainersOnNode(clusterResource, node, application, priority, 
-                null);
+                null, schedulingMode);
 
           // Did the application skip this node?
           if (assignment.getSkipped()) {
@@ -870,9 +912,9 @@ public class LeafQueue extends AbstractCSQueue {
             // Book-keeping 
             // Note: Update headroom to account for current allocation too...
             allocateResource(clusterResource, application, assigned,
-                node.getLabels());
+                node.getPartition());
             
-            // Don't reset scheduling opportunities for non-local assignments
+            // Don't reset scheduling opportunities for offswitch assignments
             // otherwise the app will be delayed for each non-local assignment.
             // This helps apps with many off-cluster requests schedule faster.
             if (assignment.getType() != NodeType.OFF_SWITCH) {
@@ -881,6 +923,10 @@ public class LeafQueue extends AbstractCSQueue {
               }
               application.resetSchedulingOpportunities(priority);
             }
+            // Non-exclusive scheduling opportunity is different: we need to
+            // reset it every time to make sure a non-labeled resource request
+            // is most likely allocated on non-labeled nodes first.
+            application.resetMissedNonPartitionedRequestSchedulingOpportunity(priority);
             
             // Done
             return assignment;
@@ -904,7 +950,8 @@ public class LeafQueue extends AbstractCSQueue {
 
   private synchronized CSAssignment assignReservedContainer(
       FiCaSchedulerApp application, FiCaSchedulerNode node,
-      RMContainer rmContainer, Resource clusterResource) {
+      RMContainer rmContainer, Resource clusterResource,
+      SchedulingMode schedulingMode) {
     // Do we still need this reservation?
     Priority priority = rmContainer.getReservedPriority();
     if (application.getTotalRequiredResources(priority) == 0) {
@@ -915,7 +962,7 @@ public class LeafQueue extends AbstractCSQueue {
     // Try to assign if we have sufficient resources
     CSAssignment tmp =
         assignContainersOnNode(clusterResource, node, application, priority,
-          rmContainer);
+          rmContainer, schedulingMode);
     
     // Doesn't matter... since it's already charged for at time of reservation
     // "re-reservation" is *free*
@@ -929,7 +976,8 @@ public class LeafQueue extends AbstractCSQueue {
   protected Resource getHeadroom(User user, Resource queueCurrentLimit,
       Resource clusterResource, FiCaSchedulerApp application, Resource required) {
     return getHeadroom(user, queueCurrentLimit, clusterResource,
-	  computeUserLimit(application, clusterResource, required, user, null));
+        computeUserLimit(application, clusterResource, required, user,
+            RMNodeLabelsManager.NO_LABEL, SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY));
   }
   
   private Resource getHeadroom(User user, Resource currentResourceLimit,
@@ -973,7 +1021,8 @@ public class LeafQueue extends AbstractCSQueue {
 
   @Lock({LeafQueue.class, FiCaSchedulerApp.class})
   Resource computeUserLimitAndSetHeadroom(FiCaSchedulerApp application,
-      Resource clusterResource, Resource required, Set<String> requestedLabels) {
+      Resource clusterResource, Resource required, String nodePartition,
+      SchedulingMode schedulingMode) {
     String user = application.getUser();
     User queueUser = getUser(user);
 
@@ -981,7 +1030,7 @@ public class LeafQueue extends AbstractCSQueue {
     // TODO, need consider headroom respect labels also
     Resource userLimit =
         computeUserLimit(application, clusterResource, required,
-            queueUser, requestedLabels);
+            queueUser, nodePartition, schedulingMode);
 
     setQueueResourceLimitsInfo(clusterResource);
     
@@ -1010,34 +1059,18 @@ public class LeafQueue extends AbstractCSQueue {
   @Lock(NoLock.class)
   private Resource computeUserLimit(FiCaSchedulerApp application,
       Resource clusterResource, Resource required, User user,
-      Set<String> requestedLabels) {
+      String nodePartition, SchedulingMode schedulingMode) {
     // What is our current capacity? 
     // * It is equal to the max(required, queue-capacity) if
     //   we're running below capacity. The 'max' ensures that jobs in queues
     //   with miniscule capacity (< 1 slot) make progress
     // * If we're running over capacity, then its
     //   (usedResources + required) (which extra resources we are allocating)
-    Resource queueCapacity = Resource.newInstance(0, 0);
-    if (requestedLabels != null && !requestedLabels.isEmpty()) {
-      // if we have multiple labels to request, we will choose to use the first
-      // label
-      String firstLabel = requestedLabels.iterator().next();
-      queueCapacity =
-          Resources
-              .max(resourceCalculator, clusterResource, queueCapacity,
-                  Resources.multiplyAndNormalizeUp(resourceCalculator,
-                      labelManager.getResourceByLabel(firstLabel,
-                          clusterResource),
-                      queueCapacities.getAbsoluteCapacity(firstLabel),
-                      minimumAllocation));
-    } else {
-      // else there's no label on request, just to use absolute capacity as
-      // capacity for nodes without label
-      queueCapacity =
-          Resources.multiplyAndNormalizeUp(resourceCalculator, labelManager
-                .getResourceByLabel(CommonNodeLabelsManager.NO_LABEL, clusterResource),
-              queueCapacities.getAbsoluteCapacity(), minimumAllocation);
-    }
+    Resource queueCapacity =
+        Resources.multiplyAndNormalizeUp(resourceCalculator,
+            labelManager.getResourceByLabel(nodePartition, clusterResource),
+            queueCapacities.getAbsoluteCapacity(nodePartition),
+            minimumAllocation);
 
     // Allow progress for queues with miniscule capacity
     queueCapacity =
@@ -1047,33 +1080,56 @@ public class LeafQueue extends AbstractCSQueue {
             required);
 
     Resource currentCapacity =
-        Resources.lessThan(resourceCalculator, clusterResource, 
-            queueUsage.getUsed(), queueCapacity) ?
-            queueCapacity : Resources.add(queueUsage.getUsed(), required);
+        Resources.lessThan(resourceCalculator, clusterResource,
+            queueUsage.getUsed(nodePartition), queueCapacity) ? queueCapacity
+            : Resources.add(queueUsage.getUsed(nodePartition), required);
     
     // Never allow a single user to take more than the 
     // queue's configured capacity * user-limit-factor.
     // Also, the queue's configured capacity should be higher than 
     // queue-hard-limit * ulMin
     
-    final int activeUsers = activeUsersManager.getNumActiveUsers();  
-    		
-    Resource limit =
+    final int activeUsers = activeUsersManager.getNumActiveUsers();
+    
+    // User limit resource is determined by:
+    // max(currentCapacity / #activeUsers, currentCapacity * user-limit-percent%)
+    Resource userLimitResource = Resources.max(
+        resourceCalculator, clusterResource, 
+        Resources.divideAndCeil(
+            resourceCalculator, currentCapacity, activeUsers),
+        Resources.divideAndCeil(
+            resourceCalculator, 
+            Resources.multiplyAndRoundDown(
+                currentCapacity, userLimit), 
+            100)
+        );
+    
+    // User limit is capped by maxUserLimit
+    // - maxUserLimit = queueCapacity * user-limit-factor (RESPECT_PARTITION_EXCLUSIVITY)
+    // - maxUserLimit = total-partition-resource (IGNORE_PARTITION_EXCLUSIVITY)
+    //
+    // In IGNORE_PARTITION_EXCLUSIVITY mode, a queue that cannot access a
+    // partition has a guaranteed resource of 0 on that partition, and the
+    // user-limit-factor computation is based on the queue's guaranteed
+    // capacity. So we do not cap the user limit (or the used resource) when
+    // doing IGNORE_PARTITION_EXCLUSIVITY allocation.
+    Resource maxUserLimit = Resources.none();
+    if (schedulingMode == SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY) {
+      maxUserLimit =
+          Resources.multiplyAndRoundDown(queueCapacity, userLimitFactor);
+    } else if (schedulingMode == SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY) {
+      maxUserLimit =
+          labelManager.getResourceByLabel(nodePartition, clusterResource);
+    }
+    
+    // Cap final user limit with maxUserLimit
+    userLimitResource =
         Resources.roundUp(
             resourceCalculator, 
             Resources.min(
                 resourceCalculator, clusterResource,   
-                Resources.max(
-                    resourceCalculator, clusterResource, 
-                    Resources.divideAndCeil(
-                        resourceCalculator, currentCapacity, activeUsers),
-                    Resources.divideAndCeil(
-                        resourceCalculator, 
-                        Resources.multiplyAndRoundDown(
-                            currentCapacity, userLimit), 
-                        100)
-                    ), 
-                Resources.multiplyAndRoundDown(queueCapacity, userLimitFactor)
+                  userLimitResource,
+                  maxUserLimit
                 ), 
             minimumAllocation);
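
To make the arithmetic above concrete, here is a small self-contained sketch using plain longs and hypothetical numbers in place of the Resources/ResourceCalculator API:

    // Illustrative arithmetic only; the real code uses Resources.max/min,
    // divideAndCeil and multiplyAndRoundDown on Resource objects.
    public class UserLimitSketch {
      static long computeUserLimit(long currentCapacity, int activeUsers,
          int userLimitPercent, long maxUserLimit) {
        // max(currentCapacity / #activeUsers, currentCapacity * user-limit-percent%)
        long perUserShare = (currentCapacity + activeUsers - 1) / activeUsers; // divideAndCeil
        long percentShare = currentCapacity * userLimitPercent / 100;          // roundDown
        long userLimitResource = Math.max(perUserShare, percentShare);
        // Cap by maxUserLimit: queueCapacity * user-limit-factor in
        // RESPECT_PARTITION_EXCLUSIVITY mode, the whole partition otherwise.
        return Math.min(userLimitResource, maxUserLimit);
      }

      public static void main(String[] args) {
        // 100 units of current capacity, 4 active users,
        // minimum-user-limit-percent = 25, queueCapacity * factor = 50.
        System.out.println(computeUserLimit(100, 4, 25, 50)); // prints 25
      }
    }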
 
@@ -1081,11 +1137,11 @@ public class LeafQueue extends AbstractCSQueue {
       String userName = application.getUser();
       LOG.debug("User limit computation for " + userName + 
           " in queue " + getQueueName() +
-          " userLimit=" + userLimit +
+          " userLimitPercent=" + userLimit +
           " userLimitFactor=" + userLimitFactor +
           " required: " + required + 
           " consumed: " + user.getUsed() + 
-          " limit: " + limit +
+          " user-limit-resource: " + userLimitResource +
           " queueCapacity: " + queueCapacity + 
           " qconsumed: " + queueUsage.getUsed() +
           " currentCapacity: " + currentCapacity +
@@ -1093,31 +1149,26 @@ public class LeafQueue extends AbstractCSQueue {
           " clusterCapacity: " + clusterResource
       );
     }
-    user.setUserResourceLimit(limit);
-    return limit;
+    user.setUserResourceLimit(userLimitResource);
+    return userLimitResource;
   }
   
   @Private
   protected synchronized boolean canAssignToUser(Resource clusterResource,
       String userName, Resource limit, FiCaSchedulerApp application,
-      boolean checkReservations, Set<String> requestLabels) {
+      boolean checkReservations, String nodePartition) {
     User user = getUser(userName);
-    
-    String label = CommonNodeLabelsManager.NO_LABEL;
-    if (requestLabels != null && !requestLabels.isEmpty()) {
-      label = requestLabels.iterator().next();
-    }
 
     // Note: We aren't considering the current request since there is a fixed
     // overhead of the AM, but it's a > check, not a >= check, so...
     if (Resources
         .greaterThan(resourceCalculator, clusterResource,
-            user.getUsed(label),
+            user.getUsed(nodePartition),
             limit)) {
       // if enabled, check to see if could we potentially use this node instead
       // of a reserved node if the application has reserved containers
       if (this.reservationsContinueLooking && checkReservations
-          && label.equals(CommonNodeLabelsManager.NO_LABEL)) {
+          && nodePartition.equals(CommonNodeLabelsManager.NO_LABEL)) {
         if (Resources.lessThanOrEqual(
             resourceCalculator,
             clusterResource,
@@ -1136,7 +1187,7 @@ public class LeafQueue extends AbstractCSQueue {
       if (LOG.isDebugEnabled()) {
         LOG.debug("User " + userName + " in queue " + getQueueName()
             + " will exceed limit - " + " consumed: "
-            + user.getUsed() + " limit: " + limit);
+            + user.getUsed(nodePartition) + " limit: " + limit);
       }
       return false;
     }
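
A hedged sketch of the per-partition check this method now performs, with illustrative names (the real method compares Resource objects through the configured ResourceCalculator):

    // Illustrative names only, not the LeafQueue.canAssignToUser signature.
    public class CanAssignToUserSketch {
      static boolean canAssign(long usedOnPartition, long reservedByUser,
          long limit, String nodePartition, boolean reservationsContinueLooking,
          boolean checkReservations) {
        if (usedOnPartition > limit) {
          // Over the limit, but on the default (empty) partition the user may
          // still fit once existing reservations are unreserved.
          if (reservationsContinueLooking && checkReservations
              && nodePartition.isEmpty() /* CommonNodeLabelsManager.NO_LABEL */) {
            return usedOnPartition - reservedByUser <= limit;
          }
          return false;
        }
        return true;
      }

      public static void main(String[] args) {
        System.out.println(canAssign(12, 4, 10, "", true, true));  // true: 12 - 4 <= 10
        System.out.println(canAssign(12, 4, 10, "x", true, true)); // false: labeled partition
      }
    }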
@@ -1176,7 +1227,7 @@ public class LeafQueue extends AbstractCSQueue {
 
   private CSAssignment assignContainersOnNode(Resource clusterResource,
       FiCaSchedulerNode node, FiCaSchedulerApp application, Priority priority,
-      RMContainer reservedContainer) {
+      RMContainer reservedContainer, SchedulingMode schedulingMode) {
 
     CSAssignment assigned;
 
@@ -1190,7 +1241,7 @@ public class LeafQueue extends AbstractCSQueue {
       assigned =
           assignNodeLocalContainers(clusterResource, nodeLocalResourceRequest, 
             node, application, priority, reservedContainer,
-            allocatedContainer);
+            allocatedContainer, schedulingMode);
       if (Resources.greaterThan(resourceCalculator, clusterResource,
         assigned.getResource(), Resources.none())) {
 
@@ -1219,7 +1270,7 @@ public class LeafQueue extends AbstractCSQueue {
       assigned = 
           assignRackLocalContainers(clusterResource, rackLocalResourceRequest, 
             node, application, priority, reservedContainer,
-            allocatedContainer);
+            allocatedContainer, schedulingMode);
       if (Resources.greaterThan(resourceCalculator, clusterResource,
         assigned.getResource(), Resources.none())) {
 
@@ -1248,7 +1299,7 @@ public class LeafQueue extends AbstractCSQueue {
       assigned =
           assignOffSwitchContainers(clusterResource, offSwitchResourceRequest,
             node, application, priority, reservedContainer,
-            allocatedContainer);
+            allocatedContainer, schedulingMode);
 
       // update locality statistics
       if (allocatedContainer.getValue() != null) {
@@ -1314,16 +1365,17 @@ public class LeafQueue extends AbstractCSQueue {
 
   @Private
   protected boolean checkLimitsToReserve(Resource clusterResource,
-      FiCaSchedulerApp application, Resource capability) {
+      FiCaSchedulerApp application, Resource capability, String nodePartition,
+      SchedulingMode schedulingMode) {
     // we can't reserve if we got here based on the limit
     // checks assuming we could unreserve!!!
     Resource userLimit = computeUserLimitAndSetHeadroom(application,
-        clusterResource, capability, null);
+        clusterResource, capability, nodePartition, schedulingMode);
 
     // Check queue max-capacity limit,
     // TODO: Consider reservation on labels
-    if (!canAssignToThisQueue(clusterResource, null,
-        this.currentResourceLimits, capability, Resources.none())) {
+    if (!canAssignToThisQueue(clusterResource, RMNodeLabelsManager.NO_LABEL,
+        this.currentResourceLimits, capability, Resources.none(), schedulingMode)) {
       if (LOG.isDebugEnabled()) {
         LOG.debug("was going to reserve but hit queue limit");
       }
@@ -1332,7 +1384,7 @@ public class LeafQueue extends AbstractCSQueue {
 
     // Check user limit
     if (!canAssignToUser(clusterResource, application.getUser(), userLimit,
-        application, false, null)) {
+        application, false, nodePartition)) {
       if (LOG.isDebugEnabled()) {
         LOG.debug("was going to reserve but hit user limit");
       }
@@ -1345,12 +1397,13 @@ public class LeafQueue extends AbstractCSQueue {
   private CSAssignment assignNodeLocalContainers(Resource clusterResource,
       ResourceRequest nodeLocalResourceRequest, FiCaSchedulerNode node,
       FiCaSchedulerApp application, Priority priority,
-      RMContainer reservedContainer, MutableObject allocatedContainer) {
+      RMContainer reservedContainer, MutableObject allocatedContainer,
+      SchedulingMode schedulingMode) {
     if (canAssign(application, priority, node, NodeType.NODE_LOCAL, 
         reservedContainer)) {
       return assignContainer(clusterResource, node, application, priority,
           nodeLocalResourceRequest, NodeType.NODE_LOCAL, reservedContainer,
-          allocatedContainer);
+          allocatedContainer, schedulingMode);
     }
 
     return new CSAssignment(Resources.none(), NodeType.NODE_LOCAL);
@@ -1359,12 +1412,13 @@ public class LeafQueue extends AbstractCSQueue {
   private CSAssignment assignRackLocalContainers(Resource clusterResource,
       ResourceRequest rackLocalResourceRequest, FiCaSchedulerNode node,
       FiCaSchedulerApp application, Priority priority,
-      RMContainer reservedContainer, MutableObject allocatedContainer) {
+      RMContainer reservedContainer, MutableObject allocatedContainer,
+      SchedulingMode schedulingMode) {
     if (canAssign(application, priority, node, NodeType.RACK_LOCAL,
         reservedContainer)) {
       return assignContainer(clusterResource, node, application, priority,
           rackLocalResourceRequest, NodeType.RACK_LOCAL, reservedContainer,
-          allocatedContainer);
+          allocatedContainer, schedulingMode);
     }
 
     return new CSAssignment(Resources.none(), NodeType.RACK_LOCAL);
@@ -1373,16 +1427,21 @@ public class LeafQueue extends AbstractCSQueue {
   private CSAssignment assignOffSwitchContainers(Resource clusterResource,
       ResourceRequest offSwitchResourceRequest, FiCaSchedulerNode node,
       FiCaSchedulerApp application, Priority priority,
-      RMContainer reservedContainer, MutableObject allocatedContainer) {
+      RMContainer reservedContainer, MutableObject allocatedContainer,
+      SchedulingMode schedulingMode) {
     if (canAssign(application, priority, node, NodeType.OFF_SWITCH,
         reservedContainer)) {
       return assignContainer(clusterResource, node, application, priority,
           offSwitchResourceRequest, NodeType.OFF_SWITCH, reservedContainer,
-          allocatedContainer);
+          allocatedContainer, schedulingMode);
     }
     
     return new CSAssignment(Resources.none(), NodeType.OFF_SWITCH);
   }
+  
+  private int getActualNodeLocalityDelay() {
+    return Math.min(scheduler.getNumClusterNodes(), getNodeLocalityDelay());
+  }
 
   boolean canAssign(FiCaSchedulerApp application, Priority priority, 
       FiCaSchedulerNode node, NodeType type, RMContainer reservedContainer) {
@@ -1417,10 +1476,7 @@ public class LeafQueue extends AbstractCSQueue {
     if (type == NodeType.RACK_LOCAL) {
       // 'Delay' rack-local just a little bit...
       long missedOpportunities = application.getSchedulingOpportunities(priority);
-      return (
-          Math.min(scheduler.getNumClusterNodes(), getNodeLocalityDelay()) < 
-          missedOpportunities
-          );
+      return getActualNodeLocalityDelay() < missedOpportunities;
     }
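
The extracted helper makes the rack-local rule easy to state; a minimal sketch, assuming plain int/long arguments in place of the scheduler objects:

    // Plain-arithmetic sketch of canAssign's rack-local branch.
    public class LocalityDelaySketch {
      static int actualNodeLocalityDelay(int numClusterNodes, int configuredDelay) {
        // Never wait for more heartbeats than there are nodes in the cluster.
        return Math.min(numClusterNodes, configuredDelay);
      }

      static boolean canAssignRackLocal(long missedOpportunities,
          int numClusterNodes, int configuredDelay) {
        return actualNodeLocalityDelay(numClusterNodes, configuredDelay)
            < missedOpportunities;
      }

      public static void main(String[] args) {
        // 100-node cluster, delay of 40: rack-local allowed after 41 misses.
        System.out.println(canAssignRackLocal(41, 100, 40)); // true
        // 10-node cluster caps the effective delay at 10.
        System.out.println(canAssignRackLocal(11, 10, 40));  // true
      }
    }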
 
     // Check if we need containers on this host
@@ -1460,7 +1516,7 @@ public class LeafQueue extends AbstractCSQueue {
   private CSAssignment assignContainer(Resource clusterResource, FiCaSchedulerNode node,
       FiCaSchedulerApp application, Priority priority, 
       ResourceRequest request, NodeType type, RMContainer rmContainer,
-      MutableObject createdContainer) {
+      MutableObject createdContainer, SchedulingMode schedulingMode) {
     if (LOG.isDebugEnabled()) {
       LOG.debug("assignContainers: node=" + node.getNodeName()
         + " application=" + application.getApplicationId()
@@ -1469,9 +1525,8 @@ public class LeafQueue extends AbstractCSQueue {
     }
     
     // check if the resource request can access the label
-    if (!SchedulerUtils.checkNodeLabelExpression(
-        node.getLabels(),
-        request.getNodeLabelExpression())) {
+    if (!SchedulerUtils.checkResourceRequestMatchingNodePartition(request,
+        node.getPartition(), schedulingMode)) {
      // This is a reserved container, but we cannot allocate it now because
      // its label no longer matches the node. This can happen when node
      // labels change. We should un-reserve this container.
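
A sketch of the matching rule that checkResourceRequestMatchingNodePartition plausibly enforces, inferred from the SchedulingMode javadoc later in this commit (names and exact semantics are illustrative, not the SchedulerUtils signature):

    // Assumed semantics of partition matching under the two modes.
    public class PartitionMatchSketch {
      enum Mode { RESPECT_PARTITION_EXCLUSIVITY, IGNORE_PARTITION_EXCLUSIVITY }

      static boolean requestMatchesNode(String requestedPartition,
          String nodePartition, Mode mode) {
        if (mode == Mode.RESPECT_PARTITION_EXCLUSIVITY) {
          // Exact match: labeled requests on matching labeled nodes,
          // non-labeled requests on non-labeled nodes.
          return requestedPartition.equals(nodePartition);
        }
        // IGNORE_PARTITION_EXCLUSIVITY only places non-labeled requests
        // (on non-exclusive labeled nodes).
        return requestedPartition.isEmpty();
      }

      public static void main(String[] args) {
        System.out.println(requestMatchesNode("x", "x", Mode.RESPECT_PARTITION_EXCLUSIVITY)); // true
        System.out.println(requestMatchesNode("", "x", Mode.RESPECT_PARTITION_EXCLUSIVITY));  // false
        System.out.println(requestMatchesNode("", "x", Mode.IGNORE_PARTITION_EXCLUSIVITY));   // true
      }
    }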
@@ -1576,8 +1631,8 @@ public class LeafQueue extends AbstractCSQueue {
          // If we're trying to reserve a container here, no container will be
          // unreserved for reserving the new one. Check limits again before
          // reserving the new container.
-          if (!checkLimitsToReserve(clusterResource, 
-              application, capability)) {
+          if (!checkLimitsToReserve(clusterResource,
+              application, capability, node.getPartition(), schedulingMode)) {
             return new CSAssignment(Resources.none(), type);
           }
         }
@@ -1666,7 +1721,7 @@ public class LeafQueue extends AbstractCSQueue {
         // Book-keeping
         if (removed) {
           releaseResource(clusterResource, application,
-              container.getResource(), node.getLabels());
+              container.getResource(), node.getPartition());
           LOG.info("completedContainer" +
               " container=" + container +
               " queue=" + this +
@@ -1684,13 +1739,13 @@ public class LeafQueue extends AbstractCSQueue {
 
   synchronized void allocateResource(Resource clusterResource,
       SchedulerApplicationAttempt application, Resource resource,
-      Set<String> nodeLabels) {
-    super.allocateResource(clusterResource, resource, nodeLabels);
+      String nodePartition) {
+    super.allocateResource(clusterResource, resource, nodePartition);
     
     // Update user metrics
     String userName = application.getUser();
     User user = getUser(userName);
-    user.assignContainer(resource, nodeLabels);
+    user.assignContainer(resource, nodePartition);
     // Note this is a bit unconventional since it gets the object and modifies
     // it here, rather then using set routine
     Resources.subtractFrom(application.getHeadroom(), resource); // headroom
@@ -1707,13 +1762,13 @@ public class LeafQueue extends AbstractCSQueue {
   }
 
   synchronized void releaseResource(Resource clusterResource, 
-      FiCaSchedulerApp application, Resource resource, Set<String> nodeLabels) {
-    super.releaseResource(clusterResource, resource, nodeLabels);
+      FiCaSchedulerApp application, Resource resource, String nodePartition) {
+    super.releaseResource(clusterResource, resource, nodePartition);
     
     // Update user metrics
     String userName = application.getUser();
     User user = getUser(userName);
-    user.releaseContainer(resource, nodeLabels);
+    user.releaseContainer(resource, nodePartition);
     metrics.setAvailableResourcesToUser(userName, application.getHeadroom());
       
     LOG.info(getQueueName() + 
@@ -1723,7 +1778,8 @@ public class LeafQueue extends AbstractCSQueue {
   
   private void updateAbsoluteCapacityResource(Resource clusterResource) {
     absoluteCapacityResource =
-        Resources.multiplyAndNormalizeUp(resourceCalculator, clusterResource,
+        Resources.multiplyAndNormalizeUp(resourceCalculator, labelManager
+            .getResourceByLabel(RMNodeLabelsManager.NO_LABEL, clusterResource),
             queueCapacities.getAbsoluteCapacity(), minimumAllocation);
   }
   
@@ -1769,8 +1825,9 @@ public class LeafQueue extends AbstractCSQueue {
     // Update application properties
     for (FiCaSchedulerApp application : activeApplications) {
       synchronized (application) {
-        computeUserLimitAndSetHeadroom(application, clusterResource, 
-            Resources.none(), null);
+        computeUserLimitAndSetHeadroom(application, clusterResource,
+            Resources.none(), RMNodeLabelsManager.NO_LABEL,
+            SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
       }
     }
   }
@@ -1828,25 +1885,12 @@ public class LeafQueue extends AbstractCSQueue {
       }
     }
 
-    public void assignContainer(Resource resource,
-        Set<String> nodeLabels) {
-      if (nodeLabels == null || nodeLabels.isEmpty()) {
-        userResourceUsage.incUsed(resource);
-      } else {
-        for (String label : nodeLabels) {
-          userResourceUsage.incUsed(label, resource);
-        }
-      }
+    public void assignContainer(Resource resource, String nodePartition) {
+      userResourceUsage.incUsed(nodePartition, resource);
     }
 
-    public void releaseContainer(Resource resource, Set<String> nodeLabels) {
-      if (nodeLabels == null || nodeLabels.isEmpty()) {
-        userResourceUsage.decUsed(resource);
-      } else {
-        for (String label : nodeLabels) {
-          userResourceUsage.decUsed(label, resource);
-        }
-      }
+    public void releaseContainer(Resource resource, String nodePartition) {
+      userResourceUsage.decUsed(nodePartition, resource);
     }
 
     public Resource getUserResourceLimit() {
@@ -1869,7 +1913,7 @@ public class LeafQueue extends AbstractCSQueue {
       FiCaSchedulerNode node =
           scheduler.getNode(rmContainer.getContainer().getNodeId());
       allocateResource(clusterResource, attempt, rmContainer.getContainer()
-          .getResource(), node.getLabels());
+          .getResource(), node.getPartition());
     }
     getParent().recoverContainer(clusterResource, attempt, rmContainer);
   }
@@ -1909,7 +1953,7 @@ public class LeafQueue extends AbstractCSQueue {
       FiCaSchedulerNode node =
           scheduler.getNode(rmContainer.getContainer().getNodeId());
       allocateResource(clusterResource, application, rmContainer.getContainer()
-          .getResource(), node.getLabels());
+          .getResource(), node.getPartition());
       LOG.info("movedContainer" + " container=" + rmContainer.getContainer()
           + " resource=" + rmContainer.getContainer().getResource()
           + " queueMoveIn=" + this + " usedCapacity=" + getUsedCapacity()
@@ -1927,7 +1971,7 @@ public class LeafQueue extends AbstractCSQueue {
       FiCaSchedulerNode node =
           scheduler.getNode(rmContainer.getContainer().getNodeId());
       releaseResource(clusterResource, application, rmContainer.getContainer()
-          .getResource(), node.getLabels());
+          .getResource(), node.getPartition());
       LOG.info("movedContainer" + " container=" + rmContainer.getContainer()
           + " resource=" + rmContainer.getContainer().getResource()
           + " queueMoveOut=" + this + " usedCapacity=" + getUsedCapacity()

+ 37 - 22
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/ParentQueue.java

@@ -56,8 +56,6 @@ import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ActiveUsersManage
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.NodeType;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceLimits;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.SchedulerApplicationAttempt;
-import org.apache.hadoop.yarn.server.resourcemanager.scheduler.SchedulerUtils;
-import org.apache.hadoop.yarn.server.resourcemanager.scheduler.common.AssignmentInformation;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.common.fica.FiCaSchedulerApp;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.common.fica.FiCaSchedulerNode;
 import org.apache.hadoop.yarn.util.resource.Resources;
@@ -377,16 +375,29 @@ public class ParentQueue extends AbstractCSQueue {
 
   @Override
   public synchronized CSAssignment assignContainers(Resource clusterResource,
-      FiCaSchedulerNode node, ResourceLimits resourceLimits) {
-    CSAssignment assignment = 
-        new CSAssignment(Resources.createResource(0, 0), NodeType.NODE_LOCAL);
-    Set<String> nodeLabels = node.getLabels();
-    
+      FiCaSchedulerNode node, ResourceLimits resourceLimits,
+      SchedulingMode schedulingMode) {
     // if our queue cannot access this node, just return
-    if (!SchedulerUtils.checkQueueAccessToNode(accessibleLabels, nodeLabels)) {
-      return assignment;
+    if (schedulingMode == SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY
+        && !accessibleToPartition(node.getPartition())) {
+      return NULL_ASSIGNMENT;
+    }
+    
+    // Check if this queue needs more resources; simply skip allocation if it
+    // doesn't.
+    if (!super.hasPendingResourceRequest(node.getPartition(),
+        clusterResource, schedulingMode)) {
+      if (LOG.isDebugEnabled()) {
+        LOG.debug("Skip this queue=" + getQueuePath()
+            + ", because it doesn't need more resource, schedulingMode="
+            + schedulingMode.name() + " node-partition=" + node.getPartition());
+      }
+      return NULL_ASSIGNMENT;
     }
     
+    CSAssignment assignment = 
+        new CSAssignment(Resources.createResource(0, 0), NodeType.NODE_LOCAL);
+    
     while (canAssign(clusterResource, node)) {
       if (LOG.isDebugEnabled()) {
         LOG.debug("Trying to assign containers to child-queue of "
@@ -396,15 +407,17 @@ public class ParentQueue extends AbstractCSQueue {
       // Are we over maximum-capacity for this queue?
      // This will also consider the parent's limits and continuous
      // reservation looking
-      if (!super.canAssignToThisQueue(clusterResource, nodeLabels, resourceLimits,
-          minimumAllocation, Resources.createResource(getMetrics()
-              .getReservedMB(), getMetrics().getReservedVirtualCores()))) {
+      if (!super.canAssignToThisQueue(clusterResource, node.getPartition(),
+          resourceLimits, minimumAllocation, Resources.createResource(
+              getMetrics().getReservedMB(), getMetrics()
+                  .getReservedVirtualCores()), schedulingMode)) {
         break;
       }
       
       // Schedule
-      CSAssignment assignedToChild = 
-          assignContainersToChildQueues(clusterResource, node, resourceLimits);
+      CSAssignment assignedToChild =
+          assignContainersToChildQueues(clusterResource, node, resourceLimits,
+              schedulingMode);
       assignment.setType(assignedToChild.getType());
       
       // Done if no child-queue assigned anything
@@ -413,7 +426,7 @@ public class ParentQueue extends AbstractCSQueue {
               assignedToChild.getResource(), Resources.none())) {
         // Track resource utilization for the parent-queue
         super.allocateResource(clusterResource, assignedToChild.getResource(),
-            nodeLabels);
+            node.getPartition());
         
         // Track resource utilization in this pass of the scheduler
         Resources
@@ -510,7 +523,8 @@ public class ParentQueue extends AbstractCSQueue {
   }
   
   private synchronized CSAssignment assignContainersToChildQueues(
-      Resource cluster, FiCaSchedulerNode node, ResourceLimits limits) {
+      Resource cluster, FiCaSchedulerNode node, ResourceLimits limits,
+      SchedulingMode schedulingMode) {
     CSAssignment assignment = 
         new CSAssignment(Resources.createResource(0, 0), NodeType.NODE_LOCAL);
     
@@ -523,12 +537,13 @@ public class ParentQueue extends AbstractCSQueue {
         LOG.debug("Trying to assign to queue: " + childQueue.getQueuePath()
           + " stats: " + childQueue);
       }
-      
+
       // Get ResourceLimits of child queue before assign containers
       ResourceLimits childLimits =
           getResourceLimitsOfChild(childQueue, cluster, limits);
       
-      assignment = childQueue.assignContainers(cluster, node, childLimits);
+      assignment = childQueue.assignContainers(cluster, node, 
+          childLimits, schedulingMode);
       if(LOG.isDebugEnabled()) {
         LOG.debug("Assigned to queue: " + childQueue.getQueuePath() +
           " stats: " + childQueue + " --> " + 
@@ -584,7 +599,7 @@ public class ParentQueue extends AbstractCSQueue {
       // Book keeping
       synchronized (this) {
         super.releaseResource(clusterResource, rmContainer.getContainer()
-            .getResource(), node.getLabels());
+            .getResource(), node.getPartition());
 
         LOG.info("completedContainer" +
             " queue=" + getQueueName() + 
@@ -653,7 +668,7 @@ public class ParentQueue extends AbstractCSQueue {
       FiCaSchedulerNode node =
           scheduler.getNode(rmContainer.getContainer().getNodeId());
       super.allocateResource(clusterResource, rmContainer.getContainer()
-          .getResource(), node.getLabels());
+          .getResource(), node.getPartition());
     }
     if (parent != null) {
       parent.recoverContainer(clusterResource, attempt, rmContainer);
@@ -681,7 +696,7 @@ public class ParentQueue extends AbstractCSQueue {
       FiCaSchedulerNode node =
           scheduler.getNode(rmContainer.getContainer().getNodeId());
       super.allocateResource(clusterResource, rmContainer.getContainer()
-          .getResource(), node.getLabels());
+          .getResource(), node.getPartition());
       LOG.info("movedContainer" + " queueMoveIn=" + getQueueName()
           + " usedCapacity=" + getUsedCapacity() + " absoluteUsedCapacity="
           + getAbsoluteUsedCapacity() + " used=" + queueUsage.getUsed() + " cluster="
@@ -701,7 +716,7 @@ public class ParentQueue extends AbstractCSQueue {
           scheduler.getNode(rmContainer.getContainer().getNodeId());
       super.releaseResource(clusterResource,
           rmContainer.getContainer().getResource(),
-          node.getLabels());
+          node.getPartition());
       LOG.info("movedContainer" + " queueMoveOut=" + getQueueName()
           + " usedCapacity=" + getUsedCapacity() + " absoluteUsedCapacity="
           + getAbsoluteUsedCapacity() + " used=" + queueUsage.getUsed() + " cluster="
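
The two early exits added to ParentQueue.assignContainers above can be condensed into a standalone sketch (illustrative names and types; the real checks use accessibleToPartition and hasPendingResourceRequest on queue and node objects):

    // Booleans and a long stand in for the queue, node and ResourceUsage objects.
    public class ParentQueueEarlyExitSketch {
      static boolean shouldSkip(boolean accessibleToPartition,
          long pendingOnPartition, boolean respectPartitionExclusivity) {
        // 1. In RESPECT_PARTITION_EXCLUSIVITY mode, skip nodes whose
        //    partition this queue cannot access.
        if (respectPartitionExclusivity && !accessibleToPartition) {
          return true;
        }
        // 2. Skip the whole subtree when nothing is pending for this
        //    partition, so idle queues cost nothing per heartbeat.
        return pendingOnPartition == 0;
      }

      public static void main(String[] args) {
        System.out.println(shouldSkip(false, 5, true)); // true: inaccessible partition
        System.out.println(shouldSkip(true, 0, true));  // true: nothing pending
        System.out.println(shouldSkip(true, 5, true));  // false: descend to children
      }
    }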

+ 44 - 0
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/SchedulingMode.java

@@ -0,0 +1,44 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity;
+
+/**
+ * Scheduling modes; see below for detailed explanations.
+ */
+public enum SchedulingMode {
+  /**
+   * <p>
+   * When a node has a partition (say partition=x), only applications in
+   * queues that can access partition=x AND that request partition=x
+   * resources get a chance to allocate on the node.
+   * </p>
+   * 
+   * <p>
+   * When a node has no partition, only applications that request
+   * non-partitioned resources get a chance to allocate on the node.
+   * </p>
+   */
+  RESPECT_PARTITION_EXCLUSIVITY,
+  
+  /**
+   * Only used when a node has a partition AND the partition isn't exclusive
+   * AND the application requests non-partitioned resources.
+   */
+  IGNORE_PARTITION_EXCLUSIVITY
+}
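
A hedged sketch of how a scheduler pass might select between the two modes; the actual CapacityScheduler wiring lives in a different file of this commit and is assumed here:

    // Assumed driver logic for a node-heartbeat scheduling cycle.
    public class SchedulingModeSketch {
      enum SchedulingMode { RESPECT_PARTITION_EXCLUSIVITY, IGNORE_PARTITION_EXCLUSIVITY }

      static SchedulingMode[] passesFor(String nodePartition, boolean exclusive) {
        // Always run an exclusivity-respecting pass first; on a non-exclusive
        // labeled node, follow with an opportunistic pass for non-partitioned
        // requests.
        if (!nodePartition.isEmpty() && !exclusive) {
          return new SchedulingMode[] {
              SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY,
              SchedulingMode.IGNORE_PARTITION_EXCLUSIVITY };
        }
        return new SchedulingMode[] { SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY };
      }

      public static void main(String[] args) {
        System.out.println(passesFor("x", false).length); // 2: second-chance pass
        System.out.println(passesFor("", true).length);   // 1
      }
    }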

+ 4 - 0
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/Application.java

@@ -54,6 +54,7 @@ import org.apache.hadoop.yarn.exceptions.YarnException;
 import org.apache.hadoop.yarn.factories.RecordFactory;
 import org.apache.hadoop.yarn.factory.providers.RecordFactoryProvider;
 import org.apache.hadoop.yarn.server.resourcemanager.Task.State;
+import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.Allocation;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.NodeType;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceScheduler;
@@ -277,6 +278,9 @@ public class Application {
     } else {
       request.setNumContainers(request.getNumContainers() + 1);
     }
+    if (request.getNodeLabelExpression() == null) {
+      request.setNodeLabelExpression(RMNodeLabelsManager.NO_LABEL);
+    }
     
     // Note this down for next interaction with ResourceManager
     ask.remove(request);

+ 7 - 1
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/MockAM.java

@@ -150,8 +150,14 @@ public class MockAM {
   public AllocateResponse allocate(
       String host, int memory, int numContainers,
       List<ContainerId> releases, String labelExpression) throws Exception {
+    return allocate(host, memory, numContainers, 1, releases, labelExpression);
+  }
+  
+  public AllocateResponse allocate(
+      String host, int memory, int numContainers, int priority,
+      List<ContainerId> releases, String labelExpression) throws Exception {
     List<ResourceRequest> reqs =
-        createReq(new String[] { host }, memory, 1, numContainers,
+        createReq(new String[] { host }, memory, priority, numContainers,
             labelExpression);
     return allocate(reqs, releases);
   }

+ 32 - 3
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/MockRM.java

@@ -21,6 +21,8 @@ package org.apache.hadoop.yarn.server.resourcemanager;
 import java.io.IOException;
 import java.nio.ByteBuffer;
 import java.security.PrivilegedAction;
+import java.util.Arrays;
+import java.util.Collection;
 import java.util.List;
 import java.util.Map;
 
@@ -200,10 +202,18 @@ public class MockRM extends ResourceManager {
   
   public boolean waitForState(MockNM nm, ContainerId containerId,
       RMContainerState containerState, int timeoutMillisecs) throws Exception {
+    return waitForState(Arrays.asList(nm), containerId, containerState,
+        timeoutMillisecs);
+  }
+  
+  public boolean waitForState(Collection<MockNM> nms, ContainerId containerId,
+      RMContainerState containerState, int timeoutMillisecs) throws Exception {
     RMContainer container = getResourceScheduler().getRMContainer(containerId);
     int timeoutSecs = 0;
     while(container == null && timeoutSecs++ < timeoutMillisecs / 100) {
-      nm.nodeHeartbeat(true);
+      for (MockNM nm : nms) {
+        nm.nodeHeartbeat(true);
+      }
       container = getResourceScheduler().getRMContainer(containerId);
       System.out.println("Waiting for container " + containerId + " to be allocated.");
       Thread.sleep(100);
@@ -217,9 +227,11 @@ public class MockRM extends ResourceManager {
         && timeoutSecs++ < timeoutMillisecs / 100) {
       System.out.println("Container : " + containerId + " State is : "
           + container.getState() + " Waiting for state : " + containerState);
-      nm.nodeHeartbeat(true);
+      for (MockNM nm : nms) {
+        nm.nodeHeartbeat(true);
+      }
       Thread.sleep(100);
-      
+
       if (timeoutMillisecs <= timeoutSecs * 100) {
         return false;
       }
@@ -650,11 +662,28 @@ public class MockRM extends ResourceManager {
     am.waitForState(RMAppAttemptState.FINISHED);
     rm.waitForState(rmApp.getApplicationId(), RMAppState.FINISHED);
   }
+  
+  @SuppressWarnings("rawtypes")
+  private static void waitForSchedulerAppAttemptAdded(
+      ApplicationAttemptId attemptId, MockRM rm) throws InterruptedException {
+    int tick = 0;
+    // Wait for at most 5 sec
+    while (null == ((AbstractYarnScheduler) rm.getResourceScheduler())
+        .getApplicationAttempt(attemptId) && tick < 50) {
+      Thread.sleep(100);
+      if (tick % 10 == 0) {
+        System.out.println("waiting for SchedulerApplicationAttempt="
+            + attemptId + " to be added.");
+      }
+      tick++;
+    }
+  }
 
   public static MockAM launchAM(RMApp app, MockRM rm, MockNM nm)
       throws Exception {
     rm.waitForState(app.getApplicationId(), RMAppState.ACCEPTED);
     RMAppAttempt attempt = app.getCurrentAppAttempt();
+    waitForSchedulerAppAttemptAdded(attempt.getAppAttemptId(), rm);
     System.out.println("Launch AM " + attempt.getAppAttemptId());
     nm.nodeHeartbeat(true);
     MockAM am = rm.sendAMLaunched(attempt.getAppAttemptId());

+ 4 - 4
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestApplicationLimits.java

@@ -612,7 +612,7 @@ public class TestApplicationLimits {
 
     // Schedule to compute 
     queue.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource));
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     Resource expectedHeadroom = Resources.createResource(10*16*GB, 1);
     assertEquals(expectedHeadroom, app_0_0.getHeadroom());
 
@@ -632,7 +632,7 @@ public class TestApplicationLimits {
 
     // Schedule to compute 
     queue.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource)); // Schedule to compute
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY); // Schedule to compute
     assertEquals(expectedHeadroom, app_0_0.getHeadroom());
     assertEquals(expectedHeadroom, app_0_1.getHeadroom());// no change
     
@@ -652,7 +652,7 @@ public class TestApplicationLimits {
     
     // Schedule to compute 
     queue.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource)); // Schedule to compute
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY); // Schedule to compute
     expectedHeadroom = Resources.createResource(10*16*GB / 2, 1); // changes
     assertEquals(expectedHeadroom, app_0_0.getHeadroom());
     assertEquals(expectedHeadroom, app_0_1.getHeadroom());
@@ -661,7 +661,7 @@ public class TestApplicationLimits {
     // Now reduce cluster size and check for the smaller headroom
     clusterResource = Resources.createResource(90*16*GB);
     queue.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource)); // Schedule to compute
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY); // Schedule to compute
     expectedHeadroom = Resources.createResource(9*16*GB / 2, 1); // changes
     assertEquals(expectedHeadroom, app_0_0.getHeadroom());
     assertEquals(expectedHeadroom, app_0_1.getHeadroom());

+ 26 - 15
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestChildQueueOrder.java

@@ -44,6 +44,7 @@ import org.apache.hadoop.yarn.event.DrainDispatcher;
 import org.apache.hadoop.yarn.server.resourcemanager.RMContext;
 import org.apache.hadoop.yarn.server.resourcemanager.ahs.RMApplicationHistoryWriter;
 import org.apache.hadoop.yarn.server.resourcemanager.metrics.SystemMetricsPublisher;
+import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.ContainerAllocationExpirer;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainer;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainerEventType;
@@ -133,7 +134,7 @@ public class TestChildQueueOrder {
         final Resource allocatedResource = Resources.createResource(allocation);
         if (queue instanceof ParentQueue) {
           ((ParentQueue)queue).allocateResource(clusterResource, 
-              allocatedResource, null);
+              allocatedResource, RMNodeLabelsManager.NO_LABEL);
         } else {
           FiCaSchedulerApp app1 = getMockApplication(0, "");
           ((LeafQueue)queue).allocateResource(clusterResource, app1, 
@@ -145,7 +146,7 @@ public class TestChildQueueOrder {
           doReturn(new CSAssignment(Resources.none(), type)).
           when(queue)
               .assignContainers(eq(clusterResource), eq(node),
-                  any(ResourceLimits.class));
+                  any(ResourceLimits.class), any(SchedulingMode.class));
 
           // Mock the node's resource availability
           Resource available = node.getAvailableResource();
@@ -157,7 +158,7 @@ public class TestChildQueueOrder {
       }
     }).
     when(queue).assignContainers(eq(clusterResource), eq(node), 
-        any(ResourceLimits.class));
+        any(ResourceLimits.class), any(SchedulingMode.class));
     doNothing().when(node).releaseContainer(any(Container.class));
   }
 
@@ -241,6 +242,14 @@ public class TestChildQueueOrder {
     CSQueue b = queues.get(B);
     CSQueue c = queues.get(C);
     CSQueue d = queues.get(D);
+    
+    // Make sure root and a/b/c/d have >0 pending resources, so that
+    // allocation will continue.
+    queues.get(CapacitySchedulerConfiguration.ROOT).getQueueResourceUsage()
+        .incPending(Resources.createResource(1 * GB));
+    a.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    b.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    c.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    d.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
 
     final String user_0 = "user_0";
 
@@ -275,7 +284,7 @@ public class TestChildQueueOrder {
     stubQueueAllocation(c, clusterResource, node_0, 0*GB);
     stubQueueAllocation(d, clusterResource, node_0, 0*GB);
     root.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource));
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     for(int i=0; i < 2; i++)
     {
       stubQueueAllocation(a, clusterResource, node_0, 0*GB);
@@ -283,7 +292,7 @@ public class TestChildQueueOrder {
       stubQueueAllocation(c, clusterResource, node_0, 0*GB);
       stubQueueAllocation(d, clusterResource, node_0, 0*GB);
       root.assignContainers(clusterResource, node_0, new ResourceLimits(
-          clusterResource));
+          clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     } 
     for(int i=0; i < 3; i++)
     {
@@ -292,7 +301,7 @@ public class TestChildQueueOrder {
       stubQueueAllocation(c, clusterResource, node_0, 1*GB);
       stubQueueAllocation(d, clusterResource, node_0, 0*GB);
       root.assignContainers(clusterResource, node_0, new ResourceLimits(
-          clusterResource));
+          clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     }  
     for(int i=0; i < 4; i++)
     {
@@ -301,7 +310,7 @@ public class TestChildQueueOrder {
       stubQueueAllocation(c, clusterResource, node_0, 0*GB);
       stubQueueAllocation(d, clusterResource, node_0, 1*GB);
       root.assignContainers(clusterResource, node_0, new ResourceLimits(
-          clusterResource));
+          clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     }    
     verifyQueueMetrics(a, 1*GB, clusterResource);
     verifyQueueMetrics(b, 2*GB, clusterResource);
@@ -335,7 +344,7 @@ public class TestChildQueueOrder {
       stubQueueAllocation(c, clusterResource, node_0, 0*GB);
       stubQueueAllocation(d, clusterResource, node_0, 0*GB);
       root.assignContainers(clusterResource, node_0, new ResourceLimits(
-          clusterResource));
+          clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     }
     verifyQueueMetrics(a, 3*GB, clusterResource);
     verifyQueueMetrics(b, 2*GB, clusterResource);
@@ -363,7 +372,7 @@ public class TestChildQueueOrder {
     stubQueueAllocation(c, clusterResource, node_0, 0*GB);
     stubQueueAllocation(d, clusterResource, node_0, 0*GB);
     root.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource));
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verifyQueueMetrics(a, 2*GB, clusterResource);
     verifyQueueMetrics(b, 3*GB, clusterResource);
     verifyQueueMetrics(c, 3*GB, clusterResource);
@@ -390,7 +399,7 @@ public class TestChildQueueOrder {
     stubQueueAllocation(c, clusterResource, node_0, 0*GB);
     stubQueueAllocation(d, clusterResource, node_0, 0*GB);
     root.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource));
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verifyQueueMetrics(a, 3*GB, clusterResource);
     verifyQueueMetrics(b, 2*GB, clusterResource);
     verifyQueueMetrics(c, 3*GB, clusterResource);
@@ -405,12 +414,14 @@ public class TestChildQueueOrder {
     stubQueueAllocation(c, clusterResource, node_0, 0*GB);
     stubQueueAllocation(d, clusterResource, node_0, 1*GB);
     root.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource));
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     InOrder allocationOrder = inOrder(d,b);
-    allocationOrder.verify(d).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), any(ResourceLimits.class));
-    allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), any(ResourceLimits.class));
+    allocationOrder.verify(d).assignContainers(eq(clusterResource),
+        any(FiCaSchedulerNode.class), any(ResourceLimits.class),
+        any(SchedulingMode.class));
+    allocationOrder.verify(b).assignContainers(eq(clusterResource),
+        any(FiCaSchedulerNode.class), any(ResourceLimits.class),
+        any(SchedulingMode.class));
     verifyQueueMetrics(a, 3*GB, clusterResource);
     verifyQueueMetrics(b, 2*GB, clusterResource);
     verifyQueueMetrics(c, 3*GB, clusterResource);

+ 7 - 383
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestContainerAllocation.java

@@ -19,6 +19,8 @@
 package org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity;
 
 import java.util.ArrayList;
+import java.util.Arrays;
+import java.util.HashSet;
 import java.util.List;
 import java.util.Set;
 
@@ -32,6 +34,7 @@ import org.apache.hadoop.yarn.api.records.Container;
 import org.apache.hadoop.yarn.api.records.ContainerId;
 import org.apache.hadoop.yarn.api.records.LogAggregationContext;
 import org.apache.hadoop.yarn.api.records.NodeId;
+import org.apache.hadoop.yarn.api.records.NodeLabel;
 import org.apache.hadoop.yarn.api.records.Priority;
 import org.apache.hadoop.yarn.api.records.Resource;
 import org.apache.hadoop.yarn.api.records.ResourceRequest;
@@ -51,9 +54,13 @@ import org.apache.hadoop.yarn.server.resourcemanager.rmapp.attempt.RMAppAttempt;
 import org.apache.hadoop.yarn.server.resourcemanager.rmapp.attempt.RMAppAttemptState;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainer;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainerState;
+import org.apache.hadoop.yarn.server.resourcemanager.rmnode.RMNode;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceScheduler;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.SchedulerAppReport;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.SchedulerNode;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.YarnScheduler;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.common.fica.FiCaSchedulerApp;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.event.NodeUpdateSchedulerEvent;
 import org.apache.hadoop.yarn.server.resourcemanager.security.RMContainerTokenSecretManager;
 import org.apache.hadoop.yarn.server.utils.BuilderUtils;
 import org.junit.Assert;
@@ -327,387 +334,4 @@ public class TestContainerAllocation {
     rm1.waitForState(attempt.getAppAttemptId(), RMAppAttemptState.ALLOCATED);
     MockRM.launchAndRegisterAM(app1, rm1, nm1);
   }
-  
-  private Configuration getConfigurationWithQueueLabels(Configuration config) {
-    CapacitySchedulerConfiguration conf =
-        new CapacitySchedulerConfiguration(config);
-    
-    // Define top-level queues
-    conf.setQueues(CapacitySchedulerConfiguration.ROOT, new String[] {"a", "b", "c"});
-    conf.setCapacityByLabel(CapacitySchedulerConfiguration.ROOT, "x", 100);
-    conf.setCapacityByLabel(CapacitySchedulerConfiguration.ROOT, "y", 100);
-
-    final String A = CapacitySchedulerConfiguration.ROOT + ".a";
-    conf.setCapacity(A, 10);
-    conf.setMaximumCapacity(A, 15);
-    conf.setAccessibleNodeLabels(A, toSet("x"));
-    conf.setCapacityByLabel(A, "x", 100);
-    
-    final String B = CapacitySchedulerConfiguration.ROOT + ".b";
-    conf.setCapacity(B, 20);
-    conf.setAccessibleNodeLabels(B, toSet("y"));
-    conf.setCapacityByLabel(B, "y", 100);
-    
-    final String C = CapacitySchedulerConfiguration.ROOT + ".c";
-    conf.setCapacity(C, 70);
-    conf.setMaximumCapacity(C, 70);
-    conf.setAccessibleNodeLabels(C, RMNodeLabelsManager.EMPTY_STRING_SET);
-    
-    // Define 2nd-level queues
-    final String A1 = A + ".a1";
-    conf.setQueues(A, new String[] {"a1"});
-    conf.setCapacity(A1, 100);
-    conf.setMaximumCapacity(A1, 100);
-    conf.setCapacityByLabel(A1, "x", 100);
-    
-    final String B1 = B + ".b1";
-    conf.setQueues(B, new String[] {"b1"});
-    conf.setCapacity(B1, 100);
-    conf.setMaximumCapacity(B1, 100);
-    conf.setCapacityByLabel(B1, "y", 100);
-
-    final String C1 = C + ".c1";
-    conf.setQueues(C, new String[] {"c1"});
-    conf.setCapacity(C1, 100);
-    conf.setMaximumCapacity(C1, 100);
-    
-    return conf;
-  }
-  
-  private void checkTaskContainersHost(ApplicationAttemptId attemptId,
-      ContainerId containerId, ResourceManager rm, String host) {
-    YarnScheduler scheduler = rm.getRMContext().getScheduler();
-    SchedulerAppReport appReport = scheduler.getSchedulerAppInfo(attemptId);
-
-    Assert.assertTrue(appReport.getLiveContainers().size() > 0);
-    for (RMContainer c : appReport.getLiveContainers()) {
-      if (c.getContainerId().equals(containerId)) {
-        Assert.assertEquals(host, c.getAllocatedNode().getHost());
-      }
-    }
-  }
-  
-  @SuppressWarnings("unchecked")
-  private <E> Set<E> toSet(E... elements) {
-    Set<E> set = Sets.newHashSet(elements);
-    return set;
-  }
-  
-  @Test (timeout = 300000)
-  public void testContainerAllocationWithSingleUserLimits() throws Exception {
-    final RMNodeLabelsManager mgr = new NullRMNodeLabelsManager();
-    mgr.init(conf);
-
-    // set node -> label
-    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
-    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x"),
-        NodeId.newInstance("h2", 0), toSet("y")));
-
-    // inject node label manager
-    MockRM rm1 = new MockRM(TestUtils.getConfigurationWithDefaultQueueLabels(conf)) {
-      @Override
-      public RMNodeLabelsManager createNodeLabelManager() {
-        return mgr;
-      }
-    };
-
-    rm1.getRMContext().setNodeLabelManager(mgr);
-    rm1.start();
-    MockNM nm1 = rm1.registerNode("h1:1234", 8000); // label = x
-    rm1.registerNode("h2:1234", 8000); // label = y
-    MockNM nm3 = rm1.registerNode("h3:1234", 8000); // label = <empty>
-
-    // launch an app to queue a1 (label = x), and check all container will
-    // be allocated in h1
-    RMApp app1 = rm1.submitApp(200, "app", "user", null, "a1");
-    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm1);
-    
-    // A has only 10% of x, so it can only allocate one container in label=empty
-    ContainerId containerId =
-        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2);
-    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "");
-    Assert.assertTrue(rm1.waitForState(nm3, containerId,
-          RMContainerState.ALLOCATED, 10 * 1000));
-    // Cannot allocate 2nd label=empty container
-    containerId =
-        ContainerId.newContainerId(am1.getApplicationAttemptId(), 3);
-    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "");
-    Assert.assertFalse(rm1.waitForState(nm3, containerId,
-          RMContainerState.ALLOCATED, 10 * 1000));
-
-    // A has default user limit = 100, so it can use all resource in label = x
-    // We can allocate floor(8000 / 1024) = 7 containers
-    for (int id = 3; id <= 8; id++) {
-      containerId =
-          ContainerId.newContainerId(am1.getApplicationAttemptId(), id);
-      am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "x");
-      Assert.assertTrue(rm1.waitForState(nm1, containerId,
-          RMContainerState.ALLOCATED, 10 * 1000));
-    }
-    rm1.close();
-  }
-  
-  @Test(timeout = 300000)
-  public void testContainerAllocateWithComplexLabels() throws Exception {
-    /*
-     * Queue structure:
-     *                      root (*)
-     *                  ________________
-     *                 /                \
-     *               a x(100%), y(50%)   b y(50%), z(100%)
-     *               ________________    ______________
-     *              /                   /              \
-     *             a1 (x,y)         b1(no)              b2(y,z)
-     *               100%                          y = 100%, z = 100%
-     *                           
-     * Node structure:
-     * h1 : x
-     * h2 : y
-     * h3 : y
-     * h4 : z
-     * h5 : NO
-     * 
-     * Total resource:
-     * x: 4G
-     * y: 6G
-     * z: 2G
-     * *: 2G
-     * 
-     * Resource of
-     * a1: x=4G, y=3G, NO=0.2G
-     * b1: NO=0.9G (max=1G)
-     * b2: y=3, z=2G, NO=0.9G (max=1G)
-     * 
-     * Each node can only allocate two containers
-     */
-
-    // set node -> label
-    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y", "z"));
-    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0),
-        toSet("x"), NodeId.newInstance("h2", 0), toSet("y"),
-        NodeId.newInstance("h3", 0), toSet("y"), NodeId.newInstance("h4", 0),
-        toSet("z"), NodeId.newInstance("h5", 0),
-        RMNodeLabelsManager.EMPTY_STRING_SET));
-
-    // inject node label manager
-    MockRM rm1 = new MockRM(TestUtils.getComplexConfigurationWithQueueLabels(conf)) {
-      @Override
-      public RMNodeLabelsManager createNodeLabelManager() {
-        return mgr;
-      }
-    };
-
-    rm1.getRMContext().setNodeLabelManager(mgr);
-    rm1.start();
-    MockNM nm1 = rm1.registerNode("h1:1234", 2048);
-    MockNM nm2 = rm1.registerNode("h2:1234", 2048);
-    MockNM nm3 = rm1.registerNode("h3:1234", 2048);
-    MockNM nm4 = rm1.registerNode("h4:1234", 2048);
-    MockNM nm5 = rm1.registerNode("h5:1234", 2048);
-    
-    ContainerId containerId;
-
-    // launch an app to queue a1 (label = x), and check all container will
-    // be allocated in h1
-    RMApp app1 = rm1.submitApp(1024, "app", "user", null, "a1");
-    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm1);
-
-    // request a container (label = y). can be allocated on nm2 
-    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "y");
-    containerId =
-        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2L);
-    Assert.assertTrue(rm1.waitForState(nm2, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am1.getApplicationAttemptId(), containerId, rm1,
-        "h2");
-
-    // launch an app to queue b1 (label = y), and check all container will
-    // be allocated in h5
-    RMApp app2 = rm1.submitApp(1024, "app", "user", null, "b1");
-    MockAM am2 = MockRM.launchAndRegisterAM(app2, rm1, nm5);
-
-    // request a container for AM, will succeed
-    // and now b1's queue capacity will be used, cannot allocate more containers
-    // (Maximum capacity reached)
-    am2.allocate("*", 1024, 1, new ArrayList<ContainerId>());
-    containerId = ContainerId.newContainerId(am2.getApplicationAttemptId(), 2);
-    Assert.assertFalse(rm1.waitForState(nm4, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    Assert.assertFalse(rm1.waitForState(nm5, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    
-    // launch an app to queue b2
-    RMApp app3 = rm1.submitApp(1024, "app", "user", null, "b2");
-    MockAM am3 = MockRM.launchAndRegisterAM(app3, rm1, nm5);
-
-    // request a container. try to allocate on nm1 (label = x) and nm3 (label =
-    // y,z). Will successfully allocate on nm3
-    am3.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "y");
-    containerId = ContainerId.newContainerId(am3.getApplicationAttemptId(), 2);
-    Assert.assertFalse(rm1.waitForState(nm1, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    Assert.assertTrue(rm1.waitForState(nm3, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am3.getApplicationAttemptId(), containerId, rm1,
-        "h3");
-    
-    // try to allocate container (request label = z) on nm4 (label = y,z). 
-    // Will successfully allocate on nm4 only.
-    am3.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "z");
-    containerId = ContainerId.newContainerId(am3.getApplicationAttemptId(), 3L);
-    Assert.assertTrue(rm1.waitForState(nm4, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am3.getApplicationAttemptId(), containerId, rm1,
-        "h4");
-
-    rm1.close();
-  }
-
-  @Test (timeout = 120000)
-  public void testContainerAllocateWithLabels() throws Exception {
-    // set node -> label
-    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
-    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x"),
-        NodeId.newInstance("h2", 0), toSet("y")));
-
-    // inject node label manager
-    MockRM rm1 = new MockRM(getConfigurationWithQueueLabels(conf)) {
-      @Override
-      public RMNodeLabelsManager createNodeLabelManager() {
-        return mgr;
-      }
-    };
-
-    rm1.getRMContext().setNodeLabelManager(mgr);
-    rm1.start();
-    MockNM nm1 = rm1.registerNode("h1:1234", 8000); // label = x
-    MockNM nm2 = rm1.registerNode("h2:1234", 8000); // label = y
-    MockNM nm3 = rm1.registerNode("h3:1234", 8000); // label = <empty>
-    
-    ContainerId containerId;
-
-    // launch an app to queue a1 (label = x), and check task containers will
-    // be allocated in h1
-    RMApp app1 = rm1.submitApp(200, "app", "user", null, "a1");
-    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm3);
-
-    // request a container.
-    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "x");
-    containerId =
-        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2);
-    Assert.assertFalse(rm1.waitForState(nm2, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    Assert.assertTrue(rm1.waitForState(nm1, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am1.getApplicationAttemptId(), containerId, rm1,
-        "h1");
-
-    // launch an app to queue b1 (label = y), and check task containers will
-    // be allocated in h2
-    RMApp app2 = rm1.submitApp(200, "app", "user", null, "b1");
-    MockAM am2 = MockRM.launchAndRegisterAM(app2, rm1, nm3);
-
-    // request a container.
-    am2.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "y");
-    containerId = ContainerId.newContainerId(am2.getApplicationAttemptId(), 2);
-    Assert.assertFalse(rm1.waitForState(nm1, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    Assert.assertTrue(rm1.waitForState(nm2, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am2.getApplicationAttemptId(), containerId, rm1,
-        "h2");
-    
-    // launch an app to queue c1 (label = ""), and check task containers will
-    // be allocated in h3
-    RMApp app3 = rm1.submitApp(200, "app", "user", null, "c1");
-    MockAM am3 = MockRM.launchAndRegisterAM(app3, rm1, nm3);
-
-    // request a container.
-    am3.allocate("*", 1024, 1, new ArrayList<ContainerId>());
-    containerId = ContainerId.newContainerId(am3.getApplicationAttemptId(), 2);
-    Assert.assertFalse(rm1.waitForState(nm2, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    Assert.assertTrue(rm1.waitForState(nm3, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am3.getApplicationAttemptId(), containerId, rm1,
-        "h3");
-
-    rm1.close();
-  }
-  
-  @Test (timeout = 120000)
-  public void testContainerAllocateWithDefaultQueueLabels() throws Exception {
-    // This test is very similar to testContainerAllocateWithLabels. The
-    // difference is that it doesn't specify a label expression in the
-    // ResourceRequest; instead, it relies on the queue's default label expression
-
-    // set node -> label
-    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
-    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x"),
-        NodeId.newInstance("h2", 0), toSet("y")));
-
-    // inject node label manager
-    MockRM rm1 = new MockRM(TestUtils.getConfigurationWithDefaultQueueLabels(conf)) {
-      @Override
-      public RMNodeLabelsManager createNodeLabelManager() {
-        return mgr;
-      }
-    };
-
-    rm1.getRMContext().setNodeLabelManager(mgr);
-    rm1.start();
-    MockNM nm1 = rm1.registerNode("h1:1234", 8000); // label = x
-    MockNM nm2 = rm1.registerNode("h2:1234", 8000); // label = y
-    MockNM nm3 = rm1.registerNode("h3:1234", 8000); // label = <empty>
-    
-    ContainerId containerId;
-
-    // launch an app to queue a1 (label = x), and check all containers will
-    // be allocated in h1
-    RMApp app1 = rm1.submitApp(200, "app", "user", null, "a1");
-    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm1);
-
-    // request a container.
-    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>());
-    containerId =
-        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2);
-    Assert.assertFalse(rm1.waitForState(nm3, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    Assert.assertTrue(rm1.waitForState(nm1, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am1.getApplicationAttemptId(), containerId, rm1,
-        "h1");
-
-    // launch an app to queue b1 (label = y), and check all containers will
-    // be allocated in h2
-    RMApp app2 = rm1.submitApp(200, "app", "user", null, "b1");
-    MockAM am2 = MockRM.launchAndRegisterAM(app2, rm1, nm2);
-
-    // request a container.
-    am2.allocate("*", 1024, 1, new ArrayList<ContainerId>());
-    containerId = ContainerId.newContainerId(am2.getApplicationAttemptId(), 2);
-    Assert.assertFalse(rm1.waitForState(nm3, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    Assert.assertTrue(rm1.waitForState(nm2, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am2.getApplicationAttemptId(), containerId, rm1,
-        "h2");
-    
-    // launch an app to queue c1 (label = ""), and check all containers will
-    // be allocated in h3
-    RMApp app3 = rm1.submitApp(200, "app", "user", null, "c1");
-    MockAM am3 = MockRM.launchAndRegisterAM(app3, rm1, nm3);
-
-    // request a container.
-    am3.allocate("*", 1024, 1, new ArrayList<ContainerId>());
-    containerId = ContainerId.newContainerId(am3.getApplicationAttemptId(), 2);
-    Assert.assertFalse(rm1.waitForState(nm2, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    Assert.assertTrue(rm1.waitForState(nm3, containerId,
-        RMContainerState.ALLOCATED, 10 * 1000));
-    checkTaskContainersHost(am3.getApplicationAttemptId(), containerId, rm1,
-        "h3");
-
-    rm1.close();
-  }
 }
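
The tests removed above are moved, essentially verbatim, into the new TestNodeLabelContainerAllocation class added at the bottom of this patch. They all drive allocation through the MockAM.allocate(...) overload that takes a trailing node-label string; presumably that overload just builds an ordinary ResourceRequest and sets its label expression. A minimal sketch of the equivalent request, assuming only the public ResourceRequest API (nothing below is copied from the patch):

    import org.apache.hadoop.yarn.api.records.Priority;
    import org.apache.hadoop.yarn.api.records.Resource;
    import org.apache.hadoop.yarn.api.records.ResourceRequest;

    // Roughly what am.allocate("*", 1024, 1, releases, "y") asks for:
    ResourceRequest req = ResourceRequest.newInstance(
        Priority.newInstance(1),        // request priority
        ResourceRequest.ANY,            // "*" = any host
        Resource.newInstance(1024, 1),  // 1024 MB, 1 vcore
        1);                             // one container
    req.setNodeLabelExpression("y");    // only label "y" nodes may satisfy it

The MockNM/waitForState assertions in these tests then only check which node's heartbeat ends up satisfying that request.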

+ 74 - 74
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestLeafQueue.java

@@ -351,7 +351,7 @@ public class TestLeafQueue {
     
     // Only 1 container
     a.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource));
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(
         (int)(node_0.getTotalResource().getMemory() * a.getCapacity()) - (1*GB),
         a.getMetrics().getAvailableMB());
@@ -487,7 +487,7 @@ public class TestLeafQueue {
     
     // Only 1 container
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(1*GB, a.getUsedResources().getMemory());
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -498,7 +498,7 @@ public class TestLeafQueue {
     // Also 2nd -> minCapacity = 1024 since (.1 * 8G) < minAlloc, also
     // you can get one container more than user-limit
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -507,7 +507,7 @@ public class TestLeafQueue {
     
     // Can't allocate 3rd due to user-limit
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -517,7 +517,7 @@ public class TestLeafQueue {
     // Bump up user-limit-factor, now allocate should work
     a.setUserLimitFactor(10);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(3*GB, a.getUsedResources().getMemory());
     assertEquals(3*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -526,7 +526,7 @@ public class TestLeafQueue {
 
     // One more should work, for app_1, due to user-limit-factor
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(4*GB, a.getUsedResources().getMemory());
     assertEquals(3*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(1*GB, app_1.getCurrentConsumption().getMemory());
@@ -537,7 +537,7 @@ public class TestLeafQueue {
     // Now - no more allocs since we are at max-cap
     a.setMaxCapacity(0.5f);
     a.assignContainers(clusterResource, node_0, new ResourceLimits(
-        clusterResource));
+        clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(4*GB, a.getUsedResources().getMemory());
     assertEquals(3*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(1*GB, app_1.getCurrentConsumption().getMemory());
@@ -653,21 +653,21 @@ public class TestLeafQueue {
 
     // 1 container to user_0
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
 
     // Again one to user_0 since he hasn't exceeded user limit yet
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(3*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(1*GB, app_1.getCurrentConsumption().getMemory());
 
     // One more to user_0 since he is the only active user
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(4*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(2*GB, app_1.getCurrentConsumption().getMemory());
@@ -719,10 +719,10 @@ public class TestLeafQueue {
         1, qb.getActiveUsersManager().getNumActiveUsers());
     //get headroom
     qb.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     qb.computeUserLimitAndSetHeadroom(app_0, clusterResource, app_0
         .getResourceRequest(u0Priority, ResourceRequest.ANY).getCapability(),
-        null);
+        "", SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
 
     //maxqueue 16G, userlimit 13G, - 4G used = 9G
     assertEquals(9*GB,app_0.getHeadroom().getMemory());
@@ -739,10 +739,10 @@ public class TestLeafQueue {
             u1Priority, recordFactory)));
     qb.submitApplicationAttempt(app_2, user_1);
     qb.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     qb.computeUserLimitAndSetHeadroom(app_0, clusterResource, app_0
         .getResourceRequest(u0Priority, ResourceRequest.ANY).getCapability(),
-        null);
+        "", SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
 
     assertEquals(8*GB, qb.getUsedResources().getMemory());
     assertEquals(4*GB, app_0.getCurrentConsumption().getMemory());
@@ -782,12 +782,12 @@ public class TestLeafQueue {
     qb.submitApplicationAttempt(app_1, user_0);
     qb.submitApplicationAttempt(app_3, user_1);
     qb.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     qb.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     qb.computeUserLimitAndSetHeadroom(app_3, clusterResource, app_3
         .getResourceRequest(u1Priority, ResourceRequest.ANY).getCapability(),
-        null);
+        "", SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(4*GB, qb.getUsedResources().getMemory());
     //maxqueue 16G, userlimit 7G, used (by each user) 2G, headroom 5G (both)
     assertEquals(5*GB, app_3.getHeadroom().getMemory());
@@ -803,13 +803,13 @@ public class TestLeafQueue {
               TestUtils.createResourceRequest(ResourceRequest.ANY, 6*GB, 1, true,
                       u0Priority, recordFactory)));
     qb.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     qb.computeUserLimitAndSetHeadroom(app_4, clusterResource, app_4
         .getResourceRequest(u0Priority, ResourceRequest.ANY).getCapability(),
-        null);
+        "", SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     qb.computeUserLimitAndSetHeadroom(app_3, clusterResource, app_3
         .getResourceRequest(u1Priority, ResourceRequest.ANY).getCapability(),
-        null);
+        "", SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     
     
     //app3 is user1, active from last test case
@@ -876,7 +876,7 @@ public class TestLeafQueue {
                 priority, recordFactory)));
 
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(1*GB, a.getUsedResources().getMemory());
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -893,7 +893,7 @@ public class TestLeafQueue {
             priority, recordFactory)));
 
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(1*GB, app_1.getCurrentConsumption().getMemory());
@@ -982,7 +982,7 @@ public class TestLeafQueue {
 
     // 1 container to user_0
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -993,7 +993,7 @@ public class TestLeafQueue {
 
     // Again one to user_0 since he hasn't exceeded user limit yet
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(3*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(1*GB, app_1.getCurrentConsumption().getMemory());
@@ -1010,7 +1010,7 @@ public class TestLeafQueue {
     // No more to user_0 since he is already over user-limit
     // and no more containers to queue since it's already at max-cap
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(3*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(1*GB, app_1.getCurrentConsumption().getMemory());
@@ -1024,7 +1024,7 @@ public class TestLeafQueue {
             priority, recordFactory)));
     assertEquals(1, a.getActiveUsersManager().getNumActiveUsers());
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(0*GB, app_2.getHeadroom().getMemory());   // hit queue max-cap 
   }
 
@@ -1095,7 +1095,7 @@ public class TestLeafQueue {
     
     // Only 1 container
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(1*GB, a.getUsedResources().getMemory());
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1103,7 +1103,7 @@ public class TestLeafQueue {
     // Also 2nd -> minCapacity = 1024 since (.1 * 8G) < minAlloc, also
     // you can get one container more than user-limit
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1111,7 +1111,7 @@ public class TestLeafQueue {
     // Can't allocate 3rd due to user-limit
     a.setUserLimit(25);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1130,7 +1130,7 @@ public class TestLeafQueue {
     // user_0 is at limit in spite of high user-limit-factor
     a.setUserLimitFactor(10);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1140,7 +1140,7 @@ public class TestLeafQueue {
     // Now allocations should go to app_0 since
     // user_0 is at user-limit, not above it
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(6*GB, a.getUsedResources().getMemory());
     assertEquals(3*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1151,7 +1151,7 @@ public class TestLeafQueue {
     // Now - no more allocs since we are at max-cap
     a.setMaxCapacity(0.5f);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(6*GB, a.getUsedResources().getMemory());
     assertEquals(3*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1163,7 +1163,7 @@ public class TestLeafQueue {
     a.setMaxCapacity(1.0f);
     a.setUserLimitFactor(1);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(7*GB, a.getUsedResources().getMemory()); 
     assertEquals(3*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1172,7 +1172,7 @@ public class TestLeafQueue {
 
     // Now we should assign to app_3 again since user_2 is under user-limit
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8*GB, a.getUsedResources().getMemory()); 
     assertEquals(3*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1272,7 +1272,7 @@ public class TestLeafQueue {
     
     // Only 1 container
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(1*GB, a.getUsedResources().getMemory());
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1283,7 +1283,7 @@ public class TestLeafQueue {
     // Also 2nd -> minCapacity = 1024 since (.1 * 8G) < minAlloc, also
     // you can get one container more than user-limit
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1292,7 +1292,7 @@ public class TestLeafQueue {
     
     // Now, reservation should kick in for app_1
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(6*GB, a.getUsedResources().getMemory()); 
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1309,7 +1309,7 @@ public class TestLeafQueue {
             ContainerExitStatus.KILLED_BY_RESOURCEMANAGER),
         RMContainerEventType.KILL, null, true);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5*GB, a.getUsedResources().getMemory()); 
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1326,7 +1326,7 @@ public class TestLeafQueue {
             ContainerExitStatus.KILLED_BY_RESOURCEMANAGER),
         RMContainerEventType.KILL, null, true);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(4*GB, a.getUsedResources().getMemory());
     assertEquals(0*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(4*GB, app_1.getCurrentConsumption().getMemory());
@@ -1394,7 +1394,7 @@ public class TestLeafQueue {
     // Start testing...
 
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1404,7 +1404,7 @@ public class TestLeafQueue {
 
     // Now, reservation should kick in for app_1
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(6*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1418,7 +1418,7 @@ public class TestLeafQueue {
     doReturn(-1).when(a).getNodeLocalityDelay();
     
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(10*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(4*GB, app_1.getCurrentConsumption().getMemory());
@@ -1435,7 +1435,7 @@ public class TestLeafQueue {
             ContainerExitStatus.KILLED_BY_RESOURCEMANAGER),
         RMContainerEventType.KILL, null, true);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8*GB, a.getUsedResources().getMemory());
     assertEquals(0*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(8*GB, app_1.getCurrentConsumption().getMemory());
@@ -1504,7 +1504,7 @@ public class TestLeafQueue {
     
     // Only 1 container
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(1*GB, a.getUsedResources().getMemory());
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1512,14 +1512,14 @@ public class TestLeafQueue {
     // Also 2nd -> minCapacity = 1024 since (.1 * 8G) < minAlloc, also
     // you can get one container more than user-limit
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2*GB, a.getUsedResources().getMemory());
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
     
     // Now, reservation should kick in for app_1
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(6*GB, a.getUsedResources().getMemory()); 
     assertEquals(2*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1534,7 +1534,7 @@ public class TestLeafQueue {
             ContainerExitStatus.KILLED_BY_RESOURCEMANAGER),
         RMContainerEventType.KILL, null, true);
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5*GB, a.getUsedResources().getMemory()); 
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1544,7 +1544,7 @@ public class TestLeafQueue {
 
     // Re-reserve
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5*GB, a.getUsedResources().getMemory()); 
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0*GB, app_1.getCurrentConsumption().getMemory());
@@ -1554,7 +1554,7 @@ public class TestLeafQueue {
     
     // Try to schedule on node_1 now, should *move* the reservation
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(9*GB, a.getUsedResources().getMemory()); 
     assertEquals(1*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(4*GB, app_1.getCurrentConsumption().getMemory());
@@ -1572,7 +1572,7 @@ public class TestLeafQueue {
             ContainerExitStatus.KILLED_BY_RESOURCEMANAGER),
         RMContainerEventType.KILL, null, true);
     CSAssignment assignment = a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8*GB, a.getUsedResources().getMemory());
     assertEquals(0*GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(4*GB, app_1.getCurrentConsumption().getMemory());
@@ -1644,7 +1644,7 @@ public class TestLeafQueue {
     
     // Start with off switch, shouldn't allocate due to delay scheduling
     assignment = a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_2), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(1, app_0.getSchedulingOpportunities(priority));
@@ -1653,7 +1653,7 @@ public class TestLeafQueue {
 
     // Another off switch, shouldn't allocate due to delay scheduling
     assignment = a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_2), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(2, app_0.getSchedulingOpportunities(priority));
@@ -1662,7 +1662,7 @@ public class TestLeafQueue {
     
     // Another off switch, shouldn't allocate due to delay scheduling
     assignment = a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_2), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(3, app_0.getSchedulingOpportunities(priority));
@@ -1672,7 +1672,7 @@ public class TestLeafQueue {
     // Another off switch, now we should allocate 
     // since missedOpportunities=3 and reqdContainers=3
     assignment = a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.OFF_SWITCH), eq(node_2), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(4, app_0.getSchedulingOpportunities(priority)); // should NOT reset
@@ -1681,7 +1681,7 @@ public class TestLeafQueue {
     
     // NODE_LOCAL - node_0
     assignment = a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.NODE_LOCAL), eq(node_0), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should reset
@@ -1690,7 +1690,7 @@ public class TestLeafQueue {
     
     // NODE_LOCAL - node_1
     assignment = a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.NODE_LOCAL), eq(node_1), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should reset
@@ -1719,14 +1719,14 @@ public class TestLeafQueue {
     
     // Shouldn't assign RACK_LOCAL yet
     assignment = a.assignContainers(clusterResource, node_3,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(1, app_0.getSchedulingOpportunities(priority));
     assertEquals(2, app_0.getTotalRequiredResources(priority));
     assertEquals(NodeType.NODE_LOCAL, assignment.getType()); // None->NODE_LOCAL
 
     // Should assign RACK_LOCAL now
     assignment = a.assignContainers(clusterResource, node_3,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.RACK_LOCAL), eq(node_3), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should reset
@@ -1808,7 +1808,7 @@ public class TestLeafQueue {
     // Start with off switch, shouldn't allocate P1 due to delay scheduling
     // thus, no P2 either!
     a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_2), 
         eq(priority_1), any(ResourceRequest.class), any(Container.class));
     assertEquals(1, app_0.getSchedulingOpportunities(priority_1));
@@ -1821,7 +1821,7 @@ public class TestLeafQueue {
     // Another off-switch, shouldn't allocate P1 due to delay scheduling
     // thus, no P2 either!
     a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_2), 
         eq(priority_1), any(ResourceRequest.class), any(Container.class));
     assertEquals(2, app_0.getSchedulingOpportunities(priority_1));
@@ -1833,7 +1833,7 @@ public class TestLeafQueue {
 
     // Another off-switch, shouldn't allocate OFF_SWITCH P1
     a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.OFF_SWITCH), eq(node_2), 
         eq(priority_1), any(ResourceRequest.class), any(Container.class));
     assertEquals(3, app_0.getSchedulingOpportunities(priority_1));
@@ -1845,7 +1845,7 @@ public class TestLeafQueue {
 
     // Now, DATA_LOCAL for P1
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.NODE_LOCAL), eq(node_0), 
         eq(priority_1), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority_1));
@@ -1857,7 +1857,7 @@ public class TestLeafQueue {
 
     // Now, OFF_SWITCH for P2
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_1), 
         eq(priority_1), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority_1));
@@ -1934,7 +1934,7 @@ public class TestLeafQueue {
     
     // NODE_LOCAL - node_0_1
     a.assignContainers(clusterResource, node_0_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.NODE_LOCAL), eq(node_0_0), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should reset
@@ -1943,7 +1943,7 @@ public class TestLeafQueue {
     // No allocation on node_1_0 even though it's node/rack local since
     // required(ANY) == 0
     a.assignContainers(clusterResource, node_1_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_1_0), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // Still zero
@@ -1960,7 +1960,7 @@ public class TestLeafQueue {
     // No allocation on node_0_1 even though it's node/rack local since
     // required(rack_1) == 0
     a.assignContainers(clusterResource, node_0_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_1_0), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(1, app_0.getSchedulingOpportunities(priority)); 
@@ -1968,7 +1968,7 @@ public class TestLeafQueue {
     
     // NODE_LOCAL - node_1
     a.assignContainers(clusterResource, node_1_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.NODE_LOCAL), eq(node_1_0), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should reset
@@ -2221,7 +2221,7 @@ public class TestLeafQueue {
     // node_0_1  
     // Shouldn't allocate since RR(rack_0) = null && RR(ANY) = relax: false
     a.assignContainers(clusterResource, node_0_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_0_1), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should be 0
@@ -2244,7 +2244,7 @@ public class TestLeafQueue {
     // node_1_1  
     // Shouldn't allocate since RR(rack_1) = relax: false
     a.assignContainers(clusterResource, node_1_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_0_1), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should be 0
@@ -2275,7 +2275,7 @@ public class TestLeafQueue {
     // node_1_1  
     // Shouldn't allocate since node_1_1 is blacklisted
     a.assignContainers(clusterResource, node_1_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_1_1), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should be 0
@@ -2304,7 +2304,7 @@ public class TestLeafQueue {
     // node_1_1  
     // Shouldn't allocate since rack_1 is blacklisted
     a.assignContainers(clusterResource, node_1_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0, never()).allocate(any(NodeType.class), eq(node_1_1), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); // should be 0
@@ -2331,7 +2331,7 @@ public class TestLeafQueue {
 
     // Now, should allocate since RR(rack_1) = relax: true
     a.assignContainers(clusterResource, node_1_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0,never()).allocate(eq(NodeType.RACK_LOCAL), eq(node_1_1), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); 
@@ -2362,7 +2362,7 @@ public class TestLeafQueue {
     // host_1_1: 7G
 
     a.assignContainers(clusterResource, node_1_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verify(app_0).allocate(eq(NodeType.NODE_LOCAL), eq(node_1_0), 
         any(Priority.class), any(ResourceRequest.class), any(Container.class));
     assertEquals(0, app_0.getSchedulingOpportunities(priority)); 
@@ -2445,7 +2445,7 @@ public class TestLeafQueue {
 
     try {
       a.assignContainers(clusterResource, node_0, 
-          new ResourceLimits(clusterResource));
+          new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     } catch (NullPointerException e) {
       Assert.fail("NPE when allocating container on node but "
           + "forget to set off-switch request should be handled");

+ 1027 - 0
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestNodeLabelContainerAllocation.java

@@ -0,0 +1,1027 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.hadoop.yarn.server.resourcemanager.scheduler.capacity;
+
+import java.util.ArrayList;
+import java.util.Arrays;
+import java.util.HashSet;
+import java.util.Set;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.yarn.api.records.ApplicationAttemptId;
+import org.apache.hadoop.yarn.api.records.ContainerId;
+import org.apache.hadoop.yarn.api.records.NodeId;
+import org.apache.hadoop.yarn.api.records.NodeLabel;
+import org.apache.hadoop.yarn.api.records.Priority;
+import org.apache.hadoop.yarn.api.records.ResourceRequest;
+import org.apache.hadoop.yarn.conf.YarnConfiguration;
+import org.apache.hadoop.yarn.server.resourcemanager.MockAM;
+import org.apache.hadoop.yarn.server.resourcemanager.MockNM;
+import org.apache.hadoop.yarn.server.resourcemanager.MockRM;
+import org.apache.hadoop.yarn.server.resourcemanager.ResourceManager;
+import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.NullRMNodeLabelsManager;
+import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
+import org.apache.hadoop.yarn.server.resourcemanager.rmapp.RMApp;
+import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainer;
+import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainerState;
+import org.apache.hadoop.yarn.server.resourcemanager.rmnode.RMNode;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceScheduler;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.SchedulerAppReport;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.SchedulerNode;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.YarnScheduler;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.common.fica.FiCaSchedulerApp;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.event.NodeUpdateSchedulerEvent;
+import org.junit.Assert;
+import org.junit.Before;
+import org.junit.Test;
+
+import com.google.common.collect.ImmutableMap;
+import com.google.common.collect.ImmutableSet;
+import com.google.common.collect.Sets;
+
+public class TestNodeLabelContainerAllocation {
+  private final int GB = 1024;
+
+  private YarnConfiguration conf;
+  
+  RMNodeLabelsManager mgr;
+
+  @Before
+  public void setUp() throws Exception {
+    conf = new YarnConfiguration();
+    conf.setClass(YarnConfiguration.RM_SCHEDULER, CapacityScheduler.class,
+      ResourceScheduler.class);
+    mgr = new NullRMNodeLabelsManager();
+    mgr.init(conf);
+  }
+  
+  private Configuration getConfigurationWithQueueLabels(Configuration config) {
+    CapacitySchedulerConfiguration conf =
+        new CapacitySchedulerConfiguration(config);
+    
+    // Define top-level queues
+    conf.setQueues(CapacitySchedulerConfiguration.ROOT, new String[] {"a", "b", "c"});
+    conf.setCapacityByLabel(CapacitySchedulerConfiguration.ROOT, "x", 100);
+    conf.setCapacityByLabel(CapacitySchedulerConfiguration.ROOT, "y", 100);
+
+    final String A = CapacitySchedulerConfiguration.ROOT + ".a";
+    conf.setCapacity(A, 10);
+    conf.setMaximumCapacity(A, 15);
+    conf.setAccessibleNodeLabels(A, toSet("x"));
+    conf.setCapacityByLabel(A, "x", 100);
+    
+    final String B = CapacitySchedulerConfiguration.ROOT + ".b";
+    conf.setCapacity(B, 20);
+    conf.setAccessibleNodeLabels(B, toSet("y"));
+    conf.setCapacityByLabel(B, "y", 100);
+    
+    final String C = CapacitySchedulerConfiguration.ROOT + ".c";
+    conf.setCapacity(C, 70);
+    conf.setMaximumCapacity(C, 70);
+    conf.setAccessibleNodeLabels(C, RMNodeLabelsManager.EMPTY_STRING_SET);
+    
+    // Define 2nd-level queues
+    final String A1 = A + ".a1";
+    conf.setQueues(A, new String[] {"a1"});
+    conf.setCapacity(A1, 100);
+    conf.setMaximumCapacity(A1, 100);
+    conf.setCapacityByLabel(A1, "x", 100);
+    
+    final String B1 = B + ".b1";
+    conf.setQueues(B, new String[] {"b1"});
+    conf.setCapacity(B1, 100);
+    conf.setMaximumCapacity(B1, 100);
+    conf.setCapacityByLabel(B1, "y", 100);
+
+    final String C1 = C + ".c1";
+    conf.setQueues(C, new String[] {"c1"});
+    conf.setCapacity(C1, 100);
+    conf.setMaximumCapacity(C1, 100);
+    
+    return conf;
+  }
+  
+  private void checkTaskContainersHost(ApplicationAttemptId attemptId,
+      ContainerId containerId, ResourceManager rm, String host) {
+    YarnScheduler scheduler = rm.getRMContext().getScheduler();
+    SchedulerAppReport appReport = scheduler.getSchedulerAppInfo(attemptId);
+
+    Assert.assertTrue(appReport.getLiveContainers().size() > 0);
+    for (RMContainer c : appReport.getLiveContainers()) {
+      if (c.getContainerId().equals(containerId)) {
+        Assert.assertEquals(host, c.getAllocatedNode().getHost());
+      }
+    }
+  }
+  
+  @SuppressWarnings("unchecked")
+  private <E> Set<E> toSet(E... elements) {
+    Set<E> set = Sets.newHashSet(elements);
+    return set;
+  }
+  
+  
+  @Test (timeout = 300000)
+  public void testContainerAllocationWithSingleUserLimits() throws Exception {
+    final RMNodeLabelsManager mgr = new NullRMNodeLabelsManager();
+    mgr.init(conf);
+
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x"),
+        NodeId.newInstance("h2", 0), toSet("y")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(TestUtils.getConfigurationWithDefaultQueueLabels(conf)) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 8000); // label = x
+    rm1.registerNode("h2:1234", 8000); // label = y
+    MockNM nm3 = rm1.registerNode("h3:1234", 8000); // label = <empty>
+
+    // launch an app to queue a1 (label = x); its AM container will be
+    // allocated in h1
+    RMApp app1 = rm1.submitApp(200, "app", "user", null, "a1");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm1);
+    
+    // A has only 10% of the default partition, so it can only allocate one container in label=empty
+    ContainerId containerId =
+        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2);
+    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "");
+    Assert.assertTrue(rm1.waitForState(nm3, containerId,
+          RMContainerState.ALLOCATED, 10 * 1000));
+    // Cannot allocate 2nd label=empty container
+    containerId =
+        ContainerId.newContainerId(am1.getApplicationAttemptId(), 3);
+    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "");
+    Assert.assertFalse(rm1.waitForState(nm3, containerId,
+          RMContainerState.ALLOCATED, 10 * 1000));
+
+    // A has default user limit = 100, so it can use all resources in label = x.
+    // We can allocate floor(8000 / 1024) = 7 containers on h1 in total
+    // (the AM plus the 6 requested below)
+    for (int id = 3; id <= 8; id++) {
+      containerId =
+          ContainerId.newContainerId(am1.getApplicationAttemptId(), id);
+      am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "x");
+      Assert.assertTrue(rm1.waitForState(nm1, containerId,
+          RMContainerState.ALLOCATED, 10 * 1000));
+    }
+    rm1.close();
+  }
+  
+  @Test(timeout = 300000)
+  public void testContainerAllocateWithComplexLabels() throws Exception {
+    /*
+     * Queue structure:
+     *                      root (*)
+     *                  ________________
+     *                 /                \
+     *               a x(100%), y(50%)   b y(50%), z(100%)
+     *               ________________    ______________
+     *              /                   /              \
+     *             a1 (x,y)         b1(no)              b2(y,z)
+     *               100%                          y = 100%, z = 100%
+     *                           
+     * Node structure:
+     * h1 : x
+     * h2 : y
+     * h3 : y
+     * h4 : z
+     * h5 : NO
+     * 
+     * Total resource:
+     * x: 4G
+     * y: 6G
+     * z: 2G
+     * *: 2G
+     * 
+     * Resource of
+     * a1: x=2G, y=2G, NO=0.2G
+     * b1: NO=0.9G (max=1G)
+     * b2: y=2G, z=2G, NO=0.9G (max=1G)
+     * 
+     * Each node can only allocate two containers
+     */
+
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y", "z"));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0),
+        toSet("x"), NodeId.newInstance("h2", 0), toSet("y"),
+        NodeId.newInstance("h3", 0), toSet("y"), NodeId.newInstance("h4", 0),
+        toSet("z"), NodeId.newInstance("h5", 0),
+        RMNodeLabelsManager.EMPTY_STRING_SET));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(TestUtils.getComplexConfigurationWithQueueLabels(conf)) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 2048);
+    MockNM nm2 = rm1.registerNode("h2:1234", 2048);
+    MockNM nm3 = rm1.registerNode("h3:1234", 2048);
+    MockNM nm4 = rm1.registerNode("h4:1234", 2048);
+    MockNM nm5 = rm1.registerNode("h5:1234", 2048);
+    
+    ContainerId containerId;
+
+    // launch an app to queue a1 (label = x); its AM container will be
+    // allocated in h1
+    RMApp app1 = rm1.submitApp(1024, "app", "user", null, "a1");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm1);
+
+    // request a container (label = y). Can be allocated on nm2.
+    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "y");
+    containerId =
+        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2L);
+    Assert.assertTrue(rm1.waitForState(nm2, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am1.getApplicationAttemptId(), containerId, rm1,
+        "h2");
+
+    // launch an app to queue b1 (label = y), and check all containers will
+    // be allocated in h5
+    RMApp app2 = rm1.submitApp(1024, "app", "user", null, "b1");
+    MockAM am2 = MockRM.launchAndRegisterAM(app2, rm1, nm5);
+
+    // request one more container: the AM container has already used up b1's
+    // queue capacity, so this request cannot be allocated
+    // (maximum capacity reached)
+    am2.allocate("*", 1024, 1, new ArrayList<ContainerId>());
+    containerId = ContainerId.newContainerId(am2.getApplicationAttemptId(), 2);
+    Assert.assertFalse(rm1.waitForState(nm4, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    Assert.assertFalse(rm1.waitForState(nm5, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    
+    // launch an app to queue b2
+    RMApp app3 = rm1.submitApp(1024, "app", "user", null, "b2");
+    MockAM am3 = MockRM.launchAndRegisterAM(app3, rm1, nm5);
+
+    // request a container. Try to allocate on nm1 (label = x) and nm3 (label =
+    // y). Will successfully allocate on nm3
+    am3.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "y");
+    containerId = ContainerId.newContainerId(am3.getApplicationAttemptId(), 2);
+    Assert.assertFalse(rm1.waitForState(nm1, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    Assert.assertTrue(rm1.waitForState(nm3, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am3.getApplicationAttemptId(), containerId, rm1,
+        "h3");
+    
+    // try to allocate a container (request label = z) on nm4 (label = z).
+    // Will successfully allocate on nm4 only.
+    am3.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "z");
+    containerId = ContainerId.newContainerId(am3.getApplicationAttemptId(), 3L);
+    Assert.assertTrue(rm1.waitForState(nm4, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am3.getApplicationAttemptId(), containerId, rm1,
+        "h4");
+
+    rm1.close();
+  }
+
+  @Test (timeout = 120000)
+  public void testContainerAllocateWithLabels() throws Exception {
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x"),
+        NodeId.newInstance("h2", 0), toSet("y")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(getConfigurationWithQueueLabels(conf)) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 8000); // label = x
+    MockNM nm2 = rm1.registerNode("h2:1234", 8000); // label = y
+    MockNM nm3 = rm1.registerNode("h3:1234", 8000); // label = <empty>
+    
+    ContainerId containerId;
+
+    // launch an app to queue a1 (label = x), and check task containers will
+    // be allocated in h1
+    RMApp app1 = rm1.submitApp(200, "app", "user", null, "a1");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm3);
+
+    // request a container.
+    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "x");
+    containerId =
+        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2);
+    Assert.assertFalse(rm1.waitForState(nm2, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    Assert.assertTrue(rm1.waitForState(nm1, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am1.getApplicationAttemptId(), containerId, rm1,
+        "h1");
+
+    // launch an app to queue b1 (label = y), and check task containers will
+    // be allocated in h2
+    RMApp app2 = rm1.submitApp(200, "app", "user", null, "b1");
+    MockAM am2 = MockRM.launchAndRegisterAM(app2, rm1, nm3);
+
+    // request a container.
+    am2.allocate("*", 1024, 1, new ArrayList<ContainerId>(), "y");
+    containerId = ContainerId.newContainerId(am2.getApplicationAttemptId(), 2);
+    Assert.assertFalse(rm1.waitForState(nm1, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    Assert.assertTrue(rm1.waitForState(nm2, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am2.getApplicationAttemptId(), containerId, rm1,
+        "h2");
+    
+    // launch an app in queue c1 (label = ""), and check that all containers
+    // are allocated on h3
+    RMApp app3 = rm1.submitApp(200, "app", "user", null, "c1");
+    MockAM am3 = MockRM.launchAndRegisterAM(app3, rm1, nm3);
+
+    // request a container.
+    am3.allocate("*", 1024, 1, new ArrayList<ContainerId>());
+    containerId = ContainerId.newContainerId(am3.getApplicationAttemptId(), 2);
+    Assert.assertFalse(rm1.waitForState(nm2, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    Assert.assertTrue(rm1.waitForState(nm3, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am3.getApplicationAttemptId(), containerId, rm1,
+        "h3");
+
+    rm1.close();
+  }
+  
+  @Test (timeout = 120000)
+  public void testContainerAllocateWithDefaultQueueLabels() throws Exception {
+    // This test is similar to testContainerAllocateWithLabels. The difference
+    // is that it doesn't specify a label expression in the ResourceRequest;
+    // instead it relies on the queue's default label expression
+
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x"),
+        NodeId.newInstance("h2", 0), toSet("y")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(TestUtils.getConfigurationWithDefaultQueueLabels(conf)) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 8000); // label = x
+    MockNM nm2 = rm1.registerNode("h2:1234", 8000); // label = y
+    MockNM nm3 = rm1.registerNode("h3:1234", 8000); // label = <empty>
+    
+    ContainerId containerId;
+
+    // launch an app in queue a1 (label = x), and check that all containers
+    // are allocated on h1
+    RMApp app1 = rm1.submitApp(200, "app", "user", null, "a1");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm1);
+
+    // request a container.
+    am1.allocate("*", 1024, 1, new ArrayList<ContainerId>());
+    containerId =
+        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2);
+    Assert.assertFalse(rm1.waitForState(nm3, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    Assert.assertTrue(rm1.waitForState(nm1, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am1.getApplicationAttemptId(), containerId, rm1,
+        "h1");
+
+    // launch an app in queue b1 (label = y), and check that all containers
+    // are allocated on h2
+    RMApp app2 = rm1.submitApp(200, "app", "user", null, "b1");
+    MockAM am2 = MockRM.launchAndRegisterAM(app2, rm1, nm2);
+
+    // request a container.
+    am2.allocate("*", 1024, 1, new ArrayList<ContainerId>());
+    containerId = ContainerId.newContainerId(am2.getApplicationAttemptId(), 2);
+    Assert.assertFalse(rm1.waitForState(nm3, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    Assert.assertTrue(rm1.waitForState(nm2, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am2.getApplicationAttemptId(), containerId, rm1,
+        "h2");
+    
+    // launch an app in queue c1 (label = ""), and check that all containers
+    // are allocated on h3
+    RMApp app3 = rm1.submitApp(200, "app", "user", null, "c1");
+    MockAM am3 = MockRM.launchAndRegisterAM(app3, rm1, nm3);
+
+    // request a container.
+    am3.allocate("*", 1024, 1, new ArrayList<ContainerId>());
+    containerId = ContainerId.newContainerId(am3.getApplicationAttemptId(), 2);
+    Assert.assertFalse(rm1.waitForState(nm2, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    Assert.assertTrue(rm1.waitForState(nm3, containerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    checkTaskContainersHost(am3.getApplicationAttemptId(), containerId, rm1,
+        "h3");
+
+    rm1.close();
+  }
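
getConfigurationWithDefaultQueueLabels is a test helper whose body is not shown in this hunk. A sketch of the kind of configuration it plausibly builds, using the setDefaultNodeLabelExpression setter that appears later in this file (the queue path is illustrative; java.util.Collections assumed):

    // Sketch: queue a1 can access label x and defaults to it, so requests
    // that carry no label expression are treated as label=x requests.
    CapacitySchedulerConfiguration csConf =
        new CapacitySchedulerConfiguration(conf);
    String a1 = CapacitySchedulerConfiguration.ROOT + ".a.a1";
    csConf.setAccessibleNodeLabels(a1, Collections.singleton("x"));
    csConf.setCapacityByLabel(a1, "x", 100);
    csConf.setDefaultNodeLabelExpression(a1, "x");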
+  
+  private void checkPendingResource(MockRM rm, int priority,
+      ApplicationAttemptId attemptId, int memory) {
+    CapacityScheduler cs = (CapacityScheduler) rm.getRMContext().getScheduler();
+    FiCaSchedulerApp app = cs.getApplicationAttempt(attemptId);
+    ResourceRequest rr =
+        app.getAppSchedulingInfo().getResourceRequest(
+            Priority.newInstance(priority), "*");
+    Assert.assertEquals(memory,
+        rr.getCapability().getMemory() * rr.getNumContainers());
+  }
+  
+  private void checkLaunchedContainerNumOnNode(MockRM rm, NodeId nodeId,
+      int numContainers) {
+    CapacityScheduler cs = (CapacityScheduler) rm.getRMContext().getScheduler();
+    SchedulerNode node = cs.getSchedulerNode(nodeId);
+    Assert.assertEquals(numContainers, node.getNumContainers());
+  }
+  
+  @Test
+  public void testPreferenceOfNeedyAppsTowardsNodePartitions() throws Exception {
+    /**
+     * Test case: Submit two applications to a queue (app1 first, then app2);
+     * app1 asks for non-labeled containers and app2 asks for label=y
+     * containers. When node1 (which has label=y) heartbeats, app2 gets its
+     * allocation first, even though app2 was submitted later than app1
+     */
+    
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
+    // Make y a non-exclusive node label
+    mgr.updateNodeLabels(Arrays.asList(NodeLabel.newInstance("y", false)));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("y")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(TestUtils.getConfigurationWithQueueLabels(conf)) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 8 * GB); // label = y
+    MockNM nm2 = rm1.registerNode("h2:1234", 100 * GB); // label = <empty>
+
+    // launch an app in queue b1 (label = y); its AM container should be launched on nm2
+    RMApp app1 = rm1.submitApp(1 * GB, "app", "user", null, "b1");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm2);
+    
+    // launch another app in queue b1 (label = y); its AM container should also be launched on nm2
+    RMApp app2 = rm1.submitApp(1 * GB, "app", "user", null, "b1");
+    MockAM am2 = MockRM.launchAndRegisterAM(app2, rm1, nm2);
+
+    // request containers and let nm1 (which has label=y) heartbeat; app1
+    // requests non-labeled containers and app2 requests labeled containers,
+    // so app2 gets its allocation first even though app1 was submitted first.
+    am1.allocate("*", 1 * GB, 8, new ArrayList<ContainerId>());
+    am2.allocate("*", 1 * GB, 8, new ArrayList<ContainerId>(), "y");
+    
+    CapacityScheduler cs = (CapacityScheduler) rm1.getResourceScheduler();
+    RMNode rmNode1 = rm1.getRMContext().getRMNodes().get(nm1.getNodeId());
+    RMNode rmNode2 = rm1.getRMContext().getRMNodes().get(nm2.getNodeId());
+    
+    // Do node heartbeats many times
+    for (int i = 0; i < 50; i++) {
+      cs.handle(new NodeUpdateSchedulerEvent(rmNode1));
+      cs.handle(new NodeUpdateSchedulerEvent(rmNode2));
+    }
+    
+    // App2 gets preference on node1, and node1 ends up fully used by App2.
+    FiCaSchedulerApp schedulerApp1 = cs.getApplicationAttempt(am1.getApplicationAttemptId());
+    FiCaSchedulerApp schedulerApp2 = cs.getApplicationAttempt(am2.getApplicationAttemptId());
+    // app1 gets nothing on nm1 (partition=y)
+    checkNumOfContainersInAnAppOnGivenNode(0, nm1.getNodeId(), schedulerApp1);
+    checkNumOfContainersInAnAppOnGivenNode(9, nm2.getNodeId(), schedulerApp1);
+    // app2 gets all resources on nm1 (partition=y)
+    checkNumOfContainersInAnAppOnGivenNode(8, nm1.getNodeId(), schedulerApp2);
+    checkNumOfContainersInAnAppOnGivenNode(1, nm2.getNodeId(), schedulerApp2);
+    
+    rm1.close();
+  }
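
The RESPECT_PARTITION_EXCLUSIVITY constant used in the hunks below belongs to the SchedulingMode enum this commit introduces. Only that constant is visible in the diff; a minimal sketch of the enum, assuming the non-exclusive counterpart is named IGNORE_PARTITION_EXCLUSIVITY:

    // Sketch of SchedulingMode; any name other than
    // RESPECT_PARTITION_EXCLUSIVITY is an assumption.
    public enum SchedulingMode {
      // Allocate only requests whose label expression matches the node's
      // partition.
      RESPECT_PARTITION_EXCLUSIVITY,
      // Additionally let non-labeled requests borrow idle resources on
      // non-exclusive partitions.
      IGNORE_PARTITION_EXCLUSIVITY
    }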
+  
+  private void checkNumOfContainersInAnAppOnGivenNode(int expectedNum,
+      NodeId nodeId, FiCaSchedulerApp app) {
+    int num = 0;
+    for (RMContainer container : app.getLiveContainers()) {
+      if (container.getAllocatedNode().equals(nodeId)) {
+        num++;
+      }
+    }
+    Assert.assertEquals(expectedNum, num);
+  }
+  
+  @Test
+  public void
+      testPreferenceOfNeedyPrioritiesUnderSameAppTowardsNodePartitions()
+          throws Exception {
+    /**
+     * Test case: Submit one application that asks for label="" at priority=1
+     * and label="y" at priority=2. When a node with label=y heartbeats,
+     * priority=2 gets its allocation first, even if there is pending resource
+     * at priority=1
+     */
+    
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
+    // Make y a non-exclusive node label
+    mgr.updateNodeLabels(Arrays.asList(NodeLabel.newInstance("y", false)));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("y")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(TestUtils.getConfigurationWithQueueLabels(conf)) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 8 * GB); // label = y
+    MockNM nm2 = rm1.registerNode("h2:1234", 100 * GB); // label = <empty>
+    
+    ContainerId nextContainerId;
+
+    // launch an app in queue b1 (label = y); its AM container should be launched on nm2
+    RMApp app1 = rm1.submitApp(1 * GB, "app", "user", null, "b1");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm2);
+    
+    // request containers from am1: priority=1 asks for "" and priority=2
+    // asks for "y"; the "y" container should be allocated first
+    nextContainerId =
+        ContainerId.newContainerId(am1.getApplicationAttemptId(), 2);
+    am1.allocate("*", 1 * GB, 1, 1, new ArrayList<ContainerId>(), "");
+    am1.allocate("*", 1 * GB, 1, 2, new ArrayList<ContainerId>(), "y");
+    Assert.assertTrue(rm1.waitForState(nm1, nextContainerId,
+        RMContainerState.ALLOCATED, 10 * 1000));
+    
+    // Check pending resources for am1: priority=1 is not allocated before
+    // priority=2 has been allocated
+    checkPendingResource(rm1, 1, am1.getApplicationAttemptId(), 1 * GB);
+    checkPendingResource(rm1, 2, am1.getApplicationAttemptId(), 0 * GB);
+    
+    rm1.close();
+  }
+  
+  @Test
+  public void testNonLabeledResourceRequestGetPreferrenceToNonLabeledNode()
+      throws Exception {
+    /**
+     * Test case: Submit one application asking for 6 label="" containers.
+     * NM1 has label=x and NM2 has no label; NM1/NM2 heartbeat together. Even
+     * though NM1 has idle resources, all containers are allocated to NM2,
+     * since non-labeled requests should be allocated on non-labeled nodes
+     * first.
+     */
+    
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
+    // Make x a non-exclusive node label
+    mgr.updateNodeLabels(Arrays.asList(NodeLabel.newInstance("x", false)));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(TestUtils.getConfigurationWithQueueLabels(conf)) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 8 * GB); // label = y
+    MockNM nm2 = rm1.registerNode("h2:1234", 100 * GB); // label = <empty>
+    
+    ContainerId nextContainerId;
+
+    // launch an app in queue b1 (label = y); its AM container should be launched on nm2
+    RMApp app1 = rm1.submitApp(1 * GB, "app", "user", null, "b1");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm2);
+    
+    // request containers from am1: priority=1 asks for 6 "" containers
+    // (container ids 2 through 7). nm1/nm2 heartbeat at the same time; check
+    // that the containers are always allocated to nm2. This verifies that
+    // when there is resource available in the non-labeled partition,
+    // non-labeled requests are allocated to the non-labeled partition first.
+    am1.allocate("*", 1 * GB, 6, 1, new ArrayList<ContainerId>(), "");
+    for (int i = 2; i < 2 + 6; i++) {
+      nextContainerId =
+          ContainerId.newContainerId(am1.getApplicationAttemptId(), i);
+      Assert.assertTrue(rm1.waitForState(Arrays.asList(nm1, nm2),
+          nextContainerId, RMContainerState.ALLOCATED, 10 * 1000));
+    }
+    // no containers allocated on nm1
+    checkLaunchedContainerNumOnNode(rm1, nm1.getNodeId(), 0);
+    // all 7 containers (1 AM container + 6 task containers) allocated on nm2
+    checkLaunchedContainerNumOnNode(rm1, nm2.getNodeId(), 7);   
+    
+    rm1.close();
+  }
+
+  @Test
+  public void testPreferenceOfQueuesTowardsNodePartitions()
+      throws Exception {
+    /**
+     * Test case: given the following queue structure:
+     * 
+     * <pre>
+     *            root
+     *         /   |   \
+     *        a     b    c
+     *       / \   / \  /  \
+     *      a1 a2 b1 b2 c1 c2
+     *     (x)    (x)   (x)
+     * </pre>
+     * 
+     * Only a1, b1, c1 can access label=x, and their default label expression
+     * is x. Each of them has one application asking for 5 containers. NM1
+     * has label=x.
+     * 
+     * NM1 heartbeats 15 times; it should allocate all 15 label=x containers
+     */
+    
+    CapacitySchedulerConfiguration csConf =
+        new CapacitySchedulerConfiguration(this.conf);
+    
+    // Define top-level queues
+    csConf.setQueues(CapacitySchedulerConfiguration.ROOT, new String[] {"a", "b", "c"});
+    csConf.setCapacityByLabel(CapacitySchedulerConfiguration.ROOT, "x", 100);
+
+    final String A = CapacitySchedulerConfiguration.ROOT + ".a";
+    csConf.setCapacity(A, 33);
+    csConf.setAccessibleNodeLabels(A, toSet("x"));
+    csConf.setCapacityByLabel(A, "x", 33);
+    csConf.setQueues(A, new String[] {"a1", "a2"});
+    
+    final String B = CapacitySchedulerConfiguration.ROOT + ".b";
+    csConf.setCapacity(B, 33);
+    csConf.setAccessibleNodeLabels(B, toSet("x"));
+    csConf.setCapacityByLabel(B, "x", 33);
+    csConf.setQueues(B, new String[] {"b1", "b2"});
+    
+    final String C = CapacitySchedulerConfiguration.ROOT + ".c";
+    csConf.setCapacity(C, 34);
+    csConf.setAccessibleNodeLabels(C, toSet("x"));
+    csConf.setCapacityByLabel(C, "x", 34);
+    csConf.setQueues(C, new String[] {"c1", "c2"});
+    
+    // Define 2nd-level queues
+    final String A1 = A + ".a1";
+    csConf.setCapacity(A1, 50);
+    csConf.setCapacityByLabel(A1, "x", 100);
+    csConf.setDefaultNodeLabelExpression(A1, "x");
+    
+    final String A2 = A + ".a2";
+    csConf.setCapacity(A2, 50);
+    csConf.setCapacityByLabel(A2, "x", 0);
+    
+    final String B1 = B + ".b1";
+    csConf.setCapacity(B1, 50);
+    csConf.setCapacityByLabel(B1, "x", 100);
+    csConf.setDefaultNodeLabelExpression(B1, "x");
+    
+    final String B2 = B + ".b2";
+    csConf.setCapacity(B2, 50);
+    csConf.setCapacityByLabel(B2, "x", 0);
+    
+    final String C1 = C + ".c1";
+    csConf.setCapacity(C1, 50);
+    csConf.setCapacityByLabel(C1, "x", 100);
+    csConf.setDefaultNodeLabelExpression(C1, "x");
+    
+    final String C2 = C + ".c2";
+    csConf.setCapacity(C2, 50);
+    csConf.setCapacityByLabel(C2, "x", 0);
+    
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
+    // Make x a non-exclusive node label
+    mgr.updateNodeLabels(Arrays.asList(NodeLabel.newInstance("x", false)));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(csConf) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 20 * GB); // label = x
+    MockNM nm2 = rm1.registerNode("h2:1234", 100 * GB); // label = <empty>
+
+    // app1 -> a1
+    RMApp app1 = rm1.submitApp(1 * GB, "app", "user", null, "a1");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm1);
+    
+    // app2 -> a2
+    RMApp app2 = rm1.submitApp(1 * GB, "app", "user", null, "a2");
+    MockAM am2 = MockRM.launchAndRegisterAM(app2, rm1, nm2);
+    
+    // app3 -> b1
+    RMApp app3 = rm1.submitApp(1 * GB, "app", "user", null, "b1");
+    MockAM am3 = MockRM.launchAndRegisterAM(app3, rm1, nm1);
+    
+    // app4 -> b2
+    RMApp app4 = rm1.submitApp(1 * GB, "app", "user", null, "b2");
+    MockAM am4 = MockRM.launchAndRegisterAM(app4, rm1, nm2);
+    
+    // app5 -> c1
+    RMApp app5 = rm1.submitApp(1 * GB, "app", "user", null, "c1");
+    MockAM am5 = MockRM.launchAndRegisterAM(app5, rm1, nm1);
+    
+    // app6 -> c2
+    RMApp app6 = rm1.submitApp(1 * GB, "app", "user", null, "c2");
+    MockAM am6 = MockRM.launchAndRegisterAM(app6, rm1, nm2);
+    
+    // Each application requests 5 * 1GB containers
+    am1.allocate("*", 1 * GB, 5, new ArrayList<ContainerId>());
+    am2.allocate("*", 1 * GB, 5, new ArrayList<ContainerId>());
+    am3.allocate("*", 1 * GB, 5, new ArrayList<ContainerId>());
+    am4.allocate("*", 1 * GB, 5, new ArrayList<ContainerId>());
+    am5.allocate("*", 1 * GB, 5, new ArrayList<ContainerId>());
+    am6.allocate("*", 1 * GB, 5, new ArrayList<ContainerId>());
+    
+    // NM1 does 15 heartbeats
+    CapacityScheduler cs = (CapacityScheduler) rm1.getResourceScheduler();
+    RMNode rmNode1 = rm1.getRMContext().getRMNodes().get(nm1.getNodeId());
+    for (int i = 0; i < 15; i++) {
+      cs.handle(new NodeUpdateSchedulerEvent(rmNode1));
+    }
+    
+    // NM1 gets 15 new containers (18 in total: 15 task containers and 3 AM
+    // containers)
+    checkLaunchedContainerNumOnNode(rm1, nm1.getNodeId(), 18);
+
+    // Check pending resources for each application:
+    // APP1/APP3/APP5 are satisfied, while APP2/APP4/APP6 get nothing.
+    checkPendingResource(rm1, 1, am1.getApplicationAttemptId(), 0 * GB);
+    checkPendingResource(rm1, 1, am2.getApplicationAttemptId(), 5 * GB);
+    checkPendingResource(rm1, 1, am3.getApplicationAttemptId(), 0 * GB);
+    checkPendingResource(rm1, 1, am4.getApplicationAttemptId(), 5 * GB);
+    checkPendingResource(rm1, 1, am5.getApplicationAttemptId(), 0 * GB);
+    checkPendingResource(rm1, 1, am6.getApplicationAttemptId(), 5 * GB);
+
+    rm1.close();
+  }
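
The setCapacityByLabel/setMaximumCapacityByLabel setters used above write per-label entries into the capacity-scheduler configuration. A sketch of the underlying keys, assuming the standard accessible-node-labels property layout (shown for queue root.a and label x):

    // Sketch: the properties the label-aware setters plausibly write;
    // the exact key layout is an assumption.
    conf.set("yarn.scheduler.capacity.root.a.accessible-node-labels", "x");
    conf.set("yarn.scheduler.capacity.root.a."
        + "accessible-node-labels.x.capacity", "33");
    conf.set("yarn.scheduler.capacity.root.a."
        + "accessible-node-labels.x.maximum-capacity", "50");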
+  
+  @Test
+  public void testQueuesWithoutAccessUsingPartitionedNodes() throws Exception {
+    /**
+     * Test case: given the following queue structure:
+     * 
+     * <pre>
+     *            root
+     *         /      \
+     *        a        b
+     *        (x)
+     * </pre>
+     * 
+     * Only a can access label=x. Two nodes in the cluster: n1 has x and n2
+     * has no label.
+     * 
+     * With user-limit-factor=5, one application submitted to queue b that
+     * requests a large number of containers should be able to use up all
+     * cluster resources.
+     */
+    
+    CapacitySchedulerConfiguration csConf =
+        new CapacitySchedulerConfiguration(this.conf);
+    
+    // Define top-level queues
+    csConf.setQueues(CapacitySchedulerConfiguration.ROOT, new String[] {"a", "b"});
+    csConf.setCapacityByLabel(CapacitySchedulerConfiguration.ROOT, "x", 100);
+
+    final String A = CapacitySchedulerConfiguration.ROOT + ".a";
+    csConf.setCapacity(A, 50);
+    csConf.setAccessibleNodeLabels(A, toSet("x"));
+    csConf.setCapacityByLabel(A, "x", 100);
+    
+    final String B = CapacitySchedulerConfiguration.ROOT + ".b";
+    csConf.setCapacity(B, 50);
+    csConf.setAccessibleNodeLabels(B, new HashSet<String>());
+    csConf.setUserLimitFactor(B, 5);
+    
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x"));
+    // Make x a non-exclusive node label
+    mgr.updateNodeLabels(Arrays.asList(NodeLabel.newInstance("x", false)));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(csConf) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 10 * GB); // label = x
+    MockNM nm2 = rm1.registerNode("h2:1234", 10 * GB); // label = <empty>
+
+    // app1 -> b
+    RMApp app1 = rm1.submitApp(1 * GB, "app", "user", null, "b");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm2);
+    
+    // The application requests 50 * 1GB containers
+    am1.allocate("*", 1 * GB, 50, new ArrayList<ContainerId>());
+    
+    // NM1/NM2 do 50 heartbeats
+    CapacityScheduler cs = (CapacityScheduler) rm1.getResourceScheduler();
+    RMNode rmNode1 = rm1.getRMContext().getRMNodes().get(nm1.getNodeId());
+    RMNode rmNode2 = rm1.getRMContext().getRMNodes().get(nm2.getNodeId());
+    
+    SchedulerNode schedulerNode1 = cs.getSchedulerNode(nm1.getNodeId());
+    
+    // Number of cycles we wait before anything is allocated on the
+    // partitioned node (while resource is still available on the
+    // non-partitioned node)
+    int cycleWaited = 0;
+    for (int i = 0; i < 50; i++) {
+      cs.handle(new NodeUpdateSchedulerEvent(rmNode1));
+      cs.handle(new NodeUpdateSchedulerEvent(rmNode2));
+      if (schedulerNode1.getNumContainers() == 0) {
+        cycleWaited++;
+      }
+    }
+    // We wait 10 cycles before getting allocated on the partitioned node:
+    // NM2 can hold 10 containers in total; excluding the already-allocated AM
+    // container, 9 cycles fill up the non-partitioned node, and one more
+    // cycle passes before allocation falls back to the partitioned node
+    Assert.assertEquals(10, cycleWaited);
+    
+    // Both NM1/NM2 launched 10 containers, cluster resource is exhausted
+    checkLaunchedContainerNumOnNode(rm1, nm1.getNodeId(), 10);
+    checkLaunchedContainerNumOnNode(rm1, nm2.getNodeId(), 10);
+
+    rm1.close();
+  }
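
The expected value of 10 follows from arithmetic over the test's node sizes; a short sketch of the count, under the numbers used above:

    // Sketch: why cycleWaited == 10 for this test.
    int nm2CapacityGB = 10;   // h2 registered with 10 GB; containers are 1 GB
    int amContainers = 1;     // AM container already placed on nm2
    int cyclesFillingNm2 = nm2CapacityGB - amContainers;  // 9 cycles
    int expectedWait = cyclesFillingNm2 + 1;  // one more cycle before falling
                                              // back to the partitioned node
    assert expectedWait == 10;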
+  
+  @Test
+  public void testAMContainerAllocationWillAlwaysBeExclusive()
+      throws Exception {
+    /**
+     * Test case: Submit one application without a partition; trying to
+     * allocate on a node that has partition=x should fail, since AM
+     * containers always respect partition exclusivity
+     */
+    
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x", "y"));
+    // Make x a non-exclusive node label
+    mgr.updateNodeLabels(Arrays.asList(NodeLabel.newInstance("x", false)));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(TestUtils.getConfigurationWithQueueLabels(conf)) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 8 * GB); // label = x
+
+    // submit an app to queue b1 (label = y); its AM container should never
+    // be allocated, since the only node (nm1) has partition=x
+    rm1.submitApp(1 * GB, "app", "user", null, "b1");
+   
+    CapacityScheduler cs = (CapacityScheduler) rm1.getResourceScheduler();
+    RMNode rmNode1 = rm1.getRMContext().getRMNodes().get(nm1.getNodeId());
+    
+    // Heartbeat many times; app1 should get nothing
+    for (int i = 0; i < 50; i++) {
+      cs.handle(new NodeUpdateSchedulerEvent(rmNode1));
+    }
+    
+    Assert.assertEquals(0, cs.getSchedulerNode(nm1.getNodeId())
+        .getNumContainers());
+    
+    rm1.close();
+  }
+  
+  @Test
+  public void
+      testQueueMaxCapacitiesWillNotBeHonoredWhenNotRespectingExclusivity()
+          throws Exception {
+    /**
+     * Test case: given the following queue structure:
+     * 
+     * <pre>
+     *            root
+     *         /      \
+     *        a        b
+     *        (x)     (x)
+     * </pre>
+     * 
+     * Both a and b can access x, and both have max-capacity-on-x = 50
+     * 
+     * When doing non-exclusive allocation, an app in a (or b) can use 100%
+     * of the x resource.
+     */
+
+    CapacitySchedulerConfiguration csConf =
+        new CapacitySchedulerConfiguration(this.conf);
+
+    // Define top-level queues
+    csConf.setQueues(CapacitySchedulerConfiguration.ROOT, new String[] { "a",
+        "b" });
+    csConf.setCapacityByLabel(CapacitySchedulerConfiguration.ROOT, "x", 100);
+
+    final String A = CapacitySchedulerConfiguration.ROOT + ".a";
+    csConf.setCapacity(A, 50);
+    csConf.setAccessibleNodeLabels(A, toSet("x"));
+    csConf.setCapacityByLabel(A, "x", 50);
+    csConf.setMaximumCapacityByLabel(A, "x", 50);
+
+    final String B = CapacitySchedulerConfiguration.ROOT + ".b";
+    csConf.setCapacity(B, 50);
+    csConf.setAccessibleNodeLabels(B, toSet("x"));
+    csConf.setCapacityByLabel(B, "x", 50);
+    csConf.setMaximumCapacityByLabel(B, "x", 50);
+
+    // set node -> label
+    mgr.addToCluserNodeLabels(ImmutableSet.of("x"));
+    // Make x a non-exclusive node label
+    mgr.updateNodeLabels(Arrays.asList(NodeLabel.newInstance("x", false)));
+    mgr.addLabelsToNode(ImmutableMap.of(NodeId.newInstance("h1", 0), toSet("x")));
+
+    // inject node label manager
+    MockRM rm1 = new MockRM(csConf) {
+      @Override
+      public RMNodeLabelsManager createNodeLabelManager() {
+        return mgr;
+      }
+    };
+
+    rm1.getRMContext().setNodeLabelManager(mgr);
+    rm1.start();
+    MockNM nm1 = rm1.registerNode("h1:1234", 10 * GB); // label = x
+    MockNM nm2 = rm1.registerNode("h2:1234", 10 * GB); // label = <empty>
+
+    // app1 -> a
+    RMApp app1 = rm1.submitApp(1 * GB, "app", "user", null, "a");
+    MockAM am1 = MockRM.launchAndRegisterAM(app1, rm1, nm2);
+
+    // app1 asks for 10 non-labeled (partition="") containers
+    am1.allocate("*", 1 * GB, 10, new ArrayList<ContainerId>());
+
+    // NM1 does 50 heartbeats
+    CapacityScheduler cs = (CapacityScheduler) rm1.getResourceScheduler();
+    RMNode rmNode1 = rm1.getRMContext().getRMNodes().get(nm1.getNodeId());
+
+    SchedulerNode schedulerNode1 = cs.getSchedulerNode(nm1.getNodeId());
+
+    for (int i = 0; i < 50; i++) {
+      cs.handle(new NodeUpdateSchedulerEvent(rmNode1));
+    }
+    
+    // app1 gets all resources in partition=x
+    Assert.assertEquals(10, schedulerNode1.getNumContainers());
+
+    rm1.close();
+  }
+}

+ 69 - 42
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestParentQueue.java

@@ -23,7 +23,6 @@ import static org.junit.Assert.assertFalse;
 import static org.junit.Assert.assertTrue;
 import static org.junit.Assert.fail;
 import static org.mockito.Matchers.any;
-import static org.mockito.Matchers.anyBoolean;
 import static org.mockito.Matchers.eq;
 import static org.mockito.Mockito.doAnswer;
 import static org.mockito.Mockito.doReturn;
@@ -45,6 +44,7 @@ import org.apache.hadoop.yarn.api.records.Resource;
 import org.apache.hadoop.yarn.conf.YarnConfiguration;
 import org.apache.hadoop.yarn.security.YarnAuthorizationProvider;
 import org.apache.hadoop.yarn.server.resourcemanager.RMContext;
+import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.NodeType;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceLimits;
 import org.apache.hadoop.yarn.server.resourcemanager.scheduler.common.fica.FiCaSchedulerApp;
@@ -146,7 +146,7 @@ public class TestParentQueue {
         final Resource allocatedResource = Resources.createResource(allocation);
         if (queue instanceof ParentQueue) {
           ((ParentQueue)queue).allocateResource(clusterResource, 
-              allocatedResource, null);
+              allocatedResource, RMNodeLabelsManager.NO_LABEL);
         } else {
           FiCaSchedulerApp app1 = getMockApplication(0, "");
           ((LeafQueue)queue).allocateResource(clusterResource, app1, 
@@ -157,7 +157,7 @@ public class TestParentQueue {
         if (allocation > 0) {
           doReturn(new CSAssignment(Resources.none(), type)).when(queue)
               .assignContainers(eq(clusterResource), eq(node),
-                  any(ResourceLimits.class));
+                  any(ResourceLimits.class), any(SchedulingMode.class));
 
           // Mock the node's resource availability
           Resource available = node.getAvailableResource();
@@ -168,7 +168,7 @@ public class TestParentQueue {
         return new CSAssignment(allocatedResource, type);
       }
     }).when(queue).assignContainers(eq(clusterResource), eq(node),
-        any(ResourceLimits.class));
+        any(ResourceLimits.class), any(SchedulingMode.class));
   }
   
   private float computeQueueAbsoluteUsedCapacity(CSQueue queue, 
@@ -228,11 +228,16 @@ public class TestParentQueue {
     LeafQueue a = (LeafQueue)queues.get(A);
     LeafQueue b = (LeafQueue)queues.get(B);
     
+    a.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    b.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    queues.get(CapacitySchedulerConfiguration.ROOT).getQueueResourceUsage()
+    .incPending(Resources.createResource(1 * GB));
+    
     // Simulate B returning a container on node_0
     stubQueueAllocation(a, clusterResource, node_0, 0*GB);
     stubQueueAllocation(b, clusterResource, node_0, 1*GB);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verifyQueueMetrics(a, 0*GB, clusterResource);
     verifyQueueMetrics(b, 1*GB, clusterResource);
     
@@ -240,12 +245,12 @@ public class TestParentQueue {
     stubQueueAllocation(a, clusterResource, node_1, 2*GB);
     stubQueueAllocation(b, clusterResource, node_1, 1*GB);
     root.assignContainers(clusterResource, node_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     InOrder allocationOrder = inOrder(a, b);
     allocationOrder.verify(a).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(a, 2*GB, clusterResource);
     verifyQueueMetrics(b, 2*GB, clusterResource);
 
@@ -254,12 +259,12 @@ public class TestParentQueue {
     stubQueueAllocation(a, clusterResource, node_0, 1*GB);
     stubQueueAllocation(b, clusterResource, node_0, 2*GB);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     allocationOrder = inOrder(b, a);
     allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(a).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(a, 3*GB, clusterResource);
     verifyQueueMetrics(b, 4*GB, clusterResource);
 
@@ -268,12 +273,12 @@ public class TestParentQueue {
     stubQueueAllocation(a, clusterResource, node_0, 0*GB);
     stubQueueAllocation(b, clusterResource, node_0, 4*GB);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     allocationOrder = inOrder(b, a);
     allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(a).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(a, 3*GB, clusterResource);
     verifyQueueMetrics(b, 8*GB, clusterResource);
 
@@ -282,12 +287,12 @@ public class TestParentQueue {
     stubQueueAllocation(a, clusterResource, node_1, 1*GB);
     stubQueueAllocation(b, clusterResource, node_1, 1*GB);
     root.assignContainers(clusterResource, node_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     allocationOrder = inOrder(a, b);
     allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(a).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(a, 4*GB, clusterResource);
     verifyQueueMetrics(b, 9*GB, clusterResource);
   }
@@ -448,16 +453,27 @@ public class TestParentQueue {
 
     // Start testing
     CSQueue a = queues.get(A);
+    a.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
     CSQueue b = queues.get(B);
+    b.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
     CSQueue c = queues.get(C);
+    c.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
     CSQueue d = queues.get(D);
+    d.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
 
     CSQueue a1 = queues.get(A1);
+    a1.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
     CSQueue a2 = queues.get(A2);
+    a2.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
 
     CSQueue b1 = queues.get(B1);
+    b1.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
     CSQueue b2 = queues.get(B2);
+    b2.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
     CSQueue b3 = queues.get(B3);
+    b3.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    queues.get(CapacitySchedulerConfiguration.ROOT).getQueueResourceUsage()
+    .incPending(Resources.createResource(1 * GB));
 
     // Simulate C returning a container on node_0
     stubQueueAllocation(a, clusterResource, node_0, 0*GB);
@@ -465,7 +481,7 @@ public class TestParentQueue {
     stubQueueAllocation(c, clusterResource, node_0, 1*GB);
     stubQueueAllocation(d, clusterResource, node_0, 0*GB);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verifyQueueMetrics(a, 0*GB, clusterResource);
     verifyQueueMetrics(b, 0*GB, clusterResource);
     verifyQueueMetrics(c, 1*GB, clusterResource);
@@ -478,7 +494,7 @@ public class TestParentQueue {
     stubQueueAllocation(b2, clusterResource, node_1, 4*GB);
     stubQueueAllocation(c, clusterResource, node_1, 0*GB);
     root.assignContainers(clusterResource, node_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verifyQueueMetrics(a, 0*GB, clusterResource);
     verifyQueueMetrics(b, 4*GB, clusterResource);
     verifyQueueMetrics(c, 1*GB, clusterResource);
@@ -490,14 +506,14 @@ public class TestParentQueue {
     stubQueueAllocation(b3, clusterResource, node_0, 2*GB);
     stubQueueAllocation(c, clusterResource, node_0, 2*GB);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     InOrder allocationOrder = inOrder(a, c, b);
     allocationOrder.verify(a).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(c).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(a, 1*GB, clusterResource);
     verifyQueueMetrics(b, 6*GB, clusterResource);
     verifyQueueMetrics(c, 3*GB, clusterResource);
@@ -517,16 +533,16 @@ public class TestParentQueue {
     stubQueueAllocation(b1, clusterResource, node_2, 1*GB);
     stubQueueAllocation(c, clusterResource, node_2, 1*GB);
     root.assignContainers(clusterResource, node_2, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     allocationOrder = inOrder(a, a2, a1, b, c);
     allocationOrder.verify(a).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(a2).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(c).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(a, 3*GB, clusterResource);
     verifyQueueMetrics(b, 8*GB, clusterResource);
     verifyQueueMetrics(c, 4*GB, clusterResource);
@@ -622,12 +638,16 @@ public class TestParentQueue {
     // Start testing
     LeafQueue a = (LeafQueue)queues.get(A);
     LeafQueue b = (LeafQueue)queues.get(B);
+    a.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    b.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    queues.get(CapacitySchedulerConfiguration.ROOT).getQueueResourceUsage()
+    .incPending(Resources.createResource(1 * GB));
     
     // Simulate B returning a container on node_0
     stubQueueAllocation(a, clusterResource, node_0, 0*GB, NodeType.OFF_SWITCH);
     stubQueueAllocation(b, clusterResource, node_0, 1*GB, NodeType.OFF_SWITCH);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verifyQueueMetrics(a, 0*GB, clusterResource);
     verifyQueueMetrics(b, 1*GB, clusterResource);
     
@@ -636,12 +656,12 @@ public class TestParentQueue {
     stubQueueAllocation(a, clusterResource, node_1, 2*GB, NodeType.RACK_LOCAL);
     stubQueueAllocation(b, clusterResource, node_1, 1*GB, NodeType.OFF_SWITCH);
     root.assignContainers(clusterResource, node_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     InOrder allocationOrder = inOrder(a, b);
     allocationOrder.verify(a).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(a, 2*GB, clusterResource);
     verifyQueueMetrics(b, 2*GB, clusterResource);
     
@@ -651,12 +671,12 @@ public class TestParentQueue {
     stubQueueAllocation(a, clusterResource, node_0, 1*GB, NodeType.NODE_LOCAL);
     stubQueueAllocation(b, clusterResource, node_0, 2*GB, NodeType.OFF_SWITCH);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     allocationOrder = inOrder(b, a);
     allocationOrder.verify(b).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(a).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(a, 2*GB, clusterResource);
     verifyQueueMetrics(b, 4*GB, clusterResource);
 
@@ -691,12 +711,19 @@ public class TestParentQueue {
     // Start testing
     LeafQueue b3 = (LeafQueue)queues.get(B3);
     LeafQueue b2 = (LeafQueue)queues.get(B2);
+    b2.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    b3.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
+    queues.get(CapacitySchedulerConfiguration.ROOT).getQueueResourceUsage()
+    .incPending(Resources.createResource(1 * GB));
+    
+    CSQueue b = queues.get(B);
+    b.getQueueResourceUsage().incPending(Resources.createResource(1 * GB));
     
     // Simulate B3 returning a container on node_0
     stubQueueAllocation(b2, clusterResource, node_0, 0*GB, NodeType.OFF_SWITCH);
     stubQueueAllocation(b3, clusterResource, node_0, 1*GB, NodeType.OFF_SWITCH);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     verifyQueueMetrics(b2, 0*GB, clusterResource);
     verifyQueueMetrics(b3, 1*GB, clusterResource);
     
@@ -705,12 +732,12 @@ public class TestParentQueue {
     stubQueueAllocation(b2, clusterResource, node_1, 1*GB, NodeType.RACK_LOCAL);
     stubQueueAllocation(b3, clusterResource, node_1, 1*GB, NodeType.OFF_SWITCH);
     root.assignContainers(clusterResource, node_1, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     InOrder allocationOrder = inOrder(b2, b3);
     allocationOrder.verify(b2).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(b3).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(b2, 1*GB, clusterResource);
     verifyQueueMetrics(b3, 2*GB, clusterResource);
     
@@ -720,12 +747,12 @@ public class TestParentQueue {
     stubQueueAllocation(b2, clusterResource, node_0, 1*GB, NodeType.NODE_LOCAL);
     stubQueueAllocation(b3, clusterResource, node_0, 1*GB, NodeType.OFF_SWITCH);
     root.assignContainers(clusterResource, node_0, 
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     allocationOrder = inOrder(b3, b2);
     allocationOrder.verify(b3).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     allocationOrder.verify(b2).assignContainers(eq(clusterResource), 
-        any(FiCaSchedulerNode.class), anyResourceLimits());
+        any(FiCaSchedulerNode.class), anyResourceLimits(), any(SchedulingMode.class));
     verifyQueueMetrics(b2, 1*GB, clusterResource);
     verifyQueueMetrics(b3, 3*GB, clusterResource);
 

+ 52 - 49
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestReservations.java

@@ -48,10 +48,10 @@ import org.apache.hadoop.yarn.conf.YarnConfiguration;
 import org.apache.hadoop.yarn.event.DrainDispatcher;
 import org.apache.hadoop.yarn.factories.RecordFactory;
 import org.apache.hadoop.yarn.factory.providers.RecordFactoryProvider;
-import org.apache.hadoop.yarn.nodelabels.CommonNodeLabelsManager;
 import org.apache.hadoop.yarn.server.resourcemanager.RMContext;
 import org.apache.hadoop.yarn.server.resourcemanager.ahs.RMApplicationHistoryWriter;
 import org.apache.hadoop.yarn.server.resourcemanager.metrics.SystemMetricsPublisher;
+import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager;
 import org.apache.hadoop.yarn.server.resourcemanager.rmapp.RMApp;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.ContainerAllocationExpirer;
 import org.apache.hadoop.yarn.server.resourcemanager.rmcontainer.RMContainer;
@@ -266,7 +266,7 @@ public class TestReservations {
     // Start testing...
     // Only AM
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2 * GB, a.getUsedResources().getMemory());
     assertEquals(2 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -278,7 +278,7 @@ public class TestReservations {
 
     // Only 1 map - simulating reduce
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5 * GB, a.getUsedResources().getMemory());
     assertEquals(5 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -290,7 +290,7 @@ public class TestReservations {
 
     // Only 1 map to other node - simulating reduce
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -305,7 +305,7 @@ public class TestReservations {
 
     // try to assign reducer (5G on node 0 and should reserve)
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(13 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(5 * GB, a.getMetrics().getReservedMB());
@@ -321,7 +321,7 @@ public class TestReservations {
 
     // assign reducer to node 2
     a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(18 * GB, a.getUsedResources().getMemory());
     assertEquals(13 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(5 * GB, a.getMetrics().getReservedMB());
@@ -338,7 +338,7 @@ public class TestReservations {
     // node_1 heartbeat and unreserves from node_0 in order to allocate
     // on node_1
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(18 * GB, a.getUsedResources().getMemory());
     assertEquals(18 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -422,7 +422,7 @@ public class TestReservations {
     // Start testing...
     // Only AM
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2 * GB, a.getUsedResources().getMemory());
     assertEquals(2 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -434,7 +434,7 @@ public class TestReservations {
 
     // Only 1 map - simulating reduce
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5 * GB, a.getUsedResources().getMemory());
     assertEquals(5 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -446,7 +446,7 @@ public class TestReservations {
 
     // Only 1 map to other node - simulating reduce
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -461,7 +461,7 @@ public class TestReservations {
 
     // try to assign reducer (5G on node 0 and should reserve)
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(13 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(5 * GB, a.getMetrics().getReservedMB());
@@ -477,7 +477,7 @@ public class TestReservations {
 
     // assign reducer to node 2
     a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(18 * GB, a.getUsedResources().getMemory());
     assertEquals(13 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(5 * GB, a.getMetrics().getReservedMB());
@@ -494,7 +494,7 @@ public class TestReservations {
     // node_1 heartbeat and won't unreserve from node_0, potentially stuck
     // if AM doesn't handle
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(18 * GB, a.getUsedResources().getMemory());
     assertEquals(13 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(5 * GB, a.getMetrics().getReservedMB());
@@ -570,7 +570,7 @@ public class TestReservations {
     // Start testing...
     // Only AM
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2 * GB, a.getUsedResources().getMemory());
     assertEquals(2 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -581,7 +581,7 @@ public class TestReservations {
 
     // Only 1 map - simulating reduce
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5 * GB, a.getUsedResources().getMemory());
     assertEquals(5 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -592,7 +592,7 @@ public class TestReservations {
 
     // Only 1 map to other node - simulating reduce
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -606,7 +606,7 @@ public class TestReservations {
 
     // try to assign reducer (5G on node 0 and should reserve)
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(13 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(5 * GB, a.getMetrics().getReservedMB());
@@ -621,7 +621,7 @@ public class TestReservations {
 
     // could allocate but told need to unreserve first
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(13 * GB, a.getUsedResources().getMemory());
     assertEquals(13 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -823,7 +823,7 @@ public class TestReservations {
     // Start testing...
     // Only AM
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2 * GB, a.getUsedResources().getMemory());
     assertEquals(2 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -834,7 +834,7 @@ public class TestReservations {
 
     // Only 1 map - simulating reduce
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5 * GB, a.getUsedResources().getMemory());
     assertEquals(5 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -845,7 +845,7 @@ public class TestReservations {
 
     // Only 1 map to other node - simulating reduce
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -860,15 +860,16 @@ public class TestReservations {
     Resource capability = Resources.createResource(32 * GB, 0);
     boolean res =
         a.canAssignToThisQueue(clusterResource,
-            CommonNodeLabelsManager.EMPTY_STRING_SET, new ResourceLimits(
-                clusterResource), capability, Resources.none());
+            RMNodeLabelsManager.NO_LABEL, new ResourceLimits(
+                clusterResource), capability, Resources.none(),
+            SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertFalse(res);
 
     // now add in reservations and make sure it continues if config set
     // allocate to queue so that the potential new capacity is greater than
     // absoluteMaxCapacity
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(13 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(5 * GB, a.getMetrics().getReservedMB());
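
The canAssignToThisQueue hunk above is the labels-to-partition migration in miniature: the old set of labels (CommonNodeLabelsManager.EMPTY_STRING_SET) becomes a single partition string (RMNodeLabelsManager.NO_LABEL, the empty string), and the call gains the mode argument. A sketch of the updated call shape, with values mirroring the test:

// Queue headroom check against one partition (sketch, values from the test).
Resource capability = Resources.createResource(32 * GB, 0);
boolean fits = a.canAssignToThisQueue(
    clusterResource,
    RMNodeLabelsManager.NO_LABEL,            // "" -- the default partition
    new ResourceLimits(clusterResource),
    capability,
    Resources.none(),                        // no reservations to subtract
    SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
assertFalse(fits);   // a 32G ask exceeds the queue's absolute max capacity
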
@@ -881,16 +882,17 @@ public class TestReservations {
     capability = Resources.createResource(5 * GB, 0);
     res =
         a.canAssignToThisQueue(clusterResource,
-            CommonNodeLabelsManager.EMPTY_STRING_SET, new ResourceLimits(
-                clusterResource), capability, Resources
-                .createResource(5 * GB));
+            RMNodeLabelsManager.NO_LABEL, new ResourceLimits(
+                clusterResource), capability, Resources.createResource(5 * GB),
+            SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertTrue(res);
 
     // tell it not to check reservations
     res =
         a.canAssignToThisQueue(clusterResource,
-            CommonNodeLabelsManager.EMPTY_STRING_SET, new ResourceLimits(
-                clusterResource), capability, Resources.none());
+            RMNodeLabelsManager.NO_LABEL, new ResourceLimits(
+                clusterResource), capability, Resources.none(),
+            SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertFalse(res);
 
     refreshQueuesTurnOffReservationsContLook(a, csConf);
@@ -899,15 +901,16 @@ public class TestReservations {
     // in since feature is off
     res =
         a.canAssignToThisQueue(clusterResource,
-            CommonNodeLabelsManager.EMPTY_STRING_SET, new ResourceLimits(
-                clusterResource), capability, Resources.none());
+            RMNodeLabelsManager.NO_LABEL, new ResourceLimits(
+                clusterResource), capability, Resources.none(),
+            SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertFalse(res);
 
     res =
         a.canAssignToThisQueue(clusterResource,
-            CommonNodeLabelsManager.EMPTY_STRING_SET, new ResourceLimits(
-                clusterResource), capability, Resources
-                .createResource(5 * GB));
+            RMNodeLabelsManager.NO_LABEL, new ResourceLimits(
+                clusterResource), capability, Resources.createResource(5 * GB),
+            SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertFalse(res);
   }
 
@@ -1008,7 +1011,7 @@ public class TestReservations {
     // Start testing...
     // Only AM
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2 * GB, a.getUsedResources().getMemory());
     assertEquals(2 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -1019,7 +1022,7 @@ public class TestReservations {
 
     // Only 1 map - simulating reduce
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5 * GB, a.getUsedResources().getMemory());
     assertEquals(5 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -1030,7 +1033,7 @@ public class TestReservations {
 
     // Only 1 map to other node - simulating reduce
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -1044,7 +1047,7 @@ public class TestReservations {
     // allocate to queue so that the potential new capacity is greater than
     // absoluteMaxCapacity
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(13 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(5 * GB, app_0.getCurrentReservation().getMemory());
@@ -1059,18 +1062,18 @@ public class TestReservations {
     // set limit so that, after subtracting reservations, it can continue
     Resource limit = Resources.createResource(12 * GB, 0);
     boolean res = a.canAssignToUser(clusterResource, user_0, limit, app_0,
-        true, null);
+        true, "");
     assertTrue(res);
 
     // tell it not to check for reservations and should fail as already over
     // limit
-    res = a.canAssignToUser(clusterResource, user_0, limit, app_0, false, null);
+    res = a.canAssignToUser(clusterResource, user_0, limit, app_0, false, "");
     assertFalse(res);
 
     refreshQueuesTurnOffReservationsContLook(a, csConf);
 
     // should now return false since feature off
-    res = a.canAssignToUser(clusterResource, user_0, limit, app_0, true, null);
+    res = a.canAssignToUser(clusterResource, user_0, limit, app_0, true, "");
     assertFalse(res);
   }
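
canAssignToUser follows the same migration: the trailing label argument changes from null to the node partition string, here RMNodeLabelsManager.NO_LABEL (""). A sketch of the checks in the hunk above:

// User-limit check per partition; "" is RMNodeLabelsManager.NO_LABEL.
Resource limit = Resources.createResource(12 * GB, 0);
// Subtracting reservations brings usage under the 12G limit -> true.
boolean res = a.canAssignToUser(clusterResource, user_0, limit, app_0, true, "");
// Counting reservations, usage is already over the limit -> false.
res = a.canAssignToUser(clusterResource, user_0, limit, app_0, false, "");
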
 
@@ -1143,7 +1146,7 @@ public class TestReservations {
     // Start testing...
     // Only AM
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(2 * GB, a.getUsedResources().getMemory());
     assertEquals(2 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -1155,7 +1158,7 @@ public class TestReservations {
 
     // Only 1 map - simulating reduce
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(5 * GB, a.getUsedResources().getMemory());
     assertEquals(5 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -1167,7 +1170,7 @@ public class TestReservations {
 
     // Only 1 map to other node - simulating reduce
     a.assignContainers(clusterResource, node_1,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -1183,7 +1186,7 @@ public class TestReservations {
     // some resource. Even with continuous reservation looking, we don't allow
     // unreserving resources in order to reserve a container.
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(Resources.createResource(10 * GB)));
+        new ResourceLimits(Resources.createResource(10 * GB)), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -1199,7 +1202,7 @@ public class TestReservations {
     // used (8G) + required (5G). It will not reserve since it has to unreserve
     // some resource. Unfortunately, there's nothing to unreserve.
     a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(Resources.createResource(10 * GB)));
+        new ResourceLimits(Resources.createResource(10 * GB)), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(8 * GB, a.getUsedResources().getMemory());
     assertEquals(8 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
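
The two 10G-limit calls above exercise the same arithmetic: the queue would need 13G but is capped at 10G for this allocation pass, and it may not reserve its way past the cap. A worked sketch of that check (variable names are illustrative):

// 8G used + 5G required exceeds the 10G pass limit; the queue must
// unreserve first, and there is nothing reserved to release, so it skips.
int usedGB = 8, requiredGB = 5, limitGB = 10;
boolean overLimit = usedGB + requiredGB > limitGB;           // 13 > 10 -> true
boolean hasReservationToRelease = false;                     // nothing reserved
boolean mayProceed = !overLimit || hasReservationToRelease;  // false -> skip
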
@@ -1213,7 +1216,7 @@ public class TestReservations {
 
     // let it assign 5G to node_2
     a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(13 * GB, a.getUsedResources().getMemory());
     assertEquals(13 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(0 * GB, a.getMetrics().getReservedMB());
@@ -1226,7 +1229,7 @@ public class TestReservations {
 
     // reserve 8G node_0
     a.assignContainers(clusterResource, node_0,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(21 * GB, a.getUsedResources().getMemory());
     assertEquals(13 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(8 * GB, a.getMetrics().getReservedMB());
@@ -1241,7 +1244,7 @@ public class TestReservations {
     // continues to try due to the reservation above,
     // but hits queue limits so can't reserve anymore.
     a.assignContainers(clusterResource, node_2,
-        new ResourceLimits(clusterResource));
+        new ResourceLimits(clusterResource), SchedulingMode.RESPECT_PARTITION_EXCLUSIVITY);
     assertEquals(21 * GB, a.getUsedResources().getMemory());
     assertEquals(13 * GB, app_0.getCurrentConsumption().getMemory());
     assertEquals(8 * GB, a.getMetrics().getReservedMB());

+ 2 - 0
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/TestUtils.java

@@ -160,6 +160,7 @@ public class TestUtils {
     request.setCapability(capability);
     request.setRelaxLocality(relaxLocality);
     request.setPriority(priority);
+    request.setNodeLabelExpression(RMNodeLabelsManager.NO_LABEL);
     return request;
   }
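
With this change, test-built ResourceRequests carry an explicit (empty) node-label expression, matching what the RM normalizes unlabeled requests to. A minimal construction sketch; the field values are illustrative, not from the patch:

// Sketch: a request pinned to the default (no-label) partition.
ResourceRequest request = Records.newRecord(ResourceRequest.class);
request.setNumContainers(1);
request.setResourceName(ResourceRequest.ANY);
request.setCapability(Resources.createResource(1 * GB));
request.setRelaxLocality(true);
request.setPriority(Priority.newInstance(0));
request.setNodeLabelExpression(RMNodeLabelsManager.NO_LABEL);  // ""
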
   
@@ -273,6 +274,7 @@ public class TestUtils {
     conf.setCapacity(B1, 100);
     conf.setMaximumCapacity(B1, 100);
     conf.setCapacityByLabel(B1, "y", 100);
+    conf.setMaximumApplicationMasterResourcePerQueuePercent(B1, 1f);
 
     final String C1 = C + ".c1";
     conf.setQueues(C, new String[] {"c1"});
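
The added setMaximumApplicationMasterResourcePerQueuePercent(B1, 1f) lifts the per-queue AM share to 100% so the small labeled queue can still launch application masters instead of being capped at the default 10%. For reference, a sketch of the mapping, assuming B1 resolves to root.b.b1 as configured above:

// Java equivalent of the capacity-scheduler.xml property
// yarn.scheduler.capacity.root.b.b1.maximum-am-resource-percent = 1.0
conf.setMaximumApplicationMasterResourcePerQueuePercent(B1, 1f);
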