diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetrics.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetrics.java index 20a5a1ff790..4cb31358d58 100644 --- a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetrics.java +++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetrics.java @@ -19,6 +19,8 @@ package org.apache.hadoop.yarn.server.resourcemanager.scheduler; import static org.apache.hadoop.metrics2.lib.Interns.info; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler + .QueueMetricsForCustomResources.MetricsForCustomResource.*; import java.util.ArrayList; import java.util.HashMap; @@ -45,7 +47,8 @@ import org.apache.hadoop.yarn.conf.YarnConfiguration; import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager; import org.apache.hadoop.yarn.server.resourcemanager.rmapp.RMAppState; -import org.apache.hadoop.yarn.server.utils.BuilderUtils; +import org.apache.hadoop.yarn.server.resourcemanager.scheduler + .QueueMetricsForCustomResources.MetricsForCustomResource; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -114,6 +117,7 @@ protected final MetricsSystem metricsSystem; protected final Map users; protected final Configuration conf; + protected final QueueMetricsForCustomResources queueMetricsForCustomResources; protected QueueMetrics(MetricsSystem ms, String queueName, Queue parent, boolean enableUserMetrics, Configuration conf) { @@ -123,6 +127,7 @@ protected QueueMetrics(MetricsSystem ms, String queueName, Queue parent, this.users = 
enableUserMetrics ? new HashMap() : null; metricsSystem = ms; + this.queueMetricsForCustomResources = new QueueMetricsForCustomResources(); this.conf = conf; runningTime = buildBuckets(conf); } @@ -350,9 +355,11 @@ public void moveAppTo(AppSchedulingInfo app) { * @param limit resource limit */ public void setAvailableResourcesToQueue(String partition, Resource limit) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { availableMB.set(limit.getMemorySize()); availableVCores.set(limit.getVirtualCores()); + queueMetricsForCustomResources.set(MetricsForCustomResource.AVAILABLE, + limit); } } @@ -392,7 +399,7 @@ public void setAvailableResourcesToUser(String partition, */ public void incrPendingResources(String partition, String user, int containers, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { _incrPendingResources(containers, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { @@ -408,12 +415,14 @@ private void _incrPendingResources(int containers, Resource res) { pendingContainers.incr(containers); pendingMB.incr(res.getMemorySize() * containers); pendingVCores.incr(res.getVirtualCores() * containers); + queueMetricsForCustomResources.increaseWithMultiplier(PENDING, res, + containers); } public void decrPendingResources(String partition, String user, int containers, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { _decrPendingResources(containers, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { @@ -429,6 +438,8 @@ private void _decrPendingResources(int containers, Resource res) { pendingContainers.decr(containers); pendingMB.decr(res.getMemorySize() * containers); 
pendingVCores.decr(res.getVirtualCores() * containers); + queueMetricsForCustomResources.decreaseWithMultiplier(PENDING, res, + containers); } public void incrNodeTypeAggregations(String user, NodeType type) { @@ -452,12 +463,15 @@ public void incrNodeTypeAggregations(String user, NodeType type) { public void allocateResources(String partition, String user, int containers, Resource res, boolean decrPending) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { allocatedContainers.incr(containers); aggregateContainersAllocated.incr(containers); allocatedMB.incr(res.getMemorySize() * containers); allocatedVCores.incr(res.getVirtualCores() * containers); + queueMetricsForCustomResources.increaseWithMultiplier(ALLOCATED, res, + containers); + if (decrPending) { _decrPendingResources(containers, res); } @@ -479,12 +493,14 @@ public void allocateResources(String partition, String user, * @param res */ public void allocateResources(String partition, String user, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { allocatedMB.incr(res.getMemorySize()); allocatedVCores.incr(res.getVirtualCores()); + queueMetricsForCustomResources.increase(ALLOCATED, res); pendingMB.decr(res.getMemorySize()); pendingVCores.decr(res.getVirtualCores()); + queueMetricsForCustomResources.decrease(PENDING, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { @@ -498,11 +514,14 @@ public void allocateResources(String partition, String user, Resource res) { public void releaseResources(String partition, String user, int containers, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { allocatedContainers.decr(containers); 
aggregateContainersReleased.incr(containers); allocatedMB.decr(res.getMemorySize() * containers); allocatedVCores.decr(res.getVirtualCores() * containers); + queueMetricsForCustomResources.decreaseWithMultiplier(ALLOCATED, res, + containers); + QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { userMetrics.releaseResources(partition, user, containers, res); @@ -519,9 +538,11 @@ public void releaseResources(String partition, * @param user * @param res */ - public void releaseResources(String user, Resource res) { + private void releaseResources(String user, Resource res) { allocatedMB.decr(res.getMemorySize()); allocatedVCores.decr(res.getVirtualCores()); + queueMetricsForCustomResources.decrease(ALLOCATED, res); + QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { userMetrics.releaseResources(user, res); @@ -552,8 +573,17 @@ public void updatePreemptedVcoreSeconds(long vcoreSeconds) { } } + public void updatePreemptedSecondsForCustomResources(Resource res, + long seconds) { + queueMetricsForCustomResources + .increaseWithMultiplier(AGGREGATE_PREEMPTED_SECONDS, res, seconds); + if (parent != null) { + parent.updatePreemptedSecondsForCustomResources(res, seconds); + } + } + public void reserveResource(String partition, String user, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { reserveResource(user, res); } } @@ -562,6 +592,7 @@ public void reserveResource(String user, Resource res) { reservedContainers.incr(); reservedMB.incr(res.getMemorySize()); reservedVCores.incr(res.getVirtualCores()); + queueMetricsForCustomResources.increase(RESERVED, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { userMetrics.reserveResource(user, res); @@ -571,10 +602,11 @@ public void reserveResource(String user, Resource res) { } } - public void unreserveResource(String user, Resource 
res) { + private void unreserveResource(String user, Resource res) { reservedContainers.decr(); reservedMB.decr(res.getMemorySize()); reservedVCores.decr(res.getVirtualCores()); + queueMetricsForCustomResources.decrease(RESERVED, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { userMetrics.unreserveResource(user, res); @@ -585,7 +617,7 @@ public void unreserveResource(String user, Resource res) { } public void unreserveResource(String partition, String user, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { unreserveResource(user, res); } } @@ -647,10 +679,19 @@ public int getAppsKilled() { public int getAppsFailed() { return appsFailed.value(); } - + public Resource getAllocatedResources() { - return BuilderUtils.newResource(allocatedMB.value(), - (int) allocatedVCores.value()); + if (queueMetricsForCustomResources.isThereAnyAllocatedResource()) { + return Resource.newInstance(allocatedMB.value(), allocatedVCores.value(), + queueMetricsForCustomResources.getAllocatedCustomResources()); + } + return Resource.newInstance(allocatedMB.value(), + allocatedVCores.value()); + } + + public float getMaxUtilizationOfCustomResources(Resource clusterResource) { + return queueMetricsForCustomResources + .getMaxAllocationUtilization(clusterResource); } public long getAllocatedMB() { diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsForCustomResources.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsForCustomResources.java new file mode 100644 index 00000000000..9ae60f156b6 --- /dev/null +++ 
b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsForCustomResources.java
@@ -0,0 +1,148 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ * http://www.apache.org/licenses/LICENSE-2.0
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.hadoop.yarn.server.resourcemanager.scheduler;
+
+import com.google.common.annotations.VisibleForTesting;
+import com.google.common.collect.Maps;
+import org.apache.hadoop.yarn.api.records.Resource;
+import org.apache.hadoop.yarn.api.records.ResourceInformation;
+import org.apache.hadoop.yarn.util.resource.ResourceUtils;
+
+import java.util.Map;
+import java.util.function.BiFunction;
+
+/**
+ * Keeps one name-to-value map per {@link MetricsForCustomResource} for the
+ * resources found in {@link Resource#getResources()} from index 2 onwards.
+ * The maps are plain hash maps; this class does no synchronization itself.
+ */
+public class QueueMetricsForCustomResources {
+  private final Map<String, Long> allocatedCustomResources = Maps.newHashMap();
+  private final Map<String, Long> availableCustomResources = Maps.newHashMap();
+  private final Map<String, Long> pendingCustomResources = Maps.newHashMap();
+  private final Map<String, Long> reservedCustomResources = Maps.newHashMap();
+  private final Map<String, Long> aggregatePreemptedSecondsForCustomResources =
+      Maps.newHashMap();
+
+  /** Selects which of the per-metric maps an operation works on. */
+  public enum MetricsForCustomResource {
+    ALLOCATED, AVAILABLE, PENDING, RESERVED, AGGREGATE_PREEMPTED_SECONDS
+  }
+
+  /** Adds each custom resource value of {@code res} to the given metric. */
+  public void increase(MetricsForCustomResource metricsType, Resource res) {
+    update(metricsType, res, Long::sum);
+  }
+
+  /** Adds {@code value * multiplier} for each custom resource of res. */
+  public void increaseWithMultiplier(MetricsForCustomResource metricsType,
+      Resource res, long multiplier) {
+    update(metricsType, res, (v1, v2) -> v1 + v2 * multiplier);
+  }
+
+  /** Subtracts each custom resource value of {@code res} from the metric. */
+  public void decrease(MetricsForCustomResource metricsType, Resource res) {
+    update(metricsType, res, (v1, v2) -> v1 - v2);
+  }
+
+  /** Subtracts {@code value * containers} for each custom resource of res. */
+  public void decreaseWithMultiplier(MetricsForCustomResource metricsType,
+      Resource res, int containers) {
+    update(metricsType, res, (v1, v2) -> v1 - v2 * containers);
+  }
+
+  /** Overwrites the metric with the custom resource values of {@code res}. */
+  public void set(MetricsForCustomResource metricsType, Resource res) {
+    update(metricsType, res, (v1, v2) -> v2);
+  }
+
+  /**
+   * Applies {@code operation} (stored value, value taken from {@code res}) to
+   * every resource of {@code res} from index 2 onwards. Does nothing unless
+   * more than two resource types are known.
+   */
+  private void update(MetricsForCustomResource metricsType,
+      Resource res, BiFunction<Long, Long, Long> operation) {
+    if (ResourceUtils.getNumberOfKnownResourceTypes() <= 2) {
+      return;
+    }
+    ResourceInformation[] resources = res.getResources();
+    Map<String, Long> metrics = getMetricsByType(metricsType);
+    for (int i = 2; i < resources.length; i++) {
+      ResourceInformation resource = resources[i];
+      // Map.merge stores the given value as-is for a missing key, so seed the
+      // key with zero to make sure the operation is always applied.
+      metrics.putIfAbsent(resource.getName(), 0L);
+      metrics.merge(resource.getName(), resource.getValue(), operation);
+    }
+  }
+
+  /** Returns true if the allocated map holds at least one entry. */
+  boolean isThereAnyAllocatedResource() {
+    return !allocatedCustomResources.isEmpty();
+  }
+
+  /** Returns the backing allocated map itself, not a copy. */
+  public Map<String, Long> getAllocatedCustomResources() {
+    return allocatedCustomResources;
+  }
+
+  /**
+   * Returns the largest ratio of an allocated custom resource value to the
+   * value of the same resource in {@code clusterResource}, or 0 if there is
+   * none. Resources whose cluster value is 0 are skipped.
+   */
+  public float getMaxAllocationUtilization(Resource clusterResource) {
+    float maxUtilization = 0;
+    for (Map.Entry<String, Long> customRes
+        : allocatedCustomResources.entrySet()) {
+      long clusterValue = clusterResource.getResourceValue(customRes.getKey());
+      if (clusterValue != 0) {
+        float utilization = (float) customRes.getValue() / clusterValue;
+        if (utilization > maxUtilization) {
+          maxUtilization = utilization;
+        }
+      }
+    }
+    return maxUtilization;
+  }
+
+  /**
+   * Returns the map backing {@code metricsType}.
+   *
+   * @throws IllegalStateException if no map belongs to the type
+   */
+  @VisibleForTesting
+  Map<String, Long> getMetricsByType(
+      MetricsForCustomResource metricsType) {
+    switch (metricsType) {
+    case AVAILABLE:
+      return availableCustomResources;
+    case ALLOCATED:
+      return allocatedCustomResources;
+    case PENDING:
+      return pendingCustomResources;
+    case RESERVED:
+      return reservedCustomResources;
+    case AGGREGATE_PREEMPTED_SECONDS:
+      return aggregatePreemptedSecondsForCustomResources;
+    default:
+      throw new IllegalStateException(
+          "No map found for metrics type: " + metricsType);
+    }
+  }
+}
diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java
index 75d61442577..36883c3eeda 100644
---
a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java
+++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java
@@ -2106,7 +2106,8 @@ protected void completedContainerInternal(
   private void updateQueuePreemptionMetrics(
       CSQueue queue, RMContainer rmc) {
     QueueMetrics qMetrics = queue.getMetrics();
-    long usedMillis = rmc.getFinishTime() - rmc.getCreationTime();
+    final long usedMillis = rmc.getFinishTime() - rmc.getCreationTime();
+    final long usedSeconds = usedMillis / DateUtils.MILLIS_PER_SECOND;
     Resource containerResource = rmc.getAllocatedResource();
     qMetrics.preemptContainer();
     long mbSeconds = (containerResource.getMemorySize() * usedMillis)
@@ -2115,6 +2116,8 @@ private void updateQueuePreemptionMetrics(
         / DateUtils.MILLIS_PER_SECOND;
     qMetrics.updatePreemptedMemoryMBSeconds(mbSeconds);
     qMetrics.updatePreemptedVcoreSeconds(vcSeconds);
+    qMetrics.updatePreemptedSecondsForCustomResources(containerResource,
+        usedSeconds);
   }
 
   @Lock(Lock.NoLock.class)
diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueHierarchy.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueHierarchy.java
new file mode 100644
index 00000000000..5b0ddf5bc9e
--- /dev/null
+++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueHierarchy.java
@@ -0,0 +1,85 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ * http://www.apache.org/licenses/LICENSE-2.0
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.hadoop.yarn.server.resourcemanager.scheduler;
+
+import com.google.common.collect.Lists;
+import java.util.List;
+
+/**
+ * Test helper holding an ordered list of queue names in which every name
+ * after the first starts with the preceding name followed by a dot.
+ */
+public final class QueueHierarchy {
+  private final List<String> queues;
+
+  private QueueHierarchy(List<String> queues) {
+    this.queues = queues;
+  }
+
+  /**
+   * Returns the queue name stored at {@code level}.
+   *
+   * @throws IllegalArgumentException if {@code level} is not a valid index
+   */
+  String queueAtLevel(int level) {
+    if (level < 0 || level > queues.size() - 1) {
+      throw new IllegalArgumentException(String.format(
+          "Level should be between 0 and %d as number of queues " +
+          "in this hierarchy is: %d", queues.size() - 1, queues.size()));
+    }
+    return queues.get(level);
+  }
+
+  /** Returns the number of queue names in this hierarchy. */
+  int size() {
+    return queues.size();
+  }
+
+  /**
+   * Creates a hierarchy from {@code queues} after validating them.
+   *
+   * @throws IllegalArgumentException if fewer than two names are given or a
+   *     name does not start with the preceding name plus a dot
+   */
+  public static QueueHierarchy create(List<String> queues) {
+    validateQueues(queues);
+    return new QueueHierarchy(queues);
+  }
+
+  /** Creates a two-level hierarchy from {@code root} and {@code leaf}. */
+  public static QueueHierarchy create(String root, String leaf) {
+    return create(Lists.newArrayList(root, leaf));
+  }
+
+  /** Rejects lists that are too short or break the name-prefix rule. */
+  private static void validateQueues(List<String> queues) {
+    if (queues.size() < 2) {
+      throw new IllegalArgumentException(
+          "Should specify parent and leaf queue at least!");
+    }
+    for (int i = 1; i < queues.size(); i++) {
+      String parentQueue = queues.get(i - 1);
+      String queue = queues.get(i);
+      if (!queue.startsWith(parentQueue + ".")) {
+        throw new IllegalArgumentException(String.format(
+            "The name of child queue should start with its " +
+            "parent queue name! Parent: %s, Child: %s",
+            parentQueue, queue));
+      }
+    }
+  }
+}
diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsTestcase.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsTestcase.java
new file mode 100644
index 00000000000..cb81cbd3b6a
--- /dev/null
+++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsTestcase.java
@@ -0,0 +1,453 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ * http://www.apache.org/licenses/LICENSE-2.0
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.hadoop.yarn.server.resourcemanager.scheduler;
+
+import com.google.common.collect.ImmutableMap;
+import com.google.common.collect.Lists;
+import com.google.common.collect.Maps;
+import org.apache.hadoop.metrics2.MetricsSystem;
+import org.apache.hadoop.yarn.api.records.Resource;
+import org.apache.hadoop.yarn.resourcetypes.ResourceTypesTestHelper;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.QueueMetricsForCustomResources.MetricsForCustomResource;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler.TestQueueMetrics.MultiQueueSetup;
+
+import java.util.List;
+import java.util.Map;
+import java.util.function.Function;
+
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_ALLOCATED;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_RELEASED;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_MEMORY_MB_SECONDS_PREEMPTED;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_VCORE_SECONDS_PREEMPTED;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_CONTAINERS;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_MB;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_V_CORES;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_CONTAINERS;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_MB;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_V_CORES;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_CONTAINERS;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_MB;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_V_CORES;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.TestQueueMetricsForCustomResources.assertCustomResourceValue;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.TestQueueMetricsForCustomResources.assertCustomResourceValueInternal;
+
+/**
+ * Parameterized scenarios that drive the leaf metrics of a
+ * {@link MultiQueueSetup} and then check the standard and the custom resource
+ * metrics. The values to use are supplied through the {@link Builder}.
+ */
+public final class QueueMetricsTestcase {
+  private enum MetricsAssertType {
+    ALL, PARENT_QUEUE_ONLY
+  }
+
+  /** Collects the inputs of a {@link QueueMetricsTestcase}. */
+  public static final class Builder {
+    private MetricsSystem ms;
+    private Map<String, Long> customResourceValues = Maps.newHashMap();
+    private int containers;
+    private int containersToDecrease;
+    private int vCores;
+    private int vCoresToDecrease;
+    private long customResToDecrease;
+    private List<String> queues = Lists.newArrayList();
+    private QueueHierarchy queueHierarchy;
+    private String user;
+    private String partition;
+    private long memoryMB;
+    private long memoryMBToDecrease;
+
+    private Builder() {
+    }
+
+    public static Builder create() {
+      return new Builder();
+    }
+
+    public Builder withContainers(int containers) {
+      this.containers = containers;
+      return this;
+    }
+
+    public Builder withContainersToDecrease(int containersToDecrease) {
+      this.containersToDecrease = containersToDecrease;
+      return this;
+    }
+
+    public Builder withVCores(int vCores) {
+      this.vCores = vCores;
+      return this;
+    }
+
+    public Builder withVCoresToDecrease(int vCoresToDecrease) {
+      this.vCoresToDecrease = vCoresToDecrease;
+      return this;
+    }
+
+    public Builder withMemoryMB(long memoryMB) {
+      this.memoryMB = memoryMB;
+      return this;
+    }
+
+    public Builder withMemoryMBToDecrease(long memoryMBToDecrease) {
+      this.memoryMBToDecrease = memoryMBToDecrease;
+      return this;
+    }
+
+    public Builder withCustomResourceValue(String name, Long value) {
+      customResourceValues.put(name, value);
+      return this;
+    }
+
+    public Builder withCustomResToDecrease(long customResToDecrease) {
+      this.customResToDecrease = customResToDecrease;
+      return this;
+    }
+
+    public Builder withParentQueueName(String parentQueueName) {
+      this.queues.add(0, parentQueueName);
+      return this;
+    }
+
+    /** Must be called after {@link #withParentQueueName(String)}. */
+    public Builder withLeafQueueName(String leafQueueName) {
+      if (queues.isEmpty()) {
+        throw new IllegalStateException(
+            "Parent queue name should be specified before leaf queue name!");
+      }
+      this.queues.add(1, leafQueueName);
+      return this;
+    }
+
+    public Builder withQueueHierarchy(String... queues) {
+      if (!this.queues.isEmpty()) {
+        throw new IllegalStateException("Either of parent/leaf queues or " +
+            "queue hierarchy should be specified!");
+      }
+      this.queues = Lists.newArrayList(queues);
+      return this;
+    }
+
+    public Builder withUser(String user) {
+      this.user = user;
+      return this;
+    }
+
+    public Builder withPartition(String partition) {
+      this.partition = partition;
+      return this;
+    }
+
+    public Builder withMetricSystem(MetricsSystem ms) {
+      this.ms = ms;
+      return this;
+    }
+
+    public QueueMetricsTestcase build() {
+      this.queueHierarchy = QueueHierarchy.create(Lists.newArrayList(queues));
+      return new QueueMetricsTestcase(this);
+    }
+  }
+
+  private static final String CUSTOM_RES_1 = "custom_res_1";
+  private static final String CUSTOM_RES_2 = "custom_res_2";
+  private final MetricsSystem ms;
+  private final QueueHierarchy queueHierarchy;
+  private final Map<String, Long> customResourceValues;
+  private final int containers;
+  private final int containersToDecrease;
+  private final int vCores;
+  private final int vCoresToDecrease;
+  private final long memoryMB;
+  private final long memoryMBToDecrease;
+  private final long customResToDecrease;
+  private final String user;
+  private final String partition;
+
+  private QueueMetricsTestcase(Builder builder) {
+    this.ms = builder.ms;
+    this.queueHierarchy = builder.queueHierarchy;
+    this.customResourceValues = builder.customResourceValues;
+    this.containers = builder.containers;
+    this.containersToDecrease = builder.containersToDecrease;
+    this.vCores = builder.vCores;
+    this.vCoresToDecrease = builder.vCoresToDecrease;
+    this.memoryMB = builder.memoryMB;
+    this.memoryMBToDecrease = builder.memoryMBToDecrease;
+    this.customResToDecrease = builder.customResToDecrease;
+    this.user = builder.user;
+    this.partition = builder.partition;
+  }
+
+  /** Increases pending resources by the configured number of containers. */
+  void testIncreasePendingResources() {
+    testIncreasePendingResourcesInternal(true);
+  }
+
+  /** Increases pending resources for a single container. */
+  void testIncreasePendingResourcesWithoutContainer() {
+    testIncreasePendingResourcesInternal(false);
+  }
+
+  private void testIncreasePendingResourcesInternal(boolean useContainers) {
+    final int containers;
+    if (useContainers) {
+      containers = this.containers;
+    } else {
+      containers = 1;
+    }
+
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    mqs.getLeafMetrics().incrPendingResources(partition, mqs.user, containers,
+        createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(PENDING_CONTAINERS, containers)
+        .gaugeLong(PENDING_MB, containers * memoryMB)
+        .gaugeInt(PENDING_V_CORES, containers * vCores)
+        .checkAgainst(mqs.getLeafQueueSource());
+    assertMetrics(mqs, checker, MetricsForCustomResource.PENDING,
+        getModifiedCustomResourceValues(v -> v * containers));
+  }
+
+  /** Decreases pending resources and checks what is expected to remain. */
+  public void testDecreasePendingResources() {
+    final int containersAfterDecrease = containers - containersToDecrease;
+    final int vcoresAfterDecrease =
+        (vCores * containers) - (vCoresToDecrease * containersToDecrease);
+    final long memoryAfterDecrease = (memoryMB * containers)
+        - (memoryMBToDecrease * containersToDecrease);
+
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    mqs.getLeafMetrics().decrPendingResources(partition, user,
+        containersToDecrease,
+        ResourceTypesTestHelper.newResource(memoryMBToDecrease,
+            vCoresToDecrease,
+            ImmutableMap.<String, String>builder()
+                .put(CUSTOM_RES_1, String.valueOf(customResToDecrease))
+                .put(CUSTOM_RES_2, String.valueOf(customResToDecrease))
+                .build()));
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(PENDING_CONTAINERS, containersAfterDecrease)
+        .gaugeLong(PENDING_MB, memoryAfterDecrease)
+        .gaugeInt(PENDING_V_CORES, vcoresAfterDecrease)
+        .checkAgainst(mqs.getLeafQueueSource());
+
+    assertMetrics(mqs, checker, MetricsForCustomResource.PENDING,
+        getModifiedCustomResourceValues(v -> v * containers
+            - (customResToDecrease * containersToDecrease)));
+  }
+
+  /** Allocates containers, optionally decreasing the pending metrics too. */
+  public void testAllocateResources(boolean decreasePending) {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    mqs.getLeafMetrics().allocateResources(partition, mqs.user, containers,
+        createResource(), decreasePending);
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(ALLOCATED_CONTAINERS, containers)
+        .counter(AGGREGATE_CONTAINERS_ALLOCATED, containers)
+        .gaugeLong(ALLOCATED_MB, containers * memoryMB)
+        .gaugeInt(ALLOCATED_V_CORES, containers * vCores)
+        .gaugeInt(PENDING_CONTAINERS, 0)
+        .gaugeLong(PENDING_MB, 0)
+        .gaugeInt(PENDING_V_CORES, 0)
+        .checkAgainst(mqs.getLeafQueueSource());
+    if (decreasePending) {
+      assertMetrics(mqs, checker, MetricsForCustomResource.PENDING,
+          getModifiedCustomResourceValues(v -> 0L));
+    }
+    if (!customResourceValues.isEmpty()) {
+      assertMetrics(mqs, checker, MetricsForCustomResource.ALLOCATED,
+          getModifiedCustomResourceValues(v -> v * containers));
+    }
+  }
+
+  /** Allocates one resource through the overload without container count. */
+  public void testAllocateResourcesWithoutContainer() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    mqs.getLeafMetrics().allocateResources(partition, mqs.user,
+        createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeLong(ALLOCATED_MB, memoryMB)
+        .gaugeInt(ALLOCATED_V_CORES, vCores)
+        .gaugeInt(PENDING_CONTAINERS, 1)
+        .gaugeLong(PENDING_MB, 0)
+        .gaugeInt(PENDING_V_CORES, 0)
+        .checkAgainst(mqs.getLeafQueueSource());
+    assertMetrics(mqs, checker, MetricsForCustomResource.PENDING,
+        getModifiedCustomResourceValues(v -> 0L));
+    assertMetrics(mqs, checker, MetricsForCustomResource.ALLOCATED,
+        getModifiedCustomResourceValues(v -> v));
+  }
+
+  /** Releases the configured containers and checks the allocated metrics. */
+  public void testReleaseResourcesWithContainers() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    mqs.getLeafMetrics().releaseResources(partition, mqs.user, containers,
+        createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .counter(AGGREGATE_CONTAINERS_ALLOCATED, containers)
+        .counter(AGGREGATE_CONTAINERS_RELEASED, containers)
+        .checkAgainst(mqs.getLeafQueueSource());
+    assertMetrics(mqs, checker, MetricsForCustomResource.ALLOCATED,
+        getModifiedCustomResourceValues(v -> 0L));
+  }
+
+  /** Records preempted resource-seconds and checks the aggregates. */
+  public void testUpdatePreemptedSeconds(int seconds) {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    mqs.getLeafMetrics().updatePreemptedMemoryMBSeconds(memoryMB * seconds);
+    mqs.getLeafMetrics().updatePreemptedVcoreSeconds(vCores * seconds);
+    mqs.getLeafMetrics().updatePreemptedSecondsForCustomResources(
+        createResource(), seconds);
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .counter(AGGREGATE_MEMORY_MB_SECONDS_PREEMPTED, memoryMB * seconds)
+        .counter(AGGREGATE_VCORE_SECONDS_PREEMPTED, vCores * seconds)
+        .checkAgainst(mqs.getLeafQueueSource());
+    assertMetricsParentQueueOnly(mqs, checker,
+        MetricsForCustomResource.AGGREGATE_PREEMPTED_SECONDS,
+        getModifiedCustomResourceValues(v -> v * seconds));
+  }
+
+  /** Reserves one resource and checks the reserved metrics. */
+  public void testReserveResources() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    mqs.getLeafMetrics().reserveResource(partition, mqs.user, createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(RESERVED_CONTAINERS, 1)
+        .gaugeLong(RESERVED_MB, memoryMB)
+        .gaugeInt(RESERVED_V_CORES, vCores)
+        .checkAgainst(mqs.getLeafQueueSource());
+    assertMetrics(mqs, checker, MetricsForCustomResource.RESERVED,
+        getModifiedCustomResourceValues(v -> v));
+  }
+
+  /** Unreserves one resource and expects the reserved metrics to be zero. */
+  public void testUnreserveResources() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    mqs.getLeafMetrics().unreserveResource(partition, mqs.user,
+        createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(RESERVED_CONTAINERS, 0)
+        .gaugeLong(RESERVED_MB, 0)
+        .gaugeInt(RESERVED_V_CORES, 0)
+        .checkAgainst(mqs.getLeafQueueSource());
+    assertMetrics(mqs, checker, MetricsForCustomResource.RESERVED,
+        getModifiedCustomResourceValues(v -> 0L));
+  }
+
+  /** Checks {@code getAllocatedResources()} after an allocation. */
+  public void testGetAllocatedResources() {
+    testAllocateResources(false);
+    MultiQueueSetup mqs = new MultiQueueSetup(ms, queueHierarchy, user);
+    Resource res = mqs.getLeafMetrics().getAllocatedResources();
+    if (customResourceValues.size() > 0) {
+      assertCustomResourceValueInternal(MetricsForCustomResource.ALLOCATED,
+          CUSTOM_RES_1, customResourceValues.get(CUSTOM_RES_1) * containers,
+          res.getResourceValue(CUSTOM_RES_1));
+      assertCustomResourceValueInternal(MetricsForCustomResource.ALLOCATED,
+          CUSTOM_RES_2, customResourceValues.get(CUSTOM_RES_2) * containers,
+          res.getResourceValue(CUSTOM_RES_2));
+    }
+  }
+
+  private void assertMetrics(MultiQueueSetup mqs,
+      ResourceMetricsChecker checker,
+      MetricsForCustomResource metricsType,
+      Map<String, Long> expectedCustomResourceValues) {
+    assertMetricsInternal(mqs, checker, metricsType, MetricsAssertType.ALL,
+        expectedCustomResourceValues);
+  }
+
+  private void assertMetricsParentQueueOnly(MultiQueueSetup mqs,
+      ResourceMetricsChecker checker,
+      MetricsForCustomResource metricsType,
+      Map<String, Long> expectedCustomResourceValues) {
+    assertMetricsInternal(mqs, checker, metricsType,
+        MetricsAssertType.PARENT_QUEUE_ONLY, expectedCustomResourceValues);
+  }
+
+  /**
+   * Checks the root queue source always, the user sources only for
+   * {@link MetricsAssertType#ALL}, then the custom resource values of the
+   * root and leaf metrics.
+   */
+  private void assertMetricsInternal(MultiQueueSetup mqs,
+      ResourceMetricsChecker checker, MetricsForCustomResource metricsType,
+      MetricsAssertType metricsAssertType,
+      Map<String, Long> expectedCustomResourceValues) {
+    checker = ResourceMetricsChecker.createFromChecker(checker)
+        .checkAgainst(mqs.getRootQueueSource());
+
+    if (metricsAssertType == MetricsAssertType.ALL) {
+      checker = ResourceMetricsChecker.createFromChecker(checker)
+          .checkAgainst(mqs.getLeafUserSource());
+      ResourceMetricsChecker.createFromChecker(checker)
+          .checkAgainst(mqs.getRootUserSource());
+    }
+
+    assertCustomResourceValue(mqs.getRootMetrics(), metricsType, CUSTOM_RES_1,
+        expectedCustomResourceValues.get(CUSTOM_RES_1));
+    assertCustomResourceValue(mqs.getRootMetrics(), metricsType, CUSTOM_RES_2,
+        expectedCustomResourceValues.get(CUSTOM_RES_2));
+    assertCustomResourceValue(mqs.getLeafMetrics(), metricsType, CUSTOM_RES_1,
+        expectedCustomResourceValues.get(CUSTOM_RES_1));
+    assertCustomResourceValue(mqs.getLeafMetrics(), metricsType, CUSTOM_RES_2,
+        expectedCustomResourceValues.get(CUSTOM_RES_2));
+  }
+
+  /** Returns a copy of the custom resource values mapped through func. */
+  private Map<String, Long> getModifiedCustomResourceValues(
+      Function<Long, Long> func) {
+    Map<String, Long> modifiedValues = Maps.newHashMap();
+    for (Map.Entry<String, Long> res : customResourceValues
+        .entrySet()) {
+      modifiedValues.put(res.getKey(), func.apply(res.getValue()));
+    }
+    return modifiedValues;
+  }
+
+  /** Builds the resource used by the scenarios from the configured values. */
+  private Resource createResource() {
+    if (!customResourceValues.isEmpty()) {
+      return ResourceTypesTestHelper.newResource(memoryMB, vCores,
+          ImmutableMap.<String, String>builder()
+              .put(CUSTOM_RES_1,
+                  String.valueOf(customResourceValues.get(CUSTOM_RES_1)))
+              .put(CUSTOM_RES_2,
+                  String.valueOf(customResourceValues.get(CUSTOM_RES_2)))
+              .build());
+    }
+    return ResourceTypesTestHelper.newResource(memoryMB, vCores,
+        Maps.newHashMap());
+  }
+}
diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceMetricsChecker.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceMetricsChecker.java
index cd617d7b9d0..05341aab10e 100644
--- a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceMetricsChecker.java
+++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceMetricsChecker.java
@@ -27,34 +27,31 @@
 import static org.apache.hadoop.test.MetricsAsserts.assertCounter;
 import static org.apache.hadoop.test.MetricsAsserts.assertGauge;
 import static org.apache.hadoop.test.MetricsAsserts.getMetrics;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_ALLOCATED;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_RELEASED;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_CONTAINERS;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_MB;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_V_CORES;
-import
static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_MB; -import static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_V_CORES; -import static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.PENDING_CONTAINERS; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricType.COUNTER_LONG; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricType.GAUGE_INT; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricType.GAUGE_LONG; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_ALLOCATED; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_RELEASED; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_CONTAINERS; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_MB; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_V_CORES; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_MB; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_V_CORES; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_CONTAINERS; import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_MB; import static 
org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_V_CORES; -import static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.RESERVED_CONTAINERS; -import static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.RESERVED_MB; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_CONTAINERS; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_MB; import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_V_CORES; final class ResourceMetricsChecker { private final static Logger LOG = LoggerFactory.getLogger(ResourceMetricsChecker.class); + enum ResourceMetricType { + GAUGE_INT, GAUGE_LONG, COUNTER_INT, COUNTER_LONG + } + private static final ResourceMetricsChecker INITIAL_CHECKER = new ResourceMetricsChecker() .gaugeLong(ALLOCATED_MB, 0) @@ -72,29 +69,41 @@ .gaugeInt(RESERVED_CONTAINERS, 0); enum ResourceMetricsKey { - ALLOCATED_MB("AllocatedMB"), - ALLOCATED_V_CORES("AllocatedVCores"), - ALLOCATED_CONTAINERS("AllocatedContainers"), - AGGREGATE_CONTAINERS_ALLOCATED("AggregateContainersAllocated"), - AGGREGATE_CONTAINERS_RELEASED("AggregateContainersReleased"), - AVAILABLE_MB("AvailableMB"), - AVAILABLE_V_CORES("AvailableVCores"), - PENDING_MB("PendingMB"), - PENDING_V_CORES("PendingVCores"), - PENDING_CONTAINERS("PendingContainers"), - RESERVED_MB("ReservedMB"), - RESERVED_V_CORES("ReservedVCores"), - RESERVED_CONTAINERS("ReservedContainers"); + ALLOCATED_MB("AllocatedMB", GAUGE_LONG), + ALLOCATED_V_CORES("AllocatedVCores", GAUGE_INT), + ALLOCATED_CONTAINERS("AllocatedContainers", GAUGE_INT), + AGGREGATE_CONTAINERS_ALLOCATED("AggregateContainersAllocated", + COUNTER_LONG), + 
AGGREGATE_CONTAINERS_RELEASED("AggregateContainersReleased", + COUNTER_LONG), + AVAILABLE_MB("AvailableMB", GAUGE_LONG), + AVAILABLE_V_CORES("AvailableVCores", GAUGE_INT), + PENDING_MB("PendingMB", GAUGE_LONG), + PENDING_V_CORES("PendingVCores", GAUGE_INT), + PENDING_CONTAINERS("PendingContainers", GAUGE_INT), + RESERVED_MB("ReservedMB", GAUGE_LONG), + RESERVED_V_CORES("ReservedVCores", GAUGE_INT), + RESERVED_CONTAINERS("ReservedContainers", GAUGE_INT), + AGGREGATE_VCORE_SECONDS_PREEMPTED( + "AggregateVcoreSecondsPreempted", COUNTER_LONG), + AGGREGATE_MEMORY_MB_SECONDS_PREEMPTED( + "AggregateMemoryMBSecondsPreempted", COUNTER_LONG); private String value; + private ResourceMetricType type; - ResourceMetricsKey(String value) { + ResourceMetricsKey(String value, ResourceMetricType type) { this.value = value; + this.type = type; } public String getValue() { return value; } + + public ResourceMetricType getType() { + return type; + } } private final Map gaugesLong; @@ -123,20 +132,31 @@ public static ResourceMetricsChecker create() { } ResourceMetricsChecker gaugeLong(ResourceMetricsKey key, long value) { + ensureTypeIsCorrect(key, GAUGE_LONG); gaugesLong.put(key, value); return this; } ResourceMetricsChecker gaugeInt(ResourceMetricsKey key, int value) { + ensureTypeIsCorrect(key, GAUGE_INT); gaugesInt.put(key, value); return this; } ResourceMetricsChecker counter(ResourceMetricsKey key, long value) { + ensureTypeIsCorrect(key, COUNTER_LONG); counters.put(key, value); return this; } + private void ensureTypeIsCorrect(ResourceMetricsKey + key, ResourceMetricType actualType) { + if (key.type != actualType) { + throw new IllegalStateException("Metrics type should be " + key.type + + " instead of " + actualType + " for metrics: " + key.value); + } + } + ResourceMetricsChecker checkAgainst(MetricsSource source) { if (source == null) { throw new IllegalStateException("MetricsSource should not be null!"); diff --git 
a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetrics.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetrics.java index c971d655e59..6667670d3f7 100644 --- a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetrics.java +++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetrics.java @@ -27,6 +27,7 @@ import static org.mockito.Mockito.mock; import static org.mockito.Mockito.when; +import com.google.common.collect.Lists; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.metrics2.MetricsRecordBuilder; import org.apache.hadoop.metrics2.MetricsSource; @@ -46,7 +47,76 @@ import org.junit.Before; import org.junit.Test; +import java.util.List; + public class TestQueueMetrics { + static class MultiQueueSetup { + private List queueMetrics = Lists.newArrayList(); + private List queueSources = Lists.newArrayList(); + private List userSources = Lists.newArrayList(); + + final String user; + + MultiQueueSetup(MetricsSystem ms, QueueHierarchy queueHierarchy, + String user) { + this.user = user; + init(ms, queueHierarchy); + + getLeafMetrics().submitApp(user); + + for (int i = 0; i < queueHierarchy.size(); i++) { + String queue = queueHierarchy.queueAtLevel(i); + userSources.add(userSource(ms, queue, user)); + } + + } + + private void init(MetricsSystem ms, QueueHierarchy queueHierarchy) { + for (int i = 0; i < queueHierarchy.size(); i++) { + final String queueName = queueHierarchy.queueAtLevel(i); + //root queue + if (i == 0) { + queueMetrics.add(QueueMetrics.forQueue(ms, queueName, 
null, + true, conf)); + } else { + Queue parentQueue = createMockQueue(queueMetrics.get(i - 1)); + queueMetrics.add( + QueueMetrics.forQueue(ms, queueName, parentQueue, true, conf)); + } + queueSources.add(queueSource(ms, queueName)); + } + } + + QueueMetrics getRootMetrics() { + return queueMetrics.get(0); + } + + QueueMetrics getLeafMetrics() { + return queueMetrics.get(queueMetrics.size() - 1); + } + + MetricsSource getRootQueueSource() { + return queueSources.get(0); + } + + MetricsSource getLeafQueueSource() { + return queueSources.get(queueSources.size() - 1); + } + + MetricsSource getRootUserSource() { + return userSources.get(0); + } + + MetricsSource getLeafUserSource() { + return userSources.get(userSources.size() - 1); + } + } + private static Queue createMockQueue(QueueMetrics metrics) { + Queue queue = mock(Queue.class); + when(queue.getMetrics()).thenReturn(metrics); + return queue; + } + private static final int GB = 1024; // MB private static final Configuration conf = new Configuration(); private MetricsSystem ms; @@ -396,66 +466,59 @@ public void testNodeTypeMetrics() { @Test public void testTwoLevelWithUserMetrics() { - String parentQueueName = "root"; - String leafQueueName = "root.leaf"; String user = "alice"; - - QueueMetrics parentMetrics = - QueueMetrics.forQueue(ms, parentQueueName, null, true, conf); - Queue parentQueue = mock(Queue.class); - when(parentQueue.getMetrics()).thenReturn(parentMetrics); - QueueMetrics metrics = - QueueMetrics.forQueue(ms, leafQueueName, parentQueue, true, conf); - MetricsSource parentQueueSource = queueSource(ms, parentQueueName); - MetricsSource queueSource = queueSource(ms, leafQueueName); AppSchedulingInfo app = mockApp(user); - metrics.submitApp(user); - MetricsSource userSource = userSource(ms, leafQueueName, user); - MetricsSource parentUserSource = userSource(ms, parentQueueName, user); + MultiQueueSetup mqs = new MultiQueueSetup(ms, + QueueHierarchy.create("root", "root.leaf"), user); AppMetricsChecker 
appMetricsQueueSourceChecker = AppMetricsChecker.create() .counter(APPS_SUBMITTED, 1) - .checkAgainst(queueSource, true); + .checkAgainst(mqs.getLeafQueueSource(), true); AppMetricsChecker appMetricsParentQueueSourceChecker = AppMetricsChecker.create() .counter(APPS_SUBMITTED, 1) - .checkAgainst(parentQueueSource, true); + .checkAgainst(mqs.getRootQueueSource(), true); AppMetricsChecker appMetricsUserSourceChecker = AppMetricsChecker.create() .counter(APPS_SUBMITTED, 1) - .checkAgainst(userSource, true); + .checkAgainst(mqs.getLeafUserSource(), true); AppMetricsChecker appMetricsParentUserSourceChecker = AppMetricsChecker.create() .counter(APPS_SUBMITTED, 1) - .checkAgainst(parentUserSource, true); + .checkAgainst(mqs.getRootUserSource(), true); - metrics.submitAppAttempt(user); + mqs.getLeafMetrics().submitAppAttempt(user); appMetricsQueueSourceChecker = AppMetricsChecker.createFromChecker(appMetricsQueueSourceChecker) .gaugeInt(APPS_PENDING, 1) - .checkAgainst(queueSource, true); + .checkAgainst(mqs.getLeafQueueSource(), true); appMetricsParentQueueSourceChecker = AppMetricsChecker.createFromChecker(appMetricsParentQueueSourceChecker) .gaugeInt(APPS_PENDING, 1) - .checkAgainst(parentQueueSource, true); + .checkAgainst(mqs.getRootQueueSource(), true); appMetricsUserSourceChecker = AppMetricsChecker.createFromChecker(appMetricsUserSourceChecker) .gaugeInt(APPS_PENDING, 1) - .checkAgainst(userSource, true); + .checkAgainst(mqs.getLeafUserSource(), true); appMetricsParentUserSourceChecker = AppMetricsChecker.createFromChecker(appMetricsParentUserSourceChecker) .gaugeInt(APPS_PENDING, 1) - .checkAgainst(parentUserSource, true); + .checkAgainst(mqs.getRootUserSource(), true); - parentMetrics.setAvailableResourcesToQueue(RMNodeLabelsManager.NO_LABEL, + mqs.getRootMetrics().setAvailableResourcesToQueue( + RMNodeLabelsManager.NO_LABEL, Resources.createResource(100*GB, 100)); - metrics.setAvailableResourcesToQueue(RMNodeLabelsManager.NO_LABEL, + 
mqs.getLeafMetrics().setAvailableResourcesToQueue( + RMNodeLabelsManager.NO_LABEL, Resources.createResource(100*GB, 100)); - parentMetrics.setAvailableResourcesToUser(RMNodeLabelsManager.NO_LABEL, + mqs.getRootMetrics().setAvailableResourcesToUser( + RMNodeLabelsManager.NO_LABEL, user, Resources.createResource(10*GB, 10)); - metrics.setAvailableResourcesToUser(RMNodeLabelsManager.NO_LABEL, + mqs.getLeafMetrics().setAvailableResourcesToUser( + RMNodeLabelsManager.NO_LABEL, user, Resources.createResource(10*GB, 10)); - metrics.incrPendingResources(RMNodeLabelsManager.NO_LABEL, + mqs.getLeafMetrics().incrPendingResources( + RMNodeLabelsManager.NO_LABEL, user, 5, Resources.createResource(3*GB, 3)); ResourceMetricsChecker resMetricsQueueSourceChecker = @@ -465,7 +528,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(PENDING_MB, 15 * GB) .gaugeInt(PENDING_V_CORES, 15) .gaugeInt(PENDING_CONTAINERS, 5) - .checkAgainst(queueSource); + .checkAgainst(mqs.getLeafQueueSource()); ResourceMetricsChecker resMetricsParentQueueSourceChecker = ResourceMetricsChecker.create() .gaugeLong(AVAILABLE_MB, 100 * GB) @@ -473,7 +536,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(PENDING_MB, 15 * GB) .gaugeInt(PENDING_V_CORES, 15) .gaugeInt(PENDING_CONTAINERS, 5) - .checkAgainst(parentQueueSource); + .checkAgainst(mqs.getRootQueueSource()); ResourceMetricsChecker resMetricsUserSourceChecker = ResourceMetricsChecker.create() .gaugeLong(AVAILABLE_MB, 10 * GB) @@ -481,7 +544,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(PENDING_MB, 15 * GB) .gaugeInt(PENDING_V_CORES, 15) .gaugeInt(PENDING_CONTAINERS, 5) - .checkAgainst(userSource); + .checkAgainst(mqs.getLeafUserSource()); ResourceMetricsChecker resMetricsParentUserSourceChecker = ResourceMetricsChecker.create() .gaugeLong(AVAILABLE_MB, 10 * GB) @@ -489,23 +552,23 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(PENDING_MB, 15 * GB) .gaugeInt(PENDING_V_CORES, 15) .gaugeInt(PENDING_CONTAINERS, 5) - 
.checkAgainst(parentUserSource); + .checkAgainst(mqs.getRootUserSource()); - metrics.runAppAttempt(app.getApplicationId(), user); + mqs.getLeafMetrics().runAppAttempt(app.getApplicationId(), user); appMetricsQueueSourceChecker = AppMetricsChecker.createFromChecker(appMetricsQueueSourceChecker) .gaugeInt(APPS_PENDING, 0) .gaugeInt(APPS_RUNNING, 1) - .checkAgainst(queueSource, true); + .checkAgainst(mqs.getLeafQueueSource(), true); appMetricsUserSourceChecker = AppMetricsChecker.createFromChecker(appMetricsUserSourceChecker) .gaugeInt(APPS_PENDING, 0) .gaugeInt(APPS_RUNNING, 1) - .checkAgainst(userSource, true); + .checkAgainst(mqs.getLeafUserSource(), true); - metrics.allocateResources(RMNodeLabelsManager.NO_LABEL, + mqs.getLeafMetrics().allocateResources(RMNodeLabelsManager.NO_LABEL, user, 3, Resources.createResource(2*GB, 2), true); - metrics.reserveResource(RMNodeLabelsManager.NO_LABEL, + mqs.getLeafMetrics().reserveResource(RMNodeLabelsManager.NO_LABEL, user, Resources.createResource(3*GB, 3)); // Available resources is set externally, as it depends on dynamic // configurable cluster/queue resources @@ -521,7 +584,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 3 * GB) .gaugeInt(RESERVED_V_CORES, 3) .gaugeInt(RESERVED_CONTAINERS, 1) - .checkAgainst(queueSource); + .checkAgainst(mqs.getLeafQueueSource()); resMetricsParentQueueSourceChecker = ResourceMetricsChecker .createFromChecker(resMetricsParentQueueSourceChecker) @@ -535,7 +598,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 3 * GB) .gaugeInt(RESERVED_V_CORES, 3) .gaugeInt(RESERVED_CONTAINERS, 1) - .checkAgainst(parentQueueSource); + .checkAgainst(mqs.getRootQueueSource()); resMetricsUserSourceChecker = ResourceMetricsChecker.createFromChecker(resMetricsUserSourceChecker) .gaugeLong(ALLOCATED_MB, 6 * GB) @@ -548,7 +611,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 3 * GB) .gaugeInt(RESERVED_V_CORES, 3) .gaugeInt(RESERVED_CONTAINERS, 
1) - .checkAgainst(userSource); + .checkAgainst(mqs.getLeafUserSource()); resMetricsParentUserSourceChecker = ResourceMetricsChecker .createFromChecker(resMetricsParentUserSourceChecker) .gaugeLong(ALLOCATED_MB, 6 * GB) @@ -561,11 +624,11 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 3 * GB) .gaugeInt(RESERVED_V_CORES, 3) .gaugeInt(RESERVED_CONTAINERS, 1) - .checkAgainst(parentUserSource); + .checkAgainst(mqs.getRootUserSource()); - metrics.releaseResources(RMNodeLabelsManager.NO_LABEL, + mqs.getLeafMetrics().releaseResources(RMNodeLabelsManager.NO_LABEL, user, 1, Resources.createResource(2*GB, 2)); - metrics.unreserveResource(RMNodeLabelsManager.NO_LABEL, + mqs.getLeafMetrics().unreserveResource(RMNodeLabelsManager.NO_LABEL, user, Resources.createResource(3*GB, 3)); ResourceMetricsChecker.createFromChecker(resMetricsQueueSourceChecker) .gaugeLong(ALLOCATED_MB, 4 * GB) @@ -575,7 +638,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 0) .gaugeInt(RESERVED_V_CORES, 0) .gaugeInt(RESERVED_CONTAINERS, 0) - .checkAgainst(queueSource); + .checkAgainst(mqs.getLeafQueueSource()); ResourceMetricsChecker.createFromChecker(resMetricsParentQueueSourceChecker) .gaugeLong(ALLOCATED_MB, 4 * GB) .gaugeInt(ALLOCATED_V_CORES, 4) @@ -584,7 +647,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 0) .gaugeInt(RESERVED_V_CORES, 0) .gaugeInt(RESERVED_CONTAINERS, 0) - .checkAgainst(parentQueueSource); + .checkAgainst(mqs.getRootQueueSource()); ResourceMetricsChecker.createFromChecker(resMetricsUserSourceChecker) .gaugeLong(ALLOCATED_MB, 4 * GB) .gaugeInt(ALLOCATED_V_CORES, 4) @@ -593,7 +656,7 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 0) .gaugeInt(RESERVED_V_CORES, 0) .gaugeInt(RESERVED_CONTAINERS, 0) - .checkAgainst(userSource); + .checkAgainst(mqs.getLeafUserSource()); ResourceMetricsChecker.createFromChecker(resMetricsParentUserSourceChecker) .gaugeLong(ALLOCATED_MB, 4 * GB) 
.gaugeInt(ALLOCATED_V_CORES, 4) @@ -602,46 +665,46 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 0) .gaugeInt(RESERVED_V_CORES, 0) .gaugeInt(RESERVED_CONTAINERS, 0) - .checkAgainst(parentUserSource); + .checkAgainst(mqs.getRootUserSource()); - metrics.finishAppAttempt( + mqs.getLeafMetrics().finishAppAttempt( app.getApplicationId(), app.isPending(), app.getUser()); appMetricsQueueSourceChecker = AppMetricsChecker .createFromChecker(appMetricsQueueSourceChecker) .counter(APPS_SUBMITTED, 1) .gaugeInt(APPS_RUNNING, 0) - .checkAgainst(queueSource, true); + .checkAgainst(mqs.getLeafQueueSource(), true); appMetricsParentQueueSourceChecker = AppMetricsChecker .createFromChecker(appMetricsParentQueueSourceChecker) .counter(APPS_SUBMITTED, 1) .gaugeInt(APPS_PENDING, 0) .gaugeInt(APPS_RUNNING, 0) - .checkAgainst(parentQueueSource, true); + .checkAgainst(mqs.getRootQueueSource(), true); appMetricsUserSourceChecker = AppMetricsChecker .createFromChecker(appMetricsUserSourceChecker) .counter(APPS_SUBMITTED, 1) .gaugeInt(APPS_RUNNING, 0) - .checkAgainst(userSource, true); + .checkAgainst(mqs.getLeafUserSource(), true); appMetricsParentUserSourceChecker = AppMetricsChecker .createFromChecker(appMetricsParentUserSourceChecker) .counter(APPS_SUBMITTED, 1) .gaugeInt(APPS_PENDING, 0) .gaugeInt(APPS_RUNNING, 0) - .checkAgainst(parentUserSource, true); + .checkAgainst(mqs.getRootUserSource(), true); - metrics.finishApp(user, RMAppState.FINISHED); + mqs.getLeafMetrics().finishApp(user, RMAppState.FINISHED); AppMetricsChecker.createFromChecker(appMetricsQueueSourceChecker) .counter(APPS_COMPLETED, 1) - .checkAgainst(queueSource, true); + .checkAgainst(mqs.getLeafQueueSource(), true); AppMetricsChecker.createFromChecker(appMetricsParentQueueSourceChecker) .counter(APPS_COMPLETED, 1) - .checkAgainst(parentQueueSource, true); + .checkAgainst(mqs.getRootQueueSource(), true); AppMetricsChecker.createFromChecker(appMetricsUserSourceChecker) .counter(APPS_COMPLETED, 1) 
- .checkAgainst(userSource, true); + .checkAgainst(mqs.getLeafUserSource(), true); AppMetricsChecker.createFromChecker(appMetricsParentUserSourceChecker) .counter(APPS_COMPLETED, 1) - .checkAgainst(parentUserSource, true); + .checkAgainst(mqs.getRootUserSource(), true); } @Test @@ -719,7 +782,7 @@ private static void checkAggregatedNodeTypes(MetricsSource source, assertCounter("AggregateOffSwitchContainersAllocated", offSwitch, rb); } - private static AppSchedulingInfo mockApp(String user) { + static AppSchedulingInfo mockApp(String user) { AppSchedulingInfo app = mock(AppSchedulingInfo.class); when(app.getUser()).thenReturn(user); ApplicationId appId = BuilderUtils.newApplicationId(1, 1); @@ -732,7 +795,7 @@ public static MetricsSource queueSource(MetricsSystem ms, String queue) { return ms.getSource(QueueMetrics.sourceName(queue).toString()); } - private static MetricsSource userSource(MetricsSystem ms, String queue, + static MetricsSource userSource(MetricsSystem ms, String queue, String user) { return ms.getSource(QueueMetrics.sourceName(queue). append(",user=").append(user).toString()); diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetricsForCustomResources.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetricsForCustomResources.java new file mode 100644 index 00000000000..d02e1da6baa --- /dev/null +++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetricsForCustomResources.java @@ -0,0 +1,475 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. 
See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * http://www.apache.org/licenses/LICENSE-2.0 + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.hadoop.yarn.server.resourcemanager.scheduler; + +import com.google.common.collect.ImmutableMap; +import org.apache.hadoop.conf.Configuration; +import org.apache.hadoop.metrics2.MetricsSource; +import org.apache.hadoop.metrics2.MetricsSystem; +import org.apache.hadoop.metrics2.impl.MetricsSystemImpl; +import org.apache.hadoop.yarn.api.records.Resource; +import org.apache.hadoop.yarn.api.records.ResourceInformation; +import org.apache.hadoop.yarn.conf.YarnConfiguration; +import org.apache.hadoop.yarn.resourcetypes.ResourceTypesTestHelper; +import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager; +import org.apache.hadoop.yarn.server.resourcemanager.scheduler.QueueMetricsForCustomResources.MetricsForCustomResource; + +import org.apache.hadoop.yarn.server.resourcemanager.scheduler + .TestQueueMetrics.MultiQueueSetup; +import org.apache.hadoop.yarn.util.resource.ResourceUtils; +import org.junit.Before; +import org.junit.Test; + +import java.util.HashMap; +import java.util.Map; + +import static org.apache.hadoop.yarn.conf.YarnConfiguration.DEFAULT_RM_SCHEDULER_MAXIMUM_ALLOCATION_MB; +import static org.apache.hadoop.yarn.conf.YarnConfiguration.DEFAULT_RM_SCHEDULER_MAXIMUM_ALLOCATION_VCORES; +import static 
org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_MB; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_V_CORES; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.TestQueueMetrics.queueSource; +import static org.junit.Assert.assertEquals; +import static org.junit.Assert.assertNotNull; + +public class TestQueueMetricsForCustomResources { + public static final long GB = 1024; // MB + private static final Configuration conf = new Configuration(); + private static final String CUSTOM_RES_1 = "custom_res_1"; + private static final String CUSTOM_RES_2 = "custom_res_2"; + private static final String ROOT_QUEUE_NAME = "root"; + private static final String LEAF_QUEUE_NAME = "root.leaf"; + public static final String USER = "alice"; + + private MetricsSystem ms; + + @Before + public void setUp() { + ms = new MetricsSystemImpl(); + QueueMetrics.clearQueueMetrics(); + initializeResourceTypes(); + } + + private void initializeResourceTypes() { + Map riMap = new HashMap<>(); + + ResourceInformation memory = ResourceInformation.newInstance( + ResourceInformation.MEMORY_MB.getName(), + ResourceInformation.MEMORY_MB.getUnits(), + YarnConfiguration.DEFAULT_RM_SCHEDULER_MINIMUM_ALLOCATION_MB, + DEFAULT_RM_SCHEDULER_MAXIMUM_ALLOCATION_MB); + ResourceInformation vcores = ResourceInformation.newInstance( + ResourceInformation.VCORES.getName(), + ResourceInformation.VCORES.getUnits(), + YarnConfiguration.DEFAULT_RM_SCHEDULER_MINIMUM_ALLOCATION_VCORES, + DEFAULT_RM_SCHEDULER_MAXIMUM_ALLOCATION_VCORES); + ResourceInformation res1 = ResourceInformation.newInstance(CUSTOM_RES_1, + ResourceInformation.VCORES.getUnits(), 0, 2000); + ResourceInformation res2 = ResourceInformation.newInstance(CUSTOM_RES_2, + ResourceInformation.VCORES.getUnits(), 0, 2000); + + riMap.put(ResourceInformation.MEMORY_URI, memory); + 
riMap.put(ResourceInformation.VCORES_URI, vcores);
+    riMap.put(CUSTOM_RES_1, res1);
+    riMap.put(CUSTOM_RES_2, res2);
+    ResourceUtils.initializeResourcesFromResourceInformationMap(riMap);
+  }
+
+  /**
+   * Reads the custom resource metrics of the given type from the queue
+   * metrics, looks up the entry for {@code resourceName} and asserts that it
+   * is present and equal to {@code expectedValue}.
+   *
+   * @param metrics queue metrics whose custom resource metrics are inspected
+   * @param metricsType metric category to read
+   * @param resourceName name of the custom resource to look up
+   * @param expectedValue value the metric is expected to hold
+   */
+  static void assertCustomResourceValue(QueueMetrics metrics,
+      MetricsForCustomResource metricsType, String resourceName,
+      long expectedValue) {
+    // Typed map (not a raw Map) so that get() yields a Long without a cast.
+    Map<String, Long> metricsValues = metrics.queueMetricsForCustomResources
+        .getMetricsByType(metricsType);
+    Long value = metricsValues.get(resourceName);
+    assertCustomResourceValueInternal(metricsType, resourceName,
+        expectedValue, value);
+  }
+
+  /**
+   * Asserts that {@code value} is non-null and equal to
+   * {@code expectedValue}; the resource name and metric type only appear in
+   * the failure messages.
+   *
+   * @param metricsType metric category, used in the failure message
+   * @param resourceName custom resource name, used in the failure message
+   * @param expectedValue expected metric value
+   * @param value actual metric value, must not be null
+   */
+  static void assertCustomResourceValueInternal(
+      MetricsForCustomResource metricsType, String resourceName,
+      long expectedValue, Long value) {
+    assertNotNull(
+        "QueueMetrics should have custom resource metrics value "
+            + "for resource: " + resourceName, value);
+    assertEquals(String.format(
+        "QueueMetrics should have custom resource metrics value %d "
+            + "for resource: %s for metrics type %s",
+        expectedValue, resourceName, metricsType), expectedValue,
+        (long) value);
+  }
+
+  /**
+   * Sets the available resources through the single-argument overload and
+   * checks the memory/vcore gauges and the AVAILABLE custom resource values.
+   */
+  @Test
+  public void testSetAvailableResourcesToQueue1() {
+    String queueName = "single";
+    QueueMetrics metrics = QueueMetrics.forQueue(ms, queueName, null,
+        false, conf);
+    MetricsSource queueSource = queueSource(ms, queueName);
+
+    metrics.setAvailableResourcesToQueue(ResourceTypesTestHelper.newResource(
+        GB, 4,
+        ImmutableMap.<String, String>builder()
+            .put(CUSTOM_RES_1, String.valueOf(5 * GB))
+            .put(CUSTOM_RES_2, String.valueOf(6 * GB))
+            .build()));
+    ResourceMetricsChecker.create()
+        .gaugeLong(AVAILABLE_MB, GB)
+        .gaugeInt(AVAILABLE_V_CORES, 4)
+        .checkAgainst(queueSource);
+
+    assertCustomResourceValue(metrics,
+        MetricsForCustomResource.AVAILABLE, CUSTOM_RES_1, 5 * GB);
+    assertCustomResourceValue(metrics,
+        MetricsForCustomResource.AVAILABLE, CUSTOM_RES_2, 6 * GB);
+  }
+
+  /**
+   * Sets the available resources through the (partition, limit) overload
+   * with a null partition and checks the memory/vcore gauges and the
+   * AVAILABLE custom resource values.
+   */
+  @Test
+  public void testSetAvailableResourcesToQueue2() {
+    String queueName = "single";
+    QueueMetrics metrics = QueueMetrics.forQueue(ms, queueName, null,
+        false, conf);
+    MetricsSource queueSource = queueSource(ms, queueName);
+
+    metrics.setAvailableResourcesToQueue(null,
+        ResourceTypesTestHelper.newResource(GB, 4,
+            ImmutableMap.<String, String>builder()
+                .put(CUSTOM_RES_1, String.valueOf(15 * GB))
+                .put(CUSTOM_RES_2, String.valueOf(20 * GB))
+                .build()));
+    ResourceMetricsChecker.create()
+        .gaugeLong(AVAILABLE_MB, GB)
+        .gaugeInt(AVAILABLE_V_CORES, 4)
+        .checkAgainst(queueSource);
+
+    assertCustomResourceValue(metrics,
+        MetricsForCustomResource.AVAILABLE, CUSTOM_RES_1, 15 * GB);
+    assertCustomResourceValue(metrics,
+        MetricsForCustomResource.AVAILABLE, CUSTOM_RES_2, 20 * GB);
+  }
+
+  /** Runs the increase-pending-resources scenario of the test case. */
+  @Test
+  public void testIncreasePendingResources() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withContainersToDecrease(2)
+        .withVCores(4)
+        .withVCoresToDecrease(2)
+        .withMemoryMB(4 * GB)
+        .withMemoryMBToDecrease(GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .withCustomResToDecrease(2 * GB)
+        .build();
+
+    testcase.testIncreasePendingResources();
+  }
+
+  /**
+   * Runs the increase-pending scenario first and then the decrease-pending
+   * scenario on the same test case.
+   */
+  @Test
+  public void testDecreasePendingResources() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withContainersToDecrease(2)
+        .withVCores(4)
+        .withVCoresToDecrease(2)
+        .withMemoryMB(4 * GB)
+        .withMemoryMBToDecrease(GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .withCustomResToDecrease(2 * GB)
+        .build();
+
+    testcase.testIncreasePendingResources();
+    testcase.testDecreasePendingResources();
+  }
+
+  /** Runs the allocate scenario with the decrease-pending flag off. */
+  @Test
+  public void testAllocateResourcesWithoutDecreasePending() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withVCores(4)
+        .withMemoryMB(4 * GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .build();
+
+    testcase.testAllocateResources(false);
+  }
+
+  /**
+   * Increases pending resources and then runs the allocate scenario with the
+   * decrease-pending flag on.
+   */
+  @Test
+  public void testAllocateResourcesWithDecreasePending() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withContainersToDecrease(2)
+        .withVCores(4)
+        .withVCoresToDecrease(2)
+        .withMemoryMB(4 * GB)
+        .withMemoryMBToDecrease(GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .withCustomResToDecrease(2 * GB)
+        .build();
+
+    // First, increase pending resources.
+    testcase.testIncreasePendingResources();
+
+    // Then allocate with decrease pending resources.
+    testcase.testAllocateResources(true);
+  }
+
+  /**
+   * Runs the "without container" variants of the increase-pending and
+   * allocate scenarios; no container count is configured on the builder.
+   */
+  @Test
+  public void testAllocateResourcesWithoutContainer() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withVCores(4)
+        .withMemoryMB(4 * GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .build();
+
+    // First, increase pending resources.
+    testcase.testIncreasePendingResourcesWithoutContainer();
+
+    testcase.testAllocateResourcesWithoutContainer();
+  }
+
+  /** Allocates resources and then runs the release-with-containers check. */
+  @Test
+  public void testReleaseResources() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withContainersToDecrease(2)
+        .withVCores(4)
+        .withVCoresToDecrease(2)
+        .withMemoryMB(4 * GB)
+        .withMemoryMBToDecrease(GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .withCustomResToDecrease(2 * GB)
+        .build();
+
+    // First, allocate some resources.
+    testcase.testAllocateResources(false);
+
+    testcase.testReleaseResourcesWithContainers();
+  }
+
+  /**
+   * Runs the preempted-seconds scenario over a four-level queue hierarchy
+   * with a duration of one second.
+   */
+  @Test
+  public void testUpdatePreemptedSecondsForCustomResources() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withQueueHierarchy("root", "root.subQueue", "root.subQueue.subQueue2",
+            "root.subQueue.subQueue2.leafQueue")
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withVCores(4)
+        .withMemoryMB(4 * GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .build();
+
+    final int seconds = 1;
+    testcase.testUpdatePreemptedSeconds(seconds);
+  }
+
+  /**
+   * Runs the preempted-seconds scenario over a four-level queue hierarchy
+   * with a duration of fifteen seconds.
+   */
+  @Test
+  public void testUpdatePreemptedSecondsForCustomResourcesMoreSeconds() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withQueueHierarchy("root", "root.subQueue", "root.subQueue.subQueue2",
+            "root.subQueue.subQueue2.leafQueue")
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withVCores(4)
+        .withMemoryMB(4 * GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .build();
+
+    final int seconds = 15;
+    testcase.testUpdatePreemptedSeconds(seconds);
+  }
+
+  /** Runs the reserve-resources scenario of the test case. */
+  @Test
+  public void testReserveResources() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withVCores(4)
+        .withMemoryMB(4 * GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .build();
+
+    testcase.testReserveResources();
+  }
+
+  /** Reserves resources and then runs the unreserve-resources scenario. */
+  @Test
+  public void testUnreserveResources() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withVCores(4)
+        .withMemoryMB(4 * GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .build();
+
+    testcase.testReserveResources();
+    testcase.testUnreserveResources();
+  }
+
+  /**
+   * Runs the get-allocated-resources scenario with custom resource values
+   * configured on the test case.
+   */
+  @Test
+  public void testGetAllocatedResourcesWithCustomResources() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withVCores(4)
+        .withMemoryMB(4 * GB)
+        .withCustomResourceValue(CUSTOM_RES_1, 15 * GB)
+        .withCustomResourceValue(CUSTOM_RES_2, 20 * GB)
+        .build();
+
+    testcase.testGetAllocatedResources();
+  }
+
+  /**
+   * Runs the get-allocated-resources scenario with only memory and vcores
+   * configured (no custom resource values).
+   */
+  @Test
+  public void testGetAllocatedResourcesWithoutCustomResources() {
+    QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create()
+        .withMetricSystem(ms)
+        .withParentQueueName(ROOT_QUEUE_NAME)
+        .withLeafQueueName(LEAF_QUEUE_NAME)
+        .withUser(USER)
+        .withPartition(RMNodeLabelsManager.NO_LABEL)
+        .withContainers(5)
+        .withVCores(4)
+        .withMemoryMB(4 * GB)
+        .build();
+
+    testcase.testGetAllocatedResources();
+  }
+
+  /**
+   * With nothing allocated and a cluster resource whose custom resources are
+   * both zero, the maximum custom resource utilization must be 0.
+   */
+  @Test
+  public void testGetMaxUtilizationOfCustomResourcesWithoutAllocatedResource() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        QueueHierarchy.create(ROOT_QUEUE_NAME, LEAF_QUEUE_NAME), USER);
+    Resource clusterResource = ResourceTypesTestHelper.newResource(4 * GB, 8,
+        ImmutableMap.<String, String>builder()
+            .put(CUSTOM_RES_1,
+                String.valueOf(0L))
+            .put(CUSTOM_RES_2,
+                String.valueOf(0L))
+            .build());
+    float utilization = mqs.getLeafMetrics()
+        .getMaxUtilizationOfCustomResources(clusterResource);
+    assertEquals(0, utilization, 0.0);
+  }
+
+  /**
+   * With custom resources allocated (10 and 20) but a cluster resource whose
+   * custom resources are both zero, the maximum utilization must still be 0.
+   */
+  @Test
+  public void testGetMaxUtilizationOfCustomResourcesWithAllocatedResource() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        QueueHierarchy.create(ROOT_QUEUE_NAME, LEAF_QUEUE_NAME), USER);
+
+    Resource allocatedResource = ResourceTypesTestHelper.newResource(4 * GB, 8,
+        ImmutableMap.<String, String>builder()
+            .put(CUSTOM_RES_1,
+                String.valueOf(10L))
+            .put(CUSTOM_RES_2,
+                String.valueOf(20L))
+            .build());
+    mqs.getLeafMetrics().allocateResources(RMNodeLabelsManager.NO_LABEL,
+        mqs.user, 1, allocatedResource, false);
+
+    Resource clusterResource = ResourceTypesTestHelper.newResource(4 * GB, 8,
+        ImmutableMap.<String, String>builder()
+            .put(CUSTOM_RES_1,
+                String.valueOf(0L))
+            .put(CUSTOM_RES_2,
+                String.valueOf(0L))
+            .build());
+    float utilization = mqs.getLeafMetrics()
+        .getMaxUtilizationOfCustomResources(clusterResource);
+    assertEquals(0, utilization, 0.0);
+  }
+
+  /**
+   * With custom resources allocated (10 and 20) against a cluster resource
+   * of 5 for each, the maximum utilization is expected to be 4.0
+   * (presumably 20 / 5, the larger of the two ratios).
+   */
+  @Test
+  public void testGetMaxUtilizationOfCustomResourcesWithAllocatedResource2() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        QueueHierarchy.create(ROOT_QUEUE_NAME, LEAF_QUEUE_NAME), USER);
+
+    Resource allocatedResource = ResourceTypesTestHelper.newResource(4 * GB, 8,
+        ImmutableMap.<String, String>builder()
+            .put(CUSTOM_RES_1,
+                String.valueOf(10L))
+            .put(CUSTOM_RES_2,
+                String.valueOf(20L))
+            .build());
+    mqs.getLeafMetrics().allocateResources(RMNodeLabelsManager.NO_LABEL,
+        mqs.user, 1, allocatedResource, false);
+
+    Resource clusterResource = ResourceTypesTestHelper.newResource(4 * GB, 8,
+        ImmutableMap.<String, String>builder()
+            .put(CUSTOM_RES_1,
+                String.valueOf(5L))
+            .put(CUSTOM_RES_2,
+                String.valueOf(5L))
+            .build());
+    float utilization = mqs.getLeafMetrics()
+        .getMaxUtilizationOfCustomResources(clusterResource);
+    assertEquals(4.0, utilization, 0.0);
+  }
+
+}