diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetrics.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetrics.java index 20a5a1ff790..0a0e9d627e7 100644 --- a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetrics.java +++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetrics.java @@ -19,6 +19,8 @@ package org.apache.hadoop.yarn.server.resourcemanager.scheduler; import static org.apache.hadoop.metrics2.lib.Interns.info; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler + .QueueMetricsForCustomResources.MetricsForCustomResource.*; import java.util.ArrayList; import java.util.HashMap; @@ -45,6 +47,8 @@ import org.apache.hadoop.yarn.conf.YarnConfiguration; import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager; import org.apache.hadoop.yarn.server.resourcemanager.rmapp.RMAppState; +import org.apache.hadoop.yarn.server.resourcemanager.scheduler + .QueueMetricsForCustomResources.MetricsForCustomResource; import org.apache.hadoop.yarn.server.utils.BuilderUtils; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -114,6 +118,7 @@ protected final MetricsSystem metricsSystem; protected final Map users; protected final Configuration conf; + protected final QueueMetricsForCustomResources queueMetricsForCustomResources; protected QueueMetrics(MetricsSystem ms, String queueName, Queue parent, boolean enableUserMetrics, Configuration conf) { @@ -123,6 +128,7 @@ protected QueueMetrics(MetricsSystem ms, String queueName, Queue parent, this.users = 
enableUserMetrics ? new HashMap() : null; metricsSystem = ms; + this.queueMetricsForCustomResources = new QueueMetricsForCustomResources(); this.conf = conf; runningTime = buildBuckets(conf); } @@ -350,9 +356,11 @@ public void moveAppTo(AppSchedulingInfo app) { * @param limit resource limit */ public void setAvailableResourcesToQueue(String partition, Resource limit) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { availableMB.set(limit.getMemorySize()); availableVCores.set(limit.getVirtualCores()); + queueMetricsForCustomResources.set(MetricsForCustomResource.AVAILABLE, + limit); } } @@ -392,7 +400,7 @@ public void setAvailableResourcesToUser(String partition, */ public void incrPendingResources(String partition, String user, int containers, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { _incrPendingResources(containers, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { @@ -408,12 +416,14 @@ private void _incrPendingResources(int containers, Resource res) { pendingContainers.incr(containers); pendingMB.incr(res.getMemorySize() * containers); pendingVCores.incr(res.getVirtualCores() * containers); + queueMetricsForCustomResources.increaseWithMultiplier(PENDING, res, + containers); } public void decrPendingResources(String partition, String user, int containers, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { _decrPendingResources(containers, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { @@ -429,6 +439,8 @@ private void _decrPendingResources(int containers, Resource res) { pendingContainers.decr(containers); pendingMB.decr(res.getMemorySize() * containers); 
pendingVCores.decr(res.getVirtualCores() * containers); + queueMetricsForCustomResources.decreaseWithMultiplier(PENDING, res, + containers); } public void incrNodeTypeAggregations(String user, NodeType type) { @@ -452,12 +464,15 @@ public void incrNodeTypeAggregations(String user, NodeType type) { public void allocateResources(String partition, String user, int containers, Resource res, boolean decrPending) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { allocatedContainers.incr(containers); aggregateContainersAllocated.incr(containers); allocatedMB.incr(res.getMemorySize() * containers); allocatedVCores.incr(res.getVirtualCores() * containers); + queueMetricsForCustomResources.increaseWithMultiplier(ALLOCATED, res, + containers); + if (decrPending) { _decrPendingResources(containers, res); } @@ -479,12 +494,14 @@ public void allocateResources(String partition, String user, * @param res */ public void allocateResources(String partition, String user, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { allocatedMB.incr(res.getMemorySize()); allocatedVCores.incr(res.getVirtualCores()); + queueMetricsForCustomResources.increase(ALLOCATED, res); pendingMB.decr(res.getMemorySize()); pendingVCores.decr(res.getVirtualCores()); + queueMetricsForCustomResources.decrease(PENDING, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { @@ -498,11 +515,14 @@ public void allocateResources(String partition, String user, Resource res) { public void releaseResources(String partition, String user, int containers, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { allocatedContainers.decr(containers); 
aggregateContainersReleased.incr(containers);
       allocatedMB.decr(res.getMemorySize() * containers);
       allocatedVCores.decr(res.getVirtualCores() * containers);
+      queueMetricsForCustomResources.decreaseWithMultiplier(ALLOCATED, res,
+          containers);
+
       QueueMetrics userMetrics = getUserMetrics(user);
       if (userMetrics != null) {
         userMetrics.releaseResources(partition, user, containers, res);
@@ -519,9 +539,11 @@ public void releaseResources(String partition,
    * @param user
    * @param res
    */
-  public void releaseResources(String user, Resource res) {
+  private void releaseResources(String user, Resource res) {
     allocatedMB.decr(res.getMemorySize());
     allocatedVCores.decr(res.getVirtualCores());
+    queueMetricsForCustomResources.decrease(ALLOCATED, res);
+
     QueueMetrics userMetrics = getUserMetrics(user);
     if (userMetrics != null) {
       userMetrics.releaseResources(user, res);
@@ -552,8 +574,18 @@ public void updatePreemptedVcoreSeconds(long vcoreSeconds) {
     }
   }
 
+  public void updatePreemptedSecondsForCustomResources(Resource res,
+      long seconds) {
+    queueMetricsForCustomResources
+        .increaseWithMultiplier(AGGREGATE_PREEMPTED_SECONDS, res, seconds);
+    if (parent != null) {
+      // Recurse so that every ancestor queue is updated, not just the parent.
+      parent.updatePreemptedSecondsForCustomResources(res, seconds);
+    }
+  }
+
   public void reserveResource(String partition, String user, Resource res) {
-    if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) {
+    if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) {
       reserveResource(user, res);
     }
   }
@@ -562,6 +594,7 @@ public void reserveResource(String user, Resource res) {
     reservedContainers.incr();
     reservedMB.incr(res.getMemorySize());
     reservedVCores.incr(res.getVirtualCores());
+    queueMetricsForCustomResources.increase(RESERVED, res);
     QueueMetrics userMetrics = getUserMetrics(user);
     if (userMetrics != null) {
       userMetrics.reserveResource(user, res);
@@ -571,10 +604,11 @@ public void reserveResource(String user, Resource res) {
     }
   }
 
-  public
void unreserveResource(String user, Resource res) { + private void unreserveResource(String user, Resource res) { reservedContainers.decr(); reservedMB.decr(res.getMemorySize()); reservedVCores.decr(res.getVirtualCores()); + queueMetricsForCustomResources.decrease(RESERVED, res); QueueMetrics userMetrics = getUserMetrics(user); if (userMetrics != null) { userMetrics.unreserveResource(user, res); @@ -585,7 +619,7 @@ public void unreserveResource(String user, Resource res) { } public void unreserveResource(String partition, String user, Resource res) { - if(partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { + if (partition == null || partition.equals(RMNodeLabelsManager.NO_LABEL)) { unreserveResource(user, res); } } @@ -647,10 +681,18 @@ public int getAppsKilled() { public int getAppsFailed() { return appsFailed.value(); } - + public Resource getAllocatedResources() { + if (queueMetricsForCustomResources.isThereAnyAllocatedResource()) { + return Resource.newInstance(allocatedMB.value(), allocatedVCores.value(), + queueMetricsForCustomResources.getAllocatedCustomResources()); + } return BuilderUtils.newResource(allocatedMB.value(), - (int) allocatedVCores.value()); + allocatedVCores.value()); + } + + public float getMaxUtilizationOfCustomResources(Resource clusterResource) { + return queueMetricsForCustomResources.getMaxAllocationUtilization(clusterResource); } public long getAllocatedMB() { diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsForCustomResources.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsForCustomResources.java new file mode 100644 index 00000000000..b2948163195 --- /dev/null +++ 
b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsForCustomResources.java
@@ -0,0 +1,170 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ * http://www.apache.org/licenses/LICENSE-2.0
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.hadoop.yarn.server.resourcemanager.scheduler;
+
+import com.google.common.annotations.VisibleForTesting;
+import com.google.common.collect.Maps;
+import org.apache.hadoop.yarn.api.records.Resource;
+import org.apache.hadoop.yarn.api.records.ResourceInformation;
+import org.apache.hadoop.yarn.util.resource.ResourceUtils;
+
+import java.util.Map;
+import java.util.function.BiFunction;
+
+/**
+ * Tracks queue metrics for custom resource types, i.e. the resource types
+ * other than the memory and vcores values that {@link QueueMetrics} tracks
+ * itself. One map from resource name to value is kept for every
+ * {@link MetricsForCustomResource}.
+ * <p>
+ * The maps are plain hash maps and this class performs no synchronization.
+ */
+public class QueueMetricsForCustomResources {
+  /**
+   * Index of the first custom resource in {@link Resource#getResources()}.
+   * NOTE(review): assumes the preceding slots hold memory and vcores; confirm
+   * against ResourceUtils.
+   */
+  private static final int FIRST_CUSTOM_RESOURCE_INDEX = 2;
+
+  private final Map<String, Long> allocatedCustomResources = Maps.newHashMap();
+  private final Map<String, Long> availableCustomResources = Maps.newHashMap();
+  private final Map<String, Long> pendingCustomResources = Maps.newHashMap();
+  private final Map<String, Long> reservedCustomResources = Maps.newHashMap();
+  private final Map<String, Long> aggregatePreemptedSecondsForCustomResources =
+      Maps.newHashMap();
+
+  /** The kinds of per-resource values that are tracked. */
+  public enum MetricsForCustomResource {
+    ALLOCATED, AVAILABLE, PENDING, RESERVED, AGGREGATE_PREEMPTED_SECONDS
+  }
+
+  /** Adds each custom resource value of {@code res} to the metric. */
+  public void increase(MetricsForCustomResource metricsType, Resource res) {
+    update(metricsType, res, Long::sum);
+  }
+
+  /**
+   * Adds each custom resource value of {@code res}, multiplied by
+   * {@code multiplier}, to the metric.
+   */
+  public void increaseWithMultiplier(MetricsForCustomResource metricsType,
+      Resource res, long multiplier) {
+    update(metricsType, res, (v1, v2) -> v1 + v2 * multiplier);
+  }
+
+  /** Subtracts each custom resource value of {@code res} from the metric. */
+  public void decrease(MetricsForCustomResource metricsType, Resource res) {
+    update(metricsType, res, (v1, v2) -> v1 - v2);
+  }
+
+  /**
+   * Subtracts each custom resource value of {@code res}, multiplied by
+   * {@code multiplier}, from the metric. The multiplier is a {@code long} to
+   * match {@link #increaseWithMultiplier}; {@code int} arguments still work.
+   */
+  public void decreaseWithMultiplier(MetricsForCustomResource metricsType,
+      Resource res, long multiplier) {
+    update(metricsType, res, (v1, v2) -> v1 - v2 * multiplier);
+  }
+
+  /** Overwrites the metric with the custom resource values of {@code res}. */
+  public void set(MetricsForCustomResource metricsType, Resource res) {
+    update(metricsType, res, (v1, v2) -> v2);
+  }
+
+  /**
+   * Applies {@code operation} to (current value, value in {@code res}) for
+   * every custom resource of {@code res} and stores the result. A resource
+   * that has no entry yet is treated as having the value 0.
+   */
+  private void update(MetricsForCustomResource metricsType,
+      Resource res, BiFunction<Long, Long, Long> operation) {
+    if (ResourceUtils.getNumberOfKnownResourceTypes()
+        <= FIRST_CUSTOM_RESOURCE_INDEX) {
+      // No custom resource type is known, so there is nothing to track.
+      return;
+    }
+    // The target map depends only on the metric type, so look it up once.
+    final Map<String, Long> metrics = getMetricsByType(metricsType);
+    final ResourceInformation[] resources = res.getResources();
+    for (int i = FIRST_CUSTOM_RESOURCE_INDEX; i < resources.length; i++) {
+      final String name = resources[i].getName();
+      // Map.merge would store the operand as-is for a missing key, which is
+      // wrong for decrements, so a missing entry is read as 0 instead.
+      metrics.put(name, operation.apply(metrics.getOrDefault(name, 0L),
+          resources[i].getValue()));
+    }
+  }
+
+  /** Returns whether any custom resource allocation has been recorded. */
+  boolean isThereAnyAllocatedResource() {
+    return !allocatedCustomResources.isEmpty();
+  }
+
+  /**
+   * Returns the live, mutable map of allocated custom resources (resource
+   * name to value); it is not a copy.
+   */
+  public Map<String, Long> getAllocatedCustomResources() {
+    return allocatedCustomResources;
+  }
+
+  /**
+   * Returns the largest allocated / cluster-total ratio over all allocated
+   * custom resources, or 0 if there are none. Resources whose value in
+   * {@code clusterResource} is 0 are skipped.
+   */
+  public float getMaxAllocationUtilization(Resource clusterResource) {
+    float maxUtilization = 0;
+    for (Map.Entry<String, Long> allocated
+        : allocatedCustomResources.entrySet()) {
+      final long clusterTotal =
+          clusterResource.getResourceValue(allocated.getKey());
+      if (clusterTotal != 0) {
+        maxUtilization = Math.max(maxUtilization,
+            (float) allocated.getValue() / clusterTotal);
+      }
+    }
+    return maxUtilization;
+  }
+
+  /**
+   * Returns the backing map for the given metric type.
+   *
+   * @throws IllegalStateException if no map exists for {@code metricsType}
+   */
+  @VisibleForTesting
+  Map<String, Long> getMetricsByType(
+      MetricsForCustomResource metricsType) {
+    switch(metricsType) {
+    case AVAILABLE:
+      return availableCustomResources;
+    case ALLOCATED:
+      return allocatedCustomResources;
+    case PENDING:
+      return pendingCustomResources;
+    case RESERVED:
+      return reservedCustomResources;
+    case AGGREGATE_PREEMPTED_SECONDS:
+      return aggregatePreemptedSecondsForCustomResources;
+    default:
+      throw new IllegalStateException("No map found for metrics type: " +
+          metricsType);
+    }
+  }
+}
diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java
index 75d61442577..36883c3eeda 100644
---
a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java
+++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/capacity/CapacityScheduler.java
@@ -2106,7 +2106,8 @@ protected void completedContainerInternal(
   private void updateQueuePreemptionMetrics(
       CSQueue queue, RMContainer rmc) {
     QueueMetrics qMetrics = queue.getMetrics();
-    long usedMillis = rmc.getFinishTime() - rmc.getCreationTime();
+    final long usedMillis = rmc.getFinishTime() - rmc.getCreationTime();
+    final long usedSeconds = usedMillis / DateUtils.MILLIS_PER_SECOND;
     Resource containerResource = rmc.getAllocatedResource();
     qMetrics.preemptContainer();
     long mbSeconds = (containerResource.getMemorySize() * usedMillis)
@@ -2115,6 +2116,8 @@ private void updateQueuePreemptionMetrics(
         / DateUtils.MILLIS_PER_SECOND;
     qMetrics.updatePreemptedMemoryMBSeconds(mbSeconds);
     qMetrics.updatePreemptedVcoreSeconds(vcSeconds);
+    qMetrics.updatePreemptedSecondsForCustomResources(containerResource,
+        usedSeconds);
   }
 
   @Lock(Lock.NoLock.class)
diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsTestcase.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsTestcase.java
new file mode 100644
index 00000000000..447244bb87b
--- /dev/null
+++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/QueueMetricsTestcase.java
@@ -0,0 +1,446 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ * http://www.apache.org/licenses/LICENSE-2.0
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.hadoop.yarn.server.resourcemanager.scheduler;
+
+import com.google.common.collect.ImmutableMap;
+import com.google.common.collect.Maps;
+import org.apache.hadoop.metrics2.MetricsSystem;
+import org.apache.hadoop.yarn.api.records.Resource;
+import org.apache.hadoop.yarn.resourcetypes.ResourceTypesTestHelper;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler
+    .QueueMetricsForCustomResources.MetricsForCustomResource;
+import org.apache.hadoop.yarn.server.resourcemanager.scheduler
+    .TestQueueMetrics.MultiQueueSetup;
+
+import java.util.Map;
+import java.util.function.Function;
+
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
+    .ResourceMetricsChecker.ResourceMetricsKey.*;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
+    .TestQueueMetricsForCustomResources.assertCustomResourceValue;
+import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
+    .TestQueueMetricsForCustomResources.assertCustomResourceValueInternal;
+
+/**
+ * A parameterized queue-metrics scenario: each test method performs one
+ * metrics operation on the leaf queue of a {@link MultiQueueSetup} and
+ * verifies the resulting standard and custom resource metric values.
+ * Instances are created through {@link Builder}.
+ */
+public class QueueMetricsTestcase {
+
+  /** Selects which metrics sources assertMetricsInternal checks. */
+  private enum MetricsAssertType {
+    ALL, PARENT_QUEUE_ONLY
+  }
+
+  /** Fluent builder; numeric fields that are never set stay at 0. */
+  public static final class Builder {
+    private MetricsSystem ms;
+    private Map<String, Long> customResourceValues = Maps.newHashMap();
+    private int containers;
+    private int containersToDecrease;
+    private int vCores;
+    private int vCoresToDecrease;
+    private long customResToDecrease;
+    private String parentQueueName;
+    private String leafQueueName;
+    private String user;
+    private String partition;
+    private long memoryMB;
+    private long memoryMBToDecrease;
+
+    private Builder() {
+    }
+
+    public static Builder create() {
+      return new Builder();
+    }
+
+    public Builder withContainers(int containers) {
+      this.containers = containers;
+      return this;
+    }
+
+    public Builder withContainersToDecrease(int containersToDecrease) {
+      this.containersToDecrease = containersToDecrease;
+      return this;
+    }
+
+    public Builder withVCores(int vCores) {
+      this.vCores = vCores;
+      return this;
+    }
+
+    public Builder withVCoresToDecrease(int vCoresToDecrease) {
+      this.vCoresToDecrease = vCoresToDecrease;
+      return this;
+    }
+
+    public Builder withMemoryMB(long memoryMB) {
+      this.memoryMB = memoryMB;
+      return this;
+    }
+
+    public Builder withMemoryMBToDecrease(long memoryMBToDecrease) {
+      this.memoryMBToDecrease = memoryMBToDecrease;
+      return this;
+    }
+
+    public Builder withCustomResourceValue(String name, Long value) {
+      customResourceValues.put(name, value);
+      return this;
+    }
+
+    public Builder withCustomResToDecrease(long customResToDecrease) {
+      this.customResToDecrease = customResToDecrease;
+      return this;
+    }
+
+    public Builder withParentQueueName(String parentQueueName) {
+      this.parentQueueName = parentQueueName;
+      return this;
+    }
+
+    public Builder withLeafQueueName(String leafQueueName) {
+      this.leafQueueName = leafQueueName;
+      return this;
+    }
+
+    public Builder withUser(String user) {
+      this.user = user;
+      return this;
+    }
+
+    public Builder withPartition(String partition) {
+      this.partition = partition;
+      return this;
+    }
+
+    public QueueMetricsTestcase build() {
+      return new QueueMetricsTestcase(ms, leafQueueName, parentQueueName, user,
+          partition, customResourceValues, containers, containersToDecrease,
+          vCores, vCoresToDecrease, memoryMB, memoryMBToDecrease,
+          customResToDecrease);
+    }
+
+    public Builder withMetricSystem(MetricsSystem ms) {
+      this.ms = ms;
+      return this;
+    }
+  }
+
+  private static final String CUSTOM_RES_1 = "custom_res_1";
+  private static final String CUSTOM_RES_2 = "custom_res_2";
+  private final MetricsSystem ms;
+  private final String leafQueueName;
+  private final String parentQueueName;
+  private final Map<String, Long> customResourceValues;
+  private final int containers;
+  private final int containersToDecrease;
+  private final int vCores;
+  private final int vCoresToDecrease;
+  private final long memoryMB;
+  private final long memoryMBToDecrease;
+  private final long customResToDecrease;
+  private final String user;
+  private final String partition;
+
+
+  private QueueMetricsTestcase(MetricsSystem ms, String leafQueueName, String
+      parentQueueName, String user, String partition, Map<String, Long>
+      customResourceValues, int containers, int containersToDecrease, int
+      vCores, int vCoresToDecrease, long memoryMB, long memoryMBToDecrease,
+      long customResToDecrease) {
+    this.ms = ms;
+    this.leafQueueName = leafQueueName;
+    this.parentQueueName = parentQueueName;
+    this.customResourceValues = customResourceValues;
+    this.containers = containers;
+    this.containersToDecrease = containersToDecrease;
+    this.vCores = vCores;
+    this.vCoresToDecrease = vCoresToDecrease;
+    this.memoryMB = memoryMB;
+    this.memoryMBToDecrease = memoryMBToDecrease;
+    this.customResToDecrease = customResToDecrease;
+    this.user = user;
+    this.partition = partition;
+  }
+
+  void testIncreasePendingResources() {
+    testIncreasePendingResourcesInternal(true);
+  }
+
+  void testIncreasePendingResourcesWithoutContainer() {
+    testIncreasePendingResourcesInternal(false);
+  }
+
+  /**
+   * Increases pending resources on the leaf queue and verifies the pending
+   * metrics; uses a single container when {@code useContainers} is false.
+   */
+  private void testIncreasePendingResourcesInternal(boolean useContainers) {
+    final int containers;
+    if (useContainers) {
+      containers = this.containers;
+    } else {
+      containers = 1;
+    }
+
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    mqs.leafMetrics.incrPendingResources(partition, mqs.user, containers,
+        createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(PENDING_CONTAINERS, containers)
+        .gaugeLong(PENDING_MB, containers * memoryMB)
+        .gaugeInt(PENDING_V_CORES, containers * vCores)
+        .checkAgainst(mqs.leafQueueSource);
+    assertMetrics(mqs, checker, MetricsForCustomResource.PENDING,
+        getModifiedCustomResourceValues(v -> v * containers));
+  }
+
+  public void testDecreasePendingResources() {
+    final int containersAfterDecrease = containers - containersToDecrease;
+    final int vcoresAfterDecrease =
+        (vCores * containers) - (vCoresToDecrease * containersToDecrease);
+    final long memoryAfterDecrease = (memoryMB * containers)
+        - (memoryMBToDecrease * containersToDecrease);
+
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    mqs.leafMetrics.decrPendingResources(partition, user, containersToDecrease,
+        ResourceTypesTestHelper.newResource(memoryMBToDecrease, vCoresToDecrease,
+            ImmutableMap.<String, String>builder()
+                .put(CUSTOM_RES_1, String.valueOf(customResToDecrease))
+                .put(CUSTOM_RES_2, String.valueOf(customResToDecrease))
+                .build()));
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(PENDING_CONTAINERS, containersAfterDecrease)
+        .gaugeLong(PENDING_MB, memoryAfterDecrease)
+        .gaugeInt(PENDING_V_CORES, vcoresAfterDecrease)
+        .checkAgainst(mqs.leafQueueSource);
+
+    assertMetrics(mqs, checker, MetricsForCustomResource.PENDING,
+        getModifiedCustomResourceValues(v -> v * containers
+            - (customResToDecrease * containersToDecrease)));
+  }
+
+  public void testAllocateResources(boolean decreasePending) {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    mqs.leafMetrics.allocateResources(partition, mqs.user, containers,
+        createResource(), decreasePending);
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(ALLOCATED_CONTAINERS, containers)
+        .counter(AGGREGATE_CONTAINERS_ALLOCATED, containers)
+        .gaugeLong(ALLOCATED_MB, containers * memoryMB)
+        .gaugeInt(ALLOCATED_V_CORES, containers * vCores)
+        .gaugeInt(PENDING_CONTAINERS, 0)
+        .gaugeLong(PENDING_MB, 0)
+        .gaugeInt(PENDING_V_CORES, 0)
+        .checkAgainst(mqs.leafQueueSource);
+    if (decreasePending) {
+      assertMetrics(mqs, checker, MetricsForCustomResource.PENDING,
+          getModifiedCustomResourceValues(v -> 0L));
+    }
+    if (!customResourceValues.isEmpty()) {
+      assertMetrics(mqs, checker, MetricsForCustomResource.ALLOCATED,
+          getModifiedCustomResourceValues(v -> v * containers));
+    }
+  }
+
+  public void testAllocateResourcesWithoutContainer() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    mqs.leafMetrics.allocateResources(partition, mqs.user,
+        createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeLong(ALLOCATED_MB, memoryMB)
+        .gaugeInt(ALLOCATED_V_CORES, vCores)
+        .gaugeInt(PENDING_CONTAINERS, 1)
+        .gaugeLong(PENDING_MB, 0)
+        .gaugeInt(PENDING_V_CORES, 0)
+        .checkAgainst(mqs.leafQueueSource);
+    assertMetrics(mqs, checker, MetricsForCustomResource.PENDING,
+        getModifiedCustomResourceValues(v -> 0L));
+    assertMetrics(mqs, checker, MetricsForCustomResource.ALLOCATED,
+        getModifiedCustomResourceValues(v -> v));
+  }
+
+  public void testReleaseResourcesWithContainers() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    mqs.leafMetrics.releaseResources(partition, mqs.user, containers,
+        createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .counter(AGGREGATE_CONTAINERS_ALLOCATED, containers)
+        .counter(AGGREGATE_CONTAINERS_RELEASED, containers)
+        .checkAgainst(mqs.leafQueueSource);
+    assertMetrics(mqs, checker, MetricsForCustomResource.ALLOCATED,
+        getModifiedCustomResourceValues(v -> 0L));
+  }
+
+  public void testUpdatePreemptedSeconds(int seconds) {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    mqs.leafMetrics.updatePreemptedMemoryMBSeconds(memoryMB * seconds);
+    mqs.leafMetrics.updatePreemptedVcoreSeconds(vCores * seconds);
+    mqs.leafMetrics.updatePreemptedSecondsForCustomResources(
+        createResource(), seconds);
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .counter(AGGREGATE_MEMORY_MB_SECONDS_PREEMPTED, memoryMB * seconds)
+        .counter(AGGREGATE_VCORE_SECONDS_PREEMPTED, vCores * seconds)
+        .checkAgainst(mqs.leafQueueSource);
+    assertMetricsParentQueueOnly(mqs, checker,
+        MetricsForCustomResource.AGGREGATE_PREEMPTED_SECONDS,
+        getModifiedCustomResourceValues(v -> v * seconds));
+  }
+
+  public void testReserveResources() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    mqs.leafMetrics.reserveResource(partition, mqs.user, createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(RESERVED_CONTAINERS, 1)
+        .gaugeLong(RESERVED_MB, memoryMB)
+        .gaugeInt(RESERVED_V_CORES, vCores)
+        .checkAgainst(mqs.leafQueueSource);
+    assertMetrics(mqs, checker, MetricsForCustomResource.RESERVED,
+        getModifiedCustomResourceValues(v -> v));
+  }
+
+  public void testUnreserveResources() {
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    mqs.leafMetrics.unreserveResource(partition, mqs.user,
+        createResource());
+
+    ResourceMetricsChecker checker = ResourceMetricsChecker
+        .create()
+        .gaugeInt(RESERVED_CONTAINERS, 0)
+        .gaugeLong(RESERVED_MB, 0)
+        .gaugeInt(RESERVED_V_CORES, 0)
+        .checkAgainst(mqs.leafQueueSource);
+    assertMetrics(mqs, checker, MetricsForCustomResource.RESERVED,
+        getModifiedCustomResourceValues(v -> 0L));
+  }
+
+  public void testGetAllocatedResources() {
+    testAllocateResources(false);
+    MultiQueueSetup mqs = new MultiQueueSetup(ms,
+        parentQueueName, leafQueueName, user);
+    Resource res = mqs.leafMetrics.getAllocatedResources();
+    if (customResourceValues.size() > 0) {
+      assertCustomResourceValueInternal(MetricsForCustomResource.ALLOCATED,
+          CUSTOM_RES_1, customResourceValues.get(CUSTOM_RES_1) * containers,
+          res.getResourceValue(CUSTOM_RES_1));
+      assertCustomResourceValueInternal(MetricsForCustomResource.ALLOCATED,
+          CUSTOM_RES_2, customResourceValues.get(CUSTOM_RES_2) * containers,
+          res.getResourceValue(CUSTOM_RES_2));
+    }
+  }
+
+  private void assertMetrics(MultiQueueSetup mqs,
+      ResourceMetricsChecker checker,
+      MetricsForCustomResource metricsType,
+      Map<String, Long> expectedCustomResourceValues) {
+    assertMetricsInternal(mqs, checker, metricsType, MetricsAssertType.ALL,
+        expectedCustomResourceValues);
+  }
+
+  private void assertMetricsParentQueueOnly(MultiQueueSetup mqs,
+      ResourceMetricsChecker checker,
+      MetricsForCustomResource metricsType,
+      Map<String, Long> expectedCustomResourceValues) {
+    assertMetricsInternal(mqs, checker, metricsType,
+        MetricsAssertType.PARENT_QUEUE_ONLY, expectedCustomResourceValues);
+  }
+
+  /**
+   * Re-checks the expected standard metrics against the parent queue source
+   * (and, for {@link MetricsAssertType#ALL}, the user sources), then asserts
+   * the custom resource values on both the parent and the leaf metrics.
+   */
+  private void assertMetricsInternal(MultiQueueSetup mqs,
+      ResourceMetricsChecker checker, MetricsForCustomResource metricsType,
+      MetricsAssertType metricsAssertType,
+      Map<String, Long> expectedCustomResourceValues) {
+    checker = ResourceMetricsChecker.createFromChecker(checker)
+        .checkAgainst(mqs.parentQueueSource);
+
+    if (metricsAssertType == MetricsAssertType.ALL) {
+      checker = ResourceMetricsChecker.createFromChecker(checker)
+          .checkAgainst(mqs.userSource);
+      ResourceMetricsChecker.createFromChecker(checker)
+          .checkAgainst(mqs.parentUserSource);
+    }
+
+    assertCustomResourceValue(mqs.parentMetrics, metricsType, CUSTOM_RES_1,
+        expectedCustomResourceValues.get(CUSTOM_RES_1));
+    assertCustomResourceValue(mqs.parentMetrics, metricsType, CUSTOM_RES_2,
+        expectedCustomResourceValues.get(CUSTOM_RES_2));
+    assertCustomResourceValue(mqs.leafMetrics, metricsType, CUSTOM_RES_1,
+        expectedCustomResourceValues.get(CUSTOM_RES_1));
+    assertCustomResourceValue(mqs.leafMetrics, metricsType, CUSTOM_RES_2,
+        expectedCustomResourceValues.get(CUSTOM_RES_2));
+  }
+
+  /** Returns a copy of the configured custom values with func applied. */
+  private Map<String, Long> getModifiedCustomResourceValues(
+      Function<Long, Long> func) {
+    Map<String, Long> modifiedValues = Maps.newHashMap();
+    for (Map.Entry<String, Long> res : customResourceValues
+        .entrySet()) {
+      modifiedValues.put(res.getKey(), func.apply(res.getValue()));
+    }
+    return modifiedValues;
+  }
+
+  /**
+   * Builds the resource used by the scenario; custom resource values are
+   * only included when at least one was configured.
+   */
+  private Resource createResource() {
+    if (!customResourceValues.isEmpty()) {
+      return ResourceTypesTestHelper.newResource(memoryMB, vCores,
+          ImmutableMap.<String, String>builder()
+              .put(CUSTOM_RES_1,
+                  String.valueOf(customResourceValues.get(CUSTOM_RES_1)))
+              .put(CUSTOM_RES_2,
+                  String.valueOf(customResourceValues.get(CUSTOM_RES_2)))
+              .build());
+    }
+    return ResourceTypesTestHelper.newResource(memoryMB, vCores,
+        Maps.newHashMap());
+  }
+}
diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceMetricsChecker.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceMetricsChecker.java
index cd617d7b9d0..7c84e8923d9 100644
--- a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceMetricsChecker.java
+++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/ResourceMetricsChecker.java
@@ -27,34 +27,31 @@
 import static org.apache.hadoop.test.MetricsAsserts.assertCounter;
 import static org.apache.hadoop.test.MetricsAsserts.assertGauge;
 import static org.apache.hadoop.test.MetricsAsserts.getMetrics;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_ALLOCATED;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_RELEASED;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_CONTAINERS;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_MB;
-import static org.apache.hadoop.yarn.server.resourcemanager.scheduler
-    .ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_V_CORES;
-import
static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_MB; -import static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_V_CORES; -import static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.PENDING_CONTAINERS; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricType.COUNTER_LONG; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricType.GAUGE_INT; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricType.GAUGE_LONG; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_ALLOCATED; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AGGREGATE_CONTAINERS_RELEASED; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_CONTAINERS; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_MB; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.ALLOCATED_V_CORES; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_MB; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_V_CORES; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_CONTAINERS; import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_MB; import static 
org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.PENDING_V_CORES; -import static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.RESERVED_CONTAINERS; -import static org.apache.hadoop.yarn.server.resourcemanager.scheduler - .ResourceMetricsChecker.ResourceMetricsKey.RESERVED_MB; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_CONTAINERS; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_MB; import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.RESERVED_V_CORES; final class ResourceMetricsChecker { private final static Logger LOG = LoggerFactory.getLogger(ResourceMetricsChecker.class); + enum ResourceMetricType { + GAUGE_INT, GAUGE_LONG, COUNTER_INT, COUNTER_LONG + } + private static final ResourceMetricsChecker INITIAL_CHECKER = new ResourceMetricsChecker() .gaugeLong(ALLOCATED_MB, 0) @@ -72,29 +69,41 @@ .gaugeInt(RESERVED_CONTAINERS, 0); enum ResourceMetricsKey { - ALLOCATED_MB("AllocatedMB"), - ALLOCATED_V_CORES("AllocatedVCores"), - ALLOCATED_CONTAINERS("AllocatedContainers"), - AGGREGATE_CONTAINERS_ALLOCATED("AggregateContainersAllocated"), - AGGREGATE_CONTAINERS_RELEASED("AggregateContainersReleased"), - AVAILABLE_MB("AvailableMB"), - AVAILABLE_V_CORES("AvailableVCores"), - PENDING_MB("PendingMB"), - PENDING_V_CORES("PendingVCores"), - PENDING_CONTAINERS("PendingContainers"), - RESERVED_MB("ReservedMB"), - RESERVED_V_CORES("ReservedVCores"), - RESERVED_CONTAINERS("ReservedContainers"); + ALLOCATED_MB("AllocatedMB", GAUGE_LONG), + ALLOCATED_V_CORES("AllocatedVCores", GAUGE_INT), + ALLOCATED_CONTAINERS("AllocatedContainers", GAUGE_INT), + AGGREGATE_CONTAINERS_ALLOCATED("AggregateContainersAllocated", + COUNTER_LONG), + 
AGGREGATE_CONTAINERS_RELEASED("AggregateContainersReleased", + COUNTER_LONG), + AVAILABLE_MB("AvailableMB", GAUGE_LONG), + AVAILABLE_V_CORES("AvailableVCores", GAUGE_INT), + PENDING_MB("PendingMB", GAUGE_LONG), + PENDING_V_CORES("PendingVCores", GAUGE_INT), + PENDING_CONTAINERS("PendingContainers", GAUGE_INT), + RESERVED_MB("ReservedMB", GAUGE_LONG), + RESERVED_V_CORES("ReservedVCores", GAUGE_INT), + RESERVED_CONTAINERS("ReservedContainers", GAUGE_INT), + AGGREGATE_VCORE_SECONDS_PREEMPTED( + "AggregateVcoreSecondsPreempted", COUNTER_LONG), + AGGREGATE_MEMORY_MB_SECONDS_PREEMPTED( + "AggregateMemoryMBSecondsPreempted", COUNTER_LONG); private String value; + private ResourceMetricType type; - ResourceMetricsKey(String value) { + ResourceMetricsKey(String value, ResourceMetricType type) { this.value = value; + this.type = type; } public String getValue() { return value; } + + public ResourceMetricType getType() { + return type; + } } private final Map gaugesLong; @@ -123,20 +132,31 @@ public static ResourceMetricsChecker create() { } ResourceMetricsChecker gaugeLong(ResourceMetricsKey key, long value) { + ensureTypeIsCorrect(key, GAUGE_LONG); gaugesLong.put(key, value); return this; } ResourceMetricsChecker gaugeInt(ResourceMetricsKey key, int value) { + ensureTypeIsCorrect(key, GAUGE_INT); gaugesInt.put(key, value); return this; } ResourceMetricsChecker counter(ResourceMetricsKey key, long value) { + ensureTypeIsCorrect(key, COUNTER_LONG); counters.put(key, value); return this; } + private void ensureTypeIsCorrect(ResourceMetricsKey + key, ResourceMetricType actualType) { + if (key.type != actualType) { + throw new IllegalStateException("Metrics type should be " + key.type + + " instead of " + actualType + " for metrics: " + key.value); + } + } + ResourceMetricsChecker checkAgainst(MetricsSource source) { if (source == null) { throw new IllegalStateException("MetricsSource should not be null!"); diff --git 
a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetrics.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetrics.java index 0b36496b6c8..3d45ca1d4d7 100644 --- a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetrics.java +++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetrics.java @@ -47,6 +47,38 @@ import org.junit.Test; public class TestQueueMetrics { + static class MultiQueueSetup { + final MetricsSource parentQueueSource; + final MetricsSource leafQueueSource; + final MetricsSource userSource; + final MetricsSource parentUserSource; + final QueueMetrics parentMetrics; + final QueueMetrics leafMetrics; + final String parentQueueName; + final String leafQueueName; + final String user; + + MultiQueueSetup(MetricsSystem ms, String parentQueueName, + String leafQueueName, String user) { + this.parentQueueName = parentQueueName; + this.leafQueueName = leafQueueName; + this.user = user; + + parentMetrics = + QueueMetrics.forQueue(ms, parentQueueName, null, true, conf); + Queue parentQueue = mock(Queue.class); + when(parentQueue.getMetrics()).thenReturn(parentMetrics); + leafMetrics = + QueueMetrics.forQueue(ms, leafQueueName, parentQueue, true, conf); + parentQueueSource = queueSource(ms, parentQueueName); + leafQueueSource = queueSource(ms, leafQueueName); + + leafMetrics.submitApp(user); + userSource = userSource(ms, leafQueueName, user); + parentUserSource = userSource(ms, parentQueueName, user); + } + } + private static final int GB = 1024; // MB private static final Configuration conf = 
new Configuration(); private MetricsSystem ms; @@ -103,7 +135,7 @@ public void testDefaultSingleQueueMetrics() { .gaugeLong(ALLOCATED_MB, 6 * GB) .gaugeInt(ALLOCATED_V_CORES, 6) .gaugeInt(ALLOCATED_CONTAINERS, 3) - .counter(AGGREGATE_CONTAINERS_ALLOCATED, 3) + .gaugeLong(AGGREGATE_CONTAINERS_ALLOCATED, 3) .gaugeLong(PENDING_MB, 9 * GB) .gaugeInt(PENDING_V_CORES, 9) .gaugeInt(PENDING_CONTAINERS, 2) @@ -286,7 +318,7 @@ public void testSingleQueueWithUserMetrics() { .gaugeLong(ALLOCATED_MB, 6 * GB) .gaugeInt(ALLOCATED_V_CORES, 6) .gaugeInt(ALLOCATED_CONTAINERS, 3) - .counter(AGGREGATE_CONTAINERS_ALLOCATED, 3) + .gaugeLong(AGGREGATE_CONTAINERS_ALLOCATED, 3) .gaugeLong(PENDING_MB, 9 * GB) .gaugeInt(PENDING_V_CORES, 9) .gaugeInt(PENDING_CONTAINERS, 2) @@ -376,80 +408,78 @@ public void testTwoLevelWithUserMetrics() { String parentQueueName = "root"; String leafQueueName = "root.leaf"; String user = "alice"; - - QueueMetrics parentMetrics = - QueueMetrics.forQueue(ms, parentQueueName, null, true, conf); - Queue parentQueue = mock(Queue.class); - when(parentQueue.getMetrics()).thenReturn(parentMetrics); - QueueMetrics metrics = - QueueMetrics.forQueue(ms, leafQueueName, parentQueue, true, conf); - MetricsSource parentQueueSource = queueSource(ms, parentQueueName); - MetricsSource queueSource = queueSource(ms, leafQueueName); AppSchedulingInfo app = mockApp(user); - metrics.submitApp(user); - MetricsSource userSource = userSource(ms, leafQueueName, user); - MetricsSource parentUserSource = userSource(ms, parentQueueName, user); + MultiQueueSetup mqs = new MultiQueueSetup(ms, + parentQueueName, leafQueueName, user); - AppMetricsChecker appMetricsChecker = AppMetricsChecker.create() + AppMetricsChecker appMetricsChecker = AppMetricsChecker + .create() .counter(APPS_SUBMITTED, 1) - .checkAgainst(queueSource, true); - appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(parentQueueSource, true); - appMetricsChecker = 
AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(userSource, true); - appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(parentUserSource, true); - - metrics.submitAppAttempt(user); - appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) + .checkAgainst(mqs.leafQueueSource, true); + appMetricsChecker = AppMetricsChecker + .createFromChecker(appMetricsChecker) + .checkAgainst(mqs.parentQueueSource, true); + appMetricsChecker = AppMetricsChecker + .createFromChecker(appMetricsChecker) + .checkAgainst(mqs.userSource, true); + appMetricsChecker = AppMetricsChecker + .createFromChecker(appMetricsChecker) + .checkAgainst(mqs.parentUserSource, true);; + + mqs.leafMetrics.submitAppAttempt(user); + appMetricsChecker = AppMetricsChecker + .createFromChecker(appMetricsChecker) .gaugeInt(APPS_PENDING, 1) - .checkAgainst(queueSource, true); - appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(parentQueueSource, true); - appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(userSource, true); - appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(parentUserSource, true); - - parentMetrics.setAvailableResourcesToQueue(RMNodeLabelsManager.NO_LABEL, + .checkAgainst(mqs.leafQueueSource, true); + appMetricsChecker = AppMetricsChecker + .createFromChecker(appMetricsChecker) + .checkAgainst(mqs.parentQueueSource, true); + appMetricsChecker = AppMetricsChecker + .createFromChecker(appMetricsChecker) + .checkAgainst(mqs.userSource, true); + appMetricsChecker = AppMetricsChecker + .createFromChecker(appMetricsChecker) + .checkAgainst(mqs.parentUserSource, true); + + mqs.parentMetrics.setAvailableResourcesToQueue(RMNodeLabelsManager.NO_LABEL, Resources.createResource(100*GB, 100)); - metrics.setAvailableResourcesToQueue(RMNodeLabelsManager.NO_LABEL, + 
mqs.leafMetrics.setAvailableResourcesToQueue(RMNodeLabelsManager.NO_LABEL, Resources.createResource(100*GB, 100)); - parentMetrics.setAvailableResourcesToUser(RMNodeLabelsManager.NO_LABEL, + mqs.parentMetrics.setAvailableResourcesToUser(RMNodeLabelsManager.NO_LABEL, user, Resources.createResource(10*GB, 10)); - metrics.setAvailableResourcesToUser(RMNodeLabelsManager.NO_LABEL, + mqs.leafMetrics.setAvailableResourcesToUser(RMNodeLabelsManager.NO_LABEL, user, Resources.createResource(10*GB, 10)); - metrics.incrPendingResources(RMNodeLabelsManager.NO_LABEL, + mqs.leafMetrics.incrPendingResources(RMNodeLabelsManager.NO_LABEL, user, 5, Resources.createResource(3*GB, 3)); - + ResourceMetricsChecker rmChecker = ResourceMetricsChecker.create() .gaugeLong(AVAILABLE_MB, 100 * GB) .gaugeInt(AVAILABLE_V_CORES, 100) .gaugeLong(PENDING_MB, 15 * GB) .gaugeInt(PENDING_V_CORES, 15) .gaugeInt(PENDING_CONTAINERS, 5) - .checkAgainst(queueSource); + .checkAgainst(mqs.leafQueueSource); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) - .checkAgainst(parentQueueSource); + .checkAgainst(mqs.parentQueueSource); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) .gaugeLong(AVAILABLE_MB, 10 * GB) .gaugeInt(AVAILABLE_V_CORES, 10) - .checkAgainst(userSource); + .checkAgainst(mqs.userSource); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) - .checkAgainst(parentUserSource); + .checkAgainst(mqs.parentUserSource); - metrics.runAppAttempt(app.getApplicationId(), user); + mqs.leafMetrics.runAppAttempt(app.getApplicationId(), user); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) .gaugeInt(APPS_PENDING, 0) .gaugeInt(APPS_RUNNING, 1) - .checkAgainst(queueSource, true); + .checkAgainst(mqs.leafQueueSource, true); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(userSource, true); + .checkAgainst(mqs.userSource, true); - metrics.allocateResources(RMNodeLabelsManager.NO_LABEL, + 
mqs.leafMetrics.allocateResources(RMNodeLabelsManager.NO_LABEL, user, 3, Resources.createResource(2*GB, 2), true); - metrics.reserveResource(RMNodeLabelsManager.NO_LABEL, + mqs.leafMetrics.reserveResource(RMNodeLabelsManager.NO_LABEL, user, Resources.createResource(3*GB, 3)); // Available resources is set externally, as it depends on dynamic // configurable cluster/queue resources @@ -466,19 +496,19 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 3 * GB) .gaugeInt(RESERVED_V_CORES, 3) .gaugeInt(RESERVED_CONTAINERS, 1) - .checkAgainst(queueSource); + .checkAgainst(mqs.leafQueueSource); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) - .checkAgainst(queueSource); + .checkAgainst(mqs.leafQueueSource); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) .gaugeLong(AVAILABLE_MB, 10 * GB) .gaugeInt(AVAILABLE_V_CORES, 10) - .checkAgainst(userSource); + .checkAgainst(mqs.userSource); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) - .checkAgainst(parentUserSource); + .checkAgainst(mqs.parentUserSource); - metrics.releaseResources(RMNodeLabelsManager.NO_LABEL, + mqs.leafMetrics.releaseResources(RMNodeLabelsManager.NO_LABEL, user, 1, Resources.createResource(2*GB, 2)); - metrics.unreserveResource(RMNodeLabelsManager.NO_LABEL, + mqs.leafMetrics.unreserveResource(RMNodeLabelsManager.NO_LABEL, user, Resources.createResource(3*GB, 3)); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) .gaugeLong(AVAILABLE_MB, 100 * GB) @@ -490,38 +520,38 @@ public void testTwoLevelWithUserMetrics() { .gaugeLong(RESERVED_MB, 0) .gaugeInt(RESERVED_V_CORES, 0) .gaugeInt(RESERVED_CONTAINERS, 0) - .checkAgainst(queueSource); + .checkAgainst(mqs.leafQueueSource); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) - .checkAgainst(parentQueueSource); + .checkAgainst(mqs.parentQueueSource); rmChecker = ResourceMetricsChecker.createFromChecker(rmChecker) .gaugeLong(AVAILABLE_MB, 10 * GB) 
.gaugeInt(AVAILABLE_V_CORES, 10) - .checkAgainst(userSource); + .checkAgainst(mqs.userSource); ResourceMetricsChecker.createFromChecker(rmChecker) - .checkAgainst(parentUserSource); + .checkAgainst(mqs.parentUserSource); - metrics.finishAppAttempt( + mqs.leafMetrics.finishAppAttempt( app.getApplicationId(), app.isPending(), app.getUser()); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) .gaugeInt(APPS_RUNNING, 0) - .checkAgainst(queueSource, true); + .checkAgainst(mqs.leafQueueSource, true); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(parentQueueSource, true); + .checkAgainst(mqs.parentQueueSource, true); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(userSource, true); + .checkAgainst(mqs.userSource, true); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(parentUserSource, true); + .checkAgainst(mqs.parentUserSource, true); - metrics.finishApp(user, RMAppState.FINISHED); + mqs.leafMetrics.finishApp(user, RMAppState.FINISHED); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) .counter(APPS_COMPLETED, 1) - .checkAgainst(queueSource, true); + .checkAgainst(mqs.leafQueueSource, true); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(parentQueueSource, true); + .checkAgainst(mqs.parentQueueSource, true); appMetricsChecker = AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(userSource, true); + .checkAgainst(mqs.userSource, true); AppMetricsChecker.createFromChecker(appMetricsChecker) - .checkAgainst(parentUserSource, true); + .checkAgainst(mqs.parentUserSource, true); } @Test @@ -599,7 +629,7 @@ private static void checkAggregatedNodeTypes(MetricsSource source, assertCounter("AggregateOffSwitchContainersAllocated", offSwitch, rb); } - private static AppSchedulingInfo mockApp(String user) { + static AppSchedulingInfo 
mockApp(String user) { AppSchedulingInfo app = mock(AppSchedulingInfo.class); when(app.getUser()).thenReturn(user); ApplicationId appId = BuilderUtils.newApplicationId(1, 1); @@ -612,7 +642,7 @@ public static MetricsSource queueSource(MetricsSystem ms, String queue) { return ms.getSource(QueueMetrics.sourceName(queue).toString()); } - private static MetricsSource userSource(MetricsSystem ms, String queue, + static MetricsSource userSource(MetricsSystem ms, String queue, String user) { return ms.getSource(QueueMetrics.sourceName(queue). append(",user=").append(user).toString()); diff --git a/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetricsForCustomResources.java b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetricsForCustomResources.java new file mode 100644 index 00000000000..0b26f4865f6 --- /dev/null +++ b/hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-resourcemanager/src/test/java/org/apache/hadoop/yarn/server/resourcemanager/scheduler/TestQueueMetricsForCustomResources.java @@ -0,0 +1,475 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * http://www.apache.org/licenses/LICENSE-2.0 + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+ * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.hadoop.yarn.server.resourcemanager.scheduler; + +import com.google.common.collect.ImmutableMap; +import org.apache.hadoop.conf.Configuration; +import org.apache.hadoop.metrics2.MetricsSource; +import org.apache.hadoop.metrics2.MetricsSystem; +import org.apache.hadoop.metrics2.impl.MetricsSystemImpl; +import org.apache.hadoop.yarn.api.records.Resource; +import org.apache.hadoop.yarn.api.records.ResourceInformation; +import org.apache.hadoop.yarn.conf.YarnConfiguration; +import org.apache.hadoop.yarn.resourcetypes.ResourceTypesTestHelper; +import org.apache.hadoop.yarn.server.resourcemanager.nodelabels.RMNodeLabelsManager; +import org.apache.hadoop.yarn.server.resourcemanager.scheduler.QueueMetricsForCustomResources.MetricsForCustomResource; + +import org.apache.hadoop.yarn.server.resourcemanager.scheduler + .TestQueueMetrics.MultiQueueSetup; +import org.apache.hadoop.yarn.util.resource.ResourceUtils; +import org.junit.Before; +import org.junit.Test; + +import java.util.HashMap; +import java.util.Map; + +import static org.apache.hadoop.yarn.conf.YarnConfiguration.DEFAULT_RM_SCHEDULER_MAXIMUM_ALLOCATION_MB; +import static org.apache.hadoop.yarn.conf.YarnConfiguration.DEFAULT_RM_SCHEDULER_MAXIMUM_ALLOCATION_VCORES; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_MB; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.ResourceMetricsChecker.ResourceMetricsKey.AVAILABLE_V_CORES; +import static org.apache.hadoop.yarn.server.resourcemanager.scheduler.TestQueueMetrics.queueSource; +import static org.junit.Assert.assertEquals; +import static org.junit.Assert.assertNotNull; + +public class TestQueueMetricsForCustomResources { + public static final long GB = 1024; // MB + private static final Configuration conf = new Configuration(); + private static 
final String CUSTOM_RES_1 = "custom_res_1"; + private static final String CUSTOM_RES_2 = "custom_res_2"; + private static final String ROOT_QUEUE_NAME = "root"; + private static final String LEAF_QUEUE_NAME = "root.leaf"; + public static final String USER = "alice"; + + private MetricsSystem ms; + + @Before + public void setUp() { + ms = new MetricsSystemImpl(); + QueueMetrics.clearQueueMetrics(); + initializeResourceTypes(); + } + + private void initializeResourceTypes() { + Map riMap = new HashMap<>(); + + ResourceInformation memory = ResourceInformation.newInstance( + ResourceInformation.MEMORY_MB.getName(), + ResourceInformation.MEMORY_MB.getUnits(), + YarnConfiguration.DEFAULT_RM_SCHEDULER_MINIMUM_ALLOCATION_MB, + DEFAULT_RM_SCHEDULER_MAXIMUM_ALLOCATION_MB); + ResourceInformation vcores = ResourceInformation.newInstance( + ResourceInformation.VCORES.getName(), + ResourceInformation.VCORES.getUnits(), + YarnConfiguration.DEFAULT_RM_SCHEDULER_MINIMUM_ALLOCATION_VCORES, + DEFAULT_RM_SCHEDULER_MAXIMUM_ALLOCATION_VCORES); + ResourceInformation res1 = ResourceInformation.newInstance(CUSTOM_RES_1, + ResourceInformation.VCORES.getUnits(), 0, 2000); + ResourceInformation res2 = ResourceInformation.newInstance(CUSTOM_RES_2, + ResourceInformation.VCORES.getUnits(), 0, 2000); + + riMap.put(ResourceInformation.MEMORY_URI, memory); + riMap.put(ResourceInformation.VCORES_URI, vcores); + riMap.put(CUSTOM_RES_1, res1); + riMap.put(CUSTOM_RES_2, res2); + ResourceUtils.initializeResourcesFromResourceInformationMap(riMap); + } + + static void assertCustomResourceValue(QueueMetrics metrics, + MetricsForCustomResource metricsType, String resourceName, + long expectedValue) { + Map metricsValues = metrics.queueMetricsForCustomResources + .getMetricsByType(metricsType); + Long value = metricsValues.get(resourceName); + assertCustomResourceValueInternal(metricsType, resourceName, + expectedValue, value); + } + + static void assertCustomResourceValueInternal( + MetricsForCustomResource 
metricsType, String resourceName, long + expectedValue, Long value) { + assertNotNull( + "QueueMetrics should have custom resource metrics value" + + "for resource: " + resourceName, value); + assertEquals(String.format( + "QueueMetrics should have custom resource metrics value %d " + + "for resource: %s for metrics type %s", + expectedValue, resourceName, metricsType), expectedValue, + (long) value); + } + + @Test + public void testSetAvailableResourcesToQueue1() { + String queueName = "single"; + QueueMetrics metrics = QueueMetrics.forQueue(ms, queueName, null, + false, conf); + MetricsSource queueSource = queueSource(ms, queueName); + + metrics.setAvailableResourcesToQueue(ResourceTypesTestHelper.newResource( + GB, 4, + ImmutableMap. builder() + .put(CUSTOM_RES_1, String.valueOf(5 * GB)) + .put(CUSTOM_RES_2, String.valueOf(6 * GB)) + .build())); + ResourceMetricsChecker.create() + .gaugeLong(AVAILABLE_MB, GB) + .gaugeInt(AVAILABLE_V_CORES, 4) + .checkAgainst(queueSource); + + assertCustomResourceValue(metrics, + MetricsForCustomResource.AVAILABLE, CUSTOM_RES_1, 5 * GB); + assertCustomResourceValue(metrics, + MetricsForCustomResource.AVAILABLE, CUSTOM_RES_2, 6 * GB); + } + + @Test + public void testSetAvailableResourcesToQueue2() { + String queueName = "single"; + QueueMetrics metrics = QueueMetrics.forQueue(ms, queueName, null, + false, conf); + MetricsSource queueSource = queueSource(ms, queueName); + + metrics.setAvailableResourcesToQueue(null, + ResourceTypesTestHelper.newResource(GB, 4, + ImmutableMap. 
builder() + .put(CUSTOM_RES_1, String.valueOf(15 * GB)) + .put(CUSTOM_RES_2, String.valueOf(20 * GB)) + .build())); + ResourceMetricsChecker.create() + .gaugeLong(AVAILABLE_MB, GB) + .gaugeInt(AVAILABLE_V_CORES, 4) + .checkAgainst(queueSource); + + assertCustomResourceValue(metrics, + MetricsForCustomResource.AVAILABLE, CUSTOM_RES_1, 15 * GB); + assertCustomResourceValue(metrics, + MetricsForCustomResource.AVAILABLE, CUSTOM_RES_2, 20 * GB); + } + + @Test + public void testIncreasePendingResources() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withContainersToDecrease(2) + .withVCores(4) + .withVCoresToDecrease(2) + .withMemoryMB(4 * GB) + .withMemoryMBToDecrease(GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .withCustomResToDecrease(2 * GB) + .build(); + + testcase.testIncreasePendingResources(); + } + + @Test + public void testDecreasePendingResources() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withContainersToDecrease(2) + .withVCores(4) + .withVCoresToDecrease(2) + .withMemoryMB(4 * GB) + .withMemoryMBToDecrease(GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .withCustomResToDecrease(2 * GB) + .build(); + + testcase.testIncreasePendingResources(); + testcase.testDecreasePendingResources(); + } + + @Test + public void testAllocateResourcesWithoutDecreasePending() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + 
.withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withVCores(4) + .withMemoryMB(4 * GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .build(); + + testcase.testAllocateResources(false); + } + + @Test + public void testAllocateResourcesWithDecreasePending() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withContainersToDecrease(2) + .withVCores(4) + .withVCoresToDecrease(2) + .withMemoryMB(4 * GB) + .withMemoryMBToDecrease(GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .withCustomResToDecrease(2 * GB) + .build(); + + //first, increase pending resources + testcase.testIncreasePendingResources(); + + //then allocate with decrease pending resources + testcase.testAllocateResources(true); + } + + @Test + public void testAllocateResourcesWithoutContainer() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withVCores(4) + .withMemoryMB(4 * GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .build(); + + //first, increase pending resources + testcase.testIncreasePendingResourcesWithoutContainer(); + + testcase.testAllocateResourcesWithoutContainer(); + } + + @Test + public void testReleaseResources() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + 
.withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withContainersToDecrease(2) + .withVCores(4) + .withVCoresToDecrease(2) + .withMemoryMB(4 * GB) + .withMemoryMBToDecrease(GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .withCustomResToDecrease(2 * GB) + .build(); + + //first, allocate some resources + testcase.testAllocateResources(false); + + testcase.testReleaseResourcesWithContainers(); + } + + @Test + public void testUpdatePreemptedSecondsForCustomResources() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withVCores(4) + .withMemoryMB(4 * GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .build(); + + final int seconds = 1; + testcase.testUpdatePreemptedSeconds(seconds); + } + + @Test + public void testUpdatePreemptedSecondsForCustomResources2() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withVCores(4) + .withMemoryMB(4 * GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .build(); + + final int seconds = 15; + testcase.testUpdatePreemptedSeconds(seconds); + } + + @Test + public void testReserveResources() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withVCores(4) + .withMemoryMB(4 * GB) + .withCustomResourceValue(CUSTOM_RES_1, 
15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .build(); + + testcase.testReserveResources(); + } + + @Test + public void testUnreserveResources() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withVCores(4) + .withMemoryMB(4 * GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .build(); + + testcase.testReserveResources(); + testcase.testUnreserveResources(); + } + + @Test + public void testGetAllocatedResourcesWithCustomResources() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withVCores(4) + .withMemoryMB(4 * GB) + .withCustomResourceValue(CUSTOM_RES_1, 15 * GB) + .withCustomResourceValue(CUSTOM_RES_2, 20 * GB) + .build(); + + testcase.testGetAllocatedResources(); + } + + @Test + public void testGetAllocatedResourcesWithoutCustomResources() { + QueueMetricsTestcase testcase = QueueMetricsTestcase.Builder.create() + .withMetricSystem(ms) + .withParentQueueName(ROOT_QUEUE_NAME) + .withLeafQueueName(LEAF_QUEUE_NAME) + .withUser(USER) + .withPartition(RMNodeLabelsManager.NO_LABEL) + .withContainers(5) + .withVCores(4) + .withMemoryMB(4 * GB) + .build(); + + testcase.testGetAllocatedResources(); + } + + @Test + public void testGetMaxUtilizationOfCustomResourcesWithoutAllocatedResource() { + MultiQueueSetup mqs = new MultiQueueSetup(ms, + ROOT_QUEUE_NAME, LEAF_QUEUE_NAME, USER); + Resource clusterResource = ResourceTypesTestHelper.newResource(4 * GB, 8, + ImmutableMap.builder() + .put(CUSTOM_RES_1, + String.valueOf(0L)) + .put(CUSTOM_RES_2, + String.valueOf(0L)) + 
.build()); + float utilization = mqs.leafMetrics + .getMaxUtilizationOfCustomResources(clusterResource); + assertEquals(0, utilization, 0.0); + } + + @Test + public void testGetMaxUtilizationOfCustomResourcesWithAllocatedResource() { + MultiQueueSetup mqs = new MultiQueueSetup(ms, + ROOT_QUEUE_NAME, LEAF_QUEUE_NAME, USER); + + Resource allocatedResource = ResourceTypesTestHelper.newResource(4 * GB, 8, + ImmutableMap.builder() + .put(CUSTOM_RES_1, + String.valueOf(10L)) + .put(CUSTOM_RES_2, + String.valueOf(20L)) + .build()); + mqs.leafMetrics.allocateResources(RMNodeLabelsManager.NO_LABEL, mqs.user, 1, + allocatedResource, false); + + Resource clusterResource = ResourceTypesTestHelper.newResource(4 * GB, 8, + ImmutableMap.builder() + .put(CUSTOM_RES_1, + String.valueOf(0L)) + .put(CUSTOM_RES_2, + String.valueOf(0L)) + .build()); + float utilization = mqs.leafMetrics + .getMaxUtilizationOfCustomResources(clusterResource); + assertEquals(0, utilization, 0.0); + } + + @Test + public void testGetMaxUtilizationOfCustomResourcesWithAllocatedResource2() { + MultiQueueSetup mqs = new MultiQueueSetup(ms, + ROOT_QUEUE_NAME, LEAF_QUEUE_NAME, USER); + + Resource allocatedResource = ResourceTypesTestHelper.newResource(4 * GB, 8, + ImmutableMap.builder() + .put(CUSTOM_RES_1, + String.valueOf(10L)) + .put(CUSTOM_RES_2, + String.valueOf(20L)) + .build()); + mqs.leafMetrics.allocateResources(RMNodeLabelsManager.NO_LABEL, mqs.user, 1, + allocatedResource, false); + + Resource clusterResource = ResourceTypesTestHelper.newResource(4 * GB, 8, + ImmutableMap.builder() + .put(CUSTOM_RES_1, + String.valueOf(5L)) + .put(CUSTOM_RES_2, + String.valueOf(5L)) + .build()); + float utilization = mqs.leafMetrics + .getMaxUtilizationOfCustomResources(clusterResource); + assertEquals(4.0, utilization, 0.0); + } + +}