Commit f4b04ec

[FLINK-34504][autoscaler] Avoid the parallelism adjustment when the upstream shuffle type doesn't have keyBy (#783)
1 parent d738c57 commit f4b04ec

16 files changed: +459 −151 lines changed

Diff for: flink-autoscaler/src/main/java/org/apache/flink/autoscaler/JobVertexScaler.java

+44 −21

@@ -22,6 +22,7 @@
 import org.apache.flink.autoscaler.event.AutoScalerEventHandler;
 import org.apache.flink.autoscaler.metrics.EvaluatedScalingMetric;
 import org.apache.flink.autoscaler.metrics.ScalingMetric;
+import org.apache.flink.autoscaler.topology.ShipStrategy;
 import org.apache.flink.autoscaler.utils.AutoScalerUtils;
 import org.apache.flink.configuration.Configuration;
 import org.apache.flink.runtime.jobgraph.JobVertexID;
@@ -34,6 +35,7 @@
 import java.time.Duration;
 import java.time.Instant;
 import java.time.ZoneId;
+import java.util.Collection;
 import java.util.Map;
 import java.util.SortedMap;

@@ -48,6 +50,7 @@
 import static org.apache.flink.autoscaler.metrics.ScalingMetric.MAX_PARALLELISM;
 import static org.apache.flink.autoscaler.metrics.ScalingMetric.PARALLELISM;
 import static org.apache.flink.autoscaler.metrics.ScalingMetric.TRUE_PROCESSING_RATE;
+import static org.apache.flink.autoscaler.topology.ShipStrategy.HASH;

 /** Component responsible for computing vertex parallelism based on the scaling metrics. */
 public class JobVertexScaler<KEY, Context extends JobAutoScalerContext<KEY>> {
@@ -71,6 +74,7 @@ public JobVertexScaler(AutoScalerEventHandler<KEY, Context> autoScalerEventHandl
     public int computeScaleTargetParallelism(
             Context context,
             JobVertexID vertex,
+            Collection<ShipStrategy> inputShipStrategies,
             Map<ScalingMetric, EvaluatedScalingMetric> evaluatedMetrics,
             SortedMap<Instant, ScalingSummary> history,
             Duration restartTime) {
@@ -121,6 +125,7 @@ public int computeScaleTargetParallelism(
         int newParallelism =
                 scale(
                         currentParallelism,
+                        inputShipStrategies,
                         (int) evaluatedMetrics.get(MAX_PARALLELISM).getCurrent(),
                         scaleFactor,
                         Math.min(currentParallelism, conf.getInteger(VERTEX_MIN_PARALLELISM)),
@@ -245,50 +250,68 @@ private boolean detectIneffectiveScaleUp(
         }
     }

+    /**
+     * Computing the newParallelism. In general, newParallelism = currentParallelism * scaleFactor.
+     * But we limit newParallelism between parallelismLowerLimit and min(parallelismUpperLimit,
+     * maxParallelism).
+     *
+     * <p>Also, in order to ensure the data is evenly spread across subtasks, we try to adjust the
+     * parallelism for source and keyed vertex such that it divides the maxParallelism without a
+     * remainder.
+     */
     @VisibleForTesting
     protected static int scale(
-            int parallelism,
-            int numKeyGroups,
+            int currentParallelism,
+            Collection<ShipStrategy> inputShipStrategies,
+            int maxParallelism,
             double scaleFactor,
-            int minParallelism,
-            int maxParallelism) {
+            int parallelismLowerLimit,
+            int parallelismUpperLimit) {
         Preconditions.checkArgument(
-                minParallelism <= maxParallelism,
-                "The minimum parallelism must not be greater than the maximum parallelism.");
-        if (minParallelism > numKeyGroups) {
+                parallelismLowerLimit <= parallelismUpperLimit,
+                "The parallelism lower limitation must not be greater than the parallelism upper limitation.");
+        if (parallelismLowerLimit > maxParallelism) {
             LOG.warn(
                     "Specified autoscaler minimum parallelism {} is greater than the operator max parallelism {}. The min parallelism will be set to the operator max parallelism.",
-                    minParallelism,
-                    numKeyGroups);
+                    parallelismLowerLimit,
+                    maxParallelism);
         }
-        if (numKeyGroups < maxParallelism && maxParallelism != Integer.MAX_VALUE) {
+        if (maxParallelism < parallelismUpperLimit && parallelismUpperLimit != Integer.MAX_VALUE) {
             LOG.debug(
                     "Specified autoscaler maximum parallelism {} is greater than the operator max parallelism {}. This means the operator max parallelism can never be reached.",
-                    maxParallelism,
-                    numKeyGroups);
+                    parallelismUpperLimit,
+                    maxParallelism);
         }

         int newParallelism =
                 // Prevent integer overflow when converting from double to integer.
                 // We do not have to detect underflow because doubles cannot
                 // underflow.
-                (int) Math.min(Math.ceil(scaleFactor * parallelism), Integer.MAX_VALUE);
+                (int) Math.min(Math.ceil(scaleFactor * currentParallelism), Integer.MAX_VALUE);

-        // Cap parallelism at either number of key groups or parallelism limit
-        final int upperBound = Math.min(numKeyGroups, maxParallelism);
+        // Cap parallelism at either maxParallelism(number of key groups or source partitions) or
+        // parallelism upper limit
+        final int upperBound = Math.min(maxParallelism, parallelismUpperLimit);

         // Apply min/max parallelism
-        newParallelism = Math.min(Math.max(minParallelism, newParallelism), upperBound);
+        newParallelism = Math.min(Math.max(parallelismLowerLimit, newParallelism), upperBound);
+
+        var adjustByMaxParallelism =
+                inputShipStrategies.isEmpty() || inputShipStrategies.contains(HASH);
+        if (!adjustByMaxParallelism) {
+            return newParallelism;
+        }

-        // Try to adjust the parallelism such that it divides the number of key groups without a
-        // remainder => state is evenly spread across subtasks
-        for (int p = newParallelism; p <= numKeyGroups / 2 && p <= upperBound; p++) {
-            if (numKeyGroups % p == 0) {
+        // When the shuffle type of vertex inputs contains keyBy or vertex is a source, we try to
+        // adjust the parallelism such that it divides the maxParallelism without a remainder
+        // => data is evenly spread across subtasks
+        for (int p = newParallelism; p <= maxParallelism / 2 && p <= upperBound; p++) {
+            if (maxParallelism % p == 0) {
                 return p;
             }
         }

-        // If key group adjustment fails, use originally computed parallelism
+        // If parallelism adjustment fails, use originally computed parallelism
         return newParallelism;
     }
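
To make the new rule concrete, here is a small, self-contained sketch (not part of the commit; the class and method names are made up for illustration) of the adjustment that scale now applies: only source vertices (no inputs) and vertices with at least one HASH (keyBy) input get their parallelism rounded up to a divisor of maxParallelism, everything else keeps the computed value.

import java.util.Collection;
import java.util.List;

public class ParallelismAdjustmentSketch {

    enum ShipStrategy { HASH, REBALANCE, RESCALE, FORWARD }

    // Mirrors the loop above: sources (no inputs) and keyed (HASH) inputs get the divisor
    // adjustment; other shuffle types return the computed parallelism unchanged.
    static int adjust(
            int newParallelism,
            int maxParallelism,
            int upperBound,
            Collection<ShipStrategy> inputShipStrategies) {
        boolean adjustByMaxParallelism =
                inputShipStrategies.isEmpty() || inputShipStrategies.contains(ShipStrategy.HASH);
        if (!adjustByMaxParallelism) {
            return newParallelism;
        }
        for (int p = newParallelism; p <= maxParallelism / 2 && p <= upperBound; p++) {
            if (maxParallelism % p == 0) {
                return p; // divides the key groups / source partitions without remainder
            }
        }
        return newParallelism;
    }

    public static void main(String[] args) {
        // Keyed vertex, maxParallelism 720: a request for 7 is bumped to 8 (720 % 8 == 0).
        System.out.println(adjust(7, 720, 200, List.of(ShipStrategy.HASH)));      // 8
        // Pure REBALANCE input: 7 is kept as-is, which is the change this commit introduces.
        System.out.println(adjust(7, 720, 200, List.of(ShipStrategy.REBALANCE))); // 7
        // Source vertex (no inputs) with 24 partitions: 7 is bumped to 8 (24 % 8 == 0).
        System.out.println(adjust(7, 24, 200, List.of()));                        // 8
    }
}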

Diff for: flink-autoscaler/src/main/java/org/apache/flink/autoscaler/ScalingExecutor.java

+6 −2

@@ -102,7 +102,8 @@ public boolean scaleResource(
         var restartTime = scalingTracking.getMaxRestartTimeOrDefault(conf);

         var scalingSummaries =
-                computeScalingSummary(context, evaluatedMetrics, scalingHistory, restartTime);
+                computeScalingSummary(
+                        context, evaluatedMetrics, scalingHistory, restartTime, jobTopology);

         if (scalingSummaries.isEmpty()) {
             LOG.info("All job vertices are currently running at their target parallelism.");
@@ -203,7 +204,8 @@ Map<JobVertexID, ScalingSummary> computeScalingSummary(
             Context context,
             EvaluatedMetrics evaluatedMetrics,
             Map<JobVertexID, SortedMap<Instant, ScalingSummary>> scalingHistory,
-            Duration restartTime) {
+            Duration restartTime,
+            JobTopology jobTopology) {
         LOG.debug("Restart time used in scaling summary computation: {}", restartTime);

         if (isJobUnderMemoryPressure(context, evaluatedMetrics.getGlobalMetrics())) {
@@ -225,10 +227,12 @@ Map<JobVertexID, ScalingSummary> computeScalingSummary(
             } else {
                 var currentParallelism =
                         (int) metrics.get(ScalingMetric.PARALLELISM).getCurrent();
+
                 var newParallelism =
                         jobVertexScaler.computeScaleTargetParallelism(
                                 context,
                                 v,
+                                jobTopology.get(v).getInputs().values(),
                                 metrics,
                                 scalingHistory.getOrDefault(
                                         v, Collections.emptySortedMap()),
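
For context, a toy sketch (not part of the commit; the map below is illustrative) of what the new argument carries: for each vertex being scaled, the executor passes the ship strategies of all of its input edges to the scaler.

import java.util.Map;

public class InputShipStrategiesSketch {

    enum ShipStrategy { HASH, REBALANCE }

    public static void main(String[] args) {
        // Inputs of one vertex, keyed by upstream vertex (simplified to strings here).
        Map<String, ShipStrategy> inputs =
                Map.of("source-a", ShipStrategy.HASH, "source-b", ShipStrategy.REBALANCE);
        // Equivalent of jobTopology.get(v).getInputs().values(): one entry per input edge.
        System.out.println(inputs.values()); // e.g. [HASH, REBALANCE] (Map.of order is unspecified)
    }
}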

Diff for: flink-autoscaler/src/main/java/org/apache/flink/autoscaler/topology/JobTopology.java

+3 −3

@@ -61,7 +61,7 @@ public JobTopology(VertexInfo... vertexInfo) {

     public JobTopology(Set<VertexInfo> vertexInfo) {

-        Map<JobVertexID, Map<JobVertexID, String>> vertexOutputs = new HashMap<>();
+        Map<JobVertexID, Map<JobVertexID, ShipStrategy>> vertexOutputs = new HashMap<>();
         vertexInfos =
                 ImmutableMap.copyOf(
                         vertexInfo.stream().collect(Collectors.toMap(VertexInfo::getId, v -> v)));
@@ -145,7 +145,7 @@ public static JobTopology fromJsonPlan(

         for (JsonNode node : nodes) {
             var vertexId = JobVertexID.fromHexString(node.get("id").asText());
-            var inputs = new HashMap<JobVertexID, String>();
+            var inputs = new HashMap<JobVertexID, ShipStrategy>();
             var ioMetrics = metrics.get(vertexId);
             var finished = finishedVertices.contains(vertexId);
             vertexInfo.add(
@@ -160,7 +160,7 @@ public static JobTopology fromJsonPlan(
             for (JsonNode input : node.get("inputs")) {
                 inputs.put(
                         JobVertexID.fromHexString(input.get("id").asText()),
-                        input.get("ship_strategy").asText());
+                        ShipStrategy.of(input.get("ship_strategy").asText()));
             }
         }
     }

Diff for: flink-autoscaler/src/main/java/org/apache/flink/autoscaler/topology/ShipStrategy.java

+55 −0

@@ -0,0 +1,55 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.flink.autoscaler.topology;
+
+import javax.annotation.Nonnull;
+
+/** The ship strategy between 2 JobVertices. */
+public enum ShipStrategy {
+    HASH,
+
+    REBALANCE,
+
+    RESCALE,
+
+    FORWARD,
+
+    CUSTOM,
+
+    BROADCAST,
+
+    GLOBAL,
+
+    SHUFFLE,
+
+    UNKNOWN;
+
+    /**
+     * Generates a ShipStrategy from a string, or returns {@link #UNKNOWN} if the value cannot match
+     * any ShipStrategy.
+     */
+    @Nonnull
+    public static ShipStrategy of(String value) {
+        for (ShipStrategy shipStrategy : ShipStrategy.values()) {
+            if (shipStrategy.toString().equalsIgnoreCase(value)) {
+                return shipStrategy;
+            }
+        }
+        return UNKNOWN;
+    }
+}
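
A quick usage sketch (not part of the commit) of the new parser: matching against the enum constants is case-insensitive, and any string without a matching constant falls back to UNKNOWN; the input values below are only examples.

import org.apache.flink.autoscaler.topology.ShipStrategy;

public class ShipStrategyOfSketch {
    public static void main(String[] args) {
        System.out.println(ShipStrategy.of("HASH"));     // HASH
        System.out.println(ShipStrategy.of("forward"));  // FORWARD (case-insensitive match)
        System.out.println(ShipStrategy.of("whatever")); // UNKNOWN (no matching constant)
    }
}

This is what JobTopology.fromJsonPlan relies on above: ship_strategy strings taken from the JSON plan map to typed values, and unexpected strings degrade to UNKNOWN instead of failing.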

Diff for: flink-autoscaler/src/main/java/org/apache/flink/autoscaler/topology/VertexInfo.java

+8 −5

@@ -31,10 +31,10 @@ public class VertexInfo {
     private final JobVertexID id;

     // All input vertices and the ship_strategy
-    private final Map<JobVertexID, String> inputs;
+    private final Map<JobVertexID, ShipStrategy> inputs;

     // All output vertices and the ship_strategy
-    private Map<JobVertexID, String> outputs;
+    private Map<JobVertexID, ShipStrategy> outputs;

     private final int parallelism;

@@ -48,7 +48,7 @@ public class VertexInfo {

     public VertexInfo(
             JobVertexID id,
-            Map<JobVertexID, String> inputs,
+            Map<JobVertexID, ShipStrategy> inputs,
             int parallelism,
             int maxParallelism,
             boolean finished,
@@ -65,7 +65,7 @@ public VertexInfo(
     @VisibleForTesting
     public VertexInfo(
             JobVertexID id,
-            Map<JobVertexID, String> inputs,
+            Map<JobVertexID, ShipStrategy> inputs,
             int parallelism,
             int maxParallelism,
             IOMetrics ioMetrics) {
@@ -74,7 +74,10 @@ public VertexInfo(

     @VisibleForTesting
     public VertexInfo(
-            JobVertexID id, Map<JobVertexID, String> inputs, int parallelism, int maxParallelism) {
+            JobVertexID id,
+            Map<JobVertexID, ShipStrategy> inputs,
+            int parallelism,
+            int maxParallelism) {
         this(id, inputs, parallelism, maxParallelism, null);
     }
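
As a small illustration (not part of the commit), vertex infos are now constructed with typed ship strategies instead of raw strings; this uses the @VisibleForTesting convenience constructor shown above:

import org.apache.flink.autoscaler.topology.ShipStrategy;
import org.apache.flink.autoscaler.topology.VertexInfo;
import org.apache.flink.runtime.jobgraph.JobVertexID;

import java.util.Map;

public class VertexInfoSketch {
    public static void main(String[] args) {
        var source = new JobVertexID();
        // A keyed vertex behind the source: its single input edge uses the HASH ship strategy.
        var keyedVertex =
                new VertexInfo(new JobVertexID(), Map.of(source, ShipStrategy.HASH), 4, 720);
        System.out.println(keyedVertex.getInputs().values()); // [HASH]
    }
}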

Diff for: flink-autoscaler/src/main/java/org/apache/flink/autoscaler/tuning/MemoryTuning.java

+12 −9

@@ -26,6 +26,7 @@
 import org.apache.flink.autoscaler.metrics.EvaluatedScalingMetric;
 import org.apache.flink.autoscaler.metrics.ScalingMetric;
 import org.apache.flink.autoscaler.topology.JobTopology;
+import org.apache.flink.autoscaler.topology.ShipStrategy;
 import org.apache.flink.autoscaler.topology.VertexInfo;
 import org.apache.flink.autoscaler.utils.ResourceCheckUtils;
 import org.apache.flink.configuration.Configuration;
@@ -53,6 +54,8 @@
 import static org.apache.flink.autoscaler.metrics.ScalingMetric.HEAP_MEMORY_USED;
 import static org.apache.flink.autoscaler.metrics.ScalingMetric.MANAGED_MEMORY_USED;
 import static org.apache.flink.autoscaler.metrics.ScalingMetric.METASPACE_MEMORY_USED;
+import static org.apache.flink.autoscaler.topology.ShipStrategy.FORWARD;
+import static org.apache.flink.autoscaler.topology.ShipStrategy.RESCALE;

 /** Tunes the TaskManager memory. */
 public class MemoryTuning {
@@ -254,9 +257,9 @@ private static MemorySize adjustNetworkMemory(
         long maxNetworkMemory = 0;
         for (VertexInfo vertexInfo : jobTopology.getVertexInfos().values()) {
             // Add max amount of memory for each input gate
-            for (Map.Entry<JobVertexID, String> inputEntry : vertexInfo.getInputs().entrySet()) {
-                final JobVertexID inputVertexId = inputEntry.getKey();
-                final String shipStrategy = inputEntry.getValue();
+            for (var inputEntry : vertexInfo.getInputs().entrySet()) {
+                var inputVertexId = inputEntry.getKey();
+                var shipStrategy = inputEntry.getValue();
                 maxNetworkMemory +=
                         calculateNetworkSegmentNumber(
                                 updatedParallelisms.get(vertexInfo.getId()),
@@ -268,9 +271,9 @@ private static MemorySize adjustNetworkMemory(
             }
             // Add max amount of memory for each output gate
             // Usually, there is just one output per task
-            for (Map.Entry<JobVertexID, String> outputEntry : vertexInfo.getOutputs().entrySet()) {
-                final JobVertexID outputVertexId = outputEntry.getKey();
-                final String shipStrategy = outputEntry.getValue();
+            for (var outputEntry : vertexInfo.getOutputs().entrySet()) {
+                var outputVertexId = outputEntry.getKey();
+                var shipStrategy = outputEntry.getValue();
                 maxNetworkMemory +=
                         calculateNetworkSegmentNumber(
                                 updatedParallelisms.get(vertexInfo.getId()),
@@ -300,15 +303,15 @@ private static MemorySize adjustNetworkMemory(
     static int calculateNetworkSegmentNumber(
             int currentVertexParallelism,
             int connectedVertexParallelism,
-            String shipStrategy,
+            ShipStrategy shipStrategy,
             int buffersPerChannel,
             int floatingBuffers) {
         // TODO When the parallelism is changed via the rescale api, the FORWARD may be changed to
         // RESCALE. This logic may needs to be updated after FLINK-33123.
         if (currentVertexParallelism == connectedVertexParallelism
-                && "FORWARD".equals(shipStrategy)) {
+                && FORWARD.equals(shipStrategy)) {
             return buffersPerChannel + floatingBuffers;
-        } else if ("FORWARD".equals(shipStrategy) || "RESCALE".equals(shipStrategy)) {
+        } else if (FORWARD.equals(shipStrategy) || RESCALE.equals(shipStrategy)) {
             final int channelCount =
                     (int) Math.ceil(connectedVertexParallelism / (double) currentVertexParallelism);
             return channelCount * buffersPerChannel + floatingBuffers;
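
To make the branch arithmetic above concrete, a standalone sketch (not part of the commit; the buffer counts are illustrative values, not Flink defaults) of the two cases visible in calculateNetworkSegmentNumber:

public class NetworkSegmentSketch {

    enum ShipStrategy { FORWARD, RESCALE }

    // Mirrors only the two branches shown in the hunk above; other ship strategies are
    // handled by code outside this diff.
    static int segments(
            int currentParallelism,
            int connectedParallelism,
            ShipStrategy shipStrategy,
            int buffersPerChannel,
            int floatingBuffers) {
        if (currentParallelism == connectedParallelism && shipStrategy == ShipStrategy.FORWARD) {
            return buffersPerChannel + floatingBuffers;
        }
        int channelCount =
                (int) Math.ceil(connectedParallelism / (double) currentParallelism);
        return channelCount * buffersPerChannel + floatingBuffers;
    }

    public static void main(String[] args) {
        // FORWARD with equal parallelism (4 -> 4): one channel, 2 + 8 = 10 segments.
        System.out.println(segments(4, 4, ShipStrategy.FORWARD, 2, 8));
        // RESCALE fanning out (4 -> 12): ceil(12 / 4) = 3 channels, 3 * 2 + 8 = 14 segments.
        System.out.println(segments(4, 12, ShipStrategy.RESCALE, 2, 8));
    }
}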

Diff for: flink-autoscaler/src/test/java/org/apache/flink/autoscaler/BacklogBasedScalingTest.java

+5 −4

@@ -45,6 +45,7 @@

 import static org.apache.flink.autoscaler.JobAutoScalerImpl.AUTOSCALER_ERROR;
 import static org.apache.flink.autoscaler.TestingAutoscalerUtils.createDefaultJobAutoScalerContext;
+import static org.apache.flink.autoscaler.topology.ShipStrategy.REBALANCE;
 import static org.assertj.core.api.Assertions.assertThat;
 import static org.junit.jupiter.api.Assertions.assertEquals;
 import static org.junit.jupiter.api.Assertions.assertTrue;
@@ -81,7 +82,7 @@ public void setup() {
                         new VertexInfo(source1, Map.of(), 1, 720, new IOMetrics(0, 0, 0)),
                         new VertexInfo(
                                 sink,
-                                Map.of(source1, "REBALANCE"),
+                                Map.of(source1, REBALANCE),
                                 1,
                                 720,
                                 new IOMetrics(0, 0, 0))));
@@ -157,7 +158,7 @@ public void test() throws Exception {
         metricsCollector.setJobTopology(
                 new JobTopology(
                         new VertexInfo(source1, Map.of(), 4, 24),
-                        new VertexInfo(sink, Map.of(source1, "REBALANCE"), 4, 720)));
+                        new VertexInfo(sink, Map.of(source1, REBALANCE), 4, 720)));

         metricsCollector.updateMetrics(
                 source1,
@@ -239,7 +240,7 @@ public void test() throws Exception {
         metricsCollector.setJobTopology(
                 new JobTopology(
                         new VertexInfo(source1, Map.of(), 2, 24),
-                        new VertexInfo(sink, Map.of(source1, "REBALANCE"), 2, 720)));
+                        new VertexInfo(sink, Map.of(source1, REBALANCE), 2, 720)));

         /* Test stability while processing backlog. */

@@ -361,7 +362,7 @@ public void shouldTrackRestartDurationCorrectly() throws Exception {
         metricsCollector.setJobTopology(
                 new JobTopology(
                         new VertexInfo(source1, Map.of(), 4, 720),
-                        new VertexInfo(sink, Map.of(source1, "REBALANCE"), 4, 720)));
+                        new VertexInfo(sink, Map.of(source1, REBALANCE), 4, 720)));

         var expectedEndTime = Instant.ofEpochMilli(10);
         metricsCollector.setJobUpdateTs(expectedEndTime);