ray-project · bveeramani · Nov 25, 2025 · Nov 17, 2025 · Nov 17, 2025 · Nov 17, 2025
diff --git a/release/release_data_tests.yaml b/release/release_data_tests.yaml
@@ -178,22 +178,32 @@
 
   matrix:
     setup:
-      # This test consistently fails on fixed-size clusters due to head OOM from
-      # too many objects references on the head node. So, we only run it on
-      # autoscaling clusters.
-      scaling: [autoscaling]
+      scaling: [fixed_size]
       shuffle_strategy: [sort_shuffle_pull_based, hash_shuffle]
       columns:
         - "column08 column13 column14"   # 84 groups
         - "column02 column14"  # 7M groups
 
+    adjustments:
+      # Ray Data OOMs with hash shuffle on autoscaling clusters, so autoscaling
+      # variants are added here with sort shuffle only. For more information, see
+      # https://github.com/ray-project/ray/issues/58734.
+      - with:
+          scaling: autoscaling
+          shuffle_strategy: sort_shuffle_pull_based
+          columns: "column08 column13 column14"
+      - with:
+          scaling: autoscaling
+          shuffle_strategy: sort_shuffle_pull_based
+          columns: "column02 column14"
+
   cluster:
     cluster_compute: "{{scaling}}_all_to_all_compute.yaml"
 
   run:
     timeout: 3600
     script: >
-      python groupby_benchmark.py --sf 10 --map-groups --group-by {{columns}}
+      python groupby_benchmark.py --sf 100 --map-groups --group-by {{columns}}
       --shuffle-strategy {{shuffle_strategy}}
 
 ###############