ROCm · neoblizz · Nov 17, 2025 · Nov 18, 2025 · Nov 18, 2025 · Nov 18, 2025
@@ -36,9 +36,10 @@ if [ "$CONTAINER_RUNTIME" = "apptainer" ]; then
 
 elif [ "$CONTAINER_RUNTIME" = "docker" ]; then
     echo "[INFO] Checking Docker images..."
-    IMAGE_NAME="iris-dev-triton-aafec41"
+    # Use GitHub variable if set, otherwise default to iris-dev
+    IMAGE_NAME=${DOCKER_IMAGE_NAME:-"iris-dev"}
 
-    # Check if the triton image exists
+    # Check if the image exists
     if docker image inspect "$IMAGE_NAME" &> /dev/null; then
         echo "[INFO] Using existing Docker image: $IMAGE_NAME"
     else

@@ -86,7 +86,9 @@ if [ "$CONTAINER_RUNTIME" = "apptainer" ]; then
     exit $EXIT_CODE
 
 elif [ "$CONTAINER_RUNTIME" = "docker" ]; then
-    IMAGE_NAME=${CUSTOM_IMAGE:-${DOCKER_IMAGE_NAME:-"iris-dev-triton-aafec41"}}
+    # Use custom image if provided, otherwise use GitHub variable or default
+    # GitHub Actions sets DOCKER_IMAGE_NAME, locally defaults to iris-dev
+    IMAGE_NAME=${CUSTOM_IMAGE:-${DOCKER_IMAGE_NAME:-"iris-dev"}}
 
     if ! docker image inspect "$IMAGE_NAME" &> /dev/null; then
         echo "[ERROR] Docker image $IMAGE_NAME not found" >&2

@@ -25,7 +25,8 @@ if [ "$CONTAINER_RUNTIME" = "apptainer" ]; then
     bash apptainer/run.sh "$@"
 elif [ "$CONTAINER_RUNTIME" = "docker" ]; then
     echo "[INFO] Running with Docker..."
-    IMAGE_NAME=${1:-"iris-dev-triton-aafec41"}
+    # Use GitHub variable if set, otherwise default to iris-dev
+    IMAGE_NAME=${1:-${DOCKER_IMAGE_NAME:-"iris-dev"}}
     WORKSPACE_DIR=${2:-"$(pwd)"}
     bash docker/run.sh "$IMAGE_NAME" "$WORKSPACE_DIR"
 fi

@@ -3,16 +3,28 @@
 # Copyright (c) 2025 Advanced Micro Devices, Inc. All rights reserved.
 #
 # Run Iris tests in a container
-# Usage: run_tests.sh <num_ranks> [gpu_devices]
+# Usage: run_tests.sh <test_dir> <num_ranks> [gpu_devices]
+#   test_dir: subdirectory under tests/ (e.g., examples, unittests, ccl)
+#   num_ranks: number of GPU ranks (1, 2, 4, or 8)
+#   gpu_devices: comma-separated GPU device IDs (optional)
 
 set -e
 
-NUM_RANKS=$1
-GPU_DEVICES=${2:-""}
+TEST_DIR=$1
+NUM_RANKS=$2
+GPU_DEVICES=${3:-""}
 
-if [ -z "$NUM_RANKS" ]; then
-    echo "[ERROR] NUM_RANKS not provided"
-    echo "Usage: $0 <num_ranks> [gpu_devices]"
+if [ -z "$TEST_DIR" ] || [ -z "$NUM_RANKS" ]; then
+    echo "[ERROR] Missing required arguments"
+    echo "Usage: $0 <test_dir> <num_ranks> [gpu_devices]"
+    echo "  test_dir: examples, unittests, or ccl"
+    echo "  num_ranks: 1, 2, 4, or 8"
+    exit 1
+fi
+
+# Validate test directory
+if [ ! -d "tests/$TEST_DIR" ]; then
+    echo "[ERROR] Test directory tests/$TEST_DIR does not exist"
     exit 1
 fi
 
@@ -29,23 +41,12 @@ fi
     set -e
     pip install -e .
 
-    # Run examples tests
-    for test_file in tests/examples/test_*.py; do
-        echo \"Testing: \$test_file with $NUM_RANKS ranks\"
-        python tests/run_tests_distributed.py --num_ranks $NUM_RANKS \"\$test_file\" -v --tb=short --durations=10
+    # Run tests in the specified directory
+    for test_file in tests/$TEST_DIR/test_*.py; do
+        if [ -f \"\$test_file\" ]; then
+            echo \"Testing: \$test_file with $NUM_RANKS ranks\"
+            python tests/run_tests_distributed.py --num_ranks $NUM_RANKS \"\$test_file\" -v --tb=short --durations=10
+        fi
     done
-
-    # Run unit tests
-    for test_file in tests/unittests/test_*.py; do
-        echo \"Testing: \$test_file with $NUM_RANKS ranks\"
-        python tests/run_tests_distributed.py --num_ranks $NUM_RANKS \"\$test_file\" -v --tb=short --durations=10
-    done
-
-    # Run ccl tests
-    # DISABLED: CCL host-side APIs have issues for some data types/algorithms
-    # for test_file in tests/ccl/test_*.py; do
-    #     echo \"Testing: \$test_file with $NUM_RANKS ranks\"
-    #     python tests/run_tests_distributed.py --num_ranks $NUM_RANKS \"\$test_file\" -v --tb=short --durations=10
-    # done
 "
 
@@ -11,6 +11,9 @@ concurrency:
   group: ${{ github.workflow }}-${{ github.head_ref || github.ref }}
   cancel-in-progress: ${{ github.ref != 'refs/heads/main' }}
 
+env:
+  DOCKER_IMAGE_NAME: ${{ vars.DOCKER_IMAGE_NAME || 'iris-dev-triton-aafec41' }}
+
 jobs:
   build-container-image:
     runs-on: [self-hosted, mi3008x]

@@ -11,6 +11,9 @@ concurrency:
   group: ${{ github.workflow }}-${{ github.head_ref || github.ref }}
   cancel-in-progress: ${{ github.ref != 'refs/heads/main' }}
 
+env:
+  DOCKER_IMAGE_NAME: ${{ vars.DOCKER_IMAGE_NAME || 'iris-dev-triton-aafec41' }}
+
 jobs:
   build-container-image:
     runs-on: [self-hosted, mi3008x]