From 62a7aa2efc6e5046277952102e5379cced628244 Mon Sep 17 00:00:00 2001
From: Sai Enduri <saimanas.enduri@amd.com>
Date: Mon, 16 Jun 2025 15:19:32 -0700
Subject: [PATCH] Update CI flakes. (#7244)

---
 .github/workflows/pr-test-amd.yml | 26 +-------------------------
 test/srt/test_bench_serving.py    |  2 +-
 2 files changed, 2 insertions(+), 26 deletions(-)

diff --git a/.github/workflows/pr-test-amd.yml b/.github/workflows/pr-test-amd.yml
index afbcda40a..52499eeaa 100644
--- a/.github/workflows/pr-test-amd.yml
+++ b/.github/workflows/pr-test-amd.yml
@@ -46,7 +46,7 @@ jobs:
       - name: Evaluate Accuracy
         timeout-minutes: 30
         run: |
-          bash scripts/amd_ci_exec.sh python3 test_eval_accuracy_large.py
+          bash scripts/amd_ci_exec.sh -e SGLANG_USE_AITER=0 python3 test_eval_accuracy_large.py
           bash scripts/amd_ci_exec.sh python3 test_eval_fp8_accuracy.py
           bash scripts/amd_ci_exec.sh python3 models/test_qwen_models.py
 
@@ -266,30 +266,6 @@ jobs:
         run: |
           bash scripts/amd_ci_exec.sh python3 run_suite.py --suite per-commit-2-gpu-amd
 
-  unit-test-backend-4-gpu-amd:
-    if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
-      github.event.pull_request.draft == false
-    strategy:
-      matrix:
-        runner: [linux-mi300-gpu-4]
-    runs-on: ${{matrix.runner}}
-    steps:
-      - name: Checkout code
-        uses: actions/checkout@v4
-
-      - name: Start CI container
-        run: bash scripts/amd_ci_start_container.sh
-        env:
-          GITHUB_WORKSPACE: ${{ github.workspace }}
-
-      - name: Install dependencies
-        run: bash scripts/amd_ci_install_dependency.sh
-
-      - name: Run test
-        timeout-minutes: 40
-        run: |
-          bash scripts/amd_ci_exec.sh python3 run_suite.py --suite per-commit-4-gpu-amd
-
   unit-test-backend-8-gpu-amd:
     if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
       github.event.pull_request.draft == false
diff --git a/test/srt/test_bench_serving.py b/test/srt/test_bench_serving.py
index f7317b191..3626ed81e 100644
--- a/test/srt/test_bench_serving.py
+++ b/test/srt/test_bench_serving.py
@@ -31,7 +31,7 @@ class TestBenchServing(CustomTestCase):
                 f'Output throughput: {res["output_throughput"]:.2f} token/s\n'
             )
             if is_in_amd_ci():
-                self.assertGreater(res["output_throughput"], 3150)
+                self.assertGreater(res["output_throughput"], 3050)
             else:
                 self.assertGreater(res["output_throughput"], 3800)