diff --git a/scripts/ci/ci_install_dependency.sh b/scripts/ci/ci_install_dependency.sh index 83108a0e1..3f1bae524 100755 --- a/scripts/ci/ci_install_dependency.sh +++ b/scripts/ci/ci_install_dependency.sh @@ -10,6 +10,9 @@ else CU_VERSION="cu126" fi +# Clear torch compilation cache +python3 -c 'import os, shutil, tempfile, getpass; cache_dir = os.environ.get("TORCHINDUCTOR_CACHE_DIR") or os.path.join(tempfile.gettempdir(), "torchinductor_" + getpass.getuser()); shutil.rmtree(cache_dir, ignore_errors=True)' + # Kill existing processes SCRIPT_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )" bash "${SCRIPT_DIR}/../killall_sglang.sh" diff --git a/test/srt/test_dp_attention.py b/test/srt/test_dp_attention.py index f997382f9..37b89c445 100644 --- a/test/srt/test_dp_attention.py +++ b/test/srt/test_dp_attention.py @@ -44,19 +44,6 @@ class TestDPAttentionDP2TP2(CustomTestCase): def tearDownClass(cls): kill_process_tree(cls.process.pid) - def test_mmlu(self): - args = SimpleNamespace( - base_url=self.base_url, - model=self.model, - eval_name="mmlu", - num_examples=64, - num_threads=32, - ) - - metrics = run_eval(args) - print(f"{metrics=}") - self.assertGreater(metrics["score"], 0.5) - def test_mgsm_en(self): args = SimpleNamespace( base_url=self.base_url, @@ -165,19 +152,6 @@ class TestDPAttentionMinimumTokenLoadBalance(CustomTestCase): def tearDownClass(cls): kill_process_tree(cls.process.pid) - def test_mmlu(self): - args = SimpleNamespace( - base_url=self.base_url, - model=self.model, - eval_name="mmlu", - num_examples=64, - num_threads=32, - ) - - metrics = run_eval(args) - print(f"{metrics=}") - self.assertGreater(metrics["score"], 0.5) - def test_mgsm_en(self): args = SimpleNamespace( base_url=self.base_url,