From 32318178611b2cbbeddb272e8388ea25f4b64cf5 Mon Sep 17 00:00:00 2001 From: Lianmin Zheng Date: Sun, 29 Dec 2024 23:05:50 -0800 Subject: [PATCH] Revert "[feat] Add math eval to CI" (#2656) --- test/srt/test_eval_accuracy_large.py | 11 ----------- test/srt/test_eval_accuracy_mini.py | 12 ------------ 2 files changed, 23 deletions(-) diff --git a/test/srt/test_eval_accuracy_large.py b/test/srt/test_eval_accuracy_large.py index bda6053ee..f7fb3cec3 100644 --- a/test/srt/test_eval_accuracy_large.py +++ b/test/srt/test_eval_accuracy_large.py @@ -68,17 +68,6 @@ class TestEvalAccuracyLarge(unittest.TestCase): metrics = run_eval(args) self.assertGreater(metrics["score"], 0.835) - def test_math(self): - args = SimpleNamespace( - base_url=self.base_url, - model=self.model, - eval_name="math", - num_examples=5000, - num_threads=1024 - ) - - metrics = run_eval(args) - self.assertGreaterEqual(metrics["score"], 0.519 - 0.01) # -1% to account for sampling variance if __name__ == "__main__": unittest.main() diff --git a/test/srt/test_eval_accuracy_mini.py b/test/srt/test_eval_accuracy_mini.py index 74741aba5..a008c3869 100644 --- a/test/srt/test_eval_accuracy_mini.py +++ b/test/srt/test_eval_accuracy_mini.py @@ -37,18 +37,6 @@ class TestEvalAccuracyMini(unittest.TestCase): metrics = run_eval(args) self.assertGreaterEqual(metrics["score"], 0.65) - def test_math(self): - args = SimpleNamespace( - base_url=self.base_url, - model=self.model, - eval_name="math", - num_examples=64, - num_threads=32, - temperature=0.1, - ) - metrics = run_eval(args) - self.assertGreaterEqual(metrics["score"], 0.519 - 0.03) # -3% to account for sampling variance - if __name__ == "__main__": unittest.main()