fix: update dsv3 fp4 ut (#10584)

This commit is contained in:
Yineng Zhang
2025-09-17 14:34:58 -07:00
committed by GitHub
parent b73ac629cd
commit 564050766d

View File

@@ -141,8 +141,8 @@ class TestDeepseekV3FP4MTP(CustomTestCase):
f'{metrics["accuracy"]=:.3f}\n'
f"{avg_spec_accept_length=:.2f}\n"
)
-self.assertGreater(metrics["accuracy"], 0.935)
-self.assertGreater(avg_spec_accept_length, 2.9)
+self.assertGreater(metrics["accuracy"], 0.94)
+self.assertGreater(avg_spec_accept_length, 2.04)
def test_bs_1_speed(self):
args = BenchArgs(port=int(self.base_url.split(":")[-1]), max_new_tokens=2048)
@@ -156,8 +156,8 @@ class TestDeepseekV3FP4MTP(CustomTestCase):
f"{acc_length=:.2f}\n"
f"{speed=:.2f} token/s\n"
)
-self.assertGreater(acc_length, 2.9)
-self.assertGreater(speed, 130)
+self.assertGreater(acc_length, 2.04)
+self.assertGreater(speed, 150)
class TestDeepseekV3FP4CutlassMoE(CustomTestCase):