Support gathering expert distribution details (#6665)
This commit is contained in:
@@ -23,9 +23,8 @@ class TestExpertDistribution(CustomTestCase):
|
||||
dict(model_path="deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct"),
|
||||
dict(model_path="Qwen/Qwen1.5-MoE-A2.7B"),
|
||||
dict(model_path="Qwen/Qwen1.5-MoE-A2.7B", tp_size=2),
|
||||
# TODO enable in next PR
|
||||
# dict(model_path="Qwen/Qwen1.5-MoE-A2.7B", mode="per_pass"),
|
||||
# dict(model_path="Qwen/Qwen1.5-MoE-A2.7B", mode="per_token"),
|
||||
dict(model_path="Qwen/Qwen1.5-MoE-A2.7B", mode="per_pass"),
|
||||
dict(model_path="Qwen/Qwen1.5-MoE-A2.7B", mode="per_token"),
|
||||
]:
|
||||
with self.subTest(info=info):
|
||||
self._execute_core(**info)
|
||||
|
||||
Reference in New Issue
Block a user