refactor qwen moe code, use communicator to support tp+dp (#6581)
This commit is contained in:
@@ -146,7 +146,7 @@ class TestDisaggregationAccuracy(CustomTestCase):
|
||||
self.assertGreater(metrics["accuracy"], 0.62)
|
||||
|
||||
def test_logprob(self):
|
||||
prompt = "The capital of taiwan is "
|
||||
prompt = "The capital of france is "
|
||||
response = requests.post(
|
||||
self.lb_url + "/generate",
|
||||
json={
|
||||
|
||||
Reference in New Issue
Block a user