DP Enhancement (#8280)

This commit is contained in:
Cheng Wan
2025-07-24 21:36:21 -07:00
committed by GitHub
parent 28d4d47280
commit c0fb25e949
20 changed files with 665 additions and 1116 deletions

View File

@@ -35,7 +35,7 @@ class TestPureDP(CustomTestCase):
"--cuda-graph-max-bs",
"128",
"--max-running-requests",
-"128",
+"512",
"--mem-fraction-static",
"0.5",
],
@@ -81,7 +81,7 @@ class TestHybridDPTP(CustomTestCase):
"--cuda-graph-max-bs",
"128",
"--max-running-requests",
-"128",
+"256",
],
)
@@ -170,7 +170,7 @@ class TestNoGatherdBuffer(CustomTestCase):
"--cuda-graph-max-bs",
"32",
"--max-running-requests",
-"128",
+"512",
],
)
@@ -217,7 +217,7 @@ class TestTBO(CustomTestCase):
"--cuda-graph-max-bs",
"128",
"--max-running-requests",
-"128",
+"512",
],
)
@@ -273,7 +273,7 @@ class TestMTP(CustomTestCase):
"--cuda-graph-max-bs",
"32",
"--max-running-requests",
-"32",
+"64",
],
)
@@ -343,7 +343,7 @@ class TestMTPWithTBO(CustomTestCase):
"--cuda-graph-max-bs",
"32",
"--max-running-requests",
-"32",
+"128",
],
)

File diff suppressed because it is too large Load Diff