[Feature] Support EAGLE 3 (#4247)

This commit is contained in:
James Liu
2025-03-18 10:35:23 -04:00
committed by GitHub
parent 8baf9a0c18
commit 9e0186f352
11 changed files with 385 additions and 22 deletions

View File

@@ -287,7 +287,10 @@ class ServerArgs:
# NEXTN shares the same implementation of EAGLE
self.speculative_algorithm = "EAGLE"
-if self.speculative_algorithm == "EAGLE":
+if (
+self.speculative_algorithm == "EAGLE"
+or self.speculative_algorithm == "EAGLE3"
+):
if self.max_running_requests is None:
self.max_running_requests = 32
self.disable_overlap_schedule = True
@@ -779,7 +782,7 @@ class ServerArgs:
parser.add_argument(
"--speculative-algorithm",
type=str,
-choices=["EAGLE", "NEXTN"],
+choices=["EAGLE", "EAGLE3", "NEXTN"],
help="Speculative algorithm.",
)
parser.add_argument(