Update CI threshold & Improve code style (#2159)

This commit is contained in:
Lianmin Zheng
2024-11-24 06:29:38 -08:00
committed by GitHub
parent e3938b2f9c
commit 5652c56535
8 changed files with 126 additions and 41 deletions

View File

@@ -212,6 +212,7 @@ def extend(reqs, model_runner):
token_to_kv_pool=model_runner.token_to_kv_pool,
tree_cache=None,
model_config=model_runner.model_config,
enable_overlap=False,
)
batch.prepare_for_extend()
model_worker_batch = batch.get_model_worker_batch()