Report median instead of mean in bench_latency.py (#1269)

This commit is contained in:
Lianmin Zheng
2024-08-30 06:05:01 -07:00
committed by GitHub
parent 55f5976b42
commit 79ece2c51f
3 changed files with 8 additions and 14 deletions

View File

@@ -50,8 +50,6 @@ for name, cls in _CONFIG_REGISTRY.items():
with contextlib.suppress(ValueError):
AutoConfig.register(name, cls)
from sglang.srt.utils import is_multimodal_model
def download_from_hf(model_path: str):
if os.path.exists(model_path):
@@ -60,12 +58,6 @@ def download_from_hf(model_path: str):
return snapshot_download(model_path, allow_patterns=["*.json", "*.bin", "*.model"])
def get_config_json(model_path: str):
    """Load and return the parsed ``configs.json`` found under *model_path*.

    Args:
        model_path: Directory that contains the ``configs.json`` file.

    Returns:
        The deserialized JSON content, as produced by ``json.load``.

    Raises:
        FileNotFoundError: If ``configs.json`` does not exist in *model_path*.
        json.JSONDecodeError: If the file is not valid JSON.
    """
    # NOTE(review): the file name is "configs.json" (plural); confirm this is
    # the intended name for the checkpoints this helper is used with.
    config_file = os.path.join(model_path, "configs.json")
    # JSON text is UTF-8; be explicit so parsing does not depend on the
    # platform's locale encoding.
    with open(config_file, encoding="utf-8") as f:
        return json.load(f)
def get_config(
model: str,
trust_remote_code: bool,