Allow overriding flashinfer use_tensorcore (#2169)

This commit is contained in:
Lianmin Zheng
2024-11-24 20:58:17 -08:00
committed by GitHub
parent dd44173dad
commit 8e1adb8441
6 changed files with 18 additions and 10 deletions

View File

@@ -407,7 +407,7 @@ async def async_request_profile(api_url: str) -> RequestFuncOutput:
def get_model(pretrained_model_name_or_path: str) -> str:
if os.getenv("SGLANG_USE_MODELSCOPE", "False").lower() == "true":
if os.getenv("SGLANG_USE_MODELSCOPE", "false").lower() == "true":
import huggingface_hub.constants
from modelscope import snapshot_download