Support weight loading without mmap (#7469)

This commit is contained in:
Yuhong Guo
2025-06-24 06:13:59 +08:00
committed by GitHub
parent e5ddeb04d5
commit e5afb88b1c
4 changed files with 21 additions and 2 deletions

View File

@@ -101,6 +101,7 @@ GLOBAL_SERVER_ARGS_KEYS = [
"torchao_config",
"triton_attention_reduce_in_fp32",
"num_reserved_decode_tokens",
"weight_loader_disable_mmap",
]
# Put some global args for easy access