Pr fix max workers (#1456)
Co-authored-by: baolujia <baolujia@shizhuang-inc.com> Co-authored-by: Lianmin Zheng <lianminzheng@gmail.com>
This commit is contained in:
@@ -123,6 +123,7 @@ class TokenizerManager:
 initializer=init_global_processor,
 mp_context=mp.get_context("fork"),
 initargs=(server_args,),
+max_workers=os.environ.get("SGLANG_CPU_COUNT", os.cpu_count()),
 )
 else:
 self.tokenizer = get_tokenizer(
Reference in New Issue
Block a user