Files
sglang/python/sglang/global_config.py

38 lines
1.0 KiB
Python
Raw Normal View History

"""Global configurations"""
2024-09-15 08:52:18 -07:00
import os
class GlobalConfig:
    """Container for process-wide configuration values.

    Every setting is a plain instance attribute assigned in ``__init__``.
    All of them are hard-coded defaults except ``flashinfer_workspace_size``,
    which can be overridden through the ``FLASHINFER_WORKSPACE_SIZE``
    environment variable.
    """

    def __init__(self):
        """Populate all configuration attributes with their defaults.

        Raises:
            ValueError: If ``FLASHINFER_WORKSPACE_SIZE`` is set in the
                environment but is not a valid integer literal.
        """
        # Verbosity level
        # 0: do not output anything
        # 2: output final text after every run
        self.verbosity = 0

        # Default backend of the language
        self.default_backend = None

        # Runtime constants: New generation token ratio estimation
        self.init_new_token_ratio = 0.7
        self.base_min_new_token_ratio = 0.1
        self.new_token_ratio_decay = 0.001

        # Runtime constants: others
        self.num_continue_decode_steps = 10
        self.retract_decode_steps = 20
        # Environment values are always strings, so convert explicitly; this
        # keeps the attribute an int whether or not the variable is set.
        # NOTE(review): the default is presumably a size in bytes (384 MiB) --
        # confirm against the code that consumes this value.
        self.flashinfer_workspace_size = int(
            os.environ.get("FLASHINFER_WORKSPACE_SIZE", 384 * 1024 * 1024)
        )

        # Output tokenization configs
        self.skip_special_tokens_in_output = True
        self.spaces_between_special_tokens_in_out = True

        # Interpreter optimization configs
        self.enable_precache_with_tracing = True
        self.enable_parallel_encoding = True
2024-07-13 23:39:37 -07:00
# Module-level GlobalConfig instance, constructed once when this module is imported.
global_config = GlobalConfig()