[DP Attention] Refactor: adding some utility functions (#9136)
This commit is contained in:
@@ -84,7 +84,6 @@ GLOBAL_SERVER_ARGS_KEYS = [
|
||||
"device",
|
||||
"disable_chunked_prefix_cache",
|
||||
"disable_radix_cache",
|
||||
"enable_dp_attention",
|
||||
"enable_two_batch_overlap",
|
||||
"tbo_token_distribution_threshold",
|
||||
"enable_dp_lm_head",
|
||||
|
||||
Reference in New Issue
Block a user