Simplify the nan detection and greedy check in sampler (#1709)
This commit is contained in:
@@ -53,6 +53,7 @@ global_server_args_dict = {
|
||||
"triton_attention_reduce_in_fp32": ServerArgs.triton_attention_reduce_in_fp32,
|
||||
"disable_mla": ServerArgs.disable_mla,
|
||||
"torchao_config": ServerArgs.torchao_config,
|
||||
"disable_nan_detection": ServerArgs.disable_nan_detection,
|
||||
}
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user