Use cutlass fp4 gemm by default (#11813)
This commit is contained in:
@@ -79,7 +79,7 @@ CUTEDSL_MOE_SCALAR_INPUT_SCALE = get_bool_env_var(
|
|||||||
"SGLANG_CUTEDSL_MOE_SCALAR_INPUT_SCALE", "true"
|
"SGLANG_CUTEDSL_MOE_SCALAR_INPUT_SCALE", "true"
|
||||||
)
|
)
|
||||||
USE_CUTLASS_BACKEND_FOR_FP4_GEMM = get_bool_env_var(
|
USE_CUTLASS_BACKEND_FOR_FP4_GEMM = get_bool_env_var(
|
||||||
"SGLANG_USE_CUTLASS_BACKEND_FOR_FP4_GEMM"
|
"SGLANG_USE_CUTLASS_BACKEND_FOR_FP4_GEMM", "true"
|
||||||
)
|
)
|
||||||
# TODO make it true by default when the DeepEP PR is merged
|
# TODO make it true by default when the DeepEP PR is merged
|
||||||
CUTEDSL_MOE_NVFP4_DISPATCH = get_bool_env_var(
|
CUTEDSL_MOE_NVFP4_DISPATCH = get_bool_env_var(
|
||||||
|
|||||||
Reference in New Issue
Block a user