Add compile flags for cutlass 3.x (#3013)

Co-authored-by: HandH1998 <1335248067@qq.com>
This commit is contained in:
Ke Bao
2025-01-21 00:04:12 +08:00
committed by GitHub
parent 41a0ccd4f1
commit 5dfcacfcb1

View File

@@ -30,6 +30,7 @@ include_dirs = [
root / "src" / "sgl-kernel" / "csrc",
]
nvcc_flags = [
"-DNDEBUG",
"-O3",
"-Xcompiler",
"-fPIC",
@@ -37,6 +38,7 @@ nvcc_flags = [
"-gencode=arch=compute_80,code=sm_80",
"-gencode=arch=compute_89,code=sm_89",
"-gencode=arch=compute_90,code=sm_90",
"-gencode=arch=compute_90a,code=sm_90a",
"-U__CUDA_NO_HALF_OPERATORS__",
"-U__CUDA_NO_HALF2_OPERATORS__",
]