diff --git a/sgl-kernel/setup.py b/sgl-kernel/setup.py index 25319af7a..9f9867113 100644 --- a/sgl-kernel/setup.py +++ b/sgl-kernel/setup.py @@ -30,6 +30,7 @@ include_dirs = [ root / "src" / "sgl-kernel" / "csrc", ] nvcc_flags = [ + "-DNDEBUG", "-O3", "-Xcompiler", "-fPIC", @@ -37,6 +38,7 @@ nvcc_flags = [ "-gencode=arch=compute_80,code=sm_80", "-gencode=arch=compute_89,code=sm_89", "-gencode=arch=compute_90,code=sm_90", + "-gencode=arch=compute_90a,code=sm_90a", "-U__CUDA_NO_HALF_OPERATORS__", "-U__CUDA_NO_HALF2_OPERATORS__", ]