@@ -22,7 +22,9 @@ find_package(CUDAToolkit REQUIRED)
22
22
set_property (GLOBAL PROPERTY CUDA_SEPARABLE_COMPILATION ON )
23
23
24
24
message (STATUS "Detected CUDA_VERSION=${CUDA_VERSION} " )
25
- if ("${CUDA_VERSION} " VERSION_GREATER_EQUAL "12.8" )
25
+ if ("${CUDA_VERSION} " VERSION_GREATER_EQUAL "13.0" )
26
+ message ("CUDA_VERSION ${CUDA_VERSION} >= 13.0" )
27
+ elseif ("${CUDA_VERSION} " VERSION_GREATER_EQUAL "12.8" )
26
28
message ("CUDA_VERSION ${CUDA_VERSION} >= 12.8" )
27
29
elseif ("${CUDA_VERSION} " VERSION_GREATER_EQUAL "12.4" )
28
30
message ("CUDA_VERSION ${CUDA_VERSION} >= 12.4" )
@@ -128,9 +130,16 @@ option(SGL_KERNEL_ENABLE_FP8 "Enable FP8" ON)
128
130
option (SGL_KERNEL_ENABLE_FP4 "Enable FP4" OFF )
129
131
option (SGL_KERNEL_ENABLE_FA3 "Enable FA3" OFF )
130
132
131
- if ("${CUDA_VERSION} " VERSION_GREATER_EQUAL "12.8" OR SGL_KERNEL_ENABLE_SM100A )
133
+ if ("${CUDA_VERSION} " VERSION_GREATER_EQUAL "13.0" OR SGL_KERNEL_ENABLE_SM100A )
134
+ list (APPEND SGL_KERNEL_CUDA_FLAGS
135
+ "-gencode=arch=compute_100,code=sm_110"
136
+ "-gencode=arch=compute_100a,code=sm_110a"
137
+ )
138
+ elseif ("${CUDA_VERSION} " VERSION_GREATER_EQUAL "12.8" OR SGL_KERNEL_ENABLE_SM100A )
132
139
list (APPEND SGL_KERNEL_CUDA_FLAGS
133
140
"-gencode=arch=compute_100,code=sm_100"
141
+ "-gencode=arch=compute_100,code=sm_101"
142
+ "-gencode=arch=compute_100,code=sm_101a"
134
143
"-gencode=arch=compute_100a,code=sm_100a"
135
144
"-gencode=arch=compute_120,code=sm_120"
136
145
)
0 commit comments