Skip to content

Commit af6de8c

Browse files
committed
[https://nvbugs/5545522][fix] Correct Cutlass with PDL support
Signed-off-by: Jin Li <[email protected]>
1 parent 2cde4e4 commit af6de8c

File tree

2 files changed

+5
-1
lines changed

2 files changed

+5
-1
lines changed

cpp/tensorrt_llm/kernels/cutlass_kernels/CMakeLists.txt

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -65,6 +65,8 @@ function(process_target target_name enable_hopper enable_blackwell)
6565
if(${enable_hopper} AND "90" IN_LIST CMAKE_CUDA_ARCHITECTURES_ORIG)
6666
# No kernels should be parsed, unless hopper is specified. This is a build
6767
# time improvement
68+
target_compile_options(${target_name}
69+
PRIVATE "-DCUTLASS_ENABLE_GDC_FOR_SM90=1")
6870
target_compile_definitions(${target_name} PUBLIC COMPILE_HOPPER_TMA_GEMMS)
6971
target_compile_definitions(${target_name}
7072
PUBLIC COMPILE_HOPPER_TMA_GROUPED_GEMMS)
@@ -77,6 +79,8 @@ function(process_target target_name enable_hopper enable_blackwell)
7779
OR "121" IN_LIST CMAKE_CUDA_ARCHITECTURES_ORIG
7880
))
7981

82+
target_compile_options(${target_name}
83+
PRIVATE "-DCUTLASS_ENABLE_GDC_FOR_SM100=1")
8084
# Both 100 and 103 support these kernels
8185
if("100" IN_LIST CMAKE_CUDA_ARCHITECTURES_ORIG
8286
OR "103" IN_LIST CMAKE_CUDA_ARCHITECTURES_ORIG)

0 commit comments

Comments
 (0)