From fdb0f1950228aa2d0718f2fad2ddda3ce4a89d9b Mon Sep 17 00:00:00 2001
From: Tianlei Wu
Date: Fri, 1 May 2026 07:04:30 -0700
Subject: [PATCH] Fix cuda 13 build error

---
 onnxruntime/contrib_ops/cuda/bert/gqa_unfused_attention.cu | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/onnxruntime/contrib_ops/cuda/bert/gqa_unfused_attention.cu b/onnxruntime/contrib_ops/cuda/bert/gqa_unfused_attention.cu
index f65a041a80630..8aac549aeba01 100644
--- a/onnxruntime/contrib_ops/cuda/bert/gqa_unfused_attention.cu
+++ b/onnxruntime/contrib_ops/cuda/bert/gqa_unfused_attention.cu
@@ -4,7 +4,7 @@
 // GQA-capable unfused CUDA attention kernel. See header for contract.
 
 #include
-#include
+#include "core/providers/cuda/cu_inc/cub.cuh"
 #include
 #include
 #include "core/common/safeint.h"