libcudacxx: diagnose extended lambdas in invocability traits

Aminsed · Aminsed · commit b1c2267ff267 · 2025-11-23T01:00:58.000-05:00
diff --git a/libcudacxx/include/cuda/std/__functional/invoke.h b/libcudacxx/include/cuda/std/__functional/invoke.h
@@ -33,13 +33,39 @@
 #include <cuda/std/__type_traits/is_same.h>
 #include <cuda/std/__type_traits/is_void.h>
 #include <cuda/std/__type_traits/nat.h>
+#include <cuda/std/__type_traits/remove_cvref.h>
 #include <cuda/std/__utility/declval.h>
 #include <cuda/std/__utility/forward.h>
 
 #include <cuda/std/__cccl/prologue.h>
 
 _CCCL_BEGIN_NAMESPACE_CUDA_STD
 
+namespace __detail
+{
+
+// `__disallow_extended_lambda_invocability_v<_Fn>` is true when `_Fn`, with cv-qualifiers and
+// references removed, is the closure type of an extended `__device__` or `__host__ __device__`
+// lambda. It is `false` in every configuration where the traits below are not consulted.
+//
+// `__nv_is_extended_device_lambda_closure_type` and
+// `__nv_is_extended_host_device_lambda_closure_type` are documented as compiler-provided type
+// traits, not preprocessor macros. They are therefore used directly: probing them with
+// `defined()` would never succeed and would silently compile the whole check out.
+//
+// The traits are only consulted by NVCC, in the host pass, with extended lambdas enabled.
+#if _CCCL_CUDA_COMPILER(NVCC) && defined(__CUDACC_EXTENDED_LAMBDA__) && !_CCCL_DEVICE_COMPILATION()
+template <class _Fn>
+_CCCL_INLINE_VISIBILITY constexpr bool __disallow_extended_lambda_invocability_v =
+  __nv_is_extended_device_lambda_closure_type(remove_cvref_t<_Fn>)
+  || __nv_is_extended_host_device_lambda_closure_type(remove_cvref_t<_Fn>);
+#else
+template <class>
+_CCCL_INLINE_VISIBILITY constexpr bool __disallow_extended_lambda_invocability_v = false;
+#endif
+
+} // namespace __detail
+
 struct __any
 {
   _CCCL_API inline __any(...);
@@ -214,17 +240,35 @@ struct _CCCL_TYPE_VISIBILITY_DEFAULT invoke_result //
 
 template <class _Fn, class... _Args>
 struct _CCCL_TYPE_VISIBILITY_DEFAULT is_invocable : bool_constant<__is_invocable<_Fn, _Args...>>
-{};
+{
+  // Reject closure types of extended lambdas, as explained by the message below. The flag is
+  // defined for every configuration and is `false` wherever the check is compiled out, so no
+  // preprocessor guard is needed here. In particular the assertion must not depend on
+  // `defined()` probes of the compiler's built-in lambda traits, which are not macros.
+  static_assert(!__detail::__disallow_extended_lambda_invocability_v<_Fn>,
+                "Attempt to use an extended __device__ or __host__ __device__ lambda in a context "
+                "that requires querying its invocability in host code. Use a named function object or "
+                "cuda::proclaim_return_type instead.");
+};
 
 template <class _Ret, class _Fn, class... _Args>
 struct _CCCL_TYPE_VISIBILITY_DEFAULT is_invocable_r : bool_constant<__is_invocable_r<_Ret, _Fn, _Args...>>
-{};
+{
+  // Reject closure types of extended lambdas, as explained by the message below. The flag is
+  // defined for every configuration and is `false` wherever the check is compiled out, so no
+  // preprocessor guard is needed here. In particular the assertion must not depend on
+  // `defined()` probes of the compiler's built-in lambda traits, which are not macros.
+  static_assert(!__detail::__disallow_extended_lambda_invocability_v<_Fn>,
+                "Attempt to use an extended __device__ or __host__ __device__ lambda in a context "
+                "that requires querying its invocability in host code. Use a named function object or "
+                "cuda::proclaim_return_type instead.");
+};
 
 template <class _Fn, class... _Args>
-inline constexpr bool is_invocable_v = __is_invocable<_Fn, _Args...>;
+inline constexpr bool is_invocable_v = is_invocable<_Fn, _Args...>::value; // instantiates the class and its checks
 
 template <class _Ret, class _Fn, class... _Args>
-inline constexpr bool is_invocable_r_v = __is_invocable_r<_Ret, _Fn, _Args...>;
+inline constexpr bool is_invocable_r_v = is_invocable_r<_Ret, _Fn, _Args...>::value; // instantiates the class
 
 // is_nothrow_invocable
 
@@ -243,22 +287,40 @@ template <class _Ret, class _Fp, class... _Args>
 inline constexpr bool __nothrow_invocable_r_imp<true, true, _Ret, _Fp, _Args...> =
   noexcept(::cuda::std::__invoke(::cuda::std::declval<_Fp>(), ::cuda::std::declval<_Args>()...));
 
-template <class _Fp, class... _Args>
-inline constexpr bool is_nothrow_invocable_v =
-  __nothrow_invocable_r_imp<__is_invocable<_Fp, _Args...>, true, void, _Fp, _Args...>;
-
-template <class _Ret, class _Fp, class... _Args>
-inline constexpr bool is_nothrow_invocable_r_v =
-  __nothrow_invocable_r_imp<__is_invocable_r<_Ret, _Fp, _Args...>, is_void_v<_Ret>, _Ret, _Fp, _Args...>;
-
 template <class _Fn, class... _Args>
-struct _CCCL_TYPE_VISIBILITY_DEFAULT is_nothrow_invocable : bool_constant<is_nothrow_invocable_v<_Fn, _Args...>>
-{};
+struct _CCCL_TYPE_VISIBILITY_DEFAULT is_nothrow_invocable
+    : bool_constant<__nothrow_invocable_r_imp<__is_invocable<_Fn, _Args...>, true, void, _Fn, _Args...>>
+{
+  // Reject closure types of extended lambdas, as explained by the message below. The flag is
+  // defined for every configuration and is `false` wherever the check is compiled out, so no
+  // preprocessor guard is needed here. In particular the assertion must not depend on
+  // `defined()` probes of the compiler's built-in lambda traits, which are not macros.
+  static_assert(!__detail::__disallow_extended_lambda_invocability_v<_Fn>,
+                "Attempt to use an extended __device__ or __host__ __device__ lambda in a context "
+                "that requires querying its invocability in host code. Use a named function object or "
+                "cuda::proclaim_return_type instead.");
+};
 
 template <class _Ret, class _Fn, class... _Args>
-struct _CCCL_TYPE_VISIBILITY_DEFAULT
-is_nothrow_invocable_r : bool_constant<is_nothrow_invocable_r_v<_Ret, _Fn, _Args...>>
-{};
+struct _CCCL_TYPE_VISIBILITY_DEFAULT is_nothrow_invocable_r
+    : bool_constant<
+        __nothrow_invocable_r_imp<__is_invocable_r<_Ret, _Fn, _Args...>, is_void_v<_Ret>, _Ret, _Fn, _Args...>>
+{
+  // Reject closure types of extended lambdas, as explained by the message below. The flag is
+  // defined for every configuration and is `false` wherever the check is compiled out, so no
+  // preprocessor guard is needed here. In particular the assertion must not depend on
+  // `defined()` probes of the compiler's built-in lambda traits, which are not macros.
+  static_assert(!__detail::__disallow_extended_lambda_invocability_v<_Fn>,
+                "Attempt to use an extended __device__ or __host__ __device__ lambda in a context "
+                "that requires querying its invocability in host code. Use a named function object or "
+                "cuda::proclaim_return_type instead.");
+};
+
+template <class _Fp, class... _Args>
+inline constexpr bool is_nothrow_invocable_v = is_nothrow_invocable<_Fp, _Args...>::value; // instantiates the class
+
+template <class _Ret, class _Fp, class... _Args>
+inline constexpr bool is_nothrow_invocable_r_v = is_nothrow_invocable_r<_Ret, _Fp, _Args...>::value; // via the class
 
 // Not going directly through __invoke_result_t because we want the additional device lambda checks in invoke_result
 template <class _Fn, class... _Args>
diff --git a/libcudacxx/test/libcudacxx/std/utilities/meta/meta.rel/is_invocable.extended_device_lambda.fail.cpp b/libcudacxx/test/libcudacxx/std/utilities/meta/meta.rel/is_invocable.extended_device_lambda.fail.cpp
@@ -0,0 +1,31 @@
+//===----------------------------------------------------------------------===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+// type_traits
+
+// is_invocable should diagnose extended lambdas in host code.
+
+// UNSUPPORTED: clang && (!nvcc)
+
+#include <cuda/std/type_traits>
+
+#include "test_macros.h"
+
+template <class Fn>
+void instantiate(Fn) // Fn is deduced: a lambda inside decltype() is only valid since C++20
+{
+  (void) cuda::std::is_invocable_v<Fn>; // instantiating the trait should hit its static_assert
+}
+
+int main(int, char**)
+{
+#if TEST_CUDA_COMPILER(NVCC) || TEST_COMPILER(NVRTC)
+  instantiate([] __device__() {});
+#endif
+  return 0;
+}
diff --git a/libcudacxx/test/libcudacxx/std/utilities/meta/meta.rel/is_invocable.extended_host_device_lambda.fail.cpp b/libcudacxx/test/libcudacxx/std/utilities/meta/meta.rel/is_invocable.extended_host_device_lambda.fail.cpp
@@ -0,0 +1,31 @@
+//===----------------------------------------------------------------------===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+// type_traits
+
+// is_invocable should diagnose extended lambdas in host code.
+
+// UNSUPPORTED: clang && (!nvcc)
+
+#include <cuda/std/type_traits>
+
+#include "test_macros.h"
+
+template <class Fn>
+void instantiate(Fn) // Fn is deduced: a lambda inside decltype() is only valid since C++20
+{
+  (void) cuda::std::is_invocable_v<Fn>; // instantiating the trait should hit its static_assert
+}
+
+int main(int, char**)
+{
+#if TEST_CUDA_COMPILER(NVCC) || TEST_COMPILER(NVRTC)
+  instantiate([] __host__ __device__() {});
+#endif
+  return 0;
+}
diff --git a/libcudacxx/test/libcudacxx/std/utilities/meta/meta.rel/is_nothrow_invocable.extended_device_lambda.fail.cpp b/libcudacxx/test/libcudacxx/std/utilities/meta/meta.rel/is_nothrow_invocable.extended_device_lambda.fail.cpp
@@ -0,0 +1,31 @@
+//===----------------------------------------------------------------------===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+// type_traits
+
+// is_nothrow_invocable should diagnose extended lambdas in host code.
+
+// UNSUPPORTED: clang && (!nvcc)
+
+#include <cuda/std/type_traits>
+
+#include "test_macros.h"
+
+template <class Fn>
+void instantiate(Fn) // Fn is deduced: a lambda inside decltype() is only valid since C++20
+{
+  (void) cuda::std::is_nothrow_invocable_v<Fn>; // instantiating the trait should hit its static_assert
+}
+
+int main(int, char**)
+{
+#if TEST_CUDA_COMPILER(NVCC) || TEST_COMPILER(NVRTC)
+  instantiate([] __device__() {});
+#endif
+  return 0;
+}