We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b66a8d6 commit 5f1ef3bCopy full SHA for 5f1ef3b
cpp/include/raft/linalg/contractions.cuh
@@ -159,6 +159,12 @@ struct Policy4x4<half, _veclen> {
159
typedef KernelPolicy<half, _veclen, 64, 4, 4, 16, 16> Policy;
160
typedef ColKernelPolicy<half, _veclen, 64, 4, 4, 16, 16> ColPolicy;
161
};
162
+
163
+template <int _veclen>
164
+struct Policy4x4<uint8_t, _veclen> {
165
+ typedef KernelPolicy<uint8_t, _veclen, 64, 4, 4, 16, 16> Policy;
166
+ typedef ColKernelPolicy<uint8_t, _veclen, 64, 4, 4, 16, 16> ColPolicy;
167
+};
168
/** @} */
169
170
/**
@@ -182,6 +188,12 @@ struct Policy4x4Skinny<double, _veclen> {
182
188
typedef ColKernelPolicy<double, _veclen, 8, 4, 4, 8, 8> ColPolicy;
183
189
184
190
191
192
+struct Policy4x4Skinny<uint8_t, _veclen> {
193
+ typedef KernelPolicy<uint8_t, _veclen, 8, 4, 4, 8, 8> Policy;
194
+ typedef ColKernelPolicy<uint8_t, _veclen, 8, 4, 4, 8, 8> ColPolicy;
195
196
185
197
186
198
* @defgroup Policy2x8 16 elements per thread Policy with k-block = 16
187
199
* @{
0 commit comments