Skip to content

Commit 57e907e

Browse files
committed
Fix CI failure
1 parent 8d29fa8 commit 57e907e

File tree

2 files changed

+8
-1
lines changed

2 files changed

+8
-1
lines changed

include/cute/util/sycl_vec.hpp

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -59,10 +59,17 @@ using float2 = vector_t<float, 2>;
59 59   using float4 = vector_t<float, 4>;
60 60   using float8 = vector_t<float, 8>;
61 61
   62 + #ifndef __SYCL_DEVICE_ONLY__
   63 + using half = sycl::half;
   64 + using half2 = vector_t<half, 2>;
   65 + using half4 = vector_t<half, 4>;
   66 + using half8 = vector_t<half, 8>;
   67 + #else
62 68   using half = _Float16;
63 69   using half2 = vector_t<_Float16, 2>;
64 70   using half4 = vector_t<_Float16, 4>;
65 71   using half8 = vector_t<_Float16, 8>;
   72 + #endif
66 73
67 74   using short2 = vector_t<short, 2>;
68 75   using short4 = vector_t<short, 4>;

tools/copy_debug/copy_debug.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -117,7 +117,7 @@ void copy(int global_M, int global_N) {
117 117
118 118   auto gridDim = cutlasscompat::dim3(1);
119 119   auto blockDim = cutlasscompat::dim3(SUBGROUP_SIZE);
120     - launch<copy_kernel<CopyInstruction, decltype(tensor_S), fragment_size>, CopyKernelName<CopyInstruction, decltype(tensor_S), fragment_size>>(
    120 + launch<copy_kernel<CopyInstruction, decltype(tensor_S), fragment_size>, CopyKernelName<CopyInstruction, decltype(tensor_S)>>(
121 121   launch_policy{gridDim, blockDim,
122 122   kernel_properties{sycl_exp::sub_group_size<SUBGROUP_SIZE>}},
123 123   tensor_S);

0 commit comments

Comments
 (0)