Skip to content

Commit 0e231c3

Browse files
committed
Fix test_unit_cute_intel_xe
Fixup
1 parent 0899195 commit 0e231c3

File tree

4 files changed, with 12 additions and 11 deletions.

test/unit/CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -95,8 +95,8 @@ function(cutlass_test_unit_add_executable NAME)
9595
PUBLIC
9696
GTest::gtest
9797
# TODO: This change works for resolving 'cutlasscompat.hpp' not found issue, fix this if it blocks merging
98-
cutlass_test_unit_infra
99-
cutlass_test_unit_infra_lib
98+
# cutlass_test_unit_infra
99+
# cutlass_test_unit_infra_lib
100100
)
101101
else()
102102
target_link_libraries(

test/unit/cute/core/CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -28,7 +28,7 @@
2828

2929
cutlass_test_unit_add_executable(
3030
cutlass_test_unit_cute_core
31-
WITHOUT_CUDA
31+
# WITHOUT_CUDA
3232
array_subbyte.cpp
3333
bitfield.cpp
3434
coalesce.cpp

test/unit/cute/intel_xe/copy_block.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -265,7 +265,7 @@ struct copy_op<uint16_t, load, XE_2D_U16x2x16_ST_N, M, N, false> {
265265
}
266266
};
267267

268-
template <class load, class store, int32_t M_, int32_t N_>
268+
template <class load, class store, uint32_t M_, uint32_t N_>
269269
struct copy_op<uint32_t, load, store, M_, N_, true> {
270270
void operator()() {
271271
//

test/unit/flash_attention/flash_attention_prefill/flash_prefill_testbed_3x.hpp

Lines changed: 8 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -225,11 +225,11 @@ struct TestbedImpl {
225225
//
226226
// Methods
227227
//
228-
template <class, class, class> class convert_fp8_to_fp16_name;
228+
template <class, class> class convert_fp8_to_fp16_name;
229229

230-
template <typename SrcT, typename DstT, typename Runner>
230+
template <typename SrcT, typename DstT>
231231
void convert_fp8_to_fp16(const SrcT* d_src, DstT* d_dst, size_t size) {
232-
cutlasscompat::get_default_queue().parallel_for<convert_fp8_to_fp16_name<SrcT, DstT, Runner>>(size, [=](auto indx) {
232+
cutlasscompat::get_default_queue().parallel_for<convert_fp8_to_fp16_name<SrcT, DstT>>(size, [=](auto indx) {
233233
d_dst[indx] = static_cast<DstT>(d_src[indx]);
234234
}).wait();
235235
}
@@ -241,7 +241,7 @@ struct TestbedImpl {
241241
using outType = cute::conditional_t<is_fp8_v<Tin>, half_t, Tin>;
242242
if constexpr(is_fp8_v<Tin>) {
243243
cutlass::DeviceAllocation<outType> out(in.size());
244-
convert_fp8_to_fp16<Tin, outType, TestbedImpl>(in.get(), out.get(), in.size());
244+
convert_fp8_to_fp16<Tin, outType>(in.get(), out.get(), in.size());
245245
return out;
246246
} else {
247247
return in;
@@ -625,7 +625,7 @@ struct TestbedImpl {
625625

626626
#if !defined(SYCL_EXT_ONEAPI_WORK_GROUP_SCRATCH_MEMORY)
627627
using namespace cutlasscompat::experimental;
628-
auto event = launch<cutlass::device_kernel<FlashAttention>, FlashAttention>(
628+
auto event = launch<cutlass::device_kernel<FlashAttention>>(
629629
launch_policy{sycl_grid, sycl_block, local_mem_size{static_cast<std::size_t>(smem_size)},
630630
kernel_properties{sycl_exp::sub_group_size<FlashAttention::DispatchPolicy::SubgroupSize>}},
631631
params);
@@ -680,8 +680,9 @@ template <
680680
typename FlashAttention
681681
>
682682
struct Testbed3x {
683-
using TestBedImpl = typename detail::TestbedImpl<FlashAttention>;
684-
TestBedImpl impl_;
683+
// using TestBedImp = typename detail::TestbedImpl<FlashAttention>;
684+
// TestBedImp impl_;
685+
detail::TestbedImpl<FlashAttention> impl_;
685686

686687
//
687688
// Methods

0 commit comments

Comments
 (0)