Skip to content

Commit 838aae9

Browse files
committed
address comment
1 parent 3ef225f commit 838aae9

File tree

2 files changed

+2
-9
lines changed

2 files changed

+2
-9
lines changed

include/cutlass/epilogue/collective/xe_array_epilogue.hpp

Lines changed: 1 addition & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -439,12 +439,8 @@ class CollectiveEpilogue<
439 439
Tensor trC_ori = make_tensor<ElementC>(Shape<Int<FragmentSize>>{});
440 440
copy(params.xe_load_c.with(get<0>(load_store_tensors)), tCgD(_, epi_m, epi_n), trC_ori);
441 441
auto trC_ori_frag = recast<Array<ElementC, FragmentSize>>(trC_ori);
442-
CUTLASS_PRAGMA_UNROLL
443-
for (int i = 0; i < size(trC_frag); ++i) {
444-
trC_frag(i) = cutlass::NumericArrayConverter<typename TiledMma::ValTypeC, ElementC, FragmentSize>{}(trC_ori_frag(i));
445-
}
442+
*(trC_frag.data()) = cutlass::NumericArrayConverter<typename TiledMma::ValTypeC, ElementC, FragmentSize>{}(*(trC_ori_frag.data()));
446 443
}
447-
448 444
}
449 445

450 446
cst_callbacks.previsit(epi_m, epi_n, 0, is_C_load_needed);

include/cutlass/epilogue/collective/xe_epilogue.hpp

Lines changed: 1 addition & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -418,10 +418,7 @@ class CollectiveEpilogue<
418 418
Tensor trC_ori = make_tensor<ElementC>(Shape<Int<FragmentSize>>{});
419 419
copy(params.xe_load_c, tCgC(_, epi_m, epi_n), trC_ori);
420 420
auto trC_ori_frag = recast<Array<ElementC, FragmentSize>>(trC_ori);
421-
CUTLASS_PRAGMA_UNROLL
422-
for (int i = 0; i < size(trC_frag); ++i) {
423-
trC_frag(i) = cutlass::NumericArrayConverter<typename TiledMma::ValTypeC, ElementC, FragmentSize>{}(trC_ori_frag(i));
424-
}
421+
*(trC_frag.data()) = cutlass::NumericArrayConverter<typename TiledMma::ValTypeC, ElementC, FragmentSize>{}(*(trC_ori_frag.data()));
425 422
}
426 423
}
427 424

0 commit comments

Comments
 (0)