diff --git a/include/cute/arch/copy_xe.hpp b/include/cute/arch/copy_xe.hpp index eab804619a..6dd696e06a 100644 --- a/include/cute/arch/copy_xe.hpp +++ b/include/cute/arch/copy_xe.hpp @@ -211,12 +211,12 @@ struct XE_2D_U16x16x16x2x1_LD_N int height, int pitch, int2_ coord, T *dst) { #if defined(ARCH_PVC_ACTIVATED) - static_assert(sizeof(T) == 2, "Expected T to have size 2"); - uint16 tmp = __builtin_IB_subgroup_block_read_flat_u32_m16k16v1( - long(baseoffset), width - 1, height - 1, pitch - 1, coord); - *(uint16 *)dst = *reinterpret_cast(&tmp); + static_assert(sizeof(T) == 2, "Expected T to have size 2"); + uint16 tmp = __builtin_IB_subgroup_block_read_flat_u32_m16k16v1( + long(baseoffset), width - 1, height - 1, pitch - 1, coord); + *(uint16 *)dst = *reinterpret_cast(&tmp); #else - CUTE_INVALID_CONTROL_PATH("Trying to use block loads on non-PVC hardware") + CUTE_INVALID_CONTROL_PATH("Trying to use block loads on non-PVC hardware") #endif } };