From 0678c20a08e1d7e804876eb810cd26af6d29e9a0 Mon Sep 17 00:00:00 2001 From: Mehdi Goli Date: Fri, 26 Apr 2024 17:50:43 +0100 Subject: [PATCH] Update include/cute/arch/copy_xe.hpp Co-authored-by: Atharva Dubey --- include/cute/arch/copy_xe.hpp | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/include/cute/arch/copy_xe.hpp b/include/cute/arch/copy_xe.hpp index eab804619..6dd696e06 100644 --- a/include/cute/arch/copy_xe.hpp +++ b/include/cute/arch/copy_xe.hpp @@ -211,12 +211,12 @@ struct XE_2D_U16x16x16x2x1_LD_N int height, int pitch, int2_ coord, T *dst) { #if defined(ARCH_PVC_ACTIVATED) - static_assert(sizeof(T) == 2, "Expected T to have size 2"); - uint16 tmp = __builtin_IB_subgroup_block_read_flat_u32_m16k16v1( - long(baseoffset), width - 1, height - 1, pitch - 1, coord); - *(uint16 *)dst = *reinterpret_cast(&tmp); + static_assert(sizeof(T) == 2, "Expected T to have size 2"); + uint16 tmp = __builtin_IB_subgroup_block_read_flat_u32_m16k16v1( + long(baseoffset), width - 1, height - 1, pitch - 1, coord); + *(uint16 *)dst = *reinterpret_cast(&tmp); #else - CUTE_INVALID_CONTROL_PATH("Trying to use block loads on non-PVC hardware") + CUTE_INVALID_CONTROL_PATH("Trying to use block loads on non-PVC hardware") #endif } };