Skip to content

Commit

Permalink
Update include/cute/arch/copy_xe.hpp
Browse files: browse the repository at this point in the history.
Co-authored-by: Atharva Dubey <[email protected]>
  • Loading branch information
mehdi-goli and AD2605 authored Apr 26, 2024
1 parent 71e8b8c commit 0678c20
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions include/cute/arch/copy_xe.hpp
Original file line number Diff line number Diff line change
Expand Up
@@ -211,12 +211,12 @@ struct XE_2D_U16x16x16x2x1_LD_N
int height, int pitch, int2_ coord,
T *dst) {
#if defined(ARCH_PVC_ACTIVATED)
static_assert(sizeof(T) == 2, "Expected T to have size 2");
uint16 tmp = __builtin_IB_subgroup_block_read_flat_u32_m16k16v1(
long(baseoffset), width - 1, height - 1, pitch - 1, coord);
*(uint16 *)dst = *reinterpret_cast<uint16 *>(&tmp);
static_assert(sizeof(T) == 2, "Expected T to have size 2");
uint16 tmp = __builtin_IB_subgroup_block_read_flat_u32_m16k16v1(
long(baseoffset), width - 1, height - 1, pitch - 1, coord);
*(uint16 *)dst = *reinterpret_cast<uint16 *>(&tmp);
#else
CUTE_INVALID_CONTROL_PATH("Trying to use block loads on non-PVC hardware")
CUTE_INVALID_CONTROL_PATH("Trying to use block loads on non-PVC hardware")
#endif
}
};
Expand Down

0 comments on commit 0678c20

Please sign in to comment.