Skip to content

Commit 569acc3

Browse files
committed
fix issue
1 parent dc37dd6 commit 569acc3

1 file changed

Lines changed: 2 additions & 2 deletions

File tree

include/mscclpp/gpu_data_types.hpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1268,8 +1268,8 @@ MSCCLPP_DEVICE_INLINE f8_e4m3b15x4 to<f8_e4m3b15x4, f32x4>(const f32x4& v) {
1268 1268
return to<f8_e4m3b15x4, f16x4>(h);
1269 1269
#elif defined(MSCCLPP_DEVICE_HIP) && defined(__gfx942__)
1270 1270
f16x4 h;
1271-
h.words[0] = __builtin_bit_cast(uint32_t, __builtin_amdgcn_cvt_pkrtz(v.data[0], v.data[1]));
1272-
h.words[1] = __builtin_bit_cast(uint32_t, __builtin_amdgcn_cvt_pkrtz(v.data[2], v.data[3]));
1271+
h.words[0] = __builtin_bit_cast(uint32_t, __floats2half2_rn(v.data[0], v.data[1]));
1272+
h.words[1] = __builtin_bit_cast(uint32_t, __floats2half2_rn(v.data[2], v.data[3]));
1273 1273
return to<f8_e4m3b15x4, f16x4>(h);
1274 1274
#else
1275 1275
f8_e4m3b15x4 result;

0 commit comments

Comments
 (0)