Skip to content

Commit e68a04a

Browse files
committed
[CPU] enable f16 dst for s8/u8 inputs in fc
1 parent 268b02c commit e68a04a

File tree

2 files changed

+6
-2
lines changed

2 files changed

+6
-2
lines changed

src/plugins/intel_cpu/src/nodes/executors/fullyconnected_implementations.cpp

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -86,8 +86,12 @@ static const TypeMapping dnnlFCTypeMapping {
8686
{{_bf16, _f16, _any, _any}, {bypass(), bypass(), use<0>(), use<0>()}},
8787
{{_f16, _bf16, _any, _any}, {bypass(), bypass(), use<0>(), use<0>()}},
8888
// quantization configuration
89-
// int8 inner_product does not support f16 output and bias
89+
// int8 inner_product does not support f16 bias; f16 output is supported only on X86_64 platforms
90+
#if defined(OPENVINO_ARCH_X86_64)
91+
{{_u8 | _i8, _i8, _u8 | _i8 | _i32 | _bf16 | _f32 | _dynamic, _u8 | _i8 | _i32 | _bf16 | _f16 | _f32}, {bypass(), bypass(), bypass(), bypass()}},
92+
#else
9093
{{_u8 | _i8, _i8, _u8 | _i8 | _i32 | _bf16 | _f32 | _dynamic, _u8 | _i8 | _i32 | _bf16 | _f32}, {bypass(), bypass(), bypass(), bypass()}},
94+
#endif
9195
{{_u8 | _i8, _i8, _f16, _u8 | _i8 | _i32 | _bf16 | _f32}, {bypass(), bypass(), just<f32>(), bypass()}},
9296
{{_u8 | _i8, _i8, _any, _any}, {bypass(), bypass(), just<f32>(), just<f32>()}},
9397
// compresses int weights (@todo more strict requirements for output precision?)

0 commit comments

Comments
 (0)