@@ -2799,7 +2799,11 @@ static void init_qd8_f16_qc8w_gemm_config(void) {
2799
2799
qd8_f16_qc8w_gemm_config .pack_weights_and_biases = NULL ; // Override the default packing function.
2800
2800
qd8_f16_qc8w_gemm_config .packed_stride_weights_and_biases = NULL ; // Override the default packing function.
2801
2801
qd8_f16_qc8w_gemm_config .pack_gemm_gio = (xnn_packw_gemm_gio_ukernel_fn ) xnn_pack_qs8_gemm_gio_w ;
2802
+ #if XNN_ENABLE_AVX256VNNI
2802
2803
qd8_f16_qc8w_gemm_config .pack_gemm_goi = (xnn_packw_gemm_goi_ukernel_fn ) xnn_qs8_packw_gemm_goi_ukernel_x64c4__avx256vnni_prfm ;
2804
+ #else
2805
+ qd8_f16_qc8w_gemm_config .pack_gemm_goi = (xnn_packw_gemm_goi_ukernel_fn ) xnn_pack_qs8_gemm_goi_w ;
2806
+ #endif
2803
2807
qd8_f16_qc8w_gemm_config .mr = 16 ;
2804
2808
qd8_f16_qc8w_gemm_config .nr = 64 ;
2805
2809
qd8_f16_qc8w_gemm_config .log2_kr = 2 ;
@@ -3389,7 +3393,11 @@ static void init_qd8_f32_qc8w_gemm_config(void) {
3389
3393
qd8_f32_qc8w_gemm_config .pack_weights_and_biases = NULL ; // Override the default packing function.
3390
3394
qd8_f32_qc8w_gemm_config .packed_stride_weights_and_biases = NULL ; // Override the default packing function.
3391
3395
qd8_f32_qc8w_gemm_config .pack_gemm_gio = (xnn_packw_gemm_gio_ukernel_fn ) xnn_pack_qs8_gemm_gio_w ;
3396
+ #if XNN_ENABLE_AVX256VNNI
3392
3397
qd8_f32_qc8w_gemm_config .pack_gemm_goi = (xnn_packw_gemm_goi_ukernel_fn ) xnn_qs8_packw_gemm_goi_ukernel_x64c4__avx256vnni_prfm ;
3398
+ #else
3399
+ qd8_f32_qc8w_gemm_config .pack_gemm_goi = (xnn_packw_gemm_goi_ukernel_fn ) xnn_pack_qs8_gemm_goi_w ;
3400
+ #endif
3393
3401
qd8_f32_qc8w_gemm_config .mr = 16 ;
3394
3402
qd8_f32_qc8w_gemm_config .nr = 64 ;
3395
3403
qd8_f32_qc8w_gemm_config .log2_kr = 2 ;
@@ -4089,7 +4097,11 @@ static void init_qs8_qc8w_gemm_config(void) {
4089
4097
qs8_qc8w_gemm_config .pack_weights_and_biases = NULL ; // Override the default packing function.
4090
4098
qs8_qc8w_gemm_config .packed_stride_weights_and_biases = NULL ; // Override the default packing function.
4091
4099
qs8_qc8w_gemm_config .pack_gemm_gio = (xnn_packw_gemm_gio_ukernel_fn ) xnn_pack_qs8_gemm_gio_w ;
4100
+ #if XNN_ENABLE_AVX256VNNI
4092
4101
qs8_qc8w_gemm_config .pack_gemm_goi = (xnn_packw_gemm_goi_ukernel_fn ) xnn_qs8_packw_gemm_goi_ukernel_x64c4__avx256vnni_prfm ;
4102
+ #else
4103
+ qs8_qc8w_gemm_config .pack_gemm_goi = (xnn_packw_gemm_goi_ukernel_fn ) xnn_pack_qs8_gemm_goi_w ;
4104
+ #endif
4093
4105
qs8_qc8w_gemm_config .pack_igemm_goki = (xnn_pack_conv_goki_w_fn ) xnn_pack_qs8_conv_goki_w ;
4094
4106
qs8_qc8w_gemm_config .pack_igemm_kgo = (xnn_pack_conv_kgo_w_fn ) xnn_pack_qs8_conv_kgo_w ;
4095
4107
qs8_qc8w_gemm_config .pack_deconv_goki = (xnn_pack_deconv_goki_w_fn ) xnn_pack_qs8_deconv_goki_w ;
0 commit comments