Skip to content

Commit 93655de

Browse files
committed
cpu: x64: binary injector: add rhs_addr_cache_reg to forked/diverged kernels
1 parent 4a49ca7 commit 93655de

File tree

3 files changed

+3
-3
lines changed

3 files changed

+3
-3
lines changed

src/cpu/x64/jit_avx512_core_fork_bf16_dw_conv_kernel.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -591,7 +591,7 @@ void jit_avx512_fork_dw_conv_fwd_kernel_bf16::generate() {
591 591   % (cpu_isa_traits<avx512_core>::vlen / sizeof(float));
592 592   static constexpr bool use_exact_tail_scalar_bcast = false;
593 593   const binary_injector::rhs_arg_static_params_t rhs_sp {
594     - helper_vmm_idx, r10, r11, preserve_gpr,
    594 + helper_vmm_idx, r10, r11, r12, preserve_gpr,
595 595   preserve_vmm, GET_OFF(post_ops_binary_rhs_arg_vec),
596 596   GET_OFF(dst_orig), memory_desc_wrapper(&dst_md_),
597 597   tail_size, k_oc_tail_mask, use_exact_tail_scalar_bcast};

src/cpu/x64/jit_gemm_convolution_utils.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -66,7 +66,7 @@ struct jit_pp_kernel_t : pp_kernel_t, public jit_generator {
66 66   static constexpr size_t tail_size = 0;
67 67   static constexpr bool use_exact_tail_scalar_bcast = false;
68 68   const binary_injector::rhs_arg_static_params_t rhs_sp {
69    - helper_vmm_idx, r13, r14, preserve_gpr,
   69 + helper_vmm_idx, r13, r14, r15, preserve_gpr,
70 70   preserve_vmm, PARAM_OFF(post_ops_binary_rhs_arg_vec),
71 71   PARAM_OFF(dst_orig), memory_desc_wrapper(pd->dst_md()),
72 72   tail_size, kreg_rem_mask, use_exact_tail_scalar_bcast};

src/cpu/x64/jit_uni_fork_dw_conv_kernel_f32.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -772,7 +772,7 @@ void jit_uni_fork_dw_conv_fwd_kernel_f32<isa>::generate() {
772 772   % (cpu_isa_traits<isa>::vlen / sizeof(float));
773 773   static constexpr bool use_exact_tail_scalar_bcast = false;
774 774   const binary_injector::rhs_arg_static_params_t rhs_sp {
775     - helper_vmm_idx, r10, r11, preserve_gpr,
    775 + helper_vmm_idx, r10, r11, r12, preserve_gpr,
776 776   preserve_vmm, GET_OFF(post_ops_binary_rhs_arg_vec),
777 777   GET_OFF(dst_orig), memory_desc_wrapper(&dst_md_),
778 778   tail_size, k_oc_tail_mask, use_exact_tail_scalar_bcast};

0 commit comments

Comments
 (0)