We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent d5e879b commit ec49a98 (Copy full SHA for ec49a98)
src/cpu/x64/matmul/brgemm_matmul_utils.cpp
@@ -1672,9 +1672,7 @@ float matmul_amx_blocking_params_t::get_thread_balance_scores() {
1672
// returns score for current blocking parameters' values in range [0, 1]
1673
// for copied data reusage
1674
float matmul_amx_blocking_params_t::get_copied_data_reusage_scores() {
1675
- // Values based on measured performance
1676
- const bool is_lda_4k = (current_lda_ * a_dt_sz) % 4096 == 0;
1677
- const dim_t effective_m_chunk_sz = 64 * (is_lda_4k ? 1 : 4);
+ const dim_t effective_m_chunk_sz = 64 * 4;
1678
const dim_t desired_M_chunk_size = is_runtime_M
1679
? effective_m_chunk_sz
1680
: nstl::min(M, effective_m_chunk_sz);
0 commit comments