We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 04c22c9, commit fcc7e5e (full SHA for fcc7e5e)
1 file changed
src/cpu/x64/jit_brgemm_conv_utils.cpp
@@ -610,7 +610,9 @@ status_t brg_blocking_t::estimate_brgemm_ur() {
610
= exec_type == exec_trans && ic_block % simd_w == 0 && !is_xf32
611
? simd_w
612
: vnni_block;
613
- K_tail = kh_koef * rnd_up(ic % ic_block, ic_ceil);
+ K_tail = kh_koef
614
+ * (exec_type == exec_trans ? rnd_up(ic % ic_block, ic_ceil)
615
+ : (ic % ic_block));
616
}
617
618
const auto vK = K > 0 ? K : K_tail;
0 commit comments