Skip to content

Commit fcc7e5e

Browse files
committed
x64: brgemm conv: fix K_tail calculation
1 parent 04c22c9 commit fcc7e5e

1 file changed

Lines changed: 3 additions & 1 deletion

File tree

src/cpu/x64/jit_brgemm_conv_utils.cpp

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -610,7 +610,9 @@ status_t brg_blocking_t::estimate_brgemm_ur() {
  = exec_type == exec_trans && ic_block % simd_w == 0 && !is_xf32
  ? simd_w
  : vnni_block;
- K_tail = kh_koef * rnd_up(ic % ic_block, ic_ceil);
+ K_tail = kh_koef
+ * (exec_type == exec_trans ? rnd_up(ic % ic_block, ic_ceil)
+ : (ic % ic_block));
  }
 
  const auto vK = K > 0 ? K : K_tail;

0 commit comments

Comments
 (0)