Skip to content

Commit 36a1036

Browse files
[FORK][FIX] Limit microkernel unrolling factor
[FORK][FEATURE] DQ IP: performance enhancements
1 parent 0bbc7a7 commit 36a1036

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

src/cpu/x64/brgemm/jit_brgemm_kernel.cpp

+2-1
Original file line numberDiff line numberDiff line change
@@ -3130,7 +3130,8 @@ void jit_brgemm_kernel_t<Wmm>::ldb_loop(int bd_block2, bool is_bdb_tail,
31303130
}
31313131
rdb_group = rdb_group / brg.rd_block;
31323132
auto rbd_blocks = brg.rdb / rdb_group;
3133-
auto max_rdb_unroll = 8;
3133+
// unrolling is limited to prevent exceeding L1i cache
3134+
auto max_rdb_unroll = brg.with_src_dyn_quant ? 8 : 2;
31343135

31353136
if (brg.with_wei_decomp && rdb_group <= max_rdb_unroll) {
31363137
if (rbd_blocks > 0) {

0 commit comments

Comments
 (0)