Skip to content

Commit 00c3465

Browse files
author
dmitrygo
committed
[FORK][FIX] Restore choose_loop_order logic for weights decompression case
1 parent dc69ce5 commit 00c3465

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

src/cpu/x64/jit_brgemm_inner_product_utils.cpp

+2 -1
Original file line number | Diff line number | Diff line change
@@ -1885,7 +1885,8 @@ void jit_brgemm_ip_fwd_conf_t::choose_loop_order() {
18851885
const bool is_int8 = one_of(src_dt, u8, s8) && wei_dt == s8;
18861886
const bool is_compute_amx = (is_xf16 || is_int8) && is_amx;
18871887

1888-
if ((os_block < 32 || do_occ_osc) && (is_compute_amx || is_f32_avx2))
1888+
// Better to keep ocb loop outermost for weights_decompression case due to overhead on weights unpack into intermediate buffer
1889+
if ((os_block < 32 || do_occ_osc) && (is_compute_amx || is_f32_avx2) && !weights_decompression)
18891890
loop_order = icc_occ_osc_ocb_osb;
18901891
}
18911892

0 commit comments

Comments
 (0)