@@ -215,7 +215,7 @@ void jit_avx512_common_convolution_fwd_t<src_type, wei_type,
215
215
start_copy = start;
216
216
217
217
auto par_conv = jit_conv_call_s ();
218
- size_t src_c_stride = src_d.blk_off (0 , 1 );
218
+ size_t src_c_stride = src_d.blk_off (0 , 1 ) - src_d. off_l ( 0 ) ;
219
219
size_t wht_ic_stride = wht_blk_off (weights_d, 0 , 0 , 1 );
220
220
221
221
for (int icb_l2 = 0 ; icb_l2 < jcp.nb_ic ; icb_l2 += jcp.nb_ic_L2 ) {
@@ -338,9 +338,9 @@ void jit_avx512_common_convolution_fwd_t<src_type, wei_type,
338
338
start_copy = start;
339
339
340
340
auto par_conv = jit_conv_call_s ();
341
- size_t src_h_stride = src_d.blk_off (0 , 0 , 1 );
342
- size_t src_c_stride = src_d.blk_off (0 , 1 );
343
- size_t dst_h_stride = dst_d.blk_off (0 , 0 , 1 );
341
+ size_t src_h_stride = src_d.blk_off (0 , 0 , 1 ) - src_d. off_l ( 0 ) ;
342
+ size_t src_c_stride = src_d.blk_off (0 , 1 ) - src_d. off_l ( 0 ) ;
343
+ size_t dst_h_stride = dst_d.blk_off (0 , 0 , 1 ) - dst_d. off_l ( 0 ) ;
344
344
size_t wht_h_stride = wht_blk_off (weights_d, 0 , 0 , 0 , 1 );
345
345
size_t wht_ic_stride = wht_blk_off (weights_d, 0 , 0 , 1 );
346
346
@@ -495,10 +495,10 @@ void jit_avx512_common_convolution_fwd_t<src_type, wei_type,
495
495
start_copy = start;
496
496
497
497
auto par_conv = jit_conv_call_s ();
498
- size_t src_d_stride = src_d.blk_off (0 , 0 , 1 );
499
- size_t src_h_stride = src_d.blk_off (0 , 0 , 0 , 1 );
500
- size_t src_c_stride = src_d.blk_off (0 , 1 );
501
- size_t dst_h_stride = dst_d.blk_off (0 , 0 , 0 , 1 );
498
+ size_t src_d_stride = src_d.blk_off (0 , 0 , 1 ) - src_d. off_l ( 0 ) ;
499
+ size_t src_h_stride = src_d.blk_off (0 , 0 , 0 , 1 ) - src_d. off_l ( 0 ) ;
500
+ size_t src_c_stride = src_d.blk_off (0 , 1 ) - src_d. off_l ( 0 ) ;
501
+ size_t dst_h_stride = dst_d.blk_off (0 , 0 , 0 , 1 ) - dst_d. off_l ( 0 ) ;
502
502
size_t wht_d_stride = wht_blk_off (weights_d, 0 , 0 , 0 , 1 );
503
503
size_t wht_h_stride = wht_blk_off (weights_d, 0 , 0 , 0 , 0 , 1 );
504
504
size_t wht_ic_stride = wht_blk_off (weights_d, 0 , 0 , 1 );
@@ -653,7 +653,7 @@ void jit_avx512_common_convolution_bwd_data_t<diff_dst_type, wei_type,
653
653
start_copy = start;
654
654
655
655
auto par_conv = jit_conv_call_s ();
656
- size_t diff_dst_c_stride = diff_dst_d.blk_off (0 , 1 );
656
+ size_t diff_dst_c_stride = diff_dst_d.blk_off (0 , 1 ) - diff_dst_d. off_l ( 0 ) ;
657
657
size_t wht_oc_stride = wht_blk_off (weights_d, 0 , 1 );
658
658
659
659
for (int ocb_l2 = 0 ; ocb_l2 < jcp.nb_oc ; ocb_l2 += jcp.nb_oc_L2 ) {
@@ -762,9 +762,9 @@ void jit_avx512_common_convolution_bwd_data_t<diff_dst_type, wei_type,
762
762
start_copy = start;
763
763
764
764
auto par_conv = jit_conv_call_s ();
765
- size_t diff_src_h_stride = diff_src_d.blk_off (0 , 0 , 1 );
766
- size_t diff_dst_h_stride = diff_dst_d.blk_off (0 , 0 , 1 );
767
- size_t diff_dst_c_stride = diff_dst_d.blk_off (0 , 1 );
765
+ size_t diff_src_h_stride = diff_src_d.blk_off (0 , 0 , 1 ) - diff_src_d. off_l ( 0 ) ;
766
+ size_t diff_dst_h_stride = diff_dst_d.blk_off (0 , 0 , 1 ) - diff_dst_d. off_l ( 0 ) ;
767
+ size_t diff_dst_c_stride = diff_dst_d.blk_off (0 , 1 ) - diff_dst_d. off_l ( 0 ) ;
768
768
size_t wht_h_stride = wht_blk_off (weights_d, 0 , 0 , 0 , 1 );
769
769
size_t wht_oc_stride = wht_blk_off (weights_d, 0 , 1 );
770
770
@@ -923,11 +923,11 @@ void jit_avx512_common_convolution_bwd_data_t<diff_dst_type, wei_type,
923
923
start_copy = start;
924
924
925
925
auto par_conv = jit_conv_call_s ();
926
- size_t diff_src_h_stride = diff_src_d.blk_off (0 , 0 , 0 , 1 );
927
- size_t diff_src_d_stride = diff_src_d.blk_off (0 , 0 , 1 );
928
- size_t diff_dst_h_stride = diff_dst_d.blk_off (0 , 0 , 0 , 1 );
929
- size_t diff_dst_d_stride = diff_dst_d.blk_off (0 , 0 , 1 );
930
- size_t diff_dst_c_stride = diff_dst_d.blk_off (0 , 1 );
926
+ size_t diff_src_h_stride = diff_src_d.blk_off (0 , 0 , 0 , 1 ) - diff_src_d. off_l ( 0 ) ;
927
+ size_t diff_src_d_stride = diff_src_d.blk_off (0 , 0 , 1 ) - diff_src_d. off_l ( 0 ) ;
928
+ size_t diff_dst_h_stride = diff_dst_d.blk_off (0 , 0 , 0 , 1 ) - diff_dst_d. off_l ( 0 ) ;
929
+ size_t diff_dst_d_stride = diff_dst_d.blk_off (0 , 0 , 1 ) - diff_dst_d. off_l ( 0 ) ;
930
+ size_t diff_dst_c_stride = diff_dst_d.blk_off (0 , 1 ) - diff_dst_d. off_l ( 0 ) ;
931
931
size_t wht_h_stride = wht_blk_off (weights_d, 0 , 0 , 0 , 0 , 1 );
932
932
size_t wht_d_stride = wht_blk_off (weights_d, 0 , 0 , 0 , 1 );
933
933
size_t wht_oc_stride = wht_blk_off (weights_d, 0 , 1 );
0 commit comments