We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f82148b, commit 4e29b77 (Copy full SHA for 4e29b77)
src/cpu/x64/jit_uni_dw_conv_kernel_f32.cpp
@@ -844,6 +844,8 @@ void jit_uni_dw_conv_bwd_data_kernel_f32<isa>::apply_postprocess(int ur_ch_block
844
const auto &p = attr_.post_ops_;
845
std::size_t post_ops_data_offset = 0;
846
int depthwise_inj_idx = 0;
847
+ base_post_ops_data_offset += reg64_size;
848
+ push(reg_d_weights);
849
for (int i = 0; i < p.len(); i++) {
850
auto& post_op = p.entry_[i];
851
if (post_op.is_depthwise()) {
@@ -864,6 +866,8 @@ void jit_uni_dw_conv_bwd_data_kernel_f32<isa>::apply_postprocess(int ur_ch_block
864
866
depthwise_inj_idx++;
865
867
}
868
869
+ pop(reg_d_weights);
870
+ base_post_ops_data_offset -= reg64_size;
871
872
873
template <cpu_isa_t isa>
0 commit comments