Skip to content

Commit 70231ac

Browse files
annop-w authored and densamoilov committed
cpu: aarch64: Add key_generic_acc to booking scratchpad for dst_acc
1 parent af32908 commit 70231ac

10 files changed

+11 -10 lines changed

src/common/memory_tracking.hpp

+1
Original file line number | Diff line number | Diff line change
@@ -227,6 +227,7 @@ enum {
227227
key_gemm_blocked_a,
228228
key_gemm_blocked_b,
229229
key_gemm_accumulator,
230+
key_generic_acc,
230231
key_gnorm_cvt,
231232
key_gnorm_reduction,
232233
key_gnorm_tmp_mean,

src/cpu/aarch64/acl_convolution_utils.hpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -104,7 +104,7 @@ status_t execute_forward_conv_acl(
104104
// If we have an unfused sum post op, put the result in a scratchpad tensor.
105105
// Result will be summed to the dst during acl_post_ops.execute
106106
auto dst_base = use_dst_acc_for_sum
107-
? scratchpad.get<void>(memory_tracking::names::key_none)
107+
? scratchpad.get<void>(memory_tracking::names::key_generic_acc)
108108
: CTX_OUT_MEM(dst_data_t *, DNNL_ARG_DST);
109109
acl_conv_obj.dst_tensor.allocator()->import_memory(dst_base);
110110

src/cpu/aarch64/acl_deconvolution.cpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ status_t acl_deconvolution_fwd_t::execute_forward(const exec_ctx_t &ctx) const {
3737
// If we have an unfused sum post op, put the result in a scratchpad tensor.
3838
// Result will be summed to the dst during acl_post_ops.execute
3939
auto dst_base = use_dst_acc_for_sum
40-
? scratchpad.get<void>(memory_tracking::names::key_none)
40+
? scratchpad.get<void>(memory_tracking::names::key_generic_acc)
4141
: CTX_OUT_MEM(void *, DNNL_ARG_DST);
4242

4343
// Retrieve primitive resource and configured Compute Library objects

src/cpu/aarch64/acl_deconvolution.hpp

+2-2
Original file line number | Diff line number | Diff line change
@@ -89,7 +89,7 @@ struct acl_deconvolution_fwd_t : public primitive_t {
8989
, post_ops() {}
9090

9191
DECLARE_COMMON_PD_T(
92-
"acl:deconv", acl_deconvolution_fwd_t, USE_GLOBAL_SCRATCHPAD);
92+
"acl", acl_deconvolution_fwd_t, USE_GLOBAL_SCRATCHPAD);
9393

9494
status_t init(engine_t *engine) {
9595
using namespace data_type;
@@ -296,7 +296,7 @@ struct acl_deconvolution_fwd_t : public primitive_t {
296296

297297
if (acl_pd_conf.use_dst_acc_for_sum) {
298298
auto scratchpad = scratchpad_registry().registrar();
299-
scratchpad.book(memory_tracking::names::key_none,
299+
scratchpad.book(memory_tracking::names::key_generic_acc,
300300
dst_d.nelems(), dst_d.data_type_size());
301301
}
302302

src/cpu/aarch64/acl_depthwise_convolution.hpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -99,7 +99,7 @@ struct acl_depthwise_convolution_fwd_t : public primitive_t {
9999
if (acp_.use_dst_acc_for_sum) {
100100
const memory_desc_wrapper dst_d(&dst_md_);
101101
auto scratchpad = scratchpad_registry().registrar();
102-
scratchpad.book(memory_tracking::names::key_none,
102+
scratchpad.book(memory_tracking::names::key_generic_acc,
103103
dst_d.nelems(), dst_d.data_type_size());
104104
}
105105

src/cpu/aarch64/acl_gemm_convolution.hpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ struct acl_gemm_convolution_fwd_t : public primitive_t {
9494
if (acp_.use_dst_acc_for_sum) {
9595
const memory_desc_wrapper dst_d(&dst_md_);
9696
auto scratchpad = scratchpad_registry().registrar();
97-
scratchpad.book(memory_tracking::names::key_none,
97+
scratchpad.book(memory_tracking::names::key_generic_acc,
9898
dst_d.nelems(), dst_d.data_type_size());
9999
}
100100

src/cpu/aarch64/acl_indirect_gemm_convolution.hpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -103,7 +103,7 @@ struct acl_indirect_gemm_convolution_fwd_t : public primitive_t {
103103
if (acp_.use_dst_acc_for_sum) {
104104
const memory_desc_wrapper dst_d(&dst_md_);
105105
auto scratchpad = scratchpad_registry().registrar();
106-
scratchpad.book(memory_tracking::names::key_none,
106+
scratchpad.book(memory_tracking::names::key_generic_acc,
107107
dst_d.nelems(), dst_d.data_type_size());
108108
}
109109

src/cpu/aarch64/acl_inner_product.cpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@ status_t acl_inner_product_fwd_t::execute_forward(const exec_ctx_t &ctx) const {
4646
// If we have an unfused sum post op, put the result in a scratchpad tensor.
4747
// Result will be summed to the dst during acl_post_ops.execute
4848
auto dst_base = use_dst_acc_for_sum
49-
? scratchpad.get<void>(memory_tracking::names::key_none)
49+
? scratchpad.get<void>(memory_tracking::names::key_generic_acc)
5050
: CTX_OUT_MEM(void *, DNNL_ARG_DST);
5151
acl_obj.dst_tensor.allocator()->import_memory(dst_base);
5252

src/cpu/aarch64/acl_inner_product.hpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -121,7 +121,7 @@ struct acl_inner_product_fwd_t : public primitive_t {
121121
if (aip.use_dst_acc_for_sum) {
122122
const memory_desc_wrapper dst_d(&dst_md_);
123123
auto scratchpad = scratchpad_registry().registrar();
124-
scratchpad.book(memory_tracking::names::key_none,
124+
scratchpad.book(memory_tracking::names::key_generic_acc,
125125
dst_d.nelems(), dst_d.data_type_size());
126126
}
127127

src/cpu/aarch64/acl_winograd_convolution.hpp

+1-1
Original file line number | Diff line number | Diff line change
@@ -106,7 +106,7 @@ struct acl_wino_convolution_fwd_t : public primitive_t {
106106
if (acp_.use_dst_acc_for_sum) {
107107
const memory_desc_wrapper dst_d(&dst_md_);
108108
auto scratchpad = scratchpad_registry().registrar();
109-
scratchpad.book(memory_tracking::names::key_none,
109+
scratchpad.book(memory_tracking::names::key_generic_acc,
110110
dst_d.nelems(), dst_d.data_type_size());
111111
}
112112

0 commit comments

Comments (0)