1
1
/* ******************************************************************************
2
- * Copyright 2024- 2025 Intel Corporation
2
+ * Copyright 2025 Intel Corporation
3
3
*
4
4
* Licensed under the Apache License, Version 2.0 (the "License");
5
5
* you may not use this file except in compliance with the License.
@@ -40,16 +40,14 @@ namespace impl {
40
40
namespace graph {
41
41
namespace dnnl_impl {
42
42
43
- template <bool quantized>
44
- status_t sdp_primitive_v1_kernel_t <quantized>::compile_impl(
43
+ status_t sdp_primitive_v1_kernel_t::compile_impl (
45
44
const dnnl_partition_impl_t *part, const engine_t *g_engine,
46
45
const std::vector<logical_tensor_t > &inputs,
47
46
const std::vector<logical_tensor_t > &outputs) {
48
47
// sdp_primitive_v1_kernel_t only supports Intel GPU.
49
48
#if defined(DNNL_WITH_SYCL) && DNNL_GPU_VENDOR != DNNL_VENDOR_INTEL
50
49
return status::unimplemented;
51
50
#endif
52
- if (quantized) { return status::unimplemented; }
53
51
54
52
p_engine_ = make_dnnl_engine (*g_engine);
55
53
g_alloc_
@@ -110,8 +108,7 @@ status_t sdp_primitive_v1_kernel_t<quantized>::compile_impl(
110
108
return status::success;
111
109
}
112
110
113
- template <bool quantized>
114
- void sdp_primitive_v1_kernel_t <quantized>::prepare_args_set(
111
+ void sdp_primitive_v1_kernel_t::prepare_args_set (
115
112
const execution_args_set_t *res, const std::vector<tensor_t > &inputs,
116
113
const std::vector<tensor_t > &outputs, const scratchpad_t &scratchpad) {
117
114
// update the data of partition in/outputs args
@@ -131,9 +128,8 @@ void sdp_primitive_v1_kernel_t<quantized>::prepare_args_set(
131
128
}
132
129
}
133
130
134
- template <bool quantized>
135
- status_t sdp_primitive_v1_kernel_t <quantized>::execute_impl(
136
- const stream_t *g_stream, const std::vector<tensor_t > &inputs,
131
+ status_t sdp_primitive_v1_kernel_t::execute_impl (const stream_t *g_stream,
132
+ const std::vector<tensor_t > &inputs,
137
133
const std::vector<tensor_t > &outputs) {
138
134
dnnl::stream p_stream = make_dnnl_stream (p_engine_, *g_stream);
139
135
@@ -154,9 +150,8 @@ status_t sdp_primitive_v1_kernel_t<quantized>::execute_impl(
154
150
}
155
151
156
152
#ifdef DNNL_WITH_SYCL
157
- template <bool quantized>
158
- status_t sdp_primitive_v1_kernel_t <quantized>::sycl_execute_impl(
159
- const stream_t *g_stream, const std::vector<tensor_t > &inputs,
153
+ status_t sdp_primitive_v1_kernel_t::sycl_execute_impl (const stream_t *g_stream,
154
+ const std::vector<tensor_t > &inputs,
160
155
const std::vector<tensor_t > &outputs,
161
156
const std::vector<::sycl::event> &sycl_deps,
162
157
::sycl::event *sycl_event) {
@@ -193,9 +188,8 @@ status_t sdp_primitive_v1_kernel_t<quantized>::sycl_execute_impl(
193
188
#endif
194
189
195
190
#if DNNL_GPU_RUNTIME == DNNL_RUNTIME_OCL
196
- template <bool quantized>
197
- status_t sdp_primitive_v1_kernel_t <quantized>::ocl_execute_impl(
198
- const stream_t *g_stream, const std::vector<tensor_t > &inputs,
191
+ status_t sdp_primitive_v1_kernel_t::ocl_execute_impl (const stream_t *g_stream,
192
+ const std::vector<tensor_t > &inputs,
199
193
const std::vector<tensor_t > &outputs,
200
194
const std::vector<cl_event> &cl_deps, cl_event *ret_event) {
201
195
// sdp_primitive_v1_kernel_t only supports Intel GPU.
@@ -230,8 +224,7 @@ status_t sdp_primitive_v1_kernel_t<quantized>::ocl_execute_impl(
230
224
}
231
225
#endif
232
226
233
- template struct sdp_primitive_v1_kernel_t <false >;
234
- template struct sdp_primitive_v1_kernel_t <true >;
227
+ struct sdp_primitive_v1_kernel_t ;
235
228
236
229
} // namespace dnnl_impl
237
230
} // namespace graph
0 commit comments