@@ -56,6 +56,25 @@ struct deconv_eltw_test_params {
56
56
size_t expected_not_fused_primitives;
57
57
};
58
58
59
+ struct deconv_new_shape_infer_test_params {
60
+ ov::PartialShape in_shape;
61
+ ov::PartialShape out_shape;
62
+ ov::PartialShape kernel;
63
+ ov::Strides stride;
64
+ ov::CoordinateDiff pad;
65
+ ov::Strides dilation;
66
+ uint32_t groups;
67
+ data_types data_type;
68
+ format input_format;
69
+ data_types weights_type;
70
+ format weights_format;
71
+ data_types default_type;
72
+ format default_format;
73
+ size_t expected_fused_primitives;
74
+ size_t expected_fused_primitives_onednn;
75
+ size_t expected_not_fused_primitives;
76
+ };
77
+
59
78
class DeconvolutionFusingTest : public ::BaseFusingTest<deconv_test_params> {
60
79
public:
61
80
void execute (deconv_test_params& p, bool is_caching_test = false ) {
@@ -94,6 +113,60 @@ class DeconvolutionFusingTest : public ::BaseFusingTest<deconv_test_params> {
94
113
}
95
114
};
96
115
116
+ class DeconvolutionFusingNewShapeInferTest : public ::BaseFusingTest<deconv_new_shape_infer_test_params> {
117
+ public:
118
+ void SetUp () override {
119
+ rg.set_seed (GET_SUITE_NAME);
120
+ cfg_fused = get_test_default_config (engine);
121
+ cfg_not_fused = get_test_default_config (engine);
122
+
123
+ cfg_fused.set_property (ov::intel_gpu::optimize_data (true ));
124
+ cfg_fused.set_property (ov::intel_gpu::allow_new_shape_infer (true ));
125
+ cfg_not_fused.set_property (ov::intel_gpu::optimize_data (false ));
126
+ cfg_not_fused.set_property (ov::intel_gpu::allow_new_shape_infer (true ));
127
+ cfg_not_fused.set_property (ov::intel_gpu::allow_static_input_reorder (true ));
128
+ }
129
+
130
+ void execute (deconv_new_shape_infer_test_params& p, bool is_caching_test = false ) {
131
+ execute (p, get_mem (get_input_layout (p)), is_caching_test);
132
+ }
133
+ void execute (deconv_new_shape_infer_test_params& p, cldnn::memory::ptr input_prim, bool is_caching_test = false ) {
134
+ if (engine.get_device_info ().supports_immad )
135
+ p.expected_fused_primitives = p.expected_fused_primitives_onednn ;
136
+
137
+ network::ptr network_not_fused = get_network (this ->engine , this ->topology_non_fused , cfg_not_fused, get_test_stream_ptr (cfg_not_fused), is_caching_test);
138
+ network::ptr network_fused = get_network (this ->engine , this ->topology_fused , cfg_fused, get_test_stream_ptr (cfg_fused), is_caching_test);
139
+ network_fused->set_input_data (" input" , input_prim);
140
+ network_not_fused->set_input_data (" input" , input_prim);
141
+
142
+ compare (*network_not_fused, *network_fused, p);
143
+ auto find_conv = [](primitive_info& p) -> bool {
144
+ if (p.original_id == " deconv" )
145
+ return true ;
146
+ return false ;
147
+ };
148
+
149
+ auto pi_fused = network_fused->get_primitives_info ();
150
+ auto info_fused = std::find_if (pi_fused.begin (), pi_fused.end (), find_conv);
151
+ if (info_fused != pi_fused.end ())
152
+ std::cout << " kernel: " << info_fused->kernel_id << std::endl;
153
+ }
154
+
155
+ layout get_input_layout (deconv_new_shape_infer_test_params& p) {
156
+ auto pad = p.pad ;
157
+ std::vector<int > pad_ = { 0 , 0 , static_cast <int >(pad[0 ]) };
158
+ return layout{ p.in_shape , p.data_type , p.input_format , padding{ pad_ } };
159
+ }
160
+
161
+ layout get_weights_layout (deconv_new_shape_infer_test_params& p) {
162
+ return layout{ p.kernel , p.weights_type , p.weights_format };
163
+ }
164
+
165
+ layout get_bias_layout (deconv_new_shape_infer_test_params& p) {
166
+ return layout{ ov::PartialShape{1 , static_cast <int64_t >(p.out_shape .get_shape ().at (1 )), 1 }, p.default_type , format::bfyx };
167
+ }
168
+ };
169
+
97
170
class ConvEltwTest : public ::BaseFusingTest<deconv_eltw_test_params> {
98
171
public:
99
172
@@ -147,6 +220,9 @@ class ConvEltwTest : public ::BaseFusingTest<deconv_eltw_test_params> {
147
220
#define CASE_DECONV_FP32_7 { 1 , 16 , 4 , 5 }, { 1 , 32 , 7 , 9 }, { 1 , 1 , 1 , 1 }, { 2 , 2 }, { 0 , 0 }, { 1 , 1 }, 1 , data_types::f32, format::b_fs_yx_fsv16, data_types::f32, format::is_os_yx_isv16_osv16, data_types::f32, format::bfyx
148
221
#define CASE_DECONV_FP32_8 { 1 , 32 , 4 , 5 }, { 1 , 32 , 7 , 9 }, { 1 , 1 , 3 , 3 }, { 2 , 2 }, { 1 , 1 }, { 1 , 1 }, 32 , data_types::f32, format::b_fs_yx_fsv16, data_types::f32, format::gs_oiyx_gsv16, data_types::f32, format::bfyx
149
222
223
+ // 1D deconv
224
+ #define CASE_DECONV_1D_FP32_1 { 1 , 512 , 1500 }, { 1 , 256 , 12008 }, { 256 , 512 , 16 }, { 8 }, { 0 }, { 1 }, 1 , data_types::f32, format::bfyx, data_types::f32, format::oiyx, data_types::f32, format::bfyx
225
+
150
226
#define CASE_DECONV_FP16_1 { 1 , 15 , 4 , 5 }, { 1 , 30 , 6 , 7 }, { 1 , 1 , 3 , 3 }, { 1 , 1 }, { 0 , 0 }, { 1 , 1 }, 1 , data_types::f16, format::bfyx, data_types::f16, format::oiyx, data_types::f16, format::bfyx
151
227
#define CASE_DECONV_FP16_2 { 1 , 16 , 4 , 5 }, { 1 , 32 , 6 , 7 }, { 1 , 1 , 3 , 3 }, { 1 , 1 }, { 0 , 0 }, { 1 , 1 }, 1 , data_types::f16, format::b_fs_yx_fsv16, data_types::f16, format::is_os_yx_isv16_osv16, data_types::f16, format::bfyx
152
228
#define CASE_DECONV_FP16_3 { 1 , 16 , 4 , 5 }, { 1 , 32 , 4 , 5 }, { 1 , 1 , 1 , 1 }, { 1 , 1 }, { 0 , 0 }, { 1 , 1 }, 1 , data_types::f16, format::b_fs_yx_fsv16, data_types::f16, format::is_os_yx_isv16_osv16, data_types::f16, format::bfyx
@@ -390,6 +466,33 @@ INSTANTIATE_TEST_SUITE_P(fusings_gpu, deconv_bias, ::testing::ValuesIn(std::vect
390
466
deconv_test_params{ CASE_DECONV_S8S8_3D_3, 2 , 2 , 3 },
391
467
}));
392
468
469
+ class deconv_bias_1d : public DeconvolutionFusingNewShapeInferTest {};
470
+ TEST_P (deconv_bias_1d, basic) {
471
+ auto p = GetParam ();
472
+ create_topologies (
473
+ input_layout (" input" , get_input_layout (p)),
474
+ data (" weights" , get_mem (get_weights_layout (p))),
475
+ data (" bias" , get_mem (get_bias_layout (p))),
476
+ deconvolution (" deconv" , input_info (" input" ), { " weights" }, p.groups , p.stride , p.pad , p.dilation ),
477
+ eltwise (" bias_add" , { input_info (" deconv" ), input_info (" bias" ) }, eltwise_mode::sum),
478
+ reorder (" out" , input_info (" bias_add" ), p.default_format , data_types::f32)
479
+ );
480
+
481
+ if (engine.get_device_info ().supports_immad &&
482
+ p.default_type == data_types::f16 &&
483
+ p.weights_format == format::is_os_yx_isv16_osv16) {
484
+ GTEST_SKIP (); // Issue: 94154
485
+ }
486
+
487
+ // Need much higher tolerance because of deconvolution -> convolution optimization
488
+ tolerance = 1 .f ;
489
+ execute (p);
490
+ }
491
+
492
+ INSTANTIATE_TEST_SUITE_P (fusings_gpu, deconv_bias_1d, ::testing::ValuesIn(std::vector<deconv_new_shape_infer_test_params>{
493
+ deconv_new_shape_infer_test_params{ CASE_DECONV_1D_FP32_1, 2 , 2 , 3 },
494
+ }));
495
+
393
496
class deconv_scale : public DeconvolutionFusingTest {};
394
497
TEST_P (deconv_scale, basic) {
395
498
auto p = GetParam ();
0 commit comments