File tree 2 files changed +38
-35
lines changed
tests/benchdnn/inputs/graph/complex_fusion
2 files changed +38
-35
lines changed Original file line number Diff line number Diff line change 17
17
--reset --dt=f32,bf16,f16 --case=complex_fusion/mha/sdpa-plain-implicit-causal-mask-fp32-bs1.json
18
18
# f16 inputs + f32 intermediates + f16 outputs
19
19
--reset --case=complex_fusion/mha/sdpa-plain-simplified-f16-f32.json
20
+ --reset --dt=1:f16+2:f16+3:f16+4:f16+6:f16+104:f16 --case=complex_fusion/mha/sdpa-plain-implicit-causal-mask-fp32-bs1.json
21
+
20
22
# bf16 inputs + f32 intermediates + bf16 outputs
21
23
--reset --dt=1:bf16+2:bf16+3:bf16+4:bf16+5:bf16+6:bf16+104:bf16 --case=complex_fusion/mha/sdpa-plain-simplified-f16-f32.json
24
+ --reset --dt=1:bf16+2:bf16+3:bf16+4:bf16+6:bf16+104:bf16 --case=complex_fusion/mha/sdpa-plain-implicit-causal-mask-fp32-bs1.json
22
25
23
26
# int8 graphs
24
27
--reset --case=complex_fusion/mha/MHA-GPT-inf-int8-bs1.json
Original file line number Diff line number Diff line change 1
1
{
2
- "version" : " 3.7 .0" ,
2
+ "version" : " 3.8 .0" ,
3
3
"engine_kind" : " cpu" ,
4
4
"fpmath_mode" : " strict" ,
5
5
"fpmath_mode_apply_to_int" : " false" ,
6
6
"input_ports" : [
7
- 0 ,
8
7
1 ,
9
- 3 ,
10
- 8 ,
11
- 11
8
+ 2 ,
9
+ 4 ,
10
+ 5 ,
11
+ 3
12
12
],
13
13
"output_ports" : [
14
- 12
14
+ 6
15
15
],
16
16
"graph" : [
17
17
{
30
30
},
31
31
"inputs" : [
32
32
{
33
- "id" : 0 ,
33
+ "id" : 1 ,
34
34
"dtype" : " f32" ,
35
35
"shape" : [
36
36
1 ,
48
48
"property_type" : " undef"
49
49
},
50
50
{
51
- "id" : 1 ,
51
+ "id" : 2 ,
52
52
"dtype" : " f32" ,
53
53
"shape" : [
54
54
1 ,
68
68
],
69
69
"outputs" : [
70
70
{
71
- "id" : 2 ,
71
+ "id" : 101 ,
72
72
"dtype" : " f32" ,
73
73
"shape" : [
74
74
1 ,
99
99
},
100
100
"inputs" : [
101
101
{
102
- "id" : 2 ,
102
+ "id" : 101 ,
103
103
"dtype" : " f32" ,
104
104
"shape" : [
105
105
1 ,
117
117
"property_type" : " undef"
118
118
},
119
119
{
120
- "id" : 3 ,
120
+ "id" : 4 ,
121
121
"dtype" : " f32" ,
122
122
"shape" : [
123
123
1
131
131
],
132
132
"outputs" : [
133
133
{
134
- "id" : 4 ,
134
+ "id" : 102 ,
135
135
"dtype" : " f32" ,
136
136
"shape" : [
137
137
1 ,
151
151
]
152
152
},
153
153
{
154
- "id" : 2 ,
154
+ "id" : 40 ,
155
155
"name" : " genindex_row" ,
156
156
"kind" : " GenIndex" ,
157
157
"attrs" : {
162
162
},
163
163
"inputs" : [
164
164
{
165
- "id" : 4 ,
165
+ "id" : 102 ,
166
166
"dtype" : " f32" ,
167
167
"shape" : [
168
168
1 ,
182
182
],
183
183
"outputs" : [
184
184
{
185
- "id" : 5 ,
185
+ "id" : 1021 ,
186
186
"dtype" : " s32" ,
187
187
"shape" : [
188
188
1 ,
202
202
]
203
203
},
204
204
{
205
- "id" : 3 ,
205
+ "id" : 41 ,
206
206
"name" : " genindex_col" ,
207
207
"kind" : " GenIndex" ,
208
208
"attrs" : {
213
213
},
214
214
"inputs" : [
215
215
{
216
- "id" : 4 ,
216
+ "id" : 102 ,
217
217
"dtype" : " f32" ,
218
218
"shape" : [
219
219
1 ,
233
233
],
234
234
"outputs" : [
235
235
{
236
- "id" : 6 ,
236
+ "id" : 1022 ,
237
237
"dtype" : " s32" ,
238
238
"shape" : [
239
239
1 ,
253
253
]
254
254
},
255
255
{
256
- "id" : 4 ,
256
+ "id" : 42 ,
257
257
"name" : " mask_greater_equal" ,
258
258
"kind" : " GreaterEqual" ,
259
259
"attrs" : {
264
264
},
265
265
"inputs" : [
266
266
{
267
- "id" : 5 ,
267
+ "id" : 1021 ,
268
268
"dtype" : " s32" ,
269
269
"shape" : [
270
270
1 ,
282
282
"property_type" : " undef"
283
283
},
284
284
{
285
- "id" : 6 ,
285
+ "id" : 1022 ,
286
286
"dtype" : " s32" ,
287
287
"shape" : [
288
288
1 ,
302
302
],
303
303
"outputs" : [
304
304
{
305
- "id" : 7 ,
305
+ "id" : 1023 ,
306
306
"dtype" : " boolean" ,
307
307
"shape" : [
308
308
1 ,
322
322
]
323
323
},
324
324
{
325
- "id" : 5 ,
325
+ "id" : 2 ,
326
326
"name" : " Select" ,
327
327
"kind" : " Select" ,
328
328
"attrs" : {
333
333
},
334
334
"inputs" : [
335
335
{
336
- "id" : 7 ,
336
+ "id" : 1023 ,
337
337
"dtype" : " boolean" ,
338
338
"shape" : [
339
339
1 ,
351
351
"property_type" : " undef"
352
352
},
353
353
{
354
- "id" : 4 ,
354
+ "id" : 102 ,
355
355
"dtype" : " f32" ,
356
356
"shape" : [
357
357
1 ,
369
369
"property_type" : " undef"
370
370
},
371
371
{
372
- "id" : 8 ,
372
+ "id" : 5 ,
373
373
"dtype" : " f32" ,
374
374
"shape" : [
375
375
1
383
383
],
384
384
"outputs" : [
385
385
{
386
- "id" : 9 ,
386
+ "id" : 103 ,
387
387
"dtype" : " f32" ,
388
388
"shape" : [
389
389
1 ,
403
403
]
404
404
},
405
405
{
406
- "id" : 6 ,
406
+ "id" : 3 ,
407
407
"name" : " softmax" ,
408
408
"kind" : " SoftMax" ,
409
409
"attrs" : {
414
414
},
415
415
"inputs" : [
416
416
{
417
- "id" : 9 ,
417
+ "id" : 103 ,
418
418
"dtype" : " f32" ,
419
419
"shape" : [
420
420
1 ,
434
434
],
435
435
"outputs" : [
436
436
{
437
- "id" : 10 ,
437
+ "id" : 104 ,
438
438
"dtype" : " f32" ,
439
439
"shape" : [
440
440
1 ,
454
454
]
455
455
},
456
456
{
457
- "id" : 7 ,
457
+ "id" : 4 ,
458
458
"name" : " matmul_v" ,
459
459
"kind" : " MatMul" ,
460
460
"attrs" : {
469
469
},
470
470
"inputs" : [
471
471
{
472
- "id" : 10 ,
472
+ "id" : 104 ,
473
473
"dtype" : " f32" ,
474
474
"shape" : [
475
475
1 ,
487
487
"property_type" : " undef"
488
488
},
489
489
{
490
- "id" : 11 ,
490
+ "id" : 3 ,
491
491
"dtype" : " f32" ,
492
492
"shape" : [
493
493
1 ,
507
507
],
508
508
"outputs" : [
509
509
{
510
- "id" : 12 ,
510
+ "id" : 6 ,
511
511
"dtype" : " f32" ,
512
512
"shape" : [
513
513
1 ,
527
527
]
528
528
}
529
529
]
530
- }
530
+ }
You can’t perform that action at this time.
0 commit comments