Skip to content

Commit df61ffb

Browse files
committed
benchdnn: inputs: graph: test f32 intermediates for implicit mask
1 parent 80f4f02 commit df61ffb

File tree

2 files changed

+38
-35
lines changed

2 files changed

+38
-35
lines changed

tests/benchdnn/inputs/graph/complex_fusion/harness_mha_all

+3
Original file line number | Diff line number | Diff line change
@@ -17,8 +17,11 @@
1717
--reset --dt=f32,bf16,f16 --case=complex_fusion/mha/sdpa-plain-implicit-causal-mask-fp32-bs1.json
1818
# f16 inputs + f32 intermediates + f16 outputs
1919
--reset --case=complex_fusion/mha/sdpa-plain-simplified-f16-f32.json
20+
--reset --dt=1:f16+2:f16+3:f16+4:f16+6:f16+104:f16 --case=complex_fusion/mha/sdpa-plain-implicit-causal-mask-fp32-bs1.json
21+
2022
# bf16 inputs + f32 intermediates + bf16 outputs
2123
--reset --dt=1:bf16+2:bf16+3:bf16+4:bf16+5:bf16+6:bf16+104:bf16 --case=complex_fusion/mha/sdpa-plain-simplified-f16-f32.json
24+
--reset --dt=1:bf16+2:bf16+3:bf16+4:bf16+6:bf16+104:bf16 --case=complex_fusion/mha/sdpa-plain-implicit-causal-mask-fp32-bs1.json
2225

2326
# int8 graphs
2427
--reset --case=complex_fusion/mha/MHA-GPT-inf-int8-bs1.json

tests/benchdnn/inputs/graph/complex_fusion/mha/sdpa-plain-implicit-causal-mask-fp32-bs1.json

+35 -35
Original file line number | Diff line number | Diff line change
@@ -1,17 +1,17 @@
11
{
2-
"version": "3.7.0",
2+
"version": "3.8.0",
33
"engine_kind": "cpu",
44
"fpmath_mode": "strict",
55
"fpmath_mode_apply_to_int": "false",
66
"input_ports": [
7-
0,
87
1,
9-
3,
10-
8,
11-
11
8+
2,
9+
4,
10+
5,
11+
3
1212
],
1313
"output_ports": [
14-
12
14+
6
1515
],
1616
"graph": [
1717
{
@@ -30,7 +30,7 @@
3030
},
3131
"inputs": [
3232
{
33-
"id": 0,
33+
"id": 1,
3434
"dtype": "f32",
3535
"shape": [
3636
1,
@@ -48,7 +48,7 @@
4848
"property_type": "undef"
4949
},
5050
{
51-
"id": 1,
51+
"id": 2,
5252
"dtype": "f32",
5353
"shape": [
5454
1,
@@ -68,7 +68,7 @@
6868
],
6969
"outputs": [
7070
{
71-
"id": 2,
71+
"id": 101,
7272
"dtype": "f32",
7373
"shape": [
7474
1,
@@ -99,7 +99,7 @@
9999
},
100100
"inputs": [
101101
{
102-
"id": 2,
102+
"id": 101,
103103
"dtype": "f32",
104104
"shape": [
105105
1,
@@ -117,7 +117,7 @@
117117
"property_type": "undef"
118118
},
119119
{
120-
"id": 3,
120+
"id": 4,
121121
"dtype": "f32",
122122
"shape": [
123123
1
@@ -131,7 +131,7 @@
131131
],
132132
"outputs": [
133133
{
134-
"id": 4,
134+
"id": 102,
135135
"dtype": "f32",
136136
"shape": [
137137
1,
@@ -151,7 +151,7 @@
151151
]
152152
},
153153
{
154-
"id": 2,
154+
"id": 40,
155155
"name": "genindex_row",
156156
"kind": "GenIndex",
157157
"attrs": {
@@ -162,7 +162,7 @@
162162
},
163163
"inputs": [
164164
{
165-
"id": 4,
165+
"id": 102,
166166
"dtype": "f32",
167167
"shape": [
168168
1,
@@ -182,7 +182,7 @@
182182
],
183183
"outputs": [
184184
{
185-
"id": 5,
185+
"id": 1021,
186186
"dtype": "s32",
187187
"shape": [
188188
1,
@@ -202,7 +202,7 @@
202202
]
203203
},
204204
{
205-
"id": 3,
205+
"id": 41,
206206
"name": "genindex_col",
207207
"kind": "GenIndex",
208208
"attrs": {
@@ -213,7 +213,7 @@
213213
},
214214
"inputs": [
215215
{
216-
"id": 4,
216+
"id": 102,
217217
"dtype": "f32",
218218
"shape": [
219219
1,
@@ -233,7 +233,7 @@
233233
],
234234
"outputs": [
235235
{
236-
"id": 6,
236+
"id": 1022,
237237
"dtype": "s32",
238238
"shape": [
239239
1,
@@ -253,7 +253,7 @@
253253
]
254254
},
255255
{
256-
"id": 4,
256+
"id": 42,
257257
"name": "mask_greater_equal",
258258
"kind": "GreaterEqual",
259259
"attrs": {
@@ -264,7 +264,7 @@
264264
},
265265
"inputs": [
266266
{
267-
"id": 5,
267+
"id": 1021,
268268
"dtype": "s32",
269269
"shape": [
270270
1,
@@ -282,7 +282,7 @@
282282
"property_type": "undef"
283283
},
284284
{
285-
"id": 6,
285+
"id": 1022,
286286
"dtype": "s32",
287287
"shape": [
288288
1,
@@ -302,7 +302,7 @@
302302
],
303303
"outputs": [
304304
{
305-
"id": 7,
305+
"id": 1023,
306306
"dtype": "boolean",
307307
"shape": [
308308
1,
@@ -322,7 +322,7 @@
322322
]
323323
},
324324
{
325-
"id": 5,
325+
"id": 2,
326326
"name": "Select",
327327
"kind": "Select",
328328
"attrs": {
@@ -333,7 +333,7 @@
333333
},
334334
"inputs": [
335335
{
336-
"id": 7,
336+
"id": 1023,
337337
"dtype": "boolean",
338338
"shape": [
339339
1,
@@ -351,7 +351,7 @@
351351
"property_type": "undef"
352352
},
353353
{
354-
"id": 4,
354+
"id": 102,
355355
"dtype": "f32",
356356
"shape": [
357357
1,
@@ -369,7 +369,7 @@
369369
"property_type": "undef"
370370
},
371371
{
372-
"id": 8,
372+
"id": 5,
373373
"dtype": "f32",
374374
"shape": [
375375
1
@@ -383,7 +383,7 @@
383383
],
384384
"outputs": [
385385
{
386-
"id": 9,
386+
"id": 103,
387387
"dtype": "f32",
388388
"shape": [
389389
1,
@@ -403,7 +403,7 @@
403403
]
404404
},
405405
{
406-
"id": 6,
406+
"id": 3,
407407
"name": "softmax",
408408
"kind": "SoftMax",
409409
"attrs": {
@@ -414,7 +414,7 @@
414414
},
415415
"inputs": [
416416
{
417-
"id": 9,
417+
"id": 103,
418418
"dtype": "f32",
419419
"shape": [
420420
1,
@@ -434,7 +434,7 @@
434434
],
435435
"outputs": [
436436
{
437-
"id": 10,
437+
"id": 104,
438438
"dtype": "f32",
439439
"shape": [
440440
1,
@@ -454,7 +454,7 @@
454454
]
455455
},
456456
{
457-
"id": 7,
457+
"id": 4,
458458
"name": "matmul_v",
459459
"kind": "MatMul",
460460
"attrs": {
@@ -469,7 +469,7 @@
469469
},
470470
"inputs": [
471471
{
472-
"id": 10,
472+
"id": 104,
473473
"dtype": "f32",
474474
"shape": [
475475
1,
@@ -487,7 +487,7 @@
487487
"property_type": "undef"
488488
},
489489
{
490-
"id": 11,
490+
"id": 3,
491491
"dtype": "f32",
492492
"shape": [
493493
1,
@@ -507,7 +507,7 @@
507507
],
508508
"outputs": [
509509
{
510-
"id": 12,
510+
"id": 6,
511511
"dtype": "f32",
512512
"shape": [
513513
1,
@@ -527,4 +527,4 @@
527527
]
528528
}
529529
]
530-
}
530+
}

0 commit comments

Comments
 (0)