|
11 | 11 | --reset --dt=f32,bf16,f16 --case=complex_fusion/mha/GQA-fp16-v2.json
|
12 | 12 | --reset --dt=f32,bf16,f16 --case=complex_fusion/mha/sdpa-plain-wo-mask-f16.json
|
13 | 13 | --reset --dt=f32,bf16,f16 --case=complex_fusion/mha/sdpa-plain-implicit-causal-mask-fp32-bs1.json
|
| 14 | +--reset --dt=0:f32+1:f32+10:f32+13:f32+14:f32 --case=complex_fusion/mha/sdpa-plain-training-forward-bf16-f32.json |
| 15 | +--reset --case=complex_fusion/mha/sdpa-plain-training-backward-f32.json |
14 | 16 |
|
15 | 17 | # f16 inputs + f32 intermediates + f16 outputs
|
16 | 18 | --reset --op-kind=1:Multiply,1:Divide --case=complex_fusion/mha/sdpa-plain-simplified-f16-f32.json
|
|
38 | 40 | --reset --dt=2:f32+5:f32 --case=complex_fusion/mha/sdpa-plain-wo-mask-f16.json
|
39 | 41 | --reset --dt=2:f32+6:f32 --case=complex_fusion/mha/sdpa-plain-wo-scale-f16-bs1.json
|
40 | 42 | --reset --case=complex_fusion/mha/sdpa-plain-bottom-right-implicit-causal-mask-f16-f32.json
|
| 43 | +--reset --dt=0:f16+1:f16+10:f16+13:f16+14:f16 --case=complex_fusion/mha/sdpa-plain-training-forward-bf16-f32.json |
| 44 | +--reset --dt=16:f16+17:f16+32:f16+33:f16+34:f16+36:f16+44:f16+45:f16+47:f16 --case=complex_fusion/mha/sdpa-plain-training-backward-bf16-f32.json |
41 | 45 | # q_seq_len != kv_seq_len
|
42 | 46 | --reset --in-shapes=1:1x16x128x64+24:1x16x128x64 --case=complex_fusion/mha/sdpa-plain-bottom-right-implicit-causal-mask-f16-f32.json
|
43 | 47 |
|
|
63 | 67 | --reset --dt=2:f32+5:f32+0:bf16+1:bf16+4:bf16+7:bf16+9:bf16+10:bf16 --case=complex_fusion/mha/sdpa-plain-wo-mask-f16.json
|
64 | 68 | --reset --dt=2:f32+6:f32+0:bf16+1:bf16+5:bf16+7:bf16+8:bf16+9:bf16 --case=complex_fusion/mha/sdpa-plain-wo-scale-f16-bs1.json
|
65 | 69 | --reset --dt=0:bf16+1:bf16+4:bf16+22:bf16+24:bf16+25:bf16 --case=complex_fusion/mha/sdpa-plain-bottom-right-implicit-causal-mask-f16-f32.json
|
| 70 | +--reset --case=complex_fusion/mha/sdpa-plain-training-forward-bf16-f32.json |
| 71 | +--reset --case=complex_fusion/mha/sdpa-plain-training-backward-bf16-f32.json |
66 | 72 |
|
67 | 73 | # int8 graphs
|
68 | 74 | --reset --case=complex_fusion/mha/MHA-GPT-inf-int8-bs1.json
|
|
0 commit comments