@@ -2939,78 +2939,78 @@ bool X86InstrInfo::findCommutedOpIndices(const MachineInstr &MI,
2939
2939
case X86::VPDPBUUDSYrr:
2940
2940
case X86::VPDPBUUDrr:
2941
2941
case X86::VPDPBUUDYrr:
2942
- case X86::VPDPBSSDSZ128r :
2943
- case X86::VPDPBSSDSZ128rk :
2944
- case X86::VPDPBSSDSZ128rkz :
2945
- case X86::VPDPBSSDSZ256r :
2946
- case X86::VPDPBSSDSZ256rk :
2947
- case X86::VPDPBSSDSZ256rkz :
2948
- case X86::VPDPBSSDSZr :
2949
- case X86::VPDPBSSDSZrk :
2950
- case X86::VPDPBSSDSZrkz :
2951
- case X86::VPDPBSSDZ128r :
2952
- case X86::VPDPBSSDZ128rk :
2953
- case X86::VPDPBSSDZ128rkz :
2954
- case X86::VPDPBSSDZ256r :
2955
- case X86::VPDPBSSDZ256rk :
2956
- case X86::VPDPBSSDZ256rkz :
2957
- case X86::VPDPBSSDZr :
2958
- case X86::VPDPBSSDZrk :
2959
- case X86::VPDPBSSDZrkz :
2960
- case X86::VPDPBUUDSZ128r :
2961
- case X86::VPDPBUUDSZ128rk :
2962
- case X86::VPDPBUUDSZ128rkz :
2963
- case X86::VPDPBUUDSZ256r :
2964
- case X86::VPDPBUUDSZ256rk :
2965
- case X86::VPDPBUUDSZ256rkz :
2966
- case X86::VPDPBUUDSZr :
2967
- case X86::VPDPBUUDSZrk :
2968
- case X86::VPDPBUUDSZrkz :
2969
- case X86::VPDPBUUDZ128r :
2970
- case X86::VPDPBUUDZ128rk :
2971
- case X86::VPDPBUUDZ128rkz :
2972
- case X86::VPDPBUUDZ256r :
2973
- case X86::VPDPBUUDZ256rk :
2974
- case X86::VPDPBUUDZ256rkz :
2975
- case X86::VPDPBUUDZr :
2976
- case X86::VPDPBUUDZrk :
2977
- case X86::VPDPBUUDZrkz :
2978
- case X86::VPDPWSSDZ128r :
2979
- case X86::VPDPWSSDZ128rk :
2980
- case X86::VPDPWSSDZ128rkz :
2981
- case X86::VPDPWSSDZ256r :
2982
- case X86::VPDPWSSDZ256rk :
2983
- case X86::VPDPWSSDZ256rkz :
2984
- case X86::VPDPWSSDZr :
2985
- case X86::VPDPWSSDZrk :
2986
- case X86::VPDPWSSDZrkz :
2987
- case X86::VPDPWSSDSZ128r :
2988
- case X86::VPDPWSSDSZ128rk :
2989
- case X86::VPDPWSSDSZ128rkz :
2990
- case X86::VPDPWSSDSZ256r :
2991
- case X86::VPDPWSSDSZ256rk :
2992
- case X86::VPDPWSSDSZ256rkz :
2993
- case X86::VPDPWSSDSZr :
2994
- case X86::VPDPWSSDSZrk :
2995
- case X86::VPDPWSSDSZrkz :
2996
- case X86::VPDPWUUDZ128r :
2997
- case X86::VPDPWUUDZ128rk :
2998
- case X86::VPDPWUUDZ128rkz :
2999
- case X86::VPDPWUUDZ256r :
3000
- case X86::VPDPWUUDZ256rk :
3001
- case X86::VPDPWUUDZ256rkz :
3002
- case X86::VPDPWUUDZr :
3003
- case X86::VPDPWUUDZrk :
3004
- case X86::VPDPWUUDZrkz :
3005
- case X86::VPDPWUUDSZ128r :
3006
- case X86::VPDPWUUDSZ128rk :
3007
- case X86::VPDPWUUDSZ128rkz :
3008
- case X86::VPDPWUUDSZ256r :
3009
- case X86::VPDPWUUDSZ256rk :
3010
- case X86::VPDPWUUDSZ256rkz :
3011
- case X86::VPDPWUUDSZr :
3012
- case X86::VPDPWUUDSZrk :
3013
- case X86::VPDPWUUDSZrkz :
2942
+ case X86::VPDPBSSDSZ128rr :
2943
+ case X86::VPDPBSSDSZ128rrk :
2944
+ case X86::VPDPBSSDSZ128rrkz :
2945
+ case X86::VPDPBSSDSZ256rr :
2946
+ case X86::VPDPBSSDSZ256rrk :
2947
+ case X86::VPDPBSSDSZ256rrkz :
2948
+ case X86::VPDPBSSDSZrr :
2949
+ case X86::VPDPBSSDSZrrk :
2950
+ case X86::VPDPBSSDSZrrkz :
2951
+ case X86::VPDPBSSDZ128rr :
2952
+ case X86::VPDPBSSDZ128rrk :
2953
+ case X86::VPDPBSSDZ128rrkz :
2954
+ case X86::VPDPBSSDZ256rr :
2955
+ case X86::VPDPBSSDZ256rrk :
2956
+ case X86::VPDPBSSDZ256rrkz :
2957
+ case X86::VPDPBSSDZrr :
2958
+ case X86::VPDPBSSDZrrk :
2959
+ case X86::VPDPBSSDZrrkz :
2960
+ case X86::VPDPBUUDSZ128rr :
2961
+ case X86::VPDPBUUDSZ128rrk :
2962
+ case X86::VPDPBUUDSZ128rrkz :
2963
+ case X86::VPDPBUUDSZ256rr :
2964
+ case X86::VPDPBUUDSZ256rrk :
2965
+ case X86::VPDPBUUDSZ256rrkz :
2966
+ case X86::VPDPBUUDSZrr :
2967
+ case X86::VPDPBUUDSZrrk :
2968
+ case X86::VPDPBUUDSZrrkz :
2969
+ case X86::VPDPBUUDZ128rr :
2970
+ case X86::VPDPBUUDZ128rrk :
2971
+ case X86::VPDPBUUDZ128rrkz :
2972
+ case X86::VPDPBUUDZ256rr :
2973
+ case X86::VPDPBUUDZ256rrk :
2974
+ case X86::VPDPBUUDZ256rrkz :
2975
+ case X86::VPDPBUUDZrr :
2976
+ case X86::VPDPBUUDZrrk :
2977
+ case X86::VPDPBUUDZrrkz :
2978
+ case X86::VPDPWSSDZ128rr :
2979
+ case X86::VPDPWSSDZ128rrk :
2980
+ case X86::VPDPWSSDZ128rrkz :
2981
+ case X86::VPDPWSSDZ256rr :
2982
+ case X86::VPDPWSSDZ256rrk :
2983
+ case X86::VPDPWSSDZ256rrkz :
2984
+ case X86::VPDPWSSDZrr :
2985
+ case X86::VPDPWSSDZrrk :
2986
+ case X86::VPDPWSSDZrrkz :
2987
+ case X86::VPDPWSSDSZ128rr :
2988
+ case X86::VPDPWSSDSZ128rrk :
2989
+ case X86::VPDPWSSDSZ128rrkz :
2990
+ case X86::VPDPWSSDSZ256rr :
2991
+ case X86::VPDPWSSDSZ256rrk :
2992
+ case X86::VPDPWSSDSZ256rrkz :
2993
+ case X86::VPDPWSSDSZrr :
2994
+ case X86::VPDPWSSDSZrrk :
2995
+ case X86::VPDPWSSDSZrrkz :
2996
+ case X86::VPDPWUUDZ128rr :
2997
+ case X86::VPDPWUUDZ128rrk :
2998
+ case X86::VPDPWUUDZ128rrkz :
2999
+ case X86::VPDPWUUDZ256rr :
3000
+ case X86::VPDPWUUDZ256rrk :
3001
+ case X86::VPDPWUUDZ256rrkz :
3002
+ case X86::VPDPWUUDZrr :
3003
+ case X86::VPDPWUUDZrrk :
3004
+ case X86::VPDPWUUDZrrkz :
3005
+ case X86::VPDPWUUDSZ128rr :
3006
+ case X86::VPDPWUUDSZ128rrk :
3007
+ case X86::VPDPWUUDSZ128rrkz :
3008
+ case X86::VPDPWUUDSZ256rr :
3009
+ case X86::VPDPWUUDSZ256rrk :
3010
+ case X86::VPDPWUUDSZ256rrkz :
3011
+ case X86::VPDPWUUDSZrr :
3012
+ case X86::VPDPWUUDSZrrk :
3013
+ case X86::VPDPWUUDSZrrkz :
3014
3014
case X86::VPMADD52HUQrr:
3015
3015
case X86::VPMADD52HUQYrr:
3016
3016
case X86::VPMADD52HUQZ128r:
@@ -10822,15 +10822,15 @@ bool X86InstrInfo::getMachineCombinerPatterns(
10822
10822
}
10823
10823
break ;
10824
10824
}
10825
- case X86::VPDPWSSDZ128r :
10826
- case X86::VPDPWSSDZ128m :
10827
- case X86::VPDPWSSDZ256r :
10828
- case X86::VPDPWSSDZ256m :
10829
- case X86::VPDPWSSDZr :
10830
- case X86::VPDPWSSDZm : {
10831
- if (Subtarget.hasBWI () && !Subtarget.hasFastDPWSSD ()) {
10832
- Patterns.push_back (X86MachineCombinerPattern::DPWSSD);
10833
- return true ;
10825
+ case X86::VPDPWSSDZ128rr :
10826
+ case X86::VPDPWSSDZ128rm :
10827
+ case X86::VPDPWSSDZ256rr :
10828
+ case X86::VPDPWSSDZ256rm :
10829
+ case X86::VPDPWSSDZrr :
10830
+ case X86::VPDPWSSDZrm : {
10831
+ if (Subtarget.hasBWI () && !Subtarget.hasFastDPWSSD ()) {
10832
+ Patterns.push_back (X86MachineCombinerPattern::DPWSSD);
10833
+ return true ;
10834
10834
}
10835
10835
break ;
10836
10836
}
@@ -10866,11 +10866,11 @@ genAlternativeDpCodeSequence(MachineInstr &Root, const TargetInstrInfo &TII,
10866
10866
MaddOpc = X86::VPMADDWDrm;
10867
10867
AddOpc = X86::VPADDDrr;
10868
10868
break ;
10869
- case X86::VPDPWSSDZ128r :
10869
+ case X86::VPDPWSSDZ128rr :
10870
10870
MaddOpc = X86::VPMADDWDZ128rr;
10871
10871
AddOpc = X86::VPADDDZ128rr;
10872
10872
break ;
10873
- case X86::VPDPWSSDZ128m :
10873
+ case X86::VPDPWSSDZ128rm :
10874
10874
MaddOpc = X86::VPMADDWDZ128rm;
10875
10875
AddOpc = X86::VPADDDZ128rr;
10876
10876
break ;
@@ -10886,23 +10886,23 @@ genAlternativeDpCodeSequence(MachineInstr &Root, const TargetInstrInfo &TII,
10886
10886
MaddOpc = X86::VPMADDWDYrm;
10887
10887
AddOpc = X86::VPADDDYrr;
10888
10888
break ;
10889
- case X86::VPDPWSSDZ256r :
10889
+ case X86::VPDPWSSDZ256rr :
10890
10890
MaddOpc = X86::VPMADDWDZ256rr;
10891
10891
AddOpc = X86::VPADDDZ256rr;
10892
10892
break ;
10893
- case X86::VPDPWSSDZ256m :
10893
+ case X86::VPDPWSSDZ256rm :
10894
10894
MaddOpc = X86::VPMADDWDZ256rm;
10895
10895
AddOpc = X86::VPADDDZ256rr;
10896
10896
break ;
10897
10897
// vpdpwssd zmm2,zmm3,zmm1
10898
10898
// -->
10899
10899
// vpmaddwd zmm3,zmm3,zmm1
10900
10900
// vpaddd zmm2,zmm2,zmm3
10901
- case X86::VPDPWSSDZr :
10901
+ case X86::VPDPWSSDZrr :
10902
10902
MaddOpc = X86::VPMADDWDZrr;
10903
10903
AddOpc = X86::VPADDDZrr;
10904
10904
break ;
10905
- case X86::VPDPWSSDZm :
10905
+ case X86::VPDPWSSDZrm :
10906
10906
MaddOpc = X86::VPMADDWDZrm;
10907
10907
AddOpc = X86::VPADDDZrr;
10908
10908
break ;
0 commit comments