diff options
author | Simon Pilgrim <llvm-dev@redking.me.uk> | 2018-05-01 14:25:01 +0000 |
---|---|---|
committer | Simon Pilgrim <llvm-dev@redking.me.uk> | 2018-05-01 14:25:01 +0000 |
commit | dd8eae128b8b1fbffef8d0abeac981346f682557 (patch) | |
tree | 1f5c178e9b439cc7a6cc47272540bf7b3f65bcaf /llvm/lib | |
parent | 14c1085317cf5f44c773908535fe2220839b6e4f (diff) | |
download | bcm5719-llvm-dd8eae128b8b1fbffef8d0abeac981346f682557.tar.gz bcm5719-llvm-dd8eae128b8b1fbffef8d0abeac981346f682557.zip |
[X86] Split WriteFShuffle into XMM and YMM/ZMM scheduler classes
Removes more WriteFShuffle InstRW overrides
llvm-svn: 331264
Diffstat (limited to 'llvm/lib')
-rwxr-xr-x | llvm/lib/Target/X86/X86SchedBroadwell.td | 13 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86SchedHaswell.td | 13 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86SchedSandyBridge.td | 13 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86SchedSkylakeClient.td | 13 | ||||
-rwxr-xr-x | llvm/lib/Target/X86/X86SchedSkylakeServer.td | 29 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86Schedule.td | 3 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86ScheduleAtom.td | 1 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86ScheduleBtVer2.td | 22 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86ScheduleSLM.td | 3 | ||||
-rw-r--r-- | llvm/lib/Target/X86/X86ScheduleZnver1.td | 1 |
10 files changed, 22 insertions, 89 deletions
diff --git a/llvm/lib/Target/X86/X86SchedBroadwell.td b/llvm/lib/Target/X86/X86SchedBroadwell.td index 3b58b528097..daa624492bc 100755 --- a/llvm/lib/Target/X86/X86SchedBroadwell.td +++ b/llvm/lib/Target/X86/X86SchedBroadwell.td @@ -168,7 +168,8 @@ defm : BWWriteResPair<WriteFMAY, [BWPort01], 5, [1], 1, 6>; // Fused Multiply defm : BWWriteResPair<WriteFSign, [BWPort5], 1>; // Floating point fabs/fchs. defm : BWWriteResPair<WriteFLogic, [BWPort5], 1, [1], 1, 5>; // Floating point and/or/xor logicals. defm : BWWriteResPair<WriteFLogicY, [BWPort5], 1, [1], 1, 6>; // Floating point and/or/xor logicals (YMM/ZMM). -defm : BWWriteResPair<WriteFShuffle, [BWPort5], 1>; // Floating point vector shuffles. +defm : BWWriteResPair<WriteFShuffle, [BWPort5], 1, [1], 1, 5>; // Floating point vector shuffles. +defm : BWWriteResPair<WriteFShuffleY, [BWPort5], 1, [1], 1, 6>; // Floating point vector shuffles (YMM/ZMM). defm : BWWriteResPair<WriteFVarShuffle, [BWPort5], 1, [1], 1, 5>; // Floating point vector variable shuffles. defm : BWWriteResPair<WriteFVarShuffleY, [BWPort5], 1, [1], 1, 6>; // Floating point vector variable shuffles. defm : BWWriteResPair<WriteFBlend, [BWPort015], 1, [1], 1, 5>; // Floating point vector blends. @@ -1088,8 +1089,6 @@ def: InstRW<[BWWriteResGroup75], (instregex "VPACKSSDWYrm", "VPACKUSWBYrm", "VPALIGNRYrmi", "VPBLENDWYrmi", - "VPERMILPDYmi", - "VPERMILPSYmi", "VPSHUFBYrm", "VPSHUFDYmi", "VPSHUFHWYmi", @@ -1101,13 +1100,7 @@ def: InstRW<[BWWriteResGroup75], (instregex "VPACKSSDWYrm", "VPUNPCKLBWYrm", "VPUNPCKLDQYrm", "VPUNPCKLQDQYrm", - "VPUNPCKLWDYrm", - "VSHUFPDYrmi", - "VSHUFPSYrmi", - "VUNPCKHPDYrm", - "VUNPCKHPSYrm", - "VUNPCKLPDYrm", - "VUNPCKLPSYrm")>; + "VPUNPCKLWDYrm")>; def BWWriteResGroup76 : SchedWriteRes<[BWPort23,BWPort15]> { let Latency = 7; diff --git a/llvm/lib/Target/X86/X86SchedHaswell.td b/llvm/lib/Target/X86/X86SchedHaswell.td index 0c36c5be315..fc55578fa4b 100644 --- a/llvm/lib/Target/X86/X86SchedHaswell.td +++ b/llvm/lib/Target/X86/X86SchedHaswell.td @@ -165,7 +165,8 @@ defm : HWWriteResPair<WriteFMAY, [HWPort01], 5, [1], 1, 7>; defm : HWWriteResPair<WriteFSign, [HWPort0], 1>; defm : HWWriteResPair<WriteFLogic, [HWPort5], 1, [1], 1, 6>; defm : HWWriteResPair<WriteFLogicY, [HWPort5], 1, [1], 1, 7>; -defm : HWWriteResPair<WriteFShuffle, [HWPort5], 1>; +defm : HWWriteResPair<WriteFShuffle, [HWPort5], 1, [1], 1, 5>; +defm : HWWriteResPair<WriteFShuffleY, [HWPort5], 1, [1], 1, 7>; defm : HWWriteResPair<WriteFVarShuffle, [HWPort5], 1, [1], 1, 6>; defm : HWWriteResPair<WriteFVarShuffleY, [HWPort5], 1, [1], 1, 7>; defm : HWWriteResPair<WriteFBlend, [HWPort015], 1, [1], 1, 6>; @@ -900,8 +901,6 @@ def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKSSDWYrm", "VPACKUSWBYrm", "VPALIGNRYrmi", "VPBLENDWYrmi", - "VPERMILPDYmi", - "VPERMILPSYmi", "VPMOVSXBDYrm", "VPMOVSXBQYrm", "VPMOVSXWQYrm", @@ -916,13 +915,7 @@ def: InstRW<[HWWriteResGroup13_1], (instregex "VPACKSSDWYrm", "VPUNPCKLBWYrm", "VPUNPCKLDQYrm", "VPUNPCKLQDQYrm", - "VPUNPCKLWDYrm", - "VSHUFPDYrmi", - "VSHUFPSYrmi", - "VUNPCKHPDYrm", - "VUNPCKHPSYrm", - "VUNPCKLPDYrm", - "VUNPCKLPSYrm")>; + "VPUNPCKLWDYrm")>; def HWWriteResGroup14 : SchedWriteRes<[HWPort6,HWPort23]> { let Latency = 6; diff --git a/llvm/lib/Target/X86/X86SchedSandyBridge.td b/llvm/lib/Target/X86/X86SchedSandyBridge.td index f2d6a3f4a64..5ef051fe666 100644 --- a/llvm/lib/Target/X86/X86SchedSandyBridge.td +++ b/llvm/lib/Target/X86/X86SchedSandyBridge.td @@ -152,7 +152,8 @@ defm : SBWriteResPair<WriteCvtF2F, [SBPort1], 3>; defm : SBWriteResPair<WriteFSign, [SBPort5], 1>; defm : SBWriteResPair<WriteFLogic, [SBPort5], 1, [1], 1, 6>; defm : SBWriteResPair<WriteFLogicY, [SBPort5], 1, [1], 1, 7>; -defm : SBWriteResPair<WriteFShuffle, [SBPort5], 1>; +defm : SBWriteResPair<WriteFShuffle, [SBPort5], 1, [1], 1, 5>; +defm : SBWriteResPair<WriteFShuffleY,[SBPort5], 1, [1], 1, 7>; defm : SBWriteResPair<WriteFVarShuffle, [SBPort5], 1>; defm : SBWriteResPair<WriteFVarShuffleY,[SBPort5], 1>; defm : SBWriteResPair<WriteFBlend, [SBPort05], 1, [1], 1, 6>; @@ -1140,16 +1141,8 @@ def SBWriteResGroup73 : SchedWriteRes<[SBPort5,SBPort23]> { let ResourceCycles = [1,1]; } def: InstRW<[SBWriteResGroup73], (instregex "VPERM2F128rm", - "VPERMILPDYmi", "VPERMILPDYrm", - "VPERMILPSYmi", - "VPERMILPSYrm", - "VSHUFPDYrmi", - "VSHUFPSYrmi", - "VUNPCKHPDYrm", - "VUNPCKHPSYrm", - "VUNPCKLPDYrm", - "VUNPCKLPSYrm")>; + "VPERMILPSYrm")>; def SBWriteResGroup75 : SchedWriteRes<[SBPort23,SBPort05]> { let Latency = 8; diff --git a/llvm/lib/Target/X86/X86SchedSkylakeClient.td b/llvm/lib/Target/X86/X86SchedSkylakeClient.td index 3f68e927dc5..63469e4d973 100644 --- a/llvm/lib/Target/X86/X86SchedSkylakeClient.td +++ b/llvm/lib/Target/X86/X86SchedSkylakeClient.td @@ -165,7 +165,8 @@ defm : SKLWriteResPair<WriteFMAY, [SKLPort01], 4, [1], 1, 7>; // Fused Multipl defm : SKLWriteResPair<WriteFSign, [SKLPort0], 1>; // Floating point fabs/fchs. defm : SKLWriteResPair<WriteFLogic, [SKLPort015], 1, [1], 1, 6>; // Floating point and/or/xor logicals. defm : SKLWriteResPair<WriteFLogicY, [SKLPort015], 1, [1], 1, 7>; // Floating point and/or/xor logicals (YMM/ZMM). -defm : SKLWriteResPair<WriteFShuffle, [SKLPort5], 1>; // Floating point vector shuffles. +defm : SKLWriteResPair<WriteFShuffle, [SKLPort5], 1, [1], 1, 5>; // Floating point vector shuffles. +defm : SKLWriteResPair<WriteFShuffleY, [SKLPort5], 1, [1], 1, 7>; // Floating point vector shuffles (YMM/ZMM). defm : SKLWriteResPair<WriteFVarShuffle, [SKLPort5], 1>; // Floating point vector shuffles. defm : SKLWriteResPair<WriteFVarShuffleY, [SKLPort5], 1>; // Floating point vector shuffles. defm : SKLWriteResPair<WriteFBlend, [SKLPort015], 1, [1], 1, 6>; // Floating point vector blends. @@ -1519,9 +1520,7 @@ def: InstRW<[SKLWriteResGroup108], (instregex "FCOM32m", "VPBLENDWYrmi", "VPBROADCASTBYrm", "VPBROADCASTWYrm", - "VPERMILPDYmi", "VPERMILPDYrm", - "VPERMILPSYmi", "VPERMILPSYrm", "VPMOVSXBDYrm", "VPMOVSXBQYrm", @@ -1537,13 +1536,7 @@ def: InstRW<[SKLWriteResGroup108], (instregex "FCOM32m", "VPUNPCKLBWYrm", "VPUNPCKLDQYrm", "VPUNPCKLQDQYrm", - "VPUNPCKLWDYrm", - "VSHUFPDYrmi", - "VSHUFPSYrmi", - "VUNPCKHPDYrm", - "VUNPCKHPSYrm", - "VUNPCKLPDYrm", - "VUNPCKLPSYrm")>; + "VPUNPCKLWDYrm")>; def SKLWriteResGroup109 : SchedWriteRes<[SKLPort01,SKLPort23]> { let Latency = 8; diff --git a/llvm/lib/Target/X86/X86SchedSkylakeServer.td b/llvm/lib/Target/X86/X86SchedSkylakeServer.td index cce237cfe50..89e4577e60c 100755 --- a/llvm/lib/Target/X86/X86SchedSkylakeServer.td +++ b/llvm/lib/Target/X86/X86SchedSkylakeServer.td @@ -165,7 +165,8 @@ defm : SKXWriteResPair<WriteFMAY, [SKXPort015], 4, [1], 1, 7>; // Fused Multiply defm : SKXWriteResPair<WriteFSign, [SKXPort0], 1>; // Floating point fabs/fchs. defm : SKXWriteResPair<WriteFLogic, [SKXPort015], 1, [1], 1, 6>; // Floating point and/or/xor logicals. defm : SKXWriteResPair<WriteFLogicY, [SKXPort015], 1, [1], 1, 7>; // Floating point and/or/xor logicals (YMM/ZMM). -defm : SKXWriteResPair<WriteFShuffle, [SKXPort5], 1>; // Floating point vector shuffles. +defm : SKXWriteResPair<WriteFShuffle, [SKXPort5], 1, [1], 1, 5>; // Floating point vector shuffles. +defm : SKXWriteResPair<WriteFShuffleY, [SKXPort5], 1, [1], 1, 7>; // Floating point vector shuffles (YMM/ZMM). defm : SKXWriteResPair<WriteFVarShuffle, [SKXPort5], 1>; // Floating point vector variable shuffles. defm : SKXWriteResPair<WriteFVarShuffleY, [SKXPort5], 1>; // Floating point vector variable shuffles. defm : SKXWriteResPair<WriteFBlend, [SKXPort015], 1, [1], 1, 6>; // Floating point vector blends. @@ -2703,17 +2704,11 @@ def: InstRW<[SKXWriteResGroup119], (instregex "FCOM32m", "VPBROADCASTWYrm", "VPBROADCASTWZ256m(b?)", "VPBROADCASTWZm(b?)", - "VPERMILPDYmi", "VPERMILPDYrm", - "VPERMILPDZ256m(b?)i", "VPERMILPDZ256rm(b?)", - "VPERMILPDZm(b?)i", "VPERMILPDZrm(b?)", - "VPERMILPSYmi", "VPERMILPSYrm", - "VPERMILPSZ256m(b?)i", "VPERMILPSZ256rm(b?)", - "VPERMILPSZm(b?)i", "VPERMILPSZrm(b?)", "VPMOVSXBDYrm", "VPMOVSXBQYrm", @@ -2757,25 +2752,7 @@ def: InstRW<[SKXWriteResGroup119], (instregex "FCOM32m", "VPUNPCKLQDQZrm(b?)", "VPUNPCKLWDYrm", "VPUNPCKLWDZ256rm(b?)", - "VPUNPCKLWDZrm(b?)", - "VSHUFPDYrmi", - "VSHUFPDZ256rm(b?)i", - "VSHUFPDZrm(b?)i", - "VSHUFPSYrmi", - "VSHUFPSZ256rm(b?)i", - "VSHUFPSZrm(b?)i", - "VUNPCKHPDYrm", - "VUNPCKHPDZ256rm(b?)", - "VUNPCKHPDZrm(b?)", - "VUNPCKHPSYrm", - "VUNPCKHPSZ256rm(b?)", - "VUNPCKHPSZrm(b?)", - "VUNPCKLPDYrm", - "VUNPCKLPDZ256rm(b?)", - "VUNPCKLPDZrm(b?)", - "VUNPCKLPSYrm", - "VUNPCKLPSZ256rm(b?)", - "VUNPCKLPSZrm(b?)")>; + "VPUNPCKLWDZrm(b?)")>; def SKXWriteResGroup120 : SchedWriteRes<[SKXPort01,SKXPort23]> { let Latency = 8; diff --git a/llvm/lib/Target/X86/X86Schedule.td b/llvm/lib/Target/X86/X86Schedule.td index 758f035e5ef..cf0e3db0b0d 100644 --- a/llvm/lib/Target/X86/X86Schedule.td +++ b/llvm/lib/Target/X86/X86Schedule.td @@ -105,6 +105,7 @@ defm WriteFSign : X86SchedWritePair; // Floating point fabs/fchs. defm WriteFLogic : X86SchedWritePair; // Floating point and/or/xor logicals. defm WriteFLogicY : X86SchedWritePair; // Floating point and/or/xor logicals (YMM/ZMM). defm WriteFShuffle : X86SchedWritePair; // Floating point vector shuffles. +defm WriteFShuffleY : X86SchedWritePair; // Floating point vector shuffles (YMM/ZMM). defm WriteFVarShuffle : X86SchedWritePair; // Floating point vector variable shuffles. defm WriteFVarShuffleY : X86SchedWritePair; // Floating point vector variable shuffles (YMM/ZMM). defm WriteFBlend : X86SchedWritePair; // Floating point vector blends. @@ -212,7 +213,7 @@ def SchedWriteFLogic def SchedWriteFShuffle : X86SchedWriteWidths<WriteFShuffle, WriteFShuffle, - WriteFShuffle, WriteFShuffle>; + WriteFShuffleY, WriteFShuffleY>; def SchedWriteFVarShuffle : X86SchedWriteWidths<WriteFVarShuffle, WriteFVarShuffle, WriteFVarShuffleY, WriteFVarShuffleY>; diff --git a/llvm/lib/Target/X86/X86ScheduleAtom.td b/llvm/lib/Target/X86/X86ScheduleAtom.td index 3090d25b516..6979044c452 100644 --- a/llvm/lib/Target/X86/X86ScheduleAtom.td +++ b/llvm/lib/Target/X86/X86ScheduleAtom.td @@ -214,6 +214,7 @@ defm : AtomWriteResPair<WriteFSign, [AtomPort1], [AtomPort1]>; defm : AtomWriteResPair<WriteFLogic, [AtomPort01], [AtomPort0]>; defm : AtomWriteResPair<WriteFLogicY, [AtomPort01], [AtomPort0]>; // NOTE: Doesn't exist on Atom. defm : AtomWriteResPair<WriteFShuffle, [AtomPort0], [AtomPort0]>; +defm : AtomWriteResPair<WriteFShuffleY, [AtomPort0], [AtomPort0]>; // NOTE: Doesn't exist on Atom. defm : AtomWriteResPair<WriteFVarShuffle, [AtomPort0], [AtomPort0]>; // NOTE: Doesn't exist on Atom. defm : AtomWriteResPair<WriteFVarShuffleY, [AtomPort0], [AtomPort0]>; // NOTE: Doesn't exist on Atom. defm : AtomWriteResPair<WriteFMA, [AtomPort0], [AtomPort0]>; // NOTE: Doesn't exist on Atom. diff --git a/llvm/lib/Target/X86/X86ScheduleBtVer2.td b/llvm/lib/Target/X86/X86ScheduleBtVer2.td index 10a695d4b7f..15f3464241c 100644 --- a/llvm/lib/Target/X86/X86ScheduleBtVer2.td +++ b/llvm/lib/Target/X86/X86ScheduleBtVer2.td @@ -330,6 +330,7 @@ defm : JWriteResFpuPair<WriteFSign, [JFPU1, JFPM], 2>; defm : JWriteResFpuPair<WriteFLogic, [JFPU01, JFPX], 1>; defm : JWriteResYMMPair<WriteFLogicY, [JFPU01, JFPX], 1, [2, 2], 2>; defm : JWriteResFpuPair<WriteFShuffle, [JFPU01, JFPX], 1>; +defm : JWriteResYMMPair<WriteFShuffleY, [JFPU01, JFPX], 1, [2, 2], 2>; defm : JWriteResFpuPair<WriteFVarShuffle, [JFPU01, JFPX], 2, [1, 4], 3>; defm : JWriteResYMMPair<WriteFVarShuffleY,[JFPU01, JFPX], 3, [2, 6], 6>; defm : JWriteResFpuPair<WriteFBlend, [JFPU01, JFPX], 1>; @@ -685,27 +686,6 @@ def JWriteVCVTPDYLd: SchedWriteRes<[JLAGU, JFPU1, JSTC, JFPX]> { } def : InstRW<[JWriteVCVTPDYLd, ReadAfterLd], (instrs VCVTPD2DQYrm, VCVTTPD2DQYrm, VCVTPD2PSYrm)>; -def JWriteShuffleY: SchedWriteRes<[JFPU01, JFPX]> { - let ResourceCycles = [2, 2]; - let NumMicroOps = 2; -} -def : InstRW<[JWriteShuffleY], (instrs VMOVDDUPYrr, VMOVSHDUPYrr, VMOVSLDUPYrr, - VPERMILPDYri, VPERMILPSYri, VSHUFPDYrri, - VSHUFPSYrri, VUNPCKHPDYrr, VUNPCKHPSYrr, - VUNPCKLPDYrr, VUNPCKLPSYrr)>; - -def JWriteShuffleYLd: SchedWriteRes<[JLAGU, JFPU01, JFPX]> { - let Latency = 6; - let ResourceCycles = [2, 2, 2]; - let NumMicroOps = 2; -} -def : InstRW<[JWriteShuffleYLd, ReadAfterLd], (instrs VMOVDDUPYrm, VMOVSHDUPYrm, - VMOVSLDUPYrm, VPERMILPDYmi, - VPERMILPSYmi, VSHUFPDYrmi, - VSHUFPSYrmi, VUNPCKHPDYrm, - VUNPCKHPSYrm, VUNPCKLPDYrm, - VUNPCKLPSYrm)>; - def JWriteVBROADCASTYLd: SchedWriteRes<[JLAGU, JFPU01, JFPX]> { let Latency = 6; let ResourceCycles = [1, 2, 4]; diff --git a/llvm/lib/Target/X86/X86ScheduleSLM.td b/llvm/lib/Target/X86/X86ScheduleSLM.td index 9ea9eb00cee..6c4e1faea77 100644 --- a/llvm/lib/Target/X86/X86ScheduleSLM.td +++ b/llvm/lib/Target/X86/X86ScheduleSLM.td @@ -143,7 +143,8 @@ defm : SLMWriteResPair<WriteCvtF2F, [SLM_FPC_RSV01], 4>; defm : SLMWriteResPair<WriteFSign, [SLM_FPC_RSV01], 1>; defm : SLMWriteResPair<WriteFLogic, [SLM_FPC_RSV01], 1>; defm : SLMWriteResPair<WriteFLogicY, [SLM_FPC_RSV01], 1>; -defm : SLMWriteResPair<WriteFShuffle, [SLM_FPC_RSV0], 1>; +defm : SLMWriteResPair<WriteFShuffle, [SLM_FPC_RSV0], 1>; +defm : SLMWriteResPair<WriteFShuffleY, [SLM_FPC_RSV0], 1>; defm : SLMWriteResPair<WriteFVarShuffle, [SLM_FPC_RSV0], 1>; defm : SLMWriteResPair<WriteFVarShuffleY,[SLM_FPC_RSV0], 1>; defm : SLMWriteResPair<WriteFBlend, [SLM_FPC_RSV0], 1>; diff --git a/llvm/lib/Target/X86/X86ScheduleZnver1.td b/llvm/lib/Target/X86/X86ScheduleZnver1.td index 2e92c53b531..4d8887186a0 100644 --- a/llvm/lib/Target/X86/X86ScheduleZnver1.td +++ b/llvm/lib/Target/X86/X86ScheduleZnver1.td @@ -209,6 +209,7 @@ defm : ZnWriteResFpuPair<WriteFSign, [ZnFPU3], 2>; defm : ZnWriteResFpuPair<WriteFLogic, [ZnFPU], 1>; defm : ZnWriteResFpuPair<WriteFLogicY, [ZnFPU], 1>; defm : ZnWriteResFpuPair<WriteFShuffle, [ZnFPU12], 1>; +defm : ZnWriteResFpuPair<WriteFShuffleY, [ZnFPU12], 1>; defm : ZnWriteResFpuPair<WriteFVarShuffle, [ZnFPU12], 1>; defm : ZnWriteResFpuPair<WriteFVarShuffleY,[ZnFPU12], 1>; defm : ZnWriteResFpuPair<WriteFMul, [ZnFPU0], 5>; |