diff options
| author | Matt Arsenault <Matthew.Arsenault@amd.com> | 2019-07-19 14:15:18 +0000 | 
|---|---|---|
| committer | Matt Arsenault <Matthew.Arsenault@amd.com> | 2019-07-19 14:15:18 +0000 | 
| commit | fecf43eba3630aeb55c56e5d308f99a7bd05bfbe (patch) | |
| tree | f65a92ab47e7aed8b45afa1e0396de4197491f85 /llvm/lib/Target/AMDGPU/SIISelLowering.cpp | |
| parent | 3fd917d8860e9bdcabc14c536da4377307906be0 (diff) | |
| download | bcm5719-llvm-fecf43eba3630aeb55c56e5d308f99a7bd05bfbe.tar.gz bcm5719-llvm-fecf43eba3630aeb55c56e5d308f99a7bd05bfbe.zip | |
AMDGPU/GlobalISel: Rewrite lowerFormalArguments
This should now handle everything except structs passed as multiple
registers.
I think most of the packing logic should be handled by
handleAssignments, but I'm unclear on what the contract is for
multiple registers. This is copying how x86 handles this.
This does change the behavior of the test_sgpr_alignment0 amdgpu_vs
test. I don't think shader arguments should try to follow the
alignment, and registers need to be repacked. I also don't think it
matters, since I think the pointers are packed to the beginning of the
argument list anyway.
llvm-svn: 366582
Diffstat (limited to 'llvm/lib/Target/AMDGPU/SIISelLowering.cpp')
| -rw-r--r-- | llvm/lib/Target/AMDGPU/SIISelLowering.cpp | 65 | 
1 files changed, 36 insertions, 29 deletions
| diff --git a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp index b8c7bd648f4..40b93f4ae3b 100644 --- a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp +++ b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp @@ -1596,29 +1596,32 @@ static void processShaderInputArgs(SmallVectorImpl<ISD::InputArg> &Splits,  }  // Allocate special inputs passed in VGPRs. -static void allocateSpecialEntryInputVGPRs(CCState &CCInfo, -                                           MachineFunction &MF, -                                           const SIRegisterInfo &TRI, -                                           SIMachineFunctionInfo &Info) { +void SITargetLowering::allocateSpecialEntryInputVGPRs(CCState &CCInfo, +                                                      MachineFunction &MF, +                                                      const SIRegisterInfo &TRI, +                                                      SIMachineFunctionInfo &Info) const { +  const LLT S32 = LLT::scalar(32); +  MachineRegisterInfo &MRI = MF.getRegInfo(); +    if (Info.hasWorkItemIDX()) { -    unsigned Reg = AMDGPU::VGPR0; -    MF.addLiveIn(Reg, &AMDGPU::VGPR_32RegClass); +    Register Reg = AMDGPU::VGPR0; +    MRI.setType(MF.addLiveIn(Reg, &AMDGPU::VGPR_32RegClass), S32);      CCInfo.AllocateReg(Reg);      Info.setWorkItemIDX(ArgDescriptor::createRegister(Reg));    }    if (Info.hasWorkItemIDY()) { -    unsigned Reg = AMDGPU::VGPR1; -    MF.addLiveIn(Reg, &AMDGPU::VGPR_32RegClass); +    Register Reg = AMDGPU::VGPR1; +    MRI.setType(MF.addLiveIn(Reg, &AMDGPU::VGPR_32RegClass), S32);      CCInfo.AllocateReg(Reg);      Info.setWorkItemIDY(ArgDescriptor::createRegister(Reg));    }    if (Info.hasWorkItemIDZ()) { -    unsigned Reg = AMDGPU::VGPR2; -    MF.addLiveIn(Reg, &AMDGPU::VGPR_32RegClass); +    Register Reg = AMDGPU::VGPR2; +    MRI.setType(MF.addLiveIn(Reg, &AMDGPU::VGPR_32RegClass), S32);      CCInfo.AllocateReg(Reg);      Info.setWorkItemIDZ(ArgDescriptor::createRegister(Reg)); @@ -1678,10 +1681,10 @@ static ArgDescriptor allocateSGPR64Input(CCState &CCInfo) {    return allocateSGPR32InputImpl(CCInfo, &AMDGPU::SGPR_64RegClass, 16);  } -static void allocateSpecialInputVGPRs(CCState &CCInfo, -                                      MachineFunction &MF, -                                      const SIRegisterInfo &TRI, -                                      SIMachineFunctionInfo &Info) { +void SITargetLowering::allocateSpecialInputVGPRs(CCState &CCInfo, +                                                 MachineFunction &MF, +                                                 const SIRegisterInfo &TRI, +                                                 SIMachineFunctionInfo &Info) const {    const unsigned Mask = 0x3ff;    ArgDescriptor Arg; @@ -1699,10 +1702,11 @@ static void allocateSpecialInputVGPRs(CCState &CCInfo,      Info.setWorkItemIDZ(allocateVGPR32Input(CCInfo, Mask << 20, Arg));  } -static void allocateSpecialInputSGPRs(CCState &CCInfo, -                                      MachineFunction &MF, -                                      const SIRegisterInfo &TRI, -                                      SIMachineFunctionInfo &Info) { +void SITargetLowering::allocateSpecialInputSGPRs( +  CCState &CCInfo, +  MachineFunction &MF, +  const SIRegisterInfo &TRI, +  SIMachineFunctionInfo &Info) const {    auto &ArgInfo = Info.getArgInfo();    // TODO: Unify handling with private memory pointers. @@ -1735,10 +1739,10 @@ static void allocateSpecialInputSGPRs(CCState &CCInfo,  }  // Allocate special inputs passed in user SGPRs. -static void allocateHSAUserSGPRs(CCState &CCInfo, -                                 MachineFunction &MF, -                                 const SIRegisterInfo &TRI, -                                 SIMachineFunctionInfo &Info) { +void SITargetLowering::allocateHSAUserSGPRs(CCState &CCInfo, +                                            MachineFunction &MF, +                                            const SIRegisterInfo &TRI, +                                            SIMachineFunctionInfo &Info) const {    if (Info.hasImplicitBufferPtr()) {      unsigned ImplicitBufferPtrReg = Info.addImplicitBufferPtr(TRI);      MF.addLiveIn(ImplicitBufferPtrReg, &AMDGPU::SGPR_64RegClass); @@ -1765,9 +1769,12 @@ static void allocateHSAUserSGPRs(CCState &CCInfo,    }    if (Info.hasKernargSegmentPtr()) { -    unsigned InputPtrReg = Info.addKernargSegmentPtr(TRI); -    MF.addLiveIn(InputPtrReg, &AMDGPU::SGPR_64RegClass); +    MachineRegisterInfo &MRI = MF.getRegInfo(); +    Register InputPtrReg = Info.addKernargSegmentPtr(TRI);      CCInfo.AllocateReg(InputPtrReg); + +    Register VReg = MF.addLiveIn(InputPtrReg, &AMDGPU::SGPR_64RegClass); +    MRI.setType(VReg, LLT::pointer(AMDGPUAS::CONSTANT_ADDRESS, 64));    }    if (Info.hasDispatchID()) { @@ -1787,11 +1794,11 @@ static void allocateHSAUserSGPRs(CCState &CCInfo,  }  // Allocate special input registers that are initialized per-wave. -static void allocateSystemSGPRs(CCState &CCInfo, -                                MachineFunction &MF, -                                SIMachineFunctionInfo &Info, -                                CallingConv::ID CallConv, -                                bool IsShader) { +void SITargetLowering::allocateSystemSGPRs(CCState &CCInfo, +                                           MachineFunction &MF, +                                           SIMachineFunctionInfo &Info, +                                           CallingConv::ID CallConv, +                                           bool IsShader) const {    if (Info.hasWorkGroupIDX()) {      unsigned Reg = Info.addWorkGroupIDX();      MF.addLiveIn(Reg, &AMDGPU::SReg_32_XM0RegClass); | 

