diff options
Diffstat (limited to 'llvm')
-rw-r--r-- | llvm/lib/Analysis/TargetLibraryInfo.cpp | 14 | ||||
-rw-r--r-- | llvm/test/Transforms/InstCombine/AMDGPU/tan.ll | 21 |
2 files changed, 23 insertions, 12 deletions
diff --git a/llvm/lib/Analysis/TargetLibraryInfo.cpp b/llvm/lib/Analysis/TargetLibraryInfo.cpp index 5bdc24ac291..23096969805 100644 --- a/llvm/lib/Analysis/TargetLibraryInfo.cpp +++ b/llvm/lib/Analysis/TargetLibraryInfo.cpp @@ -105,18 +105,8 @@ static void initialize(TargetLibraryInfoImpl &TLI, const Triple &T, TLI.setShouldSignExtI32Param(ShouldSignExtI32Param); if (T.getArch() == Triple::r600 || - T.getArch() == Triple::amdgcn) { - TLI.setUnavailable(LibFunc_ldexp); - TLI.setUnavailable(LibFunc_ldexpf); - TLI.setUnavailable(LibFunc_ldexpl); - TLI.setUnavailable(LibFunc_exp10); - TLI.setUnavailable(LibFunc_exp10f); - TLI.setUnavailable(LibFunc_exp10l); - TLI.setUnavailable(LibFunc_log10); - TLI.setUnavailable(LibFunc_log10f); - TLI.setUnavailable(LibFunc_log10l); - TLI.setUnavailable(LibFunc_printf); - } + T.getArch() == Triple::amdgcn) + TLI.disableAllFunctions(); // There are no library implementations of memcpy and memset for AMD gpus and // these can be difficult to lower in the backend. diff --git a/llvm/test/Transforms/InstCombine/AMDGPU/tan.ll b/llvm/test/Transforms/InstCombine/AMDGPU/tan.ll new file mode 100644 index 00000000000..4c3a9f1fb79 --- /dev/null +++ b/llvm/test/Transforms/InstCombine/AMDGPU/tan.ll @@ -0,0 +1,21 @@ +; RUN: opt -mtriple=amdgcn--amdpal -S -instcombine <%s | FileCheck --check-prefixes=GCN %s + +; Check that sin/cos is not folded to tan on amdgcn. + +; GCN-LABEL: define amdgpu_ps float @llpc.shader.FS.main +; GCN: call float @llvm.sin.f32 +; GCN: call float @llvm.cos.f32 + +declare float @llvm.sin.f32(float) #0 +declare float @llvm.cos.f32(float) #0 + +define amdgpu_ps float @llpc.shader.FS.main(float %arg) { +.entry: + %tmp32 = call float @llvm.sin.f32(float %arg) + %tmp33 = call float @llvm.cos.f32(float %arg) + %tmp34 = fdiv reassoc nnan nsz arcp contract float 1.000000e+00, %tmp33 + %tmp35 = fmul reassoc nnan nsz arcp contract float %tmp32, %tmp34 + ret float %tmp35 +} + +attributes #0 = { nounwind readnone speculatable willreturn } |