diff options
author | Nicolai Haehnle <nhaehnle@gmail.com> | 2016-05-02 17:37:01 +0000 |
---|---|---|
committer | Nicolai Haehnle <nhaehnle@gmail.com> | 2016-05-02 17:37:01 +0000 |
commit | 119d3d80cbb53ff601f5bf56affb464d3b5f55ea (patch) | |
tree | 683002e241fa797689f012ac51e8a443080babcd | |
parent | e951a1d739d6cc7479451d4465f2cf74b41ae374 (diff) | |
download | bcm5719-llvm-119d3d80cbb53ff601f5bf56affb464d3b5f55ea.tar.gz bcm5719-llvm-119d3d80cbb53ff601f5bf56affb464d3b5f55ea.zip |
AMDGPU: llvm.SI.fs.constant is a source of divergence
Summary:
This intrinsic is used to get flat-shaded fragment shader inputs. Those are
uniform across a primitive, but a fragment shader wave may process pixels from
multiple primitives (as indicated by the prim_mask), and so that's where
divergence can arise.
Reviewers: arsenm, tstellarAMD
Subscribers: arsenm, llvm-commits
Differential Revision: http://reviews.llvm.org/D19747
llvm-svn: 268259
-rw-r--r-- | llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp | 1 | ||||
-rw-r--r-- | llvm/test/Analysis/DivergenceAnalysis/AMDGPU/interp-intrinsics.ll | 22 |
2 files changed, 23 insertions, 0 deletions
```diff
diff --git a/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp b/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp
index 39da9ddb69e..fabec277707 100644
--- a/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp
+++ b/llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.cpp
@@ -260,6 +260,7 @@ static bool isIntrinsicSourceOfDivergence(const TargetIntrinsicInfo *TII,
       return false;
     case AMDGPUIntrinsic::SI_tid:
     case AMDGPUIntrinsic::SI_fs_interp:
+    case AMDGPUIntrinsic::SI_fs_constant:
       return true;
     }
   }
diff --git a/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/interp-intrinsics.ll b/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/interp-intrinsics.ll
new file mode 100644
index 00000000000..d1c90ba608c
--- /dev/null
+++ b/llvm/test/Analysis/DivergenceAnalysis/AMDGPU/interp-intrinsics.ll
@@ -0,0 +1,22 @@
+; RUN: opt -mtriple amdgcn--- -analyze -divergence %s | FileCheck %s
+
+; CHECK-LABEL: 'fs_interp'
+; CHECK: DIVERGENT: %v = call float @llvm.SI.fs.interp(
+define amdgpu_ps void @fs_interp(i32 inreg %prim_mask, <2 x i32> %interp_param) #1 {
+  %v = call float @llvm.SI.fs.interp(i32 0, i32 0, i32 %prim_mask, <2 x i32> %interp_param)
+  store volatile float %v, float addrspace(1)* undef
+  ret void
+}
+
+; CHECK-LABEL: 'fs_constant'
+; CHECK: DIVERGENT: %v = call float @llvm.SI.fs.constant(
+define amdgpu_ps void @fs_constant(i32 inreg %prim_mask, <2 x i32> %interp_param) #1 {
+  %v = call float @llvm.SI.fs.constant(i32 0, i32 0, i32 %prim_mask)
+  store volatile float %v, float addrspace(1)* undef
+  ret void
+}
+
+declare float @llvm.SI.fs.interp(i32, i32, i32, <2 x i32>) #0
+declare float @llvm.SI.fs.constant(i32, i32, i32) #0
+
+attributes #0 = { nounwind readnone }
```