diff options
| author | Eric Christopher <echristo@gmail.com> | 2019-04-17 02:12:23 +0000 |
|---|---|---|
| committer | Eric Christopher <echristo@gmail.com> | 2019-04-17 02:12:23 +0000 |
| commit | a86343512845c9c1fdbac865fea88aa5fce7142a (patch) | |
| tree | 666fc6353de19ad8b00e56b67edd33f24104e4a7 /llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU | |
| parent | 7f8ca6e3679b3af951cb7a4b1377edfaa3244b93 (diff) | |
| download | bcm5719-llvm-a86343512845c9c1fdbac865fea88aa5fce7142a.tar.gz bcm5719-llvm-a86343512845c9c1fdbac865fea88aa5fce7142a.zip | |
Temporarily Revert "Add basic loop fusion pass."
As it's causing some bot failures (and per request from kbarton).
This reverts commit r358543/ab70da07286e618016e78247e4a24fcb84077fda.
llvm-svn: 358546
Diffstat (limited to 'llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU')
3 files changed, 0 insertions, 129 deletions
diff --git a/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/lit.local.cfg b/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/lit.local.cfg deleted file mode 100644 index 2a665f06be7..00000000000 --- a/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/lit.local.cfg +++ /dev/null @@ -1,2 +0,0 @@ -if not 'AMDGPU' in config.root.targets: - config.unsupported = True diff --git a/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/pr23975.ll b/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/pr23975.ll deleted file mode 100644 index f587a93bf1e..00000000000 --- a/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/pr23975.ll +++ /dev/null @@ -1,20 +0,0 @@ -; RUN: opt < %s -slsr -S | FileCheck %s - -target datalayout = "e-p:32:32-p1:64:64-p2:64:64-p3:32:32-p4:64:64-p5:32:32-p24:64:64-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64" -target triple = "amdgcn--" - -%struct.Matrix4x4 = type { [4 x [4 x float]] } - -; Function Attrs: nounwind -define fastcc void @Accelerator_Intersect(%struct.Matrix4x4 addrspace(1)* nocapture readonly %leafTransformations) #0 { -; CHECK-LABEL: @Accelerator_Intersect( -entry: - %tmp = sext i32 undef to i64 - %arrayidx114 = getelementptr inbounds %struct.Matrix4x4, %struct.Matrix4x4 addrspace(1)* %leafTransformations, i64 %tmp - %tmp1 = getelementptr %struct.Matrix4x4, %struct.Matrix4x4 addrspace(1)* %leafTransformations, i64 %tmp, i32 0, i64 0, i64 0 -; CHECK: %tmp1 = getelementptr %struct.Matrix4x4, %struct.Matrix4x4 addrspace(1)* %leafTransformations, i64 %tmp, i32 0, i64 0, i64 0 - %tmp2 = load <4 x float>, <4 x float> addrspace(1)* undef, align 4 - ret void -} - -attributes #0 = { nounwind "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "no-realign-stack" "stack-protector-buffer-size"="8" "target-cpu"="tahiti" "unsafe-fp-math"="false" "use-soft-float"="false" } diff --git a/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/reassociate-geps-and-slsr-addrspace.ll b/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/reassociate-geps-and-slsr-addrspace.ll deleted file mode 100644 index 9554ae69031..00000000000 --- a/llvm/test/Transforms/StraightLineStrengthReduce/AMDGPU/reassociate-geps-and-slsr-addrspace.ll +++ /dev/null @@ -1,107 +0,0 @@ -; RUN: opt -S -mtriple=amdgcn-- -separate-const-offset-from-gep -slsr -gvn < %s | FileCheck %s - -target datalayout = "e-p:32:32-p1:64:64-p2:64:64-p3:32:32-p4:64:64-p5:32:32-p24:64:64-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64" - - -; CHECK-LABEL: @slsr_after_reassociate_global_geps_mubuf_max_offset( -; CHECK: [[b1:%[0-9]+]] = getelementptr float, float addrspace(1)* %arr, i64 [[bump:%[0-9]+]] -; CHECK: [[b2:%[0-9]+]] = getelementptr float, float addrspace(1)* [[b1]], i64 [[bump]] -define amdgpu_kernel void @slsr_after_reassociate_global_geps_mubuf_max_offset(float addrspace(1)* %out, float addrspace(1)* noalias %arr, i32 %i) { -bb: - %i2 = shl nsw i32 %i, 1 - %j1 = add nsw i32 %i, 1023 - %tmp = sext i32 %j1 to i64 - %p1 = getelementptr inbounds float, float addrspace(1)* %arr, i64 %tmp - %tmp3 = bitcast float addrspace(1)* %p1 to i32 addrspace(1)* - %v11 = load i32, i32 addrspace(1)* %tmp3, align 4 - %tmp4 = bitcast float addrspace(1)* %out to i32 addrspace(1)* - store i32 %v11, i32 addrspace(1)* %tmp4, align 4 - - %j2 = add nsw i32 %i2, 1023 - %tmp5 = sext i32 %j2 to i64 - %p2 = getelementptr inbounds float, float addrspace(1)* %arr, i64 %tmp5 - %tmp6 = bitcast float addrspace(1)* %p2 to i32 addrspace(1)* - %v22 = load i32, i32 addrspace(1)* %tmp6, align 4 - %tmp7 = bitcast float addrspace(1)* %out to i32 addrspace(1)* - store i32 %v22, i32 addrspace(1)* %tmp7, align 4 - - ret void -} - -; CHECK-LABEL: @slsr_after_reassociate_global_geps_over_mubuf_max_offset( -; CHECK: %j1 = add nsw i32 %i, 1024 -; CHECK: %tmp = sext i32 %j1 to i64 -; CHECK: getelementptr inbounds float, float addrspace(1)* %arr, i64 %tmp -; CHECK: getelementptr inbounds float, float addrspace(1)* %arr, i64 %tmp5 -define amdgpu_kernel void @slsr_after_reassociate_global_geps_over_mubuf_max_offset(float addrspace(1)* %out, float addrspace(1)* noalias %arr, i32 %i) { -bb: - %i2 = shl nsw i32 %i, 1 - %j1 = add nsw i32 %i, 1024 - %tmp = sext i32 %j1 to i64 - %p1 = getelementptr inbounds float, float addrspace(1)* %arr, i64 %tmp - %tmp3 = bitcast float addrspace(1)* %p1 to i32 addrspace(1)* - %v11 = load i32, i32 addrspace(1)* %tmp3, align 4 - %tmp4 = bitcast float addrspace(1)* %out to i32 addrspace(1)* - store i32 %v11, i32 addrspace(1)* %tmp4, align 4 - - %j2 = add nsw i32 %i2, 1024 - %tmp5 = sext i32 %j2 to i64 - %p2 = getelementptr inbounds float, float addrspace(1)* %arr, i64 %tmp5 - %tmp6 = bitcast float addrspace(1)* %p2 to i32 addrspace(1)* - %v22 = load i32, i32 addrspace(1)* %tmp6, align 4 - %tmp7 = bitcast float addrspace(1)* %out to i32 addrspace(1)* - store i32 %v22, i32 addrspace(1)* %tmp7, align 4 - - ret void -} - -; CHECK-LABEL: @slsr_after_reassociate_lds_geps_ds_max_offset( -; CHECK: [[B1:%[0-9]+]] = getelementptr float, float addrspace(3)* %arr, i32 %i -; CHECK: getelementptr inbounds float, float addrspace(3)* [[B1]], i32 16383 - -; CHECK: [[B2:%[0-9]+]] = getelementptr float, float addrspace(3)* [[B1]], i32 %i -; CHECK: getelementptr inbounds float, float addrspace(3)* [[B2]], i32 16383 -define amdgpu_kernel void @slsr_after_reassociate_lds_geps_ds_max_offset(float addrspace(1)* %out, float addrspace(3)* noalias %arr, i32 %i) { -bb: - %i2 = shl nsw i32 %i, 1 - %j1 = add nsw i32 %i, 16383 - %p1 = getelementptr inbounds float, float addrspace(3)* %arr, i32 %j1 - %tmp3 = bitcast float addrspace(3)* %p1 to i32 addrspace(3)* - %v11 = load i32, i32 addrspace(3)* %tmp3, align 4 - %tmp4 = bitcast float addrspace(1)* %out to i32 addrspace(1)* - store i32 %v11, i32 addrspace(1)* %tmp4, align 4 - - %j2 = add nsw i32 %i2, 16383 - %p2 = getelementptr inbounds float, float addrspace(3)* %arr, i32 %j2 - %tmp6 = bitcast float addrspace(3)* %p2 to i32 addrspace(3)* - %v22 = load i32, i32 addrspace(3)* %tmp6, align 4 - %tmp7 = bitcast float addrspace(1)* %out to i32 addrspace(1)* - store i32 %v22, i32 addrspace(1)* %tmp7, align 4 - - ret void -} - -; CHECK-LABEL: @slsr_after_reassociate_lds_geps_over_ds_max_offset( -; CHECK: %j1 = add nsw i32 %i, 16384 -; CHECK: getelementptr inbounds float, float addrspace(3)* %arr, i32 %j1 -; CHECK: %j2 = add i32 %j1, %i -; CHECK: getelementptr inbounds float, float addrspace(3)* %arr, i32 %j2 -define amdgpu_kernel void @slsr_after_reassociate_lds_geps_over_ds_max_offset(float addrspace(1)* %out, float addrspace(3)* noalias %arr, i32 %i) { -bb: - %i2 = shl nsw i32 %i, 1 - %j1 = add nsw i32 %i, 16384 - %p1 = getelementptr inbounds float, float addrspace(3)* %arr, i32 %j1 - %tmp3 = bitcast float addrspace(3)* %p1 to i32 addrspace(3)* - %v11 = load i32, i32 addrspace(3)* %tmp3, align 4 - %tmp4 = bitcast float addrspace(1)* %out to i32 addrspace(1)* - store i32 %v11, i32 addrspace(1)* %tmp4, align 4 - - %j2 = add nsw i32 %i2, 16384 - %p2 = getelementptr inbounds float, float addrspace(3)* %arr, i32 %j2 - %tmp6 = bitcast float addrspace(3)* %p2 to i32 addrspace(3)* - %v22 = load i32, i32 addrspace(3)* %tmp6, align 4 - %tmp7 = bitcast float addrspace(1)* %out to i32 addrspace(1)* - store i32 %v22, i32 addrspace(1)* %tmp7, align 4 - - ret void -} |

