diff options
| author | Fangrui Song <maskray@google.com> | 2019-08-23 02:17:04 +0000 | 
|---|---|---|
| committer | Fangrui Song <maskray@google.com> | 2019-08-23 02:17:04 +0000 | 
| commit | 3fc933af8b49519658e4c2fd82f93c6d680c8a08 (patch) | |
| tree | f4be5e7421f3997fc0e85fdbbee52eb9fe1e5bc4 /llvm/lib | |
| parent | 7fbadf3b2793bf907d5a1fb7c1c9078500a0b030 (diff) | |
| download | bcm5719-llvm-3fc933af8b49519658e4c2fd82f93c6d680c8a08.tar.gz bcm5719-llvm-3fc933af8b49519658e4c2fd82f93c6d680c8a08.zip | |
[AlignmentFromAssumptions] getNewAlignmentDiff(): use getURemExpr()
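The alignment offset was calculated incorrectly: the old code computed `(Diff /u Align) * Align - Diff`, which is the negated remainder rather than `Diff % Align` as the accompanying comment states. As a result, aligned move instructions are sometimes not generated, as shown by the example below: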
```
// b.cc
typedef long long index;
extern "C" index g_tid;
extern "C" index g_num;
void add3(float* __restrict__ a, float* __restrict__ b, float* __restrict__ c) {
    index n = 64*1024;
    index m = 16*1024;
    index k = 4*1024;
    index tid = g_tid;
    index num = g_num;
    __builtin_assume_aligned(a, 32);
    __builtin_assume_aligned(b, 32);
    __builtin_assume_aligned(c, 32);
    for (index i0=tid*k; i0<m; i0+=num*k)
        for (index i1=0; i1<n*m; i1+=m)
            for (index i2=0; i2<k; i2++)
                c[i1+i0+i2] = b[i0+i2] + a[i1+i0+i2];
}
```
Compile with `clang b.cc -Ofast -march=skylake -mavx2 -S`
```
vmovaps -224(%rdi,%rbx,4), %ymm0
vmovups -192(%rdi,%rbx,4), %ymm1         # should be vmovaps
vmovups -160(%rdi,%rbx,4), %ymm2         # should be vmovaps
vmovups -128(%rdi,%rbx,4), %ymm3         # should be vmovaps
vaddps  -224(%rsi,%rbx,4), %ymm0, %ymm0
vaddps  -192(%rsi,%rbx,4), %ymm1, %ymm1
vaddps  -160(%rsi,%rbx,4), %ymm2, %ymm2
vaddps  -128(%rsi,%rbx,4), %ymm3, %ymm3
vmovaps %ymm0, -224(%rdx,%rbx,4)
vmovups %ymm1, -192(%rdx,%rbx,4)         # should be vmovaps
vmovups %ymm2, -160(%rdx,%rbx,4)         # should be vmovaps
vmovups %ymm3, -128(%rdx,%rbx,4)         # should be vmovaps
```
Differential Revision: https://reviews.llvm.org/D66575
Patch by Dun Liang
llvm-svn: 369723
Diffstat (limited to 'llvm/lib')
| -rw-r--r-- | llvm/lib/Transforms/Scalar/AlignmentFromAssumptions.cpp | 4 | 
1 file changed, 1 insertion, 3 deletions
```diff
diff --git a/llvm/lib/Transforms/Scalar/AlignmentFromAssumptions.cpp b/llvm/lib/Transforms/Scalar/AlignmentFromAssumptions.cpp
index de9a62e88c2..a301542a206 100644
--- a/llvm/lib/Transforms/Scalar/AlignmentFromAssumptions.cpp
+++ b/llvm/lib/Transforms/Scalar/AlignmentFromAssumptions.cpp
@@ -93,9 +93,7 @@ static unsigned getNewAlignmentDiff(const SCEV *DiffSCEV,
                                     const SCEV *AlignSCEV,
                                     ScalarEvolution *SE) {
   // DiffUnits = Diff % int64_t(Alignment)
-  const SCEV *DiffAlignDiv = SE->getUDivExpr(DiffSCEV, AlignSCEV);
-  const SCEV *DiffAlign = SE->getMulExpr(DiffAlignDiv, AlignSCEV);
-  const SCEV *DiffUnitsSCEV = SE->getMinusSCEV(DiffAlign, DiffSCEV);
+  const SCEV *DiffUnitsSCEV = SE->getURemExpr(DiffSCEV, AlignSCEV);
 
   LLVM_DEBUG(dbgs() << "\talignment relative to " << *AlignSCEV << " is "
                     << *DiffUnitsSCEV << " (diff: " << *DiffSCEV << ")\n");
```

