diff options
Diffstat (limited to 'llvm/test/CodeGen/AArch64/load-combine.ll')
-rw-r--r-- | llvm/test/CodeGen/AArch64/load-combine.ll | 146 |
1 files changed, 83 insertions, 63 deletions
diff --git a/llvm/test/CodeGen/AArch64/load-combine.ll b/llvm/test/CodeGen/AArch64/load-combine.ll index b9879b555aa..906646cda15 100644 --- a/llvm/test/CodeGen/AArch64/load-combine.ll +++ b/llvm/test/CodeGen/AArch64/load-combine.ll @@ -1,11 +1,13 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc < %s -mtriple=arm64-unknown | FileCheck %s ; i8* p; // p is 1 byte aligned ; (i32) p[0] | ((i32) p[1] << 8) | ((i32) p[2] << 16) | ((i32) p[3] << 24) define i32 @load_i32_by_i8_unaligned(i32* %arg) { ; CHECK-LABEL: load_i32_by_i8_unaligned: -; CHECK: ldr w0, [x0] -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldr w0, [x0] +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 0 %tmp2 = load i8, i8* %tmp1, align 1 @@ -32,8 +34,9 @@ define i32 @load_i32_by_i8_unaligned(i32* %arg) { ; (i32) p[0] | ((i32) p[1] << 8) | ((i32) p[2] << 16) | ((i32) p[3] << 24) define i32 @load_i32_by_i8_aligned(i32* %arg) { ; CHECK-LABEL: load_i32_by_i8_aligned: -; CHECK: ldr w0, [x0] -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldr w0, [x0] +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 0 %tmp2 = load i8, i8* %tmp1, align 4 @@ -60,9 +63,10 @@ define i32 @load_i32_by_i8_aligned(i32* %arg) { ; ((i32) p[0] << 24) | ((i32) p[1] << 16) | ((i32) p[2] << 8) | (i32) p[3] define i32 @load_i32_by_i8_bswap(i32* %arg) { ; CHECK-LABEL: load_i32_by_i8_bswap: -; CHECK: ldr w8, [x0] -; CHECK-NEXT: rev w0, w8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldr w8, [x0] +; CHECK-NEXT: rev w0, w8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = load i8, i8* %tmp, align 4 %tmp2 = zext i8 %tmp1 to i32 @@ -88,8 +92,9 @@ define i32 @load_i32_by_i8_bswap(i32* %arg) { ; (i64) p[0] | ((i64) p[1] << 8) | ((i64) p[2] << 16) | ((i64) p[3] << 24) | ((i64) p[4] << 32) | ((i64) p[5] << 40) | ((i64) p[6] << 48) | ((i64) p[7] << 56) define i64 @load_i64_by_i8(i64* %arg) { ; CHECK-LABEL: load_i64_by_i8: -; CHECK: ldr x0, [x0] -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldr x0, [x0] +; CHECK-NEXT: ret %tmp = bitcast i64* %arg to i8* %tmp1 = load i8, i8* %tmp, align 8 %tmp2 = zext i8 %tmp1 to i64 @@ -135,9 +140,10 @@ define i64 @load_i64_by_i8(i64* %arg) { ; ((i64) p[0] << 56) | ((i64) p[1] << 48) | ((i64) p[2] << 40) | ((i64) p[3] << 32) | ((i64) p[4] << 24) | ((i64) p[5] << 16) | ((i64) p[6] << 8) | (i64) p[7] define i64 @load_i64_by_i8_bswap(i64* %arg) { ; CHECK-LABEL: load_i64_by_i8_bswap: -; CHECK: ldr x8, [x0] -; CHECK-NEXT: rev x0, x8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldr x8, [x0] +; CHECK-NEXT: rev x0, x8 +; CHECK-NEXT: ret %tmp = bitcast i64* %arg to i8* %tmp1 = load i8, i8* %tmp, align 8 %tmp2 = zext i8 %tmp1 to i64 @@ -183,8 +189,9 @@ define i64 @load_i64_by_i8_bswap(i64* %arg) { ; (i32) p[1] | ((i32) p[2] << 8) | ((i32) p[3] << 16) | ((i32) p[4] << 24) define i32 @load_i32_by_i8_nonzero_offset(i32* %arg) { ; CHECK-LABEL: load_i32_by_i8_nonzero_offset: -; CHECK: ldur w0, [x0, #1] -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldur w0, [x0, #1] +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 1 @@ -212,8 +219,9 @@ define i32 @load_i32_by_i8_nonzero_offset(i32* %arg) { ; (i32) p[-4] | ((i32) p[-3] << 8) | ((i32) p[-2] << 16) | ((i32) p[-1] << 24) define i32 @load_i32_by_i8_neg_offset(i32* %arg) { ; CHECK-LABEL: load_i32_by_i8_neg_offset: -; CHECK: ldur w0, [x0, #-4] -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldur w0, [x0, #-4] +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 -4 @@ -241,9 +249,10 @@ define i32 @load_i32_by_i8_neg_offset(i32* %arg) { ; (i32) p[4] | ((i32) p[3] << 8) | ((i32) p[2] << 16) | ((i32) p[1] << 24) define i32 @load_i32_by_i8_nonzero_offset_bswap(i32* %arg) { ; CHECK-LABEL: load_i32_by_i8_nonzero_offset_bswap: -; CHECK: ldur w8, [x0, #1] -; CHECK-NEXT: rev w0, w8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldur w8, [x0, #1] +; CHECK-NEXT: rev w0, w8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 4 @@ -271,9 +280,10 @@ define i32 @load_i32_by_i8_nonzero_offset_bswap(i32* %arg) { ; (i32) p[-1] | ((i32) p[-2] << 8) | ((i32) p[-3] << 16) | ((i32) p[-4] << 24) define i32 @load_i32_by_i8_neg_offset_bswap(i32* %arg) { ; CHECK-LABEL: load_i32_by_i8_neg_offset_bswap: -; CHECK: ldur w8, [x0, #-4] -; CHECK-NEXT: rev w0, w8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldur w8, [x0, #-4] +; CHECK-NEXT: rev w0, w8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 -1 @@ -303,9 +313,10 @@ declare i16 @llvm.bswap.i16(i16) ; (i32) bswap(p[1]) | (i32) bswap(p[0] << 16) define i32 @load_i32_by_bswap_i16(i32* %arg) { ; CHECK-LABEL: load_i32_by_bswap_i16: -; CHECK: ldr w8, [x0] -; CHECK-NEXT: rev w0, w8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldr w8, [x0] +; CHECK-NEXT: rev w0, w8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i16* %tmp1 = load i16, i16* %tmp, align 4 @@ -324,8 +335,9 @@ define i32 @load_i32_by_bswap_i16(i32* %arg) { ; (i32) p[0] | (sext(p[1] << 16) to i32) define i32 @load_i32_by_sext_i16(i32* %arg) { ; CHECK-LABEL: load_i32_by_sext_i16: -; CHECK: ldr w0, [x0] -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldr w0, [x0] +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i16* %tmp1 = load i16, i16* %tmp, align 4 %tmp2 = zext i16 %tmp1 to i32 @@ -342,9 +354,10 @@ define i32 @load_i32_by_sext_i16(i32* %arg) { ; (i32) p[i] | ((i32) p[i + 1] << 8) | ((i32) p[i + 2] << 16) | ((i32) p[i + 3] << 24) define i32 @load_i32_by_i8_base_offset_index(i8* %arg, i32 %i) { ; CHECK-LABEL: load_i32_by_i8_base_offset_index: -; CHECK: add x8, x0, w1, uxtw -; CHECK-NEXT: ldr w0, [x8, #12] -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: add x8, x0, w1, uxtw +; CHECK-NEXT: ldr w0, [x8, #12] +; CHECK-NEXT: ret %tmp = add nuw nsw i32 %i, 3 %tmp2 = add nuw nsw i32 %i, 2 %tmp3 = add nuw nsw i32 %i, 1 @@ -379,9 +392,10 @@ define i32 @load_i32_by_i8_base_offset_index(i8* %arg, i32 %i) { ; (i32) p[i + 1] | ((i32) p[i + 2] << 8) | ((i32) p[i + 3] << 16) | ((i32) p[i + 4] << 24) define i32 @load_i32_by_i8_base_offset_index_2(i8* %arg, i32 %i) { ; CHECK-LABEL: load_i32_by_i8_base_offset_index_2: -; CHECK: add x8, x0, w1, uxtw -; CHECK-NEXT: ldur w0, [x8, #13] -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: add x8, x0, w1, uxtw +; CHECK-NEXT: ldur w0, [x8, #13] +; CHECK-NEXT: ret %tmp = add nuw nsw i32 %i, 4 %tmp2 = add nuw nsw i32 %i, 3 %tmp3 = add nuw nsw i32 %i, 2 @@ -416,11 +430,12 @@ define i32 @load_i32_by_i8_base_offset_index_2(i8* %arg, i32 %i) { ; (i32) p[0] | ((i32) p[1] << 8) define i32 @zext_load_i32_by_i8(i32* %arg) { ; CHECK-LABEL: zext_load_i32_by_i8: -; CHECK: ldrb w8, [x0] -; CHECK-NEXT: ldrb w9, [x0, #1] -; CHECK-NEXT: bfi w8, w9, #8, #8 -; CHECK-NEXT: mov w0, w8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldrb w8, [x0] +; CHECK-NEXT: ldrb w9, [x0, #1] +; CHECK-NEXT: bfi w8, w9, #8, #8 +; CHECK-NEXT: mov w0, w8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 0 @@ -438,11 +453,12 @@ define i32 @zext_load_i32_by_i8(i32* %arg) { ; ((i32) p[0] << 8) | ((i32) p[1] << 16) define i32 @zext_load_i32_by_i8_shl_8(i32* %arg) { ; CHECK-LABEL: zext_load_i32_by_i8_shl_8: -; CHECK: ldrb w8, [x0] -; CHECK-NEXT: ldrb w9, [x0, #1] -; CHECK-NEXT: lsl w0, w8, #8 -; CHECK-NEXT: bfi w0, w9, #16, #8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldrb w8, [x0] +; CHECK-NEXT: ldrb w9, [x0, #1] +; CHECK-NEXT: lsl w0, w8, #8 +; CHECK-NEXT: bfi w0, w9, #16, #8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 0 @@ -461,11 +477,12 @@ define i32 @zext_load_i32_by_i8_shl_8(i32* %arg) { ; ((i32) p[0] << 16) | ((i32) p[1] << 24) define i32 @zext_load_i32_by_i8_shl_16(i32* %arg) { ; CHECK-LABEL: zext_load_i32_by_i8_shl_16: -; CHECK: ldrb w8, [x0] -; CHECK-NEXT: ldrb w9, [x0, #1] -; CHECK-NEXT: lsl w0, w8, #16 -; CHECK-NEXT: bfi w0, w9, #24, #8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldrb w8, [x0] +; CHECK-NEXT: ldrb w9, [x0, #1] +; CHECK-NEXT: lsl w0, w8, #16 +; CHECK-NEXT: bfi w0, w9, #24, #8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 0 @@ -483,11 +500,12 @@ define i32 @zext_load_i32_by_i8_shl_16(i32* %arg) { ; (i32) p[1] | ((i32) p[0] << 8) define i32 @zext_load_i32_by_i8_bswap(i32* %arg) { ; CHECK-LABEL: zext_load_i32_by_i8_bswap: -; CHECK: ldrb w8, [x0, #1] -; CHECK-NEXT: ldrb w9, [x0] -; CHECK-NEXT: bfi w8, w9, #8, #8 -; CHECK-NEXT: mov w0, w8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldrb w8, [x0, #1] +; CHECK-NEXT: ldrb w9, [x0] +; CHECK-NEXT: bfi w8, w9, #8, #8 +; CHECK-NEXT: mov w0, w8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 1 @@ -505,11 +523,12 @@ define i32 @zext_load_i32_by_i8_bswap(i32* %arg) { ; ((i32) p[1] << 8) | ((i32) p[0] << 16) define i32 @zext_load_i32_by_i8_bswap_shl_8(i32* %arg) { ; CHECK-LABEL: zext_load_i32_by_i8_bswap_shl_8: -; CHECK: ldrb w8, [x0, #1] -; CHECK-NEXT: ldrb w9, [x0] -; CHECK-NEXT: lsl w0, w8, #8 -; CHECK-NEXT: bfi w0, w9, #16, #8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldrb w8, [x0, #1] +; CHECK-NEXT: ldrb w9, [x0] +; CHECK-NEXT: lsl w0, w8, #8 +; CHECK-NEXT: bfi w0, w9, #16, #8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 1 @@ -528,11 +547,12 @@ define i32 @zext_load_i32_by_i8_bswap_shl_8(i32* %arg) { ; ((i32) p[1] << 16) | ((i32) p[0] << 24) define i32 @zext_load_i32_by_i8_bswap_shl_16(i32* %arg) { ; CHECK-LABEL: zext_load_i32_by_i8_bswap_shl_16: -; CHECK: ldrb w8, [x0, #1] -; CHECK-NEXT: ldrb w9, [x0] -; CHECK-NEXT: lsl w0, w8, #16 -; CHECK-NEXT: bfi w0, w9, #24, #8 -; CHECK-NEXT: ret +; CHECK: // %bb.0: +; CHECK-NEXT: ldrb w8, [x0, #1] +; CHECK-NEXT: ldrb w9, [x0] +; CHECK-NEXT: lsl w0, w8, #16 +; CHECK-NEXT: bfi w0, w9, #24, #8 +; CHECK-NEXT: ret %tmp = bitcast i32* %arg to i8* %tmp1 = getelementptr inbounds i8, i8* %tmp, i32 1 |