diff options
author | David Green <david.green@arm.com> | 2020-01-06 15:54:36 +0000 |
---|---|---|
committer | David Green <david.green@arm.com> | 2020-01-06 16:38:49 +0000 |
commit | f88d52728b9c7f91e4cfec657c0fc60be07d2cb4 (patch) | |
tree | 6ab72905c7136db4a995987a5ea34b350bb0beae | |
parent | 0eb981b8ce70d07b1b1fb39b969a6fe9509840c1 (diff) | |
download | bcm5719-llvm-f88d52728b9c7f91e4cfec657c0fc60be07d2cb4.tar.gz bcm5719-llvm-f88d52728b9c7f91e4cfec657c0fc60be07d2cb4.zip |
[ARM] Use the correct opcodes for Thumb2 segmented stack frame lowering
The segmented stack lowering code appears to be using ARM opcodes under
Thumb2. The MRC opcode will be the same for Thumb and ARM, but t2LDR
seems wrong. Either way, using the correct thumb vs arm opcodes is more
correct.
Differential Revision: https://reviews.llvm.org/D72074
-rw-r--r-- | llvm/lib/Target/ARM/ARMFrameLowering.cpp | 6 | ||||
-rw-r--r-- | llvm/test/CodeGen/Thumb2/segmented-stacks.ll | 86 |
2 files changed, 65 insertions, 27 deletions
diff --git a/llvm/lib/Target/ARM/ARMFrameLowering.cpp b/llvm/lib/Target/ARM/ARMFrameLowering.cpp index 5428bd6c94b..cb98b2b34ef 100644 --- a/llvm/lib/Target/ARM/ARMFrameLowering.cpp +++ b/llvm/lib/Target/ARM/ARMFrameLowering.cpp @@ -2424,7 +2424,8 @@ void ARMFrameLowering::adjustForSegmentedStacks( } else { // Get TLS base address from the coprocessor // mrc p15, #0, SR0, c13, c0, #3 - BuildMI(McrMBB, DL, TII.get(ARM::MRC), ScratchReg0) + BuildMI(McrMBB, DL, TII.get(Thumb ? ARM::t2MRC : ARM::MRC), + ScratchReg0) .addImm(15) .addImm(0) .addImm(13) @@ -2438,7 +2439,8 @@ void ARMFrameLowering::adjustForSegmentedStacks( // Get the stack limit from the right offset // ldr SR0, [sr0, #4 * TlsOffset] - BuildMI(GetMBB, DL, TII.get(ARM::LDRi12), ScratchReg0) + BuildMI(GetMBB, DL, TII.get(Thumb ? ARM::t2LDRi12 : ARM::LDRi12), + ScratchReg0) .addReg(ScratchReg0) .addImm(4 * TlsOffset) .add(predOps(ARMCC::AL)); diff --git a/llvm/test/CodeGen/Thumb2/segmented-stacks.ll b/llvm/test/CodeGen/Thumb2/segmented-stacks.ll index 49627fb7c3c..ee4dd0186b3 100644 --- a/llvm/test/CodeGen/Thumb2/segmented-stacks.ll +++ b/llvm/test/CodeGen/Thumb2/segmented-stacks.ll @@ -1,34 +1,70 @@ -; RUN: llc < %s -mtriple=thumb-linux-androideabi -mcpu=arm1156t2-s -mattr=+thumb2 -verify-machineinstrs | FileCheck %s -check-prefix=Thumb-android -; RUN: llc < %s -mtriple=thumb-linux-androideabi -mcpu=arm1156t2-s -mattr=+thumb2 -filetype=obj +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc < %s -mtriple=thumb-linux-androideabi -mcpu=arm1156t2-s -mattr=+thumb2 -verify-machineinstrs | FileCheck %s -check-prefix=THUMB +; RUN: llc < %s -mtriple=arm-linux-androideabi -mcpu=arm1156t2-s -verify-machineinstrs | FileCheck %s -check-prefix=ARM ; Just to prevent the alloca from being optimized away declare void @dummy_use(i32*, i32) define void @test_basic() #0 { - %mem = alloca i32, i32 10 - call void @dummy_use (i32* %mem, i32 10) - ret void - -; Thumb-android: test_basic: - -; Thumb-android: push {r4, r5} -; Thumb-android-NEXT: mrc p15, #0, r4, c13, c0, #3 -; Thumb-android-NEXT: mov r5, sp -; Thumb-android-NEXT: ldr r4, [r4, #252] -; Thumb-android-NEXT: cmp r4, r5 -; Thumb-android-NEXT: blo .LBB0_2 - -; Thumb-android: mov r4, #48 -; Thumb-android-NEXT: mov r5, #0 -; Thumb-android-NEXT: push {lr} -; Thumb-android-NEXT: bl __morestack -; Thumb-android-NEXT: ldr lr, [sp], #4 -; Thumb-android-NEXT: pop {r4, r5} -; Thumb-android-NEXT: bx lr - -; Thumb-android: pop {r4, r5} - +; THUMB-LABEL: test_basic: +; THUMB: @ %bb.0: +; THUMB-NEXT: push {r4, r5} +; THUMB-NEXT: mrc p15, #0, r4, c13, c0, #3 +; THUMB-NEXT: mov r5, sp +; THUMB-NEXT: ldr.w r4, [r4, #252] +; THUMB-NEXT: cmp r4, r5 +; THUMB-NEXT: blo .LBB0_2 +; THUMB-NEXT: @ %bb.1: +; THUMB-NEXT: mov r4, #48 +; THUMB-NEXT: mov r5, #0 +; THUMB-NEXT: push {lr} +; THUMB-NEXT: bl __morestack +; THUMB-NEXT: ldr lr, [sp], #4 +; THUMB-NEXT: pop {r4, r5} +; THUMB-NEXT: bx lr +; THUMB-NEXT: .LBB0_2: +; THUMB-NEXT: pop {r4, r5} +; THUMB-NEXT: .save {r7, lr} +; THUMB-NEXT: push {r7, lr} +; THUMB-NEXT: .pad #40 +; THUMB-NEXT: sub sp, #40 +; THUMB-NEXT: mov r0, sp +; THUMB-NEXT: movs r1, #10 +; THUMB-NEXT: bl dummy_use +; THUMB-NEXT: add sp, #40 +; THUMB-NEXT: pop {r7, pc} +; +; ARM-LABEL: test_basic: +; ARM: @ %bb.0: +; ARM-NEXT: push {r4, r5} +; ARM-NEXT: mrc p15, #0, r4, c13, c0, #3 +; ARM-NEXT: mov r5, sp +; ARM-NEXT: ldr r4, [r4, #252] +; ARM-NEXT: cmp r4, r5 +; ARM-NEXT: blo .LBB0_2 +; ARM-NEXT: @ %bb.1: +; ARM-NEXT: mov r4, #48 +; ARM-NEXT: mov r5, #0 +; ARM-NEXT: stmdb sp!, {lr} +; ARM-NEXT: bl __morestack +; ARM-NEXT: ldm sp!, {lr} +; ARM-NEXT: pop {r4, r5} +; ARM-NEXT: bx lr +; ARM-NEXT: .LBB0_2: +; ARM-NEXT: pop {r4, r5} +; ARM-NEXT: .save {r11, lr} +; ARM-NEXT: push {r11, lr} +; ARM-NEXT: .pad #40 +; ARM-NEXT: sub sp, sp, #40 +; ARM-NEXT: mov r0, sp +; ARM-NEXT: mov r1, #10 +; ARM-NEXT: bl dummy_use +; ARM-NEXT: add sp, sp, #40 +; ARM-NEXT: pop {r11, pc} + %mem = alloca i32, i32 10 + call void @dummy_use (i32* %mem, i32 10) + ret void } attributes #0 = { "split-stack" } |