diff options
| author | Alex Bradbury <asb@lowrisc.org> | 2018-01-18 11:34:02 +0000 |
|---|---|---|
| committer | Alex Bradbury <asb@lowrisc.org> | 2018-01-18 11:34:02 +0000 |
| commit | 7d6aa1f7ae73206460bc36c97d5b48bdbf7c2cd8 (patch) | |
| tree | 19a95f1c99019c338f9250c313ec36b0722de084 /llvm/test/CodeGen/RISCV/vararg.ll | |
| parent | c806d39182c1aa6c647d044d19d58aad9f5c95df (diff) | |
| download | bcm5719-llvm-7d6aa1f7ae73206460bc36c97d5b48bdbf7c2cd8.tar.gz bcm5719-llvm-7d6aa1f7ae73206460bc36c97d5b48bdbf7c2cd8.zip | |
[RISCV] Implement frame pointer elimination
llvm-svn: 322839
Diffstat (limited to 'llvm/test/CodeGen/RISCV/vararg.ll')
| -rw-r--r-- | llvm/test/CodeGen/RISCV/vararg.ll | 960 |
1 files changed, 798 insertions, 162 deletions
diff --git a/llvm/test/CodeGen/RISCV/vararg.ll b/llvm/test/CodeGen/RISCV/vararg.ll index 8f9a4b793a9..61a6178e095 100644 --- a/llvm/test/CodeGen/RISCV/vararg.ll +++ b/llvm/test/CodeGen/RISCV/vararg.ll @@ -1,6 +1,8 @@ ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc -mtriple=riscv32 -verify-machineinstrs < %s \ -; RUN: | FileCheck -check-prefix=RV32I %s +; RUN: | FileCheck -check-prefix=RV32I-FPELIM %s +; RUN: llc -mtriple=riscv32 -verify-machineinstrs -disable-fp-elim < %s \ +; RUN: | FileCheck -check-prefix=RV32I-WITHFP %s declare void @llvm.va_start(i8*) declare void @llvm.va_end(i8*) @@ -15,23 +17,54 @@ define i32 @va1(i8* %fmt, ...) nounwind { ; RV32I-LABEL: va1: ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -48 -; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 -; RV32I-NEXT: sw a1, 4(s0) -; RV32I-NEXT: sw a7, 28(s0) -; RV32I-NEXT: sw a6, 24(s0) -; RV32I-NEXT: sw a5, 20(s0) -; RV32I-NEXT: sw a4, 16(s0) -; RV32I-NEXT: sw a3, 12(s0) -; RV32I-NEXT: sw a2, 8(s0) -; RV32I-NEXT: addi a0, s0, 8 -; RV32I-NEXT: sw a0, -12(s0) -; RV32I-NEXT: lw a0, 4(s0) -; RV32I-NEXT: lw s0, 8(sp) -; RV32I-NEXT: lw ra, 12(sp) +; RV32I-NEXT: sw a1, 20(sp) +; RV32I-NEXT: sw a7, 44(sp) +; RV32I-NEXT: sw a6, 40(sp) +; RV32I-NEXT: sw a5, 36(sp) +; RV32I-NEXT: sw a4, 32(sp) +; RV32I-NEXT: sw a3, 28(sp) +; RV32I-NEXT: sw a2, 24(sp) +; RV32I-NEXT: addi a0, sp, 24 +; RV32I-NEXT: sw a0, 12(sp) +; RV32I-NEXT: lw a0, 20(sp) ; RV32I-NEXT: addi sp, sp, 48 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va1: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -48 +; RV32I-FPELIM-NEXT: sw a1, 20(sp) +; RV32I-FPELIM-NEXT: sw a7, 44(sp) +; RV32I-FPELIM-NEXT: sw a6, 40(sp) +; RV32I-FPELIM-NEXT: sw a5, 36(sp) +; RV32I-FPELIM-NEXT: sw a4, 32(sp) +; RV32I-FPELIM-NEXT: sw a3, 28(sp) +; RV32I-FPELIM-NEXT: sw a2, 24(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 24 +; RV32I-FPELIM-NEXT: sw a0, 12(sp) +; RV32I-FPELIM-NEXT: lw a0, 20(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 48 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va1: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: sw a1, 4(s0) +; RV32I-WITHFP-NEXT: sw a7, 28(s0) +; RV32I-WITHFP-NEXT: sw a6, 24(s0) +; RV32I-WITHFP-NEXT: sw a5, 20(s0) +; RV32I-WITHFP-NEXT: sw a4, 16(s0) +; RV32I-WITHFP-NEXT: sw a3, 12(s0) +; RV32I-WITHFP-NEXT: sw a2, 8(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 8 +; RV32I-WITHFP-NEXT: sw a0, -12(s0) +; RV32I-WITHFP-NEXT: lw a0, 4(s0) +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret %va = alloca i8*, align 4 %1 = bitcast i8** %va to i8* call void @llvm.va_start(i8* %1) @@ -48,23 +81,54 @@ define i32 @va1_va_arg(i8* %fmt, ...) nounwind { ; RV32I-LABEL: va1_va_arg: ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -48 -; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 -; RV32I-NEXT: sw a1, 4(s0) -; RV32I-NEXT: sw a7, 28(s0) -; RV32I-NEXT: sw a6, 24(s0) -; RV32I-NEXT: sw a5, 20(s0) -; RV32I-NEXT: sw a4, 16(s0) -; RV32I-NEXT: sw a3, 12(s0) -; RV32I-NEXT: sw a2, 8(s0) -; RV32I-NEXT: addi a0, s0, 8 -; RV32I-NEXT: sw a0, -12(s0) -; RV32I-NEXT: lw a0, 4(s0) -; RV32I-NEXT: lw s0, 8(sp) -; RV32I-NEXT: lw ra, 12(sp) +; RV32I-NEXT: sw a1, 20(sp) +; RV32I-NEXT: sw a7, 44(sp) +; RV32I-NEXT: sw a6, 40(sp) +; RV32I-NEXT: sw a5, 36(sp) +; RV32I-NEXT: sw a4, 32(sp) +; RV32I-NEXT: sw a3, 28(sp) +; RV32I-NEXT: sw a2, 24(sp) +; RV32I-NEXT: addi a0, sp, 24 +; RV32I-NEXT: sw a0, 12(sp) +; RV32I-NEXT: lw a0, 20(sp) ; RV32I-NEXT: addi sp, sp, 48 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va1_va_arg: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -48 +; RV32I-FPELIM-NEXT: sw a1, 20(sp) +; RV32I-FPELIM-NEXT: sw a7, 44(sp) +; RV32I-FPELIM-NEXT: sw a6, 40(sp) +; RV32I-FPELIM-NEXT: sw a5, 36(sp) +; RV32I-FPELIM-NEXT: sw a4, 32(sp) +; RV32I-FPELIM-NEXT: sw a3, 28(sp) +; RV32I-FPELIM-NEXT: sw a2, 24(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 24 +; RV32I-FPELIM-NEXT: sw a0, 12(sp) +; RV32I-FPELIM-NEXT: lw a0, 20(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 48 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va1_va_arg: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: sw a1, 4(s0) +; RV32I-WITHFP-NEXT: sw a7, 28(s0) +; RV32I-WITHFP-NEXT: sw a6, 24(s0) +; RV32I-WITHFP-NEXT: sw a5, 20(s0) +; RV32I-WITHFP-NEXT: sw a4, 16(s0) +; RV32I-WITHFP-NEXT: sw a3, 12(s0) +; RV32I-WITHFP-NEXT: sw a2, 8(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 8 +; RV32I-WITHFP-NEXT: sw a0, -12(s0) +; RV32I-WITHFP-NEXT: lw a0, 4(s0) +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret %va = alloca i8*, align 4 %1 = bitcast i8** %va to i8* call void @llvm.va_start(i8* %1) @@ -107,6 +171,69 @@ define i32 @va1_va_arg_alloca(i8* %fmt, ...) nounwind { ; RV32I-NEXT: lw ra, 12(sp) ; RV32I-NEXT: addi sp, sp, 48 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va1_va_arg_alloca: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -48 +; RV32I-FPELIM-NEXT: sw ra, 12(sp) +; RV32I-FPELIM-NEXT: sw s0, 8(sp) +; RV32I-FPELIM-NEXT: sw s1, 4(sp) +; RV32I-FPELIM-NEXT: addi s0, sp, 16 +; RV32I-FPELIM-NEXT: sw a1, 4(s0) +; RV32I-FPELIM-NEXT: sw a7, 28(s0) +; RV32I-FPELIM-NEXT: sw a6, 24(s0) +; RV32I-FPELIM-NEXT: sw a5, 20(s0) +; RV32I-FPELIM-NEXT: sw a4, 16(s0) +; RV32I-FPELIM-NEXT: sw a3, 12(s0) +; RV32I-FPELIM-NEXT: sw a2, 8(s0) +; RV32I-FPELIM-NEXT: addi a0, s0, 8 +; RV32I-FPELIM-NEXT: sw a0, -16(s0) +; RV32I-FPELIM-NEXT: lw s1, 4(s0) +; RV32I-FPELIM-NEXT: addi a0, s1, 15 +; RV32I-FPELIM-NEXT: andi a0, a0, -16 +; RV32I-FPELIM-NEXT: sub a0, sp, a0 +; RV32I-FPELIM-NEXT: mv sp, a0 +; RV32I-FPELIM-NEXT: lui a1, %hi(notdead) +; RV32I-FPELIM-NEXT: addi a1, a1, %lo(notdead) +; RV32I-FPELIM-NEXT: jalr a1 +; RV32I-FPELIM-NEXT: mv a0, s1 +; RV32I-FPELIM-NEXT: addi sp, s0, -16 +; RV32I-FPELIM-NEXT: lw s1, 4(sp) +; RV32I-FPELIM-NEXT: lw s0, 8(sp) +; RV32I-FPELIM-NEXT: lw ra, 12(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 48 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va1_va_arg_alloca: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: sw s1, 4(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: sw a1, 4(s0) +; RV32I-WITHFP-NEXT: sw a7, 28(s0) +; RV32I-WITHFP-NEXT: sw a6, 24(s0) +; RV32I-WITHFP-NEXT: sw a5, 20(s0) +; RV32I-WITHFP-NEXT: sw a4, 16(s0) +; RV32I-WITHFP-NEXT: sw a3, 12(s0) +; RV32I-WITHFP-NEXT: sw a2, 8(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 8 +; RV32I-WITHFP-NEXT: sw a0, -16(s0) +; RV32I-WITHFP-NEXT: lw s1, 4(s0) +; RV32I-WITHFP-NEXT: addi a0, s1, 15 +; RV32I-WITHFP-NEXT: andi a0, a0, -16 +; RV32I-WITHFP-NEXT: sub a0, sp, a0 +; RV32I-WITHFP-NEXT: mv sp, a0 +; RV32I-WITHFP-NEXT: lui a1, %hi(notdead) +; RV32I-WITHFP-NEXT: addi a1, a1, %lo(notdead) +; RV32I-WITHFP-NEXT: jalr a1 +; RV32I-WITHFP-NEXT: mv a0, s1 +; RV32I-WITHFP-NEXT: addi sp, s0, -16 +; RV32I-WITHFP-NEXT: lw s1, 4(sp) +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret %va = alloca i8*, align 4 %1 = bitcast i8** %va to i8* call void @llvm.va_start(i8* %1) @@ -122,8 +249,6 @@ define void @va1_caller() nounwind { ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -16 ; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 ; RV32I-NEXT: lui a0, 261888 ; RV32I-NEXT: mv a3, a0 ; RV32I-NEXT: lui a0, %hi(va1) @@ -131,11 +256,42 @@ define void @va1_caller() nounwind { ; RV32I-NEXT: addi a4, zero, 2 ; RV32I-NEXT: mv a2, zero ; RV32I-NEXT: jalr a0 -; RV32I-NEXT: lw s0, 8(sp) ; RV32I-NEXT: lw ra, 12(sp) ; RV32I-NEXT: addi sp, sp, 16 ; RV32I-NEXT: ret ; Pass a double, as a float would be promoted by a C/C++ frontend +; RV32I-FPELIM-LABEL: va1_caller: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -16 +; RV32I-FPELIM-NEXT: sw ra, 12(sp) +; RV32I-FPELIM-NEXT: lui a0, 261888 +; RV32I-FPELIM-NEXT: mv a3, a0 +; RV32I-FPELIM-NEXT: lui a0, %hi(va1) +; RV32I-FPELIM-NEXT: addi a0, a0, %lo(va1) +; RV32I-FPELIM-NEXT: addi a4, zero, 2 +; RV32I-FPELIM-NEXT: mv a2, zero +; RV32I-FPELIM-NEXT: jalr a0 +; RV32I-FPELIM-NEXT: lw ra, 12(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 16 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va1_caller: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -16 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: lui a0, 261888 +; RV32I-WITHFP-NEXT: mv a3, a0 +; RV32I-WITHFP-NEXT: lui a0, %hi(va1) +; RV32I-WITHFP-NEXT: addi a0, a0, %lo(va1) +; RV32I-WITHFP-NEXT: addi a4, zero, 2 +; RV32I-WITHFP-NEXT: mv a2, zero +; RV32I-WITHFP-NEXT: jalr a0 +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 16 +; RV32I-WITHFP-NEXT: ret %1 = call i32 (i8*, ...) @va1(i8* undef, double 1.0, i32 2) ret void } @@ -147,27 +303,66 @@ define double @va2(i8 *%fmt, ...) nounwind { ; RV32I-LABEL: va2: ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -48 -; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 -; RV32I-NEXT: sw a7, 28(s0) -; RV32I-NEXT: sw a6, 24(s0) -; RV32I-NEXT: sw a5, 20(s0) -; RV32I-NEXT: sw a4, 16(s0) -; RV32I-NEXT: sw a3, 12(s0) -; RV32I-NEXT: sw a2, 8(s0) -; RV32I-NEXT: sw a1, 4(s0) -; RV32I-NEXT: addi a0, s0, 19 -; RV32I-NEXT: sw a0, -12(s0) -; RV32I-NEXT: addi a0, s0, 11 +; RV32I-NEXT: sw a7, 44(sp) +; RV32I-NEXT: sw a6, 40(sp) +; RV32I-NEXT: sw a5, 36(sp) +; RV32I-NEXT: sw a4, 32(sp) +; RV32I-NEXT: sw a3, 28(sp) +; RV32I-NEXT: sw a2, 24(sp) +; RV32I-NEXT: sw a1, 20(sp) +; RV32I-NEXT: addi a0, sp, 35 +; RV32I-NEXT: sw a0, 12(sp) +; RV32I-NEXT: addi a0, sp, 27 ; RV32I-NEXT: andi a1, a0, -8 ; RV32I-NEXT: lw a0, 0(a1) ; RV32I-NEXT: ori a1, a1, 4 ; RV32I-NEXT: lw a1, 0(a1) -; RV32I-NEXT: lw s0, 8(sp) -; RV32I-NEXT: lw ra, 12(sp) ; RV32I-NEXT: addi sp, sp, 48 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va2: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -48 +; RV32I-FPELIM-NEXT: sw a7, 44(sp) +; RV32I-FPELIM-NEXT: sw a6, 40(sp) +; RV32I-FPELIM-NEXT: sw a5, 36(sp) +; RV32I-FPELIM-NEXT: sw a4, 32(sp) +; RV32I-FPELIM-NEXT: sw a3, 28(sp) +; RV32I-FPELIM-NEXT: sw a2, 24(sp) +; RV32I-FPELIM-NEXT: sw a1, 20(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 35 +; RV32I-FPELIM-NEXT: sw a0, 12(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 27 +; RV32I-FPELIM-NEXT: andi a1, a0, -8 +; RV32I-FPELIM-NEXT: lw a0, 0(a1) +; RV32I-FPELIM-NEXT: ori a1, a1, 4 +; RV32I-FPELIM-NEXT: lw a1, 0(a1) +; RV32I-FPELIM-NEXT: addi sp, sp, 48 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va2: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: sw a7, 28(s0) +; RV32I-WITHFP-NEXT: sw a6, 24(s0) +; RV32I-WITHFP-NEXT: sw a5, 20(s0) +; RV32I-WITHFP-NEXT: sw a4, 16(s0) +; RV32I-WITHFP-NEXT: sw a3, 12(s0) +; RV32I-WITHFP-NEXT: sw a2, 8(s0) +; RV32I-WITHFP-NEXT: sw a1, 4(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 19 +; RV32I-WITHFP-NEXT: sw a0, -12(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 11 +; RV32I-WITHFP-NEXT: andi a1, a0, -8 +; RV32I-WITHFP-NEXT: lw a0, 0(a1) +; RV32I-WITHFP-NEXT: ori a1, a1, 4 +; RV32I-WITHFP-NEXT: lw a1, 0(a1) +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret %va = alloca i8*, align 4 %1 = bitcast i8** %va to i8* call void @llvm.va_start(i8* %1) @@ -188,28 +383,69 @@ define double @va2_va_arg(i8 *%fmt, ...) nounwind { ; RV32I-LABEL: va2_va_arg: ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -48 -; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 -; RV32I-NEXT: sw a7, 28(s0) -; RV32I-NEXT: sw a6, 24(s0) -; RV32I-NEXT: sw a5, 20(s0) -; RV32I-NEXT: sw a4, 16(s0) -; RV32I-NEXT: sw a3, 12(s0) -; RV32I-NEXT: sw a2, 8(s0) -; RV32I-NEXT: sw a1, 4(s0) -; RV32I-NEXT: addi a0, s0, 11 +; RV32I-NEXT: sw a7, 44(sp) +; RV32I-NEXT: sw a6, 40(sp) +; RV32I-NEXT: sw a5, 36(sp) +; RV32I-NEXT: sw a4, 32(sp) +; RV32I-NEXT: sw a3, 28(sp) +; RV32I-NEXT: sw a2, 24(sp) +; RV32I-NEXT: sw a1, 20(sp) +; RV32I-NEXT: addi a0, sp, 27 ; RV32I-NEXT: andi a0, a0, -8 ; RV32I-NEXT: ori a1, a0, 4 -; RV32I-NEXT: sw a1, -12(s0) +; RV32I-NEXT: sw a1, 12(sp) ; RV32I-NEXT: lw a0, 0(a0) ; RV32I-NEXT: addi a2, a1, 4 -; RV32I-NEXT: sw a2, -12(s0) +; RV32I-NEXT: sw a2, 12(sp) ; RV32I-NEXT: lw a1, 0(a1) -; RV32I-NEXT: lw s0, 8(sp) -; RV32I-NEXT: lw ra, 12(sp) ; RV32I-NEXT: addi sp, sp, 48 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va2_va_arg: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -48 +; RV32I-FPELIM-NEXT: sw a7, 44(sp) +; RV32I-FPELIM-NEXT: sw a6, 40(sp) +; RV32I-FPELIM-NEXT: sw a5, 36(sp) +; RV32I-FPELIM-NEXT: sw a4, 32(sp) +; RV32I-FPELIM-NEXT: sw a3, 28(sp) +; RV32I-FPELIM-NEXT: sw a2, 24(sp) +; RV32I-FPELIM-NEXT: sw a1, 20(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 27 +; RV32I-FPELIM-NEXT: andi a0, a0, -8 +; RV32I-FPELIM-NEXT: ori a1, a0, 4 +; RV32I-FPELIM-NEXT: sw a1, 12(sp) +; RV32I-FPELIM-NEXT: lw a0, 0(a0) +; RV32I-FPELIM-NEXT: addi a2, a1, 4 +; RV32I-FPELIM-NEXT: sw a2, 12(sp) +; RV32I-FPELIM-NEXT: lw a1, 0(a1) +; RV32I-FPELIM-NEXT: addi sp, sp, 48 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va2_va_arg: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: sw a7, 28(s0) +; RV32I-WITHFP-NEXT: sw a6, 24(s0) +; RV32I-WITHFP-NEXT: sw a5, 20(s0) +; RV32I-WITHFP-NEXT: sw a4, 16(s0) +; RV32I-WITHFP-NEXT: sw a3, 12(s0) +; RV32I-WITHFP-NEXT: sw a2, 8(s0) +; RV32I-WITHFP-NEXT: sw a1, 4(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 11 +; RV32I-WITHFP-NEXT: andi a0, a0, -8 +; RV32I-WITHFP-NEXT: ori a1, a0, 4 +; RV32I-WITHFP-NEXT: sw a1, -12(s0) +; RV32I-WITHFP-NEXT: lw a0, 0(a0) +; RV32I-WITHFP-NEXT: addi a2, a1, 4 +; RV32I-WITHFP-NEXT: sw a2, -12(s0) +; RV32I-WITHFP-NEXT: lw a1, 0(a1) +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret %va = alloca i8*, align 4 %1 = bitcast i8** %va to i8* call void @llvm.va_start(i8* %1) @@ -223,18 +459,45 @@ define void @va2_caller() nounwind { ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -16 ; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 ; RV32I-NEXT: lui a0, 261888 ; RV32I-NEXT: mv a3, a0 ; RV32I-NEXT: lui a0, %hi(va2) ; RV32I-NEXT: addi a0, a0, %lo(va2) ; RV32I-NEXT: mv a2, zero ; RV32I-NEXT: jalr a0 -; RV32I-NEXT: lw s0, 8(sp) ; RV32I-NEXT: lw ra, 12(sp) ; RV32I-NEXT: addi sp, sp, 16 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va2_caller: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -16 +; RV32I-FPELIM-NEXT: sw ra, 12(sp) +; RV32I-FPELIM-NEXT: lui a0, 261888 +; RV32I-FPELIM-NEXT: mv a3, a0 +; RV32I-FPELIM-NEXT: lui a0, %hi(va2) +; RV32I-FPELIM-NEXT: addi a0, a0, %lo(va2) +; RV32I-FPELIM-NEXT: mv a2, zero +; RV32I-FPELIM-NEXT: jalr a0 +; RV32I-FPELIM-NEXT: lw ra, 12(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 16 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va2_caller: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -16 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: lui a0, 261888 +; RV32I-WITHFP-NEXT: mv a3, a0 +; RV32I-WITHFP-NEXT: lui a0, %hi(va2) +; RV32I-WITHFP-NEXT: addi a0, a0, %lo(va2) +; RV32I-WITHFP-NEXT: mv a2, zero +; RV32I-WITHFP-NEXT: jalr a0 +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 16 +; RV32I-WITHFP-NEXT: ret %1 = call double (i8*, ...) @va2(i8* undef, double 1.000000e+00) ret void } @@ -245,20 +508,18 @@ define void @va2_caller() nounwind { define double @va3(i32 %a, double %b, ...) nounwind { ; RV32I-LABEL: va3: ; RV32I: # %bb.0: -; RV32I-NEXT: addi sp, sp, -48 -; RV32I-NEXT: sw ra, 20(sp) -; RV32I-NEXT: sw s0, 16(sp) -; RV32I-NEXT: addi s0, sp, 24 -; RV32I-NEXT: sw a7, 20(s0) -; RV32I-NEXT: sw a6, 16(s0) -; RV32I-NEXT: sw a5, 12(s0) -; RV32I-NEXT: sw a4, 8(s0) -; RV32I-NEXT: sw a3, 4(s0) -; RV32I-NEXT: addi a0, s0, 19 -; RV32I-NEXT: sw a0, -12(s0) +; RV32I-NEXT: addi sp, sp, -32 +; RV32I-NEXT: sw ra, 4(sp) +; RV32I-NEXT: sw a7, 28(sp) +; RV32I-NEXT: sw a6, 24(sp) +; RV32I-NEXT: sw a5, 20(sp) +; RV32I-NEXT: sw a4, 16(sp) +; RV32I-NEXT: sw a3, 12(sp) +; RV32I-NEXT: addi a0, sp, 27 +; RV32I-NEXT: sw a0, 0(sp) ; RV32I-NEXT: lui a0, %hi(__adddf3) ; RV32I-NEXT: addi a5, a0, %lo(__adddf3) -; RV32I-NEXT: addi a0, s0, 11 +; RV32I-NEXT: addi a0, sp, 19 ; RV32I-NEXT: andi a0, a0, -8 ; RV32I-NEXT: lw a4, 0(a0) ; RV32I-NEXT: ori a0, a0, 4 @@ -267,10 +528,63 @@ define double @va3(i32 %a, double %b, ...) nounwind { ; RV32I-NEXT: mv a1, a2 ; RV32I-NEXT: mv a2, a4 ; RV32I-NEXT: jalr a5 -; RV32I-NEXT: lw s0, 16(sp) -; RV32I-NEXT: lw ra, 20(sp) -; RV32I-NEXT: addi sp, sp, 48 +; RV32I-NEXT: lw ra, 4(sp) +; RV32I-NEXT: addi sp, sp, 32 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va3: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -32 +; RV32I-FPELIM-NEXT: sw ra, 4(sp) +; RV32I-FPELIM-NEXT: sw a7, 28(sp) +; RV32I-FPELIM-NEXT: sw a6, 24(sp) +; RV32I-FPELIM-NEXT: sw a5, 20(sp) +; RV32I-FPELIM-NEXT: sw a4, 16(sp) +; RV32I-FPELIM-NEXT: sw a3, 12(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 27 +; RV32I-FPELIM-NEXT: sw a0, 0(sp) +; RV32I-FPELIM-NEXT: lui a0, %hi(__adddf3) +; RV32I-FPELIM-NEXT: addi a5, a0, %lo(__adddf3) +; RV32I-FPELIM-NEXT: addi a0, sp, 19 +; RV32I-FPELIM-NEXT: andi a0, a0, -8 +; RV32I-FPELIM-NEXT: lw a4, 0(a0) +; RV32I-FPELIM-NEXT: ori a0, a0, 4 +; RV32I-FPELIM-NEXT: lw a3, 0(a0) +; RV32I-FPELIM-NEXT: mv a0, a1 +; RV32I-FPELIM-NEXT: mv a1, a2 +; RV32I-FPELIM-NEXT: mv a2, a4 +; RV32I-FPELIM-NEXT: jalr a5 +; RV32I-FPELIM-NEXT: lw ra, 4(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 32 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va3: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 20(sp) +; RV32I-WITHFP-NEXT: sw s0, 16(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 24 +; RV32I-WITHFP-NEXT: sw a7, 20(s0) +; RV32I-WITHFP-NEXT: sw a6, 16(s0) +; RV32I-WITHFP-NEXT: sw a5, 12(s0) +; RV32I-WITHFP-NEXT: sw a4, 8(s0) +; RV32I-WITHFP-NEXT: sw a3, 4(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 19 +; RV32I-WITHFP-NEXT: sw a0, -12(s0) +; RV32I-WITHFP-NEXT: lui a0, %hi(__adddf3) +; RV32I-WITHFP-NEXT: addi a5, a0, %lo(__adddf3) +; RV32I-WITHFP-NEXT: addi a0, s0, 11 +; RV32I-WITHFP-NEXT: andi a0, a0, -8 +; RV32I-WITHFP-NEXT: lw a4, 0(a0) +; RV32I-WITHFP-NEXT: ori a0, a0, 4 +; RV32I-WITHFP-NEXT: lw a3, 0(a0) +; RV32I-WITHFP-NEXT: mv a0, a1 +; RV32I-WITHFP-NEXT: mv a1, a2 +; RV32I-WITHFP-NEXT: mv a2, a4 +; RV32I-WITHFP-NEXT: jalr a5 +; RV32I-WITHFP-NEXT: lw s0, 16(sp) +; RV32I-WITHFP-NEXT: lw ra, 20(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret %va = alloca i8*, align 4 %1 = bitcast i8** %va to i8* call void @llvm.va_start(i8* %1) @@ -291,22 +605,20 @@ define double @va3(i32 %a, double %b, ...) nounwind { define double @va3_va_arg(i32 %a, double %b, ...) nounwind { ; RV32I-LABEL: va3_va_arg: ; RV32I: # %bb.0: -; RV32I-NEXT: addi sp, sp, -48 -; RV32I-NEXT: sw ra, 20(sp) -; RV32I-NEXT: sw s0, 16(sp) -; RV32I-NEXT: addi s0, sp, 24 -; RV32I-NEXT: sw a7, 20(s0) -; RV32I-NEXT: sw a6, 16(s0) -; RV32I-NEXT: sw a5, 12(s0) -; RV32I-NEXT: sw a4, 8(s0) -; RV32I-NEXT: sw a3, 4(s0) -; RV32I-NEXT: addi a0, s0, 11 +; RV32I-NEXT: addi sp, sp, -32 +; RV32I-NEXT: sw ra, 4(sp) +; RV32I-NEXT: sw a7, 28(sp) +; RV32I-NEXT: sw a6, 24(sp) +; RV32I-NEXT: sw a5, 20(sp) +; RV32I-NEXT: sw a4, 16(sp) +; RV32I-NEXT: sw a3, 12(sp) +; RV32I-NEXT: addi a0, sp, 19 ; RV32I-NEXT: andi a0, a0, -8 ; RV32I-NEXT: ori a3, a0, 4 -; RV32I-NEXT: sw a3, -12(s0) +; RV32I-NEXT: sw a3, 0(sp) ; RV32I-NEXT: lw a4, 0(a0) ; RV32I-NEXT: addi a0, a3, 4 -; RV32I-NEXT: sw a0, -12(s0) +; RV32I-NEXT: sw a0, 0(sp) ; RV32I-NEXT: lui a0, %hi(__adddf3) ; RV32I-NEXT: addi a5, a0, %lo(__adddf3) ; RV32I-NEXT: lw a3, 0(a3) @@ -314,10 +626,65 @@ define double @va3_va_arg(i32 %a, double %b, ...) nounwind { ; RV32I-NEXT: mv a1, a2 ; RV32I-NEXT: mv a2, a4 ; RV32I-NEXT: jalr a5 -; RV32I-NEXT: lw s0, 16(sp) -; RV32I-NEXT: lw ra, 20(sp) -; RV32I-NEXT: addi sp, sp, 48 +; RV32I-NEXT: lw ra, 4(sp) +; RV32I-NEXT: addi sp, sp, 32 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va3_va_arg: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -32 +; RV32I-FPELIM-NEXT: sw ra, 4(sp) +; RV32I-FPELIM-NEXT: sw a7, 28(sp) +; RV32I-FPELIM-NEXT: sw a6, 24(sp) +; RV32I-FPELIM-NEXT: sw a5, 20(sp) +; RV32I-FPELIM-NEXT: sw a4, 16(sp) +; RV32I-FPELIM-NEXT: sw a3, 12(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 19 +; RV32I-FPELIM-NEXT: andi a0, a0, -8 +; RV32I-FPELIM-NEXT: ori a3, a0, 4 +; RV32I-FPELIM-NEXT: sw a3, 0(sp) +; RV32I-FPELIM-NEXT: lw a4, 0(a0) +; RV32I-FPELIM-NEXT: addi a0, a3, 4 +; RV32I-FPELIM-NEXT: sw a0, 0(sp) +; RV32I-FPELIM-NEXT: lui a0, %hi(__adddf3) +; RV32I-FPELIM-NEXT: addi a5, a0, %lo(__adddf3) +; RV32I-FPELIM-NEXT: lw a3, 0(a3) +; RV32I-FPELIM-NEXT: mv a0, a1 +; RV32I-FPELIM-NEXT: mv a1, a2 +; RV32I-FPELIM-NEXT: mv a2, a4 +; RV32I-FPELIM-NEXT: jalr a5 +; RV32I-FPELIM-NEXT: lw ra, 4(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 32 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va3_va_arg: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 20(sp) +; RV32I-WITHFP-NEXT: sw s0, 16(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 24 +; RV32I-WITHFP-NEXT: sw a7, 20(s0) +; RV32I-WITHFP-NEXT: sw a6, 16(s0) +; RV32I-WITHFP-NEXT: sw a5, 12(s0) +; RV32I-WITHFP-NEXT: sw a4, 8(s0) +; RV32I-WITHFP-NEXT: sw a3, 4(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 11 +; RV32I-WITHFP-NEXT: andi a0, a0, -8 +; RV32I-WITHFP-NEXT: ori a3, a0, 4 +; RV32I-WITHFP-NEXT: sw a3, -12(s0) +; RV32I-WITHFP-NEXT: lw a4, 0(a0) +; RV32I-WITHFP-NEXT: addi a0, a3, 4 +; RV32I-WITHFP-NEXT: sw a0, -12(s0) +; RV32I-WITHFP-NEXT: lui a0, %hi(__adddf3) +; RV32I-WITHFP-NEXT: addi a5, a0, %lo(__adddf3) +; RV32I-WITHFP-NEXT: lw a3, 0(a3) +; RV32I-WITHFP-NEXT: mv a0, a1 +; RV32I-WITHFP-NEXT: mv a1, a2 +; RV32I-WITHFP-NEXT: mv a2, a4 +; RV32I-WITHFP-NEXT: jalr a5 +; RV32I-WITHFP-NEXT: lw s0, 16(sp) +; RV32I-WITHFP-NEXT: lw ra, 20(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret %va = alloca i8*, align 4 %1 = bitcast i8** %va to i8* call void @llvm.va_start(i8* %1) @@ -332,8 +699,6 @@ define void @va3_caller() nounwind { ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -16 ; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 ; RV32I-NEXT: lui a0, 261888 ; RV32I-NEXT: mv a2, a0 ; RV32I-NEXT: lui a0, 262144 @@ -344,10 +709,47 @@ define void @va3_caller() nounwind { ; RV32I-NEXT: mv a1, zero ; RV32I-NEXT: mv a4, zero ; RV32I-NEXT: jalr a3 -; RV32I-NEXT: lw s0, 8(sp) ; RV32I-NEXT: lw ra, 12(sp) ; RV32I-NEXT: addi sp, sp, 16 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va3_caller: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -16 +; RV32I-FPELIM-NEXT: sw ra, 12(sp) +; RV32I-FPELIM-NEXT: lui a0, 261888 +; RV32I-FPELIM-NEXT: mv a2, a0 +; RV32I-FPELIM-NEXT: lui a0, 262144 +; RV32I-FPELIM-NEXT: mv a5, a0 +; RV32I-FPELIM-NEXT: lui a0, %hi(va3) +; RV32I-FPELIM-NEXT: addi a3, a0, %lo(va3) +; RV32I-FPELIM-NEXT: addi a0, zero, 2 +; RV32I-FPELIM-NEXT: mv a1, zero +; RV32I-FPELIM-NEXT: mv a4, zero +; RV32I-FPELIM-NEXT: jalr a3 +; RV32I-FPELIM-NEXT: lw ra, 12(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 16 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va3_caller: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -16 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: lui a0, 261888 +; RV32I-WITHFP-NEXT: mv a2, a0 +; RV32I-WITHFP-NEXT: lui a0, 262144 +; RV32I-WITHFP-NEXT: mv a5, a0 +; RV32I-WITHFP-NEXT: lui a0, %hi(va3) +; RV32I-WITHFP-NEXT: addi a3, a0, %lo(va3) +; RV32I-WITHFP-NEXT: addi a0, zero, 2 +; RV32I-WITHFP-NEXT: mv a1, zero +; RV32I-WITHFP-NEXT: mv a4, zero +; RV32I-WITHFP-NEXT: jalr a3 +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 16 +; RV32I-WITHFP-NEXT: ret %1 = call double (i32, double, ...) @va3(i32 2, double 1.000000e+00, double 2.000000e+00) ret void } @@ -357,49 +759,134 @@ declare void @llvm.va_copy(i8*, i8*) define i32 @va4_va_copy(i32 %argno, ...) nounwind { ; RV32I-LABEL: va4_va_copy: ; RV32I: # %bb.0: -; RV32I-NEXT: addi sp, sp, -64 -; RV32I-NEXT: sw ra, 28(sp) -; RV32I-NEXT: sw s0, 24(sp) -; RV32I-NEXT: sw s1, 20(sp) -; RV32I-NEXT: addi s0, sp, 32 -; RV32I-NEXT: sw a1, 4(s0) -; RV32I-NEXT: sw a7, 28(s0) -; RV32I-NEXT: sw a6, 24(s0) -; RV32I-NEXT: sw a5, 20(s0) -; RV32I-NEXT: sw a4, 16(s0) -; RV32I-NEXT: sw a3, 12(s0) -; RV32I-NEXT: sw a2, 8(s0) -; RV32I-NEXT: addi a0, s0, 8 -; RV32I-NEXT: sw a0, -16(s0) -; RV32I-NEXT: sw a0, -20(s0) -; RV32I-NEXT: lw s1, 4(s0) +; RV32I-NEXT: addi sp, sp, -48 +; RV32I-NEXT: sw ra, 12(sp) +; RV32I-NEXT: sw s1, 8(sp) +; RV32I-NEXT: sw a1, 20(sp) +; RV32I-NEXT: sw a7, 44(sp) +; RV32I-NEXT: sw a6, 40(sp) +; RV32I-NEXT: sw a5, 36(sp) +; RV32I-NEXT: sw a4, 32(sp) +; RV32I-NEXT: sw a3, 28(sp) +; RV32I-NEXT: sw a2, 24(sp) +; RV32I-NEXT: addi a0, sp, 24 +; RV32I-NEXT: sw a0, 4(sp) +; RV32I-NEXT: sw a0, 0(sp) +; RV32I-NEXT: lw s1, 20(sp) ; RV32I-NEXT: lui a1, %hi(notdead) ; RV32I-NEXT: addi a1, a1, %lo(notdead) ; RV32I-NEXT: jalr a1 -; RV32I-NEXT: lw a0, -16(s0) +; RV32I-NEXT: lw a0, 4(sp) ; RV32I-NEXT: addi a0, a0, 3 ; RV32I-NEXT: andi a0, a0, -4 ; RV32I-NEXT: addi a1, a0, 4 -; RV32I-NEXT: sw a1, -16(s0) +; RV32I-NEXT: sw a1, 4(sp) ; RV32I-NEXT: lw a1, 0(a0) ; RV32I-NEXT: addi a0, a0, 7 ; RV32I-NEXT: andi a0, a0, -4 ; RV32I-NEXT: addi a2, a0, 4 -; RV32I-NEXT: sw a2, -16(s0) +; RV32I-NEXT: sw a2, 4(sp) ; RV32I-NEXT: lw a2, 0(a0) ; RV32I-NEXT: addi a0, a0, 7 ; RV32I-NEXT: andi a0, a0, -4 ; RV32I-NEXT: addi a3, a0, 4 -; RV32I-NEXT: sw a3, -16(s0) +; RV32I-NEXT: sw a3, 4(sp) ; RV32I-NEXT: add a1, a1, s1 ; RV32I-NEXT: add a1, a1, a2 ; RV32I-NEXT: lw a0, 0(a0) ; RV32I-NEXT: add a0, a1, a0 -; RV32I-NEXT: lw s1, 20(sp) -; RV32I-NEXT: lw s0, 24(sp) -; RV32I-NEXT: lw ra, 28(sp) -; RV32I-NEXT: addi sp, sp, 64 +; RV32I-NEXT: lw s1, 8(sp) +; RV32I-NEXT: lw ra, 12(sp) +; RV32I-NEXT: addi sp, sp, 48 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va4_va_copy: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -48 +; RV32I-FPELIM-NEXT: sw ra, 12(sp) +; RV32I-FPELIM-NEXT: sw s1, 8(sp) +; RV32I-FPELIM-NEXT: sw a1, 20(sp) +; RV32I-FPELIM-NEXT: sw a7, 44(sp) +; RV32I-FPELIM-NEXT: sw a6, 40(sp) +; RV32I-FPELIM-NEXT: sw a5, 36(sp) +; RV32I-FPELIM-NEXT: sw a4, 32(sp) +; RV32I-FPELIM-NEXT: sw a3, 28(sp) +; RV32I-FPELIM-NEXT: sw a2, 24(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 24 +; RV32I-FPELIM-NEXT: sw a0, 4(sp) +; RV32I-FPELIM-NEXT: sw a0, 0(sp) +; RV32I-FPELIM-NEXT: lw s1, 20(sp) +; RV32I-FPELIM-NEXT: lui a1, %hi(notdead) +; RV32I-FPELIM-NEXT: addi a1, a1, %lo(notdead) +; RV32I-FPELIM-NEXT: jalr a1 +; RV32I-FPELIM-NEXT: lw a0, 4(sp) +; RV32I-FPELIM-NEXT: addi a0, a0, 3 +; RV32I-FPELIM-NEXT: andi a0, a0, -4 +; RV32I-FPELIM-NEXT: addi a1, a0, 4 +; RV32I-FPELIM-NEXT: sw a1, 4(sp) +; RV32I-FPELIM-NEXT: lw a1, 0(a0) +; RV32I-FPELIM-NEXT: addi a0, a0, 7 +; RV32I-FPELIM-NEXT: andi a0, a0, -4 +; RV32I-FPELIM-NEXT: addi a2, a0, 4 +; RV32I-FPELIM-NEXT: sw a2, 4(sp) +; RV32I-FPELIM-NEXT: lw a2, 0(a0) +; RV32I-FPELIM-NEXT: addi a0, a0, 7 +; RV32I-FPELIM-NEXT: andi a0, a0, -4 +; RV32I-FPELIM-NEXT: addi a3, a0, 4 +; RV32I-FPELIM-NEXT: sw a3, 4(sp) +; RV32I-FPELIM-NEXT: add a1, a1, s1 +; RV32I-FPELIM-NEXT: add a1, a1, a2 +; RV32I-FPELIM-NEXT: lw a0, 0(a0) +; RV32I-FPELIM-NEXT: add a0, a1, a0 +; RV32I-FPELIM-NEXT: lw s1, 8(sp) +; RV32I-FPELIM-NEXT: lw ra, 12(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 48 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va4_va_copy: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -64 +; RV32I-WITHFP-NEXT: sw ra, 28(sp) +; RV32I-WITHFP-NEXT: sw s0, 24(sp) +; RV32I-WITHFP-NEXT: sw s1, 20(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 32 +; RV32I-WITHFP-NEXT: sw a1, 4(s0) +; RV32I-WITHFP-NEXT: sw a7, 28(s0) +; RV32I-WITHFP-NEXT: sw a6, 24(s0) +; RV32I-WITHFP-NEXT: sw a5, 20(s0) +; RV32I-WITHFP-NEXT: sw a4, 16(s0) +; RV32I-WITHFP-NEXT: sw a3, 12(s0) +; RV32I-WITHFP-NEXT: sw a2, 8(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 8 +; RV32I-WITHFP-NEXT: sw a0, -16(s0) +; RV32I-WITHFP-NEXT: sw a0, -20(s0) +; RV32I-WITHFP-NEXT: lw s1, 4(s0) +; RV32I-WITHFP-NEXT: lui a1, %hi(notdead) +; RV32I-WITHFP-NEXT: addi a1, a1, %lo(notdead) +; RV32I-WITHFP-NEXT: jalr a1 +; RV32I-WITHFP-NEXT: lw a0, -16(s0) +; RV32I-WITHFP-NEXT: addi a0, a0, 3 +; RV32I-WITHFP-NEXT: andi a0, a0, -4 +; RV32I-WITHFP-NEXT: addi a1, a0, 4 +; RV32I-WITHFP-NEXT: sw a1, -16(s0) +; RV32I-WITHFP-NEXT: lw a1, 0(a0) +; RV32I-WITHFP-NEXT: addi a0, a0, 7 +; RV32I-WITHFP-NEXT: andi a0, a0, -4 +; RV32I-WITHFP-NEXT: addi a2, a0, 4 +; RV32I-WITHFP-NEXT: sw a2, -16(s0) +; RV32I-WITHFP-NEXT: lw a2, 0(a0) +; RV32I-WITHFP-NEXT: addi a0, a0, 7 +; RV32I-WITHFP-NEXT: andi a0, a0, -4 +; RV32I-WITHFP-NEXT: addi a3, a0, 4 +; RV32I-WITHFP-NEXT: sw a3, -16(s0) +; RV32I-WITHFP-NEXT: add a1, a1, s1 +; RV32I-WITHFP-NEXT: add a1, a1, a2 +; RV32I-WITHFP-NEXT: lw a0, 0(a0) +; RV32I-WITHFP-NEXT: add a0, a1, a0 +; RV32I-WITHFP-NEXT: lw s1, 20(sp) +; RV32I-WITHFP-NEXT: lw s0, 24(sp) +; RV32I-WITHFP-NEXT: lw ra, 28(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 64 +; RV32I-WITHFP-NEXT: ret %vargs = alloca i8*, align 4 %wargs = alloca i8*, align 4 %1 = bitcast i8** %vargs to i8* @@ -425,22 +912,49 @@ define i32 @va4_va_copy(i32 %argno, ...) nounwind { define i32 @va5_aligned_stack_callee(i32 %a, ...) nounwind { ; RV32I-LABEL: va5_aligned_stack_callee: ; RV32I: # %bb.0: -; RV32I-NEXT: addi sp, sp, -48 -; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 -; RV32I-NEXT: sw a7, 28(s0) -; RV32I-NEXT: sw a6, 24(s0) -; RV32I-NEXT: sw a5, 20(s0) -; RV32I-NEXT: sw a4, 16(s0) -; RV32I-NEXT: sw a3, 12(s0) -; RV32I-NEXT: sw a2, 8(s0) -; RV32I-NEXT: sw a1, 4(s0) +; RV32I-NEXT: addi sp, sp, -32 +; RV32I-NEXT: sw a7, 28(sp) +; RV32I-NEXT: sw a6, 24(sp) +; RV32I-NEXT: sw a5, 20(sp) +; RV32I-NEXT: sw a4, 16(sp) +; RV32I-NEXT: sw a3, 12(sp) +; RV32I-NEXT: sw a2, 8(sp) +; RV32I-NEXT: sw a1, 4(sp) ; RV32I-NEXT: addi a0, zero, 1 -; RV32I-NEXT: lw s0, 8(sp) -; RV32I-NEXT: lw ra, 12(sp) -; RV32I-NEXT: addi sp, sp, 48 +; RV32I-NEXT: addi sp, sp, 32 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va5_aligned_stack_callee: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -32 +; RV32I-FPELIM-NEXT: sw a7, 28(sp) +; RV32I-FPELIM-NEXT: sw a6, 24(sp) +; RV32I-FPELIM-NEXT: sw a5, 20(sp) +; RV32I-FPELIM-NEXT: sw a4, 16(sp) +; RV32I-FPELIM-NEXT: sw a3, 12(sp) +; RV32I-FPELIM-NEXT: sw a2, 8(sp) +; RV32I-FPELIM-NEXT: sw a1, 4(sp) +; RV32I-FPELIM-NEXT: addi a0, zero, 1 +; RV32I-FPELIM-NEXT: addi sp, sp, 32 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va5_aligned_stack_callee: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: sw a7, 28(s0) +; RV32I-WITHFP-NEXT: sw a6, 24(s0) +; RV32I-WITHFP-NEXT: sw a5, 20(s0) +; RV32I-WITHFP-NEXT: sw a4, 16(s0) +; RV32I-WITHFP-NEXT: sw a3, 12(s0) +; RV32I-WITHFP-NEXT: sw a2, 8(s0) +; RV32I-WITHFP-NEXT: sw a1, 4(s0) +; RV32I-WITHFP-NEXT: addi a0, zero, 1 +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret ret i32 1 } @@ -451,8 +965,6 @@ define void @va5_aligned_stack_caller() nounwind { ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -64 ; RV32I-NEXT: sw ra, 60(sp) -; RV32I-NEXT: sw s0, 56(sp) -; RV32I-NEXT: addi s0, sp, 64 ; RV32I-NEXT: addi a0, zero, 17 ; RV32I-NEXT: sw a0, 24(sp) ; RV32I-NEXT: addi a0, zero, 16 @@ -469,31 +981,122 @@ define void @va5_aligned_stack_caller() nounwind { ; RV32I-NEXT: sw a0, 0(sp) ; RV32I-NEXT: lui a0, 262153 ; RV32I-NEXT: addi a0, a0, 491 -; RV32I-NEXT: sw a0, -20(s0) +; RV32I-NEXT: sw a0, 44(sp) ; RV32I-NEXT: lui a0, 545260 ; RV32I-NEXT: addi a0, a0, -1967 -; RV32I-NEXT: sw a0, -24(s0) +; RV32I-NEXT: sw a0, 40(sp) ; RV32I-NEXT: lui a0, 964690 ; RV32I-NEXT: addi a0, a0, -328 -; RV32I-NEXT: sw a0, -28(s0) +; RV32I-NEXT: sw a0, 36(sp) ; RV32I-NEXT: lui a0, 335544 ; RV32I-NEXT: addi a0, a0, 1311 -; RV32I-NEXT: sw a0, -32(s0) +; RV32I-NEXT: sw a0, 32(sp) ; RV32I-NEXT: lui a0, 688509 ; RV32I-NEXT: addi a6, a0, -2048 ; RV32I-NEXT: lui a0, %hi(va5_aligned_stack_callee) ; RV32I-NEXT: addi a5, a0, %lo(va5_aligned_stack_callee) ; RV32I-NEXT: addi a0, zero, 1 ; RV32I-NEXT: addi a1, zero, 11 -; RV32I-NEXT: addi a2, s0, -32 +; RV32I-NEXT: addi a2, sp, 32 ; RV32I-NEXT: addi a3, zero, 12 ; RV32I-NEXT: addi a4, zero, 13 ; RV32I-NEXT: addi a7, zero, 4 ; RV32I-NEXT: jalr a5 -; RV32I-NEXT: lw s0, 56(sp) ; RV32I-NEXT: lw ra, 60(sp) ; RV32I-NEXT: addi sp, sp, 64 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va5_aligned_stack_caller: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -64 +; RV32I-FPELIM-NEXT: sw ra, 60(sp) +; RV32I-FPELIM-NEXT: addi a0, zero, 17 +; RV32I-FPELIM-NEXT: sw a0, 24(sp) +; RV32I-FPELIM-NEXT: addi a0, zero, 16 +; RV32I-FPELIM-NEXT: sw a0, 20(sp) +; RV32I-FPELIM-NEXT: addi a0, zero, 15 +; RV32I-FPELIM-NEXT: sw a0, 16(sp) +; RV32I-FPELIM-NEXT: lui a0, 262236 +; RV32I-FPELIM-NEXT: addi a0, a0, 655 +; RV32I-FPELIM-NEXT: sw a0, 12(sp) +; RV32I-FPELIM-NEXT: lui a0, 377487 +; RV32I-FPELIM-NEXT: addi a0, a0, 1475 +; RV32I-FPELIM-NEXT: sw a0, 8(sp) +; RV32I-FPELIM-NEXT: addi a0, zero, 14 +; RV32I-FPELIM-NEXT: sw a0, 0(sp) +; RV32I-FPELIM-NEXT: lui a0, 262153 +; RV32I-FPELIM-NEXT: addi a0, a0, 491 +; RV32I-FPELIM-NEXT: sw a0, 44(sp) +; RV32I-FPELIM-NEXT: lui a0, 545260 +; RV32I-FPELIM-NEXT: addi a0, a0, -1967 +; RV32I-FPELIM-NEXT: sw a0, 40(sp) +; RV32I-FPELIM-NEXT: lui a0, 964690 +; RV32I-FPELIM-NEXT: addi a0, a0, -328 +; RV32I-FPELIM-NEXT: sw a0, 36(sp) +; RV32I-FPELIM-NEXT: lui a0, 335544 +; RV32I-FPELIM-NEXT: addi a0, a0, 1311 +; RV32I-FPELIM-NEXT: sw a0, 32(sp) +; RV32I-FPELIM-NEXT: lui a0, 688509 +; RV32I-FPELIM-NEXT: addi a6, a0, -2048 +; RV32I-FPELIM-NEXT: lui a0, %hi(va5_aligned_stack_callee) +; RV32I-FPELIM-NEXT: addi a5, a0, %lo(va5_aligned_stack_callee) +; RV32I-FPELIM-NEXT: addi a0, zero, 1 +; RV32I-FPELIM-NEXT: addi a1, zero, 11 +; RV32I-FPELIM-NEXT: addi a2, sp, 32 +; RV32I-FPELIM-NEXT: addi a3, zero, 12 +; RV32I-FPELIM-NEXT: addi a4, zero, 13 +; RV32I-FPELIM-NEXT: addi a7, zero, 4 +; RV32I-FPELIM-NEXT: jalr a5 +; RV32I-FPELIM-NEXT: lw ra, 60(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 64 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va5_aligned_stack_caller: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -64 +; RV32I-WITHFP-NEXT: sw ra, 60(sp) +; RV32I-WITHFP-NEXT: sw s0, 56(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 64 +; RV32I-WITHFP-NEXT: addi a0, zero, 17 +; RV32I-WITHFP-NEXT: sw a0, 24(sp) +; RV32I-WITHFP-NEXT: addi a0, zero, 16 +; RV32I-WITHFP-NEXT: sw a0, 20(sp) +; RV32I-WITHFP-NEXT: addi a0, zero, 15 +; RV32I-WITHFP-NEXT: sw a0, 16(sp) +; RV32I-WITHFP-NEXT: lui a0, 262236 +; RV32I-WITHFP-NEXT: addi a0, a0, 655 +; RV32I-WITHFP-NEXT: sw a0, 12(sp) +; RV32I-WITHFP-NEXT: lui a0, 377487 +; RV32I-WITHFP-NEXT: addi a0, a0, 1475 +; RV32I-WITHFP-NEXT: sw a0, 8(sp) +; RV32I-WITHFP-NEXT: addi a0, zero, 14 +; RV32I-WITHFP-NEXT: sw a0, 0(sp) +; RV32I-WITHFP-NEXT: lui a0, 262153 +; RV32I-WITHFP-NEXT: addi a0, a0, 491 +; RV32I-WITHFP-NEXT: sw a0, -20(s0) +; RV32I-WITHFP-NEXT: lui a0, 545260 +; RV32I-WITHFP-NEXT: addi a0, a0, -1967 +; RV32I-WITHFP-NEXT: sw a0, -24(s0) +; RV32I-WITHFP-NEXT: lui a0, 964690 +; RV32I-WITHFP-NEXT: addi a0, a0, -328 +; RV32I-WITHFP-NEXT: sw a0, -28(s0) +; RV32I-WITHFP-NEXT: lui a0, 335544 +; RV32I-WITHFP-NEXT: addi a0, a0, 1311 +; RV32I-WITHFP-NEXT: sw a0, -32(s0) +; RV32I-WITHFP-NEXT: lui a0, 688509 +; RV32I-WITHFP-NEXT: addi a6, a0, -2048 +; RV32I-WITHFP-NEXT: lui a0, %hi(va5_aligned_stack_callee) +; RV32I-WITHFP-NEXT: addi a5, a0, %lo(va5_aligned_stack_callee) +; RV32I-WITHFP-NEXT: addi a0, zero, 1 +; RV32I-WITHFP-NEXT: addi a1, zero, 11 +; RV32I-WITHFP-NEXT: addi a2, s0, -32 +; RV32I-WITHFP-NEXT: addi a3, zero, 12 +; RV32I-WITHFP-NEXT: addi a4, zero, 13 +; RV32I-WITHFP-NEXT: addi a7, zero, 4 +; RV32I-WITHFP-NEXT: jalr a5 +; RV32I-WITHFP-NEXT: lw s0, 56(sp) +; RV32I-WITHFP-NEXT: lw ra, 60(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 64 +; RV32I-WITHFP-NEXT: ret %1 = call i32 (i32, ...) @va5_aligned_stack_callee(i32 1, i32 11, fp128 0xLEB851EB851EB851F400091EB851EB851, i32 12, i32 13, i64 20000000000, i32 14, double 2.720000e+00, i32 15, [2 x i32] [i32 16, i32 17]) @@ -508,24 +1111,57 @@ define i32 @va6_no_fixed_args(...) nounwind { ; RV32I-LABEL: va6_no_fixed_args: ; RV32I: # %bb.0: ; RV32I-NEXT: addi sp, sp, -48 -; RV32I-NEXT: sw ra, 12(sp) -; RV32I-NEXT: sw s0, 8(sp) -; RV32I-NEXT: addi s0, sp, 16 -; RV32I-NEXT: sw a0, 0(s0) -; RV32I-NEXT: sw a7, 28(s0) -; RV32I-NEXT: sw a6, 24(s0) -; RV32I-NEXT: sw a5, 20(s0) -; RV32I-NEXT: sw a4, 16(s0) -; RV32I-NEXT: sw a3, 12(s0) -; RV32I-NEXT: sw a2, 8(s0) -; RV32I-NEXT: sw a1, 4(s0) -; RV32I-NEXT: addi a0, s0, 4 -; RV32I-NEXT: sw a0, -12(s0) -; RV32I-NEXT: lw a0, 0(s0) -; RV32I-NEXT: lw s0, 8(sp) -; RV32I-NEXT: lw ra, 12(sp) +; RV32I-NEXT: sw a0, 16(sp) +; RV32I-NEXT: sw a7, 44(sp) +; RV32I-NEXT: sw a6, 40(sp) +; RV32I-NEXT: sw a5, 36(sp) +; RV32I-NEXT: sw a4, 32(sp) +; RV32I-NEXT: sw a3, 28(sp) +; RV32I-NEXT: sw a2, 24(sp) +; RV32I-NEXT: sw a1, 20(sp) +; RV32I-NEXT: addi a0, sp, 20 +; RV32I-NEXT: sw a0, 12(sp) +; RV32I-NEXT: lw a0, 16(sp) ; RV32I-NEXT: addi sp, sp, 48 ; RV32I-NEXT: ret +; RV32I-FPELIM-LABEL: va6_no_fixed_args: +; RV32I-FPELIM: # %bb.0: +; RV32I-FPELIM-NEXT: addi sp, sp, -48 +; RV32I-FPELIM-NEXT: sw a0, 16(sp) +; RV32I-FPELIM-NEXT: sw a7, 44(sp) +; RV32I-FPELIM-NEXT: sw a6, 40(sp) +; RV32I-FPELIM-NEXT: sw a5, 36(sp) +; RV32I-FPELIM-NEXT: sw a4, 32(sp) +; RV32I-FPELIM-NEXT: sw a3, 28(sp) +; RV32I-FPELIM-NEXT: sw a2, 24(sp) +; RV32I-FPELIM-NEXT: sw a1, 20(sp) +; RV32I-FPELIM-NEXT: addi a0, sp, 20 +; RV32I-FPELIM-NEXT: sw a0, 12(sp) +; RV32I-FPELIM-NEXT: lw a0, 16(sp) +; RV32I-FPELIM-NEXT: addi sp, sp, 48 +; RV32I-FPELIM-NEXT: ret +; +; RV32I-WITHFP-LABEL: va6_no_fixed_args: +; RV32I-WITHFP: # %bb.0: +; RV32I-WITHFP-NEXT: addi sp, sp, -48 +; RV32I-WITHFP-NEXT: sw ra, 12(sp) +; RV32I-WITHFP-NEXT: sw s0, 8(sp) +; RV32I-WITHFP-NEXT: addi s0, sp, 16 +; RV32I-WITHFP-NEXT: sw a0, 0(s0) +; RV32I-WITHFP-NEXT: sw a7, 28(s0) +; RV32I-WITHFP-NEXT: sw a6, 24(s0) +; RV32I-WITHFP-NEXT: sw a5, 20(s0) +; RV32I-WITHFP-NEXT: sw a4, 16(s0) +; RV32I-WITHFP-NEXT: sw a3, 12(s0) +; RV32I-WITHFP-NEXT: sw a2, 8(s0) +; RV32I-WITHFP-NEXT: sw a1, 4(s0) +; RV32I-WITHFP-NEXT: addi a0, s0, 4 +; RV32I-WITHFP-NEXT: sw a0, -12(s0) +; RV32I-WITHFP-NEXT: lw a0, 0(s0) +; RV32I-WITHFP-NEXT: lw s0, 8(sp) +; RV32I-WITHFP-NEXT: lw ra, 12(sp) +; RV32I-WITHFP-NEXT: addi sp, sp, 48 +; RV32I-WITHFP-NEXT: ret %va = alloca i8*, align 4 %1 = bitcast i8** %va to i8* call void @llvm.va_start(i8* %1) |

