llvm-project/llvm/test/CodeGen/RISCV/double-mem.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=riscv32 -mattr=+d -verify-machineinstrs < %s \
; RUN:   | FileCheck -check-prefix=RV32IFD %s
; RUN: llc -mtriple=riscv64 -mattr=+d -verify-machineinstrs < %s \
; RUN:   | FileCheck -check-prefix=RV64IFD %s

; Loads two doubles through %a -- element 0 and element 3 (byte offset 24) --
; and returns their sum. The assertions for both targets expect each load to
; be selected as an fld with the element offset folded into the immediate.
; The result is handed back in integer registers: on riscv32 it is stored with
; fsd and reloaded as two words into a0/a1, on riscv64 it is moved with
; fmv.x.d.
define double @fld(double *%a) nounwind {
; RV32IFD-LABEL: fld:
; RV32IFD:       # %bb.0:
; RV32IFD-NEXT:    addi sp, sp, -16
; RV32IFD-NEXT:    fld ft0, 24(a0)
; RV32IFD-NEXT:    fld ft1, 0(a0)
; RV32IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV32IFD-NEXT:    fsd ft0, 8(sp)
; RV32IFD-NEXT:    lw a0, 8(sp)
; RV32IFD-NEXT:    lw a1, 12(sp)
; RV32IFD-NEXT:    addi sp, sp, 16
; RV32IFD-NEXT:    ret
;
; RV64IFD-LABEL: fld:
; RV64IFD:       # %bb.0:
; RV64IFD-NEXT:    fld ft0, 24(a0)
; RV64IFD-NEXT:    fld ft1, 0(a0)
; RV64IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV64IFD-NEXT:    fmv.x.d a0, ft0
; RV64IFD-NEXT:    ret
  %1 = load double, double* %a
  %2 = getelementptr double, double* %a, i32 3
  %3 = load double, double* %2
; Use both loaded values in an FP op to ensure that an fld is used for each
; load, even with the soft-float ABI.
  %4 = fadd double %1, %3
  ret double %4
}

; Stores %b + %c to element 0 and to element 8 (byte offset 64) of %a.
; The assertions expect both stores to be selected as fsd from the same FP
; register, with the element offset folded into the immediate. The double
; arguments arrive in integer registers: on riscv32 each is rebuilt through a
; stack slot (two sw, one fld), on riscv64 each is moved with fmv.d.x.
define void @fsd(double *%a, double %b, double %c) nounwind {
; RV32IFD-LABEL: fsd:
; RV32IFD:       # %bb.0:
; RV32IFD-NEXT:    addi sp, sp, -16
; RV32IFD-NEXT:    sw a3, 8(sp)
; RV32IFD-NEXT:    sw a4, 12(sp)
; RV32IFD-NEXT:    fld ft0, 8(sp)
; RV32IFD-NEXT:    sw a1, 8(sp)
; RV32IFD-NEXT:    sw a2, 12(sp)
; RV32IFD-NEXT:    fld ft1, 8(sp)
; RV32IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV32IFD-NEXT:    fsd ft0, 64(a0)
; RV32IFD-NEXT:    fsd ft0, 0(a0)
; RV32IFD-NEXT:    addi sp, sp, 16
; RV32IFD-NEXT:    ret
;
; RV64IFD-LABEL: fsd:
; RV64IFD:       # %bb.0:
; RV64IFD-NEXT:    fmv.d.x ft0, a2
; RV64IFD-NEXT:    fmv.d.x ft1, a1
; RV64IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV64IFD-NEXT:    fsd ft0, 64(a0)
; RV64IFD-NEXT:    fsd ft0, 0(a0)
; RV64IFD-NEXT:    ret
; Use %b and %c in an FP op to ensure that floating point registers are used,
; even with the soft-float ABI.
  %1 = fadd double %b, %c
  store double %1, double* %a
  %2 = getelementptr double, double* %a, i32 8
  store double %1, double* %2
  ret void
}

; Check load and store to a global.
; @G is a module-level double initialised to 0.0; fld_fsd_global accesses it
; both directly and at an element offset of 9.
@G = global double 0.0

; Computes %a + %b, then performs a volatile load followed by a store of the
; sum, first at @G and then at @G plus 9 elements (byte offset 72), and
; returns the sum. The results of the two volatile loads are never used; the
; assertions still expect an fld for each of them.
; Expected addressing: the first access pair uses %lo(G) directly as the
; memory-operand offset on top of lui %hi(G); the second pair materialises the
; base with addi ..., %lo(G) and uses the immediate 72.
define double @fld_fsd_global(double %a, double %b) nounwind {
; RV32IFD-LABEL: fld_fsd_global:
; RV32IFD:       # %bb.0:
; RV32IFD-NEXT:    addi sp, sp, -16
; RV32IFD-NEXT:    sw a2, 8(sp)
; RV32IFD-NEXT:    sw a3, 12(sp)
; RV32IFD-NEXT:    fld ft0, 8(sp)
; RV32IFD-NEXT:    sw a0, 8(sp)
; RV32IFD-NEXT:    sw a1, 12(sp)
; RV32IFD-NEXT:    fld ft1, 8(sp)
; RV32IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV32IFD-NEXT:    lui a0, %hi(G)
; RV32IFD-NEXT:    fld ft1, %lo(G)(a0)
; RV32IFD-NEXT:    fsd ft0, %lo(G)(a0)
; RV32IFD-NEXT:    addi a0, a0, %lo(G)
; RV32IFD-NEXT:    fld ft1, 72(a0)
; RV32IFD-NEXT:    fsd ft0, 72(a0)
; RV32IFD-NEXT:    fsd ft0, 8(sp)
; RV32IFD-NEXT:    lw a0, 8(sp)
; RV32IFD-NEXT:    lw a1, 12(sp)
; RV32IFD-NEXT:    addi sp, sp, 16
; RV32IFD-NEXT:    ret
;
; RV64IFD-LABEL: fld_fsd_global:
; RV64IFD:       # %bb.0:
; RV64IFD-NEXT:    fmv.d.x ft0, a1
; RV64IFD-NEXT:    fmv.d.x ft1, a0
; RV64IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV64IFD-NEXT:    lui a0, %hi(G)
; RV64IFD-NEXT:    fld ft1, %lo(G)(a0)
; RV64IFD-NEXT:    fsd ft0, %lo(G)(a0)
; RV64IFD-NEXT:    addi a0, a0, %lo(G)
; RV64IFD-NEXT:    fld ft1, 72(a0)
; RV64IFD-NEXT:    fsd ft0, 72(a0)
; RV64IFD-NEXT:    fmv.x.d a0, ft0
; RV64IFD-NEXT:    ret
; Use %a and %b in an FP op to ensure that floating point registers are used,
; even with the soft-float ABI.
  %1 = fadd double %a, %b
  %2 = load volatile double, double* @G
  store double %1, double* @G
  %3 = getelementptr double, double* @G, i32 9
  %4 = load volatile double, double* %3
  store double %1, double* %3
  ret double %1
}

; Ensure that 1 is added to the high 20 bits if bit 11 of the low part is 1.
;
; The access address is the constant 3735928559 (0xDEADBEEF). Its low 12 bits
; are 0xEEF, which has bit 11 set, so as a signed 12-bit load/store immediate
; it is -273 and the base register must hold 0xDEADC000 (0xDEADB000 + 0x1000):
;   * riscv32: lui 912092 (0xDEADC) builds the base in one instruction.
;   * riscv64: lui 56 / addiw -1353 / slli 14 builds the same base value
;     ((56 * 4096 - 1353) * 16384 = 0xDEADC000).
; The function volatile-loads a double from that address, adds %a, stores the
; sum back to the same address and returns it.
define double @fld_fsd_constant(double %a) nounwind {
; RV32IFD-LABEL: fld_fsd_constant:
; RV32IFD:       # %bb.0:
; RV32IFD-NEXT:    addi sp, sp, -16
; RV32IFD-NEXT:    sw a0, 8(sp)
; RV32IFD-NEXT:    sw a1, 12(sp)
; RV32IFD-NEXT:    fld ft0, 8(sp)
; RV32IFD-NEXT:    lui a0, 912092
; RV32IFD-NEXT:    fld ft1, -273(a0)
; RV32IFD-NEXT:    fadd.d ft0, ft0, ft1
; RV32IFD-NEXT:    fsd ft0, -273(a0)
; RV32IFD-NEXT:    fsd ft0, 8(sp)
; RV32IFD-NEXT:    lw a0, 8(sp)
; RV32IFD-NEXT:    lw a1, 12(sp)
; RV32IFD-NEXT:    addi sp, sp, 16
; RV32IFD-NEXT:    ret
;
; RV64IFD-LABEL: fld_fsd_constant:
; RV64IFD:       # %bb.0:
; RV64IFD-NEXT:    fmv.d.x ft0, a0
; RV64IFD-NEXT:    lui a0, 56
; RV64IFD-NEXT:    addiw a0, a0, -1353
; RV64IFD-NEXT:    slli a0, a0, 14
; RV64IFD-NEXT:    fld ft1, -273(a0)
; RV64IFD-NEXT:    fadd.d ft0, ft0, ft1
; RV64IFD-NEXT:    fsd ft0, -273(a0)
; RV64IFD-NEXT:    fmv.x.d a0, ft0
; RV64IFD-NEXT:    ret
  %1 = inttoptr i32 3735928559 to double*
  %2 = load volatile double, double* %1
  %3 = fadd double %a, %2
  store double %3, double* %1
  ret double %3
}

; External function with no body in this file. fld_stack and fsd_stack pass
; it the address of their alloca (presumably so that the stack slot cannot be
; optimised away, as the name suggests).
declare void @notdead(i8*)

; Passes the address of a stack-allocated double to notdead, then loads the
; double back and returns it added to %a. The assertions expect the reload to
; be an fld straight from the stack slot (8(sp) on both targets).
; %a is still needed after the call, so the expected code copies it out of the
; argument registers first (into s0/s1 on riscv32, s0 on riscv64) and saves
; and restores those registers in the prologue and epilogue.
define double @fld_stack(double %a) nounwind {
; RV32IFD-LABEL: fld_stack:
; RV32IFD:       # %bb.0:
; RV32IFD-NEXT:    addi sp, sp, -32
; RV32IFD-NEXT:    sw ra, 28(sp)
; RV32IFD-NEXT:    sw s0, 24(sp)
; RV32IFD-NEXT:    sw s1, 20(sp)
; RV32IFD-NEXT:    mv s0, a1
; RV32IFD-NEXT:    mv s1, a0
; RV32IFD-NEXT:    addi a0, sp, 8
; RV32IFD-NEXT:    call notdead
; RV32IFD-NEXT:    sw s1, 0(sp)
; RV32IFD-NEXT:    sw s0, 4(sp)
; RV32IFD-NEXT:    fld ft0, 0(sp)
; RV32IFD-NEXT:    fld ft1, 8(sp)
; RV32IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV32IFD-NEXT:    fsd ft0, 0(sp)
; RV32IFD-NEXT:    lw a0, 0(sp)
; RV32IFD-NEXT:    lw a1, 4(sp)
; RV32IFD-NEXT:    lw s1, 20(sp)
; RV32IFD-NEXT:    lw s0, 24(sp)
; RV32IFD-NEXT:    lw ra, 28(sp)
; RV32IFD-NEXT:    addi sp, sp, 32
; RV32IFD-NEXT:    ret
;
; RV64IFD-LABEL: fld_stack:
; RV64IFD:       # %bb.0:
; RV64IFD-NEXT:    addi sp, sp, -32
; RV64IFD-NEXT:    sd ra, 24(sp)
; RV64IFD-NEXT:    sd s0, 16(sp)
; RV64IFD-NEXT:    mv s0, a0
; RV64IFD-NEXT:    addi a0, sp, 8
; RV64IFD-NEXT:    call notdead
; RV64IFD-NEXT:    fmv.d.x ft0, s0
; RV64IFD-NEXT:    fld ft1, 8(sp)
; RV64IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV64IFD-NEXT:    fmv.x.d a0, ft0
; RV64IFD-NEXT:    ld s0, 16(sp)
; RV64IFD-NEXT:    ld ra, 24(sp)
; RV64IFD-NEXT:    addi sp, sp, 32
; RV64IFD-NEXT:    ret
  %1 = alloca double, align 8
  %2 = bitcast double* %1 to i8*
  call void @notdead(i8* %2)
  %3 = load double, double* %1
  %4 = fadd double %3, %a ; force the load into an FPR64
  ret double %4
}

; Stores %a + %b into a stack-allocated double and passes the address of that
; slot to notdead. The assertions expect the store to be an fsd straight to
; the stack slot (16(sp) on riscv32, 0(sp) on riscv64), followed by the slot
; address being placed in a0 for the call.
define void @fsd_stack(double %a, double %b) nounwind {
; RV32IFD-LABEL: fsd_stack:
; RV32IFD:       # %bb.0:
; RV32IFD-NEXT:    addi sp, sp, -32
; RV32IFD-NEXT:    sw ra, 28(sp)
; RV32IFD-NEXT:    sw a2, 8(sp)
; RV32IFD-NEXT:    sw a3, 12(sp)
; RV32IFD-NEXT:    fld ft0, 8(sp)
; RV32IFD-NEXT:    sw a0, 8(sp)
; RV32IFD-NEXT:    sw a1, 12(sp)
; RV32IFD-NEXT:    fld ft1, 8(sp)
; RV32IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV32IFD-NEXT:    fsd ft0, 16(sp)
; RV32IFD-NEXT:    addi a0, sp, 16
; RV32IFD-NEXT:    call notdead
; RV32IFD-NEXT:    lw ra, 28(sp)
; RV32IFD-NEXT:    addi sp, sp, 32
; RV32IFD-NEXT:    ret
;
; RV64IFD-LABEL: fsd_stack:
; RV64IFD:       # %bb.0:
; RV64IFD-NEXT:    addi sp, sp, -16
; RV64IFD-NEXT:    sd ra, 8(sp)
; RV64IFD-NEXT:    fmv.d.x ft0, a1
; RV64IFD-NEXT:    fmv.d.x ft1, a0
; RV64IFD-NEXT:    fadd.d ft0, ft1, ft0
; RV64IFD-NEXT:    fsd ft0, 0(sp)
; RV64IFD-NEXT:    mv a0, sp
; RV64IFD-NEXT:    call notdead
; RV64IFD-NEXT:    ld ra, 8(sp)
; RV64IFD-NEXT:    addi sp, sp, 16
; RV64IFD-NEXT:    ret
  %1 = fadd double %a, %b ; force the store to come from an FPR64
  %2 = alloca double, align 8
  store double %1, double* %2
  %3 = bitcast double* %2 to i8*
  call void @notdead(i8* %3)
  ret void
}

; Test selection of store<ST4[%a], trunc to f32>, ..
;
; Truncates %b from double to float and stores the float through %a with
; 4-byte alignment. The assertions expect an fcvt.s.d followed by an fsw on
; both targets.
; NOTE(review): the function is marked noinline optnone, presumably so that
; the fptrunc + store pair reaches instruction selection in the truncating
; store form named above -- confirm against the commit that added this test.
define void @fsd_trunc(float* %a, double %b) nounwind noinline optnone {
; RV32IFD-LABEL: fsd_trunc:
; RV32IFD:       # %bb.0:
; RV32IFD-NEXT:    addi sp, sp, -16
; RV32IFD-NEXT:    sw a1, 8(sp)
; RV32IFD-NEXT:    sw a2, 12(sp)
; RV32IFD-NEXT:    fld ft0, 8(sp)
; RV32IFD-NEXT:    fcvt.s.d ft0, ft0
; RV32IFD-NEXT:    fsw ft0, 0(a0)
; RV32IFD-NEXT:    addi sp, sp, 16
; RV32IFD-NEXT:    ret
;
; RV64IFD-LABEL: fsd_trunc:
; RV64IFD:       # %bb.0:
; RV64IFD-NEXT:    fmv.d.x ft0, a1
; RV64IFD-NEXT:    fcvt.s.d ft0, ft0
; RV64IFD-NEXT:    fsw ft0, 0(a0)
; RV64IFD-NEXT:    ret
  %1 = fptrunc double %b to float
  store float %1, float* %a, align 4
  ret void
}
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py`
			`; RUN: llc -mtriple=riscv32 -mattr=+d -verify-machineinstrs < %s \`
			`; RUN: \| FileCheck -check-prefix=RV32IFD %s`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`; RUN: llc -mtriple=riscv64 -mattr=+d -verify-machineinstrs < %s \`
			`; RUN: \| FileCheck -check-prefix=RV64IFD %s`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00
			`define double @fld(double *%a) nounwind {`
			`; RV32IFD-LABEL: fld:`
			`; RV32IFD: # %bb.0:`
			`; RV32IFD-NEXT: addi sp, sp, -16`
			`; RV32IFD-NEXT: fld ft0, 24(a0)`
			`; RV32IFD-NEXT: fld ft1, 0(a0)`
			`; RV32IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV32IFD-NEXT: fsd ft0, 8(sp)`
			`; RV32IFD-NEXT: lw a0, 8(sp)`
			`; RV32IFD-NEXT: lw a1, 12(sp)`
			`; RV32IFD-NEXT: addi sp, sp, 16`
			`; RV32IFD-NEXT: ret`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`;`
			`; RV64IFD-LABEL: fld:`
			`; RV64IFD: # %bb.0:`
			`; RV64IFD-NEXT: fld ft0, 24(a0)`
			`; RV64IFD-NEXT: fld ft1, 0(a0)`
			`; RV64IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV64IFD-NEXT: fmv.x.d a0, ft0`
			`; RV64IFD-NEXT: ret`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`%1 = load double, double* %a`
			`%2 = getelementptr double, double* %a, i32 3`
			`%3 = load double, double* %2`
			`; Use both loaded values in an FP op to ensure an fld is used, even for the`
			`; soft float ABI`
			`%4 = fadd double %1, %3`
			`ret double %4`
			`}`

			`define void @fsd(double *%a, double %b, double %c) nounwind {`
			`; RV32IFD-LABEL: fsd:`
			`; RV32IFD: # %bb.0:`
			`; RV32IFD-NEXT: addi sp, sp, -16`
			`; RV32IFD-NEXT: sw a3, 8(sp)`
			`; RV32IFD-NEXT: sw a4, 12(sp)`
			`; RV32IFD-NEXT: fld ft0, 8(sp)`
			`; RV32IFD-NEXT: sw a1, 8(sp)`
			`; RV32IFD-NEXT: sw a2, 12(sp)`
			`; RV32IFD-NEXT: fld ft1, 8(sp)`
			`; RV32IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV32IFD-NEXT: fsd ft0, 64(a0)`
			`; RV32IFD-NEXT: fsd ft0, 0(a0)`
			`; RV32IFD-NEXT: addi sp, sp, 16`
			`; RV32IFD-NEXT: ret`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`;`
			`; RV64IFD-LABEL: fsd:`
			`; RV64IFD: # %bb.0:`
			`; RV64IFD-NEXT: fmv.d.x ft0, a2`
			`; RV64IFD-NEXT: fmv.d.x ft1, a1`
			`; RV64IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV64IFD-NEXT: fsd ft0, 64(a0)`
			`; RV64IFD-NEXT: fsd ft0, 0(a0)`
			`; RV64IFD-NEXT: ret`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`; Use %b and %c in an FP op to ensure floating point registers are used, even`
			`; for the soft float ABI`
			`%1 = fadd double %b, %c`
			`store double %1, double* %a`
			`%2 = getelementptr double, double* %a, i32 8`
			`store double %1, double* %2`
			`ret void`
			`}`

			`; Check load and store to a global`
			`@G = global double 0.0`

			`define double @fld_fsd_global(double %a, double %b) nounwind {`
			`; RV32IFD-LABEL: fld_fsd_global:`
			`; RV32IFD: # %bb.0:`
			`; RV32IFD-NEXT: addi sp, sp, -16`
			`; RV32IFD-NEXT: sw a2, 8(sp)`
			`; RV32IFD-NEXT: sw a3, 12(sp)`
			`; RV32IFD-NEXT: fld ft0, 8(sp)`
			`; RV32IFD-NEXT: sw a0, 8(sp)`
			`; RV32IFD-NEXT: sw a1, 12(sp)`
			`; RV32IFD-NEXT: fld ft1, 8(sp)`
			`; RV32IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV32IFD-NEXT: lui a0, %hi(G)`
			`; RV32IFD-NEXT: fld ft1, %lo(G)(a0)`
			`; RV32IFD-NEXT: fsd ft0, %lo(G)(a0)`
[RISCV] Separate base from offset in lowerGlobalAddress Summary: When lowering global address, lower the base as a TargetGlobal first then create an SDNode for the offset separately and chain it to the address calculation This optimization will create a DAG where the base address of a global access will be reused between different access. The offset can later be folded into the immediate part of the memory access instruction. With this optimization we generate: lui a0, %hi(s) addi a0, a0, %lo(s) ; shared base address. addi a1, zero, 20 ; 2 instructions per access. sw a1, 44(a0) addi a1, zero, 10 sw a1, 8(a0) addi a1, zero, 30 sw a1, 80(a0) Instead of: lui a0, %hi(s+44) ; 3 instructions per access. addi a1, zero, 20 sw a1, %lo(s+44)(a0) lui a0, %hi(s+8) addi a1, zero, 10 sw a1, %lo(s+8)(a0) lui a0, %hi(s+80) addi a1, zero, 30 sw a1, %lo(s+80)(a0) Which will save one instruction per access. Reviewers: asb, apazos Reviewed By: asb Subscribers: rbar, johnrusso, simoncook, jordy.potman.lists, niosHD, kito-cheng, shiva0217, zzheng, edward-jones, mgrang, apazos, asb, llvm-commits Differential Revision: https://reviews.llvm.org/D46989 llvm-svn: 332641 2018-05-18 02:14:53 +08:00			`; RV32IFD-NEXT: addi a0, a0, %lo(G)`
			`; RV32IFD-NEXT: fld ft1, 72(a0)`
			`; RV32IFD-NEXT: fsd ft0, 72(a0)`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`; RV32IFD-NEXT: fsd ft0, 8(sp)`
			`; RV32IFD-NEXT: lw a0, 8(sp)`
			`; RV32IFD-NEXT: lw a1, 12(sp)`
			`; RV32IFD-NEXT: addi sp, sp, 16`
			`; RV32IFD-NEXT: ret`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`;`
			`; RV64IFD-LABEL: fld_fsd_global:`
			`; RV64IFD: # %bb.0:`
			`; RV64IFD-NEXT: fmv.d.x ft0, a1`
			`; RV64IFD-NEXT: fmv.d.x ft1, a0`
			`; RV64IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV64IFD-NEXT: lui a0, %hi(G)`
			`; RV64IFD-NEXT: fld ft1, %lo(G)(a0)`
			`; RV64IFD-NEXT: fsd ft0, %lo(G)(a0)`
			`; RV64IFD-NEXT: addi a0, a0, %lo(G)`
			`; RV64IFD-NEXT: fld ft1, 72(a0)`
			`; RV64IFD-NEXT: fsd ft0, 72(a0)`
			`; RV64IFD-NEXT: fmv.x.d a0, ft0`
			`; RV64IFD-NEXT: ret`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`; Use %a and %b in an FP op to ensure floating point registers are used, even`
			`; for the soft float ABI`
			`%1 = fadd double %a, %b`
			`%2 = load volatile double, double* @G`
			`store double %1, double* @G`
			`%3 = getelementptr double, double* @G, i32 9`
			`%4 = load volatile double, double* %3`
			`store double %1, double* %3`
			`ret double %1`
			`}`

			`; Ensure that 1 is added to the high 20 bits if bit 11 of the low part is 1`
			`define double @fld_fsd_constant(double %a) nounwind {`
			`; RV32IFD-LABEL: fld_fsd_constant:`
			`; RV32IFD: # %bb.0:`
			`; RV32IFD-NEXT: addi sp, sp, -16`
			`; RV32IFD-NEXT: sw a0, 8(sp)`
			`; RV32IFD-NEXT: sw a1, 12(sp)`
			`; RV32IFD-NEXT: fld ft0, 8(sp)`
			`; RV32IFD-NEXT: lui a0, 912092`
			`; RV32IFD-NEXT: fld ft1, -273(a0)`
			`; RV32IFD-NEXT: fadd.d ft0, ft0, ft1`
			`; RV32IFD-NEXT: fsd ft0, -273(a0)`
			`; RV32IFD-NEXT: fsd ft0, 8(sp)`
			`; RV32IFD-NEXT: lw a0, 8(sp)`
			`; RV32IFD-NEXT: lw a1, 12(sp)`
			`; RV32IFD-NEXT: addi sp, sp, 16`
			`; RV32IFD-NEXT: ret`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`;`
			`; RV64IFD-LABEL: fld_fsd_constant:`
			`; RV64IFD: # %bb.0:`
			`; RV64IFD-NEXT: fmv.d.x ft0, a0`
			`; RV64IFD-NEXT: lui a0, 56`
			`; RV64IFD-NEXT: addiw a0, a0, -1353`
			`; RV64IFD-NEXT: slli a0, a0, 14`
			`; RV64IFD-NEXT: fld ft1, -273(a0)`
			`; RV64IFD-NEXT: fadd.d ft0, ft0, ft1`
			`; RV64IFD-NEXT: fsd ft0, -273(a0)`
			`; RV64IFD-NEXT: fmv.x.d a0, ft0`
			`; RV64IFD-NEXT: ret`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`%1 = inttoptr i32 3735928559 to double*`
			`%2 = load volatile double, double* %1`
			`%3 = fadd double %a, %2`
			`store double %3, double* %1`
			`ret double %3`
			`}`

			`declare void @notdead(i8*)`

			`define double @fld_stack(double %a) nounwind {`
			`; RV32IFD-LABEL: fld_stack:`
			`; RV32IFD: # %bb.0:`
			`; RV32IFD-NEXT: addi sp, sp, -32`
			`; RV32IFD-NEXT: sw ra, 28(sp)`
[RISCV] Only mark fp as reserved if the function has a dedicated frame pointer This follows similar logic in the ARM and Mips backends, and allows the free use of s0 in functions without a dedicated frame pointer. The changes in callee-saved-gprs.ll most clearly show the effect of this patch. llvm-svn: 356063 2019-03-14 00:33:45 +08:00			`; RV32IFD-NEXT: sw s0, 24(sp)`
			`; RV32IFD-NEXT: sw s1, 20(sp)`
			`; RV32IFD-NEXT: mv s0, a1`
[RISCV] Set CostPerUse for registers Summary: Set CostPerUse higher for registers that are not used in the compressed instruction set. This will influence the greedy register allocator to reduce the use of registers that can't be encoded in 16 bit instructions. This affects register allocation even when compressed instruction isn't targeted, we see no major negative codegen impact. Reviewers: asb Reviewed By: asb Subscribers: rbar, johnrusso, simoncook, jordy.potman.lists, apazos, niosHD, kito-cheng, shiva0217, zzheng, edward-jones, mgrang Differential Revision: https://reviews.llvm.org/D47039 llvm-svn: 333132 2018-05-24 05:34:30 +08:00			`; RV32IFD-NEXT: mv s1, a0`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`; RV32IFD-NEXT: addi a0, sp, 8`
[RISCV] Expand function call to "call" pseudoinstruction To do this: 1. Change GlobalAddress SDNode to TargetGlobalAddress to avoid legalizer split the symbol. 2. Change ExternalSymbol SDNode to TargetExternalSymbol to avoid legalizer split the symbol. 3. Let PseudoCALL match direct call with target operand TargetGlobalAddress and TargetExternalSymbol. Differential Revision: https://reviews.llvm.org/D44885 llvm-svn: 330827 2018-04-25 22:19:12 +08:00			`; RV32IFD-NEXT: call notdead`
[RISCV] Set CostPerUse for registers Summary: Set CostPerUse higher for registers that are not used in the compressed instruction set. This will influence the greedy register allocator to reduce the use of registers that can't be encoded in 16 bit instructions. This affects register allocation even when compressed instruction isn't targeted, we see no major negative codegen impact. Reviewers: asb Reviewed By: asb Subscribers: rbar, johnrusso, simoncook, jordy.potman.lists, apazos, niosHD, kito-cheng, shiva0217, zzheng, edward-jones, mgrang Differential Revision: https://reviews.llvm.org/D47039 llvm-svn: 333132 2018-05-24 05:34:30 +08:00			`; RV32IFD-NEXT: sw s1, 0(sp)`
[RISCV] Only mark fp as reserved if the function has a dedicated frame pointer This follows similar logic in the ARM and Mips backends, and allows the free use of s0 in functions without a dedicated frame pointer. The changes in callee-saved-gprs.ll most clearly show the effect of this patch. llvm-svn: 356063 2019-03-14 00:33:45 +08:00			`; RV32IFD-NEXT: sw s0, 4(sp)`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`; RV32IFD-NEXT: fld ft0, 0(sp)`
			`; RV32IFD-NEXT: fld ft1, 8(sp)`
			`; RV32IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV32IFD-NEXT: fsd ft0, 0(sp)`
			`; RV32IFD-NEXT: lw a0, 0(sp)`
			`; RV32IFD-NEXT: lw a1, 4(sp)`
[RISCV] Only mark fp as reserved if the function has a dedicated frame pointer This follows similar logic in the ARM and Mips backends, and allows the free use of s0 in functions without a dedicated frame pointer. The changes in callee-saved-gprs.ll most clearly show the effect of this patch. llvm-svn: 356063 2019-03-14 00:33:45 +08:00			`; RV32IFD-NEXT: lw s1, 20(sp)`
			`; RV32IFD-NEXT: lw s0, 24(sp)`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`; RV32IFD-NEXT: lw ra, 28(sp)`
			`; RV32IFD-NEXT: addi sp, sp, 32`
			`; RV32IFD-NEXT: ret`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`;`
			`; RV64IFD-LABEL: fld_stack:`
			`; RV64IFD: # %bb.0:`
			`; RV64IFD-NEXT: addi sp, sp, -32`
			`; RV64IFD-NEXT: sd ra, 24(sp)`
[RISCV] Only mark fp as reserved if the function has a dedicated frame pointer This follows similar logic in the ARM and Mips backends, and allows the free use of s0 in functions without a dedicated frame pointer. The changes in callee-saved-gprs.ll most clearly show the effect of this patch. llvm-svn: 356063 2019-03-14 00:33:45 +08:00			`; RV64IFD-NEXT: sd s0, 16(sp)`
			`; RV64IFD-NEXT: mv s0, a0`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`; RV64IFD-NEXT: addi a0, sp, 8`
			`; RV64IFD-NEXT: call notdead`
[RISCV] Only mark fp as reserved if the function has a dedicated frame pointer This follows similar logic in the ARM and Mips backends, and allows the free use of s0 in functions without a dedicated frame pointer. The changes in callee-saved-gprs.ll most clearly show the effect of this patch. llvm-svn: 356063 2019-03-14 00:33:45 +08:00			`; RV64IFD-NEXT: fmv.d.x ft0, s0`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`; RV64IFD-NEXT: fld ft1, 8(sp)`
			`; RV64IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV64IFD-NEXT: fmv.x.d a0, ft0`
[RISCV] Only mark fp as reserved if the function has a dedicated frame pointer This follows similar logic in the ARM and Mips backends, and allows the free use of s0 in functions without a dedicated frame pointer. The changes in callee-saved-gprs.ll most clearly show the effect of this patch. llvm-svn: 356063 2019-03-14 00:33:45 +08:00			`; RV64IFD-NEXT: ld s0, 16(sp)`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`; RV64IFD-NEXT: ld ra, 24(sp)`
			`; RV64IFD-NEXT: addi sp, sp, 32`
			`; RV64IFD-NEXT: ret`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`%1 = alloca double, align 8`
			`%2 = bitcast double* %1 to i8*`
			`call void @notdead(i8* %2)`
			`%3 = load double, double* %1`
			`%4 = fadd double %3, %a ; force load in to FPR64`
			`ret double %4`
			`}`

			`define void @fsd_stack(double %a, double %b) nounwind {`
			`; RV32IFD-LABEL: fsd_stack:`
			`; RV32IFD: # %bb.0:`
			`; RV32IFD-NEXT: addi sp, sp, -32`
			`; RV32IFD-NEXT: sw ra, 28(sp)`
			`; RV32IFD-NEXT: sw a2, 8(sp)`
			`; RV32IFD-NEXT: sw a3, 12(sp)`
			`; RV32IFD-NEXT: fld ft0, 8(sp)`
			`; RV32IFD-NEXT: sw a0, 8(sp)`
			`; RV32IFD-NEXT: sw a1, 12(sp)`
			`; RV32IFD-NEXT: fld ft1, 8(sp)`
			`; RV32IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV32IFD-NEXT: fsd ft0, 16(sp)`
			`; RV32IFD-NEXT: addi a0, sp, 16`
[RISCV] Expand function call to "call" pseudoinstruction To do this: 1. Change GlobalAddress SDNode to TargetGlobalAddress to avoid legalizer split the symbol. 2. Change ExternalSymbol SDNode to TargetExternalSymbol to avoid legalizer split the symbol. 3. Let PseudoCALL match direct call with target operand TargetGlobalAddress and TargetExternalSymbol. Differential Revision: https://reviews.llvm.org/D44885 llvm-svn: 330827 2018-04-25 22:19:12 +08:00			`; RV32IFD-NEXT: call notdead`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`; RV32IFD-NEXT: lw ra, 28(sp)`
			`; RV32IFD-NEXT: addi sp, sp, 32`
			`; RV32IFD-NEXT: ret`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`;`
			`; RV64IFD-LABEL: fsd_stack:`
			`; RV64IFD: # %bb.0:`
			`; RV64IFD-NEXT: addi sp, sp, -16`
			`; RV64IFD-NEXT: sd ra, 8(sp)`
			`; RV64IFD-NEXT: fmv.d.x ft0, a1`
			`; RV64IFD-NEXT: fmv.d.x ft1, a0`
			`; RV64IFD-NEXT: fadd.d ft0, ft1, ft0`
			`; RV64IFD-NEXT: fsd ft0, 0(sp)`
			`; RV64IFD-NEXT: mv a0, sp`
			`; RV64IFD-NEXT: call notdead`
			`; RV64IFD-NEXT: ld ra, 8(sp)`
			`; RV64IFD-NEXT: addi sp, sp, 16`
			`; RV64IFD-NEXT: ret`
[RISCV] Add tests missed in r329871 llvm-svn: 329872 2018-04-12 13:36:44 +08:00			`%1 = fadd double %a, %b ; force store from FPR64`
			`%2 = alloca double, align 8`
			`store double %1, double* %2`
			`%3 = bitcast double* %2 to i8*`
			`call void @notdead(i8* %3)`
			`ret void`
			`}`
[RISCV] Codegen support for RV32D floating point conversion operations This also includes support and a test for truncating stores, which are now possible thanks to the fpround pattern. llvm-svn: 329876 2018-04-12 13:47:15 +08:00
			`; Test selection of store<ST4[%a], trunc to f32>, ..`
			`define void @fsd_trunc(float* %a, double %b) nounwind noinline optnone {`
			`; RV32IFD-LABEL: fsd_trunc:`
			`; RV32IFD: # %bb.0:`
			`; RV32IFD-NEXT: addi sp, sp, -16`
			`; RV32IFD-NEXT: sw a1, 8(sp)`
			`; RV32IFD-NEXT: sw a2, 12(sp)`
			`; RV32IFD-NEXT: fld ft0, 8(sp)`
			`; RV32IFD-NEXT: fcvt.s.d ft0, ft0`
			`; RV32IFD-NEXT: fsw ft0, 0(a0)`
			`; RV32IFD-NEXT: addi sp, sp, 16`
			`; RV32IFD-NEXT: ret`
[RISCV] Implement RV64D codegen This patch: * Adds necessary RV64D codegen patterns * Modifies CC_RISCV so it will properly handle f64 types (with soft float ABI) Note that in general there is no reason to try to select fcvt.w[u].d rather than fcvt.l[u].d for i32 conversions because fptosi/fptoui produce poison if the input won't fit into the target type. Differential Revision: https://reviews.llvm.org/D53237 llvm-svn: 352833 2019-02-01 11:53:30 +08:00			`;`
			`; RV64IFD-LABEL: fsd_trunc:`
			`; RV64IFD: # %bb.0:`
			`; RV64IFD-NEXT: fmv.d.x ft0, a1`
			`; RV64IFD-NEXT: fcvt.s.d ft0, ft0`
			`; RV64IFD-NEXT: fsw ft0, 0(a0)`
			`; RV64IFD-NEXT: ret`
[RISCV] Codegen support for RV32D floating point conversion operations This also includes support and a test for truncating stores, which are now possible thanks to the fpround pattern. llvm-svn: 329876 2018-04-12 13:47:15 +08:00			`%1 = fptrunc double %b to float`
			`store float %1, float* %a, align 4`
			`ret void`
			`}`