llvm-project/llvm/test/CodeGen/X86/tailcall-64.ll

; RUN: llc -mtriple=x86_64-apple-macosx -mcpu=core2 < %s | FileCheck %s

declare i64 @testi()

define i64 @test_trivial() {
 %A = tail call i64 @testi()
 ret i64 %A
}
; CHECK: test_trivial:
; CHECK: jmp	_testi                  ## TAILCALL


define i64 @test_noop_bitcast() {
 %A = tail call i64 @testi()
 %B = bitcast i64 %A to i64
 ret i64 %B
}
; CHECK: test_noop_bitcast:
; CHECK: jmp	_testi                  ## TAILCALL


; Tail call shouldn't be blocked by no-op inttoptr.
define i8* @test_inttoptr() {
  %A = tail call i64 @testi()
  %B = inttoptr i64 %A to i8*
  ret i8* %B
}

; CHECK: test_inttoptr:
; CHECK: jmp	_testi                  ## TAILCALL


declare <4 x float> @testv()

define <4 x i32> @test_vectorbitcast() {
  %A = tail call <4 x float> @testv()
  %B = bitcast <4 x float> %A to <4 x i32>
  ret <4 x i32> %B
}
; CHECK: test_vectorbitcast:
; CHECK: jmp	_testv                  ## TAILCALL


declare { i64, i64 } @testp()

define {i64, i64} @test_pair_trivial() {
  %A = tail call { i64, i64} @testp()
  ret { i64, i64} %A
}
; CHECK: test_pair_trivial:
; CHECK: jmp	_testp                  ## TAILCALL


define {i64, i64} @test_pair_trivial_extract() {
  %A = tail call { i64, i64} @testp()
  %x = extractvalue { i64, i64} %A, 0
  %y = extractvalue { i64, i64} %A, 1
  
  %b = insertvalue {i64, i64} undef, i64 %x, 0
  %c = insertvalue {i64, i64} %b, i64 %y, 1
  
  ret { i64, i64} %c
}

; CHECK: test_pair_trivial_extract:
; CHECK: jmp	_testp                  ## TAILCALL

define {i8*, i64} @test_pair_conv_extract() {
  %A = tail call { i64, i64} @testp()
  %x = extractvalue { i64, i64} %A, 0
  %y = extractvalue { i64, i64} %A, 1
  
  %x1 = inttoptr i64 %x to i8*
  
  %b = insertvalue {i8*, i64} undef, i8* %x1, 0
  %c = insertvalue {i8*, i64} %b, i64 %y, 1
  
  ret { i8*, i64} %c
}

; CHECK: test_pair_conv_extract:
; CHECK: jmp	_testp                  ## TAILCALL


; PR13006
define { i64, i64 } @crash(i8* %this) {
  %c = tail call { i64, i64 } @testp()
  %mrv7 = insertvalue { i64, i64 } %c, i64 undef, 1
  ret { i64, i64 } %mrv7
}

; Check that we can fold an indexed load into a tail call instruction.
; CHECK: fold_indexed_load
; CHECK: leaq (%rsi,%rsi,4), %[[RAX:r..]]
; CHECK: jmpq *16(%{{r..}},%[[RAX]],8)  # TAILCALL
%struct.funcs = type { i32 (i8*, i32*, i32)*, i32 (i8*)*, i32 (i8*)*, i32 (i8*, i32)*, i32 }
@func_table = external global [0 x %struct.funcs]
define void @fold_indexed_load(i8* %mbstr, i64 %idxprom) nounwind uwtable ssp {
entry:
  %dsplen = getelementptr inbounds [0 x %struct.funcs]* @func_table, i64 0, i64 %idxprom, i32 2
  %x1 = load i32 (i8*)** %dsplen, align 8
  %call = tail call i32 %x1(i8* %mbstr) nounwind
  ret void
}

; <rdar://problem/12282281> Fold an indexed load into the tail call instruction.
; Calling a varargs function with 6 arguments requires 7 registers (%al is the
; vector count for varargs functions). This leaves %r11 as the only available
; scratch register.
;
; It is not possible to fold an indexed load into TCRETURNmi64 in that case.
;
; typedef int (*funcptr)(void*, ...);
; extern const funcptr funcs[];
; int f(int n) {
;   return funcs[n](0, 0, 0, 0, 0, 0);
; }
;
; CHECK: rdar12282281
; CHECK: jmpq *%r11 # TAILCALL
@funcs = external constant [0 x i32 (i8*, ...)*]

define i32 @rdar12282281(i32 %n) nounwind uwtable ssp {
entry:
  %idxprom = sext i32 %n to i64
  %arrayidx = getelementptr inbounds [0 x i32 (i8*, ...)*]* @funcs, i64 0, i64 %idxprom
  %0 = load i32 (i8*, ...)** %arrayidx, align 8
  %call = tail call i32 (i8*, ...)* %0(i8* null, i32 0, i32 0, i32 0, i32 0, i32 0) nounwind
  ret i32 %call
}

define x86_fp80 @fp80_call(x86_fp80 %x) nounwind  {
entry:
; CHECK: fp80_call:
; CHECK: jmp _fp80_callee
  %call = tail call x86_fp80 @fp80_callee(x86_fp80 %x) nounwind
  ret x86_fp80 %call
}

declare x86_fp80 @fp80_callee(x86_fp80)

; rdar://12229511
define x86_fp80 @trunc_fp80(x86_fp80 %x) nounwind  {
entry:
; CHECK: trunc_fp80
; CHECK: callq _trunc
; CHECK-NOT: jmp _trunc
; CHECK: ret
  %conv = fptrunc x86_fp80 %x to double
  %call = tail call double @trunc(double %conv) nounwind readnone
  %conv1 = fpext double %call to x86_fp80
  ret x86_fp80 %conv1
}

declare double @trunc(double) nounwind readnone
Fix an illegal tailcall opt where the callee returns a double via xmm while caller returns x86_fp80 via st0. rdar://12229511 llvm-svn: 164588 2012-09-25 13:32:34 +08:00			`; RUN: llc -mtriple=x86_64-apple-macosx -mcpu=core2 < %s \| FileCheck %s`
add some simple 64-bit tail call tests. llvm-svn: 157797 2012-06-01 13:03:31 +08:00
			`declare i64 @testi()`

			`define i64 @test_trivial() {`
			`%A = tail call i64 @testi()`
			`ret i64 %A`
			`}`
			`; CHECK: test_trivial:`
			`; CHECK: jmp _testi ## TAILCALL`


			`define i64 @test_noop_bitcast() {`
			`%A = tail call i64 @testi()`
			`%B = bitcast i64 %A to i64`
			`ret i64 %B`
			`}`
			`; CHECK: test_noop_bitcast:`
			`; CHECK: jmp _testi ## TAILCALL`
enhance getNoopInput to know about vector<->vector bitcasts of legal types, as well as int<->ptr casts. This allows us to tailcall functions with some trivial casts between the call and return (i.e. because the return types disagree). llvm-svn: 157798 2012-06-01 13:16:33 +08:00

			`; Tail call shouldn't be blocked by no-op inttoptr.`
			`define i8* @test_inttoptr() {`
			`%A = tail call i64 @testi()`
			`%B = inttoptr i64 %A to i8*`
			`ret i8* %B`
			`}`

			`; CHECK: test_inttoptr:`
			`; CHECK: jmp _testi ## TAILCALL`


			`declare <4 x float> @testv()`

			`define <4 x i32> @test_vectorbitcast() {`
			`%A = tail call <4 x float> @testv()`
			`%B = bitcast <4 x float> %A to <4 x i32>`
			`ret <4 x i32> %B`
			`}`
			`; CHECK: test_vectorbitcast:`
			`; CHECK: jmp _testv ## TAILCALL`
enhance the logic for looking through tailcalls to look through transparent casts in multiple-return value scenarios, like what happens on X86-64 when returning small structs. llvm-svn: 157800 2012-06-01 13:29:15 +08:00

			`declare { i64, i64 } @testp()`

			`define {i64, i64} @test_pair_trivial() {`
			`%A = tail call { i64, i64} @testp()`
			`ret { i64, i64} %A`
			`}`
			`; CHECK: test_pair_trivial:`
			`; CHECK: jmp _testp ## TAILCALL`



			`define {i64, i64} @test_pair_trivial_extract() {`
			`%A = tail call { i64, i64} @testp()`
			`%x = extractvalue { i64, i64} %A, 0`
			`%y = extractvalue { i64, i64} %A, 1`

			`%b = insertvalue {i64, i64} undef, i64 %x, 0`
			`%c = insertvalue {i64, i64} %b, i64 %y, 1`

			`ret { i64, i64} %c`
			`}`

			`; CHECK: test_pair_trivial_extract:`
			`; CHECK: jmp _testp ## TAILCALL`

			`define {i8*, i64} @test_pair_conv_extract() {`
			`%A = tail call { i64, i64} @testp()`
			`%x = extractvalue { i64, i64} %A, 0`
			`%y = extractvalue { i64, i64} %A, 1`

			`%x1 = inttoptr i64 %x to i8*`

			`%b = insertvalue {i8, i64} undef, i8 %x1, 0`
			`%c = insertvalue {i8*, i64} %b, i64 %y, 1`

			`ret { i8*, i64} %c`
			`}`

			`; CHECK: test_pair_conv_extract:`
			`; CHECK: jmp _testp ## TAILCALL`



testcase for PR13006, thanks to Duncan for filing it. llvm-svn: 157824 2012-06-02 02:19:46 +08:00			`; PR13006`
			`define { i64, i64 } @crash(i8* %this) {`
			`%c = tail call { i64, i64 } @testp()`
			`%mrv7 = insertvalue { i64, i64 } %c, i64 undef, 1`
			`ret { i64, i64 } %mrv7`
			`}`

Fix the TCRETURNmi64 bug differently. Add a PatFrag to match X86tcret using 6 fixed registers or less. This avoids folding loads into TCRETURNmi64 using 7 or more volatile registers. <rdar://problem/12282281> llvm-svn: 163819 2012-09-14 02:31:27 +08:00			`; Check that we can fold an indexed load into a tail call instruction.`
			`; CHECK: fold_indexed_load`
			`; CHECK: leaq (%rsi,%rsi,4), %[[RAX:r..]]`
Fix test case to avoid PIC magic. llvm-svn: 163827 2012-09-14 03:47:45 +08:00			`; CHECK: jmpq *16(%{{r..}},%[[RAX]],8) # TAILCALL`
Fix the TCRETURNmi64 bug differently. Add a PatFrag to match X86tcret using 6 fixed registers or less. This avoids folding loads into TCRETURNmi64 using 7 or more volatile registers. <rdar://problem/12282281> llvm-svn: 163819 2012-09-14 02:31:27 +08:00			`%struct.funcs = type { i32 (i8, i32, i32), i32 (i8), i32 (i8), i32 (i8, i32)*, i32 }`
			`@func_table = external global [0 x %struct.funcs]`
			`define void @fold_indexed_load(i8* %mbstr, i64 %idxprom) nounwind uwtable ssp {`
			`entry:`
			`%dsplen = getelementptr inbounds [0 x %struct.funcs]* @func_table, i64 0, i64 %idxprom, i32 2`
			`%x1 = load i32 (i8)* %dsplen, align 8`
			`%call = tail call i32 %x1(i8* %mbstr) nounwind`
			`ret void`
			`}`
enhance the logic for looking through tailcalls to look through transparent casts in multiple-return value scenarios, like what happens on X86-64 when returning small structs. llvm-svn: 157800 2012-06-01 13:29:15 +08:00
Fix the TCRETURNmi64 bug differently. Add a PatFrag to match X86tcret using 6 fixed registers or less. This avoids folding loads into TCRETURNmi64 using 7 or more volatile registers. <rdar://problem/12282281> llvm-svn: 163819 2012-09-14 02:31:27 +08:00			`; <rdar://problem/12282281> Fold an indexed load into the tail call instruction.`
			`; Calling a varargs function with 6 arguments requires 7 registers (%al is the`
			`; vector count for varargs functions). This leaves %r11 as the only available`
			`; scratch register.`
			`;`
			`; It is not possible to fold an indexed load into TCRETURNmi64 in that case.`
			`;`
			`; typedef int (funcptr)(void, ...);`
			`; extern const funcptr funcs[];`
			`; int f(int n) {`
			`; return funcs[n](0, 0, 0, 0, 0, 0);`
			`; }`
			`;`
			`; CHECK: rdar12282281`
			`; CHECK: jmpq *%r11 # TAILCALL`
			`@funcs = external constant [0 x i32 (i8, ...)]`

			`define i32 @rdar12282281(i32 %n) nounwind uwtable ssp {`
			`entry:`
			`%idxprom = sext i32 %n to i64`
			`%arrayidx = getelementptr inbounds [0 x i32 (i8, ...)]* @funcs, i64 0, i64 %idxprom`
			`%0 = load i32 (i8, ...)* %arrayidx, align 8`
			`%call = tail call i32 (i8, ...) %0(i8* null, i32 0, i32 0, i32 0, i32 0, i32 0) nounwind`
			`ret i32 %call`
			`}`
Fix an illegal tailcall opt where the callee returns a double via xmm while caller returns x86_fp80 via st0. rdar://12229511 llvm-svn: 164588 2012-09-25 13:32:34 +08:00
			`define x86_fp80 @fp80_call(x86_fp80 %x) nounwind {`
			`entry:`
			`; CHECK: fp80_call:`
			`; CHECK: jmp _fp80_callee`
			`%call = tail call x86_fp80 @fp80_callee(x86_fp80 %x) nounwind`
			`ret x86_fp80 %call`
			`}`

			`declare x86_fp80 @fp80_callee(x86_fp80)`

			`; rdar://12229511`
			`define x86_fp80 @trunc_fp80(x86_fp80 %x) nounwind {`
			`entry:`
			`; CHECK: trunc_fp80`
			`; CHECK: callq _trunc`
			`; CHECK-NOT: jmp _trunc`
			`; CHECK: ret`
			`%conv = fptrunc x86_fp80 %x to double`
			`%call = tail call double @trunc(double %conv) nounwind readnone`
			`%conv1 = fpext double %call to x86_fp80`
			`ret x86_fp80 %conv1`
			`}`

			`declare double @trunc(double) nounwind readnone`