llvm-project/llvm/test/CodeGen/X86/coalescer-commute2.ll

; RUN: llc < %s -mtriple=x86_64-linux -join-physregs | FileCheck %s
; CHECK-NOT:     mov
; CHECK:     paddw
; CHECK-NOT:     mov
; CHECK:     paddw
; CHECK-NOT:     paddw
; CHECK-NOT:     mov

; The 2-addr pass should ensure that identical code is produced for the two
; functions below; no extra copy should be generated.

; test1: view both arguments as <8 x i16> and add them, with %x as the left
; operand of the add. The bitcast of %y is emitted before the bitcast of %x.
define <2 x i64> @test1(<2 x i64> %x, <2 x i64> %y) nounwind {
entry:
  %rhs = bitcast <2 x i64> %y to <8 x i16>
  %lhs = bitcast <2 x i64> %x to <8 x i16>
  %sum = add <8 x i16> %lhs, %rhs
  ; Convert the result back to the declared return type.
  %res = bitcast <8 x i16> %sum to <2 x i64>
  ret <2 x i64> %res
}

; test2: same computation as test1 with the operand roles swapped: %y is the
; left operand of the add and the bitcast of %x is emitted first.
define <2 x i64> @test2(<2 x i64> %x, <2 x i64> %y) nounwind {
entry:
  %rhs = bitcast <2 x i64> %x to <8 x i16>
  %lhs = bitcast <2 x i64> %y to <8 x i16>
  %sum = add <8 x i16> %lhs, %rhs
  ; Convert the result back to the declared return type.
  %res = bitcast <8 x i16> %sum to <2 x i64>
  ret <2 x i64> %res
}


; The coalescer should commute the add to avoid a copy.
define <4 x float> @test3(<4 x float> %V) {
entry:
  ; Reverse the four lanes of %V (mask 3, 2, 1, 0 selects from the first vector).
  %rev = shufflevector <4 x float> %V, <4 x float> undef, <4 x i32> <i32 3, i32 2, i32 1, i32 0>
  ; %V is used again here, as the right-hand operand of the fadd.
  %sum = fadd <4 x float> %rev, %V
  ret <4 x float> %sum
}
Prepare remaining tests for -join-physreg going away. llvm-svn: 130893 2011-05-05 07:54:59 +08:00			`; RUN: llc < %s -mtriple=x86_64-linux -join-physregs \| FileCheck %s`
test/CodeGen/X86: FileCheck-ize and add explicit -mtriple=x86_64-linux. They are useless to Win64 target. llvm-svn: 127732 2011-03-16 21:52:38 +08:00			`; CHECK-NOT: mov`
			`; CHECK: paddw`
			`; CHECK-NOT: mov`
			`; CHECK: paddw`
			`; CHECK-NOT: paddw`
			`; CHECK-NOT: mov`
Evan implemented these. llvm-svn: 47828 2008-03-03 02:05:14 +08:00
			`; The 2-addr pass should ensure that identical code is produced for these functions`
			`; no extra copy should be generated.`

			`define <2 x i64> @test1(<2 x i64> %x, <2 x i64> %y) nounwind {`
			`entry:`
			`%tmp6 = bitcast <2 x i64> %y to <8 x i16> ; <<8 x i16>> [#uses=1]`
			`%tmp8 = bitcast <2 x i64> %x to <8 x i16> ; <<8 x i16>> [#uses=1]`
			`%tmp9 = add <8 x i16> %tmp8, %tmp6 ; <<8 x i16>> [#uses=1]`
			`%tmp10 = bitcast <8 x i16> %tmp9 to <2 x i64> ; <<2 x i64>> [#uses=1]`
			`ret <2 x i64> %tmp10`
			`}`

			`define <2 x i64> @test2(<2 x i64> %x, <2 x i64> %y) nounwind {`
			`entry:`
			`%tmp6 = bitcast <2 x i64> %x to <8 x i16> ; <<8 x i16>> [#uses=1]`
			`%tmp8 = bitcast <2 x i64> %y to <8 x i16> ; <<8 x i16>> [#uses=1]`
			`%tmp9 = add <8 x i16> %tmp8, %tmp6 ; <<8 x i16>> [#uses=1]`
			`%tmp10 = bitcast <8 x i16> %tmp9 to <2 x i64> ; <<2 x i64>> [#uses=1]`
			`ret <2 x i64> %tmp10`
			`}`


			`; The coalescer should commute the add to avoid a copy.`
			`define <4 x float> @test3(<4 x float> %V) {`
			`entry:`
			`%tmp8 = shufflevector <4 x float> %V, <4 x float> undef,`
			`<4 x i32> < i32 3, i32 2, i32 1, i32 0 >`
Split the Add, Sub, and Mul instruction opcodes into separate integer and floating-point opcodes, introducing FAdd, FSub, and FMul. For now, the AsmParser, BitcodeReader, and IRBuilder all preserve backwards compatability, and the Core LLVM APIs preserve backwards compatibility for IR producers. Most front-ends won't need to change immediately. This implements the first step of the plan outlined here: http://nondot.org/sabre/LLVMNotes/IntegerOverflow.txt llvm-svn: 72897 2009-06-05 06:49:04 +08:00			`%add = fadd <4 x float> %tmp8, %V`
Evan implemented these. llvm-svn: 47828 2008-03-03 02:05:14 +08:00			`ret <4 x float> %add`
			`}`