; llvm-project/llvm/test/CodeGen/ARM/vld3.ll

; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s

; Aggregate result types for the vld3 intrinsics on 64-bit vectors.
; Each struct holds three vectors of the same type; the tests in this file
; read fields 0 and 2 with extractvalue.
%struct.__neon_int8x8x3_t = type { <8 x i8>,  <8 x i8>,  <8 x i8> }
%struct.__neon_int16x4x3_t = type { <4 x i16>, <4 x i16>, <4 x i16> }
%struct.__neon_int32x2x3_t = type { <2 x i32>, <2 x i32>, <2 x i32> }
%struct.__neon_float32x2x3_t = type { <2 x float>, <2 x float>, <2 x float> }
%struct.__neon_int64x1x3_t = type { <1 x i64>, <1 x i64>, <1 x i64> }

; The same three-vector layout for the 128-bit vector variants.
%struct.__neon_int8x16x3_t = type { <16 x i8>,  <16 x i8>,  <16 x i8> }
%struct.__neon_int16x8x3_t = type { <8 x i16>, <8 x i16>, <8 x i16> }
%struct.__neon_int32x4x3_t = type { <4 x i32>, <4 x i32>, <4 x i32> }
%struct.__neon_float32x4x3_t = type { <4 x float>, <4 x float>, <4 x float> }

; Loads three <8 x i8> vectors through the vld3 intrinsic and returns the sum
; of struct fields 0 and 2, so both ends of the loaded triple are used.
define <8 x i8> @vld3i8(i8* %A) nounwind {
;CHECK: vld3i8:
; The call passes an alignment argument of 32; the instruction's maximum is
; 64 bits, so the expected address operand carries :64.
;CHECK: vld3.8 {d16, d17, d18}, [r0, :64]
  %triple = call %struct.__neon_int8x8x3_t @llvm.arm.neon.vld3.v8i8(i8* %A, i32 32)
  %vec0 = extractvalue %struct.__neon_int8x8x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_int8x8x3_t %triple, 2
  %sum = add <8 x i8> %vec0, %vec2
  ret <8 x i8> %sum
}

; Loads three <4 x i16> vectors through the vld3 intrinsic (alignment
; argument 1) and returns the sum of struct fields 0 and 2.
define <4 x i16> @vld3i16(i16* %A) nounwind {
;CHECK: vld3i16:
;CHECK: vld3.16
  ; The intrinsic takes an i8* address, so the typed pointer is cast first.
  %addr = bitcast i16* %A to i8*
  %triple = call %struct.__neon_int16x4x3_t @llvm.arm.neon.vld3.v4i16(i8* %addr, i32 1)
  %vec0 = extractvalue %struct.__neon_int16x4x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_int16x4x3_t %triple, 2
  %sum = add <4 x i16> %vec0, %vec2
  ret <4 x i16> %sum
}

; Loads three <2 x i32> vectors through the vld3 intrinsic (alignment
; argument 1) and returns the sum of struct fields 0 and 2.
define <2 x i32> @vld3i32(i32* %A) nounwind {
;CHECK: vld3i32:
;CHECK: vld3.32
  ; The intrinsic takes an i8* address, so the typed pointer is cast first.
  %addr = bitcast i32* %A to i8*
  %triple = call %struct.__neon_int32x2x3_t @llvm.arm.neon.vld3.v2i32(i8* %addr, i32 1)
  %vec0 = extractvalue %struct.__neon_int32x2x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_int32x2x3_t %triple, 2
  %sum = add <2 x i32> %vec0, %vec2
  ret <2 x i32> %sum
}

; Loads three <2 x float> vectors through the vld3 intrinsic (alignment
; argument 1) and returns the floating-point sum of struct fields 0 and 2.
define <2 x float> @vld3f(float* %A) nounwind {
;CHECK: vld3f:
;CHECK: vld3.32
  ; The intrinsic takes an i8* address, so the typed pointer is cast first.
  %addr = bitcast float* %A to i8*
  %triple = call %struct.__neon_float32x2x3_t @llvm.arm.neon.vld3.v2f32(i8* %addr, i32 1)
  %vec0 = extractvalue %struct.__neon_float32x2x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_float32x2x3_t %triple, 2
  %sum = fadd <2 x float> %vec0, %vec2
  ret <2 x float> %sum
}

; Loads three <1 x i64> vectors through the vld3 intrinsic and returns the sum
; of struct fields 0 and 2. For this element size the expected instruction is
; vld1.64 with a three-register list rather than a vld3 form.
define <1 x i64> @vld3i64(i64* %A) nounwind {
;CHECK: vld3i64:
; The call passes an alignment argument of 16; the instruction's maximum is
; 64 bits, so the expected address operand carries :64.
;CHECK: vld1.64 {d16, d17, d18}, [r0, :64]
  ; The intrinsic takes an i8* address, so the typed pointer is cast first.
  %addr = bitcast i64* %A to i8*
  %triple = call %struct.__neon_int64x1x3_t @llvm.arm.neon.vld3.v1i64(i8* %addr, i32 16)
  %vec0 = extractvalue %struct.__neon_int64x1x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_int64x1x3_t %triple, 2
  %sum = add <1 x i64> %vec0, %vec2
  ret <1 x i64> %sum
}

; Loads three <16 x i8> vectors through the vld3 intrinsic and returns the sum
; of struct fields 0 and 2. The expected output is a pair of vld3.8
; instructions: one over d16/d18/d20 whose address operand ends in "!", then
; one over d17/d19/d21.
define <16 x i8> @vld3Qi8(i8* %A) nounwind {
;CHECK: vld3Qi8:
; The call passes an alignment argument of 32; the instruction's maximum is
; 64 bits, so both expected address operands carry :64.
;CHECK: vld3.8 {d16, d18, d20}, [r0, :64]!
;CHECK: vld3.8 {d17, d19, d21}, [r0, :64]
  %triple = call %struct.__neon_int8x16x3_t @llvm.arm.neon.vld3.v16i8(i8* %A, i32 32)
  %vec0 = extractvalue %struct.__neon_int8x16x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_int8x16x3_t %triple, 2
  %sum = add <16 x i8> %vec0, %vec2
  ret <16 x i8> %sum
}

; Loads three <8 x i16> vectors through the vld3 intrinsic (alignment
; argument 1) and returns the sum of struct fields 0 and 2. Two vld3.16
; instructions are expected in the output.
define <8 x i16> @vld3Qi16(i16* %A) nounwind {
;CHECK: vld3Qi16:
;CHECK: vld3.16
;CHECK: vld3.16
  ; The intrinsic takes an i8* address, so the typed pointer is cast first.
  %addr = bitcast i16* %A to i8*
  %triple = call %struct.__neon_int16x8x3_t @llvm.arm.neon.vld3.v8i16(i8* %addr, i32 1)
  %vec0 = extractvalue %struct.__neon_int16x8x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_int16x8x3_t %triple, 2
  %sum = add <8 x i16> %vec0, %vec2
  ret <8 x i16> %sum
}

; Loads three <4 x i32> vectors through the vld3 intrinsic (alignment
; argument 1) and returns the sum of struct fields 0 and 2. Two vld3.32
; instructions are expected in the output.
define <4 x i32> @vld3Qi32(i32* %A) nounwind {
;CHECK: vld3Qi32:
;CHECK: vld3.32
;CHECK: vld3.32
  ; The intrinsic takes an i8* address, so the typed pointer is cast first.
  %addr = bitcast i32* %A to i8*
  %triple = call %struct.__neon_int32x4x3_t @llvm.arm.neon.vld3.v4i32(i8* %addr, i32 1)
  %vec0 = extractvalue %struct.__neon_int32x4x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_int32x4x3_t %triple, 2
  %sum = add <4 x i32> %vec0, %vec2
  ret <4 x i32> %sum
}

; Loads three <4 x float> vectors through the vld3 intrinsic (alignment
; argument 1) and returns the floating-point sum of struct fields 0 and 2.
; Two vld3.32 instructions are expected in the output.
define <4 x float> @vld3Qf(float* %A) nounwind {
;CHECK: vld3Qf:
;CHECK: vld3.32
;CHECK: vld3.32
  ; The intrinsic takes an i8* address, so the typed pointer is cast first.
  %addr = bitcast float* %A to i8*
  %triple = call %struct.__neon_float32x4x3_t @llvm.arm.neon.vld3.v4f32(i8* %addr, i32 1)
  %vec0 = extractvalue %struct.__neon_float32x4x3_t %triple, 0
  %vec2 = extractvalue %struct.__neon_float32x4x3_t %triple, 2
  %sum = fadd <4 x float> %vec0, %vec2
  ret <4 x float> %sum
}

; Declarations of the vld3 intrinsics for 64-bit vectors. Each takes an i8*
; address plus an i32 (the alignment value the tests in this file check) and
; returns the matching three-vector struct. All are marked nounwind readonly.
declare %struct.__neon_int8x8x3_t @llvm.arm.neon.vld3.v8i8(i8*, i32) nounwind readonly
declare %struct.__neon_int16x4x3_t @llvm.arm.neon.vld3.v4i16(i8*, i32) nounwind readonly
declare %struct.__neon_int32x2x3_t @llvm.arm.neon.vld3.v2i32(i8*, i32) nounwind readonly
declare %struct.__neon_float32x2x3_t @llvm.arm.neon.vld3.v2f32(i8*, i32) nounwind readonly
declare %struct.__neon_int64x1x3_t @llvm.arm.neon.vld3.v1i64(i8*, i32) nounwind readonly

; The same signatures for the 128-bit vector variants.
declare %struct.__neon_int8x16x3_t @llvm.arm.neon.vld3.v16i8(i8*, i32) nounwind readonly
declare %struct.__neon_int16x8x3_t @llvm.arm.neon.vld3.v8i16(i8*, i32) nounwind readonly
declare %struct.__neon_int32x4x3_t @llvm.arm.neon.vld3.v4i32(i8*, i32) nounwind readonly
declare %struct.__neon_float32x4x3_t @llvm.arm.neon.vld3.v4f32(i8*, i32) nounwind readonly
Eliminate more uses of llvm-as and llvm-dis. llvm-svn: 81293 2009-09-09 08:09:15 +08:00			`; RUN: llc < %s -march=arm -mattr=+neon \| FileCheck %s`
Add tests for new NEON vld instructions. llvm-svn: 78264 2009-08-06 08:38:31 +08:00
Update NEON struct names to match llvm-gcc changes. (This is not required for correctness but might help with sanity.) llvm-svn: 83415 2009-10-07 05:16:19 +08:00			`%struct.__neon_int8x8x3_t = type { <8 x i8>, <8 x i8>, <8 x i8> }`
			`%struct.__neon_int16x4x3_t = type { <4 x i16>, <4 x i16>, <4 x i16> }`
			`%struct.__neon_int32x2x3_t = type { <2 x i32>, <2 x i32>, <2 x i32> }`
			`%struct.__neon_float32x2x3_t = type { <2 x float>, <2 x float>, <2 x float> }`
Add codegen support for NEON vld3 intrinsics with <1 x i64> vectors. llvm-svn: 83506 2009-10-08 07:39:57 +08:00			`%struct.__neon_int64x1x3_t = type { <1 x i64>, <1 x i64>, <1 x i64> }`
Add tests for new NEON vld instructions. llvm-svn: 78264 2009-08-06 08:38:31 +08:00
Add codegen support for NEON vld3 intrinsics with 128-bit vectors. llvm-svn: 83471 2009-10-08 01:24:55 +08:00			`%struct.__neon_int8x16x3_t = type { <16 x i8>, <16 x i8>, <16 x i8> }`
			`%struct.__neon_int16x8x3_t = type { <8 x i16>, <8 x i16>, <8 x i16> }`
			`%struct.__neon_int32x4x3_t = type { <4 x i32>, <4 x i32>, <4 x i32> }`
			`%struct.__neon_float32x4x3_t = type { <4 x float>, <4 x float>, <4 x float> }`

Add tests for new NEON vld instructions. llvm-svn: 78264 2009-08-06 08:38:31 +08:00			`define <8 x i8> @vld3i8(i8* %A) nounwind {`
			`;CHECK: vld3i8:`
Set alignment operand for NEON VLD instructions. llvm-svn: 114696 2010-09-24 05:43:54 +08:00			`;Check the alignment value. Max for this instruction is 64 bits:`
Change register allocation order for ARM VFP and NEON registers to put the callee-saved registers at the end of the lists. Also prefer to avoid using the low registers that are in register subclasses required by certain instructions, so that those registers will more likely be available when needed. This change makes a huge improvement in spilling in some cases. Thanks to Jakob for helping me realize the problem. Most of this patch is fixing the testsuite. There are quite a few places where we're checking for specific registers. I changed those to wildcards in places where that doesn't weaken the tests. The spill-q.ll and thumb2-spill-q.ll tests stopped spilling with this change, so I added a bunch of live values to force spills on those tests. llvm-svn: 116055 2010-10-08 14:15:13 +08:00			`;CHECK: vld3.8 {d16, d17, d18}, [r0, :64]`
Set alignment operand for NEON VLD instructions. llvm-svn: 114696 2010-09-24 05:43:54 +08:00			`%tmp1 = call %struct.__neon_int8x8x3_t @llvm.arm.neon.vld3.v8i8(i8* %A, i32 32)`
Update NEON struct names to match llvm-gcc changes. (This is not required for correctness but might help with sanity.) llvm-svn: 83415 2009-10-07 05:16:19 +08:00			`%tmp2 = extractvalue %struct.__neon_int8x8x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_int8x8x3_t %tmp1, 2`
Add tests for new NEON vld instructions. llvm-svn: 78264 2009-08-06 08:38:31 +08:00			`%tmp4 = add <8 x i8> %tmp2, %tmp3`
			`ret <8 x i8> %tmp4`
			`}`

			`define <4 x i16> @vld3i16(i16* %A) nounwind {`
			`;CHECK: vld3i16:`
			`;CHECK: vld3.16`
Fix tests for Neon load/store intrinsics to match the i8* types expected by the intrinsics. The reason for those i8* types is that the intrinsics are overloaded on the vector type and we don't have a way to declare an intrinsic where one argument is an overloaded vector type and another argument is a pointer to the vector element type. The bitcasts added here will match what the frontend will typically generate when these intrinsics are used. llvm-svn: 101840 2010-04-20 08:17:16 +08:00			`%tmp0 = bitcast i16* %A to i8*`
Add alignment arguments to all the NEON load/store intrinsics. Update all the tests using those intrinsics and add support for auto-upgrading bitcode files with the old versions of the intrinsics. llvm-svn: 112271 2010-08-28 01:13:24 +08:00			`%tmp1 = call %struct.__neon_int16x4x3_t @llvm.arm.neon.vld3.v4i16(i8* %tmp0, i32 1)`
Update NEON struct names to match llvm-gcc changes. (This is not required for correctness but might help with sanity.) llvm-svn: 83415 2009-10-07 05:16:19 +08:00			`%tmp2 = extractvalue %struct.__neon_int16x4x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_int16x4x3_t %tmp1, 2`
Add tests for new NEON vld instructions. llvm-svn: 78264 2009-08-06 08:38:31 +08:00			`%tmp4 = add <4 x i16> %tmp2, %tmp3`
			`ret <4 x i16> %tmp4`
			`}`

			`define <2 x i32> @vld3i32(i32* %A) nounwind {`
			`;CHECK: vld3i32:`
			`;CHECK: vld3.32`
Fix tests for Neon load/store intrinsics to match the i8* types expected by the intrinsics. The reason for those i8* types is that the intrinsics are overloaded on the vector type and we don't have a way to declare an intrinsic where one argument is an overloaded vector type and another argument is a pointer to the vector element type. The bitcasts added here will match what the frontend will typically generate when these intrinsics are used. llvm-svn: 101840 2010-04-20 08:17:16 +08:00			`%tmp0 = bitcast i32* %A to i8*`
Add alignment arguments to all the NEON load/store intrinsics. Update all the tests using those intrinsics and add support for auto-upgrading bitcode files with the old versions of the intrinsics. llvm-svn: 112271 2010-08-28 01:13:24 +08:00			`%tmp1 = call %struct.__neon_int32x2x3_t @llvm.arm.neon.vld3.v2i32(i8* %tmp0, i32 1)`
Update NEON struct names to match llvm-gcc changes. (This is not required for correctness but might help with sanity.) llvm-svn: 83415 2009-10-07 05:16:19 +08:00			`%tmp2 = extractvalue %struct.__neon_int32x2x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_int32x2x3_t %tmp1, 2`
Add tests for new NEON vld instructions. llvm-svn: 78264 2009-08-06 08:38:31 +08:00			`%tmp4 = add <2 x i32> %tmp2, %tmp3`
			`ret <2 x i32> %tmp4`
			`}`

			`define <2 x float> @vld3f(float* %A) nounwind {`
			`;CHECK: vld3f:`
			`;CHECK: vld3.32`
Fix tests for Neon load/store intrinsics to match the i8* types expected by the intrinsics. The reason for those i8* types is that the intrinsics are overloaded on the vector type and we don't have a way to declare an intrinsic where one argument is an overloaded vector type and another argument is a pointer to the vector element type. The bitcasts added here will match what the frontend will typically generate when these intrinsics are used. llvm-svn: 101840 2010-04-20 08:17:16 +08:00			`%tmp0 = bitcast float* %A to i8*`
Add alignment arguments to all the NEON load/store intrinsics. Update all the tests using those intrinsics and add support for auto-upgrading bitcode files with the old versions of the intrinsics. llvm-svn: 112271 2010-08-28 01:13:24 +08:00			`%tmp1 = call %struct.__neon_float32x2x3_t @llvm.arm.neon.vld3.v2f32(i8* %tmp0, i32 1)`
Update NEON struct names to match llvm-gcc changes. (This is not required for correctness but might help with sanity.) llvm-svn: 83415 2009-10-07 05:16:19 +08:00			`%tmp2 = extractvalue %struct.__neon_float32x2x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_float32x2x3_t %tmp1, 2`
Fix tests to use fadd, fsub, and fmul, instead of add, sub, and mul, when the type is floating-point. llvm-svn: 102969 2010-05-04 06:36:46 +08:00			`%tmp4 = fadd <2 x float> %tmp2, %tmp3`
Add tests for new NEON vld instructions. llvm-svn: 78264 2009-08-06 08:38:31 +08:00			`ret <2 x float> %tmp4`
			`}`

Add codegen support for NEON vld3 intrinsics with <1 x i64> vectors. llvm-svn: 83506 2009-10-08 07:39:57 +08:00			`define <1 x i64> @vld3i64(i64* %A) nounwind {`
			`;CHECK: vld3i64:`
Set alignment operand for NEON VLD instructions. llvm-svn: 114696 2010-09-24 05:43:54 +08:00			`;Check the alignment value. Max for this instruction is 64 bits:`
Change register allocation order for ARM VFP and NEON registers to put the callee-saved registers at the end of the lists. Also prefer to avoid using the low registers that are in register subclasses required by certain instructions, so that those registers will more likely be available when needed. This change makes a huge improvement in spilling in some cases. Thanks to Jakob for helping me realize the problem. Most of this patch is fixing the testsuite. There are quite a few places where we're checking for specific registers. I changed those to wildcards in places where that doesn't weaken the tests. The spill-q.ll and thumb2-spill-q.ll tests stopped spilling with this change, so I added a bunch of live values to force spills on those tests. llvm-svn: 116055 2010-10-08 14:15:13 +08:00			`;CHECK: vld1.64 {d16, d17, d18}, [r0, :64]`
Fix tests for Neon load/store intrinsics to match the i8* types expected by the intrinsics. The reason for those i8* types is that the intrinsics are overloaded on the vector type and we don't have a way to declare an intrinsic where one argument is an overloaded vector type and another argument is a pointer to the vector element type. The bitcasts added here will match what the frontend will typically generate when these intrinsics are used. llvm-svn: 101840 2010-04-20 08:17:16 +08:00			`%tmp0 = bitcast i64* %A to i8*`
Set alignment operand for NEON VLD instructions. llvm-svn: 114696 2010-09-24 05:43:54 +08:00			`%tmp1 = call %struct.__neon_int64x1x3_t @llvm.arm.neon.vld3.v1i64(i8* %tmp0, i32 16)`
Add codegen support for NEON vld3 intrinsics with <1 x i64> vectors. llvm-svn: 83506 2009-10-08 07:39:57 +08:00			`%tmp2 = extractvalue %struct.__neon_int64x1x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_int64x1x3_t %tmp1, 2`
			`%tmp4 = add <1 x i64> %tmp2, %tmp3`
			`ret <1 x i64> %tmp4`
			`}`

Add codegen support for NEON vld3 intrinsics with 128-bit vectors. llvm-svn: 83471 2009-10-08 01:24:55 +08:00			`define <16 x i8> @vld3Qi8(i8* %A) nounwind {`
			`;CHECK: vld3Qi8:`
Set alignment operand for NEON VLD instructions. llvm-svn: 114696 2010-09-24 05:43:54 +08:00			`;Check the alignment value. Max for this instruction is 64 bits:`
Change register allocation order for ARM VFP and NEON registers to put the callee-saved registers at the end of the lists. Also prefer to avoid using the low registers that are in register subclasses required by certain instructions, so that those registers will more likely be available when needed. This change makes a huge improvement in spilling in some cases. Thanks to Jakob for helping me realize the problem. Most of this patch is fixing the testsuite. There are quite a few places where we're checking for specific registers. I changed those to wildcards in places where that doesn't weaken the tests. The spill-q.ll and thumb2-spill-q.ll tests stopped spilling with this change, so I added a bunch of live values to force spills on those tests. llvm-svn: 116055 2010-10-08 14:15:13 +08:00			`;CHECK: vld3.8 {d16, d18, d20}, [r0, :64]!`
			`;CHECK: vld3.8 {d17, d19, d21}, [r0, :64]`
Set alignment operand for NEON VLD instructions. llvm-svn: 114696 2010-09-24 05:43:54 +08:00			`%tmp1 = call %struct.__neon_int8x16x3_t @llvm.arm.neon.vld3.v16i8(i8* %A, i32 32)`
Add codegen support for NEON vld3 intrinsics with 128-bit vectors. llvm-svn: 83471 2009-10-08 01:24:55 +08:00			`%tmp2 = extractvalue %struct.__neon_int8x16x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_int8x16x3_t %tmp1, 2`
			`%tmp4 = add <16 x i8> %tmp2, %tmp3`
			`ret <16 x i8> %tmp4`
			`}`

			`define <8 x i16> @vld3Qi16(i16* %A) nounwind {`
			`;CHECK: vld3Qi16:`
			`;CHECK: vld3.16`
			`;CHECK: vld3.16`
Fix tests for Neon load/store intrinsics to match the i8* types expected by the intrinsics. The reason for those i8* types is that the intrinsics are overloaded on the vector type and we don't have a way to declare an intrinsic where one argument is an overloaded vector type and another argument is a pointer to the vector element type. The bitcasts added here will match what the frontend will typically generate when these intrinsics are used. llvm-svn: 101840 2010-04-20 08:17:16 +08:00			`%tmp0 = bitcast i16* %A to i8*`
Add alignment arguments to all the NEON load/store intrinsics. Update all the tests using those intrinsics and add support for auto-upgrading bitcode files with the old versions of the intrinsics. llvm-svn: 112271 2010-08-28 01:13:24 +08:00			`%tmp1 = call %struct.__neon_int16x8x3_t @llvm.arm.neon.vld3.v8i16(i8* %tmp0, i32 1)`
Add codegen support for NEON vld3 intrinsics with 128-bit vectors. llvm-svn: 83471 2009-10-08 01:24:55 +08:00			`%tmp2 = extractvalue %struct.__neon_int16x8x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_int16x8x3_t %tmp1, 2`
			`%tmp4 = add <8 x i16> %tmp2, %tmp3`
			`ret <8 x i16> %tmp4`
			`}`

			`define <4 x i32> @vld3Qi32(i32* %A) nounwind {`
			`;CHECK: vld3Qi32:`
			`;CHECK: vld3.32`
			`;CHECK: vld3.32`
Fix tests for Neon load/store intrinsics to match the i8* types expected by the intrinsics. The reason for those i8* types is that the intrinsics are overloaded on the vector type and we don't have a way to declare an intrinsic where one argument is an overloaded vector type and another argument is a pointer to the vector element type. The bitcasts added here will match what the frontend will typically generate when these intrinsics are used. llvm-svn: 101840 2010-04-20 08:17:16 +08:00			`%tmp0 = bitcast i32* %A to i8*`
Add alignment arguments to all the NEON load/store intrinsics. Update all the tests using those intrinsics and add support for auto-upgrading bitcode files with the old versions of the intrinsics. llvm-svn: 112271 2010-08-28 01:13:24 +08:00			`%tmp1 = call %struct.__neon_int32x4x3_t @llvm.arm.neon.vld3.v4i32(i8* %tmp0, i32 1)`
Add codegen support for NEON vld3 intrinsics with 128-bit vectors. llvm-svn: 83471 2009-10-08 01:24:55 +08:00			`%tmp2 = extractvalue %struct.__neon_int32x4x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_int32x4x3_t %tmp1, 2`
			`%tmp4 = add <4 x i32> %tmp2, %tmp3`
			`ret <4 x i32> %tmp4`
			`}`

			`define <4 x float> @vld3Qf(float* %A) nounwind {`
			`;CHECK: vld3Qf:`
			`;CHECK: vld3.32`
			`;CHECK: vld3.32`
Fix tests for Neon load/store intrinsics to match the i8* types expected by the intrinsics. The reason for those i8* types is that the intrinsics are overloaded on the vector type and we don't have a way to declare an intrinsic where one argument is an overloaded vector type and another argument is a pointer to the vector element type. The bitcasts added here will match what the frontend will typically generate when these intrinsics are used. llvm-svn: 101840 2010-04-20 08:17:16 +08:00			`%tmp0 = bitcast float* %A to i8*`
Add alignment arguments to all the NEON load/store intrinsics. Update all the tests using those intrinsics and add support for auto-upgrading bitcode files with the old versions of the intrinsics. llvm-svn: 112271 2010-08-28 01:13:24 +08:00			`%tmp1 = call %struct.__neon_float32x4x3_t @llvm.arm.neon.vld3.v4f32(i8* %tmp0, i32 1)`
Add codegen support for NEON vld3 intrinsics with 128-bit vectors. llvm-svn: 83471 2009-10-08 01:24:55 +08:00			`%tmp2 = extractvalue %struct.__neon_float32x4x3_t %tmp1, 0`
			`%tmp3 = extractvalue %struct.__neon_float32x4x3_t %tmp1, 2`
Fix tests to use fadd, fsub, and fmul, instead of add, sub, and mul, when the type is floating-point. llvm-svn: 102969 2010-05-04 06:36:46 +08:00			`%tmp4 = fadd <4 x float> %tmp2, %tmp3`
Add codegen support for NEON vld3 intrinsics with 128-bit vectors. llvm-svn: 83471 2009-10-08 01:24:55 +08:00			`ret <4 x float> %tmp4`
			`}`

Add alignment arguments to all the NEON load/store intrinsics. Update all the tests using those intrinsics and add support for auto-upgrading bitcode files with the old versions of the intrinsics. llvm-svn: 112271 2010-08-28 01:13:24 +08:00			`declare %struct.__neon_int8x8x3_t @llvm.arm.neon.vld3.v8i8(i8*, i32) nounwind readonly`
			`declare %struct.__neon_int16x4x3_t @llvm.arm.neon.vld3.v4i16(i8*, i32) nounwind readonly`
			`declare %struct.__neon_int32x2x3_t @llvm.arm.neon.vld3.v2i32(i8*, i32) nounwind readonly`
			`declare %struct.__neon_float32x2x3_t @llvm.arm.neon.vld3.v2f32(i8*, i32) nounwind readonly`
			`declare %struct.__neon_int64x1x3_t @llvm.arm.neon.vld3.v1i64(i8*, i32) nounwind readonly`
Add codegen support for NEON vld3 intrinsics with 128-bit vectors. llvm-svn: 83471 2009-10-08 01:24:55 +08:00
Add alignment arguments to all the NEON load/store intrinsics. Update all the tests using those intrinsics and add support for auto-upgrading bitcode files with the old versions of the intrinsics. llvm-svn: 112271 2010-08-28 01:13:24 +08:00			`declare %struct.__neon_int8x16x3_t @llvm.arm.neon.vld3.v16i8(i8*, i32) nounwind readonly`
			`declare %struct.__neon_int16x8x3_t @llvm.arm.neon.vld3.v8i16(i8*, i32) nounwind readonly`
			`declare %struct.__neon_int32x4x3_t @llvm.arm.neon.vld3.v4i32(i8*, i32) nounwind readonly`
			`declare %struct.__neon_float32x4x3_t @llvm.arm.neon.vld3.v4f32(i8*, i32) nounwind readonly`