; llvm-project/llvm/test/CodeGen/X86/avx-cvt.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx | FileCheck %s

; Signed integer to float conversion on a full 256-bit vector:
; <8 x i32> -> <8 x float>. The expected output is a single vcvtdq2ps that
; reads and writes %ymm0, followed directly by the return.
define <8 x float> @sitofp00(<8 x i32> %a) nounwind {
; CHECK-LABEL: sitofp00:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtdq2ps %ymm0, %ymm0
; CHECK-NEXT:    retq
  %b = sitofp <8 x i32> %a to <8 x float>
  ret <8 x float> %b
}

; Float to signed integer conversion on a full 256-bit vector:
; <8 x float> -> <8 x i32>. The expected output is a single vcvttps2dq
; (the truncating form) that reads and writes %ymm0.
define <8 x i32> @fptosi00(<8 x float> %a) nounwind {
; CHECK-LABEL: fptosi00:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvttps2dq %ymm0, %ymm0
; CHECK-NEXT:    retq
  %b = fptosi <8 x float> %a to <8 x i32>
  ret <8 x i32> %b
}

; Widening signed integer to double conversion: <4 x i32> -> <4 x double>.
; The expected output is a single vcvtdq2pd that takes the 128-bit source in
; %xmm0 and produces the 256-bit result in %ymm0.
define <4 x double> @sitofp01(<4 x i32> %a) {
; CHECK-LABEL: sitofp01:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtdq2pd %xmm0, %ymm0
; CHECK-NEXT:    retq
  %b = sitofp <4 x i32> %a to <4 x double>
  ret <4 x double> %b
}

; Signed <8 x i16> -> <8 x float> conversion. The expected output first
; builds an <8 x i32> value and then converts it with one vcvtdq2ps:
;   1. vpmovsxwd sign-extends the low four i16 elements into %xmm1;
;   2. vpshufd [2,3,0,1] moves the upper 64 bits of the source to the bottom;
;   3. a second vpmovsxwd sign-extends those four elements;
;   4. vinsertf128 joins both halves into %ymm0;
;   5. vcvtdq2ps converts all eight i32 lanes to float.
define <8 x float> @sitofp02(<8 x i16> %a) {
; CHECK-LABEL: sitofp02:
; CHECK:       # BB#0:
; CHECK-NEXT:    vpmovsxwd %xmm0, %xmm1
; CHECK-NEXT:    vpshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
; CHECK-NEXT:    vpmovsxwd %xmm0, %xmm0
; CHECK-NEXT:    vinsertf128 $1, %xmm0, %ymm1, %ymm0
; CHECK-NEXT:    vcvtdq2ps %ymm0, %ymm0
; CHECK-NEXT:    retq
  %b = sitofp <8 x i16> %a to <8 x float>
  ret <8 x float> %b
}

; Narrowing double to signed integer conversion: <4 x double> -> <4 x i32>.
; The expected output is a single vcvttpd2dqy from %ymm0 into %xmm0, and a
; vzeroupper is expected between the conversion and the return.
define <4 x i32> @fptosi01(<4 x double> %a) {
; CHECK-LABEL: fptosi01:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvttpd2dqy %ymm0, %xmm0
; CHECK-NEXT:    vzeroupper
; CHECK-NEXT:    retq
  %b = fptosi <4 x double> %a to <4 x i32>
  ret <4 x i32> %b
}

; Floating-point truncation of a 512-bit value: <8 x double> -> <8 x float>.
; In the expected output the argument occupies %ymm0 and %ymm1; each half is
; narrowed to four floats with vcvtpd2psy, and vinsertf128 places the second
; result in the upper 128 bits of %ymm0.
define <8 x float> @fptrunc00(<8 x double> %b) nounwind {
; CHECK-LABEL: fptrunc00:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtpd2psy %ymm0, %xmm0
; CHECK-NEXT:    vcvtpd2psy %ymm1, %xmm1
; CHECK-NEXT:    vinsertf128 $1, %xmm1, %ymm0, %ymm0
; CHECK-NEXT:    retq
  %a = fptrunc <8 x double> %b to <8 x float>
  ret <8 x float> %a
}

; Floating-point extension: <4 x float> -> <4 x double>. The expected output
; is a single vcvtps2pd that widens %xmm0 into %ymm0.
define <4 x double> @fpext00(<4 x float> %b) nounwind {
; CHECK-LABEL: fpext00:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtps2pd %xmm0, %ymm0
; CHECK-NEXT:    retq
  %a = fpext <4 x float> %b to <4 x double>
  ret <4 x double> %a
}

; Scalar i64 -> double conversion of a value loaded through %e. The expected
; output folds the load into the conversion: a single vcvtsi2sdq with a
; (%rdi) memory operand and no separate load instruction.
define double @funcA(i64* nocapture %e) nounwind uwtable readonly ssp {
; CHECK-LABEL: funcA:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtsi2sdq (%rdi), %xmm0, %xmm0
; CHECK-NEXT:    retq
  %tmp1 = load i64, i64* %e, align 8
  %conv = sitofp i64 %tmp1 to double
  ret double %conv
}

; Scalar i32 -> double conversion of a value loaded through %e. The expected
; output folds the load into the conversion: a single vcvtsi2sdl with a
; (%rdi) memory operand and no separate load instruction.
define double @funcB(i32* nocapture %e) nounwind uwtable readonly ssp {
; CHECK-LABEL: funcB:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtsi2sdl (%rdi), %xmm0, %xmm0
; CHECK-NEXT:    retq
  %tmp1 = load i32, i32* %e, align 4
  %conv = sitofp i32 %tmp1 to double
  ret double %conv
}

; Scalar i32 -> float conversion of a value loaded through %e. The expected
; output folds the load into the conversion: a single vcvtsi2ssl with a
; (%rdi) memory operand and no separate load instruction.
define float @funcC(i32* nocapture %e) nounwind uwtable readonly ssp {
; CHECK-LABEL: funcC:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtsi2ssl (%rdi), %xmm0, %xmm0
; CHECK-NEXT:    retq
  %tmp1 = load i32, i32* %e, align 4
  %conv = sitofp i32 %tmp1 to float
  ret float %conv
}

; Scalar i64 -> float conversion of a value loaded through %e. The expected
; output folds the load into the conversion: a single vcvtsi2ssq with a
; (%rdi) memory operand and no separate load instruction.
define float @funcD(i64* nocapture %e) nounwind uwtable readonly ssp {
; CHECK-LABEL: funcD:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtsi2ssq (%rdi), %xmm0, %xmm0
; CHECK-NEXT:    retq
  %tmp1 = load i64, i64* %e, align 8
  %conv = sitofp i64 %tmp1 to float
  ret float %conv
}

; Scalar float -> double extension between two stack slots. The expected
; output is a vcvtss2sd that reads its source directly from the stack (the
; load is folded into the conversion), followed by a vmovsd that stores the
; result back to the stack. The stack offsets are matched with a regex, so
; only their sign and the %rsp base are pinned.
define void @fpext() nounwind uwtable {
; CHECK-LABEL: fpext:
; CHECK:       # BB#0:
; CHECK-NEXT:    vcvtss2sd -{{[0-9]+}}(%rsp), %xmm0, %xmm0
; CHECK-NEXT:    vmovsd %xmm0, -{{[0-9]+}}(%rsp)
; CHECK-NEXT:    retq
  ; Source and destination slots; nothing in this function stores to %f
  ; before it is loaded.
  %f = alloca float, align 4
  %d = alloca double, align 8
  %tmp = load float, float* %f, align 4
  %conv = fpext float %tmp to double
  store double %conv, double* %d, align 8
  ret void
}

; Lowering of the llvm.nearbyint.f64 intrinsic. The expected output is a
; single vroundsd on %xmm0 with immediate 12 (0b1100: round using the current
; MXCSR rounding mode, with the inexact exception suppressed).
define double @nearbyint_f64(double %a) {
; CHECK-LABEL: nearbyint_f64:
; CHECK:       # BB#0:
; CHECK-NEXT:    vroundsd $12, %xmm0, %xmm0, %xmm0
; CHECK-NEXT:    retq
  %res = call double @llvm.nearbyint.f64(double %a)
  ret double %res
}
; Declaration of the intrinsic called by @nearbyint_f64.
declare double @llvm.nearbyint.f64(double %p)

; Lowering of the llvm.floor.f32 intrinsic. The expected output is a single
; vroundss on %xmm0 with immediate 9 (0b1001: round toward negative infinity,
; with the inexact exception suppressed).
define float @floor_f32(float %a) {
; CHECK-LABEL: floor_f32:
; CHECK:       # BB#0:
; CHECK-NEXT:    vroundss $9, %xmm0, %xmm0, %xmm0
; CHECK-NEXT:    retq
  %res = call float @llvm.floor.f32(float %a)
  ret float %res
}
; Declaration of the intrinsic called by @floor_f32.
declare float @llvm.floor.f32(float %p)
Make utils/update_llc_test_checks.py note that the assertions are autogenerated. Also update existing test cases which appear to be generated by it and weren't modified (other than addition of the header) by rerunning it. llvm-svn: 253917 2015-11-24 05:33:58 +08:00			`; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx \| FileCheck %s`
- Teach SSEDomainFix to switch between different levels of AVX instructions. Here we guess that AVX will have domain issues, so just implement them for consistency and in the future we remove if it's unnecessary. - Make foldMemoryOperandImpl aware of 256-bit zero vectors folding and support the 128-bit counterparts of AVX too. - Make sure MOV[AU]PS instructions are only selected when SSE1 is enabled, and duplicate the patterns to match AVX. - Add a testcase for a simple 128-bit zero vector creation. llvm-svn: 110946 2010-08-13 04:20:53 +08:00
Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`define <8 x float> @sitofp00(<8 x i32> %a) nounwind {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: sitofp00:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvtdq2ps %ymm0, %ymm0`
			`; CHECK-NEXT: retq`
Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`%b = sitofp <8 x i32> %a to <8 x float>`
			`ret <8 x float> %b`
			`}`
- Teach SSEDomainFix to switch between different levels of AVX instructions. Here we guess that AVX will have domain issues, so just implement them for consistency and in the future we remove if it's unnecessary. - Make foldMemoryOperandImpl aware of 256-bit zero vectors folding and support the 128-bit counterparts of AVX too. - Make sure MOV[AU]PS instructions are only selected when SSE1 is enabled, and duplicate the patterns to match AVX. - Add a testcase for a simple 128-bit zero vector creation. llvm-svn: 110946 2010-08-13 04:20:53 +08:00
Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`define <8 x i32> @fptosi00(<8 x float> %a) nounwind {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: fptosi00:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvttps2dq %ymm0, %ymm0`
			`; CHECK-NEXT: retq`
Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`%b = fptosi <8 x float> %a to <8 x i32>`
			`ret <8 x i32> %b`
- Teach SSEDomainFix to switch between different levels of AVX instructions. Here we guess that AVX will have domain issues, so just implement them for consistency and in the future we remove if it's unnecessary. - Make foldMemoryOperandImpl aware of 256-bit zero vectors folding and support the 128-bit counterparts of AVX too. - Make sure MOV[AU]PS instructions are only selected when SSE1 is enabled, and duplicate the patterns to match AVX. - Add a testcase for a simple 128-bit zero vector creation. llvm-svn: 110946 2010-08-13 04:20:53 +08:00			`}`

Reapply a more appropriate solution than in r137114. AVX supports v4f64 = sitofp v4i32. This fix PR10559. Also add support for v4i32 = fptosi v4f64. llvm-svn: 137128 2011-08-10 01:39:13 +08:00			`define <4 x double> @sitofp01(<4 x i32> %a) {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: sitofp01:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvtdq2pd %xmm0, %ymm0`
			`; CHECK-NEXT: retq`
Reapply a more appropriate solution than in r137114. AVX supports v4f64 = sitofp v4i32. This fix PR10559. Also add support for v4i32 = fptosi v4f64. llvm-svn: 137128 2011-08-10 01:39:13 +08:00			`%b = sitofp <4 x i32> %a to <4 x double>`
			`ret <4 x double> %b`
			`}`

X86: Promote sitofp <8 x i16> to <8 x i32> when AVX is available. A vector sext + sitofp is a lot cheaper than 8 scalar conversions. llvm-svn: 178448 2013-03-31 20:49:15 +08:00			`define <8 x float> @sitofp02(<8 x i16> %a) {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: sitofp02:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vpmovsxwd %xmm0, %xmm1`
			`; CHECK-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]`
			`; CHECK-NEXT: vpmovsxwd %xmm0, %xmm0`
			`; CHECK-NEXT: vinsertf128 $1, %xmm0, %ymm1, %ymm0`
			`; CHECK-NEXT: vcvtdq2ps %ymm0, %ymm0`
			`; CHECK-NEXT: retq`
X86: Promote sitofp <8 x i16> to <8 x i32> when AVX is available. A vector sext + sitofp is a lot cheaper than 8 scalar conversions. llvm-svn: 178448 2013-03-31 20:49:15 +08:00			`%b = sitofp <8 x i16> %a to <8 x float>`
			`ret <8 x float> %b`
			`}`

Reapply a more appropriate solution than in r137114. AVX supports v4f64 = sitofp v4i32. This fix PR10559. Also add support for v4i32 = fptosi v4f64. llvm-svn: 137128 2011-08-10 01:39:13 +08:00			`define <4 x i32> @fptosi01(<4 x double> %a) {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: fptosi01:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvttpd2dqy %ymm0, %xmm0`
			`; CHECK-NEXT: vzeroupper`
			`; CHECK-NEXT: retq`
Reapply a more appropriate solution than in r137114. AVX supports v4f64 = sitofp v4i32. This fix PR10559. Also add support for v4i32 = fptosi v4f64. llvm-svn: 137128 2011-08-10 01:39:13 +08:00			`%b = fptosi <4 x double> %a to <4 x i32>`
			`ret <4 x i32> %b`
			`}`

Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`define <8 x float> @fptrunc00(<8 x double> %b) nounwind {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: fptrunc00:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvtpd2psy %ymm0, %xmm0`
			`; CHECK-NEXT: vcvtpd2psy %ymm1, %xmm1`
			`; CHECK-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm0`
			`; CHECK-NEXT: retq`
Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`%a = fptrunc <8 x double> %b to <8 x float>`
			`ret <8 x float> %a`
Add support for avx vector fextend llvm-svn: 137105 2011-08-09 11:04:29 +08:00			`}`

			`define <4 x double> @fpext00(<4 x float> %b) nounwind {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: fpext00:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvtps2pd %xmm0, %ymm0`
			`; CHECK-NEXT: retq`
Add support for avx vector fextend llvm-svn: 137105 2011-08-09 11:04:29 +08:00			`%a = fpext <4 x float> %b to <4 x double>`
			`ret <4 x double> %a`
Add AVX support for fpextend. Original patch by Syoyo Fujita with more comments by me. llvm-svn: 133153 2011-06-16 15:03:21 +08:00			`}`
Add AVX 128-bit patterns for sint_to_fp llvm-svn: 135332 2011-07-16 08:50:20 +08:00
			`define double @funcA(i64* nocapture %e) nounwind uwtable readonly ssp {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: funcA:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvtsi2sdq (%rdi), %xmm0, %xmm0`
			`; CHECK-NEXT: retq`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%tmp1 = load i64, i64* %e, align 8`
Add AVX 128-bit patterns for sint_to_fp llvm-svn: 135332 2011-07-16 08:50:20 +08:00			`%conv = sitofp i64 %tmp1 to double`
			`ret double %conv`
			`}`

			`define double @funcB(i32* nocapture %e) nounwind uwtable readonly ssp {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: funcB:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvtsi2sdl (%rdi), %xmm0, %xmm0`
			`; CHECK-NEXT: retq`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%tmp1 = load i32, i32* %e, align 4`
Add AVX 128-bit patterns for sint_to_fp llvm-svn: 135332 2011-07-16 08:50:20 +08:00			`%conv = sitofp i32 %tmp1 to double`
			`ret double %conv`
			`}`

			`define float @funcC(i32* nocapture %e) nounwind uwtable readonly ssp {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: funcC:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvtsi2ssl (%rdi), %xmm0, %xmm0`
			`; CHECK-NEXT: retq`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%tmp1 = load i32, i32* %e, align 4`
Add AVX 128-bit patterns for sint_to_fp llvm-svn: 135332 2011-07-16 08:50:20 +08:00			`%conv = sitofp i32 %tmp1 to float`
			`ret float %conv`
			`}`

			`define float @funcD(i64* nocapture %e) nounwind uwtable readonly ssp {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: funcD:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vcvtsi2ssq (%rdi), %xmm0, %xmm0`
			`; CHECK-NEXT: retq`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%tmp1 = load i64, i64* %e, align 8`
Add AVX 128-bit patterns for sint_to_fp llvm-svn: 135332 2011-07-16 08:50:20 +08:00			`%conv = sitofp i64 %tmp1 to float`
			`ret float %conv`
			`}`
Add AVX 128-bit sqrt versions llvm-svn: 135404 2011-07-19 01:51:40 +08:00
Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`define void @fpext() nounwind uwtable {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: fpext:`
			`; CHECK: # BB#0:`
Allow PeepholeOptimizer to fold a few more cases The condition for clearing the folding candidate list was clamped together with the "uninteresting instruction" condition. This is too conservative, e.g. we don't need to clear the list when encountering an IMPLICIT_DEF. Differential Revision: http://reviews.llvm.org/D11591 llvm-svn: 244577 2015-08-11 16:19:43 +08:00			`; CHECK-NEXT: vcvtss2sd -{{[0-9]+}}(%rsp), %xmm0, %xmm0`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-NEXT: vmovsd %xmm0, -{{[0-9]+}}(%rsp)`
			`; CHECK-NEXT: retq`
Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`%f = alloca float, align 4`
			`%d = alloca double, align 8`
[opaque pointer type] Add textual IR support for explicit type parameter to load instruction Essentially the same as the GEP change in r230786. A similar migration script can be used to update test cases, though a few more test case improvements/changes were required this time around: (r229269-r229278) import fileinput import sys import re pat = re.compile(r"((?:=\|:\|^)\sload (?:atomic )?(?:volatile )?(.?))(\| addrspace\(\d+\) )\($\| (?:%\|@\|null\|undef\|blockaddress\|getelementptr\|addrspacecast\|bitcast\|inttoptr\|\[\[[a-zA-Z]\|\{\{).$)") for line in sys.stdin: sys.stdout.write(re.sub(pat, r"\1, \2\3*\4", line)) Reviewers: rafael, dexonsmith, grosser Differential Revision: http://reviews.llvm.org/D7649 llvm-svn: 230794 2015-02-28 05:17:42 +08:00			`%tmp = load float, float* %f, align 4`
Rename and tidy up tests llvm-svn: 137103 2011-08-09 11:04:23 +08:00			`%conv = fpext float %tmp to double`
			`store double %conv, double* %d, align 8`
			`ret void`
Add AVX 128-bit sqrt versions llvm-svn: 135404 2011-07-19 01:51:40 +08:00			`}`

AVX-512: recommitted 229837 + bugfix + test llvm-svn: 230223 2015-02-23 23:12:31 +08:00			`define double @nearbyint_f64(double %a) {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: nearbyint_f64:`
			`; CHECK: # BB#0:`
			`; CHECK-NEXT: vroundsd $12, %xmm0, %xmm0, %xmm0`
			`; CHECK-NEXT: retq`
AVX-512: recommitted 229837 + bugfix + test llvm-svn: 230223 2015-02-23 23:12:31 +08:00			`%res = call double @llvm.nearbyint.f64(double %a)`
			`ret double %res`
			`}`
			`declare double @llvm.nearbyint.f64(double %p)`

			`define float @floor_f32(float %a) {`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-LABEL: floor_f32:`
			`; CHECK: # BB#0:`
Don't raise inexact when lowering ceil, floor, round, trunc. The C standard has historically not specified whether or not these functions should raise the inexact flag. Traditionally on Darwin, these functions did raise inexact, and the llvm lowerings followed that conventions. n1778 (C bindings for IEEE-754 (2008)) clarifies that these functions should not set inexact. This patch brings the lowerings for arm64 and x86 in line with the newly specified behavior. This also lets us fold some logic into TD patterns, which is nice. Differential Revision: http://reviews.llvm.org/D12969 llvm-svn: 248266 2015-09-22 19:43:17 +08:00			`; CHECK-NEXT: vroundss $9, %xmm0, %xmm0, %xmm0`
use update_llc_test_checks.py to tighten checking; remove unnecessary testing params llvm-svn: 234027 2015-04-04 01:13:31 +08:00			`; CHECK-NEXT: retq`
AVX-512: recommitted 229837 + bugfix + test llvm-svn: 230223 2015-02-23 23:12:31 +08:00			`%res = call float @llvm.floor.f32(float %a)`
			`ret float %res`
			`}`
			`declare float @llvm.floor.f32(float %p)`