forked from OSchip/llvm-project
75 lines
2.5 KiB
C
75 lines
2.5 KiB
C
// Test with fast math
// RUN: %clang_cc1 -triple i386-pc-linux-gnu -emit-llvm -DFAST \
// RUN: -mreassociate \
// RUN: -o - %s | FileCheck --check-prefixes CHECK,CHECKFAST,CHECKNP %s
//
// Test with fast math and fprotect-parens
// RUN: %clang_cc1 -triple i386-pc-linux-gnu -emit-llvm -DFAST \
// RUN: -mreassociate -fprotect-parens -ffp-contract=on \
// RUN: -o - %s | FileCheck --check-prefixes CHECK,CHECKFAST,CHECKPP %s
//
// Test without fast math: llvm intrinsic not created
// RUN: %clang_cc1 -triple i386-pc-linux-gnu -emit-llvm -fprotect-parens \
// RUN: -o - %s | FileCheck --implicit-check-not="llvm.arithmetic.fence" %s
//
|
|
// Global int that addit and addit1 store their results into; the float
// expressions assigned to it in addit are converted to int on the store.
int v;
|
|
int addit(float a, float b) {
|
|
// CHECK: define {{.*}}@addit(float noundef %a, float noundef %b) #0 {
|
|
_Complex double cd, cd1;
|
|
cd = __arithmetic_fence(cd1);
|
|
// CHECKFAST: call{{.*}} double @llvm.arithmetic.fence.f64({{.*}}real)
|
|
// CHECKFAST: call{{.*}} double @llvm.arithmetic.fence.f64({{.*}}imag)
|
|
// Vector should be supported.
|
|
typedef float __v2f32 __attribute__((__vector_size__(8)));
|
|
__v2f32 vec1, vec2;
|
|
vec1 = __arithmetic_fence(vec2);
|
|
// CHECKFAST: call{{.*}} <2 x float> @llvm.arithmetic.fence.v2f32
|
|
vec2 = (vec2 + vec1);
|
|
// CHECKPP: call{{.*}} <2 x float> @llvm.arithmetic.fence.v2f32
|
|
|
|
v = __arithmetic_fence(a + b);
|
|
// CHECKFAST: call{{.*}} float @llvm.arithmetic.fence.f32(float %add{{.*}})
|
|
|
|
v = (a + b);
|
|
// CHECKPP: call{{.*}} float @llvm.arithmetic.fence.f32(float %add{{.*}})
|
|
v = a + (b*b);
|
|
// CHECKPP: fmul reassoc
|
|
// CHECKPP-NEXT: call{{.*}} float @llvm.arithmetic.fence.f32(float %mul)
|
|
// CHECKNP: fmul
|
|
// CHECKNP: fadd
|
|
v = b + a*a;
|
|
// CHECKPP: call{{.*}} float @llvm.fmuladd.f32
|
|
// CHECKNP: fmul
|
|
// CHECKNP: fadd
|
|
v = b + __arithmetic_fence(a*a); // Fence blocks recognition of FMA
|
|
// CHECKPP: fmul
|
|
// CHECKNP: fmul
|
|
|
|
b = (a);
|
|
(a) = b;
|
|
// CHECK-NEXT fptosi
|
|
// CHECK-NEXT store i32
|
|
// CHECK-NEXT load float
|
|
// CHECK-NEXT store float
|
|
// CHECK-NEXT load float
|
|
// CHECK-NEXT store float
|
|
return 0;
|
|
// CHECK-NEXT ret i32 0
|
|
}
|
|
int addit1(int a, int b) {
|
|
// CHECK: define {{.*}}@addit1(i32 noundef %a, i32 noundef %b{{.*}}
|
|
v = (a + b);
|
|
// CHECK-NOT: call{{.*}} float @llvm.arithmetic.fence.int(float noundef %add)
|
|
return 0;
|
|
}
|
|
#ifdef FAST
// Only built by the runs that pass -DFAST. With precise float control turned
// back on for this function, neither the explicit __arithmetic_fence nor the
// parenthesized expression is expected to emit a fence call.
#pragma float_control(precise, on)
int subit(float a, float b, float *fp) {
  // CHECKFAST: define {{.*}}@subit(float noundef %a, float noundef %b{{.*}}
  *fp = __arithmetic_fence(a - b);
  *fp = (a + b);
  // The pattern deliberately omits the argument list so that it covers both
  // statements above regardless of the operand's name or attributes.
  // CHECK-NOT: call{{.*}} float @llvm.arithmetic.fence.f32
  return 0;
}
#endif
|