; Origin: forked from OSchip/llvm-project (LLVM IR, 68 lines, 2.4 KiB).
; Cost-model test for vector fcmp/icmp on x86-64. The file is analyzed three
; times, once per -mcpu value below; each invocation enables the common CHECK
; prefix plus one CPU-specific FileCheck prefix (AVX1, AVX2 or AVX512).
; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-apple-macosx10.8.0 -mcpu=corei7-avx | FileCheck -check-prefix=CHECK -check-prefix=AVX1 %s
; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-apple-macosx10.8.0 -mcpu=core-avx2 | FileCheck -check-prefix=CHECK -check-prefix=AVX2 %s
; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-apple-macosx10.8.0 -mcpu=knl | FileCheck -check-prefix=CHECK -check-prefix=AVX512 %s

target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
target triple = "x86_64-apple-macosx10.8.0"

; Holds one vector compare per element type / width of interest. The comment
; lines directly above each instruction give the cost the analysis is expected
; to print for it under the corresponding FileCheck prefix. Every pattern names
; the value it belongs to, so it cannot be satisfied by a different instruction
; further down the output.
define i32 @cmp(i32 %arg) {
  ; -- floats --

  ; AVX1: cost of 1 {{.*}} %A = fcmp
  ; AVX2: cost of 1 {{.*}} %A = fcmp
  %A = fcmp olt <2 x float> undef, undef
  ; AVX1: cost of 1 {{.*}} %B = fcmp
  ; AVX2: cost of 1 {{.*}} %B = fcmp
  %B = fcmp olt <4 x float> undef, undef
  ; AVX1: cost of 1 {{.*}} %C = fcmp
  ; AVX2: cost of 1 {{.*}} %C = fcmp
  %C = fcmp olt <8 x float> undef, undef
  ; AVX1: cost of 1 {{.*}} %D = fcmp
  ; AVX2: cost of 1 {{.*}} %D = fcmp
  %D = fcmp olt <2 x double> undef, undef
  ; AVX1: cost of 1 {{.*}} %E = fcmp
  ; AVX2: cost of 1 {{.*}} %E = fcmp
  %E = fcmp olt <4 x double> undef, undef

  ; The 16-element float/double compares are only checked for the knl run.
  ; AVX512: cost of 1 {{.*}} %E1 = fcmp
  %E1 = fcmp olt <16 x float> undef, undef
  ; AVX512: cost of 2 {{.*}} %E2 = fcmp
  %E2 = fcmp olt <16 x double> undef, undef

  ; -- integers --

  ; AVX1: cost of 1 {{.*}} %F = icmp
  ; AVX2: cost of 1 {{.*}} %F = icmp
  %F = icmp eq <16 x i8> undef, undef
  ; AVX1: cost of 1 {{.*}} %G = icmp
  ; AVX2: cost of 1 {{.*}} %G = icmp
  %G = icmp eq <8 x i16> undef, undef
  ; AVX1: cost of 1 {{.*}} %H = icmp
  ; AVX2: cost of 1 {{.*}} %H = icmp
  %H = icmp eq <4 x i32> undef, undef
  ; AVX1: cost of 1 {{.*}} %I = icmp
  ; AVX2: cost of 1 {{.*}} %I = icmp
  %I = icmp eq <2 x i64> undef, undef
  ; From here on the operands are 256 bits wide; the expected cost is 4 for
  ; the corei7-avx run and 1 for the core-avx2 run.
  ; AVX1: cost of 4 {{.*}} %J = icmp
  ; AVX2: cost of 1 {{.*}} %J = icmp
  %J = icmp eq <4 x i64> undef, undef
  ; AVX1: cost of 4 {{.*}} %K = icmp
  ; AVX2: cost of 1 {{.*}} %K = icmp
  %K = icmp eq <8 x i32> undef, undef
  ; AVX1: cost of 4 {{.*}} %L = icmp
  ; AVX2: cost of 1 {{.*}} %L = icmp
  %L = icmp eq <16 x i16> undef, undef
  ; AVX1: cost of 4 {{.*}} %M = icmp
  ; AVX2: cost of 1 {{.*}} %M = icmp
  %M = icmp eq <32 x i8> undef, undef

  ; The 16-element i32/i64 compares are only checked for the knl run.
  ; AVX512: cost of 1 {{.*}} %M1 = icmp
  %M1 = icmp eq <16 x i32> undef, undef
  ; AVX512: cost of 2 {{.*}} %M2 = icmp
  %M2 = icmp eq <16 x i64> undef, undef

  ; The return is expected to be free under every configuration.
  ; CHECK: cost of 0 {{.*}} ret
  ret i32 undef
}