forked from OSchip/llvm-project
[NFC][X86][CostModel] Add some load/store tests w/ non-power-of-two elt cnt vectors
For example the cost to load <48 x i16> should likely be 3, because that's just 3x load i256.
This commit is contained in:
parent
b601c67192
commit
aa165eac32
|
@ -25,6 +25,18 @@ define i32 @stores(i32 %arg) {
|
|||
; SSE-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 13 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 12 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 12 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 14 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 22 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 24 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 26 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 46 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 48 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 50 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 94 for instruction: store <47 x i16> undef, <47 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 96 for instruction: store <48 x i16> undef, <48 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 98 for instruction: store <49 x i16> undef, <49 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef
|
||||
;
|
||||
; AVX-LABEL: 'stores'
|
||||
|
@ -45,6 +57,18 @@ define i32 @stores(i32 %arg) {
|
|||
; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 11 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 12 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 12 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 14 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 25 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 28 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 31 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 54 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 56 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 59 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 117 for instruction: store <47 x i16> undef, <47 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 120 for instruction: store <48 x i16> undef, <48 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 122 for instruction: store <49 x i16> undef, <49 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef
|
||||
;
|
||||
; AVX512-LABEL: 'stores'
|
||||
|
@ -65,6 +89,18 @@ define i32 @stores(i32 %arg) {
|
|||
; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 11 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 13 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 12 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 14 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 25 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 28 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 31 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 61 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 64 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 67 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 125 for instruction: store <47 x i16> undef, <47 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 128 for instruction: store <48 x i16> undef, <48 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 131 for instruction: store <49 x i16> undef, <49 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef
|
||||
;
|
||||
store i8 undef, i8* undef, align 4
|
||||
|
@ -89,6 +125,22 @@ define i32 @stores(i32 %arg) {
|
|||
store <5 x i32> undef, <5 x i32>* undef, align 4
|
||||
store <5 x i64> undef, <5 x i64>* undef, align 4
|
||||
|
||||
store <5 x i16> undef, <5 x i16>* undef, align 4
|
||||
store <6 x i16> undef, <6 x i16>* undef, align 4 ; 1 x i64 + 1 x i32
|
||||
store <7 x i16> undef, <7 x i16>* undef, align 4
|
||||
|
||||
store <11 x i16> undef, <11 x i16>* undef, align 4
|
||||
store <12 x i16> undef, <12 x i16>* undef, align 4 ; 1 x i128 + 1 x i64
|
||||
store <13 x i16> undef, <13 x i16>* undef, align 4
|
||||
|
||||
store <23 x i16> undef, <23 x i16>* undef, align 4
|
||||
store <24 x i16> undef, <24 x i16>* undef, align 4 ; 1 x i256 + 1 x i128
|
||||
store <25 x i16> undef, <25 x i16>* undef, align 4
|
||||
|
||||
store <47 x i16> undef, <47 x i16>* undef, align 4
|
||||
store <48 x i16> undef, <48 x i16>* undef, align 4 ; 3 x i256
|
||||
store <49 x i16> undef, <49 x i16>* undef, align 4
|
||||
|
||||
ret i32 undef
|
||||
}
|
||||
|
||||
|
@ -111,6 +163,18 @@ define i32 @loads(i32 %arg) {
|
|||
; SSE-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %15 = load <3 x i64>, <3 x i64>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %16 = load <5 x i32>, <5 x i32>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %17 = load <5 x i64>, <5 x i64>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %18 = load <5 x i16>, <5 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %19 = load <6 x i16>, <6 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %20 = load <7 x i16>, <7 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 22 for instruction: %21 = load <11 x i16>, <11 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 24 for instruction: %22 = load <12 x i16>, <12 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 26 for instruction: %23 = load <13 x i16>, <13 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 46 for instruction: %24 = load <23 x i16>, <23 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 48 for instruction: %25 = load <24 x i16>, <24 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 50 for instruction: %26 = load <25 x i16>, <25 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 94 for instruction: %27 = load <47 x i16>, <47 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 96 for instruction: %28 = load <48 x i16>, <48 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 98 for instruction: %29 = load <49 x i16>, <49 x i16>* undef, align 4
|
||||
; SSE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef
|
||||
;
|
||||
; AVX-LABEL: 'loads'
|
||||
|
@ -131,6 +195,18 @@ define i32 @loads(i32 %arg) {
|
|||
; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %15 = load <3 x i64>, <3 x i64>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 13 for instruction: %16 = load <5 x i32>, <5 x i32>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 13 for instruction: %17 = load <5 x i64>, <5 x i64>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %18 = load <5 x i16>, <5 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %19 = load <6 x i16>, <6 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %20 = load <7 x i16>, <7 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 25 for instruction: %21 = load <11 x i16>, <11 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 27 for instruction: %22 = load <12 x i16>, <12 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 29 for instruction: %23 = load <13 x i16>, <13 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 49 for instruction: %24 = load <23 x i16>, <23 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 51 for instruction: %25 = load <24 x i16>, <24 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 55 for instruction: %26 = load <25 x i16>, <25 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 101 for instruction: %27 = load <47 x i16>, <47 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 102 for instruction: %28 = load <48 x i16>, <48 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 105 for instruction: %29 = load <49 x i16>, <49 x i16>* undef, align 4
|
||||
; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef
|
||||
;
|
||||
; AVX512-LABEL: 'loads'
|
||||
|
@ -151,6 +227,18 @@ define i32 @loads(i32 %arg) {
|
|||
; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %15 = load <3 x i64>, <3 x i64>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 13 for instruction: %16 = load <5 x i32>, <5 x i32>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %17 = load <5 x i64>, <5 x i64>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %18 = load <5 x i16>, <5 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %19 = load <6 x i16>, <6 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %20 = load <7 x i16>, <7 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 25 for instruction: %21 = load <11 x i16>, <11 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 27 for instruction: %22 = load <12 x i16>, <12 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 29 for instruction: %23 = load <13 x i16>, <13 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 50 for instruction: %24 = load <23 x i16>, <23 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 51 for instruction: %25 = load <24 x i16>, <24 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 55 for instruction: %26 = load <25 x i16>, <25 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 101 for instruction: %27 = load <47 x i16>, <47 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 102 for instruction: %28 = load <48 x i16>, <48 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 106 for instruction: %29 = load <49 x i16>, <49 x i16>* undef, align 4
|
||||
; AVX512-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef
|
||||
;
|
||||
load i8, i8* undef, align 4
|
||||
|
@ -175,5 +263,21 @@ define i32 @loads(i32 %arg) {
|
|||
load <5 x i32>, <5 x i32>* undef, align 4
|
||||
load <5 x i64>, <5 x i64>* undef, align 4
|
||||
|
||||
load <5 x i16>, <5 x i16>* undef, align 4
|
||||
load <6 x i16>, <6 x i16>* undef, align 4 ; 1 x i64 + 1 x i32
|
||||
load <7 x i16>, <7 x i16>* undef, align 4
|
||||
|
||||
load <11 x i16>, <11 x i16>* undef, align 4
|
||||
load <12 x i16>, <12 x i16>* undef, align 4 ; 1 x i128 + 1 x i64
|
||||
load <13 x i16>, <13 x i16>* undef, align 4
|
||||
|
||||
load <23 x i16>, <23 x i16>* undef, align 4
|
||||
load <24 x i16>, <24 x i16>* undef, align 4 ; 1 x i256 + 1 x i128
|
||||
load <25 x i16>, <25 x i16>* undef, align 4
|
||||
|
||||
load <47 x i16>, <47 x i16>* undef, align 4
|
||||
load <48 x i16>, <48 x i16>* undef, align 4 ; 3 x i256
|
||||
load <49 x i16>, <49 x i16>* undef, align 4
|
||||
|
||||
ret i32 undef
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue