2017-07-16 21:59:44 +08:00
|
|
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=x86-64 -mattr=+bmi | FileCheck %s --check-prefix=CHECK --check-prefix=GENERIC
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=haswell | FileCheck %s --check-prefix=CHECK --check-prefix=HASWELL
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=broadwell | FileCheck %s --check-prefix=CHECK --check-prefix=BROADWELL
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=skylake | FileCheck %s --check-prefix=CHECK --check-prefix=SKYLAKE
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=knl | FileCheck %s --check-prefix=CHECK --check-prefix=HASWELL
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=btver2 | FileCheck %s --check-prefix=CHECK --check-prefix=BTVER2
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -print-schedule -mcpu=znver1 | FileCheck %s --check-prefix=CHECK --check-prefix=ZNVER1
;
; One llc invocation per CPU model, all with -print-schedule so the emitted
; assembly carries the "# sched" annotations the assertions below match.
; Only the generic x86-64 invocation needs -mattr=+bmi spelled out; the knl
; invocation is matched against the same assertions as haswell.
|
2017-07-16 21:59:44 +08:00
|
|
|
|
|
|
|
; ANDN on i16 operands: returns (~%a0 & %a1) + (~%a0 & load(%a2)).
; Every CPU model below expects the register operand to be folded into a
; 32-bit andnl, while the memory operand is handled by a notl + andw pair.
define i16 @test_andn_i16(i16 zeroext %a0, i16 zeroext %a1, i16 *%a2) {
; GENERIC-LABEL: test_andn_i16:
; GENERIC: # %bb.0:
; GENERIC-NEXT: andnl %esi, %edi, %eax # sched: [1:0.33]
; GENERIC-NEXT: notl %edi # sched: [1:0.33]
; GENERIC-NEXT: andw (%rdx), %di # sched: [6:0.50]
; GENERIC-NEXT: addl %edi, %eax # sched: [1:0.33]
; GENERIC-NEXT: # kill: def %ax killed %ax killed %eax
; GENERIC-NEXT: retq # sched: [1:1.00]
;
; HASWELL-LABEL: test_andn_i16:
; HASWELL: # %bb.0:
; HASWELL-NEXT: andnl %esi, %edi, %eax # sched: [1:0.50]
; HASWELL-NEXT: notl %edi # sched: [1:0.25]
; HASWELL-NEXT: andw (%rdx), %di # sched: [6:0.50]
; HASWELL-NEXT: addl %edi, %eax # sched: [1:0.25]
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andn_i16:
; BROADWELL: # %bb.0:
; BROADWELL-NEXT: andnl %esi, %edi, %eax # sched: [1:0.50]
; BROADWELL-NEXT: notl %edi # sched: [1:0.25]
; BROADWELL-NEXT: andw (%rdx), %di # sched: [6:0.50]
; BROADWELL-NEXT: addl %edi, %eax # sched: [1:0.25]
; BROADWELL-NEXT: # kill: def %ax killed %ax killed %eax
; BROADWELL-NEXT: retq # sched: [7:1.00]
;
; SKYLAKE-LABEL: test_andn_i16:
; SKYLAKE: # %bb.0:
; SKYLAKE-NEXT: andnl %esi, %edi, %eax # sched: [1:0.50]
; SKYLAKE-NEXT: notl %edi # sched: [1:0.25]
; SKYLAKE-NEXT: andw (%rdx), %di # sched: [6:0.50]
; SKYLAKE-NEXT: addl %edi, %eax # sched: [1:0.25]
; SKYLAKE-NEXT: # kill: def %ax killed %ax killed %eax
; SKYLAKE-NEXT: retq # sched: [7:1.00]
;
; BTVER2-LABEL: test_andn_i16:
; BTVER2: # %bb.0:
; BTVER2-NEXT: andnl %esi, %edi, %eax # sched: [1:0.50]
; BTVER2-NEXT: notl %edi # sched: [1:0.50]
; BTVER2-NEXT: andw (%rdx), %di # sched: [4:1.00]
; BTVER2-NEXT: addl %edi, %eax # sched: [1:0.50]
; BTVER2-NEXT: # kill: def %ax killed %ax killed %eax
; BTVER2-NEXT: retq # sched: [4:1.00]
;
; ZNVER1-LABEL: test_andn_i16:
; ZNVER1: # %bb.0:
; ZNVER1-NEXT: andnl %esi, %edi, %eax # sched: [1:0.25]
; ZNVER1-NEXT: notl %edi # sched: [1:0.25]
; ZNVER1-NEXT: andw (%rdx), %di # sched: [5:0.50]
; ZNVER1-NEXT: addl %edi, %eax # sched: [1:0.25]
; ZNVER1-NEXT: # kill: def %ax killed %ax killed %eax
; ZNVER1-NEXT: retq # sched: [1:0.50]
  ; Memory operand for the second and-not.
  %1 = load i16, i16 *%a2
  ; xor with -1 is bitwise NOT of %a0; it feeds both 'and' instructions.
  %2 = xor i16 %a0, -1
  %3 = and i16 %2, %a1
  %4 = and i16 %2, %1
  ; Summing the two results keeps both and-not computations live.
  %5 = add i16 %3, %4
  ret i16 %5
}
|
|
|
|
|
|
|
|
; ANDN on i32 operands: returns (~%a0 & %a1) + (~%a0 & load(%a2)).
; Both the register form and the memory form are expected to become andnl;
; the btver2 and znver1 assertions list the memory form first.
define i32 @test_andn_i32(i32 %a0, i32 %a1, i32 *%a2) {
; GENERIC-LABEL: test_andn_i32:
; GENERIC: # %bb.0:
; GENERIC-NEXT: andnl %esi, %edi, %ecx # sched: [1:0.33]
; GENERIC-NEXT: andnl (%rdx), %edi, %eax # sched: [5:0.50]
; GENERIC-NEXT: addl %ecx, %eax # sched: [1:0.33]
; GENERIC-NEXT: retq # sched: [1:1.00]
;
; HASWELL-LABEL: test_andn_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: andnl %esi, %edi, %ecx # sched: [1:0.50]
; HASWELL-NEXT: andnl (%rdx), %edi, %eax # sched: [6:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andn_i32:
; BROADWELL: # %bb.0:
; BROADWELL-NEXT: andnl %esi, %edi, %ecx # sched: [1:0.50]
; BROADWELL-NEXT: andnl (%rdx), %edi, %eax # sched: [6:0.50]
; BROADWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
; BROADWELL-NEXT: retq # sched: [7:1.00]
;
; SKYLAKE-LABEL: test_andn_i32:
; SKYLAKE: # %bb.0:
; SKYLAKE-NEXT: andnl %esi, %edi, %ecx # sched: [1:0.50]
; SKYLAKE-NEXT: andnl (%rdx), %edi, %eax # sched: [6:0.50]
; SKYLAKE-NEXT: addl %ecx, %eax # sched: [1:0.25]
; SKYLAKE-NEXT: retq # sched: [7:1.00]
;
; BTVER2-LABEL: test_andn_i32:
; BTVER2: # %bb.0:
; BTVER2-NEXT: andnl (%rdx), %edi, %eax # sched: [4:1.00]
; BTVER2-NEXT: andnl %esi, %edi, %ecx # sched: [1:0.50]
; BTVER2-NEXT: addl %ecx, %eax # sched: [1:0.50]
; BTVER2-NEXT: retq # sched: [4:1.00]
;
; ZNVER1-LABEL: test_andn_i32:
; ZNVER1: # %bb.0:
; ZNVER1-NEXT: andnl (%rdx), %edi, %eax # sched: [5:0.50]
; ZNVER1-NEXT: andnl %esi, %edi, %ecx # sched: [1:0.25]
; ZNVER1-NEXT: addl %ecx, %eax # sched: [1:0.25]
; ZNVER1-NEXT: retq # sched: [1:0.50]
  ; Memory operand for the second and-not.
  %1 = load i32, i32 *%a2
  ; xor with -1 is bitwise NOT of %a0; it feeds both 'and' instructions.
  %2 = xor i32 %a0, -1
  %3 = and i32 %2, %a1
  %4 = and i32 %2, %1
  ; Summing the two results keeps both and-not computations live.
  %5 = add i32 %3, %4
  ret i32 %5
}
|
|
|
|
|
|
|
|
; ANDN on i64 operands: returns (~%a0 & %a1) + (~%a0 & load(%a2)).
; Both the register form and the memory form are expected to become andnq;
; the btver2 and znver1 assertions list the memory form first.
define i64 @test_andn_i64(i64 %a0, i64 %a1, i64 *%a2) {
; GENERIC-LABEL: test_andn_i64:
; GENERIC: # %bb.0:
; GENERIC-NEXT: andnq %rsi, %rdi, %rcx # sched: [1:0.33]
; GENERIC-NEXT: andnq (%rdx), %rdi, %rax # sched: [5:0.50]
; GENERIC-NEXT: addq %rcx, %rax # sched: [1:0.33]
; GENERIC-NEXT: retq # sched: [1:1.00]
;
; HASWELL-LABEL: test_andn_i64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: andnq %rsi, %rdi, %rcx # sched: [1:0.50]
; HASWELL-NEXT: andnq (%rdx), %rdi, %rax # sched: [6:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_andn_i64:
; BROADWELL: # %bb.0:
; BROADWELL-NEXT: andnq %rsi, %rdi, %rcx # sched: [1:0.50]
; BROADWELL-NEXT: andnq (%rdx), %rdi, %rax # sched: [6:0.50]
; BROADWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
; BROADWELL-NEXT: retq # sched: [7:1.00]
;
; SKYLAKE-LABEL: test_andn_i64:
; SKYLAKE: # %bb.0:
; SKYLAKE-NEXT: andnq %rsi, %rdi, %rcx # sched: [1:0.50]
; SKYLAKE-NEXT: andnq (%rdx), %rdi, %rax # sched: [6:0.50]
; SKYLAKE-NEXT: addq %rcx, %rax # sched: [1:0.25]
; SKYLAKE-NEXT: retq # sched: [7:1.00]
;
; BTVER2-LABEL: test_andn_i64:
; BTVER2: # %bb.0:
; BTVER2-NEXT: andnq (%rdx), %rdi, %rax # sched: [4:1.00]
; BTVER2-NEXT: andnq %rsi, %rdi, %rcx # sched: [1:0.50]
; BTVER2-NEXT: addq %rcx, %rax # sched: [1:0.50]
; BTVER2-NEXT: retq # sched: [4:1.00]
;
; ZNVER1-LABEL: test_andn_i64:
; ZNVER1: # %bb.0:
; ZNVER1-NEXT: andnq (%rdx), %rdi, %rax # sched: [5:0.50]
; ZNVER1-NEXT: andnq %rsi, %rdi, %rcx # sched: [1:0.25]
; ZNVER1-NEXT: addq %rcx, %rax # sched: [1:0.25]
; ZNVER1-NEXT: retq # sched: [1:0.50]
  ; Memory operand for the second and-not.
  %1 = load i64, i64 *%a2
  ; xor with -1 is bitwise NOT of %a0; it feeds both 'and' instructions.
  %2 = xor i64 %a0, -1
  %3 = and i64 %2, %a1
  %4 = and i64 %2, %1
  ; Summing the two results keeps both and-not computations live.
  %5 = add i64 %3, %4
  ret i64 %5
}
|
|
|
|
|
|
|
|
; BEXTR on i32 via the llvm.x86.bmi.bextr.32 intrinsic: one call takes its
; source from memory (load of %a2), the other from the register %a1; both use
; %a0 as the second intrinsic argument. The two results are added together.
define i32 @test_bextr_i32(i32 %a0, i32 %a1, i32 *%a2) {
; GENERIC-LABEL: test_bextr_i32:
; GENERIC: # %bb.0:
; GENERIC-NEXT: bextrl %edi, (%rdx), %ecx # sched: [5:0.50]
; GENERIC-NEXT: bextrl %edi, %esi, %eax # sched: [1:0.33]
; GENERIC-NEXT: addl %ecx, %eax # sched: [1:0.33]
; GENERIC-NEXT: retq # sched: [1:1.00]
;
; HASWELL-LABEL: test_bextr_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: bextrl %edi, (%rdx), %ecx # sched: [7:0.50]
; HASWELL-NEXT: bextrl %edi, %esi, %eax # sched: [2:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bextr_i32:
; BROADWELL: # %bb.0:
; BROADWELL-NEXT: bextrl %edi, (%rdx), %ecx # sched: [7:0.50]
; BROADWELL-NEXT: bextrl %edi, %esi, %eax # sched: [2:0.50]
; BROADWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
; BROADWELL-NEXT: retq # sched: [7:1.00]
;
; SKYLAKE-LABEL: test_bextr_i32:
; SKYLAKE: # %bb.0:
; SKYLAKE-NEXT: bextrl %edi, (%rdx), %ecx # sched: [7:0.50]
; SKYLAKE-NEXT: bextrl %edi, %esi, %eax # sched: [2:0.50]
; SKYLAKE-NEXT: addl %ecx, %eax # sched: [1:0.25]
; SKYLAKE-NEXT: retq # sched: [7:1.00]
;
; BTVER2-LABEL: test_bextr_i32:
; BTVER2: # %bb.0:
; BTVER2-NEXT: bextrl %edi, (%rdx), %ecx # sched: [4:1.00]
; BTVER2-NEXT: bextrl %edi, %esi, %eax # sched: [1:0.50]
; BTVER2-NEXT: addl %ecx, %eax # sched: [1:0.50]
; BTVER2-NEXT: retq # sched: [4:1.00]
;
; ZNVER1-LABEL: test_bextr_i32:
; ZNVER1: # %bb.0:
; ZNVER1-NEXT: bextrl %edi, (%rdx), %ecx # sched: [5:0.50]
; ZNVER1-NEXT: bextrl %edi, %esi, %eax # sched: [1:0.25]
; ZNVER1-NEXT: addl %ecx, %eax # sched: [1:0.25]
; ZNVER1-NEXT: retq # sched: [1:0.50]
  ; Source value for the memory-operand form.
  %1 = load i32, i32 *%a2
  %2 = tail call i32 @llvm.x86.bmi.bextr.32(i32 %1, i32 %a0)
  %3 = tail call i32 @llvm.x86.bmi.bextr.32(i32 %a1, i32 %a0)
  ; Summing the two results keeps both intrinsic calls live.
  %4 = add i32 %2, %3
  ret i32 %4
}
; Intrinsic called by test_bextr_i32 above.
declare i32 @llvm.x86.bmi.bextr.32(i32, i32)
|
|
|
|
|
|
|
|
; BEXTR on i64 via the llvm.x86.bmi.bextr.64 intrinsic: one call takes its
; source from memory (load of %a2), the other from the register %a1; both use
; %a0 as the second intrinsic argument. The two results are added together.
define i64 @test_bextr_i64(i64 %a0, i64 %a1, i64 *%a2) {
; GENERIC-LABEL: test_bextr_i64:
; GENERIC: # %bb.0:
; GENERIC-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [5:0.50]
; GENERIC-NEXT: bextrq %rdi, %rsi, %rax # sched: [1:0.33]
; GENERIC-NEXT: addq %rcx, %rax # sched: [1:0.33]
; GENERIC-NEXT: retq # sched: [1:1.00]
;
; HASWELL-LABEL: test_bextr_i64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [7:0.50]
; HASWELL-NEXT: bextrq %rdi, %rsi, %rax # sched: [2:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_bextr_i64:
; BROADWELL: # %bb.0:
; BROADWELL-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [7:0.50]
; BROADWELL-NEXT: bextrq %rdi, %rsi, %rax # sched: [2:0.50]
; BROADWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
; BROADWELL-NEXT: retq # sched: [7:1.00]
;
; SKYLAKE-LABEL: test_bextr_i64:
; SKYLAKE: # %bb.0:
; SKYLAKE-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [7:0.50]
; SKYLAKE-NEXT: bextrq %rdi, %rsi, %rax # sched: [2:0.50]
; SKYLAKE-NEXT: addq %rcx, %rax # sched: [1:0.25]
; SKYLAKE-NEXT: retq # sched: [7:1.00]
;
; BTVER2-LABEL: test_bextr_i64:
; BTVER2: # %bb.0:
; BTVER2-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [4:1.00]
; BTVER2-NEXT: bextrq %rdi, %rsi, %rax # sched: [1:0.50]
; BTVER2-NEXT: addq %rcx, %rax # sched: [1:0.50]
; BTVER2-NEXT: retq # sched: [4:1.00]
;
; ZNVER1-LABEL: test_bextr_i64:
; ZNVER1: # %bb.0:
; ZNVER1-NEXT: bextrq %rdi, (%rdx), %rcx # sched: [5:0.50]
; ZNVER1-NEXT: bextrq %rdi, %rsi, %rax # sched: [1:0.25]
; ZNVER1-NEXT: addq %rcx, %rax # sched: [1:0.25]
; ZNVER1-NEXT: retq # sched: [1:0.50]
  ; Source value for the memory-operand form.
  %1 = load i64, i64 *%a2
  %2 = tail call i64 @llvm.x86.bmi.bextr.64(i64 %1, i64 %a0)
  %3 = tail call i64 @llvm.x86.bmi.bextr.64(i64 %a1, i64 %a0)
  ; Summing the two results keeps both intrinsic calls live.
  %4 = add i64 %2, %3
  ret i64 %4
}
; Intrinsic called by test_bextr_i64 above.
declare i64 @llvm.x86.bmi.bextr.64(i64, i64)
|
|
|
|
|
|
|
|
; BLSI on i32: returns (m & (0 - m)) + (%a0 & (0 - %a0)), where m is the value
; loaded from %a1. Each 'x & -x' is expected to become a single blsil, once
; with a memory operand and once with a register operand.
define i32 @test_blsi_i32(i32 %a0, i32 *%a1) {
; GENERIC-LABEL: test_blsi_i32:
; GENERIC: # %bb.0:
; GENERIC-NEXT: blsil (%rsi), %ecx # sched: [5:0.50]
; GENERIC-NEXT: blsil %edi, %eax # sched: [1:0.33]
; GENERIC-NEXT: addl %ecx, %eax # sched: [1:0.33]
; GENERIC-NEXT: retq # sched: [1:1.00]
;
; HASWELL-LABEL: test_blsi_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: blsil (%rsi), %ecx # sched: [6:0.50]
; HASWELL-NEXT: blsil %edi, %eax # sched: [1:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsi_i32:
; BROADWELL: # %bb.0:
; BROADWELL-NEXT: blsil (%rsi), %ecx # sched: [6:0.50]
; BROADWELL-NEXT: blsil %edi, %eax # sched: [1:0.50]
; BROADWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
; BROADWELL-NEXT: retq # sched: [7:1.00]
;
; SKYLAKE-LABEL: test_blsi_i32:
; SKYLAKE: # %bb.0:
; SKYLAKE-NEXT: blsil (%rsi), %ecx # sched: [6:0.50]
; SKYLAKE-NEXT: blsil %edi, %eax # sched: [1:0.50]
; SKYLAKE-NEXT: addl %ecx, %eax # sched: [1:0.25]
; SKYLAKE-NEXT: retq # sched: [7:1.00]
;
; BTVER2-LABEL: test_blsi_i32:
; BTVER2: # %bb.0:
; BTVER2-NEXT: blsil (%rsi), %ecx # sched: [4:1.00]
; BTVER2-NEXT: blsil %edi, %eax # sched: [1:0.50]
; BTVER2-NEXT: addl %ecx, %eax # sched: [1:0.50]
; BTVER2-NEXT: retq # sched: [4:1.00]
;
; ZNVER1-LABEL: test_blsi_i32:
; ZNVER1: # %bb.0:
; ZNVER1-NEXT: blsil (%rsi), %ecx # sched: [6:0.50]
; ZNVER1-NEXT: blsil %edi, %eax # sched: [2:0.25]
; ZNVER1-NEXT: addl %ecx, %eax # sched: [1:0.25]
; ZNVER1-NEXT: retq # sched: [1:0.50]
  ; Source value for the memory-operand form.
  %1 = load i32, i32 *%a1
  ; 0 - x is the negation of x; and-ing it with x forms the 'x & -x' pattern.
  %2 = sub i32 0, %1
  %3 = sub i32 0, %a0
  %4 = and i32 %1, %2
  %5 = and i32 %a0, %3
  ; Summing the two results keeps both computations live.
  %6 = add i32 %4, %5
  ret i32 %6
}
|
|
|
|
|
|
|
|
; BLSI on i64: returns (m & (0 - m)) + (%a0 & (0 - %a0)), where m is the value
; loaded from %a1. Each 'x & -x' is expected to become a single blsiq, once
; with a memory operand and once with a register operand.
define i64 @test_blsi_i64(i64 %a0, i64 *%a1) {
; GENERIC-LABEL: test_blsi_i64:
; GENERIC: # %bb.0:
; GENERIC-NEXT: blsiq (%rsi), %rcx # sched: [5:0.50]
; GENERIC-NEXT: blsiq %rdi, %rax # sched: [1:0.33]
; GENERIC-NEXT: addq %rcx, %rax # sched: [1:0.33]
; GENERIC-NEXT: retq # sched: [1:1.00]
;
; HASWELL-LABEL: test_blsi_i64:
; HASWELL: # %bb.0:
; HASWELL-NEXT: blsiq (%rsi), %rcx # sched: [6:0.50]
; HASWELL-NEXT: blsiq %rdi, %rax # sched: [1:0.50]
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsi_i64:
; BROADWELL: # %bb.0:
; BROADWELL-NEXT: blsiq (%rsi), %rcx # sched: [6:0.50]
; BROADWELL-NEXT: blsiq %rdi, %rax # sched: [1:0.50]
; BROADWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
; BROADWELL-NEXT: retq # sched: [7:1.00]
;
; SKYLAKE-LABEL: test_blsi_i64:
; SKYLAKE: # %bb.0:
; SKYLAKE-NEXT: blsiq (%rsi), %rcx # sched: [6:0.50]
; SKYLAKE-NEXT: blsiq %rdi, %rax # sched: [1:0.50]
; SKYLAKE-NEXT: addq %rcx, %rax # sched: [1:0.25]
; SKYLAKE-NEXT: retq # sched: [7:1.00]
;
; BTVER2-LABEL: test_blsi_i64:
; BTVER2: # %bb.0:
; BTVER2-NEXT: blsiq (%rsi), %rcx # sched: [4:1.00]
; BTVER2-NEXT: blsiq %rdi, %rax # sched: [1:0.50]
; BTVER2-NEXT: addq %rcx, %rax # sched: [1:0.50]
; BTVER2-NEXT: retq # sched: [4:1.00]
;
; ZNVER1-LABEL: test_blsi_i64:
; ZNVER1: # %bb.0:
; ZNVER1-NEXT: blsiq (%rsi), %rcx # sched: [6:0.50]
; ZNVER1-NEXT: blsiq %rdi, %rax # sched: [2:0.25]
; ZNVER1-NEXT: addq %rcx, %rax # sched: [1:0.25]
; ZNVER1-NEXT: retq # sched: [1:0.50]
  ; Source value for the memory-operand form.
  %1 = load i64, i64 *%a1
  ; 0 - x is the negation of x; and-ing it with x forms the 'x & -x' pattern.
  %2 = sub i64 0, %1
  %3 = sub i64 0, %a0
  %4 = and i64 %1, %2
  %5 = and i64 %a0, %3
  ; Summing the two results keeps both computations live.
  %6 = add i64 %4, %5
  ret i64 %6
}
|
|
|
|
|
|
|
|
; BLSMSK on i32: returns (m ^ (m - 1)) + (%a0 ^ (%a0 - 1)), where m is the
; value loaded from %a1. Each 'x ^ (x - 1)' is expected to become a single
; blsmskl, once with a memory operand and once with a register operand.
define i32 @test_blsmsk_i32(i32 %a0, i32 *%a1) {
; GENERIC-LABEL: test_blsmsk_i32:
; GENERIC: # %bb.0:
; GENERIC-NEXT: blsmskl (%rsi), %ecx # sched: [5:0.50]
; GENERIC-NEXT: blsmskl %edi, %eax # sched: [1:0.33]
; GENERIC-NEXT: addl %ecx, %eax # sched: [1:0.33]
; GENERIC-NEXT: retq # sched: [1:1.00]
;
; HASWELL-LABEL: test_blsmsk_i32:
; HASWELL: # %bb.0:
; HASWELL-NEXT: blsmskl (%rsi), %ecx # sched: [6:0.50]
; HASWELL-NEXT: blsmskl %edi, %eax # sched: [1:0.50]
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
; HASWELL-NEXT: retq # sched: [7:1.00]
;
; BROADWELL-LABEL: test_blsmsk_i32:
; BROADWELL: # %bb.0:
; BROADWELL-NEXT: blsmskl (%rsi), %ecx # sched: [6:0.50]
; BROADWELL-NEXT: blsmskl %edi, %eax # sched: [1:0.50]
; BROADWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
; BROADWELL-NEXT: retq # sched: [7:1.00]
;
; SKYLAKE-LABEL: test_blsmsk_i32:
; SKYLAKE: # %bb.0:
; SKYLAKE-NEXT: blsmskl (%rsi), %ecx # sched: [6:0.50]
; SKYLAKE-NEXT: blsmskl %edi, %eax # sched: [1:0.50]
; SKYLAKE-NEXT: addl %ecx, %eax # sched: [1:0.25]
; SKYLAKE-NEXT: retq # sched: [7:1.00]
;
; BTVER2-LABEL: test_blsmsk_i32:
; BTVER2: # %bb.0:
; BTVER2-NEXT: blsmskl (%rsi), %ecx # sched: [4:1.00]
; BTVER2-NEXT: blsmskl %edi, %eax # sched: [1:0.50]
; BTVER2-NEXT: addl %ecx, %eax # sched: [1:0.50]
; BTVER2-NEXT: retq # sched: [4:1.00]
;
; ZNVER1-LABEL: test_blsmsk_i32:
; ZNVER1: # %bb.0:
; ZNVER1-NEXT: blsmskl (%rsi), %ecx # sched: [6:0.50]
; ZNVER1-NEXT: blsmskl %edi, %eax # sched: [2:0.25]
; ZNVER1-NEXT: addl %ecx, %eax # sched: [1:0.25]
; ZNVER1-NEXT: retq # sched: [1:0.50]
  ; Source value for the memory-operand form.
  %1 = load i32, i32 *%a1
  ; x - 1 xor-ed with x forms the 'x ^ (x - 1)' pattern.
  %2 = sub i32 %1, 1
  %3 = sub i32 %a0, 1
  %4 = xor i32 %1, %2
  %5 = xor i32 %a0, %3
  ; Summing the two results keeps both computations live.
  %6 = add i32 %4, %5
  ret i32 %6
}
|
|
|
|
|
|
|
|
define i64 @test_blsmsk_i64(i64 %a0, i64 *%a1) {
|
|
|
|
; GENERIC-LABEL: test_blsmsk_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; GENERIC: # %bb.0:
|
2017-12-08 01:37:39 +08:00
|
|
|
; GENERIC-NEXT: blsmskq (%rsi), %rcx # sched: [5:0.50]
|
|
|
|
; GENERIC-NEXT: blsmskq %rdi, %rax # sched: [1:0.33]
|
2017-08-01 23:14:35 +08:00
|
|
|
; GENERIC-NEXT: addq %rcx, %rax # sched: [1:0.33]
|
|
|
|
; GENERIC-NEXT: retq # sched: [1:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
|
|
|
; HASWELL-LABEL: test_blsmsk_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; HASWELL: # %bb.0:
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: blsmskq (%rsi), %rcx # sched: [6:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
; HASWELL-NEXT: blsmskq %rdi, %rax # sched: [1:0.50]
|
|
|
|
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: retq # sched: [7:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-LABEL: test_blsmsk_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BROADWELL: # %bb.0:
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: blsmskq (%rsi), %rcx # sched: [6:0.50]
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-NEXT: blsmskq %rdi, %rax # sched: [1:0.50]
|
|
|
|
; BROADWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: retq # sched: [7:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
;
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-LABEL: test_blsmsk_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKYLAKE: # %bb.0:
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: blsmskq (%rsi), %rcx # sched: [6:0.50]
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-NEXT: blsmskq %rdi, %rax # sched: [1:0.50]
|
|
|
|
; SKYLAKE-NEXT: addq %rcx, %rax # sched: [1:0.25]
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: retq # sched: [7:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
;
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-LABEL: test_blsmsk_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BTVER2: # %bb.0:
|
2017-12-08 01:37:39 +08:00
|
|
|
; BTVER2-NEXT: blsmskq (%rsi), %rcx # sched: [4:1.00]
|
|
|
|
; BTVER2-NEXT: blsmskq %rdi, %rax # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-NEXT: addq %rcx, %rax # sched: [1:0.50]
|
|
|
|
; BTVER2-NEXT: retq # sched: [4:1.00]
|
2017-07-19 10:45:14 +08:00
|
|
|
;
|
|
|
|
; ZNVER1-LABEL: test_blsmsk_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; ZNVER1: # %bb.0:
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: blsmskq (%rsi), %rcx # sched: [6:0.50]
|
|
|
|
; ZNVER1-NEXT: blsmskq %rdi, %rax # sched: [2:0.25]
|
2017-07-19 10:45:14 +08:00
|
|
|
; ZNVER1-NEXT: addq %rcx, %rax # sched: [1:0.25]
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: retq # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
%1 = load i64, i64 *%a1
|
|
|
|
%2 = sub i64 %1, 1
|
|
|
|
%3 = sub i64 %a0, 1
|
|
|
|
%4 = xor i64 %1, %2
|
|
|
|
%5 = xor i64 %a0, %3
|
|
|
|
%6 = add i64 %4, %5
|
|
|
|
ret i64 %6
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @test_blsr_i32(i32 %a0, i32 *%a1) {
|
|
|
|
; GENERIC-LABEL: test_blsr_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; GENERIC: # %bb.0:
|
2017-12-08 01:37:39 +08:00
|
|
|
; GENERIC-NEXT: blsrl (%rsi), %ecx # sched: [5:0.50]
|
|
|
|
; GENERIC-NEXT: blsrl %edi, %eax # sched: [1:0.33]
|
2017-08-01 23:14:35 +08:00
|
|
|
; GENERIC-NEXT: addl %ecx, %eax # sched: [1:0.33]
|
|
|
|
; GENERIC-NEXT: retq # sched: [1:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
|
|
|
; HASWELL-LABEL: test_blsr_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; HASWELL: # %bb.0:
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: blsrl (%rsi), %ecx # sched: [6:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
; HASWELL-NEXT: blsrl %edi, %eax # sched: [1:0.50]
|
|
|
|
; HASWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: retq # sched: [7:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-LABEL: test_blsr_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BROADWELL: # %bb.0:
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: blsrl (%rsi), %ecx # sched: [6:0.50]
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-NEXT: blsrl %edi, %eax # sched: [1:0.50]
|
|
|
|
; BROADWELL-NEXT: addl %ecx, %eax # sched: [1:0.25]
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: retq # sched: [7:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
;
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-LABEL: test_blsr_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKYLAKE: # %bb.0:
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: blsrl (%rsi), %ecx # sched: [6:0.50]
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-NEXT: blsrl %edi, %eax # sched: [1:0.50]
|
|
|
|
; SKYLAKE-NEXT: addl %ecx, %eax # sched: [1:0.25]
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: retq # sched: [7:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
;
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-LABEL: test_blsr_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BTVER2: # %bb.0:
|
2017-12-08 01:37:39 +08:00
|
|
|
; BTVER2-NEXT: blsrl (%rsi), %ecx # sched: [4:1.00]
|
|
|
|
; BTVER2-NEXT: blsrl %edi, %eax # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-NEXT: addl %ecx, %eax # sched: [1:0.50]
|
|
|
|
; BTVER2-NEXT: retq # sched: [4:1.00]
|
2017-07-19 10:45:14 +08:00
|
|
|
;
|
|
|
|
; ZNVER1-LABEL: test_blsr_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; ZNVER1: # %bb.0:
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: blsrl (%rsi), %ecx # sched: [6:0.50]
|
|
|
|
; ZNVER1-NEXT: blsrl %edi, %eax # sched: [2:0.25]
|
2017-07-19 10:45:14 +08:00
|
|
|
; ZNVER1-NEXT: addl %ecx, %eax # sched: [1:0.25]
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: retq # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
%1 = load i32, i32 *%a1
|
|
|
|
%2 = sub i32 %1, 1
|
|
|
|
%3 = sub i32 %a0, 1
|
|
|
|
%4 = and i32 %1, %2
|
|
|
|
%5 = and i32 %a0, %3
|
|
|
|
%6 = add i32 %4, %5
|
|
|
|
ret i32 %6
|
|
|
|
}
|
|
|
|
|
|
|
|
define i64 @test_blsr_i64(i64 %a0, i64 *%a1) {
|
|
|
|
; GENERIC-LABEL: test_blsr_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; GENERIC: # %bb.0:
|
2017-12-08 01:37:39 +08:00
|
|
|
; GENERIC-NEXT: blsrq (%rsi), %rcx # sched: [5:0.50]
|
|
|
|
; GENERIC-NEXT: blsrq %rdi, %rax # sched: [1:0.33]
|
2017-08-01 23:14:35 +08:00
|
|
|
; GENERIC-NEXT: addq %rcx, %rax # sched: [1:0.33]
|
|
|
|
; GENERIC-NEXT: retq # sched: [1:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
|
|
|
; HASWELL-LABEL: test_blsr_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; HASWELL: # %bb.0:
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: blsrq (%rsi), %rcx # sched: [6:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
; HASWELL-NEXT: blsrq %rdi, %rax # sched: [1:0.50]
|
|
|
|
; HASWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: retq # sched: [7:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-LABEL: test_blsr_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BROADWELL: # %bb.0:
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: blsrq (%rsi), %rcx # sched: [6:0.50]
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-NEXT: blsrq %rdi, %rax # sched: [1:0.50]
|
|
|
|
; BROADWELL-NEXT: addq %rcx, %rax # sched: [1:0.25]
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: retq # sched: [7:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
;
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-LABEL: test_blsr_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKYLAKE: # %bb.0:
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: blsrq (%rsi), %rcx # sched: [6:0.50]
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-NEXT: blsrq %rdi, %rax # sched: [1:0.50]
|
|
|
|
; SKYLAKE-NEXT: addq %rcx, %rax # sched: [1:0.25]
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: retq # sched: [7:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
;
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-LABEL: test_blsr_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BTVER2: # %bb.0:
|
2017-12-08 01:37:39 +08:00
|
|
|
; BTVER2-NEXT: blsrq (%rsi), %rcx # sched: [4:1.00]
|
|
|
|
; BTVER2-NEXT: blsrq %rdi, %rax # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-NEXT: addq %rcx, %rax # sched: [1:0.50]
|
|
|
|
; BTVER2-NEXT: retq # sched: [4:1.00]
|
2017-07-19 10:45:14 +08:00
|
|
|
;
|
|
|
|
; ZNVER1-LABEL: test_blsr_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; ZNVER1: # %bb.0:
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: blsrq (%rsi), %rcx # sched: [6:0.50]
|
|
|
|
; ZNVER1-NEXT: blsrq %rdi, %rax # sched: [2:0.25]
|
2017-07-19 10:45:14 +08:00
|
|
|
; ZNVER1-NEXT: addq %rcx, %rax # sched: [1:0.25]
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: retq # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
%1 = load i64, i64 *%a1
|
|
|
|
%2 = sub i64 %1, 1
|
|
|
|
%3 = sub i64 %a0, 1
|
|
|
|
%4 = and i64 %1, %2
|
|
|
|
%5 = and i64 %a0, %3
|
|
|
|
%6 = add i64 %4, %5
|
|
|
|
ret i64 %6
|
|
|
|
}
|
|
|
|
|
|
|
|
define i16 @test_cttz_i16(i16 zeroext %a0, i16 *%a1) {
|
|
|
|
; GENERIC-LABEL: test_cttz_i16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; GENERIC: # %bb.0:
|
2017-12-07 23:24:14 +08:00
|
|
|
; GENERIC-NEXT: tzcntw (%rsi), %cx # sched: [7:1.00]
|
|
|
|
; GENERIC-NEXT: tzcntw %di, %ax # sched: [3:1.00]
|
2017-08-01 23:14:35 +08:00
|
|
|
; GENERIC-NEXT: orl %ecx, %eax # sched: [1:0.33]
|
2017-12-07 18:40:31 +08:00
|
|
|
; GENERIC-NEXT: # kill: def %ax killed %ax killed %eax
|
2017-08-01 23:14:35 +08:00
|
|
|
; GENERIC-NEXT: retq # sched: [1:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
|
|
|
; HASWELL-LABEL: test_cttz_i16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; HASWELL: # %bb.0:
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: tzcntw (%rsi), %cx # sched: [8:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
; HASWELL-NEXT: tzcntw %di, %ax # sched: [3:1.00]
|
|
|
|
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
|
2017-12-07 18:40:31 +08:00
|
|
|
; HASWELL-NEXT: # kill: def %ax killed %ax killed %eax
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: retq # sched: [7:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-LABEL: test_cttz_i16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BROADWELL: # %bb.0:
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: tzcntw (%rsi), %cx # sched: [8:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-NEXT: tzcntw %di, %ax # sched: [3:1.00]
|
|
|
|
; BROADWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
|
2017-12-07 18:40:31 +08:00
|
|
|
; BROADWELL-NEXT: # kill: def %ax killed %ax killed %eax
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: retq # sched: [7:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
;
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-LABEL: test_cttz_i16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKYLAKE: # %bb.0:
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: tzcntw (%rsi), %cx # sched: [8:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-NEXT: tzcntw %di, %ax # sched: [3:1.00]
|
|
|
|
; SKYLAKE-NEXT: orl %ecx, %eax # sched: [1:0.25]
|
2017-12-07 18:40:31 +08:00
|
|
|
; SKYLAKE-NEXT: # kill: def %ax killed %ax killed %eax
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: retq # sched: [7:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
;
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-LABEL: test_cttz_i16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BTVER2: # %bb.0:
|
2017-12-07 23:24:14 +08:00
|
|
|
; BTVER2-NEXT: tzcntw (%rsi), %cx # sched: [6:1.00]
|
|
|
|
; BTVER2-NEXT: tzcntw %di, %ax # sched: [3:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-NEXT: orl %ecx, %eax # sched: [1:0.50]
|
2017-12-07 18:40:31 +08:00
|
|
|
; BTVER2-NEXT: # kill: def %ax killed %ax killed %eax
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-NEXT: retq # sched: [4:1.00]
|
2017-07-19 10:45:14 +08:00
|
|
|
;
|
|
|
|
; ZNVER1-LABEL: test_cttz_i16:
|
2017-12-05 01:18:51 +08:00
|
|
|
; ZNVER1: # %bb.0:
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: tzcntw (%rsi), %cx # sched: [6:0.50]
|
|
|
|
; ZNVER1-NEXT: tzcntw %di, %ax # sched: [2:0.25]
|
2017-07-19 10:45:14 +08:00
|
|
|
; ZNVER1-NEXT: orl %ecx, %eax # sched: [1:0.25]
|
2017-12-07 18:40:31 +08:00
|
|
|
; ZNVER1-NEXT: # kill: def %ax killed %ax killed %eax
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: retq # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
%1 = load i16, i16 *%a1
|
|
|
|
%2 = tail call i16 @llvm.cttz.i16( i16 %1, i1 false )
|
|
|
|
%3 = tail call i16 @llvm.cttz.i16( i16 %a0, i1 false )
|
|
|
|
%4 = or i16 %2, %3
|
|
|
|
ret i16 %4
|
|
|
|
}
|
|
|
|
declare i16 @llvm.cttz.i16(i16, i1)
|
|
|
|
|
|
|
|
define i32 @test_cttz_i32(i32 %a0, i32 *%a1) {
|
|
|
|
; GENERIC-LABEL: test_cttz_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; GENERIC: # %bb.0:
|
2017-12-07 23:24:14 +08:00
|
|
|
; GENERIC-NEXT: tzcntl (%rsi), %ecx # sched: [7:1.00]
|
|
|
|
; GENERIC-NEXT: tzcntl %edi, %eax # sched: [3:1.00]
|
2017-08-01 23:14:35 +08:00
|
|
|
; GENERIC-NEXT: orl %ecx, %eax # sched: [1:0.33]
|
|
|
|
; GENERIC-NEXT: retq # sched: [1:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
|
|
|
; HASWELL-LABEL: test_cttz_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; HASWELL: # %bb.0:
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: tzcntl (%rsi), %ecx # sched: [8:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
; HASWELL-NEXT: tzcntl %edi, %eax # sched: [3:1.00]
|
|
|
|
; HASWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: retq # sched: [7:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-LABEL: test_cttz_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BROADWELL: # %bb.0:
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: tzcntl (%rsi), %ecx # sched: [8:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-NEXT: tzcntl %edi, %eax # sched: [3:1.00]
|
|
|
|
; BROADWELL-NEXT: orl %ecx, %eax # sched: [1:0.25]
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: retq # sched: [7:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
;
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-LABEL: test_cttz_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKYLAKE: # %bb.0:
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: tzcntl (%rsi), %ecx # sched: [8:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-NEXT: tzcntl %edi, %eax # sched: [3:1.00]
|
|
|
|
; SKYLAKE-NEXT: orl %ecx, %eax # sched: [1:0.25]
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: retq # sched: [7:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
;
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-LABEL: test_cttz_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BTVER2: # %bb.0:
|
2017-12-07 23:24:14 +08:00
|
|
|
; BTVER2-NEXT: tzcntl (%rsi), %ecx # sched: [6:1.00]
|
|
|
|
; BTVER2-NEXT: tzcntl %edi, %eax # sched: [3:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-NEXT: orl %ecx, %eax # sched: [1:0.50]
|
|
|
|
; BTVER2-NEXT: retq # sched: [4:1.00]
|
2017-07-19 10:45:14 +08:00
|
|
|
;
|
|
|
|
; ZNVER1-LABEL: test_cttz_i32:
|
2017-12-05 01:18:51 +08:00
|
|
|
; ZNVER1: # %bb.0:
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: tzcntl (%rsi), %ecx # sched: [6:0.50]
|
|
|
|
; ZNVER1-NEXT: tzcntl %edi, %eax # sched: [2:0.25]
|
2017-07-19 10:45:14 +08:00
|
|
|
; ZNVER1-NEXT: orl %ecx, %eax # sched: [1:0.25]
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: retq # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
%1 = load i32, i32 *%a1
|
|
|
|
%2 = tail call i32 @llvm.cttz.i32( i32 %1, i1 false )
|
|
|
|
%3 = tail call i32 @llvm.cttz.i32( i32 %a0, i1 false )
|
|
|
|
%4 = or i32 %2, %3
|
|
|
|
ret i32 %4
|
|
|
|
}
|
|
|
|
declare i32 @llvm.cttz.i32(i32, i1)
|
|
|
|
|
|
|
|
define i64 @test_cttz_i64(i64 %a0, i64 *%a1) {
|
|
|
|
; GENERIC-LABEL: test_cttz_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; GENERIC: # %bb.0:
|
2017-12-07 23:24:14 +08:00
|
|
|
; GENERIC-NEXT: tzcntq (%rsi), %rcx # sched: [7:1.00]
|
|
|
|
; GENERIC-NEXT: tzcntq %rdi, %rax # sched: [3:1.00]
|
2017-08-01 23:14:35 +08:00
|
|
|
; GENERIC-NEXT: orq %rcx, %rax # sched: [1:0.33]
|
|
|
|
; GENERIC-NEXT: retq # sched: [1:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
|
|
|
; HASWELL-LABEL: test_cttz_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; HASWELL: # %bb.0:
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: tzcntq (%rsi), %rcx # sched: [8:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
; HASWELL-NEXT: tzcntq %rdi, %rax # sched: [3:1.00]
|
|
|
|
; HASWELL-NEXT: orq %rcx, %rax # sched: [1:0.25]
|
2017-12-08 17:48:44 +08:00
|
|
|
; HASWELL-NEXT: retq # sched: [7:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
;
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-LABEL: test_cttz_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BROADWELL: # %bb.0:
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: tzcntq (%rsi), %rcx # sched: [8:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
; BROADWELL-NEXT: tzcntq %rdi, %rax # sched: [3:1.00]
|
|
|
|
; BROADWELL-NEXT: orq %rcx, %rax # sched: [1:0.25]
|
2017-10-25 04:19:47 +08:00
|
|
|
; BROADWELL-NEXT: retq # sched: [7:1.00]
|
2017-10-17 21:45:39 +08:00
|
|
|
;
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-LABEL: test_cttz_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; SKYLAKE: # %bb.0:
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: tzcntq (%rsi), %rcx # sched: [8:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
; SKYLAKE-NEXT: tzcntq %rdi, %rax # sched: [3:1.00]
|
|
|
|
; SKYLAKE-NEXT: orq %rcx, %rax # sched: [1:0.25]
|
2017-10-17 14:47:04 +08:00
|
|
|
; SKYLAKE-NEXT: retq # sched: [7:1.00]
|
2017-10-10 17:53:18 +08:00
|
|
|
;
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-LABEL: test_cttz_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; BTVER2: # %bb.0:
|
2017-12-07 23:24:14 +08:00
|
|
|
; BTVER2-NEXT: tzcntq (%rsi), %rcx # sched: [6:1.00]
|
|
|
|
; BTVER2-NEXT: tzcntq %rdi, %rax # sched: [3:1.00]
|
2017-07-16 21:59:44 +08:00
|
|
|
; BTVER2-NEXT: orq %rcx, %rax # sched: [1:0.50]
|
|
|
|
; BTVER2-NEXT: retq # sched: [4:1.00]
|
2017-07-19 10:45:14 +08:00
|
|
|
;
|
|
|
|
; ZNVER1-LABEL: test_cttz_i64:
|
2017-12-05 01:18:51 +08:00
|
|
|
; ZNVER1: # %bb.0:
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: tzcntq (%rsi), %rcx # sched: [6:0.50]
|
|
|
|
; ZNVER1-NEXT: tzcntq %rdi, %rax # sched: [2:0.25]
|
2017-07-19 10:45:14 +08:00
|
|
|
; ZNVER1-NEXT: orq %rcx, %rax # sched: [1:0.25]
|
AMD family 17h (znver1) scheduler model update.
Summary:
This patch enables the following:
1) Regex based Instruction itineraries for integer instructions.
2) The instructions are grouped as per the nature of the instructions
(move, arithmetic, logic, Misc, Control Transfer).
3) FP instructions and their itineraries are added which includes values
for SSE4A, BMI, BMI2 and SHA instructions.
Patch by Ganesh Gopalasubramanian
Reviewers: RKSimon, craig.topper
Subscribers: vprasad, shivaram, ddibyend, andreadb, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D36617
llvm-svn: 312237
2017-08-31 20:38:35 +08:00
|
|
|
; ZNVER1-NEXT: retq # sched: [1:0.50]
|
2017-07-16 21:59:44 +08:00
|
|
|
%1 = load i64, i64 *%a1
|
|
|
|
%2 = tail call i64 @llvm.cttz.i64( i64 %1, i1 false )
|
|
|
|
%3 = tail call i64 @llvm.cttz.i64( i64 %a0, i1 false )
|
|
|
|
%4 = or i64 %2, %3
|
|
|
|
ret i64 %4
|
|
|
|
}
|
|
|
|
declare i64 @llvm.cttz.i64(i64, i1)
|