; llvm-project/llvm/test/CodeGen/X86/ctpop-combine.ll
;
; 201 lines
; 6.5 KiB
; LLVM

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+popcnt | FileCheck %s -check-prefixes=CHECK,POPCOUNT
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=-popcnt | FileCheck %s -check-prefixes=CHECK,NO-POPCOUNT
; Population-count intrinsics exercised below: the i8 form is called by test4,
; the i64 form by test1-test3, ctpop_eq_one and ctpop_ne_one.
declare i8 @llvm.ctpop.i8(i8) nounwind readnone
declare i64 @llvm.ctpop.i64(i64) nounwind readnone
; Returns 1 when more than one bit of %x is set: ctpop(x) >u 1, with the count
; truncated to i32 before the compare.
; Both RUN lines expect identical code in which no population count is
; computed; the result is (x & (x - 1)) != 0 (leaq -1 / testq / setne).
define i32 @test1(i64 %x) nounwind readnone {
; CHECK-LABEL: test1:
; CHECK: # %bb.0:
; CHECK-NEXT: leaq -1(%rdi), %rcx
; CHECK-NEXT: xorl %eax, %eax
; CHECK-NEXT: testq %rcx, %rdi
; CHECK-NEXT: setne %al
; CHECK-NEXT: retq
%count = tail call i64 @llvm.ctpop.i64(i64 %x)
%cast = trunc i64 %count to i32
%cmp = icmp ugt i32 %cast, 1
%conv = zext i1 %cmp to i32
ret i32 %conv
}
; Returns 1 when at most one bit of %x is set: ctpop(x) <u 2, compared on the
; full i64 count (no truncation).
; Both RUN lines expect identical code in which no population count is
; computed; the result is (x & (x - 1)) == 0 (leaq -1 / testq / sete).
define i32 @test2(i64 %x) nounwind readnone {
; CHECK-LABEL: test2:
; CHECK: # %bb.0:
; CHECK-NEXT: leaq -1(%rdi), %rcx
; CHECK-NEXT: xorl %eax, %eax
; CHECK-NEXT: testq %rcx, %rdi
; CHECK-NEXT: sete %al
; CHECK-NEXT: retq
%count = tail call i64 @llvm.ctpop.i64(i64 %x)
%cmp = icmp ult i64 %count, 2
%conv = zext i1 %cmp to i32
ret i32 %conv
}
; Negative case for the fold seen in test1/test2: the count is truncated to i6
; before the "<u 2" compare. An i64 population count ranges over 0..64 and 64
; does not fit in 6 bits (it wraps to 0), so the truncated compare is not
; equivalent to (x & (x - 1)) == 0.
; Expected code therefore materializes the real count in both configurations,
; masks it with 63 and compares against 2:
;   * with +popcnt: a single popcntq;
;   * with -popcnt: the shift/mask/multiply bit-counting expansion.
define i32 @test3(i64 %x) nounwind readnone {
; POPCOUNT-LABEL: test3:
; POPCOUNT: # %bb.0:
; POPCOUNT-NEXT: popcntq %rdi, %rcx
; POPCOUNT-NEXT: andb $63, %cl
; POPCOUNT-NEXT: xorl %eax, %eax
; POPCOUNT-NEXT: cmpb $2, %cl
; POPCOUNT-NEXT: setb %al
; POPCOUNT-NEXT: retq
;
; NO-POPCOUNT-LABEL: test3:
; NO-POPCOUNT: # %bb.0:
; NO-POPCOUNT-NEXT: movq %rdi, %rax
; NO-POPCOUNT-NEXT: shrq %rax
; NO-POPCOUNT-NEXT: movabsq $6148914691236517205, %rcx # imm = 0x5555555555555555
; NO-POPCOUNT-NEXT: andq %rax, %rcx
; NO-POPCOUNT-NEXT: subq %rcx, %rdi
; NO-POPCOUNT-NEXT: movabsq $3689348814741910323, %rax # imm = 0x3333333333333333
; NO-POPCOUNT-NEXT: movq %rdi, %rcx
; NO-POPCOUNT-NEXT: andq %rax, %rcx
; NO-POPCOUNT-NEXT: shrq $2, %rdi
; NO-POPCOUNT-NEXT: andq %rax, %rdi
; NO-POPCOUNT-NEXT: addq %rcx, %rdi
; NO-POPCOUNT-NEXT: movq %rdi, %rax
; NO-POPCOUNT-NEXT: shrq $4, %rax
; NO-POPCOUNT-NEXT: addq %rdi, %rax
; NO-POPCOUNT-NEXT: movabsq $1085102592571150095, %rcx # imm = 0xF0F0F0F0F0F0F0F
; NO-POPCOUNT-NEXT: andq %rax, %rcx
; NO-POPCOUNT-NEXT: movabsq $72340172838076673, %rdx # imm = 0x101010101010101
; NO-POPCOUNT-NEXT: imulq %rcx, %rdx
; NO-POPCOUNT-NEXT: shrq $56, %rdx
; NO-POPCOUNT-NEXT: andb $63, %dl
; NO-POPCOUNT-NEXT: xorl %eax, %eax
; NO-POPCOUNT-NEXT: cmpb $2, %dl
; NO-POPCOUNT-NEXT: setb %al
; NO-POPCOUNT-NEXT: retq
%count = tail call i64 @llvm.ctpop.i64(i64 %x)
%cast = trunc i64 %count to i6 ; Too small for 0-64
%cmp = icmp ult i6 %cast, 2
%conv = zext i1 %cmp to i32
ret i32 %conv
}
; Redundant-mask case: %x is first masked to its low 7 bits, so the population
; count is at most 7 and the trailing "and i8 %count, 7" cannot change it.
; Neither expected sequence contains an and-with-7 after the count:
;   * with +popcnt: andl $127 followed directly by popcntl;
;   * with -popcnt: the 8-bit shift/mask bit-counting expansion on the masked
;     value.
define i8 @test4(i8 %x) nounwind readnone {
; POPCOUNT-LABEL: test4:
; POPCOUNT: # %bb.0:
; POPCOUNT-NEXT: andl $127, %edi
; POPCOUNT-NEXT: popcntl %edi, %eax
; POPCOUNT-NEXT: # kill: def $al killed $al killed $eax
; POPCOUNT-NEXT: retq
;
; NO-POPCOUNT-LABEL: test4:
; NO-POPCOUNT: # %bb.0:
; NO-POPCOUNT-NEXT: # kill: def $edi killed $edi def $rdi
; NO-POPCOUNT-NEXT: andb $127, %dil
; NO-POPCOUNT-NEXT: movl %edi, %eax
; NO-POPCOUNT-NEXT: shrb %al
; NO-POPCOUNT-NEXT: andb $21, %al
; NO-POPCOUNT-NEXT: subb %al, %dil
; NO-POPCOUNT-NEXT: movl %edi, %eax
; NO-POPCOUNT-NEXT: andb $51, %al
; NO-POPCOUNT-NEXT: shrb $2, %dil
; NO-POPCOUNT-NEXT: andb $51, %dil
; NO-POPCOUNT-NEXT: addb %al, %dil
; NO-POPCOUNT-NEXT: movl %edi, %eax
; NO-POPCOUNT-NEXT: shrb $4, %al
; NO-POPCOUNT-NEXT: addl %edi, %eax
; NO-POPCOUNT-NEXT: andb $15, %al
; NO-POPCOUNT-NEXT: # kill: def $al killed $al killed $eax
; NO-POPCOUNT-NEXT: retq
%x2 = and i8 %x, 127
%count = tail call i8 @llvm.ctpop.i8(i8 %x2)
%and = and i8 %count, 7
ret i8 %and
}
; Returns 1 when exactly one bit of %x is set: ctpop(x) == 1.
; Expected code differs per configuration:
;   * with +popcnt: popcntq, then compare the count against 1 (sete);
;   * with -popcnt: no count is computed; the result is
;     ((x & (x - 1)) == 0) & (x != 0).
define i32 @ctpop_eq_one(i64 %x) nounwind readnone {
; POPCOUNT-LABEL: ctpop_eq_one:
; POPCOUNT: # %bb.0:
; POPCOUNT-NEXT: popcntq %rdi, %rcx
; POPCOUNT-NEXT: xorl %eax, %eax
; POPCOUNT-NEXT: cmpl $1, %ecx
; POPCOUNT-NEXT: sete %al
; POPCOUNT-NEXT: retq
;
; NO-POPCOUNT-LABEL: ctpop_eq_one:
; NO-POPCOUNT: # %bb.0:
; NO-POPCOUNT-NEXT: leaq -1(%rdi), %rax
; NO-POPCOUNT-NEXT: testq %rax, %rdi
; NO-POPCOUNT-NEXT: sete %al
; NO-POPCOUNT-NEXT: testq %rdi, %rdi
; NO-POPCOUNT-NEXT: setne %cl
; NO-POPCOUNT-NEXT: andb %al, %cl
; NO-POPCOUNT-NEXT: movzbl %cl, %eax
; NO-POPCOUNT-NEXT: retq
%count = tail call i64 @llvm.ctpop.i64(i64 %x)
%cmp = icmp eq i64 %count, 1
%conv = zext i1 %cmp to i32
ret i32 %conv
}
; Returns 1 unless exactly one bit of %x is set: ctpop(x) != 1.
; Expected code differs per configuration:
;   * with +popcnt: popcntq, then compare the count against 1 (setne);
;   * with -popcnt: no count is computed; the result is
;     ((x & (x - 1)) != 0) | (x == 0).
define i32 @ctpop_ne_one(i64 %x) nounwind readnone {
; POPCOUNT-LABEL: ctpop_ne_one:
; POPCOUNT: # %bb.0:
; POPCOUNT-NEXT: popcntq %rdi, %rcx
; POPCOUNT-NEXT: xorl %eax, %eax
; POPCOUNT-NEXT: cmpl $1, %ecx
; POPCOUNT-NEXT: setne %al
; POPCOUNT-NEXT: retq
;
; NO-POPCOUNT-LABEL: ctpop_ne_one:
; NO-POPCOUNT: # %bb.0:
; NO-POPCOUNT-NEXT: leaq -1(%rdi), %rax
; NO-POPCOUNT-NEXT: testq %rax, %rdi
; NO-POPCOUNT-NEXT: setne %al
; NO-POPCOUNT-NEXT: testq %rdi, %rdi
; NO-POPCOUNT-NEXT: sete %cl
; NO-POPCOUNT-NEXT: orb %al, %cl
; NO-POPCOUNT-NEXT: movzbl %cl, %eax
; NO-POPCOUNT-NEXT: retq
%count = tail call i64 @llvm.ctpop.i64(i64 %x)
%cmp = icmp ne i64 %count, 1
%conv = zext i1 %cmp to i32
ret i32 %conv
}
; ctpop(x) == 1 on a non-power-of-two width (i255), with the count truncated to
; i8 before the compare. Unlike test3, the truncated type is wide enough for
; every possible count, so the truncation does not block the fold.
; Both RUN lines expect identical code in which no population count is
; computed: x - 1 is formed across four 64-bit words (addq/adcq of -1, with
; the top word using the 0x7FFFFFFFFFFFFFFF mask), ANDed with x and tested for
; zero, and that result is combined with a separate x != 0 test.
define i1 @ctpop_trunc_non_power2(i255 %x) nounwind {
; CHECK-LABEL: ctpop_trunc_non_power2:
; CHECK: # %bb.0:
; CHECK-NEXT: pushq %rbx
; CHECK-NEXT: movabsq $9223372036854775807, %r8 # imm = 0x7FFFFFFFFFFFFFFF
; CHECK-NEXT: movq %rcx, %r9
; CHECK-NEXT: andq %r8, %r9
; CHECK-NEXT: movq %rdi, %r11
; CHECK-NEXT: addq $-1, %r11
; CHECK-NEXT: movq %rsi, %r10
; CHECK-NEXT: adcq $-1, %r10
; CHECK-NEXT: movq %rdx, %rax
; CHECK-NEXT: adcq $-1, %rax
; CHECK-NEXT: movq %rcx, %rbx
; CHECK-NEXT: adcq %r8, %rbx
; CHECK-NEXT: andq %rdi, %r11
; CHECK-NEXT: andq %rdx, %rax
; CHECK-NEXT: orq %r11, %rax
; CHECK-NEXT: andq %rsi, %r10
; CHECK-NEXT: andq %r8, %rbx
; CHECK-NEXT: andq %rcx, %rbx
; CHECK-NEXT: orq %r10, %rbx
; CHECK-NEXT: orq %rax, %rbx
; CHECK-NEXT: sete %cl
; CHECK-NEXT: orq %rdx, %rdi
; CHECK-NEXT: orq %rsi, %r9
; CHECK-NEXT: orq %rdi, %r9
; CHECK-NEXT: setne %al
; CHECK-NEXT: andb %cl, %al
; CHECK-NEXT: popq %rbx
; CHECK-NEXT: retq
%a = call i255 @llvm.ctpop.i255(i255 %x)
%b = trunc i255 %a to i8 ; largest value from ctpop is 255, fits in 8 bits.
%c = icmp eq i8 %b, 1
ret i1 %c
}
; Population-count intrinsic at the non-power-of-two width i255, called by
; ctpop_trunc_non_power2.
declare i255 @llvm.ctpop.i255(i255)