; llvm-project/llvm/test/Transforms/InstCombine/unsigned_saturated_sub.ll
;
; 454 lines
; 14 KiB
; LLVM

; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -instcombine -S < %s | FileCheck %s
; Canonicalization of unsigned saturated subtraction idioms to
; usub.sat() intrinsics is tested here.
; External sinks with no body in this file. Passing a value to one of them
; gives that value an additional use; the extra-use tests below rely on this.
; There is one sink per value type used by the tests (i64, i32, i1).
declare void @use(i64)
declare void @usei32(i32)
declare void @usei1(i1)
; (a > b) ? a - b : 0 -> usub.sat(a, b)
; Baseline scalar case: the compare and the subtract are each used only by
; the select, and the expected output is just the intrinsic call.
define i64 @max_sub_ugt(i64 %a, i64 %b) {
; CHECK-LABEL: @max_sub_ugt(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: ret i64 [[TMP1]]
;
%cmp = icmp ugt i64 %a, %b
%sub = sub i64 %a, %b
%sel = select i1 %cmp, i64 %sub ,i64 0
ret i64 %sel
}
; (a >= b) ? a - b : 0 -> usub.sat(a, b)
; Non-strict variant of @max_sub_ugt. When a == b the subtract is already 0,
; so both predicates select the same value.
define i64 @max_sub_uge(i64 %a, i64 %b) {
; CHECK-LABEL: @max_sub_uge(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: ret i64 [[TMP1]]
;
%cmp = icmp uge i64 %a, %b
%sub = sub i64 %a, %b
%sel = select i1 %cmp, i64 %sub ,i64 0
ret i64 %sel
}
; Same pattern as @max_sub_uge, but %sub has a second use (the call to @use).
; Expected output: the sub is kept for that call and the select is still
; replaced by usub.sat.
define i64 @max_sub_uge_extrause1(i64 %a, i64 %b) {
; CHECK-LABEL: @max_sub_uge_extrause1(
; CHECK-NEXT: [[SUB:%.*]] = sub i64 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A]], i64 [[B]])
; CHECK-NEXT: call void @use(i64 [[SUB]])
; CHECK-NEXT: ret i64 [[TMP1]]
;
%cmp = icmp uge i64 %a, %b
%sub = sub i64 %a, %b
%sel = select i1 %cmp, i64 %sub ,i64 0
call void @use(i64 %sub)
ret i64 %sel
}
; Same pattern as @max_sub_uge, but %cmp has a second use (the call to
; @usei1). Expected output: the icmp is kept for that call and the select is
; still replaced by usub.sat.
define i64 @max_sub_uge_extrause2(i64 %a, i64 %b) {
; CHECK-LABEL: @max_sub_uge_extrause2(
; CHECK-NEXT: [[CMP:%.*]] = icmp uge i64 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A]], i64 [[B]])
; CHECK-NEXT: call void @usei1(i1 [[CMP]])
; CHECK-NEXT: ret i64 [[TMP1]]
;
%cmp = icmp uge i64 %a, %b
%sub = sub i64 %a, %b
%sel = select i1 %cmp, i64 %sub ,i64 0
call void @usei1(i1 %cmp)
ret i64 %sel
}
; Same pattern as @max_sub_uge, but both %cmp and %sub have a second use.
; Expected output: both instructions are kept for their extra users, and the
; select is still replaced by usub.sat.
define i64 @max_sub_uge_extrause3(i64 %a, i64 %b) {
; CHECK-LABEL: @max_sub_uge_extrause3(
; CHECK-NEXT: [[CMP:%.*]] = icmp uge i64 [[A:%.*]], [[B:%.*]]
; CHECK-NEXT: [[SUB:%.*]] = sub i64 [[A]], [[B]]
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A]], i64 [[B]])
; CHECK-NEXT: call void @use(i64 [[SUB]])
; CHECK-NEXT: call void @usei1(i1 [[CMP]])
; CHECK-NEXT: ret i64 [[TMP1]]
;
%cmp = icmp uge i64 %a, %b
%sub = sub i64 %a, %b
%sel = select i1 %cmp, i64 %sub ,i64 0
call void @use(i64 %sub)
call void @usei1(i1 %cmp)
ret i64 %sel
}
; Again, with vectors:
; (a > b) ? a - b : 0 -> usub.sat(a, b)
; The operands are <4 x i32> and the zero arm of the select is
; zeroinitializer; the expected output is the v4i32 form of the intrinsic.
define <4 x i32> @max_sub_ugt_vec(<4 x i32> %a, <4 x i32> %b) {
; CHECK-LABEL: @max_sub_ugt_vec(
; CHECK-NEXT: [[TMP1:%.*]] = call <4 x i32> @llvm.usub.sat.v4i32(<4 x i32> [[A:%.*]], <4 x i32> [[B:%.*]])
; CHECK-NEXT: ret <4 x i32> [[TMP1]]
;
%cmp = icmp ugt <4 x i32> %a, %b
%sub = sub <4 x i32> %a, %b
%sel = select <4 x i1> %cmp, <4 x i32> %sub, <4 x i32> zeroinitializer
ret <4 x i32> %sel
}
; Use extra ops to thwart icmp swapping canonicalization.
; (b < a) ? a - b : 0 -> usub.sat(a, b)
; The compare is written with its operands swapped (b ult a). The extra op is
; %extrasub (b - a), which is only passed to @use and is expected to remain
; in the output after the intrinsic call.
define i64 @max_sub_ult(i64 %a, i64 %b) {
; CHECK-LABEL: @max_sub_ult(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: [[EXTRASUB:%.*]] = sub i64 [[B]], [[A]]
; CHECK-NEXT: call void @use(i64 [[EXTRASUB]])
; CHECK-NEXT: ret i64 [[TMP1]]
;
%cmp = icmp ult i64 %b, %a
%sub = sub i64 %a, %b
%sel = select i1 %cmp, i64 %sub ,i64 0
%extrasub = sub i64 %b, %a
call void @use(i64 %extrasub)
ret i64 %sel
}
; (b > a) ? 0 : a - b -> usub.sat(a, b)
; The zero is on the true arm of the select and the difference on the false
; arm. %extrasub (b - a) is not an operand of the select; it is only passed
; to @use and is expected to remain in the output.
define i64 @max_sub_ugt_sel_swapped(i64 %a, i64 %b) {
; CHECK-LABEL: @max_sub_ugt_sel_swapped(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: [[EXTRASUB:%.*]] = sub i64 [[B]], [[A]]
; CHECK-NEXT: call void @use(i64 [[EXTRASUB]])
; CHECK-NEXT: ret i64 [[TMP1]]
;
%cmp = icmp ugt i64 %b, %a
%sub = sub i64 %a, %b
%sel = select i1 %cmp, i64 0 ,i64 %sub
%extrasub = sub i64 %b, %a
call void @use(i64 %extrasub)
ret i64 %sel
}
; (a < b) ? 0 : a - b -> usub.sat(a, b)
; Zero on the true arm, with the compare operands in the same order as the
; subtract. No extra ops are present in this variant.
define i64 @max_sub_ult_sel_swapped(i64 %a, i64 %b) {
; CHECK-LABEL: @max_sub_ult_sel_swapped(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: ret i64 [[TMP1]]
;
%cmp = icmp ult i64 %a, %b
%sub = sub i64 %a, %b
%sel = select i1 %cmp, i64 0 ,i64 %sub
ret i64 %sel
}
; ((a > b) ? b - a : 0) -> -usub.sat(a, b)
; The selected difference (b - a) has its operands reversed relative to the
; compare, so the expected result is the intrinsic followed by a negation
; written as "sub 0, x". %extrasub (a - b) is only passed to @use and is
; expected to remain in the output.
define i64 @neg_max_sub_ugt(i64 %a, i64 %b) {
; CHECK-LABEL: @neg_max_sub_ugt(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: [[TMP2:%.*]] = sub i64 0, [[TMP1]]
; CHECK-NEXT: [[EXTRASUB:%.*]] = sub i64 [[A]], [[B]]
; CHECK-NEXT: call void @use(i64 [[EXTRASUB]])
; CHECK-NEXT: ret i64 [[TMP2]]
;
%cmp = icmp ugt i64 %a, %b
%sub = sub i64 %b, %a
%sel = select i1 %cmp, i64 %sub ,i64 0
%extrasub = sub i64 %a, %b
call void @use(i64 %extrasub)
ret i64 %sel
}
; ((b < a) ? b - a : 0) -> -usub.sat(a, b)
; Negated form with the compare written as "b ult a". No extra ops; the
; expected output is the intrinsic followed by "sub 0, x".
define i64 @neg_max_sub_ult(i64 %a, i64 %b) {
; CHECK-LABEL: @neg_max_sub_ult(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: [[TMP2:%.*]] = sub i64 0, [[TMP1]]
; CHECK-NEXT: ret i64 [[TMP2]]
;
%cmp = icmp ult i64 %b, %a
%sub = sub i64 %b, %a
%sel = select i1 %cmp, i64 %sub ,i64 0
ret i64 %sel
}
; ((b > a) ? 0 : b - a) -> -usub.sat(a, b)
; Negated form with the zero on the true arm of the select. The expected
; output is the intrinsic followed by "sub 0, x".
define i64 @neg_max_sub_ugt_sel_swapped(i64 %a, i64 %b) {
; CHECK-LABEL: @neg_max_sub_ugt_sel_swapped(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: [[TMP2:%.*]] = sub i64 0, [[TMP1]]
; CHECK-NEXT: ret i64 [[TMP2]]
;
%cmp = icmp ugt i64 %b, %a
%sub = sub i64 %b, %a
%sel = select i1 %cmp, i64 0 ,i64 %sub
ret i64 %sel
}
; Same pattern as @neg_max_sub_ugt_sel_swapped, but %cmp has a second use
; (the call to @usei1). Expected output: the icmp is kept for that call and
; the select is still replaced by the negated usub.sat.
define i64 @neg_max_sub_ugt_sel_swapped_extrause1(i64 %a, i64 %b) {
; CHECK-LABEL: @neg_max_sub_ugt_sel_swapped_extrause1(
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i64 [[B:%.*]], [[A:%.*]]
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A]], i64 [[B]])
; CHECK-NEXT: [[TMP2:%.*]] = sub i64 0, [[TMP1]]
; CHECK-NEXT: call void @usei1(i1 [[CMP]])
; CHECK-NEXT: ret i64 [[TMP2]]
;
%cmp = icmp ugt i64 %b, %a
%sub = sub i64 %b, %a
%sel = select i1 %cmp, i64 0 ,i64 %sub
call void @usei1(i1 %cmp)
ret i64 %sel
}
; Same pattern as @neg_max_sub_ugt_sel_swapped, but %sub has a second use
; (the call to @use). Expected output: the sub is kept for that call and the
; select is still replaced by the negated usub.sat.
define i64 @neg_max_sub_ugt_sel_swapped_extrause2(i64 %a, i64 %b) {
; CHECK-LABEL: @neg_max_sub_ugt_sel_swapped_extrause2(
; CHECK-NEXT: [[SUB:%.*]] = sub i64 [[B:%.*]], [[A:%.*]]
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A]], i64 [[B]])
; CHECK-NEXT: [[TMP2:%.*]] = sub i64 0, [[TMP1]]
; CHECK-NEXT: call void @use(i64 [[SUB]])
; CHECK-NEXT: ret i64 [[TMP2]]
;
%cmp = icmp ugt i64 %b, %a
%sub = sub i64 %b, %a
%sel = select i1 %cmp, i64 0 ,i64 %sub
call void @use(i64 %sub)
ret i64 %sel
}
; Same pattern as @neg_max_sub_ugt_sel_swapped, but both %cmp and %sub have
; a second use. Negative test: the expected output keeps the original
; icmp/sub/select and forms no intrinsic. Contrast with
; @max_sub_uge_extrause3, where the non-negated form is still converted.
; NOTE(review): presumably the fold is skipped because intrinsic + negation
; would add instructions when neither original can be removed -- confirm
; against the InstCombine source.
define i64 @neg_max_sub_ugt_sel_swapped_extrause3(i64 %a, i64 %b) {
; CHECK-LABEL: @neg_max_sub_ugt_sel_swapped_extrause3(
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i64 [[B:%.*]], [[A:%.*]]
; CHECK-NEXT: [[SUB:%.*]] = sub i64 [[B]], [[A]]
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i64 0, i64 [[SUB]]
; CHECK-NEXT: call void @use(i64 [[SUB]])
; CHECK-NEXT: call void @usei1(i1 [[CMP]])
; CHECK-NEXT: ret i64 [[SEL]]
;
%cmp = icmp ugt i64 %b, %a
%sub = sub i64 %b, %a
%sel = select i1 %cmp, i64 0 ,i64 %sub
call void @use(i64 %sub)
call void @usei1(i1 %cmp)
ret i64 %sel
}
; ((a < b) ? 0 : b - a) -> -usub.sat(a, b)
; Negated form with the zero on the true arm and the compare written as
; "a ult b". %extrasub (a - b) is only passed to @use and is expected to
; remain in the output after the intrinsic and its negation.
define i64 @neg_max_sub_ult_sel_swapped(i64 %a, i64 %b) {
; CHECK-LABEL: @neg_max_sub_ult_sel_swapped(
; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.usub.sat.i64(i64 [[A:%.*]], i64 [[B:%.*]])
; CHECK-NEXT: [[TMP2:%.*]] = sub i64 0, [[TMP1]]
; CHECK-NEXT: [[EXTRASUB:%.*]] = sub i64 [[A]], [[B]]
; CHECK-NEXT: call void @use(i64 [[EXTRASUB]])
; CHECK-NEXT: ret i64 [[TMP2]]
;
%cmp = icmp ult i64 %a, %b
%sub = sub i64 %b, %a
%sel = select i1 %cmp, i64 0 ,i64 %sub
%extrasub = sub i64 %a, %b
call void @use(i64 %extrasub)
ret i64 %sel
}
; (a > 1) ? a + -1 : 0 -> usub.sat(a, 1)
; Constant-operand form: the subtract is written as an add of the negated
; constant, and the compare constant equals the subtracted constant.
define i32 @max_sub_ugt_c1(i32 %a) {
; CHECK-LABEL: @max_sub_ugt_c1(
; CHECK-NEXT: [[TMP1:%.*]] = call i32 @llvm.usub.sat.i32(i32 [[A:%.*]], i32 1)
; CHECK-NEXT: ret i32 [[TMP1]]
;
%cmp = icmp ugt i32 %a, 1
%sub = add i32 %a, -1
%sel = select i1 %cmp, i32 %sub ,i32 0
ret i32 %sel
}
; (a > 0) ? a + -1 : 0
; The compare constant (0) differs from the subtracted constant (1).
; Expected output: the compare is rewritten as "icmp eq a, 0" with the select
; arms swapped; the add and the select remain and no intrinsic is formed.
define i32 @max_sub_ugt_c01(i32 %a) {
; CHECK-LABEL: @max_sub_ugt_c01(
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i32 [[A:%.*]], 0
; CHECK-NEXT: [[SUB:%.*]] = add i32 [[A]], -1
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i32 0, i32 [[SUB]]
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp ugt i32 %a, 0
%sub = add i32 %a, -1
%sel = select i1 %cmp, i32 %sub ,i32 0
ret i32 %sel
}
; (a > 10) ? a + -10 : 0 -> usub.sat(a, 10)
; Same as @max_sub_ugt_c1 with a larger constant; the compare constant again
; equals the subtracted constant.
define i32 @max_sub_ugt_c10(i32 %a) {
; CHECK-LABEL: @max_sub_ugt_c10(
; CHECK-NEXT: [[TMP1:%.*]] = call i32 @llvm.usub.sat.i32(i32 [[A:%.*]], i32 10)
; CHECK-NEXT: ret i32 [[TMP1]]
;
%cmp = icmp ugt i32 %a, 10
%sub = add i32 %a, -10
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (a > 9) ? a + -10 : 0
; Negative test: the compare constant (9) is one less than the subtracted
; constant (10). The expected output is the input unchanged.
define i32 @max_sub_ugt_c910(i32 %a) {
; CHECK-LABEL: @max_sub_ugt_c910(
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i32 [[A:%.*]], 9
; CHECK-NEXT: [[SUB:%.*]] = add i32 [[A]], -10
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i32 [[SUB]], i32 0
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp ugt i32 %a, 9
%sub = add i32 %a, -10
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (a > 11) ? a + -10 : 0
; Negative test: the compare constant (11) is one more than the subtracted
; constant (10). The expected output is the input unchanged.
define i32 @max_sub_ugt_c1110(i32 %a) {
; CHECK-LABEL: @max_sub_ugt_c1110(
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i32 [[A:%.*]], 11
; CHECK-NEXT: [[SUB:%.*]] = add i32 [[A]], -10
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i32 [[SUB]], i32 0
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp ugt i32 %a, 11
%sub = add i32 %a, -10
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (a >u -1) ? a + 0 : 0
; -1 is the all-ones i32 value, i.e. the largest unsigned value, so the
; compare can never be true. The expected output is a constant "ret i32 0".
define i32 @max_sub_ugt_c0(i32 %a) {
; CHECK-LABEL: @max_sub_ugt_c0(
; CHECK-NEXT: ret i32 0
;
%cmp = icmp ugt i32 %a, -1
%sub = add i32 %a, 0
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (a > 1) ? a + -2 : 0
; Negative test: the compare constant (1) does not match the subtracted
; constant (2). The expected output is the input unchanged.
define i32 @max_sub_ugt_cmiss(i32 %a) {
; CHECK-LABEL: @max_sub_ugt_cmiss(
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i32 [[A:%.*]], 1
; CHECK-NEXT: [[SUB:%.*]] = add i32 [[A]], -2
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i32 [[SUB]], i32 0
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp ugt i32 %a, 1
%sub = add i32 %a, -2
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (a < 1) ? a + -1 : 0
; The compare is only true for a == 0, where the add yields -1. The expected
; output is "icmp eq a, 0" sign-extended to i32 (-1 or 0); no intrinsic is
; formed.
define i32 @max_sub_ult_c1(i32 %a) {
; CHECK-LABEL: @max_sub_ult_c1(
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i32 [[A:%.*]], 0
; CHECK-NEXT: [[SEL:%.*]] = sext i1 [[CMP]] to i32
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp ult i32 %a, 1
%sub = add i32 %a, -1
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (a < 2) ? a + -2 : 0 -> -usub.sat(2, a)
; Negated constant form: the constant is the first intrinsic operand, and the
; expected negation is a "sub nsw 0, x".
define i32 @max_sub_ult_c2(i32 %a) {
; CHECK-LABEL: @max_sub_ult_c2(
; CHECK-NEXT: [[TMP1:%.*]] = call i32 @llvm.usub.sat.i32(i32 2, i32 [[A:%.*]])
; CHECK-NEXT: [[TMP2:%.*]] = sub nsw i32 0, [[TMP1]]
; CHECK-NEXT: ret i32 [[TMP2]]
;
%cmp = icmp ult i32 %a, 2
%sub = add i32 %a, -2
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; Same pattern as @max_sub_ult_c2, but %cmp has a second use (the call to
; @usei1). Expected output: the icmp is kept for that call and the select is
; still replaced by the negated usub.sat(2, a).
define i32 @max_sub_ult_c2_oneuseicmp(i32 %a) {
; CHECK-LABEL: @max_sub_ult_c2_oneuseicmp(
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i32 [[A:%.*]], 2
; CHECK-NEXT: [[TMP1:%.*]] = call i32 @llvm.usub.sat.i32(i32 2, i32 [[A]])
; CHECK-NEXT: [[TMP2:%.*]] = sub nsw i32 0, [[TMP1]]
; CHECK-NEXT: call void @usei1(i1 [[CMP]])
; CHECK-NEXT: ret i32 [[TMP2]]
;
%cmp = icmp ult i32 %a, 2
%sub = add i32 %a, -2
%sel = select i1 %cmp, i32 %sub, i32 0
call void @usei1(i1 %cmp)
ret i32 %sel
}
; Same pattern as @max_sub_ult_c2, but %sub has a second use (the call to
; @usei32). Expected output: the add is kept for that call and the select is
; still replaced by the negated usub.sat(2, a).
define i32 @max_sub_ult_c2_oneusesub(i32 %a) {
; CHECK-LABEL: @max_sub_ult_c2_oneusesub(
; CHECK-NEXT: [[SUB:%.*]] = add i32 [[A:%.*]], -2
; CHECK-NEXT: [[TMP1:%.*]] = call i32 @llvm.usub.sat.i32(i32 2, i32 [[A]])
; CHECK-NEXT: [[TMP2:%.*]] = sub nsw i32 0, [[TMP1]]
; CHECK-NEXT: call void @usei32(i32 [[SUB]])
; CHECK-NEXT: ret i32 [[TMP2]]
;
%cmp = icmp ult i32 %a, 2
%sub = add i32 %a, -2
%sel = select i1 %cmp, i32 %sub, i32 0
call void @usei32(i32 %sub)
ret i32 %sel
}
; (a < 3) ? a + -2 : 0
; Negative test: the compare constant (3) does not match the subtracted
; constant (2). The expected output is the input unchanged.
define i32 @max_sub_ult_c32(i32 %a) {
; CHECK-LABEL: @max_sub_ult_c32(
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i32 [[A:%.*]], 3
; CHECK-NEXT: [[SUB:%.*]] = add i32 [[A]], -2
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i32 [[SUB]], i32 0
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp ult i32 %a, 3
%sub = add i32 %a, -2
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (3 > a) ? a + -2 : 0
; Same mismatch as @max_sub_ult_c32, but the compare is written with the
; constant on the left. Expected output: the compare appears as
; "icmp ult a, 3", the add and select remain, and no intrinsic is formed.
define i32 @max_sub_ugt_c32(i32 %a) {
; CHECK-LABEL: @max_sub_ugt_c32(
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i32 [[A:%.*]], 3
; CHECK-NEXT: [[SUB:%.*]] = add i32 [[A]], -2
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i32 [[SUB]], i32 0
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp ugt i32 3, %a
%sub = add i32 %a, -2
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (2 >= a) ? a + -2 : 0
; Non-strict compare with the constant on the left. Expected output: the
; compare appears as "icmp ult a, 3", the add and select remain, and no
; intrinsic is formed.
define i32 @max_sub_uge_c32(i32 %a) {
; CHECK-LABEL: @max_sub_uge_c32(
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i32 [[A:%.*]], 3
; CHECK-NEXT: [[SUB:%.*]] = add i32 [[A]], -2
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i32 [[SUB]], i32 0
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp uge i32 2, %a
%sub = add i32 %a, -2
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (a < 1) ? a + -2 : 0
; The compare is only true for a == 0, where the add yields -2. The expected
; output is "icmp eq a, 0" selecting between the constants -2 and 0; no
; intrinsic is formed.
define i32 @max_sub_ult_c12(i32 %a) {
; CHECK-LABEL: @max_sub_ult_c12(
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i32 [[A:%.*]], 0
; CHECK-NEXT: [[SEL:%.*]] = select i1 [[CMP]], i32 -2, i32 0
; CHECK-NEXT: ret i32 [[SEL]]
;
%cmp = icmp ult i32 %a, 1
%sub = add i32 %a, -2
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}
; (a <u 0) ? a + -1 : 0
; No unsigned value is less than 0, so the compare can never be true. The
; expected output is a constant "ret i32 0".
define i32 @max_sub_ult_c0(i32 %a) {
; CHECK-LABEL: @max_sub_ult_c0(
; CHECK-NEXT: ret i32 0
;
%cmp = icmp ult i32 %a, 0
%sub = add i32 %a, -1
%sel = select i1 %cmp, i32 %sub, i32 0
ret i32 %sel
}