forked from OSchip/llvm-project
[InstCombine] Add trunc+zext 'narrow' funnel shift tests (PR35155)
Based on the rotation equivalents in rotate.ll
This commit is contained in:
parent
bb39372e5e
commit
76996470ef
|
@ -200,3 +200,104 @@ define <2 x i64> @fshr_sub_mask_vector(<2 x i64> %x, <2 x i64> %y, <2 x i64> %a)
|
|||
%r = or <2 x i64> %shl, %shr
|
||||
ret <2 x i64> %r
|
||||
}
|
||||
|
||||
; PR35155 - these are optionally UB-free funnel shift left/right patterns that are narrowed to a smaller bitwidth.
|
||||
|
||||
define i16 @fshl_16bit(i16 %x, i16 %y, i32 %shift) {
|
||||
; CHECK-LABEL: @fshl_16bit(
|
||||
; CHECK-NEXT: [[AND:%.*]] = and i32 [[SHIFT:%.*]], 15
|
||||
; CHECK-NEXT: [[CONVX:%.*]] = zext i16 [[X:%.*]] to i32
|
||||
; CHECK-NEXT: [[SHL:%.*]] = shl i32 [[CONVX]], [[AND]]
|
||||
; CHECK-NEXT: [[SUB:%.*]] = sub nuw nsw i32 16, [[AND]]
|
||||
; CHECK-NEXT: [[CONVY:%.*]] = zext i16 [[X]] to i32
|
||||
; CHECK-NEXT: [[SHR:%.*]] = lshr i32 [[CONVY]], [[SUB]]
|
||||
; CHECK-NEXT: [[OR:%.*]] = or i32 [[SHR]], [[SHL]]
|
||||
; CHECK-NEXT: [[CONV2:%.*]] = trunc i32 [[OR]] to i16
|
||||
; CHECK-NEXT: ret i16 [[CONV2]]
|
||||
;
|
||||
%and = and i32 %shift, 15
|
||||
%convx = zext i16 %x to i32
|
||||
%shl = shl i32 %convx, %and
|
||||
%sub = sub i32 16, %and
|
||||
%convy = zext i16 %x to i32
|
||||
%shr = lshr i32 %convy, %sub
|
||||
%or = or i32 %shr, %shl
|
||||
%conv2 = trunc i32 %or to i16
|
||||
ret i16 %conv2
|
||||
}
|
||||
|
||||
; Commute the 'or' operands and try a vector type.
|
||||
|
||||
define <2 x i16> @fshl_commute_16bit_vec(<2 x i16> %x, <2 x i16> %y, <2 x i32> %shift) {
|
||||
; CHECK-LABEL: @fshl_commute_16bit_vec(
|
||||
; CHECK-NEXT: [[AND:%.*]] = and <2 x i32> [[SHIFT:%.*]], <i32 15, i32 15>
|
||||
; CHECK-NEXT: [[CONVX:%.*]] = zext <2 x i16> [[X:%.*]] to <2 x i32>
|
||||
; CHECK-NEXT: [[SHL:%.*]] = shl <2 x i32> [[CONVX]], [[AND]]
|
||||
; CHECK-NEXT: [[SUB:%.*]] = sub nuw nsw <2 x i32> <i32 16, i32 16>, [[AND]]
|
||||
; CHECK-NEXT: [[CONVY:%.*]] = zext <2 x i16> [[Y:%.*]] to <2 x i32>
|
||||
; CHECK-NEXT: [[SHR:%.*]] = lshr <2 x i32> [[CONVY]], [[SUB]]
|
||||
; CHECK-NEXT: [[OR:%.*]] = or <2 x i32> [[SHL]], [[SHR]]
|
||||
; CHECK-NEXT: [[CONV2:%.*]] = trunc <2 x i32> [[OR]] to <2 x i16>
|
||||
; CHECK-NEXT: ret <2 x i16> [[CONV2]]
|
||||
;
|
||||
%and = and <2 x i32> %shift, <i32 15, i32 15>
|
||||
%convx = zext <2 x i16> %x to <2 x i32>
|
||||
%shl = shl <2 x i32> %convx, %and
|
||||
%sub = sub <2 x i32> <i32 16, i32 16>, %and
|
||||
%convy = zext <2 x i16> %y to <2 x i32>
|
||||
%shr = lshr <2 x i32> %convy, %sub
|
||||
%or = or <2 x i32> %shl, %shr
|
||||
%conv2 = trunc <2 x i32> %or to <2 x i16>
|
||||
ret <2 x i16> %conv2
|
||||
}
|
||||
|
||||
; Change the size, shift direction (the subtract is on the left-shift), and mask op.
|
||||
|
||||
define i8 @fshr_8bit(i8 %x, i8 %y, i3 %shift) {
|
||||
; CHECK-LABEL: @fshr_8bit(
|
||||
; CHECK-NEXT: [[AND:%.*]] = zext i3 [[SHIFT:%.*]] to i32
|
||||
; CHECK-NEXT: [[CONVX:%.*]] = zext i8 [[X:%.*]] to i32
|
||||
; CHECK-NEXT: [[SHR:%.*]] = lshr i32 [[CONVX]], [[AND]]
|
||||
; CHECK-NEXT: [[SUB:%.*]] = sub nuw nsw i32 8, [[AND]]
|
||||
; CHECK-NEXT: [[CONVY:%.*]] = zext i8 [[Y:%.*]] to i32
|
||||
; CHECK-NEXT: [[SHL:%.*]] = shl i32 [[CONVY]], [[SUB]]
|
||||
; CHECK-NEXT: [[OR:%.*]] = or i32 [[SHL]], [[SHR]]
|
||||
; CHECK-NEXT: [[CONV2:%.*]] = trunc i32 [[OR]] to i8
|
||||
; CHECK-NEXT: ret i8 [[CONV2]]
|
||||
;
|
||||
%and = zext i3 %shift to i32
|
||||
%convx = zext i8 %x to i32
|
||||
%shr = lshr i32 %convx, %and
|
||||
%sub = sub i32 8, %and
|
||||
%convy = zext i8 %y to i32
|
||||
%shl = shl i32 %convy, %sub
|
||||
%or = or i32 %shl, %shr
|
||||
%conv2 = trunc i32 %or to i8
|
||||
ret i8 %conv2
|
||||
}
|
||||
|
||||
; The shifted value does not need to be a zexted value; here it is masked.
|
||||
; The shift mask could be less than the bitwidth, but this is still ok.
|
||||
|
||||
define i8 @fshr_commute_8bit(i32 %x, i32 %y, i32 %shift) {
|
||||
; CHECK-LABEL: @fshr_commute_8bit(
|
||||
; CHECK-NEXT: [[AND:%.*]] = and i32 [[SHIFT:%.*]], 3
|
||||
; CHECK-NEXT: [[CONVX:%.*]] = and i32 [[X:%.*]], 255
|
||||
; CHECK-NEXT: [[SHR:%.*]] = lshr i32 [[CONVX]], [[AND]]
|
||||
; CHECK-NEXT: [[SUB:%.*]] = sub nuw nsw i32 8, [[AND]]
|
||||
; CHECK-NEXT: [[CONVY:%.*]] = and i32 [[Y:%.*]], 255
|
||||
; CHECK-NEXT: [[SHL:%.*]] = shl i32 [[CONVY]], [[SUB]]
|
||||
; CHECK-NEXT: [[OR:%.*]] = or i32 [[SHR]], [[SHL]]
|
||||
; CHECK-NEXT: [[CONV2:%.*]] = trunc i32 [[OR]] to i8
|
||||
; CHECK-NEXT: ret i8 [[CONV2]]
|
||||
;
|
||||
%and = and i32 %shift, 3
|
||||
%convx = and i32 %x, 255
|
||||
%shr = lshr i32 %convx, %and
|
||||
%sub = sub i32 8, %and
|
||||
%convy = and i32 %y, 255
|
||||
%shl = shl i32 %convy, %sub
|
||||
%or = or i32 %shr, %shl
|
||||
%conv2 = trunc i32 %or to i8
|
||||
ret i8 %conv2
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue