Thanks for visiting codestin.com
Credit goes to github.com

Skip to content

Commit ead4f3e

Browse files
authored
[InstCombine] Canonicalize active lane mask params (#158065)
Rewrite active lane mask intrinsics to begin their range from 0 when both parameters are constant integers.
1 parent 7ebfcbd commit ead4f3e

File tree

2 files changed

+51
-0
lines changed

2 files changed

+51
-0
lines changed

llvm/lib/Transforms/InstCombine/InstCombineCalls.cpp

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3952,6 +3952,19 @@ Instruction *InstCombinerImpl::visitCallInst(CallInst &CI) {
39523952
}
39533953
break;
39543954
}
3955+
// Canonicalize llvm.get.active.lane.mask calls with constant operands so that
// the first operand becomes 0.
case Intrinsic::get_active_lane_mask: {
3956+
const APInt *Op0, *Op1;
3957+
// Only fires when operand 0 matches m_StrictlyPositive (so a first operand of
// 0 is left alone) and operand 1 matches m_APInt.
if (match(II->getOperand(0), m_StrictlyPositive(Op0)) &&
3958+
match(II->getOperand(1), m_APInt(Op1))) {
3959+
// Both replacement operands are built in the type of the original operand 0.
Type *OpTy = II->getOperand(0)->getType();
3960+
// Replace all uses with a new call to the same intrinsic and result type.
// NOTE(review): presumably sound because the mask depends only on the
// distance between the two operands -- confirm against the LangRef.
return replaceInstUsesWith(
3961+
*II, Builder.CreateIntrinsic(
3962+
II->getType(), Intrinsic::get_active_lane_mask,
3963+
// New first operand: the zero value of OpTy.
{Constant::getNullValue(OpTy),
3964+
// New second operand: Op1 - Op0 computed with APInt::usub_sat.
ConstantInt::get(OpTy, Op1->usub_sat(*Op0))}));
3965+
}
3966+
// No match: leave the switch without rewriting this call here.
break;
3967+
}
39553968
default: {
39563969
// Handle target specific intrinsics
39573970
std::optional<Instruction *> V = targetInstCombineIntrinsic(*II);
Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2+
; RUN: opt < %s -passes=instcombine -S | FileCheck %s
3+
4+
; i32 operands (1, 4): the CHECK lines expect the call rewritten to (0, 3).
define <vscale x 4 x i1> @rewrite_range_nxv4i1() {
5+
; CHECK-LABEL: define <vscale x 4 x i1> @rewrite_range_nxv4i1() {
6+
; CHECK-NEXT: [[MASK:%.*]] = call <vscale x 4 x i1> @llvm.get.active.lane.mask.nxv4i1.i32(i32 0, i32 3)
7+
; CHECK-NEXT: ret <vscale x 4 x i1> [[MASK]]
8+
;
9+
%mask = call <vscale x 4 x i1> @llvm.get.active.lane.mask.nxv4i1.i32(i32 1, i32 4)
10+
ret <vscale x 4 x i1> %mask
11+
}
12+
13+
; i64 operands (123123, 123130): the CHECK lines expect the call rewritten to
; (0, 7).
define <vscale x 16 x i1> @rewrite_range_nxv16i1() {
14+
; CHECK-LABEL: define <vscale x 16 x i1> @rewrite_range_nxv16i1() {
15+
; CHECK-NEXT: [[MASK:%.*]] = call <vscale x 16 x i1> @llvm.get.active.lane.mask.nxv16i1.i64(i64 0, i64 7)
16+
; CHECK-NEXT: ret <vscale x 16 x i1> [[MASK]]
17+
;
18+
%mask = call <vscale x 16 x i1> @llvm.get.active.lane.mask.nxv16i1.i64(i64 123123, i64 123130)
19+
ret <vscale x 16 x i1> %mask
20+
}
21+
22+
; i128 operands (2^64, 2^64 + 10), i.e. constants wider than 64 bits: the CHECK
; lines expect the call rewritten to (0, 10).
define <vscale x 16 x i1> @rewrite_range_nxv16i1_i128() {
23+
; CHECK-LABEL: define <vscale x 16 x i1> @rewrite_range_nxv16i1_i128() {
24+
; CHECK-NEXT: [[MASK:%.*]] = call <vscale x 16 x i1> @llvm.get.active.lane.mask.nxv16i1.i128(i128 0, i128 10)
25+
; CHECK-NEXT: ret <vscale x 16 x i1> [[MASK]]
26+
;
27+
%mask = call <vscale x 16 x i1> @llvm.get.active.lane.mask.nxv16i1.i128(i128 18446744073709551616, i128 18446744073709551626)
28+
ret <vscale x 16 x i1> %mask
29+
}
30+
31+
; Negative test: the first operand is already 0, so the CHECK lines expect the
; call to stay as (0, 4), unchanged.
define <vscale x 4 x i1> @bail_lhs_is_zero() {
32+
; CHECK-LABEL: define <vscale x 4 x i1> @bail_lhs_is_zero() {
33+
; CHECK-NEXT: [[MASK:%.*]] = call <vscale x 4 x i1> @llvm.get.active.lane.mask.nxv4i1.i32(i32 0, i32 4)
34+
; CHECK-NEXT: ret <vscale x 4 x i1> [[MASK]]
35+
;
36+
%mask = call <vscale x 4 x i1> @llvm.get.active.lane.mask.nxv4i1.i32(i32 0, i32 4)
37+
ret <vscale x 4 x i1> %mask
38+
}

0 commit comments

Comments
 (0)