Skip to content

Commit 19a625a

Browse files
committed
[SLP][NFC]Add a test with incorrect size of the external user detection.
1 parent cce4dc7 commit 19a625a

File tree

1 file changed

+56
-0
lines changed

1 file changed

+56
-0
lines changed
Lines changed: 56 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,56 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
2+
; RUN: opt -S --passes=slp-vectorizer -mtriple=aarch64 -slp-threshold=-20 -slp-vectorize-hor=0 < %s | FileCheck %s
3+
4+
define i16 @foo(i16 %in1, i16 %in2) {
5+
; CHECK-LABEL: define i16 @foo(
6+
; CHECK-SAME: i16 [[IN1:%.*]], i16 [[IN2:%.*]]) {
7+
; CHECK-NEXT: entry:
8+
; CHECK-NEXT: [[TMP0:%.*]] = insertelement <2 x i16> poison, i16 [[IN1]], i32 0
9+
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <2 x i16> [[TMP0]], <2 x i16> poison, <2 x i32> zeroinitializer
10+
; CHECK-NEXT: [[TMP2:%.*]] = insertelement <2 x i16> poison, i16 [[IN2]], i32 0
11+
; CHECK-NEXT: [[TMP3:%.*]] = shufflevector <2 x i16> [[TMP2]], <2 x i16> poison, <2 x i32> zeroinitializer
12+
; CHECK-NEXT: [[TMP4:%.*]] = mul <2 x i16> [[TMP3]], [[TMP1]]
13+
; CHECK-NEXT: [[TMP5:%.*]] = and <2 x i16> [[TMP4]], <i16 -1, i16 -1>
14+
; CHECK-NEXT: [[TMP6:%.*]] = zext <2 x i16> [[TMP5]] to <2 x i64>
15+
; CHECK-NEXT: [[TMP7:%.*]] = icmp ne <2 x i64> [[TMP6]], <i64 65533, i64 65533>
16+
; CHECK-NEXT: [[TMP8:%.*]] = extractelement <2 x i1> [[TMP7]], i32 1
17+
; CHECK-NEXT: [[ZEXT3_1:%.*]] = zext i1 [[TMP8]] to i16
18+
; CHECK-NEXT: [[TMP9:%.*]] = extractelement <2 x i16> [[TMP4]], i32 1
19+
; CHECK-NEXT: [[TMP10:%.*]] = zext i16 [[TMP9]] to i64
20+
; CHECK-NEXT: [[CMP2_1:%.*]] = icmp ne i64 [[TMP10]], 196605
21+
; CHECK-NEXT: [[ZEXT4_1:%.*]] = zext i1 [[CMP2_1]] to i16
22+
; CHECK-NEXT: [[ADD1:%.*]] = add nuw nsw i16 [[ZEXT3_1]], [[ZEXT4_1]]
23+
; CHECK-NEXT: [[TMP11:%.*]] = extractelement <2 x i1> [[TMP7]], i32 0
24+
; CHECK-NEXT: [[ZEXT3_2:%.*]] = zext i1 [[TMP11]] to i16
25+
; CHECK-NEXT: [[TMP12:%.*]] = extractelement <2 x i16> [[TMP4]], i32 0
26+
; CHECK-NEXT: [[TMP13:%.*]] = zext i16 [[TMP12]] to i64
27+
; CHECK-NEXT: [[CMP2_2:%.*]] = icmp ne i64 [[TMP13]], 196605
28+
; CHECK-NEXT: [[ZEXT4_2:%.*]] = zext i1 [[CMP2_2]] to i16
29+
; CHECK-NEXT: [[ADD2:%.*]] = add nuw nsw i16 [[ADD1]], [[ZEXT4_2]]
30+
; CHECK-NEXT: [[ADD3:%.*]] = add nuw nsw i16 [[ADD2]], [[ZEXT3_2]]
31+
; CHECK-NEXT: ret i16 [[ADD3]]
32+
;
33+
entry:
34+
%zext1_1 = zext i16 %in1 to i64
35+
%zext2_1 = zext i16 %in2 to i64
36+
%mul1 = mul nuw nsw i64 %zext2_1, %zext1_1
37+
%and1 = and i64 %mul1, 65535
38+
%cmp1_1 = icmp ne i64 %and1, 65533
39+
%zext3_1 = zext i1 %cmp1_1 to i16
40+
%cmp2_1 = icmp ne i64 %mul1, 196605
41+
%zext4_1 = zext i1 %cmp2_1 to i16
42+
%add1 = add nuw nsw i16 %zext3_1, %zext4_1
43+
%zext1_2 = zext i16 %in1 to i64
44+
%zext2_2 = zext i16 %in2 to i64
45+
%mul2 = mul nuw nsw i64 %zext2_2, %zext1_2
46+
%and2 = and i64 %mul2, 65535
47+
%cmp1_2 = icmp ne i64 %and2, 65533
48+
%zext3_2 = zext i1 %cmp1_2 to i16
49+
%cmp2_2 = icmp ne i64 %mul2, 196605
50+
%zext4_2 = zext i1 %cmp2_2 to i16
51+
%add2 = add nuw nsw i16 %add1, %zext4_2
52+
%add3 = add nuw nsw i16 %add2, %zext3_2
53+
ret i16 %add3
54+
}
55+
56+

0 commit comments

Comments
 (0)