@@ -9,20 +9,31 @@ target triple = "aarch64-unknown-linux-gnu"
9
9
; DEBUG: Found an estimated cost of Invalid for VF vscale x 1 For instruction: %indvars.iv.next1295 = add i7 %indvars.iv1294, 1
10
10
11
11
define void @induction_i7 (ptr %dst ) #0 {
12
- ; CHECK-LABEL: @induction_i7(
12
+ ; CHECK-LABEL: define void @induction_i7(
13
+ ; CHECK-SAME: ptr [[DST:%.*]])
13
14
; CHECK: vector.ph:
14
- ; CHECK: %ind.end = trunc i64 %n.vec to i7
15
+ ; CHECK-NEXT: [[TMP2:%.*]] = call i64 @llvm.vscale.i64()
16
+ ; CHECK-NEXT: [[TMP3:%.*]] = mul i64 [[TMP2]], 4
17
+ ; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i64 64, [[TMP3]]
18
+ ; CHECK-NEXT: [[N_VEC:%.*]] = sub i64 64, [[N_MOD_VF]]
19
+ ; CHECK-NEXT: [[IND_END:%.*]] = trunc i64 [[N_VEC]] to i7
15
20
; CHECK-NEXT: [[TMP4:%.*]] = call i64 @llvm.vscale.i64()
16
21
; CHECK-NEXT: [[TMP5:%.*]] = mul i64 [[TMP4]], 4
17
22
; CHECK-NEXT: [[TMP6:%.*]] = call <vscale x 2 x i8> @llvm.experimental.stepvector.nxv2i8()
18
23
; CHECK-NEXT: [[TMP7:%.*]] = trunc <vscale x 2 x i8> [[TMP6]] to <vscale x 2 x i7>
19
24
; CHECK-NEXT: [[TMP8:%.*]] = add <vscale x 2 x i7> [[TMP7]], zeroinitializer
20
25
; CHECK-NEXT: [[TMP9:%.*]] = mul <vscale x 2 x i7> [[TMP8]], shufflevector (<vscale x 2 x i7> insertelement (<vscale x 2 x i7> poison, i7 1, i64 0), <vscale x 2 x i7> poison, <vscale x 2 x i32> zeroinitializer)
21
26
; CHECK-NEXT: [[INDUCTION:%.*]] = add <vscale x 2 x i7> zeroinitializer, [[TMP9]]
22
- ; CHECK: vector.body:
23
- ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %vector.ph ], [ [[INDEX_NEXT:%.*]], %vector.body ]
24
- ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <vscale x 2 x i7> [ [[INDUCTION]], %vector.ph ], [ [[VEC_IND_NEXT:%.*]], %vector.body ]
25
- ; CHECK-NEXT: [[STEP_ADD:%.*]] = add <vscale x 2 x i7> [[VEC_IND]], [[DOTSPLAT:%.*]]
27
+ ; CHECK-NEXT: [[TMP10:%.*]] = call i7 @llvm.vscale.i7()
28
+ ; CHECK-NEXT: [[TMP11:%.*]] = mul i7 [[TMP10]], 2
29
+ ; CHECK-NEXT: [[TMP12:%.*]] = mul i7 1, [[TMP11]]
30
+ ; CHECK-NEXT: [[DOTSPLATINSERT:%.*]] = insertelement <vscale x 2 x i7> poison, i7 [[TMP12]], i64 0
31
+ ; CHECK-NEXT: [[DOTSPLAT:%.*]] = shufflevector <vscale x 2 x i7> [[DOTSPLATINSERT]], <vscale x 2 x i7> poison, <vscale x 2 x i32> zeroinitializer
32
+ ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
33
+ ; CHECK: [[VECTOR_BODY]]:
34
+ ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %vector.ph ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ]
35
+ ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <vscale x 2 x i7> [ [[INDUCTION]], %vector.ph ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ]
36
+ ; CHECK-NEXT: [[STEP_ADD:%.*]] = add <vscale x 2 x i7> [[VEC_IND]], [[DOTSPLAT]]
26
37
; CHECK-NEXT: [[TMP13:%.*]] = add i64 [[INDEX]], 0
27
38
; CHECK-NEXT: [[TMP14:%.*]] = call i64 @llvm.vscale.i64()
28
39
; CHECK-NEXT: [[TMP15:%.*]] = mul i64 [[TMP14]], 2
@@ -31,8 +42,8 @@ define void @induction_i7(ptr %dst) #0 {
31
42
; CHECK-NEXT: [[TMP18:%.*]] = add i64 [[INDEX]], [[TMP17]]
32
43
; CHECK-NEXT: [[TMP19:%.*]] = add <vscale x 2 x i7> [[VEC_IND]], zeroinitializer
33
44
; CHECK-NEXT: [[TMP20:%.*]] = add <vscale x 2 x i7> [[STEP_ADD]], zeroinitializer
34
- ; CHECK-NEXT: [[TMP21:%.*]] = getelementptr inbounds i64, ptr [[DST:%.* ]], i64 [[TMP13]]
35
- ; CHECK-NEXT: [[TMP22:%.*]] = getelementptr inbounds i64, ptr [[DST:%.* ]], i64 [[TMP18]]
45
+ ; CHECK-NEXT: [[TMP21:%.*]] = getelementptr inbounds i64, ptr [[DST]], i64 [[TMP13]]
46
+ ; CHECK-NEXT: [[TMP22:%.*]] = getelementptr inbounds i64, ptr [[DST]], i64 [[TMP18]]
36
47
; CHECK-NEXT: [[TMP23:%.*]] = zext <vscale x 2 x i7> [[TMP19]] to <vscale x 2 x i64>
37
48
; CHECK-NEXT: [[TMP24:%.*]] = zext <vscale x 2 x i7> [[TMP20]] to <vscale x 2 x i64>
38
49
; CHECK-NEXT: [[TMP25:%.*]] = getelementptr inbounds i64, ptr [[TMP21]], i32 0
@@ -43,6 +54,9 @@ define void @induction_i7(ptr %dst) #0 {
43
54
; CHECK-NEXT: store <vscale x 2 x i64> [[TMP24]], ptr [[TMP28]], align 8
44
55
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], [[TMP5]]
45
56
; CHECK-NEXT: [[VEC_IND_NEXT]] = add <vscale x 2 x i7> [[STEP_ADD]], [[DOTSPLAT]]
57
+ ; CHECK-NEXT: [[TMP29:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]]
58
+ ; CHECK-NEXT: br i1 [[TMP29]], label %middle.block, label %[[VECTOR_BODY]]
59
+ ;
46
60
47
61
entry:
48
62
br label %for.body
@@ -69,18 +83,30 @@ for.end: ; preds = %for.body
69
83
; DEBUG: Found an estimated cost of Invalid for VF vscale x 1 For instruction: %indvars.iv.next1295 = add i3 %indvars.iv1294, 1
70
84
71
85
define void @induction_i3_zext (ptr %dst ) #0 {
72
- ; CHECK-LABEL: @induction_i3_zext(
86
+ ; CHECK-LABEL: define void @induction_i3_zext(
87
+ ; CHECK-SAME: ptr [[DST:%.*]])
73
88
; CHECK: vector.ph:
74
- ; CHECK: %ind.end = trunc i64 %n.vec to i3
89
+ ; CHECK-NEXT: [[TMP2:%.*]] = call i64 @llvm.vscale.i64()
90
+ ; CHECK-NEXT: [[TMP3:%.*]] = mul i64 [[TMP2]], 4
91
+ ; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i64 64, [[TMP3]]
92
+ ; CHECK-NEXT: [[N_VEC:%.*]] = sub i64 64, [[N_MOD_VF]]
93
+ ; CHECK-NEXT: [[IND_END:%.*]] = trunc i64 [[N_VEC]] to i3
75
94
; CHECK-NEXT: [[TMP4:%.*]] = call i64 @llvm.vscale.i64()
76
95
; CHECK-NEXT: [[TMP5:%.*]] = mul i64 [[TMP4]], 4
77
96
; CHECK-NEXT: [[TMP6:%.*]] = call <vscale x 2 x i8> @llvm.experimental.stepvector.nxv2i8()
78
97
; CHECK-NEXT: [[TMP7:%.*]] = trunc <vscale x 2 x i8> [[TMP6]] to <vscale x 2 x i3>
79
98
; CHECK-NEXT: [[TMP8:%.*]] = add <vscale x 2 x i3> [[TMP7]], zeroinitializer
80
99
; CHECK-NEXT: [[TMP9:%.*]] = mul <vscale x 2 x i3> [[TMP8]], shufflevector (<vscale x 2 x i3> insertelement (<vscale x 2 x i3> poison, i3 1, i64 0), <vscale x 2 x i3> poison, <vscale x 2 x i32> zeroinitializer)
81
- ; CHECK: vector.body:
82
- ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %vector.ph ], [ [[INDEX_NEXT:%.*]], %vector.body ]
83
- ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <vscale x 2 x i3> [ [[INDUCTION]], %vector.ph ], [ [[VEC_IND_NEXT:%.*]], %vector.body ]
100
+ ; CHECK-NEXT: [[INDUCTION:%.*]] = add <vscale x 2 x i3> zeroinitializer, [[TMP9]]
101
+ ; CHECK-NEXT: [[TMP10:%.*]] = call i3 @llvm.vscale.i3()
102
+ ; CHECK-NEXT: [[TMP11:%.*]] = mul i3 [[TMP10]], 2
103
+ ; CHECK-NEXT: [[TMP12:%.*]] = mul i3 1, [[TMP11]]
104
+ ; CHECK-NEXT: [[DOTSPLATINSERT:%.*]] = insertelement <vscale x 2 x i3> poison, i3 [[TMP12]], i64 0
105
+ ; CHECK-NEXT: [[DOTSPLAT:%.*]] = shufflevector <vscale x 2 x i3> [[DOTSPLATINSERT]], <vscale x 2 x i3> poison, <vscale x 2 x i32> zeroinitializer
106
+ ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
107
+ ; CHECK: [[VECTOR_BODY]]:
108
+ ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %vector.ph ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ]
109
+ ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <vscale x 2 x i3> [ [[INDUCTION]], %vector.ph ], [ [[VEC_IND_NEXT:%.*]], %[[VECTOR_BODY]] ]
84
110
; CHECK-NEXT: [[STEP_ADD:%.*]] = add <vscale x 2 x i3> [[VEC_IND]], [[DOTSPLAT]]
85
111
; CHECK-NEXT: [[TMP13:%.*]] = add i64 [[INDEX]], 0
86
112
; CHECK-NEXT: [[TMP14:%.*]] = call i64 @llvm.vscale.i64()
@@ -100,6 +126,9 @@ define void @induction_i3_zext(ptr %dst) #0 {
100
126
; CHECK-NEXT: store <vscale x 2 x i64> [[TMP20]], ptr [[TMP26]], align 8
101
127
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], [[TMP5]]
102
128
; CHECK-NEXT: [[VEC_IND_NEXT]] = add <vscale x 2 x i3> [[STEP_ADD]], [[DOTSPLAT]]
129
+ ; CHECK-NEXT: [[TMP27:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]]
130
+ ; CHECK-NEXT: br i1 [[TMP27]], label %middle.block, label %[[VECTOR_BODY]]
131
+ ;
103
132
entry:
104
133
br label %for.body
105
134
0 commit comments