@@ -14,15 +14,18 @@ define <8 x i16> @test_x86_vcvtps2ph_128(<4 x float> %a0) #0 {
14
14
; CHECK-SAME: <4 x float> [[A0:%.*]]) #[[ATTR0:[0-9]+]] {
15
15
; CHECK-NEXT: [[TMP1:%.*]] = load <4 x i32>, ptr @__msan_param_tls, align 8
16
16
; CHECK-NEXT: call void @llvm.donothing()
17
- ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <4 x i32> [[TMP1]] to i128
18
- ; CHECK-NEXT: [[_MSCMP:%.*]] = icmp ne i128 [[TMP2]], 0
19
- ; CHECK-NEXT: br i1 [[_MSCMP]], label %[[BB3:.*]], label %[[BB4:.*]], !prof [[PROF1:![0-9]+]]
20
- ; CHECK: [[BB3]]:
21
- ; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4:[0-9]+]]
22
- ; CHECK-NEXT: unreachable
23
- ; CHECK: [[BB4]]:
17
+ ; CHECK-NEXT: [[TMP2:%.*]] = icmp ne <4 x i32> [[TMP1]], zeroinitializer
18
+ ; CHECK-NEXT: [[TMP3:%.*]] = sext <4 x i1> [[TMP2]] to <4 x i16>
19
+ ; CHECK-NEXT: [[TMP4:%.*]] = extractelement <4 x i16> [[TMP3]], i64 0
20
+ ; CHECK-NEXT: [[TMP5:%.*]] = insertelement <8 x i16> zeroinitializer, i16 [[TMP4]], i64 0
21
+ ; CHECK-NEXT: [[TMP6:%.*]] = extractelement <4 x i16> [[TMP3]], i64 1
22
+ ; CHECK-NEXT: [[TMP7:%.*]] = insertelement <8 x i16> [[TMP5]], i16 [[TMP6]], i64 1
23
+ ; CHECK-NEXT: [[TMP8:%.*]] = extractelement <4 x i16> [[TMP3]], i64 2
24
+ ; CHECK-NEXT: [[TMP9:%.*]] = insertelement <8 x i16> [[TMP7]], i16 [[TMP8]], i64 2
25
+ ; CHECK-NEXT: [[TMP10:%.*]] = extractelement <4 x i16> [[TMP3]], i64 3
26
+ ; CHECK-NEXT: [[TMP11:%.*]] = insertelement <8 x i16> [[TMP9]], i16 [[TMP10]], i64 3
24
27
; CHECK-NEXT: [[RES:%.*]] = call <8 x i16> @llvm.x86.vcvtps2ph.128(<4 x float> [[A0]], i32 0)
25
- ; CHECK-NEXT: store <8 x i16> zeroinitializer , ptr @__msan_retval_tls, align 8
28
+ ; CHECK-NEXT: store <8 x i16> [[TMP11]] , ptr @__msan_retval_tls, align 8
26
29
; CHECK-NEXT: ret <8 x i16> [[RES]]
27
30
;
28
31
%res = call <8 x i16 > @llvm.x86.vcvtps2ph.128 (<4 x float > %a0 , i32 0 ) ; <<8 x i16>> [#uses=1]
@@ -35,15 +38,10 @@ define <8 x i16> @test_x86_vcvtps2ph_256(<8 x float> %a0) #0 {
35
38
; CHECK-SAME: <8 x float> [[A0:%.*]]) #[[ATTR0]] {
36
39
; CHECK-NEXT: [[TMP1:%.*]] = load <8 x i32>, ptr @__msan_param_tls, align 8
37
40
; CHECK-NEXT: call void @llvm.donothing()
38
- ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <8 x i32> [[TMP1]] to i256
39
- ; CHECK-NEXT: [[_MSCMP:%.*]] = icmp ne i256 [[TMP2]], 0
40
- ; CHECK-NEXT: br i1 [[_MSCMP]], label %[[BB3:.*]], label %[[BB4:.*]], !prof [[PROF1]]
41
- ; CHECK: [[BB3]]:
42
- ; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
43
- ; CHECK-NEXT: unreachable
44
- ; CHECK: [[BB4]]:
41
+ ; CHECK-NEXT: [[TMP2:%.*]] = icmp ne <8 x i32> [[TMP1]], zeroinitializer
42
+ ; CHECK-NEXT: [[TMP3:%.*]] = sext <8 x i1> [[TMP2]] to <8 x i16>
45
43
; CHECK-NEXT: [[RES:%.*]] = call <8 x i16> @llvm.x86.vcvtps2ph.256(<8 x float> [[A0]], i32 0)
46
- ; CHECK-NEXT: store <8 x i16> zeroinitializer , ptr @__msan_retval_tls, align 8
44
+ ; CHECK-NEXT: store <8 x i16> [[TMP3]] , ptr @__msan_retval_tls, align 8
47
45
; CHECK-NEXT: ret <8 x i16> [[RES]]
48
46
;
49
47
%res = call <8 x i16 > @llvm.x86.vcvtps2ph.256 (<8 x float > %a0 , i32 0 ) ; <<8 x i16>> [#uses=1]
@@ -59,24 +57,19 @@ define void @test_x86_vcvtps2ph_256_m(ptr nocapture %d, <8 x float> %a) nounwind
59
57
; CHECK-NEXT: [[TMP17:%.*]] = load <8 x i32>, ptr inttoptr (i64 add (i64 ptrtoint (ptr @__msan_param_tls to i64), i64 8) to ptr), align 8
60
58
; CHECK-NEXT: [[TMP18:%.*]] = load i64, ptr @__msan_param_tls, align 8
61
59
; CHECK-NEXT: call void @llvm.donothing()
62
- ; CHECK-NEXT: [[TMP4:%.*]] = bitcast <8 x i32> [[TMP17]] to i256
63
- ; CHECK-NEXT: [[_MSCMP:%.*]] = icmp ne i256 [[TMP4]], 0
64
- ; CHECK-NEXT: br i1 [[_MSCMP]], label %[[BB3:.*]], label %[[BB4:.*]], !prof [[PROF1]]
65
- ; CHECK: [[BB3]]:
66
- ; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
67
- ; CHECK-NEXT: unreachable
68
- ; CHECK: [[BB4]]:
60
+ ; CHECK-NEXT: [[TMP20:%.*]] = icmp ne <8 x i32> [[TMP17]], zeroinitializer
61
+ ; CHECK-NEXT: [[TMP21:%.*]] = sext <8 x i1> [[TMP20]] to <8 x i16>
69
62
; CHECK-NEXT: [[TMP0:%.*]] = tail call <8 x i16> @llvm.x86.vcvtps2ph.256(<8 x float> [[A]], i32 3)
70
63
; CHECK-NEXT: [[_MSCMP1:%.*]] = icmp ne i64 [[TMP18]], 0
71
- ; CHECK-NEXT: br i1 [[_MSCMP1]], label %[[BB6 :.*]], label %[[BB7 :.*]], !prof [[PROF1]]
72
- ; CHECK: [[BB6 ]]:
73
- ; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
64
+ ; CHECK-NEXT: br i1 [[_MSCMP1]], label %[[BB5 :.*]], label %[[BB6 :.*]], !prof [[PROF1:![0-9]+ ]]
65
+ ; CHECK: [[BB5 ]]:
66
+ ; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4:[0-9]+ ]]
74
67
; CHECK-NEXT: unreachable
75
- ; CHECK: [[BB7 ]]:
68
+ ; CHECK: [[BB6 ]]:
76
69
; CHECK-NEXT: [[TMP1:%.*]] = ptrtoint ptr [[D]] to i64
77
70
; CHECK-NEXT: [[TMP2:%.*]] = xor i64 [[TMP1]], 87960930222080
78
71
; CHECK-NEXT: [[TMP3:%.*]] = inttoptr i64 [[TMP2]] to ptr
79
- ; CHECK-NEXT: store <8 x i16> zeroinitializer , ptr [[TMP3]], align 16
72
+ ; CHECK-NEXT: store <8 x i16> [[TMP21]] , ptr [[TMP3]], align 16
80
73
; CHECK-NEXT: store <8 x i16> [[TMP0]], ptr [[D]], align 16
81
74
; CHECK-NEXT: ret void
82
75
;
@@ -93,25 +86,29 @@ define void @test_x86_vcvtps2ph_128_m(ptr nocapture %d, <4 x float> %a) nounwind
93
86
; CHECK-NEXT: [[TMP9:%.*]] = load <4 x i32>, ptr inttoptr (i64 add (i64 ptrtoint (ptr @__msan_param_tls to i64), i64 8) to ptr), align 8
94
87
; CHECK-NEXT: [[TMP10:%.*]] = load i64, ptr @__msan_param_tls, align 8
95
88
; CHECK-NEXT: call void @llvm.donothing()
96
- ; CHECK-NEXT: [[TMP5:%.*]] = bitcast <4 x i32> [[TMP9]] to i128
97
- ; CHECK-NEXT: [[_MSCMP:%.*]] = icmp ne i128 [[TMP5]], 0
98
- ; CHECK-NEXT: br i1 [[_MSCMP]], label %[[BB3:.*]], label %[[BB4:.*]], !prof [[PROF1]]
99
- ; CHECK: [[BB3]]:
100
- ; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
101
- ; CHECK-NEXT: unreachable
102
- ; CHECK: [[BB4]]:
89
+ ; CHECK-NEXT: [[TMP12:%.*]] = icmp ne <4 x i32> [[TMP9]], zeroinitializer
90
+ ; CHECK-NEXT: [[TMP13:%.*]] = sext <4 x i1> [[TMP12]] to <4 x i16>
91
+ ; CHECK-NEXT: [[TMP14:%.*]] = extractelement <4 x i16> [[TMP13]], i64 0
92
+ ; CHECK-NEXT: [[TMP5:%.*]] = insertelement <8 x i16> zeroinitializer, i16 [[TMP14]], i64 0
93
+ ; CHECK-NEXT: [[TMP6:%.*]] = extractelement <4 x i16> [[TMP13]], i64 1
94
+ ; CHECK-NEXT: [[TMP7:%.*]] = insertelement <8 x i16> [[TMP5]], i16 [[TMP6]], i64 1
95
+ ; CHECK-NEXT: [[TMP8:%.*]] = extractelement <4 x i16> [[TMP13]], i64 2
96
+ ; CHECK-NEXT: [[TMP15:%.*]] = insertelement <8 x i16> [[TMP7]], i16 [[TMP8]], i64 2
97
+ ; CHECK-NEXT: [[TMP16:%.*]] = extractelement <4 x i16> [[TMP13]], i64 3
98
+ ; CHECK-NEXT: [[TMP11:%.*]] = insertelement <8 x i16> [[TMP15]], i16 [[TMP16]], i64 3
103
99
; CHECK-NEXT: [[TMP0:%.*]] = tail call <8 x i16> @llvm.x86.vcvtps2ph.128(<4 x float> [[A]], i32 3)
100
+ ; CHECK-NEXT: [[_MSPROP:%.*]] = shufflevector <8 x i16> [[TMP11]], <8 x i16> splat (i16 -1), <4 x i32> <i32 0, i32 1, i32 2, i32 3>
104
101
; CHECK-NEXT: [[TMP1:%.*]] = shufflevector <8 x i16> [[TMP0]], <8 x i16> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
105
102
; CHECK-NEXT: [[_MSCMP1:%.*]] = icmp ne i64 [[TMP10]], 0
106
- ; CHECK-NEXT: br i1 [[_MSCMP1]], label %[[BB7 :.*]], label %[[BB8 :.*]], !prof [[PROF1]]
107
- ; CHECK: [[BB7 ]]:
103
+ ; CHECK-NEXT: br i1 [[_MSCMP1]], label %[[BB14 :.*]], label %[[BB15 :.*]], !prof [[PROF1]]
104
+ ; CHECK: [[BB14 ]]:
108
105
; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
109
106
; CHECK-NEXT: unreachable
110
- ; CHECK: [[BB8 ]]:
107
+ ; CHECK: [[BB15 ]]:
111
108
; CHECK-NEXT: [[TMP2:%.*]] = ptrtoint ptr [[D]] to i64
112
109
; CHECK-NEXT: [[TMP3:%.*]] = xor i64 [[TMP2]], 87960930222080
113
110
; CHECK-NEXT: [[TMP4:%.*]] = inttoptr i64 [[TMP3]] to ptr
114
- ; CHECK-NEXT: store <4 x i16> zeroinitializer , ptr [[TMP4]], align 8
111
+ ; CHECK-NEXT: store <4 x i16> [[_MSPROP]] , ptr [[TMP4]], align 8
115
112
; CHECK-NEXT: store <4 x i16> [[TMP1]], ptr [[D]], align 8
116
113
; CHECK-NEXT: ret void
117
114
;
@@ -129,26 +126,31 @@ define void @test_x86_vcvtps2ph_128_m2(ptr nocapture %hf4x16, <4 x float> %f4X86
129
126
; CHECK-NEXT: [[TMP0:%.*]] = load <4 x i32>, ptr inttoptr (i64 add (i64 ptrtoint (ptr @__msan_param_tls to i64), i64 8) to ptr), align 8
130
127
; CHECK-NEXT: [[TMP1:%.*]] = load i64, ptr @__msan_param_tls, align 8
131
128
; CHECK-NEXT: call void @llvm.donothing()
132
- ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <4 x i32> [[TMP0]] to i128
133
- ; CHECK-NEXT: [[_MSCMP:%.*]] = icmp ne i128 [[TMP2]], 0
134
- ; CHECK-NEXT: br i1 [[_MSCMP]], label %[[BB3:.*]], label %[[BB4:.*]], !prof [[PROF1]]
135
- ; CHECK: [[BB3]]:
136
- ; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
137
- ; CHECK-NEXT: unreachable
138
- ; CHECK: [[BB4]]:
129
+ ; CHECK-NEXT: [[TMP2:%.*]] = icmp ne <4 x i32> [[TMP0]], zeroinitializer
130
+ ; CHECK-NEXT: [[TMP3:%.*]] = sext <4 x i1> [[TMP2]] to <4 x i16>
131
+ ; CHECK-NEXT: [[TMP4:%.*]] = extractelement <4 x i16> [[TMP3]], i64 0
132
+ ; CHECK-NEXT: [[TMP5:%.*]] = insertelement <8 x i16> zeroinitializer, i16 [[TMP4]], i64 0
133
+ ; CHECK-NEXT: [[TMP6:%.*]] = extractelement <4 x i16> [[TMP3]], i64 1
134
+ ; CHECK-NEXT: [[TMP7:%.*]] = insertelement <8 x i16> [[TMP5]], i16 [[TMP6]], i64 1
135
+ ; CHECK-NEXT: [[TMP8:%.*]] = extractelement <4 x i16> [[TMP3]], i64 2
136
+ ; CHECK-NEXT: [[TMP9:%.*]] = insertelement <8 x i16> [[TMP7]], i16 [[TMP8]], i64 2
137
+ ; CHECK-NEXT: [[TMP10:%.*]] = extractelement <4 x i16> [[TMP3]], i64 3
138
+ ; CHECK-NEXT: [[TMP14:%.*]] = insertelement <8 x i16> [[TMP9]], i16 [[TMP10]], i64 3
139
139
; CHECK-NEXT: [[TMP11:%.*]] = tail call <8 x i16> @llvm.x86.vcvtps2ph.128(<4 x float> [[F4X86]], i32 3)
140
+ ; CHECK-NEXT: [[TMP13:%.*]] = bitcast <8 x i16> [[TMP14]] to <2 x i64>
140
141
; CHECK-NEXT: [[TMP12:%.*]] = bitcast <8 x i16> [[TMP11]] to <2 x double>
142
+ ; CHECK-NEXT: [[_MSPROP:%.*]] = extractelement <2 x i64> [[TMP13]], i32 0
141
143
; CHECK-NEXT: [[VECEXT:%.*]] = extractelement <2 x double> [[TMP12]], i32 0
142
144
; CHECK-NEXT: [[_MSCMP1:%.*]] = icmp ne i64 [[TMP1]], 0
143
- ; CHECK-NEXT: br i1 [[_MSCMP1]], label %[[BB7 :.*]], label %[[BB8 :.*]], !prof [[PROF1]]
144
- ; CHECK: [[BB7 ]]:
145
+ ; CHECK-NEXT: br i1 [[_MSCMP1]], label %[[BB15 :.*]], label %[[BB16 :.*]], !prof [[PROF1]]
146
+ ; CHECK: [[BB15 ]]:
145
147
; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
146
148
; CHECK-NEXT: unreachable
147
- ; CHECK: [[BB8 ]]:
149
+ ; CHECK: [[BB16 ]]:
148
150
; CHECK-NEXT: [[TMP15:%.*]] = ptrtoint ptr [[HF4X16]] to i64
149
151
; CHECK-NEXT: [[TMP16:%.*]] = xor i64 [[TMP15]], 87960930222080
150
152
; CHECK-NEXT: [[TMP17:%.*]] = inttoptr i64 [[TMP16]] to ptr
151
- ; CHECK-NEXT: store i64 0 , ptr [[TMP17]], align 8
153
+ ; CHECK-NEXT: store i64 [[_MSPROP]] , ptr [[TMP17]], align 8
152
154
; CHECK-NEXT: store double [[VECEXT]], ptr [[HF4X16]], align 8
153
155
; CHECK-NEXT: ret void
154
156
;
@@ -167,27 +169,32 @@ define void @test_x86_vcvtps2ph_128_m3(ptr nocapture %hf4x16, <4 x float> %f4X86
167
169
; CHECK-NEXT: [[TMP0:%.*]] = load <4 x i32>, ptr inttoptr (i64 add (i64 ptrtoint (ptr @__msan_param_tls to i64), i64 8) to ptr), align 8
168
170
; CHECK-NEXT: [[TMP1:%.*]] = load i64, ptr @__msan_param_tls, align 8
169
171
; CHECK-NEXT: call void @llvm.donothing()
170
- ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <4 x i32> [[TMP0]] to i128
171
- ; CHECK-NEXT: [[_MSCMP:%.*]] = icmp ne i128 [[TMP2]], 0
172
- ; CHECK-NEXT: br i1 [[_MSCMP]], label %[[BB3:.*]], label %[[BB4:.*]], !prof [[PROF1]]
173
- ; CHECK: [[BB3]]:
174
- ; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
175
- ; CHECK-NEXT: unreachable
176
- ; CHECK: [[BB4]]:
172
+ ; CHECK-NEXT: [[TMP2:%.*]] = icmp ne <4 x i32> [[TMP0]], zeroinitializer
173
+ ; CHECK-NEXT: [[TMP3:%.*]] = sext <4 x i1> [[TMP2]] to <4 x i16>
174
+ ; CHECK-NEXT: [[TMP4:%.*]] = extractelement <4 x i16> [[TMP3]], i64 0
175
+ ; CHECK-NEXT: [[TMP5:%.*]] = insertelement <8 x i16> zeroinitializer, i16 [[TMP4]], i64 0
176
+ ; CHECK-NEXT: [[TMP6:%.*]] = extractelement <4 x i16> [[TMP3]], i64 1
177
+ ; CHECK-NEXT: [[TMP7:%.*]] = insertelement <8 x i16> [[TMP5]], i16 [[TMP6]], i64 1
178
+ ; CHECK-NEXT: [[TMP8:%.*]] = extractelement <4 x i16> [[TMP3]], i64 2
179
+ ; CHECK-NEXT: [[TMP9:%.*]] = insertelement <8 x i16> [[TMP7]], i16 [[TMP8]], i64 2
180
+ ; CHECK-NEXT: [[TMP10:%.*]] = extractelement <4 x i16> [[TMP3]], i64 3
181
+ ; CHECK-NEXT: [[TMP13:%.*]] = insertelement <8 x i16> [[TMP9]], i16 [[TMP10]], i64 3
177
182
; CHECK-NEXT: [[TMP11:%.*]] = tail call <8 x i16> @llvm.x86.vcvtps2ph.128(<4 x float> [[F4X86]], i32 3)
178
- ; CHECK-NEXT: [[TMP12:%.*]] = bitcast <8 x i16> [[TMP11]] to <2 x i64>
183
+ ; CHECK-NEXT: [[TMP12:%.*]] = bitcast <8 x i16> [[TMP13]] to <2 x i64>
184
+ ; CHECK-NEXT: [[TMP14:%.*]] = bitcast <8 x i16> [[TMP11]] to <2 x i64>
179
185
; CHECK-NEXT: [[VECEXT:%.*]] = extractelement <2 x i64> [[TMP12]], i32 0
186
+ ; CHECK-NEXT: [[VECEXT1:%.*]] = extractelement <2 x i64> [[TMP14]], i32 0
180
187
; CHECK-NEXT: [[_MSCMP1:%.*]] = icmp ne i64 [[TMP1]], 0
181
- ; CHECK-NEXT: br i1 [[_MSCMP1]], label %[[BB7 :.*]], label %[[BB8 :.*]], !prof [[PROF1]]
182
- ; CHECK: [[BB7 ]]:
188
+ ; CHECK-NEXT: br i1 [[_MSCMP1]], label %[[BB15 :.*]], label %[[BB16 :.*]], !prof [[PROF1]]
189
+ ; CHECK: [[BB15 ]]:
183
190
; CHECK-NEXT: call void @__msan_warning_noreturn() #[[ATTR4]]
184
191
; CHECK-NEXT: unreachable
185
- ; CHECK: [[BB8 ]]:
192
+ ; CHECK: [[BB16 ]]:
186
193
; CHECK-NEXT: [[TMP15:%.*]] = ptrtoint ptr [[HF4X16]] to i64
187
194
; CHECK-NEXT: [[TMP16:%.*]] = xor i64 [[TMP15]], 87960930222080
188
195
; CHECK-NEXT: [[TMP17:%.*]] = inttoptr i64 [[TMP16]] to ptr
189
- ; CHECK-NEXT: store i64 0 , ptr [[TMP17]], align 8
190
- ; CHECK-NEXT: store i64 [[VECEXT ]], ptr [[HF4X16]], align 8
196
+ ; CHECK-NEXT: store i64 [[VECEXT]] , ptr [[TMP17]], align 8
197
+ ; CHECK-NEXT: store i64 [[VECEXT1 ]], ptr [[HF4X16]], align 8
191
198
; CHECK-NEXT: ret void
192
199
;
193
200
entry:
0 commit comments