@@ -77,79 +77,188 @@ define i32 @par(i32 %a, i32 %b, i32 %c, i32 %d) {
77
77
ret i32 %t3
78
78
}
79
79
80
- ; In the following tests, verify that a bitcast doesn't get in the way
81
- ; of a select transform. These bitcasts are common in SSE/AVX and possibly
80
+ ; In the following tests (8 commutation variants) , verify that a bitcast doesn't get
81
+ ; in the way of a select transform. These bitcasts are common in SSE/AVX and possibly
82
82
; other vector code because of canonicalization to i64 elements for vectors.
83
83
84
- define <2 x i64 > @bitcast_select (<4 x i1 > %cmp , <2 x i64 > %a , <2 x i64 > %b ) {
85
- ; CHECK-LABEL: @bitcast_select(
86
- ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> %a to <4 x i32>
87
- ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> %b to <4 x i32>
84
+ ; The fptosi instructions are included to avoid commutation canonicalization based on
85
+ ; operator weight. Using another cast operator ensures that both operands of all logic
86
+ ; ops are equally weighted, and this ensures that we're testing all commutation
87
+ ; possibilities.
88
+
89
+ define <2 x i64 > @bitcast_select_swap0 (<4 x i1 > %cmp , <2 x double > %a , <2 x double > %b ) {
90
+ ; CHECK-LABEL: @bitcast_select_swap0(
91
+ ; CHECK-NEXT: [[SIA:%.*]] = fptosi <2 x double> %a to <2 x i64>
92
+ ; CHECK-NEXT: [[SIB:%.*]] = fptosi <2 x double> %b to <2 x i64>
93
+ ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> [[SIA]] to <4 x i32>
94
+ ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> [[SIB]] to <4 x i32>
95
+ ; CHECK-NEXT: [[TMP3:%.*]] = select <4 x i1> %cmp, <4 x i32> [[TMP1]], <4 x i32> [[TMP2]]
96
+ ; CHECK-NEXT: [[OR:%.*]] = bitcast <4 x i32> [[TMP3]] to <2 x i64>
97
+ ; CHECK-NEXT: ret <2 x i64> [[OR]]
98
+ ;
99
+ %sia = fptosi <2 x double > %a to <2 x i64 >
100
+ %sib = fptosi <2 x double > %b to <2 x i64 >
101
+ %sext = sext <4 x i1 > %cmp to <4 x i32 >
102
+ %bc1 = bitcast <4 x i32 > %sext to <2 x i64 >
103
+ %and1 = and <2 x i64 > %bc1 , %sia
104
+ %neg = xor <4 x i32 > %sext , <i32 -1 , i32 -1 , i32 -1 , i32 -1 >
105
+ %bc2 = bitcast <4 x i32 > %neg to <2 x i64 >
106
+ %and2 = and <2 x i64 > %bc2 , %sib
107
+ %or = or <2 x i64 > %and1 , %and2
108
+ ret <2 x i64 > %or
109
+ }
110
+
111
+ define <2 x i64 > @bitcast_select_swap1 (<4 x i1 > %cmp , <2 x double > %a , <2 x double > %b ) {
112
+ ; CHECK-LABEL: @bitcast_select_swap1(
113
+ ; CHECK-NEXT: [[SIA:%.*]] = fptosi <2 x double> %a to <2 x i64>
114
+ ; CHECK-NEXT: [[SIB:%.*]] = fptosi <2 x double> %b to <2 x i64>
115
+ ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> [[SIA]] to <4 x i32>
116
+ ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> [[SIB]] to <4 x i32>
117
+ ; CHECK-NEXT: [[TMP3:%.*]] = select <4 x i1> %cmp, <4 x i32> [[TMP1]], <4 x i32> [[TMP2]]
118
+ ; CHECK-NEXT: [[OR:%.*]] = bitcast <4 x i32> [[TMP3]] to <2 x i64>
119
+ ; CHECK-NEXT: ret <2 x i64> [[OR]]
120
+ ;
121
+ %sia = fptosi <2 x double > %a to <2 x i64 >
122
+ %sib = fptosi <2 x double > %b to <2 x i64 >
123
+ %sext = sext <4 x i1 > %cmp to <4 x i32 >
124
+ %bc1 = bitcast <4 x i32 > %sext to <2 x i64 >
125
+ %and1 = and <2 x i64 > %bc1 , %sia
126
+ %neg = xor <4 x i32 > %sext , <i32 -1 , i32 -1 , i32 -1 , i32 -1 >
127
+ %bc2 = bitcast <4 x i32 > %neg to <2 x i64 >
128
+ %and2 = and <2 x i64 > %bc2 , %sib
129
+ %or = or <2 x i64 > %and2 , %and1
130
+ ret <2 x i64 > %or
131
+ }
132
+
133
+ define <2 x i64 > @bitcast_select_swap2 (<4 x i1 > %cmp , <2 x double > %a , <2 x double > %b ) {
134
+ ; CHECK-LABEL: @bitcast_select_swap2(
135
+ ; CHECK-NEXT: [[SIA:%.*]] = fptosi <2 x double> %a to <2 x i64>
136
+ ; CHECK-NEXT: [[SIB:%.*]] = fptosi <2 x double> %b to <2 x i64>
137
+ ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> [[SIA]] to <4 x i32>
138
+ ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> [[SIB]] to <4 x i32>
139
+ ; CHECK-NEXT: [[TMP3:%.*]] = select <4 x i1> %cmp, <4 x i32> [[TMP1]], <4 x i32> [[TMP2]]
140
+ ; CHECK-NEXT: [[OR:%.*]] = bitcast <4 x i32> [[TMP3]] to <2 x i64>
141
+ ; CHECK-NEXT: ret <2 x i64> [[OR]]
142
+ ;
143
+ %sia = fptosi <2 x double > %a to <2 x i64 >
144
+ %sib = fptosi <2 x double > %b to <2 x i64 >
145
+ %sext = sext <4 x i1 > %cmp to <4 x i32 >
146
+ %bc1 = bitcast <4 x i32 > %sext to <2 x i64 >
147
+ %and1 = and <2 x i64 > %bc1 , %sia
148
+ %neg = xor <4 x i32 > %sext , <i32 -1 , i32 -1 , i32 -1 , i32 -1 >
149
+ %bc2 = bitcast <4 x i32 > %neg to <2 x i64 >
150
+ %and2 = and <2 x i64 > %sib , %bc2
151
+ %or = or <2 x i64 > %and1 , %and2
152
+ ret <2 x i64 > %or
153
+ }
154
+
155
+ define <2 x i64 > @bitcast_select_swap3 (<4 x i1 > %cmp , <2 x double > %a , <2 x double > %b ) {
156
+ ; CHECK-LABEL: @bitcast_select_swap3(
157
+ ; CHECK-NEXT: [[SIA:%.*]] = fptosi <2 x double> %a to <2 x i64>
158
+ ; CHECK-NEXT: [[SIB:%.*]] = fptosi <2 x double> %b to <2 x i64>
159
+ ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> [[SIA]] to <4 x i32>
160
+ ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> [[SIB]] to <4 x i32>
161
+ ; CHECK-NEXT: [[TMP3:%.*]] = select <4 x i1> %cmp, <4 x i32> [[TMP1]], <4 x i32> [[TMP2]]
162
+ ; CHECK-NEXT: [[OR:%.*]] = bitcast <4 x i32> [[TMP3]] to <2 x i64>
163
+ ; CHECK-NEXT: ret <2 x i64> [[OR]]
164
+ ;
165
+ %sia = fptosi <2 x double > %a to <2 x i64 >
166
+ %sib = fptosi <2 x double > %b to <2 x i64 >
167
+ %sext = sext <4 x i1 > %cmp to <4 x i32 >
168
+ %bc1 = bitcast <4 x i32 > %sext to <2 x i64 >
169
+ %and1 = and <2 x i64 > %bc1 , %sia
170
+ %neg = xor <4 x i32 > %sext , <i32 -1 , i32 -1 , i32 -1 , i32 -1 >
171
+ %bc2 = bitcast <4 x i32 > %neg to <2 x i64 >
172
+ %and2 = and <2 x i64 > %sib , %bc2
173
+ %or = or <2 x i64 > %and2 , %and1
174
+ ret <2 x i64 > %or
175
+ }
176
+
177
+ define <2 x i64 > @bitcast_select_swap4 (<4 x i1 > %cmp , <2 x double > %a , <2 x double > %b ) {
178
+ ; CHECK-LABEL: @bitcast_select_swap4(
179
+ ; CHECK-NEXT: [[SIA:%.*]] = fptosi <2 x double> %a to <2 x i64>
180
+ ; CHECK-NEXT: [[SIB:%.*]] = fptosi <2 x double> %b to <2 x i64>
181
+ ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> [[SIA]] to <4 x i32>
182
+ ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> [[SIB]] to <4 x i32>
88
183
; CHECK-NEXT: [[TMP3:%.*]] = select <4 x i1> %cmp, <4 x i32> [[TMP1]], <4 x i32> [[TMP2]]
89
184
; CHECK-NEXT: [[OR:%.*]] = bitcast <4 x i32> [[TMP3]] to <2 x i64>
90
185
; CHECK-NEXT: ret <2 x i64> [[OR]]
91
186
;
187
+ %sia = fptosi <2 x double > %a to <2 x i64 >
188
+ %sib = fptosi <2 x double > %b to <2 x i64 >
92
189
%sext = sext <4 x i1 > %cmp to <4 x i32 >
93
- %t2 = bitcast <4 x i32 > %sext to <2 x i64 >
94
- %and = and <2 x i64 > %t2 , %a
190
+ %bc1 = bitcast <4 x i32 > %sext to <2 x i64 >
191
+ %and1 = and <2 x i64 > %sia , %bc1
95
192
%neg = xor <4 x i32 > %sext , <i32 -1 , i32 -1 , i32 -1 , i32 -1 >
96
- %neg2 = bitcast <4 x i32 > %neg to <2 x i64 >
97
- %and2 = and <2 x i64 > %neg2 , %b
98
- %or = or <2 x i64 > %and , %and2
193
+ %bc2 = bitcast <4 x i32 > %neg to <2 x i64 >
194
+ %and2 = and <2 x i64 > %bc2 , %sib
195
+ %or = or <2 x i64 > %and1 , %and2
99
196
ret <2 x i64 > %or
100
197
}
101
198
102
- define <2 x i64 > @bitcast_select_swap_or_ops (<4 x i1 > %cmp , <2 x i64 > %a , <2 x i64 > %b ) {
103
- ; CHECK-LABEL: @bitcast_select_swap_or_ops(
104
- ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> %a to <4 x i32>
105
- ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> %b to <4 x i32>
199
+ define <2 x i64 > @bitcast_select_swap5 (<4 x i1 > %cmp , <2 x double > %a , <2 x double > %b ) {
200
+ ; CHECK-LABEL: @bitcast_select_swap5(
201
+ ; CHECK-NEXT: [[SIA:%.*]] = fptosi <2 x double> %a to <2 x i64>
202
+ ; CHECK-NEXT: [[SIB:%.*]] = fptosi <2 x double> %b to <2 x i64>
203
+ ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> [[SIA]] to <4 x i32>
204
+ ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> [[SIB]] to <4 x i32>
106
205
; CHECK-NEXT: [[TMP3:%.*]] = select <4 x i1> %cmp, <4 x i32> [[TMP1]], <4 x i32> [[TMP2]]
107
206
; CHECK-NEXT: [[OR:%.*]] = bitcast <4 x i32> [[TMP3]] to <2 x i64>
108
207
; CHECK-NEXT: ret <2 x i64> [[OR]]
109
208
;
209
+ %sia = fptosi <2 x double > %a to <2 x i64 >
210
+ %sib = fptosi <2 x double > %b to <2 x i64 >
110
211
%sext = sext <4 x i1 > %cmp to <4 x i32 >
111
- %t2 = bitcast <4 x i32 > %sext to <2 x i64 >
112
- %and = and <2 x i64 > %t2 , %a
212
+ %bc1 = bitcast <4 x i32 > %sext to <2 x i64 >
213
+ %and1 = and <2 x i64 > %sia , %bc1
113
214
%neg = xor <4 x i32 > %sext , <i32 -1 , i32 -1 , i32 -1 , i32 -1 >
114
- %neg2 = bitcast <4 x i32 > %neg to <2 x i64 >
115
- %and2 = and <2 x i64 > %neg2 , %b
116
- %or = or <2 x i64 > %and2 , %and
215
+ %bc2 = bitcast <4 x i32 > %neg to <2 x i64 >
216
+ %and2 = and <2 x i64 > %bc2 , %sib
217
+ %or = or <2 x i64 > %and2 , %and1
117
218
ret <2 x i64 > %or
118
219
}
119
220
120
- define <2 x i64 > @bitcast_select_swap_and_ops (<4 x i1 > %cmp , <2 x i64 > %a , <2 x i64 > %b ) {
121
- ; CHECK-LABEL: @bitcast_select_swap_and_ops(
122
- ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> %a to <4 x i32>
123
- ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> %b to <4 x i32>
221
+ define <2 x i64 > @bitcast_select_swap6 (<4 x i1 > %cmp , <2 x double > %a , <2 x double > %b ) {
222
+ ; CHECK-LABEL: @bitcast_select_swap6(
223
+ ; CHECK-NEXT: [[SIA:%.*]] = fptosi <2 x double> %a to <2 x i64>
224
+ ; CHECK-NEXT: [[SIB:%.*]] = fptosi <2 x double> %b to <2 x i64>
225
+ ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> [[SIA]] to <4 x i32>
226
+ ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> [[SIB]] to <4 x i32>
124
227
; CHECK-NEXT: [[TMP3:%.*]] = select <4 x i1> %cmp, <4 x i32> [[TMP1]], <4 x i32> [[TMP2]]
125
228
; CHECK-NEXT: [[OR:%.*]] = bitcast <4 x i32> [[TMP3]] to <2 x i64>
126
229
; CHECK-NEXT: ret <2 x i64> [[OR]]
127
230
;
231
+ %sia = fptosi <2 x double > %a to <2 x i64 >
232
+ %sib = fptosi <2 x double > %b to <2 x i64 >
128
233
%sext = sext <4 x i1 > %cmp to <4 x i32 >
129
- %t2 = bitcast <4 x i32 > %sext to <2 x i64 >
130
- %and = and <2 x i64 > %t2 , %a
234
+ %bc1 = bitcast <4 x i32 > %sext to <2 x i64 >
235
+ %and1 = and <2 x i64 > %sia , %bc1
131
236
%neg = xor <4 x i32 > %sext , <i32 -1 , i32 -1 , i32 -1 , i32 -1 >
132
- %neg2 = bitcast <4 x i32 > %neg to <2 x i64 >
133
- %and2 = and <2 x i64 > %b , %neg2
134
- %or = or <2 x i64 > %and , %and2
237
+ %bc2 = bitcast <4 x i32 > %neg to <2 x i64 >
238
+ %and2 = and <2 x i64 > %sib , %bc2
239
+ %or = or <2 x i64 > %and1 , %and2
135
240
ret <2 x i64 > %or
136
241
}
137
242
138
- define <2 x i64 > @bitcast_select_swap_and_ops2 (<4 x i1 > %cmp , <2 x i64 > %a , <2 x i64 > %b ) {
139
- ; CHECK-LABEL: @bitcast_select_swap_and_ops2(
140
- ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> %a to <4 x i32>
141
- ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> %b to <4 x i32>
243
+ define <2 x i64 > @bitcast_select_swap7 (<4 x i1 > %cmp , <2 x double > %a , <2 x double > %b ) {
244
+ ; CHECK-LABEL: @bitcast_select_swap7(
245
+ ; CHECK-NEXT: [[SIA:%.*]] = fptosi <2 x double> %a to <2 x i64>
246
+ ; CHECK-NEXT: [[SIB:%.*]] = fptosi <2 x double> %b to <2 x i64>
247
+ ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <2 x i64> [[SIA]] to <4 x i32>
248
+ ; CHECK-NEXT: [[TMP2:%.*]] = bitcast <2 x i64> [[SIB]] to <4 x i32>
142
249
; CHECK-NEXT: [[TMP3:%.*]] = select <4 x i1> %cmp, <4 x i32> [[TMP1]], <4 x i32> [[TMP2]]
143
250
; CHECK-NEXT: [[OR:%.*]] = bitcast <4 x i32> [[TMP3]] to <2 x i64>
144
251
; CHECK-NEXT: ret <2 x i64> [[OR]]
145
252
;
253
+ %sia = fptosi <2 x double > %a to <2 x i64 >
254
+ %sib = fptosi <2 x double > %b to <2 x i64 >
146
255
%sext = sext <4 x i1 > %cmp to <4 x i32 >
147
- %t2 = bitcast <4 x i32 > %sext to <2 x i64 >
148
- %and = and <2 x i64 > %a , %t2
256
+ %bc1 = bitcast <4 x i32 > %sext to <2 x i64 >
257
+ %and1 = and <2 x i64 > %sia , %bc1
149
258
%neg = xor <4 x i32 > %sext , <i32 -1 , i32 -1 , i32 -1 , i32 -1 >
150
- %neg2 = bitcast <4 x i32 > %neg to <2 x i64 >
151
- %and2 = and <2 x i64 > %neg2 , %b
152
- %or = or <2 x i64 > %and , %and2
259
+ %bc2 = bitcast <4 x i32 > %neg to <2 x i64 >
260
+ %and2 = and <2 x i64 > %sib , %bc2
261
+ %or = or <2 x i64 > %and2 , %and1
153
262
ret <2 x i64 > %or
154
263
}
155
264
0 commit comments