@@ -143,31 +143,31 @@ define <4 x i32> @test_urem_odd_div(<4 x i32> %X) nounwind readnone {
143
143
define <4 x i32 > @test_urem_even_div (<4 x i32 > %X ) nounwind readnone {
144
144
; CHECK-SSE2-LABEL: test_urem_even_div:
145
145
; CHECK-SSE2: # %bb.0:
146
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[0,1,2,0 ]
147
- ; CHECK-SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2863311531,3435973837,2863311531,2454267027]
148
- ; CHECK-SSE2-NEXT: pmuludq %xmm2 , %xmm1
149
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1 [1,3,2,3]
146
+ ; CHECK-SSE2-NEXT: movdqa {{.*#+}} xmm1 = [2863311531,3435973837,2863311531,2454267027 ]
147
+ ; CHECK-SSE2-NEXT: movdqa %xmm0, % xmm2
148
+ ; CHECK-SSE2-NEXT: pmuludq %xmm1 , %xmm2
149
+ ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm2 = xmm2 [1,3,2,3]
150
150
; CHECK-SSE2-NEXT: movdqa %xmm0, %xmm3
151
151
; CHECK-SSE2-NEXT: psrld $1, %xmm3
152
152
; CHECK-SSE2-NEXT: movdqa %xmm0, %xmm4
153
153
; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm4 = xmm4[1,1],xmm3[3,3]
154
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm2 = xmm2 [1,1,3,3]
155
- ; CHECK-SSE2-NEXT: pmuludq %xmm4, %xmm2
156
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm2 = xmm2 [1,3,2,3]
157
- ; CHECK-SSE2-NEXT: punpckldq {{.*#+}} xmm1 = xmm1 [0],xmm2 [0],xmm1 [1],xmm2 [1]
158
- ; CHECK-SSE2-NEXT: movdqa %xmm1 , %xmm2
159
- ; CHECK-SSE2-NEXT: psrld $2, %xmm2
160
- ; CHECK-SSE2-NEXT: psrld $3, %xmm1
161
- ; CHECK-SSE2-NEXT: movdqa %xmm1 , %xmm3
162
- ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm3 = xmm3[1,1],xmm2 [3,3]
154
+ ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1 [1,1,3,3]
155
+ ; CHECK-SSE2-NEXT: pmuludq %xmm4, %xmm1
156
+ ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1 [1,3,2,3]
157
+ ; CHECK-SSE2-NEXT: punpckldq {{.*#+}} xmm2 = xmm2 [0],xmm1 [0],xmm2 [1],xmm1 [1]
158
+ ; CHECK-SSE2-NEXT: movdqa %xmm2 , %xmm1
159
+ ; CHECK-SSE2-NEXT: psrld $2, %xmm1
160
+ ; CHECK-SSE2-NEXT: psrld $3, %xmm2
161
+ ; CHECK-SSE2-NEXT: movdqa %xmm2 , %xmm3
162
+ ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm3 = xmm3[1,1],xmm1 [3,3]
163
163
; CHECK-SSE2-NEXT: movdqa {{.*#+}} xmm4 = [6,10,12,14]
164
164
; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm5 = xmm4[1,1,3,3]
165
165
; CHECK-SSE2-NEXT: pmuludq %xmm3, %xmm5
166
166
; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm3 = xmm5[0,2,2,3]
167
- ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm2 = xmm2 [0,3],xmm1 [1,2]
168
- ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm2 = xmm2 [0,2,3,1]
169
- ; CHECK-SSE2-NEXT: pmuludq %xmm4, %xmm2
170
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm2 [0,2,2,3]
167
+ ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1 [0,3],xmm2 [1,2]
168
+ ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm1 = xmm1 [0,2,3,1]
169
+ ; CHECK-SSE2-NEXT: pmuludq %xmm4, %xmm1
170
+ ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1 [0,2,2,3]
171
171
; CHECK-SSE2-NEXT: punpckldq {{.*#+}} xmm1 = xmm1[0],xmm3[0],xmm1[1],xmm3[1]
172
172
; CHECK-SSE2-NEXT: psubd %xmm1, %xmm0
173
173
; CHECK-SSE2-NEXT: pxor %xmm1, %xmm1
@@ -377,30 +377,30 @@ define <4 x i32> @test_urem_pow2(<4 x i32> %X) nounwind readnone {
377
377
define <4 x i32 > @test_urem_one (<4 x i32 > %X ) nounwind readnone {
378
378
; CHECK-SSE2-LABEL: test_urem_one:
379
379
; CHECK-SSE2: # %bb.0:
380
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm0[0,1,2,0 ]
381
- ; CHECK-SSE2-NEXT: movdqa {{.*#+}} xmm2 = [2863311531,0,2863311531,2454267027]
382
- ; CHECK-SSE2-NEXT: pmuludq %xmm2 , %xmm1
383
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1 [1,3,2,3]
380
+ ; CHECK-SSE2-NEXT: movdqa {{.*#+}} xmm1 = [2863311531,0,2863311531,2454267027 ]
381
+ ; CHECK-SSE2-NEXT: movdqa %xmm0, % xmm2
382
+ ; CHECK-SSE2-NEXT: pmuludq %xmm1 , %xmm2
383
+ ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm2 = xmm2 [1,3,2,3]
384
384
; CHECK-SSE2-NEXT: movdqa %xmm0, %xmm3
385
385
; CHECK-SSE2-NEXT: psrld $1, %xmm3
386
386
; CHECK-SSE2-NEXT: movdqa %xmm0, %xmm4
387
387
; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm4 = xmm4[1,1],xmm3[3,3]
388
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm2 = xmm2 [1,1,3,3]
389
- ; CHECK-SSE2-NEXT: pmuludq %xmm4, %xmm2
390
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm2 = xmm2 [1,3,2,3]
391
- ; CHECK-SSE2-NEXT: punpckldq {{.*#+}} xmm1 = xmm1 [0],xmm2 [0],xmm1 [1],xmm2 [1]
392
- ; CHECK-SSE2-NEXT: movdqa %xmm1 , %xmm2
393
- ; CHECK-SSE2-NEXT: psrld $2, %xmm2
388
+ ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1 [1,1,3,3]
389
+ ; CHECK-SSE2-NEXT: pmuludq %xmm4, %xmm1
390
+ ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1 [1,3,2,3]
391
+ ; CHECK-SSE2-NEXT: punpckldq {{.*#+}} xmm2 = xmm2 [0],xmm1 [0],xmm2 [1],xmm1 [1]
392
+ ; CHECK-SSE2-NEXT: movdqa %xmm2 , %xmm1
393
+ ; CHECK-SSE2-NEXT: psrld $2, %xmm1
394
394
; CHECK-SSE2-NEXT: movdqa %xmm0, %xmm3
395
- ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm3 = xmm3[1,0],xmm2 [0,0]
396
- ; CHECK-SSE2-NEXT: psrld $3, %xmm1
397
- ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm3 = xmm3[2,0],xmm1 [2,3]
398
- ; CHECK-SSE2-NEXT: movdqa {{.*#+}} xmm1 = [6,1,12,14]
399
- ; CHECK-SSE2-NEXT: pmuludq %xmm1 , %xmm3
395
+ ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm3 = xmm3[1,0],xmm1 [0,0]
396
+ ; CHECK-SSE2-NEXT: psrld $3, %xmm2
397
+ ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm3 = xmm3[2,0],xmm2 [2,3]
398
+ ; CHECK-SSE2-NEXT: movdqa {{.*#+}} xmm2 = [6,1,12,14]
399
+ ; CHECK-SSE2-NEXT: pmuludq %xmm2 , %xmm3
400
400
; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm3 = xmm3[0,2,2,3]
401
401
; CHECK-SSE2-NEXT: movdqa %xmm0, %xmm4
402
- ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm4 = xmm4[1,1],xmm2 [3,3]
403
- ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1 [1,1,3,3]
402
+ ; CHECK-SSE2-NEXT: shufps {{.*#+}} xmm4 = xmm4[1,1],xmm1 [3,3]
403
+ ; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm2 [1,1,3,3]
404
404
; CHECK-SSE2-NEXT: pmuludq %xmm4, %xmm1
405
405
; CHECK-SSE2-NEXT: pshufd {{.*#+}} xmm1 = xmm1[0,2,2,3]
406
406
; CHECK-SSE2-NEXT: punpckldq {{.*#+}} xmm3 = xmm3[0],xmm1[0],xmm3[1],xmm1[1]
0 commit comments