@@ -2280,11 +2280,11 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2280
2280
; CHECK-SSE41-NEXT: movdqa %xmm0, %xmm4
2281
2281
; CHECK-SSE41-NEXT: movq %rdi, %rax
2282
2282
; CHECK-SSE41-NEXT: movdqa %xmm1, %xmm0
2283
- ; CHECK-SSE41-NEXT: pmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
2283
+ ; CHECK-SSE41-NEXT: pmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 # [171,0,183,0,61,0,127,0,9,0,41,0,1,0,161,0]
2284
2284
; CHECK-SSE41-NEXT: pmovzxbw {{.*#+}} xmm5 = [255,255,255,255,255,255,255,255]
2285
2285
; CHECK-SSE41-NEXT: pand %xmm5, %xmm0
2286
2286
; CHECK-SSE41-NEXT: movdqa %xmm1, %xmm6
2287
- ; CHECK-SSE41-NEXT: pmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm6
2287
+ ; CHECK-SSE41-NEXT: pmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm6 # [0,103,0,171,0,1,0,183,0,0,0,183,0,1,0,221]
2288
2288
; CHECK-SSE41-NEXT: psllw $8, %xmm6
2289
2289
; CHECK-SSE41-NEXT: por %xmm0, %xmm6
2290
2290
; CHECK-SSE41-NEXT: paddb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm6
@@ -2307,9 +2307,9 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2307
2307
; CHECK-SSE41-NEXT: movaps {{.*#+}} xmm0 = [255,255,255,255,255,0,255,255,255,255,255,255,255,255,255,255]
2308
2308
; CHECK-SSE41-NEXT: pblendvb %xmm0, %xmm7, %xmm1
2309
2309
; CHECK-SSE41-NEXT: movdqa %xmm4, %xmm0
2310
- ; CHECK-SSE41-NEXT: pmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0
2310
+ ; CHECK-SSE41-NEXT: pmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0 # [197,0,27,0,1,0,1,0,223,0,205,0,161,0,171,0]
2311
2311
; CHECK-SSE41-NEXT: pand %xmm5, %xmm0
2312
- ; CHECK-SSE41-NEXT: pmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm4
2312
+ ; CHECK-SSE41-NEXT: pmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm4 # [0,205,0,241,0,1,0,163,0,223,0,183,0,1,0,239]
2313
2313
; CHECK-SSE41-NEXT: psllw $8, %xmm4
2314
2314
; CHECK-SSE41-NEXT: por %xmm0, %xmm4
2315
2315
; CHECK-SSE41-NEXT: paddb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm4
@@ -2345,10 +2345,10 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2345
2345
; CHECK-AVX1-NEXT: vpmulhw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm4, %xmm4 # [20224,26368,6912,30976,33024,33024,33024,12032]
2346
2346
; CHECK-AVX1-NEXT: vpsrlw $8, %xmm4, %xmm4
2347
2347
; CHECK-AVX1-NEXT: vpackuswb %xmm3, %xmm4, %xmm4
2348
- ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm5
2348
+ ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm5 # [0,0,0,0,1,0,1,0,1,0,0,0,0,0,0,0]
2349
2349
; CHECK-AVX1-NEXT: vbroadcastss {{.*#+}} xmm3 = [255,255,255,255,255,255,255,255]
2350
2350
; CHECK-AVX1-NEXT: vpand %xmm3, %xmm5, %xmm5
2351
- ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm6
2351
+ ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm6 # [0,0,0,0,0,1,0,0,0,1,0,1,0,1,0,1]
2352
2352
; CHECK-AVX1-NEXT: vpsllw $8, %xmm6, %xmm6
2353
2353
; CHECK-AVX1-NEXT: vpor %xmm6, %xmm5, %xmm5
2354
2354
; CHECK-AVX1-NEXT: vpaddb %xmm5, %xmm4, %xmm4
@@ -2365,9 +2365,9 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2365
2365
; CHECK-AVX1-NEXT: vbroadcastss {{.*#+}} xmm5 = [1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1]
2366
2366
; CHECK-AVX1-NEXT: vpand %xmm5, %xmm4, %xmm4
2367
2367
; CHECK-AVX1-NEXT: vpaddb %xmm4, %xmm6, %xmm4
2368
- ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm4, %xmm6
2368
+ ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm4, %xmm6 # [13,0,19,0,2,0,2,0,62,0,5,0,97,0,3,0]
2369
2369
; CHECK-AVX1-NEXT: vpand %xmm3, %xmm6, %xmm6
2370
- ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm4, %xmm4
2370
+ ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm4, %xmm4 # [0,5,0,34,0,8,0,88,0,62,0,7,0,2,0,60]
2371
2371
; CHECK-AVX1-NEXT: vpsllw $8, %xmm4, %xmm4
2372
2372
; CHECK-AVX1-NEXT: vpor %xmm4, %xmm6, %xmm4
2373
2373
; CHECK-AVX1-NEXT: vpsubb %xmm4, %xmm0, %xmm4
@@ -2379,9 +2379,9 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2379
2379
; CHECK-AVX1-NEXT: vpmulhw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm7, %xmm7 # [22016,24320,37632,11008,12544,32512,16640,37632]
2380
2380
; CHECK-AVX1-NEXT: vpsrlw $8, %xmm7, %xmm7
2381
2381
; CHECK-AVX1-NEXT: vpackuswb %xmm6, %xmm7, %xmm6
2382
- ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm7
2382
+ ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm7 # [0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0]
2383
2383
; CHECK-AVX1-NEXT: vpand %xmm3, %xmm7, %xmm7
2384
- ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm8
2384
+ ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm8 # [0,0,0,0,0,255,0,1,0,1,0,1,0,1,0,1]
2385
2385
; CHECK-AVX1-NEXT: vpsllw $8, %xmm8, %xmm8
2386
2386
; CHECK-AVX1-NEXT: vpor %xmm7, %xmm8, %xmm7
2387
2387
; CHECK-AVX1-NEXT: vpaddb %xmm7, %xmm6, %xmm6
@@ -2398,9 +2398,9 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2398
2398
; CHECK-AVX1-NEXT: vpand {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm6, %xmm6
2399
2399
; CHECK-AVX1-NEXT: vpand %xmm5, %xmm6, %xmm5
2400
2400
; CHECK-AVX1-NEXT: vpaddb %xmm5, %xmm7, %xmm5
2401
- ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm5, %xmm6
2401
+ ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm5, %xmm6 # [3,0,7,0,84,0,127,0,114,0,50,0,2,0,97,0]
2402
2402
; CHECK-AVX1-NEXT: vpand %xmm3, %xmm6, %xmm3
2403
- ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm5, %xmm5
2403
+ ; CHECK-AVX1-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm5, %xmm5 # [0,87,0,6,0,128,0,56,0,1,0,7,0,8,0,117]
2404
2404
; CHECK-AVX1-NEXT: vpsllw $8, %xmm5, %xmm5
2405
2405
; CHECK-AVX1-NEXT: vpor %xmm5, %xmm3, %xmm3
2406
2406
; CHECK-AVX1-NEXT: vpsubb %xmm3, %xmm0, %xmm0
@@ -2427,10 +2427,10 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2427
2427
; CHECK-AVX2-NEXT: vpmulhw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm4, %ymm4 # [20224,26368,6912,30976,33024,33024,33024,12032,22016,24320,37632,11008,12544,32512,16640,37632]
2428
2428
; CHECK-AVX2-NEXT: vpsrlw $8, %ymm4, %ymm4
2429
2429
; CHECK-AVX2-NEXT: vpackuswb %ymm3, %ymm4, %ymm3
2430
- ; CHECK-AVX2-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm0, %ymm4
2430
+ ; CHECK-AVX2-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm0, %ymm4 # [0,0,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0]
2431
2431
; CHECK-AVX2-NEXT: vpbroadcastw {{.*#+}} ymm5 = [255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255]
2432
2432
; CHECK-AVX2-NEXT: vpand %ymm5, %ymm4, %ymm4
2433
- ; CHECK-AVX2-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm0, %ymm6
2433
+ ; CHECK-AVX2-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm0, %ymm6 # [0,0,0,0,0,1,0,0,0,1,0,1,0,1,0,1,0,0,0,0,0,255,0,1,0,1,0,1,0,1,0,1]
2434
2434
; CHECK-AVX2-NEXT: vpsllw $8, %ymm6, %ymm6
2435
2435
; CHECK-AVX2-NEXT: vpor %ymm6, %ymm4, %ymm4
2436
2436
; CHECK-AVX2-NEXT: vpaddb %ymm4, %ymm3, %ymm3
@@ -2447,9 +2447,9 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2447
2447
; CHECK-AVX2-NEXT: vpand {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm3, %ymm3
2448
2448
; CHECK-AVX2-NEXT: vpand {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm3, %ymm3
2449
2449
; CHECK-AVX2-NEXT: vpaddb %ymm3, %ymm4, %ymm3
2450
- ; CHECK-AVX2-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm3, %ymm4
2450
+ ; CHECK-AVX2-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm3, %ymm4 # [13,0,19,0,2,0,2,0,62,0,5,0,97,0,3,0,3,0,7,0,84,0,127,0,114,0,50,0,2,0,97,0]
2451
2451
; CHECK-AVX2-NEXT: vpand %ymm5, %ymm4, %ymm4
2452
- ; CHECK-AVX2-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm3, %ymm3
2452
+ ; CHECK-AVX2-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm3, %ymm3 # [0,5,0,34,0,8,0,88,0,62,0,7,0,2,0,60,0,87,0,6,0,128,0,56,0,1,0,7,0,8,0,117]
2453
2453
; CHECK-AVX2-NEXT: vpsllw $8, %ymm3, %ymm3
2454
2454
; CHECK-AVX2-NEXT: vpor %ymm3, %ymm4, %ymm3
2455
2455
; CHECK-AVX2-NEXT: vpsubb %ymm3, %ymm0, %ymm0
@@ -2462,8 +2462,8 @@ define <32 x i1> @pr51133(<32 x i8> %x, <32 x i8> %y) {
2462
2462
;
2463
2463
; CHECK-AVX512VL-LABEL: pr51133:
2464
2464
; CHECK-AVX512VL: # %bb.0:
2465
- ; CHECK-AVX512VL-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm0, %ymm2
2466
- ; CHECK-AVX512VL-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm0, %ymm3
2465
+ ; CHECK-AVX512VL-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm0, %ymm2 # [197,0,27,0,1,0,1,0,223,0,205,0,161,0,171,0,171,0,183,0,61,0,127,0,9,0,41,0,1,0,161,0]
2466
+ ; CHECK-AVX512VL-NEXT: vpmaddubsw {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm0, %ymm3 # [0,205,0,241,0,1,0,163,0,223,0,183,0,1,0,239,0,103,0,171,0,1,0,183,0,0,0,183,0,1,0,221]
2467
2467
; CHECK-AVX512VL-NEXT: vpsllw $8, %ymm3, %ymm3
2468
2468
; CHECK-AVX512VL-NEXT: vpternlogd $248, {{\.?LCPI[0-9]+_[0-9]+}}(%rip){1to8}, %ymm2, %ymm3
2469
2469
; CHECK-AVX512VL-NEXT: vpaddb {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %ymm3, %ymm2
0 commit comments