@@ -397,45 +397,45 @@ define <vscale x 4 x i64> @usdot_8to64(<vscale x 4 x i64> %acc, <vscale x 16 x i
397
397
; CHECK-NEWLOWERING-NEXT: .cfi_offset w29, -16
398
398
; CHECK-NEWLOWERING-NEXT: .cfi_escape 0x10, 0x48, 0x0a, 0x11, 0x70, 0x22, 0x11, 0x78, 0x92, 0x2e, 0x00, 0x1e, 0x22 // $d8 @ cfa - 16 - 8 * VG
399
399
; CHECK-NEWLOWERING-NEXT: .cfi_escape 0x10, 0x49, 0x0a, 0x11, 0x70, 0x22, 0x11, 0x70, 0x92, 0x2e, 0x00, 0x1e, 0x22 // $d9 @ cfa - 16 - 16 * VG
400
- ; CHECK-NEWLOWERING-NEXT: uunpklo z4.h, z2.b
400
+ ; CHECK-NEWLOWERING-NEXT: uunpkhi z4.h, z2.b
401
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z2.h, z2.b
401
402
; CHECK-NEWLOWERING-NEXT: sunpklo z5.h, z3.b
402
- ; CHECK-NEWLOWERING-NEXT: uunpkhi z2.h, z2.b
403
403
; CHECK-NEWLOWERING-NEXT: sunpkhi z3.h, z3.b
404
404
; CHECK-NEWLOWERING-NEXT: ptrue p0.d
405
405
; CHECK-NEWLOWERING-NEXT: uunpklo z6.s, z4.h
406
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z7.s, z2.h
407
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z24.s, z5.h
408
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z25.s, z3.h
406
409
; CHECK-NEWLOWERING-NEXT: uunpkhi z4.s, z4.h
407
- ; CHECK-NEWLOWERING-NEXT: sunpklo z7.s, z5.h
408
- ; CHECK-NEWLOWERING-NEXT: sunpkhi z5.s, z5.h
409
- ; CHECK-NEWLOWERING-NEXT: uunpklo z24.s, z2.h
410
410
; CHECK-NEWLOWERING-NEXT: uunpkhi z2.s, z2.h
411
- ; CHECK-NEWLOWERING-NEXT: sunpklo z25.s, z3.h
412
411
; CHECK-NEWLOWERING-NEXT: sunpkhi z3.s, z3.h
413
- ; CHECK-NEWLOWERING-NEXT: uunpkhi z26.d, z6.s
414
- ; CHECK-NEWLOWERING-NEXT: uunpklo z6.d, z6.s
415
- ; CHECK-NEWLOWERING-NEXT: uunpklo z27.d, z4.s
416
- ; CHECK-NEWLOWERING-NEXT: sunpklo z28.d, z7.s
417
- ; CHECK-NEWLOWERING-NEXT: sunpklo z29.d, z5.s
412
+ ; CHECK-NEWLOWERING-NEXT: sunpkhi z5.s, z5.h
413
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z26.d, z6.s
414
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z27.d, z7.s
415
+ ; CHECK-NEWLOWERING-NEXT: uunpkhi z7.d, z7.s
416
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z28.d, z24.s
417
+ ; CHECK-NEWLOWERING-NEXT: sunpkhi z24.d, z24.s
418
+ ; CHECK-NEWLOWERING-NEXT: uunpkhi z6.d, z6.s
419
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z29.d, z25.s
420
+ ; CHECK-NEWLOWERING-NEXT: sunpkhi z25.d, z25.s
421
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z30.d, z4.s
418
422
; CHECK-NEWLOWERING-NEXT: uunpkhi z4.d, z4.s
419
- ; CHECK-NEWLOWERING-NEXT: sunpkhi z7.d, z7.s
423
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z31.d, z2.s
424
+ ; CHECK-NEWLOWERING-NEXT: uunpkhi z2.d, z2.s
425
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z8.d, z3.s
426
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z9.d, z5.s
420
427
; CHECK-NEWLOWERING-NEXT: sunpkhi z5.d, z5.s
421
- ; CHECK-NEWLOWERING-NEXT: uunpkhi z30.d, z24.s
422
- ; CHECK-NEWLOWERING-NEXT: uunpkhi z31.d, z2.s
423
- ; CHECK-NEWLOWERING-NEXT: uunpklo z24.d, z24.s
424
- ; CHECK-NEWLOWERING-NEXT: uunpklo z2.d, z2.s
425
- ; CHECK-NEWLOWERING-NEXT: sunpkhi z8.d, z25.s
426
- ; CHECK-NEWLOWERING-NEXT: sunpklo z25.d, z25.s
427
- ; CHECK-NEWLOWERING-NEXT: sunpklo z9.d, z3.s
428
- ; CHECK-NEWLOWERING-NEXT: mul z27.d, z27.d, z29.d
429
- ; CHECK-NEWLOWERING-NEXT: mla z0.d, p0/m, z6.d, z28.d
428
+ ; CHECK-NEWLOWERING-NEXT: mul z7.d, z7.d, z24.d
429
+ ; CHECK-NEWLOWERING-NEXT: mla z0.d, p0/m, z27.d, z28.d
430
430
; CHECK-NEWLOWERING-NEXT: sunpkhi z3.d, z3.s
431
- ; CHECK-NEWLOWERING-NEXT: mul z4.d, z4.d, z5.d
432
- ; CHECK-NEWLOWERING-NEXT: mla z1.d, p0/m, z26.d, z7.d
433
- ; CHECK-NEWLOWERING-NEXT: mla z0.d, p0/m, z2.d, z9.d
434
- ; CHECK-NEWLOWERING-NEXT: movprfx z2, z27
435
- ; CHECK-NEWLOWERING-NEXT: mla z2.d, p0/m, z24.d, z25.d
431
+ ; CHECK-NEWLOWERING-NEXT: mul z6.d, z6.d, z25.d
432
+ ; CHECK-NEWLOWERING-NEXT: mla z1.d, p0/m, z26.d, z29.d
433
+ ; CHECK-NEWLOWERING-NEXT: mla z0.d, p0/m, z2.d, z5.d
434
+ ; CHECK-NEWLOWERING-NEXT: movprfx z2, z7
435
+ ; CHECK-NEWLOWERING-NEXT: mla z2.d, p0/m, z31.d, z9.d
436
436
; CHECK-NEWLOWERING-NEXT: ldr z9, [sp] // 16-byte Folded Reload
437
- ; CHECK-NEWLOWERING-NEXT: mla z1.d, p0/m, z31.d, z3.d
438
- ; CHECK-NEWLOWERING-NEXT: movprfx z3, z4
437
+ ; CHECK-NEWLOWERING-NEXT: mla z1.d, p0/m, z4.d, z3.d
438
+ ; CHECK-NEWLOWERING-NEXT: movprfx z3, z6
439
439
; CHECK-NEWLOWERING-NEXT: mla z3.d, p0/m, z30.d, z8.d
440
440
; CHECK-NEWLOWERING-NEXT: ldr z8, [sp, #1, mul vl] // 16-byte Folded Reload
441
441
; CHECK-NEWLOWERING-NEXT: add z0.d, z2.d, z0.d
@@ -530,45 +530,45 @@ define <vscale x 4 x i64> @sudot_8to64(<vscale x 4 x i64> %acc, <vscale x 16 x i
530
530
; CHECK-NEWLOWERING-NEXT: .cfi_offset w29, -16
531
531
; CHECK-NEWLOWERING-NEXT: .cfi_escape 0x10, 0x48, 0x0a, 0x11, 0x70, 0x22, 0x11, 0x78, 0x92, 0x2e, 0x00, 0x1e, 0x22 // $d8 @ cfa - 16 - 8 * VG
532
532
; CHECK-NEWLOWERING-NEXT: .cfi_escape 0x10, 0x49, 0x0a, 0x11, 0x70, 0x22, 0x11, 0x70, 0x92, 0x2e, 0x00, 0x1e, 0x22 // $d9 @ cfa - 16 - 16 * VG
533
- ; CHECK-NEWLOWERING-NEXT: sunpklo z4.h, z2.b
533
+ ; CHECK-NEWLOWERING-NEXT: sunpkhi z4.h, z2.b
534
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z2.h, z2.b
534
535
; CHECK-NEWLOWERING-NEXT: uunpklo z5.h, z3.b
535
- ; CHECK-NEWLOWERING-NEXT: sunpkhi z2.h, z2.b
536
536
; CHECK-NEWLOWERING-NEXT: uunpkhi z3.h, z3.b
537
537
; CHECK-NEWLOWERING-NEXT: ptrue p0.d
538
538
; CHECK-NEWLOWERING-NEXT: sunpklo z6.s, z4.h
539
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z7.s, z2.h
540
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z24.s, z5.h
541
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z25.s, z3.h
539
542
; CHECK-NEWLOWERING-NEXT: sunpkhi z4.s, z4.h
540
- ; CHECK-NEWLOWERING-NEXT: uunpklo z7.s, z5.h
541
- ; CHECK-NEWLOWERING-NEXT: uunpkhi z5.s, z5.h
542
- ; CHECK-NEWLOWERING-NEXT: sunpklo z24.s, z2.h
543
543
; CHECK-NEWLOWERING-NEXT: sunpkhi z2.s, z2.h
544
- ; CHECK-NEWLOWERING-NEXT: uunpklo z25.s, z3.h
545
544
; CHECK-NEWLOWERING-NEXT: uunpkhi z3.s, z3.h
546
- ; CHECK-NEWLOWERING-NEXT: sunpkhi z26.d, z6.s
547
- ; CHECK-NEWLOWERING-NEXT: sunpklo z6.d, z6.s
548
- ; CHECK-NEWLOWERING-NEXT: sunpklo z27.d, z4.s
549
- ; CHECK-NEWLOWERING-NEXT: uunpklo z28.d, z7.s
550
- ; CHECK-NEWLOWERING-NEXT: uunpklo z29.d, z5.s
545
+ ; CHECK-NEWLOWERING-NEXT: uunpkhi z5.s, z5.h
546
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z26.d, z6.s
547
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z27.d, z7.s
548
+ ; CHECK-NEWLOWERING-NEXT: sunpkhi z7.d, z7.s
549
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z28.d, z24.s
550
+ ; CHECK-NEWLOWERING-NEXT: uunpkhi z24.d, z24.s
551
+ ; CHECK-NEWLOWERING-NEXT: sunpkhi z6.d, z6.s
552
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z29.d, z25.s
553
+ ; CHECK-NEWLOWERING-NEXT: uunpkhi z25.d, z25.s
554
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z30.d, z4.s
551
555
; CHECK-NEWLOWERING-NEXT: sunpkhi z4.d, z4.s
552
- ; CHECK-NEWLOWERING-NEXT: uunpkhi z7.d, z7.s
556
+ ; CHECK-NEWLOWERING-NEXT: sunpklo z31.d, z2.s
557
+ ; CHECK-NEWLOWERING-NEXT: sunpkhi z2.d, z2.s
558
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z8.d, z3.s
559
+ ; CHECK-NEWLOWERING-NEXT: uunpklo z9.d, z5.s
553
560
; CHECK-NEWLOWERING-NEXT: uunpkhi z5.d, z5.s
554
- ; CHECK-NEWLOWERING-NEXT: sunpkhi z30.d, z24.s
555
- ; CHECK-NEWLOWERING-NEXT: sunpkhi z31.d, z2.s
556
- ; CHECK-NEWLOWERING-NEXT: sunpklo z24.d, z24.s
557
- ; CHECK-NEWLOWERING-NEXT: sunpklo z2.d, z2.s
558
- ; CHECK-NEWLOWERING-NEXT: uunpkhi z8.d, z25.s
559
- ; CHECK-NEWLOWERING-NEXT: uunpklo z25.d, z25.s
560
- ; CHECK-NEWLOWERING-NEXT: uunpklo z9.d, z3.s
561
- ; CHECK-NEWLOWERING-NEXT: mul z27.d, z27.d, z29.d
562
- ; CHECK-NEWLOWERING-NEXT: mla z0.d, p0/m, z6.d, z28.d
561
+ ; CHECK-NEWLOWERING-NEXT: mul z7.d, z7.d, z24.d
562
+ ; CHECK-NEWLOWERING-NEXT: mla z0.d, p0/m, z27.d, z28.d
563
563
; CHECK-NEWLOWERING-NEXT: uunpkhi z3.d, z3.s
564
- ; CHECK-NEWLOWERING-NEXT: mul z4.d, z4.d, z5.d
565
- ; CHECK-NEWLOWERING-NEXT: mla z1.d, p0/m, z26.d, z7.d
566
- ; CHECK-NEWLOWERING-NEXT: mla z0.d, p0/m, z2.d, z9.d
567
- ; CHECK-NEWLOWERING-NEXT: movprfx z2, z27
568
- ; CHECK-NEWLOWERING-NEXT: mla z2.d, p0/m, z24.d, z25.d
564
+ ; CHECK-NEWLOWERING-NEXT: mul z6.d, z6.d, z25.d
565
+ ; CHECK-NEWLOWERING-NEXT: mla z1.d, p0/m, z26.d, z29.d
566
+ ; CHECK-NEWLOWERING-NEXT: mla z0.d, p0/m, z2.d, z5.d
567
+ ; CHECK-NEWLOWERING-NEXT: movprfx z2, z7
568
+ ; CHECK-NEWLOWERING-NEXT: mla z2.d, p0/m, z31.d, z9.d
569
569
; CHECK-NEWLOWERING-NEXT: ldr z9, [sp] // 16-byte Folded Reload
570
- ; CHECK-NEWLOWERING-NEXT: mla z1.d, p0/m, z31.d, z3.d
571
- ; CHECK-NEWLOWERING-NEXT: movprfx z3, z4
570
+ ; CHECK-NEWLOWERING-NEXT: mla z1.d, p0/m, z4.d, z3.d
571
+ ; CHECK-NEWLOWERING-NEXT: movprfx z3, z6
572
572
; CHECK-NEWLOWERING-NEXT: mla z3.d, p0/m, z30.d, z8.d
573
573
; CHECK-NEWLOWERING-NEXT: ldr z8, [sp, #1, mul vl] // 16-byte Folded Reload
574
574
; CHECK-NEWLOWERING-NEXT: add z0.d, z2.d, z0.d
0 commit comments