|
36 | 36 | ; CHECK-NEXT: vlda wh7, [p4, #352]; vshift.align x0, x0, s0, x8, r3
|
37 | 37 | ; CHECK-NEXT: vlda wl7, [p4, #320]; movxm le, #.L_LEnd0
|
38 | 38 | ; CHECK-NEXT: nopb ; vlda wh9, [p4, #416]; nops ; nopx ; vshift.align x2, x2, s0, x10, r3; nopv
|
39 |
| - ; CHECK-NEXT: nopb ; vlda wl9, [p4, #384]; nops ; nopx ; vshuffle x5, x0, x2, r25; nopv |
40 |
| - ; CHECK-NEXT: nopb ; vlda wh11, [p4, #480]; nops ; nopx ; vshift.align x4, x4, s0, x1, r3; nopv |
41 |
| - ; CHECK-NEXT: nopb ; vlda wl11, [p4, #448]; nops ; nopx ; vshuffle x8, x0, x2, r9; nopv |
42 |
| - ; CHECK-NEXT: vldb wh5, [p5, #32]; nopa ; nops ; nopx ; vshift.align x6, x6, s0, x3, r3; nopv |
43 |
| - ; CHECK-NEXT: nopb ; vlda wl5, [p5], #256; nops ; nopx ; vshuffle x3, x4, x6, r9; nopv |
| 39 | + ; CHECK-NEXT: nopb ; vlda wl9, [p4, #384]; nops ; nopx ; vshuffle x8, x0, x2, r9; nopv |
| 40 | + ; CHECK-NEXT: vldb wh5, [p5, #32]; nopa ; nops ; nopx ; vshift.align x4, x4, s0, x1, r3; nopv |
| 41 | + ; CHECK-NEXT: nopb ; vlda wl5, [p5], #256; nops ; nopx ; vshuffle x5, x0, x2, r25; nopv |
| 42 | + ; CHECK-NEXT: nopb ; vlda wh11, [p4, #480]; nops ; nopx ; vshift.align x6, x6, s0, x3, r3; nopv |
| 43 | + ; CHECK-NEXT: nopb ; vlda wl11, [p4, #448]; nops ; nopx ; vshuffle x3, x4, x6, r9; nopv |
44 | 44 | ; CHECK-NEXT: nopb ; nopa ; nops ; nopx ; vshuffle x10, x4, x6, r25; vmac.f bml4, bml4, x8, x7, r29
|
45 | 45 | ; CHECK-NEXT: nopa ; vshuffle x1, x3, x5, r13
|
46 | 46 | ; CHECK-NEXT: vshuffle x3, x3, x5, r24; vmac.f bmh1, bmh1, x8, x9, r29
|
47 | 47 | ; CHECK-NEXT: mov r3, p0; vmac.f bmh0, bmh0, x1, x9, r29
|
48 |
| - ; CHECK-NEXT: and r3, r3, r0; mov p4, p7; vmac.f bmh3, bmh3, x3, x9, r29 |
49 |
| - ; CHECK-NEXT: add r3, r3, #34; vmac.f bmh2, bmh2, x10, x9, r29 |
50 |
| - ; CHECK-NEXT: vmac.f bmh7, bmh7, x8, x5, r29 |
51 |
| - ; CHECK-NEXT: vmac.f bmh5, bmh5, x1, x5, r29 |
| 48 | + ; CHECK-NEXT: and r3, r3, r0; mov p4, p7; vmac.f bmh7, bmh7, x8, x5, r29 |
| 49 | + ; CHECK-NEXT: add r3, r3, #34; vmac.f bmh5, bmh5, x1, x5, r29 |
| 50 | + ; CHECK-NEXT: vmac.f bml2, bml2, x3, x5, r29 |
| 51 | + ; CHECK-NEXT: vmac.f bml0, bml0, x10, x5, r29 |
52 | 52 | ; CHECK-NEXT: .p2align 4
|
53 | 53 | ; CHECK-NEXT: .LBB0_2: // %for.body
|
54 | 54 | ; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
|
55 |
| - ; CHECK-NEXT: vldb wh8, [p0, #32]; nopa ; nops ; nopx ; mov p7, p5; vmac.f bml2, bml2, x3, x5, r29 |
56 |
| - ; CHECK-NEXT: nopa ; vldb wl8, [p0], m4; nopx ; vmac.f bml0, bml0, x10, x5, r29 |
| 55 | + ; CHECK-NEXT: vldb wh8, [p0, #32]; nopa ; nops ; nopx ; mov p7, p5; vmac.f bmh3, bmh3, x3, x9, r29 |
| 56 | + ; CHECK-NEXT: nopa ; vldb wl8, [p0], m4; nopx ; vmac.f bmh2, bmh2, x10, x9, r29 |
57 | 57 | ; CHECK-NEXT: vldb wh10, [p0, #32]; vmac.f bml3, bml3, x1, x7, r29
|
58 | 58 | ; CHECK-NEXT: vldb wl10, [p0], m4; vmac.f bml6, bml6, x3, x7, r29
|
59 | 59 | ; CHECK-NEXT: vldb wh1, [p0, #32]; vmac.f bml5, bml5, x10, x7, r29
|
|
63 | 63 | ; CHECK-NEXT: vlda wh7, [p4, #352]; vshift.align x0, x0, s0, x8, r3; vmac.f bmh8, bmh8, x10, x11, r29
|
64 | 64 | ; CHECK-NEXT: vlda wl7, [p4, #320]
|
65 | 65 | ; CHECK-NEXT: vlda wh9, [p4, #416]; vshift.align x2, x2, s0, x10, r3
|
66 |
| - ; CHECK-NEXT: vlda wl9, [p4, #384]; vshuffle x5, x0, x2, r25 |
67 |
| - ; CHECK-NEXT: vlda wh11, [p4, #480]; vshift.align x4, x4, s0, x1, r3 |
68 |
| - ; CHECK-NEXT: vlda wl11, [p4, #448]; vshuffle x8, x0, x2, r9 |
69 |
| - ; CHECK-NEXT: vldb wh5, [p5, #32]; vshift.align x6, x6, s0, x3, r3 |
70 |
| - ; CHECK-NEXT: vlda wl5, [p5], #256; vshuffle x3, x4, x6, r9 |
| 66 | + ; CHECK-NEXT: vlda wl9, [p4, #384]; vshuffle x8, x0, x2, r9 |
| 67 | + ; CHECK-NEXT: vldb wh5, [p5, #32]; vshift.align x4, x4, s0, x1, r3 |
| 68 | + ; CHECK-NEXT: vlda wl5, [p5], #256; vshuffle x5, x0, x2, r25 |
| 69 | + ; CHECK-NEXT: vlda wh11, [p4, #480]; vshift.align x6, x6, s0, x3, r3 |
| 70 | + ; CHECK-NEXT: vlda wl11, [p4, #448]; vshuffle x3, x4, x6, r9 |
71 | 71 | ; CHECK-NEXT: vshuffle x10, x4, x6, r25; vmac.f bml4, bml4, x8, x7, r29
|
72 | 72 | ; CHECK-NEXT: vshuffle x1, x3, x5, r13
|
73 | 73 | ; CHECK-NEXT: vshuffle x3, x3, x5, r24; vmac.f bmh1, bmh1, x8, x9, r29
|
74 | 74 | ; CHECK-NEXT: mov r3, p0; vmac.f bmh0, bmh0, x1, x9, r29
|
75 |
| - ; CHECK-NEXT: and r3, r3, r0; mov p4, p7; vmac.f bmh3, bmh3, x3, x9, r29 |
76 |
| - ; CHECK-NEXT: add r3, r3, #34; vmac.f bmh2, bmh2, x10, x9, r29 |
77 |
| - ; CHECK-NEXT: vmac.f bmh7, bmh7, x8, x5, r29 |
| 75 | + ; CHECK-NEXT: and r3, r3, r0; mov p4, p7; vmac.f bmh7, bmh7, x8, x5, r29 |
| 76 | + ; CHECK-NEXT: add r3, r3, #34; vmac.f bmh5, bmh5, x1, x5, r29 |
| 77 | + ; CHECK-NEXT: vmac.f bml2, bml2, x3, x5, r29 |
78 | 78 | ; CHECK-NEXT: .L_LEnd0:
|
79 |
| - ; CHECK-NEXT: nopb ; nopa ; nops ; nopxm ; vmac.f bmh5, bmh5, x1, x5, r29 |
| 79 | + ; CHECK-NEXT: nopb ; nopa ; nops ; nopxm ; vmac.f bml0, bml0, x10, x5, r29 |
80 | 80 | ; CHECK-NEXT: // %bb.3: // %for.cond.cleanup
|
81 |
| - ; CHECK-NEXT: nopb ; nopa ; nops ; nopxm ; vmac.f bml2, bml2, x3, x5, r29 |
82 |
| - ; CHECK-NEXT: vmac.f bml0, bml0, x10, x5, r29 |
| 81 | + ; CHECK-NEXT: nopb ; nopa ; nops ; nopxm ; vmac.f bmh3, bmh3, x3, x9, r29 |
| 82 | + ; CHECK-NEXT: vmac.f bmh2, bmh2, x10, x9, r29 |
83 | 83 | ; CHECK-NEXT: vmac.f bml3, bml3, x1, x7, r29
|
84 | 84 | ; CHECK-NEXT: vmac.f bml6, bml6, x3, x7, r29
|
85 | 85 | ; CHECK-NEXT: vmac.f bml5, bml5, x10, x7, r29
|
|
0 commit comments