| 1 | #include <cstdint> |
| 2 | |
| 3 | struct alignas(16) vec_t { |
| 4 | uint64_t a, b; |
| 5 | }; |
| 6 | |
| 7 | int main() { |
| 8 | constexpr uint64_t gprs[] = { |
| 9 | 0x0001020304050607, |
| 10 | 0x1011121314151617, |
| 11 | 0x2021222324252627, |
| 12 | 0x3031323334353637, |
| 13 | 0x4041424344454647, |
| 14 | 0x5051525354555657, |
| 15 | 0x6061626364656667, |
| 16 | 0x7071727374757677, |
| 17 | }; |
| 18 | |
| 19 | constexpr vec_t vecs[] = { |
| 20 | { .a: 0x0F0E0D0C0B0A0908, .b: 0x1716151413121110, }, |
| 21 | { .a: 0x100F0E0D0C0B0A09, .b: 0x1817161514131211, }, |
| 22 | { .a: 0x11100F0E0D0C0B0A, .b: 0x1918171615141312, }, |
| 23 | { .a: 0x1211100F0E0D0C0B, .b: 0x1A19181716151413, }, |
| 24 | { .a: 0x131211100F0E0D0C, .b: 0x1B1A191817161514, }, |
| 25 | { .a: 0x14131211100F0E0D, .b: 0x1C1B1A1918171615, }, |
| 26 | { .a: 0x1514131211100F0E, .b: 0x1D1C1B1A19181716, }, |
| 27 | { .a: 0x161514131211100F, .b: 0x1E1D1C1B1A191817, }, |
| 28 | }; |
| 29 | |
| 30 | asm volatile( |
| 31 | "ldp x0, x1, [%0]\n\t" |
| 32 | "ldp x2, x3, [%0, #16]\n\t" |
| 33 | "ldp x4, x5, [%0, #32]\n\t" |
| 34 | "ldp x6, x7, [%0, #48]\n\t" |
| 35 | "\n\t" |
| 36 | "ld1 {v0.2d, v1.2d, v2.2d, v3.2d}, [%1], #64\n\t" |
| 37 | "ld1 {v4.2d, v5.2d, v6.2d, v7.2d}, [%1], #64\n\t" |
| 38 | "\n\t" |
| 39 | "brk #0\n\t" |
| 40 | : |
| 41 | : "r" (gprs), "r" (vecs) |
| 42 | : "x0" , "x1" , "x2" , "x3" , "x4" , "x5" , "x6" , "x7" , |
| 43 | "v0" , "v1" , "v2" , "v3" , "v4" , "v5" , "v6" , "v7" |
| 44 | ); |
| 45 | |
| 46 | return 0; |
| 47 | } |
| 48 | |