Fix Windows build by including raw_ostream.h
[oota-llvm.git] / test / MC / AArch64 / neon-simd-ldst-one-elem.s
1 // RUN: llvm-mc -triple=arm64 -mattr=+neon -show-encoding < %s | FileCheck %s
2
3 // Check that the assembler can handle the documented syntax for AArch64
4
5 //------------------------------------------------------------------------------
6 // Load single 1-element structure to all lanes of 1 register
7 //------------------------------------------------------------------------------
8          ld1r { v0.16b }, [x0]
9          ld1r { v15.8h }, [x15]
10          ld1r { v31.4s }, [sp]
11          ld1r { v0.2d }, [x0]
12          ld1r { v0.8b }, [x0]
13          ld1r { v15.4h }, [x15]
14          ld1r { v31.2s }, [sp]
15          ld1r { v0.1d }, [x0]
16 // CHECK: ld1r { v0.16b }, [x0]          // encoding: [0x00,0xc0,0x40,0x4d]
17 // CHECK: ld1r { v15.8h }, [x15]         // encoding: [0xef,0xc5,0x40,0x4d]
18 // CHECK: ld1r { v31.4s }, [sp]          // encoding: [0xff,0xcb,0x40,0x4d]
19 // CHECK: ld1r { v0.2d }, [x0]           // encoding: [0x00,0xcc,0x40,0x4d]
20 // CHECK: ld1r { v0.8b }, [x0]           // encoding: [0x00,0xc0,0x40,0x0d]
21 // CHECK: ld1r { v15.4h }, [x15]         // encoding: [0xef,0xc5,0x40,0x0d]
22 // CHECK: ld1r { v31.2s }, [sp]          // encoding: [0xff,0xcb,0x40,0x0d]
23 // CHECK: ld1r { v0.1d }, [x0]           // encoding: [0x00,0xcc,0x40,0x0d]
24
25 //------------------------------------------------------------------------------
26 // Load single N-element structure to all lanes of N consecutive
27 // registers (N = 2,3,4)
28 //------------------------------------------------------------------------------
29          ld2r { v0.16b, v1.16b }, [x0]
30          ld2r { v15.8h, v16.8h }, [x15]
31          ld2r { v31.4s, v0.4s }, [sp]
32          ld2r { v0.2d, v1.2d }, [x0]
33          ld2r { v0.8b, v1.8b }, [x0]
34          ld2r { v15.4h, v16.4h }, [x15]
35          ld2r { v31.2s, v0.2s }, [sp]
36          ld2r { v31.1d, v0.1d }, [sp]
37 // CHECK: ld2r { v0.16b, v1.16b }, [x0]  // encoding: [0x00,0xc0,0x60,0x4d]
38 // CHECK: ld2r { v15.8h, v16.8h }, [x15] // encoding: [0xef,0xc5,0x60,0x4d]
39 // CHECK: ld2r { v31.4s, v0.4s }, [sp]   // encoding: [0xff,0xcb,0x60,0x4d]
40 // CHECK: ld2r { v0.2d, v1.2d }, [x0]    // encoding: [0x00,0xcc,0x60,0x4d]
41 // CHECK: ld2r { v0.8b, v1.8b }, [x0]    // encoding: [0x00,0xc0,0x60,0x0d]
42 // CHECK: ld2r { v15.4h, v16.4h }, [x15] // encoding: [0xef,0xc5,0x60,0x0d]
43 // CHECK: ld2r { v31.2s, v0.2s }, [sp]   // encoding: [0xff,0xcb,0x60,0x0d]
44 // CHECK: ld2r { v31.1d, v0.1d }, [sp]   // encoding: [0xff,0xcf,0x60,0x0d]
45
46          ld3r { v0.16b, v1.16b, v2.16b }, [x0]
47          ld3r { v15.8h, v16.8h, v17.8h }, [x15]
48          ld3r { v31.4s, v0.4s, v1.4s }, [sp]
49          ld3r { v0.2d, v1.2d, v2.2d }, [x0]
50          ld3r { v0.8b, v1.8b, v2.8b }, [x0]
51          ld3r { v15.4h, v16.4h, v17.4h }, [x15]
52          ld3r { v31.2s, v0.2s, v1.2s }, [sp]
53          ld3r { v31.1d, v0.1d, v1.1d }, [sp]
54 // CHECK: ld3r { v0.16b, v1.16b, v2.16b }, [x0] // encoding: [0x00,0xe0,0x40,0x4d]
55 // CHECK: ld3r { v15.8h, v16.8h, v17.8h }, [x15] // encoding: [0xef,0xe5,0x40,0x4d]
56 // CHECK: ld3r { v31.4s, v0.4s, v1.4s }, [sp] // encoding: [0xff,0xeb,0x40,0x4d]
57 // CHECK: ld3r { v0.2d, v1.2d, v2.2d }, [x0] // encoding: [0x00,0xec,0x40,0x4d]
58 // CHECK: ld3r { v0.8b, v1.8b, v2.8b }, [x0] // encoding: [0x00,0xe0,0x40,0x0d]
59 // CHECK: ld3r { v15.4h, v16.4h, v17.4h }, [x15] // encoding: [0xef,0xe5,0x40,0x0d]
60 // CHECK: ld3r { v31.2s, v0.2s, v1.2s }, [sp] // encoding: [0xff,0xeb,0x40,0x0d]
61 // CHECK: ld3r { v31.1d, v0.1d, v1.1d }, [sp] // encoding: [0xff,0xef,0x40,0x0d]
62
63          ld4r { v0.16b, v1.16b, v2.16b, v3.16b }, [x0]
64          ld4r { v15.8h, v16.8h, v17.8h, v18.8h }, [x15]
65          ld4r { v31.4s, v0.4s, v1.4s, v2.4s }, [sp]
66          ld4r { v0.2d, v1.2d, v2.2d, v3.2d }, [x0]
67          ld4r { v0.8b, v1.8b, v2.8b, v3.8b }, [x0]
68          ld4r { v15.4h, v16.4h, v17.4h, v18.4h }, [x15]
69          ld4r { v31.2s, v0.2s, v1.2s, v2.2s }, [sp]
70          ld4r { v31.1d, v0.1d, v1.1d, v2.1d }, [sp]
71 // CHECK: ld4r { v0.16b, v1.16b, v2.16b, v3.16b }, [x0] // encoding: [0x00,0xe0,0x60,0x4d]
72 // CHECK: ld4r { v15.8h, v16.8h, v17.8h, v18.8h }, [x15] // encoding: [0xef,0xe5,0x60,0x4d]
73 // CHECK: ld4r { v31.4s, v0.4s, v1.4s, v2.4s }, [sp] // encoding: [0xff,0xeb,0x60,0x4d]
74 // CHECK: ld4r { v0.2d, v1.2d, v2.2d, v3.2d }, [x0] // encoding: [0x00,0xec,0x60,0x4d]
75 // CHECK: ld4r { v0.8b, v1.8b, v2.8b, v3.8b }, [x0] // encoding: [0x00,0xe0,0x60,0x0d]
76 // CHECK: ld4r { v15.4h, v16.4h, v17.4h, v18.4h }, [x15] // encoding: [0xef,0xe5,0x60,0x0d]
77 // CHECK: ld4r { v31.2s, v0.2s, v1.2s, v2.2s }, [sp] // encoding: [0xff,0xeb,0x60,0x0d]
78 // CHECK: ld4r { v31.1d, v0.1d, v1.1d, v2.1d }, [sp] // encoding: [0xff,0xef,0x60,0x0d]
79
80 //------------------------------------------------------------------------------
81 // Load single 1-element structure to one lane of 1 register.
82 //------------------------------------------------------------------------------
83          ld1 { v0.b }[9], [x0]
84          ld1 { v15.h }[7], [x15]
85          ld1 { v31.s }[3], [sp]
86          ld1 { v0.d }[1], [x0]
87 // CHECK: ld1 { v0.b }[9], [x0]         // encoding: [0x00,0x04,0x40,0x4d]
88 // CHECK: ld1 { v15.h }[7], [x15]       // encoding: [0xef,0x59,0x40,0x4d]
89 // CHECK: ld1 { v31.s }[3], [sp]        // encoding: [0xff,0x93,0x40,0x4d]
90 // CHECK: ld1 { v0.d }[1], [x0]         // encoding: [0x00,0x84,0x40,0x4d]
91
92 //------------------------------------------------------------------------------
93 // Load single N-element structure to one lane of N consecutive registers
94 // (N = 2,3,4)
95 //------------------------------------------------------------------------------
96          ld2 { v0.b, v1.b }[9], [x0]
97          ld2 { v15.h, v16.h }[7], [x15]
98          ld2 { v31.s, v0.s }[3], [sp]
99          ld2 { v0.d, v1.d }[1], [x0]
100 // CHECK: ld2 { v0.b, v1.b }[9], [x0]   // encoding: [0x00,0x04,0x60,0x4d]
101 // CHECK: ld2 { v15.h, v16.h }[7], [x15] // encoding: [0xef,0x59,0x60,0x4d]
102 // CHECK: ld2 { v31.s, v0.s }[3], [sp]  // encoding: [0xff,0x93,0x60,0x4d]
103 // CHECK: ld2 { v0.d, v1.d }[1], [x0]   // encoding: [0x00,0x84,0x60,0x4d]
104
105          ld3 { v0.b, v1.b, v2.b }[9], [x0]
106          ld3 { v15.h, v16.h, v17.h }[7], [x15]
107          ld3 { v31.s, v0.s, v1.s }[3], [sp]
108          ld3 { v0.d, v1.d, v2.d }[1], [x0]
109 // CHECK: ld3 { v0.b, v1.b, v2.b }[9], [x0] // encoding: [0x00,0x24,0x40,0x4d]
110 // CHECK: ld3 { v15.h, v16.h, v17.h }[7], [x15] // encoding: [0xef,0x79,0x40,0x4d]
111 // CHECK: ld3 { v31.s, v0.s, v1.s }[3], [sp] // encoding: [0xff,0xb3,0x40,0x4d]
112 // CHECK: ld3 { v0.d, v1.d, v2.d }[1], [x0] // encoding: [0x00,0xa4,0x40,0x4d]
113
114          ld4 { v0.b, v1.b, v2.b, v3.b }[9], [x0]
115          ld4 { v15.h, v16.h, v17.h, v18.h }[7], [x15]
116          ld4 { v31.s, v0.s, v1.s, v2.s }[3], [sp]
117          ld4 { v0.d, v1.d, v2.d, v3.d }[1], [x0]
118 // CHECK: ld4 { v0.b, v1.b, v2.b, v3.b }[9], [x0] // encoding: [0x00,0x24,0x60,0x4d]
119 // CHECK: ld4 { v15.h, v16.h, v17.h, v18.h }[7], [x15] // encoding: [0xef,0x79,0x60,0x4d]
120 // CHECK: ld4 { v31.s, v0.s, v1.s, v2.s }[3], [sp] // encoding: [0xff,0xb3,0x60,0x4d]
121 // CHECK: ld4 { v0.d, v1.d, v2.d, v3.d }[1], [x0] // encoding: [0x00,0xa4,0x60,0x4d]
122
123 //------------------------------------------------------------------------------
124 // Store single 1-element structure from one lane of 1 register.
125 //------------------------------------------------------------------------------
126          st1 { v0.b }[9], [x0]
127          st1 { v15.h }[7], [x15]
128          st1 { v31.s }[3], [sp]
129          st1 { v0.d }[1], [x0]
130 // CHECK: st1 { v0.b }[9], [x0]         // encoding: [0x00,0x04,0x00,0x4d]
131 // CHECK: st1 { v15.h }[7], [x15]       // encoding: [0xef,0x59,0x00,0x4d]
132 // CHECK: st1 { v31.s }[3], [sp]        // encoding: [0xff,0x93,0x00,0x4d]
133 // CHECK: st1 { v0.d }[1], [x0]         // encoding: [0x00,0x84,0x00,0x4d]
134
135 //------------------------------------------------------------------------------
136 // Store single N-element structure from one lane of N consecutive registers
137 // (N = 2,3,4)
138 //------------------------------------------------------------------------------
139          st2 { v0.b, v1.b }[9], [x0]
140          st2 { v15.h, v16.h }[7], [x15]
141          st2 { v31.s, v0.s }[3], [sp]
142          st2 { v0.d, v1.d }[1], [x0]
143 // CHECK: st2 { v0.b, v1.b }[9], [x0]   // encoding: [0x00,0x04,0x20,0x4d]
144 // CHECK: st2 { v15.h, v16.h }[7], [x15] // encoding: [0xef,0x59,0x20,0x4d]
145 // CHECK: st2 { v31.s, v0.s }[3], [sp]  // encoding: [0xff,0x93,0x20,0x4d]
146 // CHECK: st2 { v0.d, v1.d }[1], [x0]   // encoding: [0x00,0x84,0x20,0x4d]
147
148          st3 { v0.b, v1.b, v2.b }[9], [x0]
149          st3 { v15.h, v16.h, v17.h }[7], [x15]
150          st3 { v31.s, v0.s, v1.s }[3], [sp]
151          st3 { v0.d, v1.d, v2.d }[1], [x0]
152 // CHECK: st3 { v0.b, v1.b, v2.b }[9], [x0] // encoding: [0x00,0x24,0x00,0x4d]
153 // CHECK: st3 { v15.h, v16.h, v17.h }[7], [x15] // encoding: [0xef,0x79,0x00,0x4d]
154 // CHECK: st3 { v31.s, v0.s, v1.s }[3], [sp] // encoding: [0xff,0xb3,0x00,0x4d]
155 // CHECK: st3 { v0.d, v1.d, v2.d }[1], [x0] // encoding: [0x00,0xa4,0x00,0x4d]
156
157          st4 { v0.b, v1.b, v2.b, v3.b }[9], [x0]
158          st4 { v15.h, v16.h, v17.h, v18.h }[7], [x15]
159          st4 { v31.s, v0.s, v1.s, v2.s }[3], [sp]
160          st4 { v0.d, v1.d, v2.d, v3.d }[1], [x0]
161 // CHECK: st4 { v0.b, v1.b, v2.b, v3.b }[9], [x0] // encoding: [0x00,0x24,0x20,0x4d]
162 // CHECK: st4 { v15.h, v16.h, v17.h, v18.h }[7], [x15] // encoding: [0xef,0x79,0x20,0x4d]
163 // CHECK: st4 { v31.s, v0.s, v1.s, v2.s }[3], [sp] // encoding: [0xff,0xb3,0x20,0x4d]
164 // CHECK: st4 { v0.d, v1.d, v2.d, v3.d }[1], [x0] // encoding: [0x00,0xa4,0x20,0x4d]
165
166 //------------------------------------------------------------------------------
167 // Post-index oad single 1-element structure to all lanes of 1 register
168 //------------------------------------------------------------------------------
169          ld1r { v0.16b }, [x0], #1
170          ld1r { v15.8h }, [x15], #2
171          ld1r { v31.4s }, [sp], #4
172          ld1r { v0.2d }, [x0], #8
173          ld1r { v0.8b }, [x0], x0
174          ld1r { v15.4h }, [x15], x1
175          ld1r { v31.2s }, [sp], x2
176          ld1r { v0.1d }, [x0], x3
177 // CHECK: ld1r { v0.16b }, [x0], #1      // encoding: [0x00,0xc0,0xdf,0x4d]
178 // CHECK: ld1r { v15.8h }, [x15], #2     // encoding: [0xef,0xc5,0xdf,0x4d]
179 // CHECK: ld1r { v31.4s }, [sp], #4      // encoding: [0xff,0xcb,0xdf,0x4d]
180 // CHECK: ld1r { v0.2d }, [x0], #8       // encoding: [0x00,0xcc,0xdf,0x4d]
181 // CHECK: ld1r { v0.8b }, [x0], x0       // encoding: [0x00,0xc0,0xc0,0x0d]
182 // CHECK: ld1r { v15.4h }, [x15], x1     // encoding: [0xef,0xc5,0xc1,0x0d]
183 // CHECK: ld1r { v31.2s }, [sp], x2      // encoding: [0xff,0xcb,0xc2,0x0d]
184 // CHECK: ld1r { v0.1d }, [x0], x3       // encoding: [0x00,0xcc,0xc3,0x0d]
185
186 //------------------------------------------------------------------------------
187 // Post-index load single N-element structure to all lanes of N consecutive
188 // registers (N = 2,3,4)
189 //------------------------------------------------------------------------------
190          ld2r { v0.16b, v1.16b }, [x0], #2
191          ld2r { v15.8h, v16.8h }, [x15], #4
192          ld2r { v31.4s, v0.4s }, [sp], #8
193          ld2r { v0.2d, v1.2d }, [x0], #16
194          ld2r { v0.8b, v1.8b }, [x0], x6
195          ld2r { v15.4h, v16.4h }, [x15], x7
196          ld2r { v31.2s, v0.2s }, [sp], x9
197          ld2r { v31.1d, v0.1d }, [x0], x5
198 // CHECK: ld2r { v0.16b, v1.16b }, [x0], #2 // encoding: [0x00,0xc0,0xff,0x4d]
199 // CHECK: ld2r { v15.8h, v16.8h }, [x15], #4 // encoding: [0xef,0xc5,0xff,0x4d]
200 // CHECK: ld2r { v31.4s, v0.4s }, [sp], #8 // encoding: [0xff,0xcb,0xff,0x4d]
201 // CHECK: ld2r { v0.2d, v1.2d }, [x0], #16 // encoding: [0x00,0xcc,0xff,0x4d]
202 // CHECK: ld2r { v0.8b, v1.8b }, [x0], x6 // encoding: [0x00,0xc0,0xe6,0x0d]
203 // CHECK: ld2r { v15.4h, v16.4h }, [x15], x7 // encoding: [0xef,0xc5,0xe7,0x0d]
204 // CHECK: ld2r { v31.2s, v0.2s }, [sp], x9 // encoding: [0xff,0xcb,0xe9,0x0d]
205 // CHECK: ld2r { v31.1d, v0.1d }, [x0], x5 // encoding: [0x1f,0xcc,0xe5,0x0d]
206
207          ld3r { v0.16b, v1.16b, v2.16b }, [x0], x9
208          ld3r { v15.8h, v16.8h, v17.8h }, [x15], x6
209          ld3r { v31.4s, v0.4s, v1.4s }, [sp], x7
210          ld3r { v0.2d, v1.2d, v2.2d }, [x0], x5
211          ld3r { v0.8b, v1.8b, v2.8b }, [x0], #3
212          ld3r { v15.4h, v16.4h, v17.4h }, [x15], #6
213          ld3r { v31.2s, v0.2s, v1.2s }, [sp], #12
214          ld3r { v31.1d, v0.1d, v1.1d }, [sp], #24
215 // CHECK: ld3r { v0.16b, v1.16b, v2.16b }, [x0], x9 // encoding: [0x00,0xe0,0xc9,0x4d]
216 // CHECK: ld3r { v15.8h, v16.8h, v17.8h }, [x15], x6 // encoding: [0xef,0xe5,0xc6,0x4d]
217 // CHECK: ld3r { v31.4s, v0.4s, v1.4s }, [sp], x7 // encoding: [0xff,0xeb,0xc7,0x4d]
218 // CHECK: ld3r { v0.2d, v1.2d, v2.2d }, [x0], x5 // encoding: [0x00,0xec,0xc5,0x4d]
219 // CHECK: ld3r { v0.8b, v1.8b, v2.8b }, [x0], #3 // encoding: [0x00,0xe0,0xdf,0x0d]
220 // CHECK: ld3r { v15.4h, v16.4h, v17.4h }, [x15], #6 // encoding: [0xef,0xe5,0xdf,0x0d]
221 // CHECK: ld3r { v31.2s, v0.2s, v1.2s }, [sp], #12 // encoding: [0xff,0xeb,0xdf,0x0d]
222 // CHECK: ld3r { v31.1d, v0.1d, v1.1d }, [sp], #24 // encoding: [0xff,0xef,0xdf,0x0d]
223
224          ld4r { v0.16b, v1.16b, v2.16b, v3.16b }, [x0], #4
225          ld4r { v15.8h, v16.8h, v17.8h, v18.8h }, [x15], #8
226          ld4r { v31.4s, v0.4s, v1.4s, v2.4s }, [sp], #16
227          ld4r { v0.2d, v1.2d, v2.2d, v3.2d }, [x0], #32
228          ld4r { v0.8b, v1.8b, v2.8b, v3.8b }, [x0], x5
229          ld4r { v15.4h, v16.4h, v17.4h, v18.4h }, [x15], x9
230          ld4r { v31.2s, v0.2s, v1.2s, v2.2s }, [sp], x30
231          ld4r { v31.1d, v0.1d, v1.1d, v2.1d }, [sp], x7
232 // CHECK: ld4r { v0.16b, v1.16b, v2.16b, v3.16b }, [x0], #4 // encoding: [0x00,0xe0,0xff,0x4d]
233 // CHECK: ld4r { v15.8h, v16.8h, v17.8h, v18.8h }, [x15], #8 // encoding: [0xef,0xe5,0xff,0x4d]
234 // CHECK: ld4r { v31.4s, v0.4s, v1.4s, v2.4s }, [sp], #16 // encoding: [0xff,0xeb,0xff,0x4d]
235 // CHECK: ld4r { v0.2d, v1.2d, v2.2d, v3.2d }, [x0], #32 // encoding: [0x00,0xec,0xff,0x4d]
236 // CHECK: ld4r { v0.8b, v1.8b, v2.8b, v3.8b }, [x0], x5 // encoding: [0x00,0xe0,0xe5,0x0d]
237 // CHECK: ld4r { v15.4h, v16.4h, v17.4h, v18.4h }, [x15], x9 // encoding: [0xef,0xe5,0xe9,0x0d]
238 // CHECK: ld4r { v31.2s, v0.2s, v1.2s, v2.2s }, [sp], x30 // encoding: [0xff,0xeb,0xfe,0x0d]
239 // CHECK: ld4r { v31.1d, v0.1d, v1.1d, v2.1d }, [sp], x7 // encoding: [0xff,0xef,0xe7,0x0d]
240
241 //------------------------------------------------------------------------------
242 // Post-index load single 1-element structure to one lane of 1 register.
243 //------------------------------------------------------------------------------
244          ld1 { v0.b }[9], [x0], #1
245          ld1 { v15.h }[7], [x15], x9
246          ld1 { v31.s }[3], [sp], x6
247          ld1 { v0.d }[1], [x0], #8
248 // CHECK: ld1 { v0.b }[9], [x0], #1     // encoding: [0x00,0x04,0xdf,0x4d]
249 // CHECK: ld1 { v15.h }[7], [x15], x9   // encoding: [0xef,0x59,0xc9,0x4d]
250 // CHECK: ld1 { v31.s }[3], [sp], x6    // encoding: [0xff,0x93,0xc6,0x4d]
251 // CHECK: ld1 { v0.d }[1], [x0], #8     // encoding: [0x00,0x84,0xdf,0x4d]
252
253 //------------------------------------------------------------------------------
254 // Post-index load single N-element structure to one lane of N consecutive
255 // registers (N = 2,3,4)
256 //------------------------------------------------------------------------------
257          ld2 { v0.b, v1.b }[9], [x0], x3
258          ld2 { v15.h, v16.h }[7], [x15], #4
259          ld2 { v31.s, v0.s }[3], [sp], #8
260          ld2 { v0.d, v1.d }[1], [x0], x0
261 // CHECK: ld2 { v0.b, v1.b }[9], [x0], x3 // encoding: [0x00,0x04,0xe3,0x4d]
262 // CHECK: ld2 { v15.h, v16.h }[7], [x15], #4 // encoding: [0xef,0x59,0xff,0x4d]
263 // CHECK: ld2 { v31.s, v0.s }[3], [sp], #8 // encoding: [0xff,0x93,0xff,0x4d]
264 // CHECK: ld2 { v0.d, v1.d }[1], [x0], x0 // encoding: [0x00,0x84,0xe0,0x4d]
265
266          ld3 { v0.b, v1.b, v2.b }[9], [x0], #3
267          ld3 { v15.h, v16.h, v17.h }[7], [x15], #6
268          ld3 { v31.s, v0.s, v1.s }[3], [sp], x3
269          ld3 { v0.d, v1.d, v2.d }[1], [x0], x6
270 // CHECK: ld3 { v0.b, v1.b, v2.b }[9], [x0], #3 // encoding: [0x00,0x24,0xdf,0x4d]
271 // CHECK: ld3 { v15.h, v16.h, v17.h }[7], [x15], #6 // encoding: [0xef,0x79,0xdf,0x4d]
272 // CHECK: ld3 { v31.s, v0.s, v1.s }[3], [sp], x3 // encoding: [0xff,0xb3,0xc3,0x4d]
273 // CHECK: ld3 { v0.d, v1.d, v2.d }[1], [x0], x6 // encoding: [0x00,0xa4,0xc6,0x4d]
274
275          ld4 { v0.b, v1.b, v2.b, v3.b }[9], [x0], x5
276          ld4 { v15.h, v16.h, v17.h, v18.h }[7], [x15], x7
277          ld4 { v31.s, v0.s, v1.s, v2.s }[3], [sp], #16
278          ld4 { v0.d, v1.d, v2.d, v3.d }[1], [x0], #32
279 // CHECK: ld4 { v0.b, v1.b, v2.b, v3.b }[9], [x0], x5 // encoding: [0x00,0x24,0xe5,0x4d]
280 // CHECK: ld4 { v15.h, v16.h, v17.h, v18.h }[7], [x15], x7 // encoding: [0xef,0x79,0xe7,0x4d]
281 // CHECK: ld4 { v31.s, v0.s, v1.s, v2.s }[3], [sp], #16 // encoding: [0xff,0xb3,0xff,0x4d]
282 // CHECK: ld4 { v0.d, v1.d, v2.d, v3.d }[1], [x0], #32 // encoding: [0x00,0xa4,0xff,0x4d]
283
284 //------------------------------------------------------------------------------
285 // Post-index store single 1-element structure from one lane of 1 register.
286 //------------------------------------------------------------------------------
287          st1 { v0.b }[9], [x0], #1
288          st1 { v15.h }[7], [x15], x9
289          st1 { v31.s }[3], [sp], x6
290          st1 { v0.d }[1], [x0], #8
291 // CHECK: st1 { v0.b }[9], [x0], #1     // encoding: [0x00,0x04,0x9f,0x4d]
292 // CHECK: st1 { v15.h }[7], [x15], x9   // encoding: [0xef,0x59,0x89,0x4d]
293 // CHECK: st1 { v31.s }[3], [sp], x6    // encoding: [0xff,0x93,0x86,0x4d]
294 // CHECK: st1 { v0.d }[1], [x0], #8     // encoding: [0x00,0x84,0x9f,0x4d]
295
296 //------------------------------------------------------------------------------
297 // Post-index store single N-element structure from one lane of N consecutive
298 // registers (N = 2,3,4)
299 //------------------------------------------------------------------------------
300          st2 { v0.b, v1.b }[9], [x0], x3
301          st2 { v15.h, v16.h }[7], [x15], #4
302          st2 { v31.s, v0.s }[3], [sp], #8
303          st2 { v0.d, v1.d }[1], [x0], x0
304 // CHECK: st2 { v0.b, v1.b }[9], [x0], x3 // encoding: [0x00,0x04,0xa3,0x4d]
305 // CHECK: st2 { v15.h, v16.h }[7], [x15], #4 // encoding: [0xef,0x59,0xbf,0x4d]
306 // CHECK: st2 { v31.s, v0.s }[3], [sp], #8 // encoding: [0xff,0x93,0xbf,0x4d]
307 // CHECK: st2 { v0.d, v1.d }[1], [x0], x0 // encoding: [0x00,0x84,0xa0,0x4d]
308
309          st3 { v0.b, v1.b, v2.b }[9], [x0], #3
310          st3 { v15.h, v16.h, v17.h }[7], [x15], #6
311          st3 { v31.s, v0.s, v1.s }[3], [sp], x3
312          st3 { v0.d, v1.d, v2.d }[1], [x0], x6
313 // CHECK: st3 { v0.b, v1.b, v2.b }[9], [x0], #3 // encoding: [0x00,0x24,0x9f,0x4d]
314 // CHECK: st3 { v15.h, v16.h, v17.h }[7], [x15], #6 // encoding: [0xef,0x79,0x9f,0x4d]
315 // CHECK: st3 { v31.s, v0.s, v1.s }[3], [sp], x3 // encoding: [0xff,0xb3,0x83,0x4d]
316 // CHECK: st3 { v0.d, v1.d, v2.d }[1], [x0], x6 // encoding: [0x00,0xa4,0x86,0x4d]
317
318          st4 { v0.b, v1.b, v2.b, v3.b }[9], [x0], x5
319          st4 { v15.h, v16.h, v17.h, v18.h }[7], [x15], x7
320          st4 { v31.s, v0.s, v1.s, v2.s }[3], [sp], #16
321          st4 { v0.d, v1.d, v2.d, v3.d }[1], [x0], #32
322 // CHECK: st4 { v0.b, v1.b, v2.b, v3.b }[9], [x0], x5 // encoding: [0x00,0x24,0xa5,0x4d]
323 // CHECK: st4 { v15.h, v16.h, v17.h, v18.h }[7], [x15], x7 // encoding: [0xef,0x79,0xa7,0x4d]
324 // CHECK: st4 { v31.s, v0.s, v1.s, v2.s }[3], [sp], #16 // encoding: [0xff,0xb3,0xbf,0x4d]
325 // CHECK: st4 { v0.d, v1.d, v2.d, v3.d }[1], [x0], #32 // encoding: [0x00,0xa4,0xbf,0x4d]