xref: /llvm-project/llvm/test/tools/llvm-mca/AArch64/Cortex/A55-writeback.s (revision 475d687ac1123f7ea01bc90789d93b5938930ca1)
1# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2# RUN: llvm-mca -mtriple=aarch64 -mcpu=cortex-a55 --instruction-info=0 --resource-pressure=0 --timeline --timeline-max-iterations=1 < %s | FileCheck %s
3
4# LLVM-MCA-BEGIN G01
# LD1 (one register), post-index by immediate; each add reads the written-back base x27.
5ld1  { v1.1d }, [x27], #8
6add x0, x27, 1
7ld1  { v1.2d }, [x27], #16
8add x0, x27, 1
9ld1  { v1.2s }, [x27], #8
10add x0, x27, 1
11ld1  { v1.4h }, [x27], #8
12add x0, x27, 1
13ld1  { v1.4s }, [x27], #16
14add x0, x27, 1
15# LLVM-MCA-END
16
17# LLVM-MCA-BEGIN G02
# LD1 (one register): post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
18ld1  { v1.8b }, [x27], #8
19add x0, x27, 1
20ld1  { v1.8h }, [x27], #16
21add x0, x27, 1
22ld1  { v1.16b }, [x27], #16
23add x0, x27, 1
24ld1  { v1.1d }, [x27], x28
25add x0, x27, 1
26ld1  { v1.2d }, [x27], x28
27add x0, x27, 1
28# LLVM-MCA-END
29
30# LLVM-MCA-BEGIN G03
# LD1 (one register), post-index by register x28; each add reads the written-back base x27.
31ld1  { v1.2s }, [x27], x28
32add x0, x27, 1
33ld1  { v1.4h }, [x27], x28
34add x0, x27, 1
35ld1  { v1.4s }, [x27], x28
36add x0, x27, 1
37ld1  { v1.8b }, [x27], x28
38add x0, x27, 1
39ld1  { v1.8h }, [x27], x28
40add x0, x27, 1
41# LLVM-MCA-END
42
43# LLVM-MCA-BEGIN G04
# LD1 one register (.16b) post-index by register, then LD1 two registers post-index by immediate; each add reads the written-back base x27.
44ld1  { v1.16b }, [x27], x28
45add x0, x27, 1
46ld1  { v1.1d, v2.1d }, [x27], #16
47add x0, x27, 1
48ld1  { v1.2d, v2.2d }, [x27], #32
49add x0, x27, 1
50ld1  { v1.2s, v2.2s }, [x27], #16
51add x0, x27, 1
52ld1  { v1.4h, v2.4h }, [x27], #16
53add x0, x27, 1
54# LLVM-MCA-END
55
56# LLVM-MCA-BEGIN G05
# LD1 (two registers): post-index by immediate, the last one by register x28; each add reads the written-back base x27.
57ld1  { v1.4s, v2.4s }, [x27], #32
58add x0, x27, 1
59ld1  { v1.8b, v2.8b }, [x27], #16
60add x0, x27, 1
61ld1  { v1.8h, v2.8h }, [x27], #32
62add x0, x27, 1
63ld1  { v1.16b, v2.16b }, [x27], #32
64add x0, x27, 1
65ld1  { v1.1d, v2.1d }, [x27], x28
66add x0, x27, 1
67# LLVM-MCA-END
68
69# LLVM-MCA-BEGIN G06
# LD1 (two registers), post-index by register x28; each add reads the written-back base x27.
70ld1  { v1.2d, v2.2d }, [x27], x28
71add x0, x27, 1
72ld1  { v1.2s, v2.2s }, [x27], x28
73add x0, x27, 1
74ld1  { v1.4h, v2.4h }, [x27], x28
75add x0, x27, 1
76ld1  { v1.4s, v2.4s }, [x27], x28
77add x0, x27, 1
78ld1  { v1.8b, v2.8b }, [x27], x28
79add x0, x27, 1
80# LLVM-MCA-END
81
82# LLVM-MCA-BEGIN G07
# LD1 two registers post-index by register, then LD1 three registers post-index by immediate; each add reads the written-back base x27.
83ld1  { v1.8h, v2.8h }, [x27], x28
84add x0, x27, 1
85ld1  { v1.16b, v2.16b }, [x27], x28
86add x0, x27, 1
87ld1  { v1.1d, v2.1d, v3.1d }, [x27], #24
88add x0, x27, 1
89ld1  { v1.2d, v2.2d, v3.2d }, [x27], #48
90add x0, x27, 1
91ld1  { v1.2s, v2.2s, v3.2s }, [x27], #24
92add x0, x27, 1
93# LLVM-MCA-END
94
95# LLVM-MCA-BEGIN G08
# LD1 (three registers), post-index by immediate; each add reads the written-back base x27.
96ld1  { v1.4h, v2.4h, v3.4h }, [x27], #24
97add x0, x27, 1
98ld1  { v1.4s, v2.4s, v3.4s }, [x27], #48
99add x0, x27, 1
100ld1  { v1.8b, v2.8b, v3.8b }, [x27], #24
101add x0, x27, 1
102ld1  { v1.8h, v2.8h, v3.8h }, [x27], #48
103add x0, x27, 1
104ld1  { v1.16b, v2.16b, v3.16b }, [x27], #48
105add x0, x27, 1
106# LLVM-MCA-END
107
108# LLVM-MCA-BEGIN G09
# LD1 (three registers), post-index by register x28; each add reads the written-back base x27.
109ld1  { v1.1d, v2.1d, v3.1d }, [x27], x28
110add x0, x27, 1
111ld1  { v1.2d, v2.2d, v3.2d }, [x27], x28
112add x0, x27, 1
113ld1  { v1.2s, v2.2s, v3.2s }, [x27], x28
114add x0, x27, 1
115ld1  { v1.4h, v2.4h, v3.4h }, [x27], x28
116add x0, x27, 1
117ld1  { v1.4s, v2.4s, v3.4s }, [x27], x28
118add x0, x27, 1
119# LLVM-MCA-END
120
121# LLVM-MCA-BEGIN G10
# LD1 three registers post-index by register, then LD1 four registers post-index by immediate; each add reads the written-back base x27.
122ld1  { v1.8b, v2.8b, v3.8b }, [x27], x28
123add x0, x27, 1
124ld1  { v1.8h, v2.8h, v3.8h }, [x27], x28
125add x0, x27, 1
126ld1  { v1.16b, v2.16b, v3.16b }, [x27], x28
127add x0, x27, 1
128ld1  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
129add x0, x27, 1
130ld1  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
131add x0, x27, 1
132# LLVM-MCA-END
133
134# LLVM-MCA-BEGIN G11
# LD1 (four registers), post-index by immediate; each add reads the written-back base x27.
135ld1  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
136add x0, x27, 1
137ld1  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
138add x0, x27, 1
139ld1  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
140add x0, x27, 1
141ld1  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
142add x0, x27, 1
143ld1  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
144add x0, x27, 1
145# LLVM-MCA-END
146
147# LLVM-MCA-BEGIN G12
# LD1 (four registers): one post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
148ld1  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
149add x0, x27, 1
150ld1  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
151add x0, x27, 1
152ld1  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
153add x0, x27, 1
154ld1  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
155add x0, x27, 1
156ld1  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
157add x0, x27, 1
158# LLVM-MCA-END
159
160# LLVM-MCA-BEGIN G13
# LD1 four registers post-index by register, then a single-lane LD1 (byte lane 0) post-index by immediate; each add reads the written-back base x27.
161ld1  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
162add x0, x27, 1
163ld1  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
164add x0, x27, 1
165ld1  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
166add x0, x27, 1
167ld1  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
168add x0, x27, 1
169ld1  { v1.b }[0], [x27], #1
170add x0, x27, 1
171# LLVM-MCA-END
172
173# LLVM-MCA-BEGIN G14
# Single-lane LD1 on byte and halfword lanes, post-index by immediate and by register x28; each add reads the written-back base x27.
174ld1  { v1.b }[8], [x27], #1
175add x0, x27, 1
176ld1  { v1.b }[0], [x27], x28
177add x0, x27, 1
178ld1  { v1.b }[8], [x27], x28
179add x0, x27, 1
180ld1  { v1.h }[0], [x27], #2
181add x0, x27, 1
182ld1  { v1.h }[4], [x27], #2
183add x0, x27, 1
184# LLVM-MCA-END
185
186# LLVM-MCA-BEGIN G15
# Single-lane LD1 on halfword, word and doubleword lanes, post-index by register x28 and by immediate; each add reads the written-back base x27.
187ld1  { v1.h }[0], [x27], x28
188add x0, x27, 1
189ld1  { v1.h }[4], [x27], x28
190add x0, x27, 1
191ld1  { v1.s }[0], [x27], #4
192add x0, x27, 1
193ld1  { v1.s }[0], [x27], x28
194add x0, x27, 1
195ld1  { v1.d }[0], [x27], #8
196add x0, x27, 1
197# LLVM-MCA-END
198
199# LLVM-MCA-BEGIN G16
# Single-lane LD1 (doubleword lane) post-index by register, then LD1R post-index by immediate; each add reads the written-back base x27.
200ld1  { v1.d }[0], [x27], x28
201add x0, x27, 1
202ld1r  { v1.1d }, [x27], #8
203add x0, x27, 1
204ld1r  { v1.2d }, [x27], #8
205add x0, x27, 1
206ld1r  { v1.2s }, [x27], #4
207add x0, x27, 1
208ld1r  { v1.4h }, [x27], #2
209add x0, x27, 1
210# LLVM-MCA-END
211
212# LLVM-MCA-BEGIN G17
# LD1R: post-index by immediate, the last one by register x28; each add reads the written-back base x27.
213ld1r  { v1.4s }, [x27], #4
214add x0, x27, 1
215ld1r  { v1.8b }, [x27], #1
216add x0, x27, 1
217ld1r  { v1.8h }, [x27], #2
218add x0, x27, 1
219ld1r  { v1.16b }, [x27], #1
220add x0, x27, 1
221ld1r  { v1.1d }, [x27], x28
222add x0, x27, 1
223# LLVM-MCA-END
224
225# LLVM-MCA-BEGIN G18
# LD1R, post-index by register x28; each add reads the written-back base x27.
226ld1r  { v1.2d }, [x27], x28
227add x0, x27, 1
228ld1r  { v1.2s }, [x27], x28
229add x0, x27, 1
230ld1r  { v1.4h }, [x27], x28
231add x0, x27, 1
232ld1r  { v1.4s }, [x27], x28
233add x0, x27, 1
234ld1r  { v1.8b }, [x27], x28
235add x0, x27, 1
236# LLVM-MCA-END
237
238# LLVM-MCA-BEGIN G19
# LD1R post-index by register, then LD2 (multiple structures) post-index by immediate; each add reads the written-back base x27.
239ld1r  { v1.8h }, [x27], x28
240add x0, x27, 1
241ld1r  { v1.16b }, [x27], x28
242add x0, x27, 1
243ld2  { v1.2d, v2.2d }, [x27], #32
244add x0, x27, 1
245ld2  { v1.2s, v2.2s }, [x27], #16
246add x0, x27, 1
247ld2  { v1.4h, v2.4h }, [x27], #16
248add x0, x27, 1
249# LLVM-MCA-END
250
251# LLVM-MCA-BEGIN G20
# LD2 (multiple structures): post-index by immediate, the last one by register x28; each add reads the written-back base x27.
252ld2  { v1.4s, v2.4s }, [x27], #32
253add x0, x27, 1
254ld2  { v1.8b, v2.8b }, [x27], #16
255add x0, x27, 1
256ld2  { v1.8h, v2.8h }, [x27], #32
257add x0, x27, 1
258ld2  { v1.16b, v2.16b }, [x27], #32
259add x0, x27, 1
260ld2  { v1.2d, v2.2d }, [x27], x28
261add x0, x27, 1
262# LLVM-MCA-END
263
264# LLVM-MCA-BEGIN G21
# LD2 (multiple structures), post-index by register x28; each add reads the written-back base x27.
265ld2  { v1.2s, v2.2s }, [x27], x28
266add x0, x27, 1
267ld2  { v1.4h, v2.4h }, [x27], x28
268add x0, x27, 1
269ld2  { v1.4s, v2.4s }, [x27], x28
270add x0, x27, 1
271ld2  { v1.8b, v2.8b }, [x27], x28
272add x0, x27, 1
273ld2  { v1.8h, v2.8h }, [x27], x28
274add x0, x27, 1
275# LLVM-MCA-END
276
277# LLVM-MCA-BEGIN G22
# LD2 (.16b) post-index by register, then single-lane LD2 on byte lanes by immediate and by register; each add reads the written-back base x27.
278ld2  { v1.16b, v2.16b }, [x27], x28
279add x0, x27, 1
280ld2  { v1.b, v2.b }[0], [x27], #2
281add x0, x27, 1
282ld2  { v1.b, v2.b }[8], [x27], #2
283add x0, x27, 1
284ld2  { v1.b, v2.b }[0], [x27], x28
285add x0, x27, 1
286ld2  { v1.b, v2.b }[8], [x27], x28
287add x0, x27, 1
288# LLVM-MCA-END
289
290# LLVM-MCA-BEGIN G23
# Single-lane LD2 on halfword lanes (immediate and register post-index) and a word lane (immediate); each add reads the written-back base x27.
291ld2  { v1.h, v2.h }[0], [x27], #4
292add x0, x27, 1
293ld2  { v1.h, v2.h }[4], [x27], #4
294add x0, x27, 1
295ld2  { v1.h, v2.h }[0], [x27], x28
296add x0, x27, 1
297ld2  { v1.h, v2.h }[4], [x27], x28
298add x0, x27, 1
299ld2  { v1.s, v2.s }[0], [x27], #8
300add x0, x27, 1
301# LLVM-MCA-END
302
303# LLVM-MCA-BEGIN G24
# Single-lane LD2 on word and doubleword lanes, then LD2R post-index by immediate; each add reads the written-back base x27.
304ld2  { v1.s, v2.s }[0], [x27], x28
305add x0, x27, 1
306ld2  { v1.d, v2.d }[0], [x27], #16
307add x0, x27, 1
308ld2  { v1.d, v2.d }[0], [x27], x28
309add x0, x27, 1
310ld2r  { v1.1d, v2.1d }, [x27], #16
311add x0, x27, 1
312ld2r  { v1.2d, v2.2d }, [x27], #16
313add x0, x27, 1
314# LLVM-MCA-END
315
316# LLVM-MCA-BEGIN G25
# LD2R, post-index by immediate; each add reads the written-back base x27.
317ld2r  { v1.2s, v2.2s }, [x27], #8
318add x0, x27, 1
319ld2r  { v1.4h, v2.4h }, [x27], #4
320add x0, x27, 1
321ld2r  { v1.4s, v2.4s }, [x27], #8
322add x0, x27, 1
323ld2r  { v1.8b, v2.8b }, [x27], #2
324add x0, x27, 1
325ld2r  { v1.8h, v2.8h }, [x27], #4
326add x0, x27, 1
327# LLVM-MCA-END
328
329# LLVM-MCA-BEGIN G26
# LD2R: one post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
330ld2r  { v1.16b, v2.16b }, [x27], #2
331add x0, x27, 1
332ld2r  { v1.1d, v2.1d }, [x27], x28
333add x0, x27, 1
334ld2r  { v1.2d, v2.2d }, [x27], x28
335add x0, x27, 1
336ld2r  { v1.2s, v2.2s }, [x27], x28
337add x0, x27, 1
338ld2r  { v1.4h, v2.4h }, [x27], x28
339add x0, x27, 1
340# LLVM-MCA-END
341
342# LLVM-MCA-BEGIN G27
# LD2R post-index by register, then LD3 (multiple structures, .2d) post-index by immediate; each add reads the written-back base x27.
343ld2r  { v1.4s, v2.4s }, [x27], x28
344add x0, x27, 1
345ld2r  { v1.8b, v2.8b }, [x27], x28
346add x0, x27, 1
347ld2r  { v1.8h, v2.8h }, [x27], x28
348add x0, x27, 1
349ld2r  { v1.16b, v2.16b }, [x27], x28
350add x0, x27, 1
351ld3  { v1.2d, v2.2d, v3.2d }, [x27], #48
352add x0, x27, 1
353# LLVM-MCA-END
354
355# LLVM-MCA-BEGIN G28
# LD3 (multiple structures), post-index by immediate; each add reads the written-back base x27.
356ld3  { v1.2s, v2.2s, v3.2s }, [x27], #24
357add x0, x27, 1
358ld3  { v1.4h, v2.4h, v3.4h }, [x27], #24
359add x0, x27, 1
360ld3  { v1.4s, v2.4s, v3.4s }, [x27], #48
361add x0, x27, 1
362ld3  { v1.8b, v2.8b, v3.8b }, [x27], #24
363add x0, x27, 1
364ld3  { v1.8h, v2.8h, v3.8h }, [x27], #48
365add x0, x27, 1
366# LLVM-MCA-END
367
368# LLVM-MCA-BEGIN G29
# LD3 (multiple structures): one post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
369ld3  { v1.16b, v2.16b, v3.16b }, [x27], #48
370add x0, x27, 1
371ld3  { v1.2d, v2.2d, v3.2d }, [x27], x28
372add x0, x27, 1
373ld3  { v1.2s, v2.2s, v3.2s }, [x27], x28
374add x0, x27, 1
375ld3  { v1.4h, v2.4h, v3.4h }, [x27], x28
376add x0, x27, 1
377ld3  { v1.4s, v2.4s, v3.4s }, [x27], x28
378add x0, x27, 1
379# LLVM-MCA-END
380
381# LLVM-MCA-BEGIN G30
# LD3 (multiple structures) post-index by register, then single-lane LD3 on byte lanes post-index by immediate; each add reads the written-back base x27.
382ld3  { v1.8b, v2.8b, v3.8b }, [x27], x28
383add x0, x27, 1
384ld3  { v1.8h, v2.8h, v3.8h }, [x27], x28
385add x0, x27, 1
386ld3  { v1.16b, v2.16b, v3.16b }, [x27], x28
387add x0, x27, 1
388ld3  { v1.b, v2.b, v3.b }[0], [x27], #3
389add x0, x27, 1
390ld3  { v1.b, v2.b, v3.b }[8], [x27], #3
391add x0, x27, 1
392# LLVM-MCA-END
393
394# LLVM-MCA-BEGIN G31
# Single-lane LD3 on byte lanes (register post-index) and halfword lanes (immediate, then register); each add reads the written-back base x27.
395ld3  { v1.b, v2.b, v3.b }[0], [x27], x28
396add x0, x27, 1
397ld3  { v1.b, v2.b, v3.b }[8], [x27], x28
398add x0, x27, 1
399ld3  { v1.h, v2.h, v3.h }[0], [x27], #6
400add x0, x27, 1
401ld3  { v1.h, v2.h, v3.h }[4], [x27], #6
402add x0, x27, 1
403ld3  { v1.h, v2.h, v3.h }[0], [x27], x28
404add x0, x27, 1
405# LLVM-MCA-END
406
407# LLVM-MCA-BEGIN G32
# Single-lane LD3 on halfword, word and doubleword lanes, post-index by register x28 and by immediate; each add reads the written-back base x27.
408ld3  { v1.h, v2.h, v3.h }[4], [x27], x28
409add x0, x27, 1
410ld3  { v1.s, v2.s, v3.s }[0], [x27], #12
411add x0, x27, 1
412ld3  { v1.s, v2.s, v3.s }[0], [x27], x28
413add x0, x27, 1
414ld3  { v1.d, v2.d, v3.d }[0], [x27], #24
415add x0, x27, 1
416ld3  { v1.d, v2.d, v3.d }[0], [x27], x28
417add x0, x27, 1
418# LLVM-MCA-END
419
420# LLVM-MCA-BEGIN G33
# LD3R, post-index by immediate; each add reads the written-back base x27.
421ld3r  { v1.1d, v2.1d, v3.1d }, [x27], #24
422add x0, x27, 1
423ld3r  { v1.2d, v2.2d, v3.2d }, [x27], #24
424add x0, x27, 1
425ld3r  { v1.2s, v2.2s, v3.2s }, [x27], #12
426add x0, x27, 1
427ld3r  { v1.4h, v2.4h, v3.4h }, [x27], #6
428add x0, x27, 1
429ld3r  { v1.4s, v2.4s, v3.4s }, [x27], #12
430add x0, x27, 1
431# LLVM-MCA-END
432
433# LLVM-MCA-BEGIN G34
# LD3R: post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
434ld3r  { v1.8b, v2.8b, v3.8b }, [x27], #3
435add x0, x27, 1
436ld3r  { v1.8h, v2.8h, v3.8h }, [x27], #6
437add x0, x27, 1
438ld3r  { v1.16b, v2.16b, v3.16b }, [x27], #3
439add x0, x27, 1
440ld3r  { v1.1d, v2.1d, v3.1d }, [x27], x28
441add x0, x27, 1
442ld3r  { v1.2d, v2.2d, v3.2d }, [x27], x28
443add x0, x27, 1
444# LLVM-MCA-END
445
446# LLVM-MCA-BEGIN G35
# LD3R, post-index by register x28; each add reads the written-back base x27.
447ld3r  { v1.2s, v2.2s, v3.2s }, [x27], x28
448add x0, x27, 1
449ld3r  { v1.4h, v2.4h, v3.4h }, [x27], x28
450add x0, x27, 1
451ld3r  { v1.4s, v2.4s, v3.4s }, [x27], x28
452add x0, x27, 1
453ld3r  { v1.8b, v2.8b, v3.8b }, [x27], x28
454add x0, x27, 1
455ld3r  { v1.8h, v2.8h, v3.8h }, [x27], x28
456add x0, x27, 1
457# LLVM-MCA-END
458
459# LLVM-MCA-BEGIN G36
# LD3R (.16b) post-index by register, then LD4 (multiple structures) post-index by immediate; each add reads the written-back base x27.
460ld3r  { v1.16b, v2.16b, v3.16b }, [x27], x28
461add x0, x27, 1
462ld4  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
463add x0, x27, 1
464ld4  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
465add x0, x27, 1
466ld4  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
467add x0, x27, 1
468ld4  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
469add x0, x27, 1
470# LLVM-MCA-END
471
472# LLVM-MCA-BEGIN G37
# LD4 (multiple structures): post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
473ld4  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
474add x0, x27, 1
475ld4  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
476add x0, x27, 1
477ld4  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
478add x0, x27, 1
479ld4  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
480add x0, x27, 1
481ld4  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
482add x0, x27, 1
483# LLVM-MCA-END
484
485# LLVM-MCA-BEGIN G38
# LD4 (multiple structures), post-index by register x28; each add reads the written-back base x27.
486ld4  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
487add x0, x27, 1
488ld4  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
489add x0, x27, 1
490ld4  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
491add x0, x27, 1
492ld4  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
493add x0, x27, 1
494ld4  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
495add x0, x27, 1
496# LLVM-MCA-END
497
498# LLVM-MCA-BEGIN G39
# Single-lane LD4 on byte lanes (immediate and register post-index) and halfword lane 0 (immediate); each add reads the written-back base x27.
499ld4  { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
500add x0, x27, 1
501ld4  { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
502add x0, x27, 1
503ld4  { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
504add x0, x27, 1
505ld4  { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
506add x0, x27, 1
507ld4  { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
508add x0, x27, 1
509# LLVM-MCA-END
510
511# LLVM-MCA-BEGIN G40
# Single-lane LD4 on halfword and word lanes, post-index by immediate and by register x28; each add reads the written-back base x27.
512ld4  { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
513add x0, x27, 1
514ld4  { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
515add x0, x27, 1
516ld4  { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
517add x0, x27, 1
518ld4  { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
519add x0, x27, 1
520ld4  { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
521add x0, x27, 1
522# LLVM-MCA-END
523
524# LLVM-MCA-BEGIN G41
# Single-lane LD4 on a doubleword lane (immediate, register), then LD4R post-index by immediate; each add reads the written-back base x27.
525ld4  { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
526add x0, x27, 1
527ld4  { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
528add x0, x27, 1
529ld4r  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
530add x0, x27, 1
531ld4r  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
532add x0, x27, 1
533ld4r  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
534add x0, x27, 1
535# LLVM-MCA-END
536
537# LLVM-MCA-BEGIN G42
# LD4R, post-index by immediate; each add reads the written-back base x27.
538ld4r  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
539add x0, x27, 1
540ld4r  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
541add x0, x27, 1
542ld4r  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
543add x0, x27, 1
544ld4r  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
545add x0, x27, 1
546ld4r  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
547add x0, x27, 1
548# LLVM-MCA-END
549
550# LLVM-MCA-BEGIN G43
# LD4R, post-index by register x28; each add reads the written-back base x27.
551ld4r  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
552add x0, x27, 1
553ld4r  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
554add x0, x27, 1
555ld4r  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
556add x0, x27, 1
557ld4r  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
558add x0, x27, 1
559ld4r  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
560add x0, x27, 1
561# LLVM-MCA-END
562
563# LLVM-MCA-BEGIN G44
# LD4R post-index by register, then LDP of s and d register pairs, post-index; each add reads the written-back base x27.
564ld4r  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
565add x0, x27, 1
566ld4r  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
567add x0, x27, 1
568ld4r  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
569add x0, x27, 1
570ldp  s1, s2, [x27], #248
571add x0, x27, 1
572ldp  d1, d2, [x27], #496
573add x0, x27, 1
574# LLVM-MCA-END
575
576# LLVM-MCA-BEGIN G45
# LDP: q pair post-index, s/d/q pairs pre-index, then w pair post-index; each add reads the written-back base x27.
577ldp  q1, q2, [x27], #992
578add x0, x27, 1
579ldp  s1, s2, [x27, #248]!
580add x0, x27, 1
581ldp  d1, d2, [x27, #496]!
582add x0, x27, 1
583ldp  q1, q2, [x27, #992]!
584add x0, x27, 1
585ldp  w1, w2, [x27], #248
586add x0, x27, 1
587# LLVM-MCA-END
588
589# LLVM-MCA-BEGIN G46
# LDP x pair post-index, LDP w/x pairs pre-index, then LDPSW post- and pre-index; each add reads the written-back base x27.
590ldp  x1, x2, [x27], #496
591add x0, x27, 1
592ldp  w1, w2, [x27, #248]!
593add x0, x27, 1
594ldp  x1, x2, [x27, #496]!
595add x0, x27, 1
596ldpsw  x1, x2, [x27], #248
597add x0, x27, 1
598ldpsw  x1, x2, [x27, #248]!
599add x0, x27, 1
600# LLVM-MCA-END
601
602# LLVM-MCA-BEGIN G47
# LDR into b/h/s/d/q registers, post-index; each add reads the written-back base x27.
603ldr  b1, [x27], #254
604add x0, x27, 1
605ldr  h1, [x27], #254
606add x0, x27, 1
607ldr  s1, [x27], #254
608add x0, x27, 1
609ldr  d1, [x27], #254
610add x0, x27, 1
611ldr  q1, [x27], #254
612add x0, x27, 1
613# LLVM-MCA-END
614
615# LLVM-MCA-BEGIN G48
# LDR into b/h/s/d/q registers, pre-index; each add reads the written-back base x27.
616ldr  b1, [x27, #254]!
617add x0, x27, 1
618ldr  h1, [x27, #254]!
619add x0, x27, 1
620ldr  s1, [x27, #254]!
621add x0, x27, 1
622ldr  d1, [x27, #254]!
623add x0, x27, 1
624ldr  q1, [x27, #254]!
625add x0, x27, 1
626# LLVM-MCA-END
627
628# LLVM-MCA-BEGIN G49
# LDR into w/x registers, post- and pre-index, then LDRB post-index; each add reads the written-back base x27.
629ldr  w1, [x27], #254
630add x0, x27, 1
631ldr  x1, [x27], #254
632add x0, x27, 1
633ldr  w1, [x27, #254]!
634add x0, x27, 1
635ldr  x1, [x27, #254]!
636add x0, x27, 1
637ldrb  w1, [x27], #254
638add x0, x27, 1
639# LLVM-MCA-END
640
641# LLVM-MCA-BEGIN G50
# LDRB pre-index, LDRH post- and pre-index, then LDRSB (w and x destinations) post-index; each add reads the written-back base x27.
642ldrb  w1, [x27, #254]!
643add x0, x27, 1
644ldrh  w1, [x27], #254
645add x0, x27, 1
646ldrh  w1, [x27, #254]!
647add x0, x27, 1
648ldrsb  w1, [x27], #254
649add x0, x27, 1
650ldrsb  x1, [x27], #254
651add x0, x27, 1
652# LLVM-MCA-END
653
654# LLVM-MCA-BEGIN G51
# LDRSB pre-index (w and x destinations), LDRSH post-index (w and x), then LDRSH w pre-index; each add reads the written-back base x27.
655ldrsb  w1, [x27, #254]!
656add x0, x27, 1
657ldrsb  x1, [x27, #254]!
658add x0, x27, 1
659ldrsh  w1, [x27], #254
660add x0, x27, 1
661ldrsh  x1, [x27], #254
662add x0, x27, 1
663ldrsh  w1, [x27, #254]!
664add x0, x27, 1
665# LLVM-MCA-END
666
667# LLVM-MCA-BEGIN G52
# LDRSH x pre-index, LDRSW post- and pre-index, then the first stores: ST1 (one register) post-index by immediate; each add reads the written-back base x27.
668ldrsh  x1, [x27, #254]!
669add x0, x27, 1
670ldrsw  x1, [x27], #254
671add x0, x27, 1
672ldrsw  x1, [x27, #254]!
673add x0, x27, 1
674st1  { v1.1d }, [x27], #8
675add x0, x27, 1
676st1  { v1.2d }, [x27], #16
677add x0, x27, 1
678# LLVM-MCA-END
679
680# LLVM-MCA-BEGIN G53
# ST1 (one register), post-index by immediate; each add reads the written-back base x27.
681st1  { v1.2s }, [x27], #8
682add x0, x27, 1
683st1  { v1.4h }, [x27], #8
684add x0, x27, 1
685st1  { v1.4s }, [x27], #16
686add x0, x27, 1
687st1  { v1.8b }, [x27], #8
688add x0, x27, 1
689st1  { v1.8h }, [x27], #16
690add x0, x27, 1
691# LLVM-MCA-END
692
693# LLVM-MCA-BEGIN G54
# ST1 (one register): one post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
694st1  { v1.16b }, [x27], #16
695add x0, x27, 1
696st1  { v1.1d }, [x27], x28
697add x0, x27, 1
698st1  { v1.2d }, [x27], x28
699add x0, x27, 1
700st1  { v1.2s }, [x27], x28
701add x0, x27, 1
702st1  { v1.4h }, [x27], x28
703add x0, x27, 1
704# LLVM-MCA-END
705
706# LLVM-MCA-BEGIN G55
# ST1 one register post-index by register, then ST1 two registers (.1d) post-index by immediate; each add reads the written-back base x27.
707st1  { v1.4s }, [x27], x28
708add x0, x27, 1
709st1  { v1.8b }, [x27], x28
710add x0, x27, 1
711st1  { v1.8h }, [x27], x28
712add x0, x27, 1
713st1  { v1.16b }, [x27], x28
714add x0, x27, 1
715st1  { v1.1d, v2.1d }, [x27], #16
716add x0, x27, 1
717# LLVM-MCA-END
718
719# LLVM-MCA-BEGIN G56
# ST1 (two registers), post-index by immediate; each add reads the written-back base x27.
720st1  { v1.2d, v2.2d }, [x27], #32
721add x0, x27, 1
722st1  { v1.2s, v2.2s }, [x27], #16
723add x0, x27, 1
724st1  { v1.4h, v2.4h }, [x27], #16
725add x0, x27, 1
726st1  { v1.4s, v2.4s }, [x27], #32
727add x0, x27, 1
728st1  { v1.8b, v2.8b }, [x27], #16
729add x0, x27, 1
730# LLVM-MCA-END
731
732# LLVM-MCA-BEGIN G57
# ST1 (two registers): post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
733st1  { v1.8h, v2.8h }, [x27], #32
734add x0, x27, 1
735st1  { v1.16b, v2.16b }, [x27], #32
736add x0, x27, 1
737st1  { v1.1d, v2.1d }, [x27], x28
738add x0, x27, 1
739st1  { v1.2d, v2.2d }, [x27], x28
740add x0, x27, 1
741st1  { v1.2s, v2.2s }, [x27], x28
742add x0, x27, 1
743# LLVM-MCA-END
744
745# LLVM-MCA-BEGIN G58
# ST1 (two registers), post-index by register x28; each add reads the written-back base x27.
746st1  { v1.4h, v2.4h }, [x27], x28
747add x0, x27, 1
748st1  { v1.4s, v2.4s }, [x27], x28
749add x0, x27, 1
750st1  { v1.8b, v2.8b }, [x27], x28
751add x0, x27, 1
752st1  { v1.8h, v2.8h }, [x27], x28
753add x0, x27, 1
754st1  { v1.16b, v2.16b }, [x27], x28
755add x0, x27, 1
756# LLVM-MCA-END
757
758# LLVM-MCA-BEGIN G59
# ST1 (three registers), post-index by immediate; each add reads the written-back base x27.
759st1  { v1.1d, v2.1d, v3.1d }, [x27], #24
760add x0, x27, 1
761st1  { v1.2d, v2.2d, v3.2d }, [x27], #48
762add x0, x27, 1
763st1  { v1.2s, v2.2s, v3.2s }, [x27], #24
764add x0, x27, 1
765st1  { v1.4h, v2.4h, v3.4h }, [x27], #24
766add x0, x27, 1
767st1  { v1.4s, v2.4s, v3.4s }, [x27], #48
768add x0, x27, 1
769# LLVM-MCA-END
770
771# LLVM-MCA-BEGIN G60
# ST1 (three registers): post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
772st1  { v1.8b, v2.8b, v3.8b }, [x27], #24
773add x0, x27, 1
774st1  { v1.8h, v2.8h, v3.8h }, [x27], #48
775add x0, x27, 1
776st1  { v1.16b, v2.16b, v3.16b }, [x27], #48
777add x0, x27, 1
778st1  { v1.1d, v2.1d, v3.1d }, [x27], x28
779add x0, x27, 1
780st1  { v1.2d, v2.2d, v3.2d }, [x27], x28
781add x0, x27, 1
782# LLVM-MCA-END
783
784# LLVM-MCA-BEGIN G61
# ST1 (three registers), post-index by register x28; each add reads the written-back base x27.
785st1  { v1.2s, v2.2s, v3.2s }, [x27], x28
786add x0, x27, 1
787st1  { v1.4h, v2.4h, v3.4h }, [x27], x28
788add x0, x27, 1
789st1  { v1.4s, v2.4s, v3.4s }, [x27], x28
790add x0, x27, 1
791st1  { v1.8b, v2.8b, v3.8b }, [x27], x28
792add x0, x27, 1
793st1  { v1.8h, v2.8h, v3.8h }, [x27], x28
794add x0, x27, 1
795# LLVM-MCA-END
796
797# LLVM-MCA-BEGIN G62
# ST1 three registers (.16b) post-index by register, then ST1 four registers post-index by immediate; each add reads the written-back base x27.
798st1  { v1.16b, v2.16b, v3.16b }, [x27], x28
799add x0, x27, 1
800st1  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
801add x0, x27, 1
802st1  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
803add x0, x27, 1
804st1  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
805add x0, x27, 1
806st1  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
807add x0, x27, 1
808# LLVM-MCA-END
809
810# LLVM-MCA-BEGIN G63
# ST1 (four registers): post-index by immediate, the last one by register x28; each add reads the written-back base x27.
811st1  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
812add x0, x27, 1
813st1  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
814add x0, x27, 1
815st1  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
816add x0, x27, 1
817st1  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
818add x0, x27, 1
819st1  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
820add x0, x27, 1
821# LLVM-MCA-END
822
823# LLVM-MCA-BEGIN G64
# ST1 (four registers), post-index by register x28; each add reads the written-back base x27.
824st1  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
825add x0, x27, 1
826st1  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
827add x0, x27, 1
828st1  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
829add x0, x27, 1
830st1  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
831add x0, x27, 1
832st1  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
833add x0, x27, 1
834# LLVM-MCA-END
835
836# LLVM-MCA-BEGIN G65
# ST1 four registers post-index by register, then single-lane ST1 on byte lanes (immediate, then register); each add reads the written-back base x27.
837st1  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
838add x0, x27, 1
839st1  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
840add x0, x27, 1
841st1  { v1.b }[0], [x27], #1
842add x0, x27, 1
843st1  { v1.b }[8], [x27], #1
844add x0, x27, 1
845st1  { v1.b }[0], [x27], x28
846add x0, x27, 1
847# LLVM-MCA-END
848
849# LLVM-MCA-BEGIN G66
# Single-lane ST1 on byte lane 8 (register post-index) and halfword lanes (immediate, then register); each add reads the written-back base x27.
850st1  { v1.b }[8], [x27], x28
851add x0, x27, 1
852st1  { v1.h }[0], [x27], #2
853add x0, x27, 1
854st1  { v1.h }[4], [x27], #2
855add x0, x27, 1
856st1  { v1.h }[0], [x27], x28
857add x0, x27, 1
858st1  { v1.h }[4], [x27], x28
859add x0, x27, 1
860# LLVM-MCA-END
861
862# LLVM-MCA-BEGIN G67
# Single-lane ST1 on word and doubleword lanes, then ST2 (multiple structures, .2d) post-index by immediate; each add reads the written-back base x27.
863st1  { v1.s }[0], [x27], #4
864add x0, x27, 1
865st1  { v1.s }[0], [x27], x28
866add x0, x27, 1
867st1  { v1.d }[0], [x27], #8
868add x0, x27, 1
869st1  { v1.d }[0], [x27], x28
870add x0, x27, 1
871st2  { v1.2d, v2.2d }, [x27], #32
872add x0, x27, 1
873# LLVM-MCA-END
874
875# LLVM-MCA-BEGIN G68
# ST2 (multiple structures), post-index by immediate; each add reads the written-back base x27.
876st2  { v1.2s, v2.2s }, [x27], #16
877add x0, x27, 1
878st2  { v1.4h, v2.4h }, [x27], #16
879add x0, x27, 1
880st2  { v1.4s, v2.4s }, [x27], #32
881add x0, x27, 1
882st2  { v1.8b, v2.8b }, [x27], #16
883add x0, x27, 1
884st2  { v1.8h, v2.8h }, [x27], #32
885add x0, x27, 1
886# LLVM-MCA-END
887
888# LLVM-MCA-BEGIN G69
# ST2 (multiple structures): one post-index by immediate, then post-index by register x28; each add reads the written-back base x27.
889st2  { v1.16b, v2.16b }, [x27], #32
890add x0, x27, 1
891st2  { v1.2d, v2.2d }, [x27], x28
892add x0, x27, 1
893st2  { v1.2s, v2.2s }, [x27], x28
894add x0, x27, 1
895st2  { v1.4h, v2.4h }, [x27], x28
896add x0, x27, 1
897st2  { v1.4s, v2.4s }, [x27], x28
898add x0, x27, 1
899# LLVM-MCA-END
900
901# LLVM-MCA-BEGIN G70
# ST2 (multiple structures) post-index by register, then single-lane ST2 on byte lanes post-index by immediate; each add reads the written-back base x27.
902st2  { v1.8b, v2.8b }, [x27], x28
903add x0, x27, 1
904st2  { v1.8h, v2.8h }, [x27], x28
905add x0, x27, 1
906st2  { v1.16b, v2.16b }, [x27], x28
907add x0, x27, 1
908st2  { v1.b, v2.b }[0], [x27], #2
909add x0, x27, 1
910st2  { v1.b, v2.b }[8], [x27], #2
911add x0, x27, 1
912# LLVM-MCA-END
913
914# LLVM-MCA-BEGIN G71
# Single-lane ST2 on byte lanes (register post-index) and halfword lanes (immediate, then register); each add reads the written-back base x27.
915st2  { v1.b, v2.b }[0], [x27], x28
916add x0, x27, 1
917st2  { v1.b, v2.b }[8], [x27], x28
918add x0, x27, 1
919st2  { v1.h, v2.h }[0], [x27], #4
920add x0, x27, 1
921st2  { v1.h, v2.h }[4], [x27], #4
922add x0, x27, 1
923st2  { v1.h, v2.h }[0], [x27], x28
924add x0, x27, 1
925# LLVM-MCA-END
926
927# LLVM-MCA-BEGIN G72
# Single-lane ST2 on halfword, word and doubleword lanes, post-index by register x28 and by immediate; each add reads the written-back base x27.
928st2  { v1.h, v2.h }[4], [x27], x28
929add x0, x27, 1
930st2  { v1.s, v2.s }[0], [x27], #8
931add x0, x27, 1
932st2  { v1.s, v2.s }[0], [x27], x28
933add x0, x27, 1
934st2  { v1.d, v2.d }[0], [x27], #16
935add x0, x27, 1
936st2  { v1.d, v2.d }[0], [x27], x28
937add x0, x27, 1
938# LLVM-MCA-END
939
940# LLVM-MCA-BEGIN G73
# ST3 (multiple structures), post-index by immediate; this region holds three store/add pairs. Each add reads the written-back base x27.
941st3  { v1.2d, v2.2d, v3.2d }, [x27], #48
942add x0, x27, 1
943st3  { v1.2s, v2.2s, v3.2s }, [x27], #24
944add x0, x27, 1
945st3  { v1.4h, v2.4h, v3.4h }, [x27], #24
946add x0, x27, 1
947# LLVM-MCA-END
948
949# LLVM-MCA-BEGIN G74
# ST3 (multiple structures): post-index by immediate, the last one by register x28; each add reads the written-back base x27.
950st3  { v1.4s, v2.4s, v3.4s }, [x27], #48
951add x0, x27, 1
952st3  { v1.8b, v2.8b, v3.8b }, [x27], #24
953add x0, x27, 1
954st3  { v1.8h, v2.8h, v3.8h }, [x27], #48
955add x0, x27, 1
956st3  { v1.16b, v2.16b, v3.16b }, [x27], #48
957add x0, x27, 1
958st3  { v1.2d, v2.2d, v3.2d }, [x27], x28
959add x0, x27, 1
960# LLVM-MCA-END
961
962# LLVM-MCA-BEGIN G75
# ST3 (multiple structures), post-index by register x28; each add reads the written-back base x27.
963st3  { v1.2s, v2.2s, v3.2s }, [x27], x28
964add x0, x27, 1
965st3  { v1.4h, v2.4h, v3.4h }, [x27], x28
966add x0, x27, 1
967st3  { v1.4s, v2.4s, v3.4s }, [x27], x28
968add x0, x27, 1
969st3  { v1.8b, v2.8b, v3.8b }, [x27], x28
970add x0, x27, 1
971st3  { v1.8h, v2.8h, v3.8h }, [x27], x28
972add x0, x27, 1
973# LLVM-MCA-END
974
975# LLVM-MCA-BEGIN G76
# ST3 (.16b) post-index by register, then single-lane ST3 on byte lanes by immediate and by register; each add reads the written-back base x27.
976st3  { v1.16b, v2.16b, v3.16b }, [x27], x28
977add x0, x27, 1
978st3  { v1.b, v2.b, v3.b }[0], [x27], #3
979add x0, x27, 1
980st3  { v1.b, v2.b, v3.b }[8], [x27], #3
981add x0, x27, 1
982st3  { v1.b, v2.b, v3.b }[0], [x27], x28
983add x0, x27, 1
984st3  { v1.b, v2.b, v3.b }[8], [x27], x28
985add x0, x27, 1
986# LLVM-MCA-END
987
988# LLVM-MCA-BEGIN G77
# Single-lane ST3 on halfword lanes (immediate and register post-index) and a word lane (immediate); each add reads the written-back base x27.
989st3  { v1.h, v2.h, v3.h }[0], [x27], #6
990add x0, x27, 1
991st3  { v1.h, v2.h, v3.h }[4], [x27], #6
992add x0, x27, 1
993st3  { v1.h, v2.h, v3.h }[0], [x27], x28
994add x0, x27, 1
995st3  { v1.h, v2.h, v3.h }[4], [x27], x28
996add x0, x27, 1
997st3  { v1.s, v2.s, v3.s }[0], [x27], #12
998add x0, x27, 1
999# LLVM-MCA-END
1000
1001# LLVM-MCA-BEGIN G78
# Single-lane ST3 on word and doubleword lanes, then ST4 (multiple structures) post-index by immediate; each add reads the written-back base x27.
1002st3  { v1.s, v2.s, v3.s }[0], [x27], x28
1003add x0, x27, 1
1004st3  { v1.d, v2.d, v3.d }[0], [x27], #24
1005add x0, x27, 1
1006st3  { v1.d, v2.d, v3.d }[0], [x27], x28
1007add x0, x27, 1
1008st4  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
1009add x0, x27, 1
1010st4  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
1011add x0, x27, 1
1012# LLVM-MCA-END
1013
1014# LLVM-MCA-BEGIN G79
# ST4 (multiple structures), post-index by immediate; each add reads the written-back base x27.
1015st4  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
1016add x0, x27, 1
1017st4  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
1018add x0, x27, 1
1019st4  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
1020add x0, x27, 1
1021st4  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
1022add x0, x27, 1
1023st4  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
1024add x0, x27, 1
1025# LLVM-MCA-END
1026
1027# LLVM-MCA-BEGIN G80
# ST4 (multiple structures), post-index by register x28; each add reads the written-back base x27.
1028st4  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
1029add x0, x27, 1
1030st4  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
1031add x0, x27, 1
1032st4  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
1033add x0, x27, 1
1034st4  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
1035add x0, x27, 1
1036st4  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
1037add x0, x27, 1
1038# LLVM-MCA-END
1039
1040# LLVM-MCA-BEGIN G81
# ST4 (multiple structures) post-index by register, then single-lane ST4 on byte lanes (immediate, then register); each add reads the written-back base x27.
1041st4  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
1042add x0, x27, 1
1043st4  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
1044add x0, x27, 1
1045st4  { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
1046add x0, x27, 1
1047st4  { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
1048add x0, x27, 1
1049st4  { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
1050add x0, x27, 1
1051# LLVM-MCA-END
1052
1053# LLVM-MCA-BEGIN G82
# Single-lane ST4 on byte lane 8 (register post-index) and halfword lanes (immediate, then register); each add reads the written-back base x27.
1054st4  { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
1055add x0, x27, 1
1056st4  { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
1057add x0, x27, 1
1058st4  { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
1059add x0, x27, 1
1060st4  { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
1061add x0, x27, 1
1062st4  { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
1063add x0, x27, 1
1064# LLVM-MCA-END
1065
1066# LLVM-MCA-BEGIN G83
# Single-lane ST4 on word and doubleword lanes, post-index by immediate and by register x28; this region holds four store/add pairs. Each add reads the written-back base x27.
1067st4  { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
1068add x0, x27, 1
1069st4  { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
1070add x0, x27, 1
1071st4  { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
1072add x0, x27, 1
1073st4  { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
1074add x0, x27, 1
1075# LLVM-MCA-END
1076
1077# LLVM-MCA-BEGIN G84
# STP of s and d register pairs, post-index; this region holds two store/add pairs. Each add reads the written-back base x27.
1078stp  s1, s2, [x27], #248
1079add x0, x27, 1
1080stp  d1, d2, [x27], #496
1081add x0, x27, 1
1082# LLVM-MCA-END
1083
1084# LLVM-MCA-BEGIN G85
# STP: q pair post-index, s/d/q pairs pre-index, then w pair post-index; each add reads the written-back base x27.
1085stp  q1, q2, [x27], #992
1086add x0, x27, 1
1087stp  s1, s2, [x27, #248]!
1088add x0, x27, 1
1089stp  d1, d2, [x27, #496]!
1090add x0, x27, 1
1091stp  q1, q2, [x27, #992]!
1092add x0, x27, 1
1093stp  w1, w2, [x27], #248
1094add x0, x27, 1
1095# LLVM-MCA-END
1096
1097# LLVM-MCA-BEGIN G86
# STP x pair post-index, STP w/x pairs pre-index, then STR of b and h registers post-index; each add reads the written-back base x27.
1098stp  x1, x2, [x27], #496
1099add x0, x27, 1
1100stp  w1, w2, [x27, #248]!
1101add x0, x27, 1
1102stp  x1, x2, [x27, #496]!
1103add x0, x27, 1
1104str  b1, [x27], #254
1105add x0, x27, 1
1106str  h1, [x27], #254
1107add x0, x27, 1
1108# LLVM-MCA-END
1109
1110# LLVM-MCA-BEGIN G87
# STR of s/d/q registers post-index, then STR of b/h registers pre-index; each add reads the written-back base x27.
1111str  s1, [x27], #254
1112add x0, x27, 1
1113str  d1, [x27], #254
1114add x0, x27, 1
1115str  q1, [x27], #254
1116add x0, x27, 1
1117str  b1, [x27, #254]!
1118add x0, x27, 1
1119str  h1, [x27, #254]!
1120add x0, x27, 1
1121# LLVM-MCA-END
1122
1123# LLVM-MCA-BEGIN G88
# STR of s/d/q registers pre-index, then STR of w/x registers post-index; each add reads the written-back base x27.
1124str  s1, [x27, #254]!
1125add x0, x27, 1
1126str  d1, [x27, #254]!
1127add x0, x27, 1
1128str  q1, [x27, #254]!
1129add x0, x27, 1
1130str  w1, [x27], #254
1131add x0, x27, 1
1132str  x1, [x27], #254
1133add x0, x27, 1
1134# LLVM-MCA-END
1135
1136# LLVM-MCA-BEGIN G89
# STR of w/x registers pre-index, STRB post- and pre-index, then STRH post-index; each add reads the written-back base x27.
1137str  w1, [x27, #254]!
1138add x0, x27, 1
1139str  x1, [x27, #254]!
1140add x0, x27, 1
1141strb  w1, [x27], #254
1142add x0, x27, 1
1143strb  w1, [x27, #254]!
1144add x0, x27, 1
1145strh  w1, [x27], #254
1146add x0, x27, 1
1147# LLVM-MCA-END
1148
1149# LLVM-MCA-BEGIN G90
# STRH pre-index; this region holds a single store/add pair. The add reads the written-back base x27.
1150strh  w1, [x27, #254]!
1151add x0, x27, 1
1152# LLVM-MCA-END
1153
1154# LLVM-MCA-BEGIN G91
# Chained loads: the first ldr (post-index on x27) loads x1, which is then the post-indexed base of the second ldr.
# Both adds read x27, so the second add does not consume the x1 written back by the second ldr.
# NOTE(review): presumably intentional, to exercise the loaded-value-to-address dependency; confirm before changing.
1155ldr  x1, [x27], #254
1156add x0, x27, 1
1157ldr  x2, [x1], #254
1158add x0, x27, 1
1159# LLVM-MCA-END
1160
1161# CHECK:      [0] Code Region - G01
1162
1163# CHECK:      Iterations:        100
1164# CHECK-NEXT: Instructions:      1000
1165# CHECK-NEXT: Total Cycles:      2201
1166# CHECK-NEXT: Total uOps:        1500
1167
1168# CHECK:      Dispatch Width:    2
1169# CHECK-NEXT: uOps Per Cycle:    0.68
1170# CHECK-NEXT: IPC:               0.45
1171# CHECK-NEXT: Block RThroughput: 7.5
1172
1173# CHECK:      Timeline view:
1174# CHECK-NEXT:                     0123456789
1175# CHECK-NEXT: Index     0123456789          012
1176
1177# CHECK:      [0,0]     DeeeE.    .    .    . .   ld1	{ v1.1d }, [x27], #8
1178# CHECK-NEXT: [0,1]     .DeeE.    .    .    . .   add	x0, x27, #1
1179# CHECK-NEXT: [0,2]     .   DeeeeE.    .    . .   ld1	{ v1.2d }, [x27], #16
1180# CHECK-NEXT: [0,3]     .    .DeeE.    .    . .   add	x0, x27, #1
1181# CHECK-NEXT: [0,4]     .    .   DeeeE .    . .   ld1	{ v1.2s }, [x27], #8
1182# CHECK-NEXT: [0,5]     .    .    DeeE .    . .   add	x0, x27, #1
1183# CHECK-NEXT: [0,6]     .    .    .  DeeeE  . .   ld1	{ v1.4h }, [x27], #8
1184# CHECK-NEXT: [0,7]     .    .    .   DeeE  . .   add	x0, x27, #1
1185# CHECK-NEXT: [0,8]     .    .    .    . DeeeeE   ld1	{ v1.4s }, [x27], #16
1186# CHECK-NEXT: [0,9]     .    .    .    .   DeeE   add	x0, x27, #1
1187
1188# CHECK:      Average Wait times (based on the timeline view):
1189# CHECK-NEXT: [0]: Executions
1190# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1191# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1192# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1193
1194# CHECK:            [0]    [1]    [2]    [3]
1195# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.1d }, [x27], #8
1196# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1197# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.2d }, [x27], #16
1198# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1199# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.2s }, [x27], #8
1200# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1201# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.4h }, [x27], #8
1202# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1203# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.4s }, [x27], #16
1204# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1205# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1206
1207# CHECK:      [1] Code Region - G02
1208
1209# CHECK:      Iterations:        100
1210# CHECK-NEXT: Instructions:      1000
1211# CHECK-NEXT: Total Cycles:      2301
1212# CHECK-NEXT: Total uOps:        1500
1213
1214# CHECK:      Dispatch Width:    2
1215# CHECK-NEXT: uOps Per Cycle:    0.65
1216# CHECK-NEXT: IPC:               0.43
1217# CHECK-NEXT: Block RThroughput: 8.0
1218
1219# CHECK:      Timeline view:
1220# CHECK-NEXT:                     0123456789
1221# CHECK-NEXT: Index     0123456789          0123
1222
1223# CHECK:      [0,0]     DeeeE.    .    .    .  .   ld1	{ v1.8b }, [x27], #8
1224# CHECK-NEXT: [0,1]     .DeeE.    .    .    .  .   add	x0, x27, #1
1225# CHECK-NEXT: [0,2]     .   DeeeeE.    .    .  .   ld1	{ v1.8h }, [x27], #16
1226# CHECK-NEXT: [0,3]     .    .DeeE.    .    .  .   add	x0, x27, #1
1227# CHECK-NEXT: [0,4]     .    .   DeeeeE.    .  .   ld1	{ v1.16b }, [x27], #16
1228# CHECK-NEXT: [0,5]     .    .    .DeeE.    .  .   add	x0, x27, #1
1229# CHECK-NEXT: [0,6]     .    .    .   DeeeE .  .   ld1	{ v1.1d }, [x27], x28
1230# CHECK-NEXT: [0,7]     .    .    .    DeeE .  .   add	x0, x27, #1
1231# CHECK-NEXT: [0,8]     .    .    .    .  DeeeeE   ld1	{ v1.2d }, [x27], x28
1232# CHECK-NEXT: [0,9]     .    .    .    .    DeeE   add	x0, x27, #1
1233
1234# CHECK:      Average Wait times (based on the timeline view):
1235# CHECK-NEXT: [0]: Executions
1236# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1237# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1238# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1239
1240# CHECK:            [0]    [1]    [2]    [3]
1241# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.8b }, [x27], #8
1242# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1243# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.8h }, [x27], #16
1244# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1245# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.16b }, [x27], #16
1246# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1247# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.1d }, [x27], x28
1248# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1249# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.2d }, [x27], x28
1250# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1251# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1252
1253# CHECK:      [2] Code Region - G03
1254
1255# CHECK:      Iterations:        100
1256# CHECK-NEXT: Instructions:      1000
1257# CHECK-NEXT: Total Cycles:      2201
1258# CHECK-NEXT: Total uOps:        1500
1259
1260# CHECK:      Dispatch Width:    2
1261# CHECK-NEXT: uOps Per Cycle:    0.68
1262# CHECK-NEXT: IPC:               0.45
1263# CHECK-NEXT: Block RThroughput: 7.5
1264
1265# CHECK:      Timeline view:
1266# CHECK-NEXT:                     0123456789
1267# CHECK-NEXT: Index     0123456789          012
1268
1269# CHECK:      [0,0]     DeeeE.    .    .    . .   ld1	{ v1.2s }, [x27], x28
1270# CHECK-NEXT: [0,1]     .DeeE.    .    .    . .   add	x0, x27, #1
1271# CHECK-NEXT: [0,2]     .   DeeeE .    .    . .   ld1	{ v1.4h }, [x27], x28
1272# CHECK-NEXT: [0,3]     .    DeeE .    .    . .   add	x0, x27, #1
1273# CHECK-NEXT: [0,4]     .    .  DeeeeE .    . .   ld1	{ v1.4s }, [x27], x28
1274# CHECK-NEXT: [0,5]     .    .    DeeE .    . .   add	x0, x27, #1
1275# CHECK-NEXT: [0,6]     .    .    .  DeeeE  . .   ld1	{ v1.8b }, [x27], x28
1276# CHECK-NEXT: [0,7]     .    .    .   DeeE  . .   add	x0, x27, #1
1277# CHECK-NEXT: [0,8]     .    .    .    . DeeeeE   ld1	{ v1.8h }, [x27], x28
1278# CHECK-NEXT: [0,9]     .    .    .    .   DeeE   add	x0, x27, #1
1279
1280# CHECK:      Average Wait times (based on the timeline view):
1281# CHECK-NEXT: [0]: Executions
1282# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1283# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1284# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1285
1286# CHECK:            [0]    [1]    [2]    [3]
1287# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.2s }, [x27], x28
1288# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1289# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.4h }, [x27], x28
1290# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1291# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.4s }, [x27], x28
1292# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1293# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.8b }, [x27], x28
1294# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1295# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.8h }, [x27], x28
1296# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1297# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1298
1299# CHECK:      [3] Code Region - G04
1300
1301# CHECK:      Iterations:        100
1302# CHECK-NEXT: Instructions:      1000
1303# CHECK-NEXT: Total Cycles:      2701
1304# CHECK-NEXT: Total uOps:        1500
1305
1306# CHECK:      Dispatch Width:    2
1307# CHECK-NEXT: uOps Per Cycle:    0.56
1308# CHECK-NEXT: IPC:               0.37
1309# CHECK-NEXT: Block RThroughput: 12.0
1310
1311# CHECK:      Timeline view:
1312# CHECK-NEXT:                     0123456789
1313# CHECK-NEXT: Index     0123456789          01234567
1314
1315# CHECK:      [0,0]     DeeeeE    .    .    .    . .   ld1	{ v1.16b }, [x27], x28
1316# CHECK-NEXT: [0,1]     . DeeE    .    .    .    . .   add	x0, x27, #1
1317# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    . .   ld1	{ v1.1d, v2.1d }, [x27], #16
1318# CHECK-NEXT: [0,3]     .    . DeeE    .    .    . .   add	x0, x27, #1
1319# CHECK-NEXT: [0,4]     .    .    DeeeeeeE  .    . .   ld1	{ v1.2d, v2.2d }, [x27], #32
1320# CHECK-NEXT: [0,5]     .    .    .   DeeE  .    . .   add	x0, x27, #1
1321# CHECK-NEXT: [0,6]     .    .    .    . DeeeeE  . .   ld1	{ v1.2s, v2.2s }, [x27], #16
1322# CHECK-NEXT: [0,7]     .    .    .    .   DeeE  . .   add	x0, x27, #1
1323# CHECK-NEXT: [0,8]     .    .    .    .    . DeeeeE   ld1	{ v1.4h, v2.4h }, [x27], #16
1324# CHECK-NEXT: [0,9]     .    .    .    .    .   DeeE   add	x0, x27, #1
1325
1326# CHECK:      Average Wait times (based on the timeline view):
1327# CHECK-NEXT: [0]: Executions
1328# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1329# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1330# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1331
1332# CHECK:            [0]    [1]    [2]    [3]
1333# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.16b }, [x27], x28
1334# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1335# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.1d, v2.1d }, [x27], #16
1336# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1337# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.2d, v2.2d }, [x27], #32
1338# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1339# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.2s, v2.2s }, [x27], #16
1340# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1341# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.4h, v2.4h }, [x27], #16
1342# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1343# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1344
1345# CHECK:      [4] Code Region - G05
1346
1347# CHECK:      Iterations:        100
1348# CHECK-NEXT: Instructions:      1000
1349# CHECK-NEXT: Total Cycles:      3101
1350# CHECK-NEXT: Total uOps:        1500
1351
1352# CHECK:      Dispatch Width:    2
1353# CHECK-NEXT: uOps Per Cycle:    0.48
1354# CHECK-NEXT: IPC:               0.32
1355# CHECK-NEXT: Block RThroughput: 16.0
1356
1357# CHECK:      Timeline view:
1358# CHECK-NEXT:                     0123456789          01
1359# CHECK-NEXT: Index     0123456789          0123456789
1360
1361# CHECK:      [0,0]     DeeeeeeE  .    .    .    .    ..   ld1	{ v1.4s, v2.4s }, [x27], #32
1362# CHECK-NEXT: [0,1]     .   DeeE  .    .    .    .    ..   add	x0, x27, #1
1363# CHECK-NEXT: [0,2]     .    . DeeeeE  .    .    .    ..   ld1	{ v1.8b, v2.8b }, [x27], #16
1364# CHECK-NEXT: [0,3]     .    .   DeeE  .    .    .    ..   add	x0, x27, #1
1365# CHECK-NEXT: [0,4]     .    .    . DeeeeeeE.    .    ..   ld1	{ v1.8h, v2.8h }, [x27], #32
1366# CHECK-NEXT: [0,5]     .    .    .    .DeeE.    .    ..   add	x0, x27, #1
1367# CHECK-NEXT: [0,6]     .    .    .    .   DeeeeeeE   ..   ld1	{ v1.16b, v2.16b }, [x27], #32
1368# CHECK-NEXT: [0,7]     .    .    .    .    .  DeeE   ..   add	x0, x27, #1
1369# CHECK-NEXT: [0,8]     .    .    .    .    .    .DeeeeE   ld1	{ v1.1d, v2.1d }, [x27], x28
1370# CHECK-NEXT: [0,9]     .    .    .    .    .    .  DeeE   add	x0, x27, #1
1371
1372# CHECK:      Average Wait times (based on the timeline view):
1373# CHECK-NEXT: [0]: Executions
1374# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1375# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1376# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1377
1378# CHECK:            [0]    [1]    [2]    [3]
1379# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.4s, v2.4s }, [x27], #32
1380# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1381# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.8b, v2.8b }, [x27], #16
1382# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1383# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.8h, v2.8h }, [x27], #32
1384# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1385# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.16b, v2.16b }, [x27], #32
1386# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1387# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.1d, v2.1d }, [x27], x28
1388# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1389# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1390
1391# CHECK:      [5] Code Region - G06
1392
1393# CHECK:      Iterations:        100
1394# CHECK-NEXT: Instructions:      1000
1395# CHECK-NEXT: Total Cycles:      2901
1396# CHECK-NEXT: Total uOps:        1500
1397
1398# CHECK:      Dispatch Width:    2
1399# CHECK-NEXT: uOps Per Cycle:    0.52
1400# CHECK-NEXT: IPC:               0.34
1401# CHECK-NEXT: Block RThroughput: 14.0
1402
1403# CHECK:      Timeline view:
1404# CHECK-NEXT:                     0123456789
1405# CHECK-NEXT: Index     0123456789          0123456789
1406
1407# CHECK:      [0,0]     DeeeeeeE  .    .    .    .   .   ld1	{ v1.2d, v2.2d }, [x27], x28
1408# CHECK-NEXT: [0,1]     .   DeeE  .    .    .    .   .   add	x0, x27, #1
1409# CHECK-NEXT: [0,2]     .    . DeeeeE  .    .    .   .   ld1	{ v1.2s, v2.2s }, [x27], x28
1410# CHECK-NEXT: [0,3]     .    .   DeeE  .    .    .   .   add	x0, x27, #1
1411# CHECK-NEXT: [0,4]     .    .    . DeeeeE  .    .   .   ld1	{ v1.4h, v2.4h }, [x27], x28
1412# CHECK-NEXT: [0,5]     .    .    .   DeeE  .    .   .   add	x0, x27, #1
1413# CHECK-NEXT: [0,6]     .    .    .    . DeeeeeeE.   .   ld1	{ v1.4s, v2.4s }, [x27], x28
1414# CHECK-NEXT: [0,7]     .    .    .    .    .DeeE.   .   add	x0, x27, #1
1415# CHECK-NEXT: [0,8]     .    .    .    .    .   DeeeeE   ld1	{ v1.8b, v2.8b }, [x27], x28
1416# CHECK-NEXT: [0,9]     .    .    .    .    .    .DeeE   add	x0, x27, #1
1417
1418# CHECK:      Average Wait times (based on the timeline view):
1419# CHECK-NEXT: [0]: Executions
1420# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1421# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1422# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1423
1424# CHECK:            [0]    [1]    [2]    [3]
1425# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.2d, v2.2d }, [x27], x28
1426# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1427# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.2s, v2.2s }, [x27], x28
1428# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1429# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.4h, v2.4h }, [x27], x28
1430# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1431# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.4s, v2.4s }, [x27], x28
1432# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1433# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.8b, v2.8b }, [x27], x28
1434# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1435# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1436
1437# CHECK:      [6] Code Region - G07
1438
1439# CHECK:      Iterations:        100
1440# CHECK-NEXT: Instructions:      1000
1441# CHECK-NEXT: Total Cycles:      3501
1442# CHECK-NEXT: Total uOps:        1500
1443
1444# CHECK:      Dispatch Width:    2
1445# CHECK-NEXT: uOps Per Cycle:    0.43
1446# CHECK-NEXT: IPC:               0.29
1447# CHECK-NEXT: Block RThroughput: 20.0
1448
1449# CHECK:      Timeline view:
1450# CHECK-NEXT:                     0123456789          012345
1451# CHECK-NEXT: Index     0123456789          0123456789
1452
1453# CHECK:      [0,0]     DeeeeeeE  .    .    .    .    .    .   ld1	{ v1.8h, v2.8h }, [x27], x28
1454# CHECK-NEXT: [0,1]     .   DeeE  .    .    .    .    .    .   add	x0, x27, #1
1455# CHECK-NEXT: [0,2]     .    . DeeeeeeE.    .    .    .    .   ld1	{ v1.16b, v2.16b }, [x27], x28
1456# CHECK-NEXT: [0,3]     .    .    .DeeE.    .    .    .    .   add	x0, x27, #1
1457# CHECK-NEXT: [0,4]     .    .    .   DeeeeeE    .    .    .   ld1	{ v1.1d, v2.1d, v3.1d }, [x27], #24
1458# CHECK-NEXT: [0,5]     .    .    .    . DeeE    .    .    .   add	x0, x27, #1
1459# CHECK-NEXT: [0,6]     .    .    .    .    DeeeeeeeeE.    .   ld1	{ v1.2d, v2.2d, v3.2d }, [x27], #48
1460# CHECK-NEXT: [0,7]     .    .    .    .    .    .DeeE.    .   add	x0, x27, #1
1461# CHECK-NEXT: [0,8]     .    .    .    .    .    .   DeeeeeE   ld1	{ v1.2s, v2.2s, v3.2s }, [x27], #24
1462# CHECK-NEXT: [0,9]     .    .    .    .    .    .    . DeeE   add	x0, x27, #1
1463
1464# CHECK:      Average Wait times (based on the timeline view):
1465# CHECK-NEXT: [0]: Executions
1466# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1467# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1468# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1469
1470# CHECK:            [0]    [1]    [2]    [3]
1471# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.8h, v2.8h }, [x27], x28
1472# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1473# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.16b, v2.16b }, [x27], x28
1474# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1475# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.1d, v2.1d, v3.1d }, [x27], #24
1476# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1477# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.2d, v2.2d, v3.2d }, [x27], #48
1478# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1479# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.2s, v2.2s, v3.2s }, [x27], #24
1480# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1481# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1482
1483# CHECK:      [7] Code Region - G08
1484
1485# CHECK:      Iterations:        100
1486# CHECK-NEXT: Instructions:      1000
1487# CHECK-NEXT: Total Cycles:      3901
1488# CHECK-NEXT: Total uOps:        1500
1489
1490# CHECK:      Dispatch Width:    2
1491# CHECK-NEXT: uOps Per Cycle:    0.38
1492# CHECK-NEXT: IPC:               0.26
1493# CHECK-NEXT: Block RThroughput: 24.0
1494
1495# CHECK:      Timeline view:
1496# CHECK-NEXT:                     0123456789          0123456789
1497# CHECK-NEXT: Index     0123456789          0123456789
1498
1499# CHECK:      [0,0]     DeeeeeE   .    .    .    .    .    .   .   ld1	{ v1.4h, v2.4h, v3.4h }, [x27], #24
1500# CHECK-NEXT: [0,1]     .  DeeE   .    .    .    .    .    .   .   add	x0, x27, #1
1501# CHECK-NEXT: [0,2]     .    .DeeeeeeeeE    .    .    .    .   .   ld1	{ v1.4s, v2.4s, v3.4s }, [x27], #48
1502# CHECK-NEXT: [0,3]     .    .    . DeeE    .    .    .    .   .   add	x0, x27, #1
1503# CHECK-NEXT: [0,4]     .    .    .    DeeeeeE   .    .    .   .   ld1	{ v1.8b, v2.8b, v3.8b }, [x27], #24
1504# CHECK-NEXT: [0,5]     .    .    .    .  DeeE   .    .    .   .   add	x0, x27, #1
1505# CHECK-NEXT: [0,6]     .    .    .    .    .DeeeeeeeeE    .   .   ld1	{ v1.8h, v2.8h, v3.8h }, [x27], #48
1506# CHECK-NEXT: [0,7]     .    .    .    .    .    . DeeE    .   .   add	x0, x27, #1
1507# CHECK-NEXT: [0,8]     .    .    .    .    .    .    DeeeeeeeeE   ld1	{ v1.16b, v2.16b, v3.16b }, [x27], #48
1508# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .DeeE   add	x0, x27, #1
1509
1510# CHECK:      Average Wait times (based on the timeline view):
1511# CHECK-NEXT: [0]: Executions
1512# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1513# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1514# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1515
1516# CHECK:            [0]    [1]    [2]    [3]
1517# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.4h, v2.4h, v3.4h }, [x27], #24
1518# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1519# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.4s, v2.4s, v3.4s }, [x27], #48
1520# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1521# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.8b, v2.8b, v3.8b }, [x27], #24
1522# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1523# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.8h, v2.8h, v3.8h }, [x27], #48
1524# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1525# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.16b, v2.16b, v3.16b }, [x27], #48
1526# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1527# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1528
1529# CHECK:      [8] Code Region - G09
1530
1531# CHECK:      Iterations:        100
1532# CHECK-NEXT: Instructions:      1000
1533# CHECK-NEXT: Total Cycles:      3601
1534# CHECK-NEXT: Total uOps:        1500
1535
1536# CHECK:      Dispatch Width:    2
1537# CHECK-NEXT: uOps Per Cycle:    0.42
1538# CHECK-NEXT: IPC:               0.28
1539# CHECK-NEXT: Block RThroughput: 21.0
1540
1541# CHECK:      Timeline view:
1542# CHECK-NEXT:                     0123456789          0123456
1543# CHECK-NEXT: Index     0123456789          0123456789
1544
1545# CHECK:      [0,0]     DeeeeeE   .    .    .    .    .    ..   ld1	{ v1.1d, v2.1d, v3.1d }, [x27], x28
1546# CHECK-NEXT: [0,1]     .  DeeE   .    .    .    .    .    ..   add	x0, x27, #1
1547# CHECK-NEXT: [0,2]     .    .DeeeeeeeeE    .    .    .    ..   ld1	{ v1.2d, v2.2d, v3.2d }, [x27], x28
1548# CHECK-NEXT: [0,3]     .    .    . DeeE    .    .    .    ..   add	x0, x27, #1
1549# CHECK-NEXT: [0,4]     .    .    .    DeeeeeE   .    .    ..   ld1	{ v1.2s, v2.2s, v3.2s }, [x27], x28
1550# CHECK-NEXT: [0,5]     .    .    .    .  DeeE   .    .    ..   add	x0, x27, #1
1551# CHECK-NEXT: [0,6]     .    .    .    .    .DeeeeeE  .    ..   ld1	{ v1.4h, v2.4h, v3.4h }, [x27], x28
1552# CHECK-NEXT: [0,7]     .    .    .    .    .   DeeE  .    ..   add	x0, x27, #1
1553# CHECK-NEXT: [0,8]     .    .    .    .    .    . DeeeeeeeeE   ld1	{ v1.4s, v2.4s, v3.4s }, [x27], x28
1554# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .  DeeE   add	x0, x27, #1
1555
1556# CHECK:      Average Wait times (based on the timeline view):
1557# CHECK-NEXT: [0]: Executions
1558# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1559# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1560# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1561
1562# CHECK:            [0]    [1]    [2]    [3]
1563# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.1d, v2.1d, v3.1d }, [x27], x28
1564# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1565# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.2d, v2.2d, v3.2d }, [x27], x28
1566# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1567# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.2s, v2.2s, v3.2s }, [x27], x28
1568# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1569# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.4h, v2.4h, v3.4h }, [x27], x28
1570# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1571# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.4s, v2.4s, v3.4s }, [x27], x28
1572# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1573# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1574
1575# CHECK:      [9] Code Region - G10
1576
1577# CHECK:      Iterations:        100
1578# CHECK-NEXT: Instructions:      1000
1579# CHECK-NEXT: Total Cycles:      4201
1580# CHECK-NEXT: Total uOps:        1500
1581
1582# CHECK:      Dispatch Width:    2
1583# CHECK-NEXT: uOps Per Cycle:    0.36
1584# CHECK-NEXT: IPC:               0.24
1585# CHECK-NEXT: Block RThroughput: 27.0
1586
1587# CHECK:      Timeline view:
1588# CHECK-NEXT:                     0123456789          0123456789
1589# CHECK-NEXT: Index     0123456789          0123456789          012
1590
1591# CHECK:      [0,0]     DeeeeeE   .    .    .    .    .    .    . .   ld1	{ v1.8b, v2.8b, v3.8b }, [x27], x28
1592# CHECK-NEXT: [0,1]     .  DeeE   .    .    .    .    .    .    . .   add	x0, x27, #1
1593# CHECK-NEXT: [0,2]     .    .DeeeeeeeeE    .    .    .    .    . .   ld1	{ v1.8h, v2.8h, v3.8h }, [x27], x28
1594# CHECK-NEXT: [0,3]     .    .    . DeeE    .    .    .    .    . .   add	x0, x27, #1
1595# CHECK-NEXT: [0,4]     .    .    .    DeeeeeeeeE.    .    .    . .   ld1	{ v1.16b, v2.16b, v3.16b }, [x27], x28
1596# CHECK-NEXT: [0,5]     .    .    .    .    .DeeE.    .    .    . .   add	x0, x27, #1
1597# CHECK-NEXT: [0,6]     .    .    .    .    .   DeeeeeeE   .    . .   ld1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
1598# CHECK-NEXT: [0,7]     .    .    .    .    .    .  DeeE   .    . .   add	x0, x27, #1
1599# CHECK-NEXT: [0,8]     .    .    .    .    .    .    .DeeeeeeeeeeE   ld1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
1600# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .   DeeE   add	x0, x27, #1
1601
1602# CHECK:      Average Wait times (based on the timeline view):
1603# CHECK-NEXT: [0]: Executions
1604# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1605# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1606# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1607
1608# CHECK:            [0]    [1]    [2]    [3]
1609# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.8b, v2.8b, v3.8b }, [x27], x28
1610# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1611# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.8h, v2.8h, v3.8h }, [x27], x28
1612# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1613# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.16b, v2.16b, v3.16b }, [x27], x28
1614# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1615# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
1616# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1617# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
1618# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1619# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1620
1621# CHECK:      [10] Code Region - G11
1622
1623# CHECK:      Iterations:        100
1624# CHECK-NEXT: Instructions:      1000
1625# CHECK-NEXT: Total Cycles:      4301
1626# CHECK-NEXT: Total uOps:        1500
1627
1628# CHECK:      Dispatch Width:    2
1629# CHECK-NEXT: uOps Per Cycle:    0.35
1630# CHECK-NEXT: IPC:               0.23
1631# CHECK-NEXT: Block RThroughput: 28.0
1632
1633# CHECK:      Timeline view:
1634# CHECK-NEXT:                     0123456789          0123456789
1635# CHECK-NEXT: Index     0123456789          0123456789          0123
1636
1637# CHECK:      [0,0]     DeeeeeeE  .    .    .    .    .    .    .  .   ld1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
1638# CHECK-NEXT: [0,1]     .   DeeE  .    .    .    .    .    .    .  .   add	x0, x27, #1
1639# CHECK-NEXT: [0,2]     .    . DeeeeeeE.    .    .    .    .    .  .   ld1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
1640# CHECK-NEXT: [0,3]     .    .    .DeeE.    .    .    .    .    .  .   add	x0, x27, #1
1641# CHECK-NEXT: [0,4]     .    .    .   DeeeeeeeeeeE    .    .    .  .   ld1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
1642# CHECK-NEXT: [0,5]     .    .    .    .    . DeeE    .    .    .  .   add	x0, x27, #1
1643# CHECK-NEXT: [0,6]     .    .    .    .    .    DeeeeeeE  .    .  .   ld1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
1644# CHECK-NEXT: [0,7]     .    .    .    .    .    .   DeeE  .    .  .   add	x0, x27, #1
1645# CHECK-NEXT: [0,8]     .    .    .    .    .    .    . DeeeeeeeeeeE   ld1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
1646# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .    DeeE   add	x0, x27, #1
1647
1648# CHECK:      Average Wait times (based on the timeline view):
1649# CHECK-NEXT: [0]: Executions
1650# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1651# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1652# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1653
1654# CHECK:            [0]    [1]    [2]    [3]
1655# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
1656# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1657# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
1658# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1659# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
1660# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1661# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
1662# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1663# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
1664# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1665# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1666
1667# CHECK:      [11] Code Region - G12
1668
1669# CHECK:      Iterations:        100
1670# CHECK-NEXT: Instructions:      1000
1671# CHECK-NEXT: Total Cycles:      4301
1672# CHECK-NEXT: Total uOps:        1500
1673
1674# CHECK:      Dispatch Width:    2
1675# CHECK-NEXT: uOps Per Cycle:    0.35
1676# CHECK-NEXT: IPC:               0.23
1677# CHECK-NEXT: Block RThroughput: 28.0
1678
1679# CHECK:      Timeline view:
1680# CHECK-NEXT:                     0123456789          0123456789
1681# CHECK-NEXT: Index     0123456789          0123456789          0123
1682
1683# CHECK:      [0,0]     DeeeeeeeeeeE   .    .    .    .    .    .  .   ld1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
1684# CHECK-NEXT: [0,1]     .    .  DeeE   .    .    .    .    .    .  .   add	x0, x27, #1
1685# CHECK-NEXT: [0,2]     .    .    .DeeeeeeE .    .    .    .    .  .   ld1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
1686# CHECK-NEXT: [0,3]     .    .    .    DeeE .    .    .    .    .  .   add	x0, x27, #1
1687# CHECK-NEXT: [0,4]     .    .    .    .  DeeeeeeeeeeE.    .    .  .   ld1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
1688# CHECK-NEXT: [0,5]     .    .    .    .    .    .DeeE.    .    .  .   add	x0, x27, #1
1689# CHECK-NEXT: [0,6]     .    .    .    .    .    .   DeeeeeeE   .  .   ld1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
1690# CHECK-NEXT: [0,7]     .    .    .    .    .    .    .  DeeE   .  .   add	x0, x27, #1
1691# CHECK-NEXT: [0,8]     .    .    .    .    .    .    .    .DeeeeeeE   ld1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
1692# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .    DeeE   add	x0, x27, #1
1693
1694# CHECK:      Average Wait times (based on the timeline view):
1695# CHECK-NEXT: [0]: Executions
1696# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1697# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1698# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1699
1700# CHECK:            [0]    [1]    [2]    [3]
1701# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
1702# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1703# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
1704# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1705# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
1706# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1707# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
1708# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1709# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
1710# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1711# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1712
1713# CHECK:      [12] Code Region - G13
1714
1715# CHECK:      Iterations:        100
1716# CHECK-NEXT: Instructions:      1000
1717# CHECK-NEXT: Total Cycles:      4401
1718# CHECK-NEXT: Total uOps:        1500
1719
1720# CHECK:      Dispatch Width:    2
1721# CHECK-NEXT: uOps Per Cycle:    0.34
1722# CHECK-NEXT: IPC:               0.23
1723# CHECK-NEXT: Block RThroughput: 29.0
1724
1725# CHECK:      Timeline view:
1726# CHECK-NEXT:                     0123456789          0123456789
1727# CHECK-NEXT: Index     0123456789          0123456789          01234
1728
1729# CHECK:      [0,0]     DeeeeeeeeeeE   .    .    .    .    .    .   .   ld1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
1730# CHECK-NEXT: [0,1]     .    .  DeeE   .    .    .    .    .    .   .   add	x0, x27, #1
1731# CHECK-NEXT: [0,2]     .    .    .DeeeeeeE .    .    .    .    .   .   ld1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
1732# CHECK-NEXT: [0,3]     .    .    .    DeeE .    .    .    .    .   .   add	x0, x27, #1
1733# CHECK-NEXT: [0,4]     .    .    .    .  DeeeeeeeeeeE.    .    .   .   ld1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
1734# CHECK-NEXT: [0,5]     .    .    .    .    .    .DeeE.    .    .   .   add	x0, x27, #1
1735# CHECK-NEXT: [0,6]     .    .    .    .    .    .   DeeeeeeeeeeE   .   ld1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
1736# CHECK-NEXT: [0,7]     .    .    .    .    .    .    .    . DeeE   .   add	x0, x27, #1
1737# CHECK-NEXT: [0,8]     .    .    .    .    .    .    .    .    DeeeE   ld1	{ v1.b }[0], [x27], #1
1738# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .    .DeeE   add	x0, x27, #1
1739
1740# CHECK:      Average Wait times (based on the timeline view):
1741# CHECK-NEXT: [0]: Executions
1742# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1743# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1744# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1745
1746# CHECK:            [0]    [1]    [2]    [3]
1747# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
1748# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1749# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
1750# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1751# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
1752# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1753# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
1754# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1755# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.b }[0], [x27], #1
1756# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1757# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1758
1759# CHECK:      [13] Code Region - G14
1760
1761# CHECK:      Iterations:        100
1762# CHECK-NEXT: Instructions:      1000
1763# CHECK-NEXT: Total Cycles:      2001
1764# CHECK-NEXT: Total uOps:        1500
1765
1766# CHECK:      Dispatch Width:    2
1767# CHECK-NEXT: uOps Per Cycle:    0.75
1768# CHECK-NEXT: IPC:               0.50
1769# CHECK-NEXT: Block RThroughput: 7.5
1770
1771# CHECK:      Timeline view:
1772# CHECK-NEXT:                     0123456789
1773# CHECK-NEXT: Index     0123456789          0
1774
1775# CHECK:      [0,0]     DeeeE.    .    .    .   ld1	{ v1.b }[8], [x27], #1
1776# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
1777# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   ld1	{ v1.b }[0], [x27], x28
1778# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
1779# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   ld1	{ v1.b }[8], [x27], x28
1780# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
1781# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   ld1	{ v1.h }[0], [x27], #2
1782# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
1783# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   ld1	{ v1.h }[4], [x27], #2
1784# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
1785
1786# CHECK:      Average Wait times (based on the timeline view):
1787# CHECK-NEXT: [0]: Executions
1788# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1789# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1790# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1791
1792# CHECK:            [0]    [1]    [2]    [3]
1793# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.b }[8], [x27], #1
1794# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1795# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.b }[0], [x27], x28
1796# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1797# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.b }[8], [x27], x28
1798# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1799# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.h }[0], [x27], #2
1800# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1801# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.h }[4], [x27], #2
1802# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1803# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1804
1805# CHECK:      [14] Code Region - G15
1806
1807# CHECK:      Iterations:        100
1808# CHECK-NEXT: Instructions:      1000
1809# CHECK-NEXT: Total Cycles:      2001
1810# CHECK-NEXT: Total uOps:        1500
1811
1812# CHECK:      Dispatch Width:    2
1813# CHECK-NEXT: uOps Per Cycle:    0.75
1814# CHECK-NEXT: IPC:               0.50
1815# CHECK-NEXT: Block RThroughput: 7.5
1816
1817# CHECK:      Timeline view:
1818# CHECK-NEXT:                     0123456789
1819# CHECK-NEXT: Index     0123456789          0
1820
1821# CHECK:      [0,0]     DeeeE.    .    .    .   ld1	{ v1.h }[0], [x27], x28
1822# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
1823# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   ld1	{ v1.h }[4], [x27], x28
1824# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
1825# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   ld1	{ v1.s }[0], [x27], #4
1826# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
1827# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   ld1	{ v1.s }[0], [x27], x28
1828# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
1829# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   ld1	{ v1.d }[0], [x27], #8
1830# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
1831
1832# CHECK:      Average Wait times (based on the timeline view):
1833# CHECK-NEXT: [0]: Executions
1834# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1835# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1836# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1837
1838# CHECK:            [0]    [1]    [2]    [3]
1839# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.h }[0], [x27], x28
1840# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1841# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1	{ v1.h }[4], [x27], x28
1842# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1843# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1	{ v1.s }[0], [x27], #4
1844# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1845# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1	{ v1.s }[0], [x27], x28
1846# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1847# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1	{ v1.d }[0], [x27], #8
1848# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1849# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1850
1851# CHECK:      [15] Code Region - G16
1852
1853# CHECK:      Iterations:        100
1854# CHECK-NEXT: Instructions:      1000
1855# CHECK-NEXT: Total Cycles:      2001
1856# CHECK-NEXT: Total uOps:        1500
1857
1858# CHECK:      Dispatch Width:    2
1859# CHECK-NEXT: uOps Per Cycle:    0.75
1860# CHECK-NEXT: IPC:               0.50
1861# CHECK-NEXT: Block RThroughput: 7.5
1862
1863# CHECK:      Timeline view:
1864# CHECK-NEXT:                     0123456789
1865# CHECK-NEXT: Index     0123456789          0
1866
1867# CHECK:      [0,0]     DeeeE.    .    .    .   ld1	{ v1.d }[0], [x27], x28
1868# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
1869# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   ld1r	{ v1.1d }, [x27], #8
1870# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
1871# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   ld1r	{ v1.2d }, [x27], #8
1872# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
1873# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   ld1r	{ v1.2s }, [x27], #4
1874# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
1875# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   ld1r	{ v1.4h }, [x27], #2
1876# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
1877
1878# CHECK:      Average Wait times (based on the timeline view):
1879# CHECK-NEXT: [0]: Executions
1880# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1881# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1882# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1883
1884# CHECK:            [0]    [1]    [2]    [3]
1885# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1	{ v1.d }[0], [x27], x28
1886# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1887# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1r	{ v1.1d }, [x27], #8
1888# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1889# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1r	{ v1.2d }, [x27], #8
1890# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1891# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1r	{ v1.2s }, [x27], #4
1892# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1893# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1r	{ v1.4h }, [x27], #2
1894# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1895# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1896
1897# CHECK:      [16] Code Region - G17
1898
1899# CHECK:      Iterations:        100
1900# CHECK-NEXT: Instructions:      1000
1901# CHECK-NEXT: Total Cycles:      2001
1902# CHECK-NEXT: Total uOps:        1500
1903
1904# CHECK:      Dispatch Width:    2
1905# CHECK-NEXT: uOps Per Cycle:    0.75
1906# CHECK-NEXT: IPC:               0.50
1907# CHECK-NEXT: Block RThroughput: 7.5
1908
1909# CHECK:      Timeline view:
1910# CHECK-NEXT:                     0123456789
1911# CHECK-NEXT: Index     0123456789          0
1912
1913# CHECK:      [0,0]     DeeeE.    .    .    .   ld1r	{ v1.4s }, [x27], #4
1914# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
1915# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   ld1r	{ v1.8b }, [x27], #1
1916# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
1917# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   ld1r	{ v1.8h }, [x27], #2
1918# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
1919# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   ld1r	{ v1.16b }, [x27], #1
1920# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
1921# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   ld1r	{ v1.1d }, [x27], x28
1922# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
1923
1924# CHECK:      Average Wait times (based on the timeline view):
1925# CHECK-NEXT: [0]: Executions
1926# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1927# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1928# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1929
1930# CHECK:            [0]    [1]    [2]    [3]
1931# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1r	{ v1.4s }, [x27], #4
1932# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1933# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1r	{ v1.8b }, [x27], #1
1934# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1935# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1r	{ v1.8h }, [x27], #2
1936# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1937# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1r	{ v1.16b }, [x27], #1
1938# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1939# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1r	{ v1.1d }, [x27], x28
1940# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1941# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1942
1943# CHECK:      [17] Code Region - G18
1944
1945# CHECK:      Iterations:        100
1946# CHECK-NEXT: Instructions:      1000
1947# CHECK-NEXT: Total Cycles:      2001
1948# CHECK-NEXT: Total uOps:        1500
1949
1950# CHECK:      Dispatch Width:    2
1951# CHECK-NEXT: uOps Per Cycle:    0.75
1952# CHECK-NEXT: IPC:               0.50
1953# CHECK-NEXT: Block RThroughput: 7.5
1954
1955# CHECK:      Timeline view:
1956# CHECK-NEXT:                     0123456789
1957# CHECK-NEXT: Index     0123456789          0
1958
1959# CHECK:      [0,0]     DeeeE.    .    .    .   ld1r	{ v1.2d }, [x27], x28
1960# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
1961# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   ld1r	{ v1.2s }, [x27], x28
1962# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
1963# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   ld1r	{ v1.4h }, [x27], x28
1964# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
1965# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   ld1r	{ v1.4s }, [x27], x28
1966# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
1967# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   ld1r	{ v1.8b }, [x27], x28
1968# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
1969
1970# CHECK:      Average Wait times (based on the timeline view):
1971# CHECK-NEXT: [0]: Executions
1972# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1973# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1974# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1975
1976# CHECK:            [0]    [1]    [2]    [3]
1977# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1r	{ v1.2d }, [x27], x28
1978# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
1979# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1r	{ v1.2s }, [x27], x28
1980# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
1981# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld1r	{ v1.4h }, [x27], x28
1982# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
1983# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld1r	{ v1.4s }, [x27], x28
1984# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
1985# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld1r	{ v1.8b }, [x27], x28
1986# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
1987# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
1988
1989# CHECK:      [18] Code Region - G19
1990
1991# CHECK:      Iterations:        100
1992# CHECK-NEXT: Instructions:      1000
1993# CHECK-NEXT: Total Cycles:      2501
1994# CHECK-NEXT: Total uOps:        1500
1995
1996# CHECK:      Dispatch Width:    2
1997# CHECK-NEXT: uOps Per Cycle:    0.60
1998# CHECK-NEXT: IPC:               0.40
1999# CHECK-NEXT: Block RThroughput: 10.0
2000
2001# CHECK:      Timeline view:
2002# CHECK-NEXT:                     0123456789
2003# CHECK-NEXT: Index     0123456789          012345
2004
2005# CHECK:      [0,0]     DeeeE.    .    .    .    .   ld1r	{ v1.8h }, [x27], x28
2006# CHECK-NEXT: [0,1]     .DeeE.    .    .    .    .   add	x0, x27, #1
2007# CHECK-NEXT: [0,2]     .   DeeeE .    .    .    .   ld1r	{ v1.16b }, [x27], x28
2008# CHECK-NEXT: [0,3]     .    DeeE .    .    .    .   add	x0, x27, #1
2009# CHECK-NEXT: [0,4]     .    .  DeeeeeeE    .    .   ld2	{ v1.2d, v2.2d }, [x27], #32
2010# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2011# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld2	{ v1.2s, v2.2s }, [x27], #16
2012# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2013# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld2	{ v1.4h, v2.4h }, [x27], #16
2014# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2015
2016# CHECK:      Average Wait times (based on the timeline view):
2017# CHECK-NEXT: [0]: Executions
2018# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2019# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2020# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2021
2022# CHECK:            [0]    [1]    [2]    [3]
2023# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld1r	{ v1.8h }, [x27], x28
2024# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2025# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld1r	{ v1.16b }, [x27], x28
2026# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2027# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2	{ v1.2d, v2.2d }, [x27], #32
2028# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2029# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2	{ v1.2s, v2.2s }, [x27], #16
2030# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2031# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld2	{ v1.4h, v2.4h }, [x27], #16
2032# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2033# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2034
2035# CHECK:      [19] Code Region - G20
2036
2037# CHECK:      Iterations:        100
2038# CHECK-NEXT: Instructions:      1000
2039# CHECK-NEXT: Total Cycles:      3301
2040# CHECK-NEXT: Total uOps:        1500
2041
2042# CHECK:      Dispatch Width:    2
2043# CHECK-NEXT: uOps Per Cycle:    0.45
2044# CHECK-NEXT: IPC:               0.30
2045# CHECK-NEXT: Block RThroughput: 18.0
2046
2047# CHECK:      Timeline view:
2048# CHECK-NEXT:                     0123456789          0123
2049# CHECK-NEXT: Index     0123456789          0123456789
2050
2051# CHECK:      [0,0]     DeeeeeeE  .    .    .    .    .  .   ld2	{ v1.4s, v2.4s }, [x27], #32
2052# CHECK-NEXT: [0,1]     .   DeeE  .    .    .    .    .  .   add	x0, x27, #1
2053# CHECK-NEXT: [0,2]     .    . DeeeeE  .    .    .    .  .   ld2	{ v1.8b, v2.8b }, [x27], #16
2054# CHECK-NEXT: [0,3]     .    .   DeeE  .    .    .    .  .   add	x0, x27, #1
2055# CHECK-NEXT: [0,4]     .    .    . DeeeeeeE.    .    .  .   ld2	{ v1.8h, v2.8h }, [x27], #32
2056# CHECK-NEXT: [0,5]     .    .    .    .DeeE.    .    .  .   add	x0, x27, #1
2057# CHECK-NEXT: [0,6]     .    .    .    .   DeeeeeeE   .  .   ld2	{ v1.16b, v2.16b }, [x27], #32
2058# CHECK-NEXT: [0,7]     .    .    .    .    .  DeeE   .  .   add	x0, x27, #1
2059# CHECK-NEXT: [0,8]     .    .    .    .    .    .DeeeeeeE   ld2	{ v1.2d, v2.2d }, [x27], x28
2060# CHECK-NEXT: [0,9]     .    .    .    .    .    .    DeeE   add	x0, x27, #1
2061
2062# CHECK:      Average Wait times (based on the timeline view):
2063# CHECK-NEXT: [0]: Executions
2064# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2065# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2066# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2067
2068# CHECK:            [0]    [1]    [2]    [3]
2069# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld2	{ v1.4s, v2.4s }, [x27], #32
2070# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2071# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld2	{ v1.8b, v2.8b }, [x27], #16
2072# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2073# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2	{ v1.8h, v2.8h }, [x27], #32
2074# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2075# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2	{ v1.16b, v2.16b }, [x27], #32
2076# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2077# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld2	{ v1.2d, v2.2d }, [x27], x28
2078# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2079# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2080
2081# CHECK:      [20] Code Region - G21
2082
2083# CHECK:      Iterations:        100
2084# CHECK-NEXT: Instructions:      1000
2085# CHECK-NEXT: Total Cycles:      2901
2086# CHECK-NEXT: Total uOps:        1500
2087
2088# CHECK:      Dispatch Width:    2
2089# CHECK-NEXT: uOps Per Cycle:    0.52
2090# CHECK-NEXT: IPC:               0.34
2091# CHECK-NEXT: Block RThroughput: 14.0
2092
2093# CHECK:      Timeline view:
2094# CHECK-NEXT:                     0123456789
2095# CHECK-NEXT: Index     0123456789          0123456789
2096
2097# CHECK:      [0,0]     DeeeeE    .    .    .    .   .   ld2	{ v1.2s, v2.2s }, [x27], x28
2098# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   .   add	x0, x27, #1
2099# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   .   ld2	{ v1.4h, v2.4h }, [x27], x28
2100# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   .   add	x0, x27, #1
2101# CHECK-NEXT: [0,4]     .    .    DeeeeeeE  .    .   .   ld2	{ v1.4s, v2.4s }, [x27], x28
2102# CHECK-NEXT: [0,5]     .    .    .   DeeE  .    .   .   add	x0, x27, #1
2103# CHECK-NEXT: [0,6]     .    .    .    . DeeeeE  .   .   ld2	{ v1.8b, v2.8b }, [x27], x28
2104# CHECK-NEXT: [0,7]     .    .    .    .   DeeE  .   .   add	x0, x27, #1
2105# CHECK-NEXT: [0,8]     .    .    .    .    . DeeeeeeE   ld2	{ v1.8h, v2.8h }, [x27], x28
2106# CHECK-NEXT: [0,9]     .    .    .    .    .    .DeeE   add	x0, x27, #1
2107
2108# CHECK:      Average Wait times (based on the timeline view):
2109# CHECK-NEXT: [0]: Executions
2110# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2111# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2112# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2113
2114# CHECK:            [0]    [1]    [2]    [3]
2115# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld2	{ v1.2s, v2.2s }, [x27], x28
2116# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2117# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld2	{ v1.4h, v2.4h }, [x27], x28
2118# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2119# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2	{ v1.4s, v2.4s }, [x27], x28
2120# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2121# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2	{ v1.8b, v2.8b }, [x27], x28
2122# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2123# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld2	{ v1.8h, v2.8h }, [x27], x28
2124# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2125# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2126
2127# CHECK:      [21] Code Region - G22
2128
2129# CHECK:      Iterations:        100
2130# CHECK-NEXT: Instructions:      1000
2131# CHECK-NEXT: Total Cycles:      2701
2132# CHECK-NEXT: Total uOps:        1500
2133
2134# CHECK:      Dispatch Width:    2
2135# CHECK-NEXT: uOps Per Cycle:    0.56
2136# CHECK-NEXT: IPC:               0.37
2137# CHECK-NEXT: Block RThroughput: 12.0
2138
2139# CHECK:      Timeline view:
2140# CHECK-NEXT:                     0123456789
2141# CHECK-NEXT: Index     0123456789          01234567
2142
2143# CHECK:      [0,0]     DeeeeeeE  .    .    .    . .   ld2	{ v1.16b, v2.16b }, [x27], x28
2144# CHECK-NEXT: [0,1]     .   DeeE  .    .    .    . .   add	x0, x27, #1
2145# CHECK-NEXT: [0,2]     .    . DeeeeE  .    .    . .   ld2	{ v1.b, v2.b }[0], [x27], #2
2146# CHECK-NEXT: [0,3]     .    .   DeeE  .    .    . .   add	x0, x27, #1
2147# CHECK-NEXT: [0,4]     .    .    . DeeeeE  .    . .   ld2	{ v1.b, v2.b }[8], [x27], #2
2148# CHECK-NEXT: [0,5]     .    .    .   DeeE  .    . .   add	x0, x27, #1
2149# CHECK-NEXT: [0,6]     .    .    .    . DeeeeE  . .   ld2	{ v1.b, v2.b }[0], [x27], x28
2150# CHECK-NEXT: [0,7]     .    .    .    .   DeeE  . .   add	x0, x27, #1
2151# CHECK-NEXT: [0,8]     .    .    .    .    . DeeeeE   ld2	{ v1.b, v2.b }[8], [x27], x28
2152# CHECK-NEXT: [0,9]     .    .    .    .    .   DeeE   add	x0, x27, #1
2153
2154# CHECK:      Average Wait times (based on the timeline view):
2155# CHECK-NEXT: [0]: Executions
2156# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2157# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2158# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2159
2160# CHECK:            [0]    [1]    [2]    [3]
2161# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld2	{ v1.16b, v2.16b }, [x27], x28
2162# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2163# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld2	{ v1.b, v2.b }[0], [x27], #2
2164# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2165# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2	{ v1.b, v2.b }[8], [x27], #2
2166# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2167# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2	{ v1.b, v2.b }[0], [x27], x28
2168# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2169# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld2	{ v1.b, v2.b }[8], [x27], x28
2170# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2171# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2172
2173# CHECK:      [22] Code Region - G23
2174
2175# CHECK:      Iterations:        100
2176# CHECK-NEXT: Instructions:      1000
2177# CHECK-NEXT: Total Cycles:      2501
2178# CHECK-NEXT: Total uOps:        1500
2179
2180# CHECK:      Dispatch Width:    2
2181# CHECK-NEXT: uOps Per Cycle:    0.60
2182# CHECK-NEXT: IPC:               0.40
2183# CHECK-NEXT: Block RThroughput: 10.0
2184
2185# CHECK:      Timeline view:
2186# CHECK-NEXT:                     0123456789
2187# CHECK-NEXT: Index     0123456789          012345
2188
2189# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld2	{ v1.h, v2.h }[0], [x27], #4
2190# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2191# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld2	{ v1.h, v2.h }[4], [x27], #4
2192# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2193# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld2	{ v1.h, v2.h }[0], [x27], x28
2194# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2195# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld2	{ v1.h, v2.h }[4], [x27], x28
2196# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2197# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld2	{ v1.s, v2.s }[0], [x27], #8
2198# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2199
2200# CHECK:      Average Wait times (based on the timeline view):
2201# CHECK-NEXT: [0]: Executions
2202# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2203# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2204# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2205
2206# CHECK:            [0]    [1]    [2]    [3]
2207# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld2	{ v1.h, v2.h }[0], [x27], #4
2208# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2209# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld2	{ v1.h, v2.h }[4], [x27], #4
2210# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2211# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2	{ v1.h, v2.h }[0], [x27], x28
2212# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2213# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2	{ v1.h, v2.h }[4], [x27], x28
2214# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2215# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld2	{ v1.s, v2.s }[0], [x27], #8
2216# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2217# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2218
2219# CHECK:      [23] Code Region - G24
2220
2221# CHECK:      Iterations:        100
2222# CHECK-NEXT: Instructions:      1000
2223# CHECK-NEXT: Total Cycles:      2501
2224# CHECK-NEXT: Total uOps:        1500
2225
2226# CHECK:      Dispatch Width:    2
2227# CHECK-NEXT: uOps Per Cycle:    0.60
2228# CHECK-NEXT: IPC:               0.40
2229# CHECK-NEXT: Block RThroughput: 10.0
2230
2231# CHECK:      Timeline view:
2232# CHECK-NEXT:                     0123456789
2233# CHECK-NEXT: Index     0123456789          012345
2234
2235# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld2	{ v1.s, v2.s }[0], [x27], x28
2236# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2237# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld2	{ v1.d, v2.d }[0], [x27], #16
2238# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2239# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld2	{ v1.d, v2.d }[0], [x27], x28
2240# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2241# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld2r	{ v1.1d, v2.1d }, [x27], #16
2242# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2243# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld2r	{ v1.2d, v2.2d }, [x27], #16
2244# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2245
2246# CHECK:      Average Wait times (based on the timeline view):
2247# CHECK-NEXT: [0]: Executions
2248# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2249# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2250# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2251
2252# CHECK:            [0]    [1]    [2]    [3]
2253# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld2	{ v1.s, v2.s }[0], [x27], x28
2254# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2255# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld2	{ v1.d, v2.d }[0], [x27], #16
2256# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2257# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2	{ v1.d, v2.d }[0], [x27], x28
2258# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2259# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2r	{ v1.1d, v2.1d }, [x27], #16
2260# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2261# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld2r	{ v1.2d, v2.2d }, [x27], #16
2262# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2263# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2264
2265# CHECK:      [24] Code Region - G25
2266
2267# CHECK:      Iterations:        100
2268# CHECK-NEXT: Instructions:      1000
2269# CHECK-NEXT: Total Cycles:      2501
2270# CHECK-NEXT: Total uOps:        1500
2271
2272# CHECK:      Dispatch Width:    2
2273# CHECK-NEXT: uOps Per Cycle:    0.60
2274# CHECK-NEXT: IPC:               0.40
2275# CHECK-NEXT: Block RThroughput: 10.0
2276
2277# CHECK:      Timeline view:
2278# CHECK-NEXT:                     0123456789
2279# CHECK-NEXT: Index     0123456789          012345
2280
2281# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld2r	{ v1.2s, v2.2s }, [x27], #8
2282# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2283# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld2r	{ v1.4h, v2.4h }, [x27], #4
2284# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2285# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld2r	{ v1.4s, v2.4s }, [x27], #8
2286# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2287# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld2r	{ v1.8b, v2.8b }, [x27], #2
2288# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2289# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld2r	{ v1.8h, v2.8h }, [x27], #4
2290# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2291
2292# CHECK:      Average Wait times (based on the timeline view):
2293# CHECK-NEXT: [0]: Executions
2294# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2295# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2296# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2297
2298# CHECK:            [0]    [1]    [2]    [3]
2299# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld2r	{ v1.2s, v2.2s }, [x27], #8
2300# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2301# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld2r	{ v1.4h, v2.4h }, [x27], #4
2302# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2303# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2r	{ v1.4s, v2.4s }, [x27], #8
2304# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2305# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2r	{ v1.8b, v2.8b }, [x27], #2
2306# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2307# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld2r	{ v1.8h, v2.8h }, [x27], #4
2308# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2309# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2310
2311# CHECK:      [25] Code Region - G26
2312
2313# CHECK:      Iterations:        100
2314# CHECK-NEXT: Instructions:      1000
2315# CHECK-NEXT: Total Cycles:      2501
2316# CHECK-NEXT: Total uOps:        1500
2317
2318# CHECK:      Dispatch Width:    2
2319# CHECK-NEXT: uOps Per Cycle:    0.60
2320# CHECK-NEXT: IPC:               0.40
2321# CHECK-NEXT: Block RThroughput: 10.0
2322
2323# CHECK:      Timeline view:
2324# CHECK-NEXT:                     0123456789
2325# CHECK-NEXT: Index     0123456789          012345
2326
2327# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld2r	{ v1.16b, v2.16b }, [x27], #2
2328# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2329# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld2r	{ v1.1d, v2.1d }, [x27], x28
2330# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2331# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld2r	{ v1.2d, v2.2d }, [x27], x28
2332# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2333# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld2r	{ v1.2s, v2.2s }, [x27], x28
2334# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2335# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld2r	{ v1.4h, v2.4h }, [x27], x28
2336# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2337
2338# CHECK:      Average Wait times (based on the timeline view):
2339# CHECK-NEXT: [0]: Executions
2340# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2341# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2342# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2343
2344# CHECK:            [0]    [1]    [2]    [3]
2345# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld2r	{ v1.16b, v2.16b }, [x27], #2
2346# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2347# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld2r	{ v1.1d, v2.1d }, [x27], x28
2348# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2349# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2r	{ v1.2d, v2.2d }, [x27], x28
2350# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2351# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2r	{ v1.2s, v2.2s }, [x27], x28
2352# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2353# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld2r	{ v1.4h, v2.4h }, [x27], x28
2354# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2355# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2356
2357# CHECK:      [26] Code Region - G27
2358
2359# CHECK:      Iterations:        100
2360# CHECK-NEXT: Instructions:      1000
2361# CHECK-NEXT: Total Cycles:      2901
2362# CHECK-NEXT: Total uOps:        1500
2363
2364# CHECK:      Dispatch Width:    2
2365# CHECK-NEXT: uOps Per Cycle:    0.52
2366# CHECK-NEXT: IPC:               0.34
2367# CHECK-NEXT: Block RThroughput: 14.0
2368
2369# CHECK:      Timeline view:
2370# CHECK-NEXT:                     0123456789
2371# CHECK-NEXT: Index     0123456789          0123456789
2372
2373# CHECK:      [0,0]     DeeeeE    .    .    .    .   .   ld2r	{ v1.4s, v2.4s }, [x27], x28
2374# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   .   add	x0, x27, #1
2375# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   .   ld2r	{ v1.8b, v2.8b }, [x27], x28
2376# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   .   add	x0, x27, #1
2377# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   .   ld2r	{ v1.8h, v2.8h }, [x27], x28
2378# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   .   add	x0, x27, #1
2379# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   .   ld2r	{ v1.16b, v2.16b }, [x27], x28
2380# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   .   add	x0, x27, #1
2381# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeeeeeE   ld3	{ v1.2d, v2.2d, v3.2d }, [x27], #48
2382# CHECK-NEXT: [0,9]     .    .    .    .    .    .DeeE   add	x0, x27, #1
2383
2384# CHECK:      Average Wait times (based on the timeline view):
2385# CHECK-NEXT: [0]: Executions
2386# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2387# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2388# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2389
2390# CHECK:            [0]    [1]    [2]    [3]
2391# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld2r	{ v1.4s, v2.4s }, [x27], x28
2392# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2393# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld2r	{ v1.8b, v2.8b }, [x27], x28
2394# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2395# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld2r	{ v1.8h, v2.8h }, [x27], x28
2396# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2397# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld2r	{ v1.16b, v2.16b }, [x27], x28
2398# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2399# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3	{ v1.2d, v2.2d, v3.2d }, [x27], #48
2400# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2401# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2402
2403# CHECK:      [27] Code Region - G28
2404
2405# CHECK:      Iterations:        100
2406# CHECK-NEXT: Instructions:      1000
2407# CHECK-NEXT: Total Cycles:      3601
2408# CHECK-NEXT: Total uOps:        1500
2409
2410# CHECK:      Dispatch Width:    2
2411# CHECK-NEXT: uOps Per Cycle:    0.42
2412# CHECK-NEXT: IPC:               0.28
2413# CHECK-NEXT: Block RThroughput: 21.0
2414
2415# CHECK:      Timeline view:
2416# CHECK-NEXT:                     0123456789          0123456
2417# CHECK-NEXT: Index     0123456789          0123456789
2418
2419# CHECK:      [0,0]     DeeeeeE   .    .    .    .    .    ..   ld3	{ v1.2s, v2.2s, v3.2s }, [x27], #24
2420# CHECK-NEXT: [0,1]     .  DeeE   .    .    .    .    .    ..   add	x0, x27, #1
2421# CHECK-NEXT: [0,2]     .    .DeeeeeE  .    .    .    .    ..   ld3	{ v1.4h, v2.4h, v3.4h }, [x27], #24
2422# CHECK-NEXT: [0,3]     .    .   DeeE  .    .    .    .    ..   add	x0, x27, #1
2423# CHECK-NEXT: [0,4]     .    .    . DeeeeeeeeE   .    .    ..   ld3	{ v1.4s, v2.4s, v3.4s }, [x27], #48
2424# CHECK-NEXT: [0,5]     .    .    .    .  DeeE   .    .    ..   add	x0, x27, #1
2425# CHECK-NEXT: [0,6]     .    .    .    .    .DeeeeeE  .    ..   ld3	{ v1.8b, v2.8b, v3.8b }, [x27], #24
2426# CHECK-NEXT: [0,7]     .    .    .    .    .   DeeE  .    ..   add	x0, x27, #1
2427# CHECK-NEXT: [0,8]     .    .    .    .    .    . DeeeeeeeeE   ld3	{ v1.8h, v2.8h, v3.8h }, [x27], #48
2428# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .  DeeE   add	x0, x27, #1
2429
2430# CHECK:      Average Wait times (based on the timeline view):
2431# CHECK-NEXT: [0]: Executions
2432# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2433# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2434# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2435
2436# CHECK:            [0]    [1]    [2]    [3]
2437# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3	{ v1.2s, v2.2s, v3.2s }, [x27], #24
2438# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2439# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld3	{ v1.4h, v2.4h, v3.4h }, [x27], #24
2440# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2441# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld3	{ v1.4s, v2.4s, v3.4s }, [x27], #48
2442# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2443# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld3	{ v1.8b, v2.8b, v3.8b }, [x27], #24
2444# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2445# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3	{ v1.8h, v2.8h, v3.8h }, [x27], #48
2446# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2447# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2448
2449# CHECK:      [28] Code Region - G29
2450
2451# CHECK:      Iterations:        100
2452# CHECK-NEXT: Instructions:      1000
2453# CHECK-NEXT: Total Cycles:      3901
2454# CHECK-NEXT: Total uOps:        1500
2455
2456# CHECK:      Dispatch Width:    2
2457# CHECK-NEXT: uOps Per Cycle:    0.38
2458# CHECK-NEXT: IPC:               0.26
2459# CHECK-NEXT: Block RThroughput: 24.0
2460
2461# CHECK:      Timeline view:
2462# CHECK-NEXT:                     0123456789          0123456789
2463# CHECK-NEXT: Index     0123456789          0123456789
2464
2465# CHECK:      [0,0]     DeeeeeeeeE.    .    .    .    .    .   .   ld3	{ v1.16b, v2.16b, v3.16b }, [x27], #48
2466# CHECK-NEXT: [0,1]     .    .DeeE.    .    .    .    .    .   .   add	x0, x27, #1
2467# CHECK-NEXT: [0,2]     .    .   DeeeeeeeeE .    .    .    .   .   ld3	{ v1.2d, v2.2d, v3.2d }, [x27], x28
2468# CHECK-NEXT: [0,3]     .    .    .    DeeE .    .    .    .   .   add	x0, x27, #1
2469# CHECK-NEXT: [0,4]     .    .    .    .  DeeeeeE.    .    .   .   ld3	{ v1.2s, v2.2s, v3.2s }, [x27], x28
2470# CHECK-NEXT: [0,5]     .    .    .    .    .DeeE.    .    .   .   add	x0, x27, #1
2471# CHECK-NEXT: [0,6]     .    .    .    .    .   DeeeeeE    .   .   ld3	{ v1.4h, v2.4h, v3.4h }, [x27], x28
2472# CHECK-NEXT: [0,7]     .    .    .    .    .    . DeeE    .   .   add	x0, x27, #1
2473# CHECK-NEXT: [0,8]     .    .    .    .    .    .    DeeeeeeeeE   ld3	{ v1.4s, v2.4s, v3.4s }, [x27], x28
2474# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .DeeE   add	x0, x27, #1
2475
2476# CHECK:      Average Wait times (based on the timeline view):
2477# CHECK-NEXT: [0]: Executions
2478# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2479# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2480# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2481
2482# CHECK:            [0]    [1]    [2]    [3]
2483# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3	{ v1.16b, v2.16b, v3.16b }, [x27], #48
2484# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2485# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld3	{ v1.2d, v2.2d, v3.2d }, [x27], x28
2486# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2487# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld3	{ v1.2s, v2.2s, v3.2s }, [x27], x28
2488# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2489# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld3	{ v1.4h, v2.4h, v3.4h }, [x27], x28
2490# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2491# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3	{ v1.4s, v2.4s, v3.4s }, [x27], x28
2492# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2493# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2494
2495# CHECK:      [29] Code Region - G30
2496
2497# CHECK:      Iterations:        100
2498# CHECK-NEXT: Instructions:      1000
2499# CHECK-NEXT: Total Cycles:      3401
2500# CHECK-NEXT: Total uOps:        1500
2501
2502# CHECK:      Dispatch Width:    2
2503# CHECK-NEXT: uOps Per Cycle:    0.44
2504# CHECK-NEXT: IPC:               0.29
2505# CHECK-NEXT: Block RThroughput: 19.0
2506
2507# CHECK:      Timeline view:
2508# CHECK-NEXT:                     0123456789          01234
2509# CHECK-NEXT: Index     0123456789          0123456789
2510
2511# CHECK:      [0,0]     DeeeeeE   .    .    .    .    .   .   ld3	{ v1.8b, v2.8b, v3.8b }, [x27], x28
2512# CHECK-NEXT: [0,1]     .  DeeE   .    .    .    .    .   .   add	x0, x27, #1
2513# CHECK-NEXT: [0,2]     .    .DeeeeeeeeE    .    .    .   .   ld3	{ v1.8h, v2.8h, v3.8h }, [x27], x28
2514# CHECK-NEXT: [0,3]     .    .    . DeeE    .    .    .   .   add	x0, x27, #1
2515# CHECK-NEXT: [0,4]     .    .    .    DeeeeeeeeE.    .   .   ld3	{ v1.16b, v2.16b, v3.16b }, [x27], x28
2516# CHECK-NEXT: [0,5]     .    .    .    .    .DeeE.    .   .   add	x0, x27, #1
2517# CHECK-NEXT: [0,6]     .    .    .    .    .   DeeeeE.   .   ld3	{ v1.b, v2.b, v3.b }[0], [x27], #3
2518# CHECK-NEXT: [0,7]     .    .    .    .    .    .DeeE.   .   add	x0, x27, #1
2519# CHECK-NEXT: [0,8]     .    .    .    .    .    .   DeeeeE   ld3	{ v1.b, v2.b, v3.b }[8], [x27], #3
2520# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .DeeE   add	x0, x27, #1
2521
2522# CHECK:      Average Wait times (based on the timeline view):
2523# CHECK-NEXT: [0]: Executions
2524# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2525# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2526# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2527
2528# CHECK:            [0]    [1]    [2]    [3]
2529# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3	{ v1.8b, v2.8b, v3.8b }, [x27], x28
2530# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2531# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld3	{ v1.8h, v2.8h, v3.8h }, [x27], x28
2532# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2533# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld3	{ v1.16b, v2.16b, v3.16b }, [x27], x28
2534# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2535# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld3	{ v1.b, v2.b, v3.b }[0], [x27], #3
2536# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2537# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3	{ v1.b, v2.b, v3.b }[8], [x27], #3
2538# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2539# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2540
2541# CHECK:      [30] Code Region - G31
2542
2543# CHECK:      Iterations:        100
2544# CHECK-NEXT: Instructions:      1000
2545# CHECK-NEXT: Total Cycles:      2501
2546# CHECK-NEXT: Total uOps:        1500
2547
2548# CHECK:      Dispatch Width:    2
2549# CHECK-NEXT: uOps Per Cycle:    0.60
2550# CHECK-NEXT: IPC:               0.40
2551# CHECK-NEXT: Block RThroughput: 10.0
2552
2553# CHECK:      Timeline view:
2554# CHECK-NEXT:                     0123456789
2555# CHECK-NEXT: Index     0123456789          012345
2556
2557# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld3	{ v1.b, v2.b, v3.b }[0], [x27], x28
2558# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2559# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld3	{ v1.b, v2.b, v3.b }[8], [x27], x28
2560# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2561# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld3	{ v1.h, v2.h, v3.h }[0], [x27], #6
2562# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2563# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld3	{ v1.h, v2.h, v3.h }[4], [x27], #6
2564# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2565# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld3	{ v1.h, v2.h, v3.h }[0], [x27], x28
2566# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2567
2568# CHECK:      Average Wait times (based on the timeline view):
2569# CHECK-NEXT: [0]: Executions
2570# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2571# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2572# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2573
2574# CHECK:            [0]    [1]    [2]    [3]
2575# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3	{ v1.b, v2.b, v3.b }[0], [x27], x28
2576# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2577# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld3	{ v1.b, v2.b, v3.b }[8], [x27], x28
2578# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2579# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld3	{ v1.h, v2.h, v3.h }[0], [x27], #6
2580# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2581# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld3	{ v1.h, v2.h, v3.h }[4], [x27], #6
2582# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2583# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3	{ v1.h, v2.h, v3.h }[0], [x27], x28
2584# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2585# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2586
2587# CHECK:      [31] Code Region - G32
2588
2589# CHECK:      Iterations:        100
2590# CHECK-NEXT: Instructions:      1000
2591# CHECK-NEXT: Total Cycles:      2501
2592# CHECK-NEXT: Total uOps:        1500
2593
2594# CHECK:      Dispatch Width:    2
2595# CHECK-NEXT: uOps Per Cycle:    0.60
2596# CHECK-NEXT: IPC:               0.40
2597# CHECK-NEXT: Block RThroughput: 10.0
2598
2599# CHECK:      Timeline view:
2600# CHECK-NEXT:                     0123456789
2601# CHECK-NEXT: Index     0123456789          012345
2602
2603# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld3	{ v1.h, v2.h, v3.h }[4], [x27], x28
2604# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2605# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld3	{ v1.s, v2.s, v3.s }[0], [x27], #12
2606# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2607# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld3	{ v1.s, v2.s, v3.s }[0], [x27], x28
2608# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2609# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld3	{ v1.d, v2.d, v3.d }[0], [x27], #24
2610# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2611# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld3	{ v1.d, v2.d, v3.d }[0], [x27], x28
2612# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2613
2614# CHECK:      Average Wait times (based on the timeline view):
2615# CHECK-NEXT: [0]: Executions
2616# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2617# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2618# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2619
2620# CHECK:            [0]    [1]    [2]    [3]
2621# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3	{ v1.h, v2.h, v3.h }[4], [x27], x28
2622# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2623# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld3	{ v1.s, v2.s, v3.s }[0], [x27], #12
2624# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2625# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld3	{ v1.s, v2.s, v3.s }[0], [x27], x28
2626# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2627# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld3	{ v1.d, v2.d, v3.d }[0], [x27], #24
2628# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2629# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3	{ v1.d, v2.d, v3.d }[0], [x27], x28
2630# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2631# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2632
2633# CHECK:      [32] Code Region - G33
2634
2635# CHECK:      Iterations:        100
2636# CHECK-NEXT: Instructions:      1000
2637# CHECK-NEXT: Total Cycles:      2501
2638# CHECK-NEXT: Total uOps:        1500
2639
2640# CHECK:      Dispatch Width:    2
2641# CHECK-NEXT: uOps Per Cycle:    0.60
2642# CHECK-NEXT: IPC:               0.40
2643# CHECK-NEXT: Block RThroughput: 10.0
2644
2645# CHECK:      Timeline view:
2646# CHECK-NEXT:                     0123456789
2647# CHECK-NEXT: Index     0123456789          012345
2648
2649# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld3r	{ v1.1d, v2.1d, v3.1d }, [x27], #24
2650# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2651# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld3r	{ v1.2d, v2.2d, v3.2d }, [x27], #24
2652# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2653# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld3r	{ v1.2s, v2.2s, v3.2s }, [x27], #12
2654# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2655# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld3r	{ v1.4h, v2.4h, v3.4h }, [x27], #6
2656# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2657# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld3r	{ v1.4s, v2.4s, v3.4s }, [x27], #12
2658# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2659
2660# CHECK:      Average Wait times (based on the timeline view):
2661# CHECK-NEXT: [0]: Executions
2662# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2663# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2664# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2665
2666# CHECK:            [0]    [1]    [2]    [3]
2667# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3r	{ v1.1d, v2.1d, v3.1d }, [x27], #24
2668# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2669# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld3r	{ v1.2d, v2.2d, v3.2d }, [x27], #24
2670# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2671# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld3r	{ v1.2s, v2.2s, v3.2s }, [x27], #12
2672# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2673# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld3r	{ v1.4h, v2.4h, v3.4h }, [x27], #6
2674# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2675# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3r	{ v1.4s, v2.4s, v3.4s }, [x27], #12
2676# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2677# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2678
2679# CHECK:      [33] Code Region - G34
2680
2681# CHECK:      Iterations:        100
2682# CHECK-NEXT: Instructions:      1000
2683# CHECK-NEXT: Total Cycles:      2501
2684# CHECK-NEXT: Total uOps:        1500
2685
2686# CHECK:      Dispatch Width:    2
2687# CHECK-NEXT: uOps Per Cycle:    0.60
2688# CHECK-NEXT: IPC:               0.40
2689# CHECK-NEXT: Block RThroughput: 10.0
2690
2691# CHECK:      Timeline view:
2692# CHECK-NEXT:                     0123456789
2693# CHECK-NEXT: Index     0123456789          012345
2694
2695# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld3r	{ v1.8b, v2.8b, v3.8b }, [x27], #3
2696# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2697# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld3r	{ v1.8h, v2.8h, v3.8h }, [x27], #6
2698# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2699# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld3r	{ v1.16b, v2.16b, v3.16b }, [x27], #3
2700# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2701# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld3r	{ v1.1d, v2.1d, v3.1d }, [x27], x28
2702# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2703# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld3r	{ v1.2d, v2.2d, v3.2d }, [x27], x28
2704# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2705
2706# CHECK:      Average Wait times (based on the timeline view):
2707# CHECK-NEXT: [0]: Executions
2708# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2709# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2710# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2711
2712# CHECK:            [0]    [1]    [2]    [3]
2713# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3r	{ v1.8b, v2.8b, v3.8b }, [x27], #3
2714# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2715# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld3r	{ v1.8h, v2.8h, v3.8h }, [x27], #6
2716# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2717# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld3r	{ v1.16b, v2.16b, v3.16b }, [x27], #3
2718# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2719# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld3r	{ v1.1d, v2.1d, v3.1d }, [x27], x28
2720# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2721# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3r	{ v1.2d, v2.2d, v3.2d }, [x27], x28
2722# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2723# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2724
2725# CHECK:      [34] Code Region - G35
2726
2727# CHECK:      Iterations:        100
2728# CHECK-NEXT: Instructions:      1000
2729# CHECK-NEXT: Total Cycles:      2501
2730# CHECK-NEXT: Total uOps:        1500
2731
2732# CHECK:      Dispatch Width:    2
2733# CHECK-NEXT: uOps Per Cycle:    0.60
2734# CHECK-NEXT: IPC:               0.40
2735# CHECK-NEXT: Block RThroughput: 10.0
2736
2737# CHECK:      Timeline view:
2738# CHECK-NEXT:                     0123456789
2739# CHECK-NEXT: Index     0123456789          012345
2740
2741# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld3r	{ v1.2s, v2.2s, v3.2s }, [x27], x28
2742# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2743# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld3r	{ v1.4h, v2.4h, v3.4h }, [x27], x28
2744# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2745# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld3r	{ v1.4s, v2.4s, v3.4s }, [x27], x28
2746# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2747# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld3r	{ v1.8b, v2.8b, v3.8b }, [x27], x28
2748# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2749# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld3r	{ v1.8h, v2.8h, v3.8h }, [x27], x28
2750# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2751
2752# CHECK:      Average Wait times (based on the timeline view):
2753# CHECK-NEXT: [0]: Executions
2754# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2755# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2756# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2757
2758# CHECK:            [0]    [1]    [2]    [3]
2759# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3r	{ v1.2s, v2.2s, v3.2s }, [x27], x28
2760# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2761# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld3r	{ v1.4h, v2.4h, v3.4h }, [x27], x28
2762# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2763# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld3r	{ v1.4s, v2.4s, v3.4s }, [x27], x28
2764# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2765# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld3r	{ v1.8b, v2.8b, v3.8b }, [x27], x28
2766# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2767# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld3r	{ v1.8h, v2.8h, v3.8h }, [x27], x28
2768# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2769# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2770
2771# CHECK:      [35] Code Region - G36
2772
2773# CHECK:      Iterations:        100
2774# CHECK-NEXT: Instructions:      1000
2775# CHECK-NEXT: Total Cycles:      4101
2776# CHECK-NEXT: Total uOps:        1500
2777
2778# CHECK:      Dispatch Width:    2
2779# CHECK-NEXT: uOps Per Cycle:    0.37
2780# CHECK-NEXT: IPC:               0.24
2781# CHECK-NEXT: Block RThroughput: 26.0
2782
2783# CHECK:      Timeline view:
2784# CHECK-NEXT:                     0123456789          0123456789
2785# CHECK-NEXT: Index     0123456789          0123456789          01
2786
2787# CHECK:      [0,0]     DeeeeE    .    .    .    .    .    .    ..   ld3r	{ v1.16b, v2.16b, v3.16b }, [x27], x28
2788# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .    .    .    ..   add	x0, x27, #1
2789# CHECK-NEXT: [0,2]     .    DeeeeeeeeeeE   .    .    .    .    ..   ld4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
2790# CHECK-NEXT: [0,3]     .    .    .  DeeE   .    .    .    .    ..   add	x0, x27, #1
2791# CHECK-NEXT: [0,4]     .    .    .    .DeeeeeeE .    .    .    ..   ld4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
2792# CHECK-NEXT: [0,5]     .    .    .    .    DeeE .    .    .    ..   add	x0, x27, #1
2793# CHECK-NEXT: [0,6]     .    .    .    .    .  DeeeeeeE    .    ..   ld4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
2794# CHECK-NEXT: [0,7]     .    .    .    .    .    . DeeE    .    ..   add	x0, x27, #1
2795# CHECK-NEXT: [0,8]     .    .    .    .    .    .    DeeeeeeeeeeE   ld4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
2796# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .  DeeE   add	x0, x27, #1
2797
2798# CHECK:      Average Wait times (based on the timeline view):
2799# CHECK-NEXT: [0]: Executions
2800# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2801# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2802# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2803
2804# CHECK:            [0]    [1]    [2]    [3]
2805# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld3r	{ v1.16b, v2.16b, v3.16b }, [x27], x28
2806# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2807# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
2808# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2809# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
2810# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2811# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
2812# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2813# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
2814# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2815# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2816
2817# CHECK:      [36] Code Region - G37
2818
2819# CHECK:      Iterations:        100
2820# CHECK-NEXT: Instructions:      1000
2821# CHECK-NEXT: Total Cycles:      4701
2822# CHECK-NEXT: Total uOps:        1500
2823
2824# CHECK:      Dispatch Width:    2
2825# CHECK-NEXT: uOps Per Cycle:    0.32
2826# CHECK-NEXT: IPC:               0.21
2827# CHECK-NEXT: Block RThroughput: 32.0
2828
2829# CHECK:      Timeline view:
2830# CHECK-NEXT:                     0123456789          0123456789
2831# CHECK-NEXT: Index     0123456789          0123456789          01234567
2832
2833# CHECK:      [0,0]     DeeeeeeE  .    .    .    .    .    .    .    . .   ld4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
2834# CHECK-NEXT: [0,1]     .   DeeE  .    .    .    .    .    .    .    . .   add	x0, x27, #1
2835# CHECK-NEXT: [0,2]     .    . DeeeeeeeeeeE .    .    .    .    .    . .   ld4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
2836# CHECK-NEXT: [0,3]     .    .    .    DeeE .    .    .    .    .    . .   add	x0, x27, #1
2837# CHECK-NEXT: [0,4]     .    .    .    .  DeeeeeeeeeeE.    .    .    . .   ld4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
2838# CHECK-NEXT: [0,5]     .    .    .    .    .    .DeeE.    .    .    . .   add	x0, x27, #1
2839# CHECK-NEXT: [0,6]     .    .    .    .    .    .   DeeeeeeeeeeE    . .   ld4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
2840# CHECK-NEXT: [0,7]     .    .    .    .    .    .    .    . DeeE    . .   add	x0, x27, #1
2841# CHECK-NEXT: [0,8]     .    .    .    .    .    .    .    .    DeeeeeeE   ld4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
2842# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .    .   DeeE   add	x0, x27, #1
2843
2844# CHECK:      Average Wait times (based on the timeline view):
2845# CHECK-NEXT: [0]: Executions
2846# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2847# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2848# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2849
2850# CHECK:            [0]    [1]    [2]    [3]
2851# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
2852# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2853# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
2854# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2855# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
2856# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2857# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
2858# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2859# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
2860# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2861# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2862
2863# CHECK:      [37] Code Region - G38
2864
2865# CHECK:      Iterations:        100
2866# CHECK-NEXT: Instructions:      1000
2867# CHECK-NEXT: Total Cycles:      4701
2868# CHECK-NEXT: Total uOps:        1500
2869
2870# CHECK:      Dispatch Width:    2
2871# CHECK-NEXT: uOps Per Cycle:    0.32
2872# CHECK-NEXT: IPC:               0.21
2873# CHECK-NEXT: Block RThroughput: 32.0
2874
2875# CHECK:      Timeline view:
2876# CHECK-NEXT:                     0123456789          0123456789
2877# CHECK-NEXT: Index     0123456789          0123456789          01234567
2878
2879# CHECK:      [0,0]     DeeeeeeE  .    .    .    .    .    .    .    . .   ld4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
2880# CHECK-NEXT: [0,1]     .   DeeE  .    .    .    .    .    .    .    . .   add	x0, x27, #1
2881# CHECK-NEXT: [0,2]     .    . DeeeeeeeeeeE .    .    .    .    .    . .   ld4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
2882# CHECK-NEXT: [0,3]     .    .    .    DeeE .    .    .    .    .    . .   add	x0, x27, #1
2883# CHECK-NEXT: [0,4]     .    .    .    .  DeeeeeeE    .    .    .    . .   ld4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
2884# CHECK-NEXT: [0,5]     .    .    .    .    . DeeE    .    .    .    . .   add	x0, x27, #1
2885# CHECK-NEXT: [0,6]     .    .    .    .    .    DeeeeeeeeeeE   .    . .   ld4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
2886# CHECK-NEXT: [0,7]     .    .    .    .    .    .    .  DeeE   .    . .   add	x0, x27, #1
2887# CHECK-NEXT: [0,8]     .    .    .    .    .    .    .    .DeeeeeeeeeeE   ld4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
2888# CHECK-NEXT: [0,9]     .    .    .    .    .    .    .    .    .   DeeE   add	x0, x27, #1
2889
2890# CHECK:      Average Wait times (based on the timeline view):
2891# CHECK-NEXT: [0]: Executions
2892# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2893# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2894# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2895
2896# CHECK:            [0]    [1]    [2]    [3]
2897# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
2898# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2899# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
2900# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2901# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
2902# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2903# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
2904# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2905# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
2906# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2907# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2908
2909# CHECK:      [38] Code Region - G39
2910
2911# CHECK:      Iterations:        100
2912# CHECK-NEXT: Instructions:      1000
2913# CHECK-NEXT: Total Cycles:      2501
2914# CHECK-NEXT: Total uOps:        1500
2915
2916# CHECK:      Dispatch Width:    2
2917# CHECK-NEXT: uOps Per Cycle:    0.60
2918# CHECK-NEXT: IPC:               0.40
2919# CHECK-NEXT: Block RThroughput: 10.0
2920
2921# CHECK:      Timeline view:
2922# CHECK-NEXT:                     0123456789
2923# CHECK-NEXT: Index     0123456789          012345
2924
2925# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
2926# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2927# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
2928# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2929# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
2930# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2931# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
2932# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2933# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
2934# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2935
2936# CHECK:      Average Wait times (based on the timeline view):
2937# CHECK-NEXT: [0]: Executions
2938# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2939# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2940# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2941
2942# CHECK:            [0]    [1]    [2]    [3]
2943# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
2944# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2945# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
2946# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2947# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
2948# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2949# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
2950# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2951# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
2952# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2953# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
2954
2955# CHECK:      [39] Code Region - G40
2956
2957# CHECK:      Iterations:        100
2958# CHECK-NEXT: Instructions:      1000
2959# CHECK-NEXT: Total Cycles:      2501
2960# CHECK-NEXT: Total uOps:        1500
2961
2962# CHECK:      Dispatch Width:    2
2963# CHECK-NEXT: uOps Per Cycle:    0.60
2964# CHECK-NEXT: IPC:               0.40
2965# CHECK-NEXT: Block RThroughput: 10.0
2966
2967# CHECK:      Timeline view:
2968# CHECK-NEXT:                     0123456789
2969# CHECK-NEXT: Index     0123456789          012345
2970
2971# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
2972# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
2973# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
2974# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
2975# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
2976# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
2977# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
2978# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
2979# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
2980# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
2981
2982# CHECK:      Average Wait times (based on the timeline view):
2983# CHECK-NEXT: [0]: Executions
2984# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2985# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2986# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2987
2988# CHECK:            [0]    [1]    [2]    [3]
2989# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
2990# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
2991# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
2992# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
2993# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
2994# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
2995# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
2996# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
2997# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
2998# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
2999# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3000
3001# CHECK:      [40] Code Region - G41
3002
3003# CHECK:      Iterations:        100
3004# CHECK-NEXT: Instructions:      1000
3005# CHECK-NEXT: Total Cycles:      2501
3006# CHECK-NEXT: Total uOps:        1500
3007
3008# CHECK:      Dispatch Width:    2
3009# CHECK-NEXT: uOps Per Cycle:    0.60
3010# CHECK-NEXT: IPC:               0.40
3011# CHECK-NEXT: Block RThroughput: 10.0
3012
3013# CHECK:      Timeline view:
3014# CHECK-NEXT:                     0123456789
3015# CHECK-NEXT: Index     0123456789          012345
3016
3017# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
3018# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
3019# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
3020# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
3021# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld4r	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
3022# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
3023# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld4r	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
3024# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
3025# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld4r	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
3026# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
3027
3028# CHECK:      Average Wait times (based on the timeline view):
3029# CHECK-NEXT: [0]: Executions
3030# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3031# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3032# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3033
3034# CHECK:            [0]    [1]    [2]    [3]
3035# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
3036# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3037# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
3038# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3039# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4r	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
3040# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3041# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld4r	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
3042# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3043# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld4r	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
3044# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3045# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3046
3047# CHECK:      [41] Code Region - G42
3048
3049# CHECK:      Iterations:        100
3050# CHECK-NEXT: Instructions:      1000
3051# CHECK-NEXT: Total Cycles:      2501
3052# CHECK-NEXT: Total uOps:        1500
3053
3054# CHECK:      Dispatch Width:    2
3055# CHECK-NEXT: uOps Per Cycle:    0.60
3056# CHECK-NEXT: IPC:               0.40
3057# CHECK-NEXT: Block RThroughput: 10.0
3058
3059# CHECK:      Timeline view:
3060# CHECK-NEXT:                     0123456789
3061# CHECK-NEXT: Index     0123456789          012345
3062
3063# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld4r	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
3064# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
3065# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld4r	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
3066# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
3067# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld4r	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
3068# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
3069# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld4r	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
3070# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
3071# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld4r	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
3072# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
3073
3074# CHECK:      Average Wait times (based on the timeline view):
3075# CHECK-NEXT: [0]: Executions
3076# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3077# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3078# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3079
3080# CHECK:            [0]    [1]    [2]    [3]
3081# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld4r	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
3082# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3083# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4r	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
3084# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3085# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4r	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
3086# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3087# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld4r	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
3088# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3089# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld4r	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
3090# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3091# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3092
3093# CHECK:      [42] Code Region - G43
3094
3095# CHECK:      Iterations:        100
3096# CHECK-NEXT: Instructions:      1000
3097# CHECK-NEXT: Total Cycles:      2501
3098# CHECK-NEXT: Total uOps:        1500
3099
3100# CHECK:      Dispatch Width:    2
3101# CHECK-NEXT: uOps Per Cycle:    0.60
3102# CHECK-NEXT: IPC:               0.40
3103# CHECK-NEXT: Block RThroughput: 10.0
3104
3105# CHECK:      Timeline view:
3106# CHECK-NEXT:                     0123456789
3107# CHECK-NEXT: Index     0123456789          012345
3108
3109# CHECK:      [0,0]     DeeeeE    .    .    .    .   ld4r	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
3110# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
3111# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   ld4r	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
3112# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
3113# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ld4r	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
3114# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
3115# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   ld4r	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
3116# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
3117# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   ld4r	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
3118# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
3119
3120# CHECK:      Average Wait times (based on the timeline view):
3121# CHECK-NEXT: [0]: Executions
3122# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3123# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3124# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3125
3126# CHECK:            [0]    [1]    [2]    [3]
3127# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld4r	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
3128# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3129# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4r	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
3130# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3131# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4r	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
3132# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3133# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ld4r	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
3134# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3135# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ld4r	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
3136# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3137# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3138
3139# CHECK:      [43] Code Region - G44
3140
3141# CHECK:      Iterations:        100
3142# CHECK-NEXT: Instructions:      1000
3143# CHECK-NEXT: Total Cycles:      2401
3144# CHECK-NEXT: Total uOps:        1700
3145
3146# CHECK:      Dispatch Width:    2
3147# CHECK-NEXT: uOps Per Cycle:    0.71
3148# CHECK-NEXT: IPC:               0.42
3149# CHECK-NEXT: Block RThroughput: 9.0
3150
3151# CHECK:      Timeline view:
3152# CHECK-NEXT:                     0123456789
3153# CHECK-NEXT: Index     0123456789          01234
3154
3155# CHECK:      [0,0]     DeeeeE    .    .    .   .   ld4r	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
3156# CHECK-NEXT: [0,1]     . DeeE    .    .    .   .   add	x0, x27, #1
3157# CHECK-NEXT: [0,2]     .    DeeeeE    .    .   .   ld4r	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
3158# CHECK-NEXT: [0,3]     .    . DeeE    .    .   .   add	x0, x27, #1
3159# CHECK-NEXT: [0,4]     .    .    DeeeeE    .   .   ld4r	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
3160# CHECK-NEXT: [0,5]     .    .    . DeeE    .   .   add	x0, x27, #1
3161# CHECK-NEXT: [0,6]     .    .    .    DeeeE.   .   ldp	s1, s2, [x27], #248
3162# CHECK-NEXT: [0,7]     .    .    .    .DeeE.   .   add	x0, x27, #1
3163# CHECK-NEXT: [0,8]     .    .    .    .   DeeeeE   ldp	d1, d2, [x27], #496
3164# CHECK-NEXT: [0,9]     .    .    .    .    .DeeE   add	x0, x27, #1
3165
3166# CHECK:      Average Wait times (based on the timeline view):
3167# CHECK-NEXT: [0]: Executions
3168# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3169# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3170# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3171
3172# CHECK:            [0]    [1]    [2]    [3]
3173# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ld4r	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
3174# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3175# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ld4r	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
3176# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3177# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ld4r	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
3178# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3179# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ldp	s1, s2, [x27], #248
3180# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3181# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ldp	d1, d2, [x27], #496
3182# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3183# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3184
3185# CHECK:      [44] Code Region - G45
3186
3187# CHECK:      Iterations:        100
3188# CHECK-NEXT: Instructions:      1000
3189# CHECK-NEXT: Total Cycles:      2601
3190# CHECK-NEXT: Total uOps:        2000
3191
3192# CHECK:      Dispatch Width:    2
3193# CHECK-NEXT: uOps Per Cycle:    0.77
3194# CHECK-NEXT: IPC:               0.38
3195# CHECK-NEXT: Block RThroughput: 16.0
3196
3197# CHECK:      Timeline view:
3198# CHECK-NEXT:                     0123456789
3199# CHECK-NEXT: Index     0123456789          0123456
3200
3201# CHECK:      [0,0]     DeeeeeE   .    .    .    ..   ldp	q1, q2, [x27], #992
3202# CHECK-NEXT: [0,1]     .  DeeE   .    .    .    ..   add	x0, x27, #1
3203# CHECK-NEXT: [0,2]     .    .DeeeE    .    .    ..   ldp	s1, s2, [x27, #248]!
3204# CHECK-NEXT: [0,3]     .    . DeeE    .    .    ..   add	x0, x27, #1
3205# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    ..   ldp	d1, d2, [x27, #496]!
3206# CHECK-NEXT: [0,5]     .    .    . DeeE    .    ..   add	x0, x27, #1
3207# CHECK-NEXT: [0,6]     .    .    .    DeeeeeE   ..   ldp	q1, q2, [x27, #992]!
3208# CHECK-NEXT: [0,7]     .    .    .    .  DeeE   ..   add	x0, x27, #1
3209# CHECK-NEXT: [0,8]     .    .    .    .    .DeeeE.   ldp	w1, w2, [x27], #248
3210# CHECK-NEXT: [0,9]     .    .    .    .    .  DeeE   add	x0, x27, #1
3211
3212# CHECK:      Average Wait times (based on the timeline view):
3213# CHECK-NEXT: [0]: Executions
3214# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3215# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3216# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3217
3218# CHECK:            [0]    [1]    [2]    [3]
3219# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldp	q1, q2, [x27], #992
3220# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3221# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldp	s1, s2, [x27, #248]!
3222# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3223# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ldp	d1, d2, [x27, #496]!
3224# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3225# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ldp	q1, q2, [x27, #992]!
3226# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3227# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ldp	w1, w2, [x27], #248
3228# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3229# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3230
3231# CHECK:      [45] Code Region - G46
3232
3233# CHECK:      Iterations:        100
3234# CHECK-NEXT: Instructions:      1000
3235# CHECK-NEXT: Total Cycles:      2501
3236# CHECK-NEXT: Total uOps:        2000
3237
3238# CHECK:      Dispatch Width:    2
3239# CHECK-NEXT: uOps Per Cycle:    0.80
3240# CHECK-NEXT: IPC:               0.40
3241# CHECK-NEXT: Block RThroughput: 10.0
3242
3243# CHECK:      Timeline view:
3244# CHECK-NEXT:                     0123456789
3245# CHECK-NEXT: Index     0123456789          012345
3246
3247# CHECK:      [0,0]     DeeeeE    .    .    .    .   ldp	x1, x2, [x27], #496
3248# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
3249# CHECK-NEXT: [0,2]     .    DeeeE.    .    .    .   ldp	w1, w2, [x27, #248]!
3250# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
3251# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   ldp	x1, x2, [x27, #496]!
3252# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
3253# CHECK-NEXT: [0,6]     .    .    .    DeeeE.    .   ldpsw	x1, x2, [x27], #248
3254# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
3255# CHECK-NEXT: [0,8]     .    .    .    .    DeeeE.   ldpsw	x1, x2, [x27, #248]!
3256# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
3257
3258# CHECK:      Average Wait times (based on the timeline view):
3259# CHECK-NEXT: [0]: Executions
3260# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3261# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3262# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3263
3264# CHECK:            [0]    [1]    [2]    [3]
3265# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldp	x1, x2, [x27], #496
3266# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3267# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldp	w1, w2, [x27, #248]!
3268# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3269# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ldp	x1, x2, [x27, #496]!
3270# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3271# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ldpsw	x1, x2, [x27], #248
3272# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3273# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ldpsw	x1, x2, [x27, #248]!
3274# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3275# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3276
3277# CHECK:      [46] Code Region - G47
3278
3279# CHECK:      Iterations:        100
3280# CHECK-NEXT: Instructions:      1000
3281# CHECK-NEXT: Total Cycles:      2001
3282# CHECK-NEXT: Total uOps:        1500
3283
3284# CHECK:      Dispatch Width:    2
3285# CHECK-NEXT: uOps Per Cycle:    0.75
3286# CHECK-NEXT: IPC:               0.50
3287# CHECK-NEXT: Block RThroughput: 7.5
3288
3289# CHECK:      Timeline view:
3290# CHECK-NEXT:                     0123456789
3291# CHECK-NEXT: Index     0123456789          0
3292
3293# CHECK:      [0,0]     DeeE .    .    .    .   ldr	b1, [x27], #254
3294# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3295# CHECK-NEXT: [0,2]     .   DeeE  .    .    .   ldr	h1, [x27], #254
3296# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3297# CHECK-NEXT: [0,4]     .    .  DeeE   .    .   ldr	s1, [x27], #254
3298# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3299# CHECK-NEXT: [0,6]     .    .    . DeeE    .   ldr	d1, [x27], #254
3300# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3301# CHECK-NEXT: [0,8]     .    .    .    .DeeE.   ldr	q1, [x27], #254
3302# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3303
3304# CHECK:      Average Wait times (based on the timeline view):
3305# CHECK-NEXT: [0]: Executions
3306# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3307# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3308# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3309
3310# CHECK:            [0]    [1]    [2]    [3]
3311# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldr	b1, [x27], #254
3312# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3313# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldr	h1, [x27], #254
3314# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3315# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ldr	s1, [x27], #254
3316# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3317# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ldr	d1, [x27], #254
3318# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3319# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ldr	q1, [x27], #254
3320# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3321# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3322
3323# CHECK:      [47] Code Region - G48
3324
3325# CHECK:      Iterations:        100
3326# CHECK-NEXT: Instructions:      1000
3327# CHECK-NEXT: Total Cycles:      2001
3328# CHECK-NEXT: Total uOps:        1500
3329
3330# CHECK:      Dispatch Width:    2
3331# CHECK-NEXT: uOps Per Cycle:    0.75
3332# CHECK-NEXT: IPC:               0.50
3333# CHECK-NEXT: Block RThroughput: 7.5
3334
3335# CHECK:      Timeline view:
3336# CHECK-NEXT:                     0123456789
3337# CHECK-NEXT: Index     0123456789          0
3338
3339# CHECK:      [0,0]     DeeE .    .    .    .   ldr	b1, [x27, #254]!
3340# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3341# CHECK-NEXT: [0,2]     .   DeeE  .    .    .   ldr	h1, [x27, #254]!
3342# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3343# CHECK-NEXT: [0,4]     .    .  DeeE   .    .   ldr	s1, [x27, #254]!
3344# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3345# CHECK-NEXT: [0,6]     .    .    . DeeE    .   ldr	d1, [x27, #254]!
3346# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3347# CHECK-NEXT: [0,8]     .    .    .    .DeeE.   ldr	q1, [x27, #254]!
3348# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3349
3350# CHECK:      Average Wait times (based on the timeline view):
3351# CHECK-NEXT: [0]: Executions
3352# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3353# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3354# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3355
3356# CHECK:            [0]    [1]    [2]    [3]
3357# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldr	b1, [x27, #254]!
3358# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3359# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldr	h1, [x27, #254]!
3360# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3361# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ldr	s1, [x27, #254]!
3362# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3363# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ldr	d1, [x27, #254]!
3364# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3365# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ldr	q1, [x27, #254]!
3366# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3367# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3368
3369# CHECK:      [48] Code Region - G49
3370
3371# CHECK:      Iterations:        100
3372# CHECK-NEXT: Instructions:      1000
3373# CHECK-NEXT: Total Cycles:      2001
3374# CHECK-NEXT: Total uOps:        1500
3375
3376# CHECK:      Dispatch Width:    2
3377# CHECK-NEXT: uOps Per Cycle:    0.75
3378# CHECK-NEXT: IPC:               0.50
3379# CHECK-NEXT: Block RThroughput: 7.5
3380
3381# CHECK:      Timeline view:
3382# CHECK-NEXT:                     0123456789
3383# CHECK-NEXT: Index     0123456789          0
3384
3385# CHECK:      [0,0]     DeeE .    .    .    .   ldr	w1, [x27], #254
3386# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3387# CHECK-NEXT: [0,2]     .   DeeE  .    .    .   ldr	x1, [x27], #254
3388# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3389# CHECK-NEXT: [0,4]     .    .  DeeE   .    .   ldr	w1, [x27, #254]!
3390# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3391# CHECK-NEXT: [0,6]     .    .    . DeeE    .   ldr	x1, [x27, #254]!
3392# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3393# CHECK-NEXT: [0,8]     .    .    .    .DeeE.   ldrb	w1, [x27], #254
3394# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3395
3396# CHECK:      Average Wait times (based on the timeline view):
3397# CHECK-NEXT: [0]: Executions
3398# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3399# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3400# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3401
3402# CHECK:            [0]    [1]    [2]    [3]
3403# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldr	w1, [x27], #254
3404# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3405# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldr	x1, [x27], #254
3406# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3407# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ldr	w1, [x27, #254]!
3408# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3409# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ldr	x1, [x27, #254]!
3410# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3411# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ldrb	w1, [x27], #254
3412# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3413# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3414
3415# CHECK:      [49] Code Region - G50
3416
3417# CHECK:      Iterations:        100
3418# CHECK-NEXT: Instructions:      1000
3419# CHECK-NEXT: Total Cycles:      2001
3420# CHECK-NEXT: Total uOps:        1500
3421
3422# CHECK:      Dispatch Width:    2
3423# CHECK-NEXT: uOps Per Cycle:    0.75
3424# CHECK-NEXT: IPC:               0.50
3425# CHECK-NEXT: Block RThroughput: 7.5
3426
3427# CHECK:      Timeline view:
3428# CHECK-NEXT:                     0123456789
3429# CHECK-NEXT: Index     0123456789          0
3430
3431# CHECK:      [0,0]     DeeE .    .    .    .   ldrb	w1, [x27, #254]!
3432# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3433# CHECK-NEXT: [0,2]     .   DeeE  .    .    .   ldrh	w1, [x27], #254
3434# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3435# CHECK-NEXT: [0,4]     .    .  DeeE   .    .   ldrh	w1, [x27, #254]!
3436# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3437# CHECK-NEXT: [0,6]     .    .    . DeeE    .   ldrsb	w1, [x27], #254
3438# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3439# CHECK-NEXT: [0,8]     .    .    .    .DeeE.   ldrsb	x1, [x27], #254
3440# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3441
3442# CHECK:      Average Wait times (based on the timeline view):
3443# CHECK-NEXT: [0]: Executions
3444# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3445# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3446# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3447
3448# CHECK:            [0]    [1]    [2]    [3]
3449# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldrb	w1, [x27, #254]!
3450# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3451# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldrh	w1, [x27], #254
3452# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3453# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ldrh	w1, [x27, #254]!
3454# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3455# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ldrsb	w1, [x27], #254
3456# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3457# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ldrsb	x1, [x27], #254
3458# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3459# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3460
3461# CHECK:      [50] Code Region - G51
3462
3463# CHECK:      Iterations:        100
3464# CHECK-NEXT: Instructions:      1000
3465# CHECK-NEXT: Total Cycles:      2001
3466# CHECK-NEXT: Total uOps:        1500
3467
3468# CHECK:      Dispatch Width:    2
3469# CHECK-NEXT: uOps Per Cycle:    0.75
3470# CHECK-NEXT: IPC:               0.50
3471# CHECK-NEXT: Block RThroughput: 7.5
3472
3473# CHECK:      Timeline view:
3474# CHECK-NEXT:                     0123456789
3475# CHECK-NEXT: Index     0123456789          0
3476
3477# CHECK:      [0,0]     DeeE .    .    .    .   ldrsb	w1, [x27, #254]!
3478# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3479# CHECK-NEXT: [0,2]     .   DeeE  .    .    .   ldrsb	x1, [x27, #254]!
3480# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3481# CHECK-NEXT: [0,4]     .    .  DeeE   .    .   ldrsh	w1, [x27], #254
3482# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3483# CHECK-NEXT: [0,6]     .    .    . DeeE    .   ldrsh	x1, [x27], #254
3484# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3485# CHECK-NEXT: [0,8]     .    .    .    .DeeE.   ldrsh	w1, [x27, #254]!
3486# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3487
3488# CHECK:      Average Wait times (based on the timeline view):
3489# CHECK-NEXT: [0]: Executions
3490# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3491# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3492# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3493
3494# CHECK:            [0]    [1]    [2]    [3]
3495# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldrsb	w1, [x27, #254]!
3496# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3497# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldrsb	x1, [x27, #254]!
3498# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3499# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ldrsh	w1, [x27], #254
3500# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3501# CHECK-NEXT: 6.     1     0.0    0.0    0.0       ldrsh	x1, [x27], #254
3502# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3503# CHECK-NEXT: 8.     1     0.0    0.0    0.0       ldrsh	w1, [x27, #254]!
3504# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3505# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3506
3507# CHECK:      [51] Code Region - G52
3508
3509# CHECK:      Iterations:        100
3510# CHECK-NEXT: Instructions:      1000
3511# CHECK-NEXT: Total Cycles:      2001
3512# CHECK-NEXT: Total uOps:        1500
3513
3514# CHECK:      Dispatch Width:    2
3515# CHECK-NEXT: uOps Per Cycle:    0.75
3516# CHECK-NEXT: IPC:               0.50
3517# CHECK-NEXT: Block RThroughput: 7.5
3518
3519# CHECK:      Timeline view:
3520# CHECK-NEXT:                     0123456789
3521# CHECK-NEXT: Index     0123456789          0
3522
3523# CHECK:      [0,0]     DeeE .    .    .    .   ldrsh	x1, [x27, #254]!
3524# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3525# CHECK-NEXT: [0,2]     .   DeeE  .    .    .   ldrsw	x1, [x27], #254
3526# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3527# CHECK-NEXT: [0,4]     .    .  DeeE   .    .   ldrsw	x1, [x27, #254]!
3528# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3529# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   st1	{ v1.1d }, [x27], #8
3530# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3531# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   st1	{ v1.2d }, [x27], #16
3532# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3533
3534# CHECK:      Average Wait times (based on the timeline view):
3535# CHECK-NEXT: [0]: Executions
3536# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3537# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3538# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3539
3540# CHECK:            [0]    [1]    [2]    [3]
3541# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldrsh	x1, [x27, #254]!
3542# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3543# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldrsw	x1, [x27], #254
3544# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3545# CHECK-NEXT: 4.     1     0.0    0.0    0.0       ldrsw	x1, [x27, #254]!
3546# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3547# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.1d }, [x27], #8
3548# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3549# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.2d }, [x27], #16
3550# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3551# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3552
3553# CHECK:      [52] Code Region - G53
3554
3555# CHECK:      Iterations:        100
3556# CHECK-NEXT: Instructions:      1000
3557# CHECK-NEXT: Total Cycles:      2001
3558# CHECK-NEXT: Total uOps:        1500
3559
3560# CHECK:      Dispatch Width:    2
3561# CHECK-NEXT: uOps Per Cycle:    0.75
3562# CHECK-NEXT: IPC:               0.50
3563# CHECK-NEXT: Block RThroughput: 7.5
3564
3565# CHECK:      Timeline view:
3566# CHECK-NEXT:                     0123456789
3567# CHECK-NEXT: Index     0123456789          0
3568
3569# CHECK:      [0,0]     DeeeE.    .    .    .   st1	{ v1.2s }, [x27], #8
3570# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3571# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   st1	{ v1.4h }, [x27], #8
3572# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3573# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   st1	{ v1.4s }, [x27], #16
3574# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3575# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   st1	{ v1.8b }, [x27], #8
3576# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3577# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   st1	{ v1.8h }, [x27], #16
3578# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3579
3580# CHECK:      Average Wait times (based on the timeline view):
3581# CHECK-NEXT: [0]: Executions
3582# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3583# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3584# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3585
3586# CHECK:            [0]    [1]    [2]    [3]
3587# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.2s }, [x27], #8
3588# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3589# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.4h }, [x27], #8
3590# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3591# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.4s }, [x27], #16
3592# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3593# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.8b }, [x27], #8
3594# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3595# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.8h }, [x27], #16
3596# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3597# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3598
3599# CHECK:      [53] Code Region - G54
3600
3601# CHECK:      Iterations:        100
3602# CHECK-NEXT: Instructions:      1000
3603# CHECK-NEXT: Total Cycles:      2001
3604# CHECK-NEXT: Total uOps:        1500
3605
3606# CHECK:      Dispatch Width:    2
3607# CHECK-NEXT: uOps Per Cycle:    0.75
3608# CHECK-NEXT: IPC:               0.50
3609# CHECK-NEXT: Block RThroughput: 7.5
3610
3611# CHECK:      Timeline view:
3612# CHECK-NEXT:                     0123456789
3613# CHECK-NEXT: Index     0123456789          0
3614
3615# CHECK:      [0,0]     DeeeE.    .    .    .   st1	{ v1.16b }, [x27], #16
3616# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3617# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   st1	{ v1.1d }, [x27], x28
3618# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3619# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   st1	{ v1.2d }, [x27], x28
3620# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3621# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   st1	{ v1.2s }, [x27], x28
3622# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3623# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   st1	{ v1.4h }, [x27], x28
3624# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3625
3626# CHECK:      Average Wait times (based on the timeline view):
3627# CHECK-NEXT: [0]: Executions
3628# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3629# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3630# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3631
3632# CHECK:            [0]    [1]    [2]    [3]
3633# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.16b }, [x27], #16
3634# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3635# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.1d }, [x27], x28
3636# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3637# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.2d }, [x27], x28
3638# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3639# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.2s }, [x27], x28
3640# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3641# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.4h }, [x27], x28
3642# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3643# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3644
3645# CHECK:      [54] Code Region - G55
3646
3647# CHECK:      Iterations:        100
3648# CHECK-NEXT: Instructions:      1000
3649# CHECK-NEXT: Total Cycles:      2001
3650# CHECK-NEXT: Total uOps:        1500
3651
3652# CHECK:      Dispatch Width:    2
3653# CHECK-NEXT: uOps Per Cycle:    0.75
3654# CHECK-NEXT: IPC:               0.50
3655# CHECK-NEXT: Block RThroughput: 7.5
3656
3657# CHECK:      Timeline view:
3658# CHECK-NEXT:                     0123456789
3659# CHECK-NEXT: Index     0123456789          0
3660
3661# CHECK:      [0,0]     DeeeE.    .    .    .   st1	{ v1.4s }, [x27], x28
3662# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3663# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   st1	{ v1.8b }, [x27], x28
3664# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3665# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   st1	{ v1.8h }, [x27], x28
3666# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3667# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   st1	{ v1.16b }, [x27], x28
3668# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3669# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   st1	{ v1.1d, v2.1d }, [x27], #16
3670# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3671
3672# CHECK:      Average Wait times (based on the timeline view):
3673# CHECK-NEXT: [0]: Executions
3674# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3675# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3676# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3677
3678# CHECK:            [0]    [1]    [2]    [3]
3679# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.4s }, [x27], x28
3680# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3681# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.8b }, [x27], x28
3682# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3683# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.8h }, [x27], x28
3684# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3685# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.16b }, [x27], x28
3686# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3687# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.1d, v2.1d }, [x27], #16
3688# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3689# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3690
3691# CHECK:      [55] Code Region - G56
3692
3693# CHECK:      Iterations:        100
3694# CHECK-NEXT: Instructions:      1000
3695# CHECK-NEXT: Total Cycles:      2001
3696# CHECK-NEXT: Total uOps:        1500
3697
3698# CHECK:      Dispatch Width:    2
3699# CHECK-NEXT: uOps Per Cycle:    0.75
3700# CHECK-NEXT: IPC:               0.50
3701# CHECK-NEXT: Block RThroughput: 7.5
3702
3703# CHECK:      Timeline view:
3704# CHECK-NEXT:                     0123456789
3705# CHECK-NEXT: Index     0123456789          0
3706
3707# CHECK:      [0,0]     DeeeE.    .    .    .   st1	{ v1.2d, v2.2d }, [x27], #32
3708# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3709# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   st1	{ v1.2s, v2.2s }, [x27], #16
3710# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3711# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   st1	{ v1.4h, v2.4h }, [x27], #16
3712# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3713# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   st1	{ v1.4s, v2.4s }, [x27], #32
3714# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3715# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   st1	{ v1.8b, v2.8b }, [x27], #16
3716# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3717
3718# CHECK:      Average Wait times (based on the timeline view):
3719# CHECK-NEXT: [0]: Executions
3720# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3721# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3722# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3723
3724# CHECK:            [0]    [1]    [2]    [3]
3725# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.2d, v2.2d }, [x27], #32
3726# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3727# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.2s, v2.2s }, [x27], #16
3728# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3729# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.4h, v2.4h }, [x27], #16
3730# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3731# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.4s, v2.4s }, [x27], #32
3732# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3733# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.8b, v2.8b }, [x27], #16
3734# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3735# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3736
3737# CHECK:      [56] Code Region - G57
3738
3739# CHECK:      Iterations:        100
3740# CHECK-NEXT: Instructions:      1000
3741# CHECK-NEXT: Total Cycles:      2001
3742# CHECK-NEXT: Total uOps:        1500
3743
3744# CHECK:      Dispatch Width:    2
3745# CHECK-NEXT: uOps Per Cycle:    0.75
3746# CHECK-NEXT: IPC:               0.50
3747# CHECK-NEXT: Block RThroughput: 7.5
3748
3749# CHECK:      Timeline view:
3750# CHECK-NEXT:                     0123456789
3751# CHECK-NEXT: Index     0123456789          0
3752
3753# CHECK:      [0,0]     DeeeE.    .    .    .   st1	{ v1.8h, v2.8h }, [x27], #32
3754# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3755# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   st1	{ v1.16b, v2.16b }, [x27], #32
3756# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3757# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   st1	{ v1.1d, v2.1d }, [x27], x28
3758# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3759# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   st1	{ v1.2d, v2.2d }, [x27], x28
3760# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3761# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   st1	{ v1.2s, v2.2s }, [x27], x28
3762# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3763
3764# CHECK:      Average Wait times (based on the timeline view):
3765# CHECK-NEXT: [0]: Executions
3766# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3767# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3768# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3769
3770# CHECK:            [0]    [1]    [2]    [3]
3771# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.8h, v2.8h }, [x27], #32
3772# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3773# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.16b, v2.16b }, [x27], #32
3774# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3775# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.1d, v2.1d }, [x27], x28
3776# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3777# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.2d, v2.2d }, [x27], x28
3778# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3779# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.2s, v2.2s }, [x27], x28
3780# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3781# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3782
3783# CHECK:      [57] Code Region - G58
3784
3785# CHECK:      Iterations:        100
3786# CHECK-NEXT: Instructions:      1000
3787# CHECK-NEXT: Total Cycles:      2001
3788# CHECK-NEXT: Total uOps:        1500
3789
3790# CHECK:      Dispatch Width:    2
3791# CHECK-NEXT: uOps Per Cycle:    0.75
3792# CHECK-NEXT: IPC:               0.50
3793# CHECK-NEXT: Block RThroughput: 7.5
3794
3795# CHECK:      Timeline view:
3796# CHECK-NEXT:                     0123456789
3797# CHECK-NEXT: Index     0123456789          0
3798
3799# CHECK:      [0,0]     DeeeE.    .    .    .   st1	{ v1.4h, v2.4h }, [x27], x28
3800# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
3801# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   st1	{ v1.4s, v2.4s }, [x27], x28
3802# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
3803# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   st1	{ v1.8b, v2.8b }, [x27], x28
3804# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
3805# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   st1	{ v1.8h, v2.8h }, [x27], x28
3806# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
3807# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   st1	{ v1.16b, v2.16b }, [x27], x28
3808# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
3809
3810# CHECK:      Average Wait times (based on the timeline view):
3811# CHECK-NEXT: [0]: Executions
3812# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3813# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3814# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3815
3816# CHECK:            [0]    [1]    [2]    [3]
3817# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.4h, v2.4h }, [x27], x28
3818# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3819# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.4s, v2.4s }, [x27], x28
3820# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3821# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.8b, v2.8b }, [x27], x28
3822# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3823# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.8h, v2.8h }, [x27], x28
3824# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3825# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.16b, v2.16b }, [x27], x28
3826# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3827# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3828
3829# CHECK:      [58] Code Region - G59
3830
3831# CHECK:      Iterations:        100
3832# CHECK-NEXT: Instructions:      1000
3833# CHECK-NEXT: Total Cycles:      2501
3834# CHECK-NEXT: Total uOps:        1500
3835
3836# CHECK:      Dispatch Width:    2
3837# CHECK-NEXT: uOps Per Cycle:    0.60
3838# CHECK-NEXT: IPC:               0.40
3839# CHECK-NEXT: Block RThroughput: 10.0
3840
3841# CHECK:      Timeline view:
3842# CHECK-NEXT:                     0123456789
3843# CHECK-NEXT: Index     0123456789          012345
3844
3845# CHECK:      [0,0]     DeeeeE    .    .    .    .   st1	{ v1.1d, v2.1d, v3.1d }, [x27], #24
3846# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
3847# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st1	{ v1.2d, v2.2d, v3.2d }, [x27], #48
3848# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
3849# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st1	{ v1.2s, v2.2s, v3.2s }, [x27], #24
3850# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
3851# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st1	{ v1.4h, v2.4h, v3.4h }, [x27], #24
3852# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
3853# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st1	{ v1.4s, v2.4s, v3.4s }, [x27], #48
3854# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
3855
3856# CHECK:      Average Wait times (based on the timeline view):
3857# CHECK-NEXT: [0]: Executions
3858# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3859# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3860# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3861
3862# CHECK:            [0]    [1]    [2]    [3]
3863# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.1d, v2.1d, v3.1d }, [x27], #24
3864# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3865# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.2d, v2.2d, v3.2d }, [x27], #48
3866# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3867# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.2s, v2.2s, v3.2s }, [x27], #24
3868# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3869# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.4h, v2.4h, v3.4h }, [x27], #24
3870# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3871# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.4s, v2.4s, v3.4s }, [x27], #48
3872# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3873# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3874
3875# CHECK:      [59] Code Region - G60
3876
3877# CHECK:      Iterations:        100
3878# CHECK-NEXT: Instructions:      1000
3879# CHECK-NEXT: Total Cycles:      2501
3880# CHECK-NEXT: Total uOps:        1500
3881
3882# CHECK:      Dispatch Width:    2
3883# CHECK-NEXT: uOps Per Cycle:    0.60
3884# CHECK-NEXT: IPC:               0.40
3885# CHECK-NEXT: Block RThroughput: 10.0
3886
3887# CHECK:      Timeline view:
3888# CHECK-NEXT:                     0123456789
3889# CHECK-NEXT: Index     0123456789          012345
3890
3891# CHECK:      [0,0]     DeeeeE    .    .    .    .   st1	{ v1.8b, v2.8b, v3.8b }, [x27], #24
3892# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
3893# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st1	{ v1.8h, v2.8h, v3.8h }, [x27], #48
3894# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
3895# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st1	{ v1.16b, v2.16b, v3.16b }, [x27], #48
3896# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
3897# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st1	{ v1.1d, v2.1d, v3.1d }, [x27], x28
3898# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
3899# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st1	{ v1.2d, v2.2d, v3.2d }, [x27], x28
3900# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
3901
3902# CHECK:      Average Wait times (based on the timeline view):
3903# CHECK-NEXT: [0]: Executions
3904# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3905# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3906# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3907
3908# CHECK:            [0]    [1]    [2]    [3]
3909# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.8b, v2.8b, v3.8b }, [x27], #24
3910# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3911# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.8h, v2.8h, v3.8h }, [x27], #48
3912# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3913# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.16b, v2.16b, v3.16b }, [x27], #48
3914# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3915# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.1d, v2.1d, v3.1d }, [x27], x28
3916# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3917# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.2d, v2.2d, v3.2d }, [x27], x28
3918# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3919# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3920
3921# CHECK:      [60] Code Region - G61
3922
3923# CHECK:      Iterations:        100
3924# CHECK-NEXT: Instructions:      1000
3925# CHECK-NEXT: Total Cycles:      2501
3926# CHECK-NEXT: Total uOps:        1500
3927
3928# CHECK:      Dispatch Width:    2
3929# CHECK-NEXT: uOps Per Cycle:    0.60
3930# CHECK-NEXT: IPC:               0.40
3931# CHECK-NEXT: Block RThroughput: 10.0
3932
3933# CHECK:      Timeline view:
3934# CHECK-NEXT:                     0123456789
3935# CHECK-NEXT: Index     0123456789          012345
3936
3937# CHECK:      [0,0]     DeeeeE    .    .    .    .   st1	{ v1.2s, v2.2s, v3.2s }, [x27], x28
3938# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
3939# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st1	{ v1.4h, v2.4h, v3.4h }, [x27], x28
3940# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
3941# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st1	{ v1.4s, v2.4s, v3.4s }, [x27], x28
3942# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
3943# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st1	{ v1.8b, v2.8b, v3.8b }, [x27], x28
3944# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
3945# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st1	{ v1.8h, v2.8h, v3.8h }, [x27], x28
3946# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
3947
3948# CHECK:      Average Wait times (based on the timeline view):
3949# CHECK-NEXT: [0]: Executions
3950# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3951# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3952# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3953
3954# CHECK:            [0]    [1]    [2]    [3]
3955# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.2s, v2.2s, v3.2s }, [x27], x28
3956# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
3957# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.4h, v2.4h, v3.4h }, [x27], x28
3958# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
3959# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.4s, v2.4s, v3.4s }, [x27], x28
3960# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
3961# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.8b, v2.8b, v3.8b }, [x27], x28
3962# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
3963# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.8h, v2.8h, v3.8h }, [x27], x28
3964# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
3965# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
3966
3967# CHECK:      [61] Code Region - G62
3968
3969# CHECK:      Iterations:        100
3970# CHECK-NEXT: Instructions:      1000
3971# CHECK-NEXT: Total Cycles:      2501
3972# CHECK-NEXT: Total uOps:        1500
3973
3974# CHECK:      Dispatch Width:    2
3975# CHECK-NEXT: uOps Per Cycle:    0.60
3976# CHECK-NEXT: IPC:               0.40
3977# CHECK-NEXT: Block RThroughput: 18.0
3978
3979# CHECK:      Timeline view:
3980# CHECK-NEXT:                     0123456789
3981# CHECK-NEXT: Index     0123456789          012345
3982
3983# CHECK:      [0,0]     DeeeeE    .    .    .    .   st1	{ v1.16b, v2.16b, v3.16b }, [x27], x28
3984# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
3985# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
3986# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
3987# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
3988# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
3989# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
3990# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
3991# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
3992# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
3993
3994# CHECK:      Average Wait times (based on the timeline view):
3995# CHECK-NEXT: [0]: Executions
3996# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3997# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3998# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3999
4000# CHECK:            [0]    [1]    [2]    [3]
4001# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.16b, v2.16b, v3.16b }, [x27], x28
4002# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4003# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
4004# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4005# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
4006# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4007# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
4008# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4009# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
4010# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4011# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4012
4013# CHECK:      [62] Code Region - G63
4014
4015# CHECK:      Iterations:        100
4016# CHECK-NEXT: Instructions:      1000
4017# CHECK-NEXT: Total Cycles:      2501
4018# CHECK-NEXT: Total uOps:        1500
4019
4020# CHECK:      Dispatch Width:    2
4021# CHECK-NEXT: uOps Per Cycle:    0.60
4022# CHECK-NEXT: IPC:               0.40
4023# CHECK-NEXT: Block RThroughput: 20.0
4024
4025# CHECK:      Timeline view:
4026# CHECK-NEXT:                     0123456789
4027# CHECK-NEXT: Index     0123456789          012345
4028
4029# CHECK:      [0,0]     DeeeeE    .    .    .    .   st1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
4030# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4031# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
4032# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4033# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
4034# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4035# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
4036# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4037# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
4038# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4039
4040# CHECK:      Average Wait times (based on the timeline view):
4041# CHECK-NEXT: [0]: Executions
4042# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4043# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4044# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4045
4046# CHECK:            [0]    [1]    [2]    [3]
4047# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
4048# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4049# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
4050# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4051# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
4052# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4053# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
4054# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4055# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
4056# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4057# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4058
4059# CHECK:      [63] Code Region - G64
4060
4061# CHECK:      Iterations:        100
4062# CHECK-NEXT: Instructions:      1000
4063# CHECK-NEXT: Total Cycles:      2501
4064# CHECK-NEXT: Total uOps:        1500
4065
4066# CHECK:      Dispatch Width:    2
4067# CHECK-NEXT: uOps Per Cycle:    0.60
4068# CHECK-NEXT: IPC:               0.40
4069# CHECK-NEXT: Block RThroughput: 20.0
4070
4071# CHECK:      Timeline view:
4072# CHECK-NEXT:                     0123456789
4073# CHECK-NEXT: Index     0123456789          012345
4074
4075# CHECK:      [0,0]     DeeeeE    .    .    .    .   st1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
4076# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4077# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
4078# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4079# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
4080# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4081# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
4082# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4083# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
4084# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4085
4086# CHECK:      Average Wait times (based on the timeline view):
4087# CHECK-NEXT: [0]: Executions
4088# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4089# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4090# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4091
4092# CHECK:            [0]    [1]    [2]    [3]
4093# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
4094# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4095# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
4096# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4097# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
4098# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4099# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
4100# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4101# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
4102# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4103# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4104
4105# CHECK:      [64] Code Region - G65
4106
4107# CHECK:      Iterations:        100
4108# CHECK-NEXT: Instructions:      1000
4109# CHECK-NEXT: Total Cycles:      2201
4110# CHECK-NEXT: Total uOps:        1500
4111
4112# CHECK:      Dispatch Width:    2
4113# CHECK-NEXT: uOps Per Cycle:    0.68
4114# CHECK-NEXT: IPC:               0.45
4115# CHECK-NEXT: Block RThroughput: 11.0
4116
4117# CHECK:      Timeline view:
4118# CHECK-NEXT:                     0123456789
4119# CHECK-NEXT: Index     0123456789          012
4120
4121# CHECK:      [0,0]     DeeeeE    .    .    . .   st1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
4122# CHECK-NEXT: [0,1]     . DeeE    .    .    . .   add	x0, x27, #1
4123# CHECK-NEXT: [0,2]     .    DeeeeE    .    . .   st1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
4124# CHECK-NEXT: [0,3]     .    . DeeE    .    . .   add	x0, x27, #1
4125# CHECK-NEXT: [0,4]     .    .    DeeeE.    . .   st1	{ v1.b }[0], [x27], #1
4126# CHECK-NEXT: [0,5]     .    .    .DeeE.    . .   add	x0, x27, #1
4127# CHECK-NEXT: [0,6]     .    .    .   DeeeE . .   st1	{ v1.b }[8], [x27], #1
4128# CHECK-NEXT: [0,7]     .    .    .    DeeE . .   add	x0, x27, #1
4129# CHECK-NEXT: [0,8]     .    .    .    .  DeeeE   st1	{ v1.b }[0], [x27], x28
4130# CHECK-NEXT: [0,9]     .    .    .    .   DeeE   add	x0, x27, #1
4131
4132# CHECK:      Average Wait times (based on the timeline view):
4133# CHECK-NEXT: [0]: Executions
4134# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4135# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4136# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4137
4138# CHECK:            [0]    [1]    [2]    [3]
4139# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
4140# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4141# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
4142# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4143# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.b }[0], [x27], #1
4144# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4145# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.b }[8], [x27], #1
4146# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4147# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.b }[0], [x27], x28
4148# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4149# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4150
4151# CHECK:      [65] Code Region - G66
4152
4153# CHECK:      Iterations:        100
4154# CHECK-NEXT: Instructions:      1000
4155# CHECK-NEXT: Total Cycles:      2001
4156# CHECK-NEXT: Total uOps:        1500
4157
4158# CHECK:      Dispatch Width:    2
4159# CHECK-NEXT: uOps Per Cycle:    0.75
4160# CHECK-NEXT: IPC:               0.50
4161# CHECK-NEXT: Block RThroughput: 7.5
4162
4163# CHECK:      Timeline view:
4164# CHECK-NEXT:                     0123456789
4165# CHECK-NEXT: Index     0123456789          0
4166
4167# CHECK:      [0,0]     DeeeE.    .    .    .   st1	{ v1.b }[8], [x27], x28
4168# CHECK-NEXT: [0,1]     .DeeE.    .    .    .   add	x0, x27, #1
4169# CHECK-NEXT: [0,2]     .   DeeeE .    .    .   st1	{ v1.h }[0], [x27], #2
4170# CHECK-NEXT: [0,3]     .    DeeE .    .    .   add	x0, x27, #1
4171# CHECK-NEXT: [0,4]     .    .  DeeeE  .    .   st1	{ v1.h }[4], [x27], #2
4172# CHECK-NEXT: [0,5]     .    .   DeeE  .    .   add	x0, x27, #1
4173# CHECK-NEXT: [0,6]     .    .    . DeeeE   .   st1	{ v1.h }[0], [x27], x28
4174# CHECK-NEXT: [0,7]     .    .    .  DeeE   .   add	x0, x27, #1
4175# CHECK-NEXT: [0,8]     .    .    .    .DeeeE   st1	{ v1.h }[4], [x27], x28
4176# CHECK-NEXT: [0,9]     .    .    .    . DeeE   add	x0, x27, #1
4177
4178# CHECK:      Average Wait times (based on the timeline view):
4179# CHECK-NEXT: [0]: Executions
4180# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4181# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4182# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4183
4184# CHECK:            [0]    [1]    [2]    [3]
4185# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.b }[8], [x27], x28
4186# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4187# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.h }[0], [x27], #2
4188# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4189# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.h }[4], [x27], #2
4190# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4191# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.h }[0], [x27], x28
4192# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4193# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st1	{ v1.h }[4], [x27], x28
4194# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4195# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4196
4197# CHECK:      [66] Code Region - G67
4198
4199# CHECK:      Iterations:        100
4200# CHECK-NEXT: Instructions:      1000
4201# CHECK-NEXT: Total Cycles:      2101
4202# CHECK-NEXT: Total uOps:        1500
4203
4204# CHECK:      Dispatch Width:    2
4205# CHECK-NEXT: uOps Per Cycle:    0.71
4206# CHECK-NEXT: IPC:               0.48
4207# CHECK-NEXT: Block RThroughput: 8.0
4208
4209# CHECK:      Timeline view:
4210# CHECK-NEXT:                     0123456789
4211# CHECK-NEXT: Index     0123456789          01
4212
4213# CHECK:      [0,0]     DeeeE.    .    .    ..   st1	{ v1.s }[0], [x27], #4
4214# CHECK-NEXT: [0,1]     .DeeE.    .    .    ..   add	x0, x27, #1
4215# CHECK-NEXT: [0,2]     .   DeeeE .    .    ..   st1	{ v1.s }[0], [x27], x28
4216# CHECK-NEXT: [0,3]     .    DeeE .    .    ..   add	x0, x27, #1
4217# CHECK-NEXT: [0,4]     .    .  DeeeE  .    ..   st1	{ v1.d }[0], [x27], #8
4218# CHECK-NEXT: [0,5]     .    .   DeeE  .    ..   add	x0, x27, #1
4219# CHECK-NEXT: [0,6]     .    .    . DeeeE   ..   st1	{ v1.d }[0], [x27], x28
4220# CHECK-NEXT: [0,7]     .    .    .  DeeE   ..   add	x0, x27, #1
4221# CHECK-NEXT: [0,8]     .    .    .    .DeeeeE   st2	{ v1.2d, v2.2d }, [x27], #32
4222# CHECK-NEXT: [0,9]     .    .    .    .  DeeE   add	x0, x27, #1
4223
4224# CHECK:      Average Wait times (based on the timeline view):
4225# CHECK-NEXT: [0]: Executions
4226# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4227# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4228# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4229
4230# CHECK:            [0]    [1]    [2]    [3]
4231# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st1	{ v1.s }[0], [x27], #4
4232# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4233# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st1	{ v1.s }[0], [x27], x28
4234# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4235# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st1	{ v1.d }[0], [x27], #8
4236# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4237# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st1	{ v1.d }[0], [x27], x28
4238# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4239# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st2	{ v1.2d, v2.2d }, [x27], #32
4240# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4241# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4242
4243# CHECK:      [67] Code Region - G68
4244
4245# CHECK:      Iterations:        100
4246# CHECK-NEXT: Instructions:      1000
4247# CHECK-NEXT: Total Cycles:      2501
4248# CHECK-NEXT: Total uOps:        1500
4249
4250# CHECK:      Dispatch Width:    2
4251# CHECK-NEXT: uOps Per Cycle:    0.60
4252# CHECK-NEXT: IPC:               0.40
4253# CHECK-NEXT: Block RThroughput: 14.0
4254
4255# CHECK:      Timeline view:
4256# CHECK-NEXT:                     0123456789
4257# CHECK-NEXT: Index     0123456789          012345
4258
4259# CHECK:      [0,0]     DeeeeE    .    .    .    .   st2	{ v1.2s, v2.2s }, [x27], #16
4260# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4261# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st2	{ v1.4h, v2.4h }, [x27], #16
4262# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4263# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st2	{ v1.4s, v2.4s }, [x27], #32
4264# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4265# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st2	{ v1.8b, v2.8b }, [x27], #16
4266# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4267# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st2	{ v1.8h, v2.8h }, [x27], #32
4268# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4269
4270# CHECK:      Average Wait times (based on the timeline view):
4271# CHECK-NEXT: [0]: Executions
4272# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4273# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4274# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4275
4276# CHECK:            [0]    [1]    [2]    [3]
4277# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st2	{ v1.2s, v2.2s }, [x27], #16
4278# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4279# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st2	{ v1.4h, v2.4h }, [x27], #16
4280# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4281# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st2	{ v1.4s, v2.4s }, [x27], #32
4282# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4283# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st2	{ v1.8b, v2.8b }, [x27], #16
4284# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4285# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st2	{ v1.8h, v2.8h }, [x27], #32
4286# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4287# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4288
4289# CHECK:      [68] Code Region - G69
4290
4291# CHECK:      Iterations:        100
4292# CHECK-NEXT: Instructions:      1000
4293# CHECK-NEXT: Total Cycles:      2501
4294# CHECK-NEXT: Total uOps:        1500
4295
4296# CHECK:      Dispatch Width:    2
4297# CHECK-NEXT: uOps Per Cycle:    0.60
4298# CHECK-NEXT: IPC:               0.40
4299# CHECK-NEXT: Block RThroughput: 16.0
4300
4301# CHECK:      Timeline view:
4302# CHECK-NEXT:                     0123456789
4303# CHECK-NEXT: Index     0123456789          012345
4304
4305# CHECK:      [0,0]     DeeeeE    .    .    .    .   st2	{ v1.16b, v2.16b }, [x27], #32
4306# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4307# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st2	{ v1.2d, v2.2d }, [x27], x28
4308# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4309# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st2	{ v1.2s, v2.2s }, [x27], x28
4310# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4311# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st2	{ v1.4h, v2.4h }, [x27], x28
4312# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4313# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st2	{ v1.4s, v2.4s }, [x27], x28
4314# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4315
4316# CHECK:      Average Wait times (based on the timeline view):
4317# CHECK-NEXT: [0]: Executions
4318# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4319# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4320# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4321
4322# CHECK:            [0]    [1]    [2]    [3]
4323# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st2	{ v1.16b, v2.16b }, [x27], #32
4324# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4325# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st2	{ v1.2d, v2.2d }, [x27], x28
4326# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4327# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st2	{ v1.2s, v2.2s }, [x27], x28
4328# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4329# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st2	{ v1.4h, v2.4h }, [x27], x28
4330# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4331# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st2	{ v1.4s, v2.4s }, [x27], x28
4332# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4333# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4334
4335# CHECK:      [69] Code Region - G70
4336
4337# CHECK:      Iterations:        100
4338# CHECK-NEXT: Instructions:      1000
4339# CHECK-NEXT: Total Cycles:      2501
4340# CHECK-NEXT: Total uOps:        1500
4341
4342# CHECK:      Dispatch Width:    2
4343# CHECK-NEXT: uOps Per Cycle:    0.60
4344# CHECK-NEXT: IPC:               0.40
4345# CHECK-NEXT: Block RThroughput: 14.0
4346
4347# CHECK:      Timeline view:
4348# CHECK-NEXT:                     0123456789
4349# CHECK-NEXT: Index     0123456789          012345
4350
4351# CHECK:      [0,0]     DeeeeE    .    .    .    .   st2	{ v1.8b, v2.8b }, [x27], x28
4352# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4353# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st2	{ v1.8h, v2.8h }, [x27], x28
4354# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4355# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st2	{ v1.16b, v2.16b }, [x27], x28
4356# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4357# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st2	{ v1.b, v2.b }[0], [x27], #2
4358# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4359# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st2	{ v1.b, v2.b }[8], [x27], #2
4360# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4361
4362# CHECK:      Average Wait times (based on the timeline view):
4363# CHECK-NEXT: [0]: Executions
4364# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4365# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4366# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4367
4368# CHECK:            [0]    [1]    [2]    [3]
4369# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st2	{ v1.8b, v2.8b }, [x27], x28
4370# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4371# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st2	{ v1.8h, v2.8h }, [x27], x28
4372# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4373# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st2	{ v1.16b, v2.16b }, [x27], x28
4374# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4375# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st2	{ v1.b, v2.b }[0], [x27], #2
4376# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4377# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st2	{ v1.b, v2.b }[8], [x27], #2
4378# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4379# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4380
4381# CHECK:      [70] Code Region - G71
4382
4383# CHECK:      Iterations:        100
4384# CHECK-NEXT: Instructions:      1000
4385# CHECK-NEXT: Total Cycles:      2501
4386# CHECK-NEXT: Total uOps:        1500
4387
4388# CHECK:      Dispatch Width:    2
4389# CHECK-NEXT: uOps Per Cycle:    0.60
4390# CHECK-NEXT: IPC:               0.40
4391# CHECK-NEXT: Block RThroughput: 10.0
4392
4393# CHECK:      Timeline view:
4394# CHECK-NEXT:                     0123456789
4395# CHECK-NEXT: Index     0123456789          012345
4396
4397# CHECK:      [0,0]     DeeeeE    .    .    .    .   st2	{ v1.b, v2.b }[0], [x27], x28
4398# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4399# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st2	{ v1.b, v2.b }[8], [x27], x28
4400# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4401# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st2	{ v1.h, v2.h }[0], [x27], #4
4402# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4403# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st2	{ v1.h, v2.h }[4], [x27], #4
4404# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4405# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st2	{ v1.h, v2.h }[0], [x27], x28
4406# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4407
4408# CHECK:      Average Wait times (based on the timeline view):
4409# CHECK-NEXT: [0]: Executions
4410# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4411# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4412# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4413
4414# CHECK:            [0]    [1]    [2]    [3]
4415# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st2	{ v1.b, v2.b }[0], [x27], x28
4416# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4417# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st2	{ v1.b, v2.b }[8], [x27], x28
4418# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4419# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st2	{ v1.h, v2.h }[0], [x27], #4
4420# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4421# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st2	{ v1.h, v2.h }[4], [x27], #4
4422# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4423# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st2	{ v1.h, v2.h }[0], [x27], x28
4424# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4425# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4426
4427# CHECK:      [71] Code Region - G72
4428
4429# CHECK:      Iterations:        100
4430# CHECK-NEXT: Instructions:      1000
4431# CHECK-NEXT: Total Cycles:      2501
4432# CHECK-NEXT: Total uOps:        1500
4433
4434# CHECK:      Dispatch Width:    2
4435# CHECK-NEXT: uOps Per Cycle:    0.60
4436# CHECK-NEXT: IPC:               0.40
4437# CHECK-NEXT: Block RThroughput: 10.0
4438
4439# CHECK:      Timeline view:
4440# CHECK-NEXT:                     0123456789
4441# CHECK-NEXT: Index     0123456789          012345
4442
4443# CHECK:      [0,0]     DeeeeE    .    .    .    .   st2	{ v1.h, v2.h }[4], [x27], x28
4444# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4445# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st2	{ v1.s, v2.s }[0], [x27], #8
4446# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4447# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st2	{ v1.s, v2.s }[0], [x27], x28
4448# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4449# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st2	{ v1.d, v2.d }[0], [x27], #16
4450# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4451# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st2	{ v1.d, v2.d }[0], [x27], x28
4452# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4453
4454# CHECK:      Average Wait times (based on the timeline view):
4455# CHECK-NEXT: [0]: Executions
4456# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4457# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4458# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4459
4460# CHECK:            [0]    [1]    [2]    [3]
4461# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st2	{ v1.h, v2.h }[4], [x27], x28
4462# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4463# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st2	{ v1.s, v2.s }[0], [x27], #8
4464# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4465# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st2	{ v1.s, v2.s }[0], [x27], x28
4466# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4467# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st2	{ v1.d, v2.d }[0], [x27], #16
4468# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4469# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st2	{ v1.d, v2.d }[0], [x27], x28
4470# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4471# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4472
4473# CHECK:      [72] Code Region - G73
4474
4475# CHECK:      Iterations:        100
4476# CHECK-NEXT: Instructions:      600
4477# CHECK-NEXT: Total Cycles:      1501
4478# CHECK-NEXT: Total uOps:        900
4479
4480# CHECK:      Dispatch Width:    2
4481# CHECK-NEXT: uOps Per Cycle:    0.60
4482# CHECK-NEXT: IPC:               0.40
4483# CHECK-NEXT: Block RThroughput: 12.0
4484
4485# CHECK:      Timeline view:
4486# CHECK-NEXT:                     012345
4487# CHECK-NEXT: Index     0123456789
4488
4489# CHECK:      [0,0]     DeeeeE    .    .   st3	{ v1.2d, v2.2d, v3.2d }, [x27], #48
4490# CHECK-NEXT: [0,1]     . DeeE    .    .   add	x0, x27, #1
4491# CHECK-NEXT: [0,2]     .    DeeeeE    .   st3	{ v1.2s, v2.2s, v3.2s }, [x27], #24
4492# CHECK-NEXT: [0,3]     .    . DeeE    .   add	x0, x27, #1
4493# CHECK-NEXT: [0,4]     .    .    DeeeeE   st3	{ v1.4h, v2.4h, v3.4h }, [x27], #24
4494# CHECK-NEXT: [0,5]     .    .    . DeeE   add	x0, x27, #1
4495
4496# CHECK:      Average Wait times (based on the timeline view):
4497# CHECK-NEXT: [0]: Executions
4498# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4499# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4500# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4501
4502# CHECK:            [0]    [1]    [2]    [3]
4503# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st3	{ v1.2d, v2.2d, v3.2d }, [x27], #48
4504# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4505# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st3	{ v1.2s, v2.2s, v3.2s }, [x27], #24
4506# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4507# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st3	{ v1.4h, v2.4h, v3.4h }, [x27], #24
4508# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4509# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4510
4511# CHECK:      [73] Code Region - G74
4512
4513# CHECK:      Iterations:        100
4514# CHECK-NEXT: Instructions:      1000
4515# CHECK-NEXT: Total Cycles:      2501
4516# CHECK-NEXT: Total uOps:        1500
4517
4518# CHECK:      Dispatch Width:    2
4519# CHECK-NEXT: uOps Per Cycle:    0.60
4520# CHECK-NEXT: IPC:               0.40
4521# CHECK-NEXT: Block RThroughput: 20.0
4522
4523# CHECK:      Timeline view:
4524# CHECK-NEXT:                     0123456789
4525# CHECK-NEXT: Index     0123456789          012345
4526
4527# CHECK:      [0,0]     DeeeeE    .    .    .    .   st3	{ v1.4s, v2.4s, v3.4s }, [x27], #48
4528# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4529# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st3	{ v1.8b, v2.8b, v3.8b }, [x27], #24
4530# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4531# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st3	{ v1.8h, v2.8h, v3.8h }, [x27], #48
4532# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4533# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st3	{ v1.16b, v2.16b, v3.16b }, [x27], #48
4534# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4535# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st3	{ v1.2d, v2.2d, v3.2d }, [x27], x28
4536# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4537
4538# CHECK:      Average Wait times (based on the timeline view):
4539# CHECK-NEXT: [0]: Executions
4540# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4541# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4542# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4543
4544# CHECK:            [0]    [1]    [2]    [3]
4545# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st3	{ v1.4s, v2.4s, v3.4s }, [x27], #48
4546# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4547# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st3	{ v1.8b, v2.8b, v3.8b }, [x27], #24
4548# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4549# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st3	{ v1.8h, v2.8h, v3.8h }, [x27], #48
4550# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4551# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st3	{ v1.16b, v2.16b, v3.16b }, [x27], #48
4552# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4553# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st3	{ v1.2d, v2.2d, v3.2d }, [x27], x28
4554# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4555# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4556
4557# CHECK:      [74] Code Region - G75
4558
4559# CHECK:      Iterations:        100
4560# CHECK-NEXT: Instructions:      1000
4561# CHECK-NEXT: Total Cycles:      2501
4562# CHECK-NEXT: Total uOps:        1500
4563
4564# CHECK:      Dispatch Width:    2
4565# CHECK-NEXT: uOps Per Cycle:    0.60
4566# CHECK-NEXT: IPC:               0.40
4567# CHECK-NEXT: Block RThroughput: 20.0
4568
4569# CHECK:      Timeline view:
4570# CHECK-NEXT:                     0123456789
4571# CHECK-NEXT: Index     0123456789          012345
4572
4573# CHECK:      [0,0]     DeeeeE    .    .    .    .   st3	{ v1.2s, v2.2s, v3.2s }, [x27], x28
4574# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4575# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st3	{ v1.4h, v2.4h, v3.4h }, [x27], x28
4576# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4577# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st3	{ v1.4s, v2.4s, v3.4s }, [x27], x28
4578# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4579# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st3	{ v1.8b, v2.8b, v3.8b }, [x27], x28
4580# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4581# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st3	{ v1.8h, v2.8h, v3.8h }, [x27], x28
4582# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4583
4584# CHECK:      Average Wait times (based on the timeline view):
4585# CHECK-NEXT: [0]: Executions
4586# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4587# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4588# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4589
4590# CHECK:            [0]    [1]    [2]    [3]
4591# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st3	{ v1.2s, v2.2s, v3.2s }, [x27], x28
4592# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4593# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st3	{ v1.4h, v2.4h, v3.4h }, [x27], x28
4594# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4595# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st3	{ v1.4s, v2.4s, v3.4s }, [x27], x28
4596# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4597# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st3	{ v1.8b, v2.8b, v3.8b }, [x27], x28
4598# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4599# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st3	{ v1.8h, v2.8h, v3.8h }, [x27], x28
4600# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4601# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4602
4603# CHECK:      [75] Code Region - G76
4604
4605# CHECK:      Iterations:        100
4606# CHECK-NEXT: Instructions:      1000
4607# CHECK-NEXT: Total Cycles:      2501
4608# CHECK-NEXT: Total uOps:        1500
4609
4610# CHECK:      Dispatch Width:    2
4611# CHECK-NEXT: uOps Per Cycle:    0.60
4612# CHECK-NEXT: IPC:               0.40
4613# CHECK-NEXT: Block RThroughput: 12.0
4614
4615# CHECK:      Timeline view:
4616# CHECK-NEXT:                     0123456789
4617# CHECK-NEXT: Index     0123456789          012345
4618
4619# CHECK:      [0,0]     DeeeeE    .    .    .    .   st3	{ v1.16b, v2.16b, v3.16b }, [x27], x28
4620# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4621# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st3	{ v1.b, v2.b, v3.b }[0], [x27], #3
4622# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4623# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st3	{ v1.b, v2.b, v3.b }[8], [x27], #3
4624# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4625# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st3	{ v1.b, v2.b, v3.b }[0], [x27], x28
4626# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4627# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st3	{ v1.b, v2.b, v3.b }[8], [x27], x28
4628# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4629
4630# CHECK:      Average Wait times (based on the timeline view):
4631# CHECK-NEXT: [0]: Executions
4632# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4633# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4634# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4635
4636# CHECK:            [0]    [1]    [2]    [3]
4637# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st3	{ v1.16b, v2.16b, v3.16b }, [x27], x28
4638# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4639# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st3	{ v1.b, v2.b, v3.b }[0], [x27], #3
4640# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4641# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st3	{ v1.b, v2.b, v3.b }[8], [x27], #3
4642# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4643# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st3	{ v1.b, v2.b, v3.b }[0], [x27], x28
4644# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4645# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st3	{ v1.b, v2.b, v3.b }[8], [x27], x28
4646# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4647# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4648
4649# CHECK:      [76] Code Region - G77
4650
4651# CHECK:      Iterations:        100
4652# CHECK-NEXT: Instructions:      1000
4653# CHECK-NEXT: Total Cycles:      2501
4654# CHECK-NEXT: Total uOps:        1500
4655
4656# CHECK:      Dispatch Width:    2
4657# CHECK-NEXT: uOps Per Cycle:    0.60
4658# CHECK-NEXT: IPC:               0.40
4659# CHECK-NEXT: Block RThroughput: 10.0
4660
4661# CHECK:      Timeline view:
4662# CHECK-NEXT:                     0123456789
4663# CHECK-NEXT: Index     0123456789          012345
4664
4665# CHECK:      [0,0]     DeeeeE    .    .    .    .   st3	{ v1.h, v2.h, v3.h }[0], [x27], #6
4666# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4667# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st3	{ v1.h, v2.h, v3.h }[4], [x27], #6
4668# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4669# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st3	{ v1.h, v2.h, v3.h }[0], [x27], x28
4670# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4671# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st3	{ v1.h, v2.h, v3.h }[4], [x27], x28
4672# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4673# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st3	{ v1.s, v2.s, v3.s }[0], [x27], #12
4674# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4675
4676# CHECK:      Average Wait times (based on the timeline view):
4677# CHECK-NEXT: [0]: Executions
4678# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4679# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4680# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4681
4682# CHECK:            [0]    [1]    [2]    [3]
4683# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st3	{ v1.h, v2.h, v3.h }[0], [x27], #6
4684# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4685# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st3	{ v1.h, v2.h, v3.h }[4], [x27], #6
4686# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4687# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st3	{ v1.h, v2.h, v3.h }[0], [x27], x28
4688# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4689# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st3	{ v1.h, v2.h, v3.h }[4], [x27], x28
4690# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4691# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st3	{ v1.s, v2.s, v3.s }[0], [x27], #12
4692# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4693# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4694
4695# CHECK:      [77] Code Region - G78
4696
4697# CHECK:      Iterations:        100
4698# CHECK-NEXT: Instructions:      1000
4699# CHECK-NEXT: Total Cycles:      2501
4700# CHECK-NEXT: Total uOps:        1500
4701
4702# CHECK:      Dispatch Width:    2
4703# CHECK-NEXT: uOps Per Cycle:    0.60
4704# CHECK-NEXT: IPC:               0.40
4705# CHECK-NEXT: Block RThroughput: 14.0
4706
4707# CHECK:      Timeline view:
4708# CHECK-NEXT:                     0123456789
4709# CHECK-NEXT: Index     0123456789          012345
4710
4711# CHECK:      [0,0]     DeeeeE    .    .    .    .   st3	{ v1.s, v2.s, v3.s }[0], [x27], x28
4712# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4713# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st3	{ v1.d, v2.d, v3.d }[0], [x27], #24
4714# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4715# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st3	{ v1.d, v2.d, v3.d }[0], [x27], x28
4716# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4717# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
4718# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4719# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
4720# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4721
4722# CHECK:      Average Wait times (based on the timeline view):
4723# CHECK-NEXT: [0]: Executions
4724# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4725# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4726# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4727
4728# CHECK:            [0]    [1]    [2]    [3]
4729# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st3	{ v1.s, v2.s, v3.s }[0], [x27], x28
4730# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4731# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st3	{ v1.d, v2.d, v3.d }[0], [x27], #24
4732# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4733# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st3	{ v1.d, v2.d, v3.d }[0], [x27], x28
4734# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4735# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
4736# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4737# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
4738# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4739# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4740
4741# CHECK:      [78] Code Region - G79
4742
4743# CHECK:      Iterations:        100
4744# CHECK-NEXT: Instructions:      1000
4745# CHECK-NEXT: Total Cycles:      2501
4746# CHECK-NEXT: Total uOps:        1500
4747
4748# CHECK:      Dispatch Width:    2
4749# CHECK-NEXT: uOps Per Cycle:    0.60
4750# CHECK-NEXT: IPC:               0.40
4751# CHECK-NEXT: Block RThroughput: 20.0
4752
4753# CHECK:      Timeline view:
4754# CHECK-NEXT:                     0123456789
4755# CHECK-NEXT: Index     0123456789          012345
4756
4757# CHECK:      [0,0]     DeeeeE    .    .    .    .   st4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
4758# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4759# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
4760# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4761# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
4762# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4763# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
4764# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4765# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
4766# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4767
4768# CHECK:      Average Wait times (based on the timeline view):
4769# CHECK-NEXT: [0]: Executions
4770# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4771# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4772# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4773
4774# CHECK:            [0]    [1]    [2]    [3]
4775# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
4776# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4777# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
4778# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4779# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
4780# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4781# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
4782# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4783# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
4784# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4785# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4786
4787# CHECK:      [79] Code Region - G80
4788
4789# CHECK:      Iterations:        100
4790# CHECK-NEXT: Instructions:      1000
4791# CHECK-NEXT: Total Cycles:      2501
4792# CHECK-NEXT: Total uOps:        1500
4793
4794# CHECK:      Dispatch Width:    2
4795# CHECK-NEXT: uOps Per Cycle:    0.60
4796# CHECK-NEXT: IPC:               0.40
4797# CHECK-NEXT: Block RThroughput: 20.0
4798
4799# CHECK:      Timeline view:
4800# CHECK-NEXT:                     0123456789
4801# CHECK-NEXT: Index     0123456789          012345
4802
4803# CHECK:      [0,0]     DeeeeE    .    .    .    .   st4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
4804# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4805# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
4806# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4807# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
4808# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4809# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
4810# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4811# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
4812# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4813
4814# CHECK:      Average Wait times (based on the timeline view):
4815# CHECK-NEXT: [0]: Executions
4816# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4817# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4818# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4819
4820# CHECK:            [0]    [1]    [2]    [3]
4821# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
4822# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4823# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
4824# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4825# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
4826# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4827# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
4828# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4829# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
4830# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4831# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4832
4833# CHECK:      [80] Code Region - G81
4834
4835# CHECK:      Iterations:        100
4836# CHECK-NEXT: Instructions:      1000
4837# CHECK-NEXT: Total Cycles:      2501
4838# CHECK-NEXT: Total uOps:        1500
4839
4840# CHECK:      Dispatch Width:    2
4841# CHECK-NEXT: uOps Per Cycle:    0.60
4842# CHECK-NEXT: IPC:               0.40
4843# CHECK-NEXT: Block RThroughput: 14.0
4844
4845# CHECK:      Timeline view:
4846# CHECK-NEXT:                     0123456789
4847# CHECK-NEXT: Index     0123456789          012345
4848
4849# CHECK:      [0,0]     DeeeeE    .    .    .    .   st4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
4850# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4851# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
4852# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4853# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
4854# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4855# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
4856# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4857# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
4858# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4859
4860# CHECK:      Average Wait times (based on the timeline view):
4861# CHECK-NEXT: [0]: Executions
4862# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4863# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4864# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4865
4866# CHECK:            [0]    [1]    [2]    [3]
4867# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
4868# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4869# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
4870# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4871# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
4872# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4873# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
4874# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4875# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
4876# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4877# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4878
4879# CHECK:      [81] Code Region - G82
4880
4881# CHECK:      Iterations:        100
4882# CHECK-NEXT: Instructions:      1000
4883# CHECK-NEXT: Total Cycles:      2501
4884# CHECK-NEXT: Total uOps:        1500
4885
4886# CHECK:      Dispatch Width:    2
4887# CHECK-NEXT: uOps Per Cycle:    0.60
4888# CHECK-NEXT: IPC:               0.40
4889# CHECK-NEXT: Block RThroughput: 10.0
4890
4891# CHECK:      Timeline view:
4892# CHECK-NEXT:                     0123456789
4893# CHECK-NEXT: Index     0123456789          012345
4894
4895# CHECK:      [0,0]     DeeeeE    .    .    .    .   st4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
4896# CHECK-NEXT: [0,1]     . DeeE    .    .    .    .   add	x0, x27, #1
4897# CHECK-NEXT: [0,2]     .    DeeeeE    .    .    .   st4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
4898# CHECK-NEXT: [0,3]     .    . DeeE    .    .    .   add	x0, x27, #1
4899# CHECK-NEXT: [0,4]     .    .    DeeeeE    .    .   st4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
4900# CHECK-NEXT: [0,5]     .    .    . DeeE    .    .   add	x0, x27, #1
4901# CHECK-NEXT: [0,6]     .    .    .    DeeeeE    .   st4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
4902# CHECK-NEXT: [0,7]     .    .    .    . DeeE    .   add	x0, x27, #1
4903# CHECK-NEXT: [0,8]     .    .    .    .    DeeeeE   st4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
4904# CHECK-NEXT: [0,9]     .    .    .    .    . DeeE   add	x0, x27, #1
4905
4906# CHECK:      Average Wait times (based on the timeline view):
4907# CHECK-NEXT: [0]: Executions
4908# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4909# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4910# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4911
4912# CHECK:            [0]    [1]    [2]    [3]
4913# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
4914# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4915# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
4916# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4917# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
4918# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4919# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
4920# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4921# CHECK-NEXT: 8.     1     0.0    0.0    0.0       st4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
4922# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
4923# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4924
4925# CHECK:      [82] Code Region - G83
4926
4927# CHECK:      Iterations:        100
4928# CHECK-NEXT: Instructions:      800
4929# CHECK-NEXT: Total Cycles:      2001
4930# CHECK-NEXT: Total uOps:        1200
4931
4932# CHECK:      Dispatch Width:    2
4933# CHECK-NEXT: uOps Per Cycle:    0.60
4934# CHECK-NEXT: IPC:               0.40
4935# CHECK-NEXT: Block RThroughput: 8.0
4936
4937# CHECK:      Timeline view:
4938# CHECK-NEXT:                     0123456789
4939# CHECK-NEXT: Index     0123456789          0
4940
4941# CHECK:      [0,0]     DeeeeE    .    .    .   st4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
4942# CHECK-NEXT: [0,1]     . DeeE    .    .    .   add	x0, x27, #1
4943# CHECK-NEXT: [0,2]     .    DeeeeE    .    .   st4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
4944# CHECK-NEXT: [0,3]     .    . DeeE    .    .   add	x0, x27, #1
4945# CHECK-NEXT: [0,4]     .    .    DeeeeE    .   st4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
4946# CHECK-NEXT: [0,5]     .    .    . DeeE    .   add	x0, x27, #1
4947# CHECK-NEXT: [0,6]     .    .    .    DeeeeE   st4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
4948# CHECK-NEXT: [0,7]     .    .    .    . DeeE   add	x0, x27, #1
4949
4950# CHECK:      Average Wait times (based on the timeline view):
4951# CHECK-NEXT: [0]: Executions
4952# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4953# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4954# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4955
4956# CHECK:            [0]    [1]    [2]    [3]
4957# CHECK-NEXT: 0.     1     0.0    0.0    0.0       st4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
4958# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4959# CHECK-NEXT: 2.     1     0.0    0.0    0.0       st4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
4960# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4961# CHECK-NEXT: 4.     1     0.0    0.0    0.0       st4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
4962# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
4963# CHECK-NEXT: 6.     1     0.0    0.0    0.0       st4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
4964# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
4965# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4966
4967# CHECK:      [83] Code Region - G84
4968
4969# CHECK:      Iterations:        100
4970# CHECK-NEXT: Instructions:      400
4971# CHECK-NEXT: Total Cycles:      403
4972# CHECK-NEXT: Total uOps:        600
4973
4974# CHECK:      Dispatch Width:    2
4975# CHECK-NEXT: uOps Per Cycle:    1.49
4976# CHECK-NEXT: IPC:               0.99
4977# CHECK-NEXT: Block RThroughput: 3.0
4978
4979# CHECK:      Timeline view:
4980# CHECK-NEXT: Index     0123456
4981
4982# CHECK:      [0,0]     DE   ..   stp	s1, s2, [x27], #248
4983# CHECK-NEXT: [0,1]     .DeeE..   add	x0, x27, #1
4984# CHECK-NEXT: [0,2]     . DE ..   stp	d1, d2, [x27], #496
4985# CHECK-NEXT: [0,3]     .  DeeE   add	x0, x27, #1
4986
4987# CHECK:      Average Wait times (based on the timeline view):
4988# CHECK-NEXT: [0]: Executions
4989# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
4990# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
4991# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
4992
4993# CHECK:            [0]    [1]    [2]    [3]
4994# CHECK-NEXT: 0.     1     0.0    0.0    0.0       stp	s1, s2, [x27], #248
4995# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
4996# CHECK-NEXT: 2.     1     0.0    0.0    0.0       stp	d1, d2, [x27], #496
4997# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
4998# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
4999
5000# CHECK:      [84] Code Region - G85
5001
5002# CHECK:      Iterations:        100
5003# CHECK-NEXT: Instructions:      1000
5004# CHECK-NEXT: Total Cycles:      1003
5005# CHECK-NEXT: Total uOps:        1500
5006
5007# CHECK:      Dispatch Width:    2
5008# CHECK-NEXT: uOps Per Cycle:    1.50
5009# CHECK-NEXT: IPC:               1.00
5010# CHECK-NEXT: Block RThroughput: 7.5
5011
5012# CHECK:      Timeline view:
5013# CHECK-NEXT:                     012
5014# CHECK-NEXT: Index     0123456789
5015
5016# CHECK:      [0,0]     DE   .    . .   stp	q1, q2, [x27], #992
5017# CHECK-NEXT: [0,1]     .DeeE.    . .   add	x0, x27, #1
5018# CHECK-NEXT: [0,2]     . DE .    . .   stp	s1, s2, [x27, #248]!
5019# CHECK-NEXT: [0,3]     .  DeeE   . .   add	x0, x27, #1
5020# CHECK-NEXT: [0,4]     .   DE    . .   stp	d1, d2, [x27, #496]!
5021# CHECK-NEXT: [0,5]     .    DeeE . .   add	x0, x27, #1
5022# CHECK-NEXT: [0,6]     .    .DE  . .   stp	q1, q2, [x27, #992]!
5023# CHECK-NEXT: [0,7]     .    . DeeE .   add	x0, x27, #1
5024# CHECK-NEXT: [0,8]     .    .  DE. .   stp	w1, w2, [x27], #248
5025# CHECK-NEXT: [0,9]     .    .   DeeE   add	x0, x27, #1
5026
5027# CHECK:      Average Wait times (based on the timeline view):
5028# CHECK-NEXT: [0]: Executions
5029# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5030# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5031# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5032
5033# CHECK:            [0]    [1]    [2]    [3]
5034# CHECK-NEXT: 0.     1     0.0    0.0    0.0       stp	q1, q2, [x27], #992
5035# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
5036# CHECK-NEXT: 2.     1     0.0    0.0    0.0       stp	s1, s2, [x27, #248]!
5037# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
5038# CHECK-NEXT: 4.     1     0.0    0.0    0.0       stp	d1, d2, [x27, #496]!
5039# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
5040# CHECK-NEXT: 6.     1     0.0    0.0    0.0       stp	q1, q2, [x27, #992]!
5041# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
5042# CHECK-NEXT: 8.     1     0.0    0.0    0.0       stp	w1, w2, [x27], #248
5043# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
5044# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
5045
5046# CHECK:      [85] Code Region - G86
5047
5048# CHECK:      Iterations:        100
5049# CHECK-NEXT: Instructions:      1000
5050# CHECK-NEXT: Total Cycles:      1003
5051# CHECK-NEXT: Total uOps:        1500
5052
5053# CHECK:      Dispatch Width:    2
5054# CHECK-NEXT: uOps Per Cycle:    1.50
5055# CHECK-NEXT: IPC:               1.00
5056# CHECK-NEXT: Block RThroughput: 7.5
5057
5058# CHECK:      Timeline view:
5059# CHECK-NEXT:                     012
5060# CHECK-NEXT: Index     0123456789
5061
5062# CHECK:      [0,0]     DE   .    . .   stp	x1, x2, [x27], #496
5063# CHECK-NEXT: [0,1]     .DeeE.    . .   add	x0, x27, #1
5064# CHECK-NEXT: [0,2]     . DE .    . .   stp	w1, w2, [x27, #248]!
5065# CHECK-NEXT: [0,3]     .  DeeE   . .   add	x0, x27, #1
5066# CHECK-NEXT: [0,4]     .   DE    . .   stp	x1, x2, [x27, #496]!
5067# CHECK-NEXT: [0,5]     .    DeeE . .   add	x0, x27, #1
5068# CHECK-NEXT: [0,6]     .    .DE  . .   str	b1, [x27], #254
5069# CHECK-NEXT: [0,7]     .    . DeeE .   add	x0, x27, #1
5070# CHECK-NEXT: [0,8]     .    .  DE. .   str	h1, [x27], #254
5071# CHECK-NEXT: [0,9]     .    .   DeeE   add	x0, x27, #1
5072
5073# CHECK:      Average Wait times (based on the timeline view):
5074# CHECK-NEXT: [0]: Executions
5075# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5076# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5077# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5078
5079# CHECK:            [0]    [1]    [2]    [3]
5080# CHECK-NEXT: 0.     1     0.0    0.0    0.0       stp	x1, x2, [x27], #496
5081# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
5082# CHECK-NEXT: 2.     1     0.0    0.0    0.0       stp	w1, w2, [x27, #248]!
5083# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
5084# CHECK-NEXT: 4.     1     0.0    0.0    0.0       stp	x1, x2, [x27, #496]!
5085# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
5086# CHECK-NEXT: 6.     1     0.0    0.0    0.0       str	b1, [x27], #254
5087# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
5088# CHECK-NEXT: 8.     1     0.0    0.0    0.0       str	h1, [x27], #254
5089# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
5090# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
5091
5092# CHECK:      [86] Code Region - G87
5093
5094# CHECK:      Iterations:        100
5095# CHECK-NEXT: Instructions:      1000
5096# CHECK-NEXT: Total Cycles:      1003
5097# CHECK-NEXT: Total uOps:        1500
5098
5099# CHECK:      Dispatch Width:    2
5100# CHECK-NEXT: uOps Per Cycle:    1.50
5101# CHECK-NEXT: IPC:               1.00
5102# CHECK-NEXT: Block RThroughput: 7.5
5103
5104# CHECK:      Timeline view:
5105# CHECK-NEXT:                     012
5106# CHECK-NEXT: Index     0123456789
5107
5108# CHECK:      [0,0]     DE   .    . .   str	s1, [x27], #254
5109# CHECK-NEXT: [0,1]     .DeeE.    . .   add	x0, x27, #1
5110# CHECK-NEXT: [0,2]     . DE .    . .   str	d1, [x27], #254
5111# CHECK-NEXT: [0,3]     .  DeeE   . .   add	x0, x27, #1
5112# CHECK-NEXT: [0,4]     .   DE    . .   str	q1, [x27], #254
5113# CHECK-NEXT: [0,5]     .    DeeE . .   add	x0, x27, #1
5114# CHECK-NEXT: [0,6]     .    .DE  . .   str	b1, [x27, #254]!
5115# CHECK-NEXT: [0,7]     .    . DeeE .   add	x0, x27, #1
5116# CHECK-NEXT: [0,8]     .    .  DE. .   str	h1, [x27, #254]!
5117# CHECK-NEXT: [0,9]     .    .   DeeE   add	x0, x27, #1
5118
5119# CHECK:      Average Wait times (based on the timeline view):
5120# CHECK-NEXT: [0]: Executions
5121# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5122# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5123# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5124
5125# CHECK:            [0]    [1]    [2]    [3]
5126# CHECK-NEXT: 0.     1     0.0    0.0    0.0       str	s1, [x27], #254
5127# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
5128# CHECK-NEXT: 2.     1     0.0    0.0    0.0       str	d1, [x27], #254
5129# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
5130# CHECK-NEXT: 4.     1     0.0    0.0    0.0       str	q1, [x27], #254
5131# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
5132# CHECK-NEXT: 6.     1     0.0    0.0    0.0       str	b1, [x27, #254]!
5133# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
5134# CHECK-NEXT: 8.     1     0.0    0.0    0.0       str	h1, [x27, #254]!
5135# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
5136# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
5137
5138# CHECK:      [87] Code Region - G88
5139
5140# CHECK:      Iterations:        100
5141# CHECK-NEXT: Instructions:      1000
5142# CHECK-NEXT: Total Cycles:      1003
5143# CHECK-NEXT: Total uOps:        1500
5144
5145# CHECK:      Dispatch Width:    2
5146# CHECK-NEXT: uOps Per Cycle:    1.50
5147# CHECK-NEXT: IPC:               1.00
5148# CHECK-NEXT: Block RThroughput: 7.5
5149
5150# CHECK:      Timeline view:
5151# CHECK-NEXT:                     012
5152# CHECK-NEXT: Index     0123456789
5153
5154# CHECK:      [0,0]     DE   .    . .   str	s1, [x27, #254]!
5155# CHECK-NEXT: [0,1]     .DeeE.    . .   add	x0, x27, #1
5156# CHECK-NEXT: [0,2]     . DE .    . .   str	d1, [x27, #254]!
5157# CHECK-NEXT: [0,3]     .  DeeE   . .   add	x0, x27, #1
5158# CHECK-NEXT: [0,4]     .   DE    . .   str	q1, [x27, #254]!
5159# CHECK-NEXT: [0,5]     .    DeeE . .   add	x0, x27, #1
5160# CHECK-NEXT: [0,6]     .    .DE  . .   str	w1, [x27], #254
5161# CHECK-NEXT: [0,7]     .    . DeeE .   add	x0, x27, #1
5162# CHECK-NEXT: [0,8]     .    .  DE. .   str	x1, [x27], #254
5163# CHECK-NEXT: [0,9]     .    .   DeeE   add	x0, x27, #1
5164
5165# CHECK:      Average Wait times (based on the timeline view):
5166# CHECK-NEXT: [0]: Executions
5167# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5168# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5169# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5170
5171# CHECK:            [0]    [1]    [2]    [3]
5172# CHECK-NEXT: 0.     1     0.0    0.0    0.0       str	s1, [x27, #254]!
5173# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
5174# CHECK-NEXT: 2.     1     0.0    0.0    0.0       str	d1, [x27, #254]!
5175# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
5176# CHECK-NEXT: 4.     1     0.0    0.0    0.0       str	q1, [x27, #254]!
5177# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
5178# CHECK-NEXT: 6.     1     0.0    0.0    0.0       str	w1, [x27], #254
5179# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
5180# CHECK-NEXT: 8.     1     0.0    0.0    0.0       str	x1, [x27], #254
5181# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
5182# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
5183
5184# CHECK:      [88] Code Region - G89
5185
5186# CHECK:      Iterations:        100
5187# CHECK-NEXT: Instructions:      1000
5188# CHECK-NEXT: Total Cycles:      1003
5189# CHECK-NEXT: Total uOps:        1500
5190
5191# CHECK:      Dispatch Width:    2
5192# CHECK-NEXT: uOps Per Cycle:    1.50
5193# CHECK-NEXT: IPC:               1.00
5194# CHECK-NEXT: Block RThroughput: 7.5
5195
5196# CHECK:      Timeline view:
5197# CHECK-NEXT:                     012
5198# CHECK-NEXT: Index     0123456789
5199
5200# CHECK:      [0,0]     DE   .    . .   str	w1, [x27, #254]!
5201# CHECK-NEXT: [0,1]     .DeeE.    . .   add	x0, x27, #1
5202# CHECK-NEXT: [0,2]     . DE .    . .   str	x1, [x27, #254]!
5203# CHECK-NEXT: [0,3]     .  DeeE   . .   add	x0, x27, #1
5204# CHECK-NEXT: [0,4]     .   DE    . .   strb	w1, [x27], #254
5205# CHECK-NEXT: [0,5]     .    DeeE . .   add	x0, x27, #1
5206# CHECK-NEXT: [0,6]     .    .DE  . .   strb	w1, [x27, #254]!
5207# CHECK-NEXT: [0,7]     .    . DeeE .   add	x0, x27, #1
5208# CHECK-NEXT: [0,8]     .    .  DE. .   strh	w1, [x27], #254
5209# CHECK-NEXT: [0,9]     .    .   DeeE   add	x0, x27, #1
5210
5211# CHECK:      Average Wait times (based on the timeline view):
5212# CHECK-NEXT: [0]: Executions
5213# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5214# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5215# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5216
5217# CHECK:            [0]    [1]    [2]    [3]
5218# CHECK-NEXT: 0.     1     0.0    0.0    0.0       str	w1, [x27, #254]!
5219# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
5220# CHECK-NEXT: 2.     1     0.0    0.0    0.0       str	x1, [x27, #254]!
5221# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
5222# CHECK-NEXT: 4.     1     0.0    0.0    0.0       strb	w1, [x27], #254
5223# CHECK-NEXT: 5.     1     0.0    0.0    0.0       add	x0, x27, #1
5224# CHECK-NEXT: 6.     1     0.0    0.0    0.0       strb	w1, [x27, #254]!
5225# CHECK-NEXT: 7.     1     0.0    0.0    0.0       add	x0, x27, #1
5226# CHECK-NEXT: 8.     1     0.0    0.0    0.0       strh	w1, [x27], #254
5227# CHECK-NEXT: 9.     1     0.0    0.0    0.0       add	x0, x27, #1
5228# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
5229
5230# CHECK:      [89] Code Region - G90
5231
5232# CHECK:      Iterations:        100
5233# CHECK-NEXT: Instructions:      200
5234# CHECK-NEXT: Total Cycles:      203
5235# CHECK-NEXT: Total uOps:        300
5236
5237# CHECK:      Dispatch Width:    2
5238# CHECK-NEXT: uOps Per Cycle:    1.48
5239# CHECK-NEXT: IPC:               0.99
5240# CHECK-NEXT: Block RThroughput: 1.5
5241
5242# CHECK:      Timeline view:
5243# CHECK-NEXT: Index     01234
5244
5245# CHECK:      [0,0]     DE  .   strh	w1, [x27, #254]!
5246# CHECK-NEXT: [0,1]     .DeeE   add	x0, x27, #1
5247
5248# CHECK:      Average Wait times (based on the timeline view):
5249# CHECK-NEXT: [0]: Executions
5250# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5251# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5252# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5253
5254# CHECK:            [0]    [1]    [2]    [3]
5255# CHECK-NEXT: 0.     1     0.0    0.0    0.0       strh	w1, [x27, #254]!
5256# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
5257# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
5258
5259# CHECK:      [90] Code Region - G91
5260
5261# CHECK:      Iterations:        100
5262# CHECK-NEXT: Instructions:      400
5263# CHECK-NEXT: Total Cycles:      801
5264# CHECK-NEXT: Total uOps:        600
5265
5266# CHECK:      Dispatch Width:    2
5267# CHECK-NEXT: uOps Per Cycle:    0.75
5268# CHECK-NEXT: IPC:               0.50
5269# CHECK-NEXT: Block RThroughput: 3.0
5270
5271# CHECK:      Timeline view:
5272# CHECK-NEXT: Index     012345678
5273
5274# CHECK:      [0,0]     DeeE .  .   ldr	x1, [x27], #254
5275# CHECK-NEXT: [0,1]     .DeeE.  .   add	x0, x27, #1
5276# CHECK-NEXT: [0,2]     .   DeeE.   ldr	x2, [x1], #254
5277# CHECK-NEXT: [0,3]     .    DeeE   add	x0, x27, #1
5278
5279# CHECK:      Average Wait times (based on the timeline view):
5280# CHECK-NEXT: [0]: Executions
5281# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
5282# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
5283# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
5284
5285# CHECK:            [0]    [1]    [2]    [3]
5286# CHECK-NEXT: 0.     1     0.0    0.0    0.0       ldr	x1, [x27], #254
5287# CHECK-NEXT: 1.     1     0.0    0.0    0.0       add	x0, x27, #1
5288# CHECK-NEXT: 2.     1     0.0    0.0    0.0       ldr	x2, [x1], #254
5289# CHECK-NEXT: 3.     1     0.0    0.0    0.0       add	x0, x27, #1
5290# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
5291