xref: /llvm-project/llvm/test/tools/llvm-mca/AArch64/HiSilicon/tsv110-writeback.s (revision d093aee1a33e006b31fe5962fa9f98d9c4507283)
1# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2# RUN: llvm-mca -mtriple=aarch64 -mcpu=tsv110 --instruction-info=0 --resource-pressure=0 --timeline --timeline-max-iterations=1 < %s | FileCheck %s
3
# Regions G01-G13: LD1 (multiple structures) with base-register writeback.
# Every instruction uses x27 as the base and updates it, either by an
# immediate (`[x27], #imm`) or by register x28 (`[x27], x28`).  The register
# list grows from one to four consecutive registers (v1..v4), and each list
# length is exercised with the eight arrangements 8b/16b/4h/8h/2s/4s/1d/2d.
# Each region is analysed separately by the tool, so the grouping into
# blocks of five instructions determines what appears in each timeline.
4# LLVM-MCA-BEGIN G01
5ld1  { v1.1d }, [x27], #8
6ld1  { v1.2d }, [x27], #16
7ld1  { v1.2s }, [x27], #8
8ld1  { v1.4h }, [x27], #8
9ld1  { v1.4s }, [x27], #16
10# LLVM-MCA-END
11
12# LLVM-MCA-BEGIN G02
13ld1  { v1.8b }, [x27], #8
14ld1  { v1.8h }, [x27], #16
15ld1  { v1.16b }, [x27], #16
16ld1  { v1.1d }, [x27], x28
17ld1  { v1.2d }, [x27], x28
18# LLVM-MCA-END
19
20# LLVM-MCA-BEGIN G03
21ld1  { v1.2s }, [x27], x28
22ld1  { v1.4h }, [x27], x28
23ld1  { v1.4s }, [x27], x28
24ld1  { v1.8b }, [x27], x28
25ld1  { v1.8h }, [x27], x28
26# LLVM-MCA-END
27
# G04 finishes the one-register forms and starts the two-register lists.
28# LLVM-MCA-BEGIN G04
29ld1  { v1.16b }, [x27], x28
30ld1  { v1.1d, v2.1d }, [x27], #16
31ld1  { v1.2d, v2.2d }, [x27], #32
32ld1  { v1.2s, v2.2s }, [x27], #16
33ld1  { v1.4h, v2.4h }, [x27], #16
34# LLVM-MCA-END
35
36# LLVM-MCA-BEGIN G05
37ld1  { v1.4s, v2.4s }, [x27], #32
38ld1  { v1.8b, v2.8b }, [x27], #16
39ld1  { v1.8h, v2.8h }, [x27], #32
40ld1  { v1.16b, v2.16b }, [x27], #32
41ld1  { v1.1d, v2.1d }, [x27], x28
42# LLVM-MCA-END
43
44# LLVM-MCA-BEGIN G06
45ld1  { v1.2d, v2.2d }, [x27], x28
46ld1  { v1.2s, v2.2s }, [x27], x28
47ld1  { v1.4h, v2.4h }, [x27], x28
48ld1  { v1.4s, v2.4s }, [x27], x28
49ld1  { v1.8b, v2.8b }, [x27], x28
50# LLVM-MCA-END
51
# G07 finishes the two-register forms and starts the three-register lists.
52# LLVM-MCA-BEGIN G07
53ld1  { v1.8h, v2.8h }, [x27], x28
54ld1  { v1.16b, v2.16b }, [x27], x28
55ld1  { v1.1d, v2.1d, v3.1d }, [x27], #24
56ld1  { v1.2d, v2.2d, v3.2d }, [x27], #48
57ld1  { v1.2s, v2.2s, v3.2s }, [x27], #24
58# LLVM-MCA-END
59
60# LLVM-MCA-BEGIN G08
61ld1  { v1.4h, v2.4h, v3.4h }, [x27], #24
62ld1  { v1.4s, v2.4s, v3.4s }, [x27], #48
63ld1  { v1.8b, v2.8b, v3.8b }, [x27], #24
64ld1  { v1.8h, v2.8h, v3.8h }, [x27], #48
65ld1  { v1.16b, v2.16b, v3.16b }, [x27], #48
66# LLVM-MCA-END
67
68# LLVM-MCA-BEGIN G09
69ld1  { v1.1d, v2.1d, v3.1d }, [x27], x28
70ld1  { v1.2d, v2.2d, v3.2d }, [x27], x28
71ld1  { v1.2s, v2.2s, v3.2s }, [x27], x28
72ld1  { v1.4h, v2.4h, v3.4h }, [x27], x28
73ld1  { v1.4s, v2.4s, v3.4s }, [x27], x28
74# LLVM-MCA-END
75
# G10 finishes the three-register forms and starts the four-register lists.
76# LLVM-MCA-BEGIN G10
77ld1  { v1.8b, v2.8b, v3.8b }, [x27], x28
78ld1  { v1.8h, v2.8h, v3.8h }, [x27], x28
79ld1  { v1.16b, v2.16b, v3.16b }, [x27], x28
80ld1  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
81ld1  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
82# LLVM-MCA-END
83
84# LLVM-MCA-BEGIN G11
85ld1  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
86ld1  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
87ld1  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
88ld1  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
89ld1  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
90# LLVM-MCA-END
91
92# LLVM-MCA-BEGIN G12
93ld1  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
94ld1  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
95ld1  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
96ld1  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
97ld1  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
98# LLVM-MCA-END
99
# G13 finishes the four-register forms; its last instruction is the first
# LD1 single-lane form (`{ v1.b }[0]`).
100# LLVM-MCA-BEGIN G13
101ld1  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
102ld1  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
103ld1  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
104ld1  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
105ld1  { v1.b }[0], [x27], #1
106# LLVM-MCA-END
107
# Regions G14-G19: LD1 single-lane loads followed by LD1R (load and
# replicate), all with writeback on x27 in the post-index immediate and
# post-index register (x28) forms.  The lane forms use indices 0 and 8 for
# bytes, 0 and 4 for halfwords, and 0 for words and doublewords.  The LD1R
# immediates match the element size (1, 2, 4 or 8 bytes), not the vector
# width.  G19 ends with the first LD2 multiple-structure forms.
108# LLVM-MCA-BEGIN G14
109ld1  { v1.b }[8], [x27], #1
110ld1  { v1.b }[0], [x27], x28
111ld1  { v1.b }[8], [x27], x28
112ld1  { v1.h }[0], [x27], #2
113ld1  { v1.h }[4], [x27], #2
114# LLVM-MCA-END
115
116# LLVM-MCA-BEGIN G15
117ld1  { v1.h }[0], [x27], x28
118ld1  { v1.h }[4], [x27], x28
119ld1  { v1.s }[0], [x27], #4
120ld1  { v1.s }[0], [x27], x28
121ld1  { v1.d }[0], [x27], #8
122# LLVM-MCA-END
123
# G16 finishes the lane forms and starts LD1R.
124# LLVM-MCA-BEGIN G16
125ld1  { v1.d }[0], [x27], x28
126ld1r  { v1.1d }, [x27], #8
127ld1r  { v1.2d }, [x27], #8
128ld1r  { v1.2s }, [x27], #4
129ld1r  { v1.4h }, [x27], #2
130# LLVM-MCA-END
131
132# LLVM-MCA-BEGIN G17
133ld1r  { v1.4s }, [x27], #4
134ld1r  { v1.8b }, [x27], #1
135ld1r  { v1.8h }, [x27], #2
136ld1r  { v1.16b }, [x27], #1
137ld1r  { v1.1d }, [x27], x28
138# LLVM-MCA-END
139
140# LLVM-MCA-BEGIN G18
141ld1r  { v1.2d }, [x27], x28
142ld1r  { v1.2s }, [x27], x28
143ld1r  { v1.4h }, [x27], x28
144ld1r  { v1.4s }, [x27], x28
145ld1r  { v1.8b }, [x27], x28
146# LLVM-MCA-END
147
# G19 finishes LD1R and starts LD2 (multiple structures).
148# LLVM-MCA-BEGIN G19
149ld1r  { v1.8h }, [x27], x28
150ld1r  { v1.16b }, [x27], x28
151ld2  { v1.2d, v2.2d }, [x27], #32
152ld2  { v1.2s, v2.2s }, [x27], #16
153ld2  { v1.4h, v2.4h }, [x27], #16
154# LLVM-MCA-END
155
# Regions G20-G27: the remaining LD2 multiple-structure forms, then LD2
# single-lane and LD2R (load and replicate).  All use the register pair
# v1/v2 and write back to x27, by immediate or by register x28.  Unlike the
# LD1 groups, the multiple-structure LD2 forms here have no .1d arrangement;
# LD2R does include it.  G27 ends with the first LD3 form.
156# LLVM-MCA-BEGIN G20
157ld2  { v1.4s, v2.4s }, [x27], #32
158ld2  { v1.8b, v2.8b }, [x27], #16
159ld2  { v1.8h, v2.8h }, [x27], #32
160ld2  { v1.16b, v2.16b }, [x27], #32
161ld2  { v1.2d, v2.2d }, [x27], x28
162# LLVM-MCA-END
163
164# LLVM-MCA-BEGIN G21
165ld2  { v1.2s, v2.2s }, [x27], x28
166ld2  { v1.4h, v2.4h }, [x27], x28
167ld2  { v1.4s, v2.4s }, [x27], x28
168ld2  { v1.8b, v2.8b }, [x27], x28
169ld2  { v1.8h, v2.8h }, [x27], x28
170# LLVM-MCA-END
171
# G22 finishes the multiple-structure forms and starts the lane forms.
172# LLVM-MCA-BEGIN G22
173ld2  { v1.16b, v2.16b }, [x27], x28
174ld2  { v1.b, v2.b }[0], [x27], #2
175ld2  { v1.b, v2.b }[8], [x27], #2
176ld2  { v1.b, v2.b }[0], [x27], x28
177ld2  { v1.b, v2.b }[8], [x27], x28
178# LLVM-MCA-END
179
180# LLVM-MCA-BEGIN G23
181ld2  { v1.h, v2.h }[0], [x27], #4
182ld2  { v1.h, v2.h }[4], [x27], #4
183ld2  { v1.h, v2.h }[0], [x27], x28
184ld2  { v1.h, v2.h }[4], [x27], x28
185ld2  { v1.s, v2.s }[0], [x27], #8
186# LLVM-MCA-END
187
# G24 finishes the lane forms and starts LD2R.
188# LLVM-MCA-BEGIN G24
189ld2  { v1.s, v2.s }[0], [x27], x28
190ld2  { v1.d, v2.d }[0], [x27], #16
191ld2  { v1.d, v2.d }[0], [x27], x28
192ld2r  { v1.1d, v2.1d }, [x27], #16
193ld2r  { v1.2d, v2.2d }, [x27], #16
194# LLVM-MCA-END
195
196# LLVM-MCA-BEGIN G25
197ld2r  { v1.2s, v2.2s }, [x27], #8
198ld2r  { v1.4h, v2.4h }, [x27], #4
199ld2r  { v1.4s, v2.4s }, [x27], #8
200ld2r  { v1.8b, v2.8b }, [x27], #2
201ld2r  { v1.8h, v2.8h }, [x27], #4
202# LLVM-MCA-END
203
204# LLVM-MCA-BEGIN G26
205ld2r  { v1.16b, v2.16b }, [x27], #2
206ld2r  { v1.1d, v2.1d }, [x27], x28
207ld2r  { v1.2d, v2.2d }, [x27], x28
208ld2r  { v1.2s, v2.2s }, [x27], x28
209ld2r  { v1.4h, v2.4h }, [x27], x28
210# LLVM-MCA-END
211
# G27 finishes LD2R; its last instruction is the first LD3 form.
212# LLVM-MCA-BEGIN G27
213ld2r  { v1.4s, v2.4s }, [x27], x28
214ld2r  { v1.8b, v2.8b }, [x27], x28
215ld2r  { v1.8h, v2.8h }, [x27], x28
216ld2r  { v1.16b, v2.16b }, [x27], x28
217ld3  { v1.2d, v2.2d, v3.2d }, [x27], #48
218# LLVM-MCA-END
219
# Regions G28-G36: the remaining LD3 multiple-structure forms, then LD3
# single-lane and LD3R (load and replicate), all on the register triple
# v1/v2/v3 with writeback to x27 (post-index immediate or register x28).
# G36 ends with the first LD4 multiple-structure forms.
220# LLVM-MCA-BEGIN G28
221ld3  { v1.2s, v2.2s, v3.2s }, [x27], #24
222ld3  { v1.4h, v2.4h, v3.4h }, [x27], #24
223ld3  { v1.4s, v2.4s, v3.4s }, [x27], #48
224ld3  { v1.8b, v2.8b, v3.8b }, [x27], #24
225ld3  { v1.8h, v2.8h, v3.8h }, [x27], #48
226# LLVM-MCA-END
227
228# LLVM-MCA-BEGIN G29
229ld3  { v1.16b, v2.16b, v3.16b }, [x27], #48
230ld3  { v1.2d, v2.2d, v3.2d }, [x27], x28
231ld3  { v1.2s, v2.2s, v3.2s }, [x27], x28
232ld3  { v1.4h, v2.4h, v3.4h }, [x27], x28
233ld3  { v1.4s, v2.4s, v3.4s }, [x27], x28
234# LLVM-MCA-END
235
# G30 finishes the multiple-structure forms and starts the lane forms.
236# LLVM-MCA-BEGIN G30
237ld3  { v1.8b, v2.8b, v3.8b }, [x27], x28
238ld3  { v1.8h, v2.8h, v3.8h }, [x27], x28
239ld3  { v1.16b, v2.16b, v3.16b }, [x27], x28
240ld3  { v1.b, v2.b, v3.b }[0], [x27], #3
241ld3  { v1.b, v2.b, v3.b }[8], [x27], #3
242# LLVM-MCA-END
243
244# LLVM-MCA-BEGIN G31
245ld3  { v1.b, v2.b, v3.b }[0], [x27], x28
246ld3  { v1.b, v2.b, v3.b }[8], [x27], x28
247ld3  { v1.h, v2.h, v3.h }[0], [x27], #6
248ld3  { v1.h, v2.h, v3.h }[4], [x27], #6
249ld3  { v1.h, v2.h, v3.h }[0], [x27], x28
250# LLVM-MCA-END
251
252# LLVM-MCA-BEGIN G32
253ld3  { v1.h, v2.h, v3.h }[4], [x27], x28
254ld3  { v1.s, v2.s, v3.s }[0], [x27], #12
255ld3  { v1.s, v2.s, v3.s }[0], [x27], x28
256ld3  { v1.d, v2.d, v3.d }[0], [x27], #24
257ld3  { v1.d, v2.d, v3.d }[0], [x27], x28
258# LLVM-MCA-END
259
# G33-G35 and the first instruction of G36: LD3R.  The immediate is three
# times the element size (3, 6, 12 or 24 bytes).
260# LLVM-MCA-BEGIN G33
261ld3r  { v1.1d, v2.1d, v3.1d }, [x27], #24
262ld3r  { v1.2d, v2.2d, v3.2d }, [x27], #24
263ld3r  { v1.2s, v2.2s, v3.2s }, [x27], #12
264ld3r  { v1.4h, v2.4h, v3.4h }, [x27], #6
265ld3r  { v1.4s, v2.4s, v3.4s }, [x27], #12
266# LLVM-MCA-END
267
268# LLVM-MCA-BEGIN G34
269ld3r  { v1.8b, v2.8b, v3.8b }, [x27], #3
270ld3r  { v1.8h, v2.8h, v3.8h }, [x27], #6
271ld3r  { v1.16b, v2.16b, v3.16b }, [x27], #3
272ld3r  { v1.1d, v2.1d, v3.1d }, [x27], x28
273ld3r  { v1.2d, v2.2d, v3.2d }, [x27], x28
274# LLVM-MCA-END
275
276# LLVM-MCA-BEGIN G35
277ld3r  { v1.2s, v2.2s, v3.2s }, [x27], x28
278ld3r  { v1.4h, v2.4h, v3.4h }, [x27], x28
279ld3r  { v1.4s, v2.4s, v3.4s }, [x27], x28
280ld3r  { v1.8b, v2.8b, v3.8b }, [x27], x28
281ld3r  { v1.8h, v2.8h, v3.8h }, [x27], x28
282# LLVM-MCA-END
283
# G36 finishes LD3R and starts LD4 (multiple structures).
284# LLVM-MCA-BEGIN G36
285ld3r  { v1.16b, v2.16b, v3.16b }, [x27], x28
286ld4  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
287ld4  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
288ld4  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
289ld4  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
290# LLVM-MCA-END
291
# Regions G37-G44: the remaining LD4 multiple-structure forms, then LD4
# single-lane and LD4R (load and replicate), all on v1..v4 with writeback to
# x27 (post-index immediate or register x28).  G44 ends with the first two
# LDP forms (post-index, s and d registers).
292# LLVM-MCA-BEGIN G37
293ld4  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
294ld4  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
295ld4  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
296ld4  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
297ld4  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
298# LLVM-MCA-END
299
300# LLVM-MCA-BEGIN G38
301ld4  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
302ld4  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
303ld4  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
304ld4  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
305ld4  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
306# LLVM-MCA-END
307
# G39-G41: LD4 single-lane forms.
308# LLVM-MCA-BEGIN G39
309ld4  { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
310ld4  { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
311ld4  { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
312ld4  { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
313ld4  { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
314# LLVM-MCA-END
315
316# LLVM-MCA-BEGIN G40
317ld4  { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
318ld4  { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
319ld4  { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
320ld4  { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
321ld4  { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
322# LLVM-MCA-END
323
# G41 finishes the lane forms and starts LD4R.
324# LLVM-MCA-BEGIN G41
325ld4  { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
326ld4  { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
327ld4r  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
328ld4r  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
329ld4r  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
330# LLVM-MCA-END
331
332# LLVM-MCA-BEGIN G42
333ld4r  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
334ld4r  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
335ld4r  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
336ld4r  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
337ld4r  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
338# LLVM-MCA-END
339
340# LLVM-MCA-BEGIN G43
341ld4r  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
342ld4r  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
343ld4r  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
344ld4r  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
345ld4r  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
346# LLVM-MCA-END
347
# G44 finishes LD4R and starts the load-pair (LDP) forms.
348# LLVM-MCA-BEGIN G44
349ld4r  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
350ld4r  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
351ld4r  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
352ldp  s1, s2, [x27], #248
353ldp  d1, d2, [x27], #496
354# LLVM-MCA-END
355
# Regions G45-G52: pair and single-register loads with writeback on x27.
# From here on both writeback forms appear: post-index (`[x27], #imm`) and
# pre-index (`[x27, #imm]!`).  Covered in order: LDP on FP/SIMD (s, d, q)
# and general (w, x) registers, LDPSW, LDR on FP/SIMD (b, h, s, d, q) and
# general (w, x) registers, then LDRB, LDRH, LDRSB, LDRSH and LDRSW.
# G52 ends with the first two ST1 forms.
356# LLVM-MCA-BEGIN G45
357ldp  q1, q2, [x27], #992
358ldp  s1, s2, [x27, #248]!
359ldp  d1, d2, [x27, #496]!
360ldp  q1, q2, [x27, #992]!
361ldp  w1, w2, [x27], #248
362# LLVM-MCA-END
363
364# LLVM-MCA-BEGIN G46
365ldp  x1, x2, [x27], #496
366ldp  w1, w2, [x27, #248]!
367ldp  x1, x2, [x27, #496]!
368ldpsw  x1, x2, [x27], #248
369ldpsw  x1, x2, [x27, #248]!
370# LLVM-MCA-END
371
# G47/G48: LDR into FP/SIMD registers, post-index then pre-index.
372# LLVM-MCA-BEGIN G47
373ldr  b1, [x27], #254
374ldr  h1, [x27], #254
375ldr  s1, [x27], #254
376ldr  d1, [x27], #254
377ldr  q1, [x27], #254
378# LLVM-MCA-END
379
380# LLVM-MCA-BEGIN G48
381ldr  b1, [x27, #254]!
382ldr  h1, [x27, #254]!
383ldr  s1, [x27, #254]!
384ldr  d1, [x27, #254]!
385ldr  q1, [x27, #254]!
386# LLVM-MCA-END
387
# G49-G52: LDR into general registers and the byte/halfword/word variants,
# including the sign-extending ones.
388# LLVM-MCA-BEGIN G49
389ldr  w1, [x27], #254
390ldr  x1, [x27], #254
391ldr  w1, [x27, #254]!
392ldr  x1, [x27, #254]!
393ldrb  w1, [x27], #254
394# LLVM-MCA-END
395
396# LLVM-MCA-BEGIN G50
397ldrb  w1, [x27, #254]!
398ldrh  w1, [x27], #254
399ldrh  w1, [x27, #254]!
400ldrsb  w1, [x27], #254
401ldrsb  x1, [x27], #254
402# LLVM-MCA-END
403
404# LLVM-MCA-BEGIN G51
405ldrsb  w1, [x27, #254]!
406ldrsb  x1, [x27, #254]!
407ldrsh  w1, [x27], #254
408ldrsh  x1, [x27], #254
409ldrsh  w1, [x27, #254]!
410# LLVM-MCA-END
411
# G52 finishes the scalar loads and starts the ST1 stores.
412# LLVM-MCA-BEGIN G52
413ldrsh  x1, [x27, #254]!
414ldrsw  x1, [x27], #254
415ldrsw  x1, [x27, #254]!
416st1  { v1.1d }, [x27], #8
417st1  { v1.2d }, [x27], #16
418# LLVM-MCA-END
419
# Regions G53-G67: ST1 stores with writeback on x27, in the same order as
# the LD1 loads at the top of the file: multiple-structure forms with one
# to four registers (v1..v4) across the eight arrangements, post-index by
# immediate and by register x28, then the single-lane forms.  G67 ends with
# the first ST2 form.
420# LLVM-MCA-BEGIN G53
421st1  { v1.2s }, [x27], #8
422st1  { v1.4h }, [x27], #8
423st1  { v1.4s }, [x27], #16
424st1  { v1.8b }, [x27], #8
425st1  { v1.8h }, [x27], #16
426# LLVM-MCA-END
427
428# LLVM-MCA-BEGIN G54
429st1  { v1.16b }, [x27], #16
430st1  { v1.1d }, [x27], x28
431st1  { v1.2d }, [x27], x28
432st1  { v1.2s }, [x27], x28
433st1  { v1.4h }, [x27], x28
434# LLVM-MCA-END
435
# G55 finishes the one-register forms; its last instruction starts the
# two-register lists.
436# LLVM-MCA-BEGIN G55
437st1  { v1.4s }, [x27], x28
438st1  { v1.8b }, [x27], x28
439st1  { v1.8h }, [x27], x28
440st1  { v1.16b }, [x27], x28
441st1  { v1.1d, v2.1d }, [x27], #16
442# LLVM-MCA-END
443
444# LLVM-MCA-BEGIN G56
445st1  { v1.2d, v2.2d }, [x27], #32
446st1  { v1.2s, v2.2s }, [x27], #16
447st1  { v1.4h, v2.4h }, [x27], #16
448st1  { v1.4s, v2.4s }, [x27], #32
449st1  { v1.8b, v2.8b }, [x27], #16
450# LLVM-MCA-END
451
452# LLVM-MCA-BEGIN G57
453st1  { v1.8h, v2.8h }, [x27], #32
454st1  { v1.16b, v2.16b }, [x27], #32
455st1  { v1.1d, v2.1d }, [x27], x28
456st1  { v1.2d, v2.2d }, [x27], x28
457st1  { v1.2s, v2.2s }, [x27], x28
458# LLVM-MCA-END
459
460# LLVM-MCA-BEGIN G58
461st1  { v1.4h, v2.4h }, [x27], x28
462st1  { v1.4s, v2.4s }, [x27], x28
463st1  { v1.8b, v2.8b }, [x27], x28
464st1  { v1.8h, v2.8h }, [x27], x28
465st1  { v1.16b, v2.16b }, [x27], x28
466# LLVM-MCA-END
467
# G59 starts the three-register lists.
468# LLVM-MCA-BEGIN G59
469st1  { v1.1d, v2.1d, v3.1d }, [x27], #24
470st1  { v1.2d, v2.2d, v3.2d }, [x27], #48
471st1  { v1.2s, v2.2s, v3.2s }, [x27], #24
472st1  { v1.4h, v2.4h, v3.4h }, [x27], #24
473st1  { v1.4s, v2.4s, v3.4s }, [x27], #48
474# LLVM-MCA-END
475
476# LLVM-MCA-BEGIN G60
477st1  { v1.8b, v2.8b, v3.8b }, [x27], #24
478st1  { v1.8h, v2.8h, v3.8h }, [x27], #48
479st1  { v1.16b, v2.16b, v3.16b }, [x27], #48
480st1  { v1.1d, v2.1d, v3.1d }, [x27], x28
481st1  { v1.2d, v2.2d, v3.2d }, [x27], x28
482# LLVM-MCA-END
483
484# LLVM-MCA-BEGIN G61
485st1  { v1.2s, v2.2s, v3.2s }, [x27], x28
486st1  { v1.4h, v2.4h, v3.4h }, [x27], x28
487st1  { v1.4s, v2.4s, v3.4s }, [x27], x28
488st1  { v1.8b, v2.8b, v3.8b }, [x27], x28
489st1  { v1.8h, v2.8h, v3.8h }, [x27], x28
490# LLVM-MCA-END
491
# G62 finishes the three-register forms and starts the four-register lists.
492# LLVM-MCA-BEGIN G62
493st1  { v1.16b, v2.16b, v3.16b }, [x27], x28
494st1  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
495st1  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
496st1  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
497st1  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
498# LLVM-MCA-END
499
500# LLVM-MCA-BEGIN G63
501st1  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
502st1  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
503st1  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
504st1  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
505st1  { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
506# LLVM-MCA-END
507
508# LLVM-MCA-BEGIN G64
509st1  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
510st1  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
511st1  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
512st1  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
513st1  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
514# LLVM-MCA-END
515
# G65 finishes the four-register forms and starts the single-lane forms.
516# LLVM-MCA-BEGIN G65
517st1  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
518st1  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
519st1  { v1.b }[0], [x27], #1
520st1  { v1.b }[8], [x27], #1
521st1  { v1.b }[0], [x27], x28
522# LLVM-MCA-END
523
524# LLVM-MCA-BEGIN G66
525st1  { v1.b }[8], [x27], x28
526st1  { v1.h }[0], [x27], #2
527st1  { v1.h }[4], [x27], #2
528st1  { v1.h }[0], [x27], x28
529st1  { v1.h }[4], [x27], x28
530# LLVM-MCA-END
531
# G67 finishes the lane forms; its last instruction is the first ST2 form.
532# LLVM-MCA-BEGIN G67
533st1  { v1.s }[0], [x27], #4
534st1  { v1.s }[0], [x27], x28
535st1  { v1.d }[0], [x27], #8
536st1  { v1.d }[0], [x27], x28
537st2  { v1.2d, v2.2d }, [x27], #32
538# LLVM-MCA-END
539
# Regions G68-G72: the remaining ST2 multiple-structure forms followed by
# the ST2 single-lane forms, all on the register pair v1/v2 with writeback
# to x27 (post-index immediate or register x28).
540# LLVM-MCA-BEGIN G68
541st2  { v1.2s, v2.2s }, [x27], #16
542st2  { v1.4h, v2.4h }, [x27], #16
543st2  { v1.4s, v2.4s }, [x27], #32
544st2  { v1.8b, v2.8b }, [x27], #16
545st2  { v1.8h, v2.8h }, [x27], #32
546# LLVM-MCA-END
547
548# LLVM-MCA-BEGIN G69
549st2  { v1.16b, v2.16b }, [x27], #32
550st2  { v1.2d, v2.2d }, [x27], x28
551st2  { v1.2s, v2.2s }, [x27], x28
552st2  { v1.4h, v2.4h }, [x27], x28
553st2  { v1.4s, v2.4s }, [x27], x28
554# LLVM-MCA-END
555
# G70 finishes the multiple-structure forms and starts the lane forms.
556# LLVM-MCA-BEGIN G70
557st2  { v1.8b, v2.8b }, [x27], x28
558st2  { v1.8h, v2.8h }, [x27], x28
559st2  { v1.16b, v2.16b }, [x27], x28
560st2  { v1.b, v2.b }[0], [x27], #2
561st2  { v1.b, v2.b }[8], [x27], #2
562# LLVM-MCA-END
563
564# LLVM-MCA-BEGIN G71
565st2  { v1.b, v2.b }[0], [x27], x28
566st2  { v1.b, v2.b }[8], [x27], x28
567st2  { v1.h, v2.h }[0], [x27], #4
568st2  { v1.h, v2.h }[4], [x27], #4
569st2  { v1.h, v2.h }[0], [x27], x28
570# LLVM-MCA-END
571
572# LLVM-MCA-BEGIN G72
573st2  { v1.h, v2.h }[4], [x27], x28
574st2  { v1.s, v2.s }[0], [x27], #8
575st2  { v1.s, v2.s }[0], [x27], x28
576st2  { v1.d, v2.d }[0], [x27], #16
577st2  { v1.d, v2.d }[0], [x27], x28
578# LLVM-MCA-END
579
# Regions G73-G78: ST3 multiple-structure and single-lane forms on the
# register triple v1/v2/v3, with writeback to x27 (post-index immediate or
# register x28).  G78 ends with the first two ST4 forms.
# Note that G73 holds only three instructions, unlike the five-instruction
# regions around it.
580# LLVM-MCA-BEGIN G73
581st3  { v1.2d, v2.2d, v3.2d }, [x27], #48
582st3  { v1.2s, v2.2s, v3.2s }, [x27], #24
583st3  { v1.4h, v2.4h, v3.4h }, [x27], #24
584# LLVM-MCA-END
585
586# LLVM-MCA-BEGIN G74
587st3  { v1.4s, v2.4s, v3.4s }, [x27], #48
588st3  { v1.8b, v2.8b, v3.8b }, [x27], #24
589st3  { v1.8h, v2.8h, v3.8h }, [x27], #48
590st3  { v1.16b, v2.16b, v3.16b }, [x27], #48
591st3  { v1.2d, v2.2d, v3.2d }, [x27], x28
592# LLVM-MCA-END
593
594# LLVM-MCA-BEGIN G75
595st3  { v1.2s, v2.2s, v3.2s }, [x27], x28
596st3  { v1.4h, v2.4h, v3.4h }, [x27], x28
597st3  { v1.4s, v2.4s, v3.4s }, [x27], x28
598st3  { v1.8b, v2.8b, v3.8b }, [x27], x28
599st3  { v1.8h, v2.8h, v3.8h }, [x27], x28
600# LLVM-MCA-END
601
# G76 finishes the multiple-structure forms and starts the lane forms.
602# LLVM-MCA-BEGIN G76
603st3  { v1.16b, v2.16b, v3.16b }, [x27], x28
604st3  { v1.b, v2.b, v3.b }[0], [x27], #3
605st3  { v1.b, v2.b, v3.b }[8], [x27], #3
606st3  { v1.b, v2.b, v3.b }[0], [x27], x28
607st3  { v1.b, v2.b, v3.b }[8], [x27], x28
608# LLVM-MCA-END
609
610# LLVM-MCA-BEGIN G77
611st3  { v1.h, v2.h, v3.h }[0], [x27], #6
612st3  { v1.h, v2.h, v3.h }[4], [x27], #6
613st3  { v1.h, v2.h, v3.h }[0], [x27], x28
614st3  { v1.h, v2.h, v3.h }[4], [x27], x28
615st3  { v1.s, v2.s, v3.s }[0], [x27], #12
616# LLVM-MCA-END
617
# G78 finishes the ST3 lane forms and starts ST4 (multiple structures).
618# LLVM-MCA-BEGIN G78
619st3  { v1.s, v2.s, v3.s }[0], [x27], x28
620st3  { v1.d, v2.d, v3.d }[0], [x27], #24
621st3  { v1.d, v2.d, v3.d }[0], [x27], x28
622st4  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
623st4  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
624# LLVM-MCA-END
625
# Regions G79-G83: the remaining ST4 multiple-structure forms followed by
# the ST4 single-lane forms, all on v1..v4 with writeback to x27 (post-index
# immediate or register x28).  G83 holds four instructions rather than five.
626# LLVM-MCA-BEGIN G79
627st4  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
628st4  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
629st4  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
630st4  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
631st4  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
632# LLVM-MCA-END
633
634# LLVM-MCA-BEGIN G80
635st4  { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
636st4  { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
637st4  { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
638st4  { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
639st4  { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
640# LLVM-MCA-END
641
# G81 finishes the multiple-structure forms and starts the lane forms.
642# LLVM-MCA-BEGIN G81
643st4  { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
644st4  { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
645st4  { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
646st4  { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
647st4  { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
648# LLVM-MCA-END
649
650# LLVM-MCA-BEGIN G82
651st4  { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
652st4  { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
653st4  { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
654st4  { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
655st4  { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
656# LLVM-MCA-END
657
658# LLVM-MCA-BEGIN G83
659st4  { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
660st4  { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
661st4  { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
662st4  { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
663# LLVM-MCA-END
664
# Regions G84-G91: pair and single-register stores with writeback on x27,
# in post-index (`[x27], #imm`) and pre-index (`[x27, #imm]!`) forms: STP
# on FP/SIMD (s, d, q) and general (w, x) registers, STR on FP/SIMD
# (b, h, s, d, q) and general (w, x) registers, then STRB and STRH.
# Several of these regions are shorter than five instructions (G84 has two,
# G90 has one, G91 has two).
665# LLVM-MCA-BEGIN G84
666stp  s1, s2, [x27], #248
667stp  d1, d2, [x27], #496
668# LLVM-MCA-END
669
670# LLVM-MCA-BEGIN G85
671stp  q1, q2, [x27], #992
672stp  s1, s2, [x27, #248]!
673stp  d1, d2, [x27, #496]!
674stp  q1, q2, [x27, #992]!
675stp  w1, w2, [x27], #248
676# LLVM-MCA-END
677
# G86 finishes STP and starts STR from FP/SIMD registers.
678# LLVM-MCA-BEGIN G86
679stp  x1, x2, [x27], #496
680stp  w1, w2, [x27, #248]!
681stp  x1, x2, [x27, #496]!
682str  b1, [x27], #254
683str  h1, [x27], #254
684# LLVM-MCA-END
685
686# LLVM-MCA-BEGIN G87
687str  s1, [x27], #254
688str  d1, [x27], #254
689str  q1, [x27], #254
690str  b1, [x27, #254]!
691str  h1, [x27, #254]!
692# LLVM-MCA-END
693
# G88 finishes the FP/SIMD STR forms and starts STR from general registers.
694# LLVM-MCA-BEGIN G88
695str  s1, [x27, #254]!
696str  d1, [x27, #254]!
697str  q1, [x27, #254]!
698str  w1, [x27], #254
699str  x1, [x27], #254
700# LLVM-MCA-END
701
702# LLVM-MCA-BEGIN G89
703str  w1, [x27, #254]!
704str  x1, [x27, #254]!
705strb  w1, [x27], #254
706strb  w1, [x27, #254]!
707strh  w1, [x27], #254
708# LLVM-MCA-END
709
710# LLVM-MCA-BEGIN G90
711strh  w1, [x27, #254]!
712# LLVM-MCA-END
713
# G91 differs from every region above: the second load uses x1 as its base,
# and x1 is the destination of the first load, so the second instruction
# depends on the loaded value rather than only on the written-back x27.
714# LLVM-MCA-BEGIN G91
715ldr  x1, [x27], #254
716ldr  x2, [x1], #254
717# LLVM-MCA-END
718
719# CHECK:      [0] Code Region - G01
720
721# CHECK:      Iterations:        100
722# CHECK-NEXT: Instructions:      500
723# CHECK-NEXT: Total Cycles:      507
724# CHECK-NEXT: Total uOps:        1000
725
726# CHECK:      Dispatch Width:    4
727# CHECK-NEXT: uOps Per Cycle:    1.97
728# CHECK-NEXT: IPC:               0.99
729# CHECK-NEXT: Block RThroughput: 2.5
730
731# CHECK:      Timeline view:
732# CHECK-NEXT:                     01
733# CHECK-NEXT: Index     0123456789
734
735# CHECK:      [0,0]     DeeeeeER  ..   ld1	{ v1.1d }, [x27], #8
736# CHECK-NEXT: [0,1]     D=eeeeeER ..   ld1	{ v1.2d }, [x27], #16
737# CHECK-NEXT: [0,2]     .D=eeeeeER..   ld1	{ v1.2s }, [x27], #8
738# CHECK-NEXT: [0,3]     .D==eeeeeER.   ld1	{ v1.4h }, [x27], #8
739# CHECK-NEXT: [0,4]     . D==eeeeeER   ld1	{ v1.4s }, [x27], #16
740
741# CHECK:      Average Wait times (based on the timeline view):
742# CHECK-NEXT: [0]: Executions
743# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
744# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
745# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
746
747# CHECK:            [0]    [1]    [2]    [3]
748# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.1d }, [x27], #8
749# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ld1	{ v1.2d }, [x27], #16
750# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ld1	{ v1.2s }, [x27], #8
751# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ld1	{ v1.4h }, [x27], #8
752# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ld1	{ v1.4s }, [x27], #16
753# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
754
755# CHECK:      [1] Code Region - G02
756
757# CHECK:      Iterations:        100
758# CHECK-NEXT: Instructions:      500
759# CHECK-NEXT: Total Cycles:      507
760# CHECK-NEXT: Total uOps:        1000
761
762# CHECK:      Dispatch Width:    4
763# CHECK-NEXT: uOps Per Cycle:    1.97
764# CHECK-NEXT: IPC:               0.99
765# CHECK-NEXT: Block RThroughput: 2.5
766
767# CHECK:      Timeline view:
768# CHECK-NEXT:                     01
769# CHECK-NEXT: Index     0123456789
770
771# CHECK:      [0,0]     DeeeeeER  ..   ld1	{ v1.8b }, [x27], #8
772# CHECK-NEXT: [0,1]     D=eeeeeER ..   ld1	{ v1.8h }, [x27], #16
773# CHECK-NEXT: [0,2]     .D=eeeeeER..   ld1	{ v1.16b }, [x27], #16
774# CHECK-NEXT: [0,3]     .D==eeeeeER.   ld1	{ v1.1d }, [x27], x28
775# CHECK-NEXT: [0,4]     . D==eeeeeER   ld1	{ v1.2d }, [x27], x28
776
777# CHECK:      Average Wait times (based on the timeline view):
778# CHECK-NEXT: [0]: Executions
779# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
780# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
781# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
782
783# CHECK:            [0]    [1]    [2]    [3]
784# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.8b }, [x27], #8
785# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ld1	{ v1.8h }, [x27], #16
786# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ld1	{ v1.16b }, [x27], #16
787# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ld1	{ v1.1d }, [x27], x28
788# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ld1	{ v1.2d }, [x27], x28
789# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
790
791# CHECK:      [2] Code Region - G03
792
793# CHECK:      Iterations:        100
794# CHECK-NEXT: Instructions:      500
795# CHECK-NEXT: Total Cycles:      507
796# CHECK-NEXT: Total uOps:        1000
797
798# CHECK:      Dispatch Width:    4
799# CHECK-NEXT: uOps Per Cycle:    1.97
800# CHECK-NEXT: IPC:               0.99
801# CHECK-NEXT: Block RThroughput: 2.5
802
803# CHECK:      Timeline view:
804# CHECK-NEXT:                     01
805# CHECK-NEXT: Index     0123456789
806
807# CHECK:      [0,0]     DeeeeeER  ..   ld1	{ v1.2s }, [x27], x28
808# CHECK-NEXT: [0,1]     D=eeeeeER ..   ld1	{ v1.4h }, [x27], x28
809# CHECK-NEXT: [0,2]     .D=eeeeeER..   ld1	{ v1.4s }, [x27], x28
810# CHECK-NEXT: [0,3]     .D==eeeeeER.   ld1	{ v1.8b }, [x27], x28
811# CHECK-NEXT: [0,4]     . D==eeeeeER   ld1	{ v1.8h }, [x27], x28
812
813# CHECK:      Average Wait times (based on the timeline view):
814# CHECK-NEXT: [0]: Executions
815# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
816# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
817# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
818
819# CHECK:            [0]    [1]    [2]    [3]
820# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.2s }, [x27], x28
821# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ld1	{ v1.4h }, [x27], x28
822# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ld1	{ v1.4s }, [x27], x28
823# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ld1	{ v1.8b }, [x27], x28
824# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ld1	{ v1.8h }, [x27], x28
825# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
826
827# CHECK:      [3] Code Region - G04
828
829# CHECK:      Iterations:        100
830# CHECK-NEXT: Instructions:      500
831# CHECK-NEXT: Total Cycles:      507
832# CHECK-NEXT: Total uOps:        1000
833
834# CHECK:      Dispatch Width:    4
835# CHECK-NEXT: uOps Per Cycle:    1.97
836# CHECK-NEXT: IPC:               0.99
837# CHECK-NEXT: Block RThroughput: 2.5
838
839# CHECK:      Timeline view:
840# CHECK-NEXT:                     01
841# CHECK-NEXT: Index     0123456789
842
843# CHECK:      [0,0]     DeeeeeER  ..   ld1	{ v1.16b }, [x27], x28
844# CHECK-NEXT: [0,1]     D=eeeeeER ..   ld1	{ v1.1d, v2.1d }, [x27], #16
845# CHECK-NEXT: [0,2]     .D=eeeeeER..   ld1	{ v1.2d, v2.2d }, [x27], #32
846# CHECK-NEXT: [0,3]     .D==eeeeeER.   ld1	{ v1.2s, v2.2s }, [x27], #16
847# CHECK-NEXT: [0,4]     . D==eeeeeER   ld1	{ v1.4h, v2.4h }, [x27], #16
848
849# CHECK:      Average Wait times (based on the timeline view):
850# CHECK-NEXT: [0]: Executions
851# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
852# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
853# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
854
855# CHECK:            [0]    [1]    [2]    [3]
856# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.16b }, [x27], x28
857# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ld1	{ v1.1d, v2.1d }, [x27], #16
858# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ld1	{ v1.2d, v2.2d }, [x27], #32
859# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ld1	{ v1.2s, v2.2s }, [x27], #16
860# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ld1	{ v1.4h, v2.4h }, [x27], #16
861# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
862
863# CHECK:      [4] Code Region - G05
864
865# CHECK:      Iterations:        100
866# CHECK-NEXT: Instructions:      500
867# CHECK-NEXT: Total Cycles:      507
868# CHECK-NEXT: Total uOps:        1000
869
870# CHECK:      Dispatch Width:    4
871# CHECK-NEXT: uOps Per Cycle:    1.97
872# CHECK-NEXT: IPC:               0.99
873# CHECK-NEXT: Block RThroughput: 2.5
874
875# CHECK:      Timeline view:
876# CHECK-NEXT:                     01
877# CHECK-NEXT: Index     0123456789
878
879# CHECK:      [0,0]     DeeeeeER  ..   ld1	{ v1.4s, v2.4s }, [x27], #32
880# CHECK-NEXT: [0,1]     D=eeeeeER ..   ld1	{ v1.8b, v2.8b }, [x27], #16
881# CHECK-NEXT: [0,2]     .D=eeeeeER..   ld1	{ v1.8h, v2.8h }, [x27], #32
882# CHECK-NEXT: [0,3]     .D==eeeeeER.   ld1	{ v1.16b, v2.16b }, [x27], #32
883# CHECK-NEXT: [0,4]     . D==eeeeeER   ld1	{ v1.1d, v2.1d }, [x27], x28
884
885# CHECK:      Average Wait times (based on the timeline view):
886# CHECK-NEXT: [0]: Executions
887# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
888# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
889# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
890
891# CHECK:            [0]    [1]    [2]    [3]
892# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.4s, v2.4s }, [x27], #32
893# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ld1	{ v1.8b, v2.8b }, [x27], #16
894# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ld1	{ v1.8h, v2.8h }, [x27], #32
895# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ld1	{ v1.16b, v2.16b }, [x27], #32
896# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ld1	{ v1.1d, v2.1d }, [x27], x28
897# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
898
899# CHECK:      [5] Code Region - G06
900
901# CHECK:      Iterations:        100
902# CHECK-NEXT: Instructions:      500
903# CHECK-NEXT: Total Cycles:      507
904# CHECK-NEXT: Total uOps:        1000
905
906# CHECK:      Dispatch Width:    4
907# CHECK-NEXT: uOps Per Cycle:    1.97
908# CHECK-NEXT: IPC:               0.99
909# CHECK-NEXT: Block RThroughput: 2.5
910
911# CHECK:      Timeline view:
912# CHECK-NEXT:                     01
913# CHECK-NEXT: Index     0123456789
914
915# CHECK:      [0,0]     DeeeeeER  ..   ld1	{ v1.2d, v2.2d }, [x27], x28
916# CHECK-NEXT: [0,1]     D=eeeeeER ..   ld1	{ v1.2s, v2.2s }, [x27], x28
917# CHECK-NEXT: [0,2]     .D=eeeeeER..   ld1	{ v1.4h, v2.4h }, [x27], x28
918# CHECK-NEXT: [0,3]     .D==eeeeeER.   ld1	{ v1.4s, v2.4s }, [x27], x28
919# CHECK-NEXT: [0,4]     . D==eeeeeER   ld1	{ v1.8b, v2.8b }, [x27], x28
920
921# CHECK:      Average Wait times (based on the timeline view):
922# CHECK-NEXT: [0]: Executions
923# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
924# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
925# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
926
927# CHECK:            [0]    [1]    [2]    [3]
928# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.2d, v2.2d }, [x27], x28
929# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ld1	{ v1.2s, v2.2s }, [x27], x28
930# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ld1	{ v1.4h, v2.4h }, [x27], x28
931# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ld1	{ v1.4s, v2.4s }, [x27], x28
932# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ld1	{ v1.8b, v2.8b }, [x27], x28
933# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
934
935# CHECK:      [6] Code Region - G07
936
937# CHECK:      Iterations:        100
938# CHECK-NEXT: Instructions:      500
939# CHECK-NEXT: Total Cycles:      608
940# CHECK-NEXT: Total uOps:        1600
941
942# CHECK:      Dispatch Width:    4
943# CHECK-NEXT: uOps Per Cycle:    2.63
944# CHECK-NEXT: IPC:               0.82
945# CHECK-NEXT: Block RThroughput: 5.5
946
947# CHECK:      Timeline view:
948# CHECK-NEXT:                     0123
949# CHECK-NEXT: Index     0123456789
950
951# CHECK:      [0,0]     DeeeeeER  .  .   ld1	{ v1.8h, v2.8h }, [x27], x28
952# CHECK-NEXT: [0,1]     D=eeeeeER .  .   ld1	{ v1.16b, v2.16b }, [x27], x28
953# CHECK-NEXT: [0,2]     .D=eeeeeeER  .   ld1	{ v1.1d, v2.1d, v3.1d }, [x27], #24
954# CHECK-NEXT: [0,3]     . D=eeeeeeER .   ld1	{ v1.2d, v2.2d, v3.2d }, [x27], #48
955# CHECK-NEXT: [0,4]     .  D==eeeeeeER   ld1	{ v1.2s, v2.2s, v3.2s }, [x27], #24
956
957# CHECK:      Average Wait times (based on the timeline view):
958# CHECK-NEXT: [0]: Executions
959# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
960# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
961# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
962
963# CHECK:            [0]    [1]    [2]    [3]
964# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.8h, v2.8h }, [x27], x28
965# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ld1	{ v1.16b, v2.16b }, [x27], x28
966# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ld1	{ v1.1d, v2.1d, v3.1d }, [x27], #24
967# CHECK-NEXT: 3.     1     2.0    0.0    0.0       ld1	{ v1.2d, v2.2d, v3.2d }, [x27], #48
968# CHECK-NEXT: 4.     1     3.0    1.0    0.0       ld1	{ v1.2s, v2.2s, v3.2s }, [x27], #24
969# CHECK-NEXT:        1     2.0    0.4    0.0       <total>
970
971# CHECK:      [7] Code Region - G08
972
973# CHECK:      Iterations:        100
974# CHECK-NEXT: Instructions:      500
975# CHECK-NEXT: Total Cycles:      757
976# CHECK-NEXT: Total uOps:        2000
977
978# CHECK:      Dispatch Width:    4
979# CHECK-NEXT: uOps Per Cycle:    2.64
980# CHECK-NEXT: IPC:               0.66
981# CHECK-NEXT: Block RThroughput: 7.5
982
983# CHECK:      Timeline view:
984# CHECK-NEXT:                     01234
985# CHECK-NEXT: Index     0123456789
986
987# CHECK:      [0,0]     DeeeeeeER .   .   ld1	{ v1.4h, v2.4h, v3.4h }, [x27], #24
988# CHECK-NEXT: [0,1]     .DeeeeeeER.   .   ld1	{ v1.4s, v2.4s, v3.4s }, [x27], #48
989# CHECK-NEXT: [0,2]     . D=eeeeeeER  .   ld1	{ v1.8b, v2.8b, v3.8b }, [x27], #24
990# CHECK-NEXT: [0,3]     .  D=eeeeeeER .   ld1	{ v1.8h, v2.8h, v3.8h }, [x27], #48
991# CHECK-NEXT: [0,4]     .   D==eeeeeeER   ld1	{ v1.16b, v2.16b, v3.16b }, [x27], #48
992
993# CHECK:      Average Wait times (based on the timeline view):
994# CHECK-NEXT: [0]: Executions
995# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
996# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
997# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
998
999# CHECK:            [0]    [1]    [2]    [3]
1000# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.4h, v2.4h, v3.4h }, [x27], #24
1001# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1	{ v1.4s, v2.4s, v3.4s }, [x27], #48
1002# CHECK-NEXT: 2.     1     2.0    1.0    0.0       ld1	{ v1.8b, v2.8b, v3.8b }, [x27], #24
1003# CHECK-NEXT: 3.     1     2.0    0.0    0.0       ld1	{ v1.8h, v2.8h, v3.8h }, [x27], #48
1004# CHECK-NEXT: 4.     1     3.0    1.0    0.0       ld1	{ v1.16b, v2.16b, v3.16b }, [x27], #48
1005# CHECK-NEXT:        1     1.8    0.6    0.0       <total>
1006
1007# CHECK:      [8] Code Region - G09
1008
1009# CHECK:      Iterations:        100
1010# CHECK-NEXT: Instructions:      500
1011# CHECK-NEXT: Total Cycles:      757
1012# CHECK-NEXT: Total uOps:        2000
1013
1014# CHECK:      Dispatch Width:    4
1015# CHECK-NEXT: uOps Per Cycle:    2.64
1016# CHECK-NEXT: IPC:               0.66
1017# CHECK-NEXT: Block RThroughput: 7.5
1018
1019# CHECK:      Timeline view:
1020# CHECK-NEXT:                     01234
1021# CHECK-NEXT: Index     0123456789
1022
1023# CHECK:      [0,0]     DeeeeeeER .   .   ld1	{ v1.1d, v2.1d, v3.1d }, [x27], x28
1024# CHECK-NEXT: [0,1]     .DeeeeeeER.   .   ld1	{ v1.2d, v2.2d, v3.2d }, [x27], x28
1025# CHECK-NEXT: [0,2]     . D=eeeeeeER  .   ld1	{ v1.2s, v2.2s, v3.2s }, [x27], x28
1026# CHECK-NEXT: [0,3]     .  D=eeeeeeER .   ld1	{ v1.4h, v2.4h, v3.4h }, [x27], x28
1027# CHECK-NEXT: [0,4]     .   D==eeeeeeER   ld1	{ v1.4s, v2.4s, v3.4s }, [x27], x28
1028
1029# CHECK:      Average Wait times (based on the timeline view):
1030# CHECK-NEXT: [0]: Executions
1031# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1032# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1033# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1034
1035# CHECK:            [0]    [1]    [2]    [3]
1036# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.1d, v2.1d, v3.1d }, [x27], x28
1037# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1	{ v1.2d, v2.2d, v3.2d }, [x27], x28
1038# CHECK-NEXT: 2.     1     2.0    1.0    0.0       ld1	{ v1.2s, v2.2s, v3.2s }, [x27], x28
1039# CHECK-NEXT: 3.     1     2.0    0.0    0.0       ld1	{ v1.4h, v2.4h, v3.4h }, [x27], x28
1040# CHECK-NEXT: 4.     1     3.0    1.0    0.0       ld1	{ v1.4s, v2.4s, v3.4s }, [x27], x28
1041# CHECK-NEXT:        1     1.8    0.6    0.0       <total>
1042
1043# CHECK:      [9] Code Region - G10
1044
1045# CHECK:      Iterations:        100
1046# CHECK-NEXT: Instructions:      500
1047# CHECK-NEXT: Total Cycles:      708
1048# CHECK-NEXT: Total uOps:        1800
1049
1050# CHECK:      Dispatch Width:    4
1051# CHECK-NEXT: uOps Per Cycle:    2.54
1052# CHECK-NEXT: IPC:               0.71
1053# CHECK-NEXT: Block RThroughput: 6.5
1054
1055# CHECK:      Timeline view:
1056# CHECK-NEXT:                     01234
1057# CHECK-NEXT: Index     0123456789
1058
1059# CHECK:      [0,0]     DeeeeeeER .   .   ld1	{ v1.8b, v2.8b, v3.8b }, [x27], x28
1060# CHECK-NEXT: [0,1]     .DeeeeeeER.   .   ld1	{ v1.8h, v2.8h, v3.8h }, [x27], x28
1061# CHECK-NEXT: [0,2]     . D=eeeeeeER  .   ld1	{ v1.16b, v2.16b, v3.16b }, [x27], x28
1062# CHECK-NEXT: [0,3]     .  D=eeeeeeER .   ld1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
1063# CHECK-NEXT: [0,4]     .   D==eeeeeeER   ld1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
1064
1065# CHECK:      Average Wait times (based on the timeline view):
1066# CHECK-NEXT: [0]: Executions
1067# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1068# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1069# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1070
1071# CHECK:            [0]    [1]    [2]    [3]
1072# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.8b, v2.8b, v3.8b }, [x27], x28
1073# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1	{ v1.8h, v2.8h, v3.8h }, [x27], x28
1074# CHECK-NEXT: 2.     1     2.0    1.0    0.0       ld1	{ v1.16b, v2.16b, v3.16b }, [x27], x28
1075# CHECK-NEXT: 3.     1     2.0    0.0    0.0       ld1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
1076# CHECK-NEXT: 4.     1     3.0    1.0    0.0       ld1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
1077# CHECK-NEXT:        1     1.8    0.6    0.0       <total>
1078
1079# CHECK:      [10] Code Region - G11
1080
1081# CHECK:      Iterations:        100
1082# CHECK-NEXT: Instructions:      500
1083# CHECK-NEXT: Total Cycles:      508
1084# CHECK-NEXT: Total uOps:        1500
1085
1086# CHECK:      Dispatch Width:    4
1087# CHECK-NEXT: uOps Per Cycle:    2.95
1088# CHECK-NEXT: IPC:               0.98
1089# CHECK-NEXT: Block RThroughput: 5.0
1090
1091# CHECK:      Timeline view:
1092# CHECK-NEXT:                     012
1093# CHECK-NEXT: Index     0123456789
1094
1095# CHECK:      [0,0]     DeeeeeeER . .   ld1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
1096# CHECK-NEXT: [0,1]     .DeeeeeeER. .   ld1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
1097# CHECK-NEXT: [0,2]     . DeeeeeeER .   ld1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
1098# CHECK-NEXT: [0,3]     .  DeeeeeeER.   ld1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
1099# CHECK-NEXT: [0,4]     .   DeeeeeeER   ld1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
1100
1101# CHECK:      Average Wait times (based on the timeline view):
1102# CHECK-NEXT: [0]: Executions
1103# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1104# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1105# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1106
1107# CHECK:            [0]    [1]    [2]    [3]
1108# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
1109# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
1110# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
1111# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
1112# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
1113# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1114
1115# CHECK:      [11] Code Region - G12
1116
1117# CHECK:      Iterations:        100
1118# CHECK-NEXT: Instructions:      500
1119# CHECK-NEXT: Total Cycles:      508
1120# CHECK-NEXT: Total uOps:        1500
1121
1122# CHECK:      Dispatch Width:    4
1123# CHECK-NEXT: uOps Per Cycle:    2.95
1124# CHECK-NEXT: IPC:               0.98
1125# CHECK-NEXT: Block RThroughput: 5.0
1126
1127# CHECK:      Timeline view:
1128# CHECK-NEXT:                     012
1129# CHECK-NEXT: Index     0123456789
1130
1131# CHECK:      [0,0]     DeeeeeeER . .   ld1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
1132# CHECK-NEXT: [0,1]     .DeeeeeeER. .   ld1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
1133# CHECK-NEXT: [0,2]     . DeeeeeeER .   ld1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
1134# CHECK-NEXT: [0,3]     .  DeeeeeeER.   ld1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
1135# CHECK-NEXT: [0,4]     .   DeeeeeeER   ld1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
1136
1137# CHECK:      Average Wait times (based on the timeline view):
1138# CHECK-NEXT: [0]: Executions
1139# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1140# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1141# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1142
1143# CHECK:            [0]    [1]    [2]    [3]
1144# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
1145# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
1146# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
1147# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
1148# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
1149# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1150
1151# CHECK:      [12] Code Region - G13
1152
1153# CHECK:      Iterations:        100
1154# CHECK-NEXT: Instructions:      500
1155# CHECK-NEXT: Total Cycles:      1009
1156# CHECK-NEXT: Total uOps:        1500
1157
1158# CHECK:      Dispatch Width:    4
1159# CHECK-NEXT: uOps Per Cycle:    1.49
1160# CHECK-NEXT: IPC:               0.50
1161# CHECK-NEXT: Block RThroughput: 4.5
1162
1163# CHECK:      Timeline view:
1164# CHECK-NEXT:                     012345678
1165# CHECK-NEXT: Index     0123456789
1166
1167# CHECK:      [0,0]     DeeeeeeER .    .  .   ld1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
1168# CHECK-NEXT: [0,1]     .DeeeeeeER.    .  .   ld1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
1169# CHECK-NEXT: [0,2]     . DeeeeeeER    .  .   ld1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
1170# CHECK-NEXT: [0,3]     .  DeeeeeeER   .  .   ld1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
1171# CHECK-NEXT: [0,4]     .   D=====eeeeeeeER   ld1	{ v1.b }[0], [x27], #1
1172
1173# CHECK:      Average Wait times (based on the timeline view):
1174# CHECK-NEXT: [0]: Executions
1175# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1176# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1177# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1178
1179# CHECK:            [0]    [1]    [2]    [3]
1180# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
1181# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
1182# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
1183# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
1184# CHECK-NEXT: 4.     1     6.0    0.0    0.0       ld1	{ v1.b }[0], [x27], #1
1185# CHECK-NEXT:        1     2.0    0.2    0.0       <total>
1186
1187# CHECK:      [13] Code Region - G14
1188
1189# CHECK:      Iterations:        100
1190# CHECK-NEXT: Instructions:      500
1191# CHECK-NEXT: Total Cycles:      3503
1192# CHECK-NEXT: Total uOps:        1500
1193
1194# CHECK:      Dispatch Width:    4
1195# CHECK-NEXT: uOps Per Cycle:    0.43
1196# CHECK-NEXT: IPC:               0.14
1197# CHECK-NEXT: Block RThroughput: 3.8
1198
1199# CHECK:      Timeline view:
1200# CHECK-NEXT:                     0123456789          01234567
1201# CHECK-NEXT: Index     0123456789          0123456789
1202
1203# CHECK:      [0,0]     DeeeeeeeER.    .    .    .    .    . .   ld1	{ v1.b }[8], [x27], #1
1204# CHECK-NEXT: [0,1]     .D======eeeeeeeER   .    .    .    . .   ld1	{ v1.b }[0], [x27], x28
1205# CHECK-NEXT: [0,2]     . D============eeeeeeeER .    .    . .   ld1	{ v1.b }[8], [x27], x28
1206# CHECK-NEXT: [0,3]     .  D==================eeeeeeeER    . .   ld1	{ v1.h }[0], [x27], #2
1207# CHECK-NEXT: [0,4]     .   D========================eeeeeeeER   ld1	{ v1.h }[4], [x27], #2
1208
1209# CHECK:      Average Wait times (based on the timeline view):
1210# CHECK-NEXT: [0]: Executions
1211# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1212# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1213# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1214
1215# CHECK:            [0]    [1]    [2]    [3]
1216# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.b }[8], [x27], #1
1217# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld1	{ v1.b }[0], [x27], x28
1218# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld1	{ v1.b }[8], [x27], x28
1219# CHECK-NEXT: 3.     1     19.0   0.0    0.0       ld1	{ v1.h }[0], [x27], #2
1220# CHECK-NEXT: 4.     1     25.0   0.0    0.0       ld1	{ v1.h }[4], [x27], #2
1221# CHECK-NEXT:        1     13.0   0.2    0.0       <total>
1222
1223# CHECK:      [14] Code Region - G15
1224
1225# CHECK:      Iterations:        100
1226# CHECK-NEXT: Instructions:      500
1227# CHECK-NEXT: Total Cycles:      3503
1228# CHECK-NEXT: Total uOps:        1500
1229
1230# CHECK:      Dispatch Width:    4
1231# CHECK-NEXT: uOps Per Cycle:    0.43
1232# CHECK-NEXT: IPC:               0.14
1233# CHECK-NEXT: Block RThroughput: 3.8
1234
1235# CHECK:      Timeline view:
1236# CHECK-NEXT:                     0123456789          01234567
1237# CHECK-NEXT: Index     0123456789          0123456789
1238
1239# CHECK:      [0,0]     DeeeeeeeER.    .    .    .    .    . .   ld1	{ v1.h }[0], [x27], x28
1240# CHECK-NEXT: [0,1]     .D======eeeeeeeER   .    .    .    . .   ld1	{ v1.h }[4], [x27], x28
1241# CHECK-NEXT: [0,2]     . D============eeeeeeeER .    .    . .   ld1	{ v1.s }[0], [x27], #4
1242# CHECK-NEXT: [0,3]     .  D==================eeeeeeeER    . .   ld1	{ v1.s }[0], [x27], x28
1243# CHECK-NEXT: [0,4]     .   D========================eeeeeeeER   ld1	{ v1.d }[0], [x27], #8
1244
1245# CHECK:      Average Wait times (based on the timeline view):
1246# CHECK-NEXT: [0]: Executions
1247# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1248# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1249# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1250
1251# CHECK:            [0]    [1]    [2]    [3]
1252# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.h }[0], [x27], x28
1253# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld1	{ v1.h }[4], [x27], x28
1254# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld1	{ v1.s }[0], [x27], #4
1255# CHECK-NEXT: 3.     1     19.0   0.0    0.0       ld1	{ v1.s }[0], [x27], x28
1256# CHECK-NEXT: 4.     1     25.0   0.0    0.0       ld1	{ v1.d }[0], [x27], #8
1257# CHECK-NEXT:        1     13.0   0.2    0.0       <total>
1258
1259# CHECK:      [15] Code Region - G16
1260
1261# CHECK:      Iterations:        100
1262# CHECK-NEXT: Instructions:      500
1263# CHECK-NEXT: Total Cycles:      1103
1264# CHECK-NEXT: Total uOps:        1500
1265
1266# CHECK:      Dispatch Width:    4
1267# CHECK-NEXT: uOps Per Cycle:    1.36
1268# CHECK-NEXT: IPC:               0.45
1269# CHECK-NEXT: Block RThroughput: 3.8
1270
1271# CHECK:      Timeline view:
1272# CHECK-NEXT:                     0123
1273# CHECK-NEXT: Index     0123456789
1274
1275# CHECK:      [0,0]     DeeeeeeeER.  .   ld1	{ v1.d }[0], [x27], x28
1276# CHECK-NEXT: [0,1]     .DeeeeeeeER  .   ld1r	{ v1.1d }, [x27], #8
1277# CHECK-NEXT: [0,2]     . DeeeeeeeER .   ld1r	{ v1.2d }, [x27], #8
1278# CHECK-NEXT: [0,3]     .  DeeeeeeeER.   ld1r	{ v1.2s }, [x27], #4
1279# CHECK-NEXT: [0,4]     .   DeeeeeeeER   ld1r	{ v1.4h }, [x27], #2
1280
1281# CHECK:      Average Wait times (based on the timeline view):
1282# CHECK-NEXT: [0]: Executions
1283# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1284# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1285# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1286
1287# CHECK:            [0]    [1]    [2]    [3]
1288# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1	{ v1.d }[0], [x27], x28
1289# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1r	{ v1.1d }, [x27], #8
1290# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld1r	{ v1.2d }, [x27], #8
1291# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld1r	{ v1.2s }, [x27], #4
1292# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld1r	{ v1.4h }, [x27], #2
1293# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1294
1295# CHECK:      [16] Code Region - G17
1296
1297# CHECK:      Iterations:        100
1298# CHECK-NEXT: Instructions:      500
1299# CHECK-NEXT: Total Cycles:      509
1300# CHECK-NEXT: Total uOps:        1500
1301
1302# CHECK:      Dispatch Width:    4
1303# CHECK-NEXT: uOps Per Cycle:    2.95
1304# CHECK-NEXT: IPC:               0.98
1305# CHECK-NEXT: Block RThroughput: 3.8
1306
1307# CHECK:      Timeline view:
1308# CHECK-NEXT:                     0123
1309# CHECK-NEXT: Index     0123456789
1310
1311# CHECK:      [0,0]     DeeeeeeeER.  .   ld1r	{ v1.4s }, [x27], #4
1312# CHECK-NEXT: [0,1]     .DeeeeeeeER  .   ld1r	{ v1.8b }, [x27], #1
1313# CHECK-NEXT: [0,2]     . DeeeeeeeER .   ld1r	{ v1.8h }, [x27], #2
1314# CHECK-NEXT: [0,3]     .  DeeeeeeeER.   ld1r	{ v1.16b }, [x27], #1
1315# CHECK-NEXT: [0,4]     .   DeeeeeeeER   ld1r	{ v1.1d }, [x27], x28
1316
1317# CHECK:      Average Wait times (based on the timeline view):
1318# CHECK-NEXT: [0]: Executions
1319# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1320# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1321# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1322
1323# CHECK:            [0]    [1]    [2]    [3]
1324# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1r	{ v1.4s }, [x27], #4
1325# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1r	{ v1.8b }, [x27], #1
1326# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld1r	{ v1.8h }, [x27], #2
1327# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld1r	{ v1.16b }, [x27], #1
1328# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld1r	{ v1.1d }, [x27], x28
1329# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1330
1331# CHECK:      [17] Code Region - G18
1332
1333# CHECK:      Iterations:        100
1334# CHECK-NEXT: Instructions:      500
1335# CHECK-NEXT: Total Cycles:      509
1336# CHECK-NEXT: Total uOps:        1500
1337
1338# CHECK:      Dispatch Width:    4
1339# CHECK-NEXT: uOps Per Cycle:    2.95
1340# CHECK-NEXT: IPC:               0.98
1341# CHECK-NEXT: Block RThroughput: 3.8
1342
1343# CHECK:      Timeline view:
1344# CHECK-NEXT:                     0123
1345# CHECK-NEXT: Index     0123456789
1346
1347# CHECK:      [0,0]     DeeeeeeeER.  .   ld1r	{ v1.2d }, [x27], x28
1348# CHECK-NEXT: [0,1]     .DeeeeeeeER  .   ld1r	{ v1.2s }, [x27], x28
1349# CHECK-NEXT: [0,2]     . DeeeeeeeER .   ld1r	{ v1.4h }, [x27], x28
1350# CHECK-NEXT: [0,3]     .  DeeeeeeeER.   ld1r	{ v1.4s }, [x27], x28
1351# CHECK-NEXT: [0,4]     .   DeeeeeeeER   ld1r	{ v1.8b }, [x27], x28
1352
1353# CHECK:      Average Wait times (based on the timeline view):
1354# CHECK-NEXT: [0]: Executions
1355# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1356# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1357# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1358
1359# CHECK:            [0]    [1]    [2]    [3]
1360# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1r	{ v1.2d }, [x27], x28
1361# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1r	{ v1.2s }, [x27], x28
1362# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld1r	{ v1.4h }, [x27], x28
1363# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld1r	{ v1.4s }, [x27], x28
1364# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld1r	{ v1.8b }, [x27], x28
1365# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1366
1367# CHECK:      [18] Code Region - G19
1368
1369# CHECK:      Iterations:        100
1370# CHECK-NEXT: Instructions:      500
1371# CHECK-NEXT: Total Cycles:      509
1372# CHECK-NEXT: Total uOps:        1800
1373
1374# CHECK:      Dispatch Width:    4
1375# CHECK-NEXT: uOps Per Cycle:    3.54
1376# CHECK-NEXT: IPC:               0.98
1377# CHECK-NEXT: Block RThroughput: 4.5
1378
1379# CHECK:      Timeline view:
1380# CHECK-NEXT:                     0123
1381# CHECK-NEXT: Index     0123456789
1382
1383# CHECK:      [0,0]     DeeeeeeeER.  .   ld1r	{ v1.8h }, [x27], x28
1384# CHECK-NEXT: [0,1]     .DeeeeeeeER  .   ld1r	{ v1.16b }, [x27], x28
1385# CHECK-NEXT: [0,2]     . DeeeeeeeER .   ld2	{ v1.2d, v2.2d }, [x27], #32
1386# CHECK-NEXT: [0,3]     .  DeeeeeeeER.   ld2	{ v1.2s, v2.2s }, [x27], #16
1387# CHECK-NEXT: [0,4]     .   DeeeeeeeER   ld2	{ v1.4h, v2.4h }, [x27], #16
1388
1389# CHECK:      Average Wait times (based on the timeline view):
1390# CHECK-NEXT: [0]: Executions
1391# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1392# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1393# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1394
1395# CHECK:            [0]    [1]    [2]    [3]
1396# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld1r	{ v1.8h }, [x27], x28
1397# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld1r	{ v1.16b }, [x27], x28
1398# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld2	{ v1.2d, v2.2d }, [x27], #32
1399# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld2	{ v1.2s, v2.2s }, [x27], #16
1400# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld2	{ v1.4h, v2.4h }, [x27], #16
1401# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1402
1403# CHECK:      [19] Code Region - G20
1404
1405# CHECK:      Iterations:        100
1406# CHECK-NEXT: Instructions:      500
1407# CHECK-NEXT: Total Cycles:      509
1408# CHECK-NEXT: Total uOps:        2000
1409
1410# CHECK:      Dispatch Width:    4
1411# CHECK-NEXT: uOps Per Cycle:    3.93
1412# CHECK-NEXT: IPC:               0.98
1413# CHECK-NEXT: Block RThroughput: 5.0
1414
1415# CHECK:      Timeline view:
1416# CHECK-NEXT:                     0123
1417# CHECK-NEXT: Index     0123456789
1418
1419# CHECK:      [0,0]     DeeeeeeeER.  .   ld2	{ v1.4s, v2.4s }, [x27], #32
1420# CHECK-NEXT: [0,1]     .DeeeeeeeER  .   ld2	{ v1.8b, v2.8b }, [x27], #16
1421# CHECK-NEXT: [0,2]     . DeeeeeeeER .   ld2	{ v1.8h, v2.8h }, [x27], #32
1422# CHECK-NEXT: [0,3]     .  DeeeeeeeER.   ld2	{ v1.16b, v2.16b }, [x27], #32
1423# CHECK-NEXT: [0,4]     .   DeeeeeeeER   ld2	{ v1.2d, v2.2d }, [x27], x28
1424
1425# CHECK:      Average Wait times (based on the timeline view):
1426# CHECK-NEXT: [0]: Executions
1427# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1428# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1429# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1430
1431# CHECK:            [0]    [1]    [2]    [3]
1432# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld2	{ v1.4s, v2.4s }, [x27], #32
1433# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld2	{ v1.8b, v2.8b }, [x27], #16
1434# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld2	{ v1.8h, v2.8h }, [x27], #32
1435# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld2	{ v1.16b, v2.16b }, [x27], #32
1436# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld2	{ v1.2d, v2.2d }, [x27], x28
1437# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1438
1439# CHECK:      [20] Code Region - G21
1440
1441# CHECK:      Iterations:        100
1442# CHECK-NEXT: Instructions:      500
1443# CHECK-NEXT: Total Cycles:      509
1444# CHECK-NEXT: Total uOps:        2000
1445
1446# CHECK:      Dispatch Width:    4
1447# CHECK-NEXT: uOps Per Cycle:    3.93
1448# CHECK-NEXT: IPC:               0.98
1449# CHECK-NEXT: Block RThroughput: 5.0
1450
1451# CHECK:      Timeline view:
1452# CHECK-NEXT:                     0123
1453# CHECK-NEXT: Index     0123456789
1454
1455# CHECK:      [0,0]     DeeeeeeeER.  .   ld2	{ v1.2s, v2.2s }, [x27], x28
1456# CHECK-NEXT: [0,1]     .DeeeeeeeER  .   ld2	{ v1.4h, v2.4h }, [x27], x28
1457# CHECK-NEXT: [0,2]     . DeeeeeeeER .   ld2	{ v1.4s, v2.4s }, [x27], x28
1458# CHECK-NEXT: [0,3]     .  DeeeeeeeER.   ld2	{ v1.8b, v2.8b }, [x27], x28
1459# CHECK-NEXT: [0,4]     .   DeeeeeeeER   ld2	{ v1.8h, v2.8h }, [x27], x28
1460
1461# CHECK:      Average Wait times (based on the timeline view):
1462# CHECK-NEXT: [0]: Executions
1463# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1464# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1465# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1466
1467# CHECK:            [0]    [1]    [2]    [3]
1468# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld2	{ v1.2s, v2.2s }, [x27], x28
1469# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld2	{ v1.4h, v2.4h }, [x27], x28
1470# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld2	{ v1.4s, v2.4s }, [x27], x28
1471# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld2	{ v1.8b, v2.8b }, [x27], x28
1472# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld2	{ v1.8h, v2.8h }, [x27], x28
1473# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1474
1475# CHECK:      [21] Code Region - G22
1476
1477# CHECK:      Iterations:        100
1478# CHECK-NEXT: Instructions:      500
1479# CHECK-NEXT: Total Cycles:      2909
1480# CHECK-NEXT: Total uOps:        2000
1481
1482# CHECK:      Dispatch Width:    4
1483# CHECK-NEXT: uOps Per Cycle:    0.69
1484# CHECK-NEXT: IPC:               0.17
1485# CHECK-NEXT: Block RThroughput: 5.0
1486
1487# CHECK:      Timeline view:
1488# CHECK-NEXT:                     0123456789          01234567
1489# CHECK-NEXT: Index     0123456789          0123456789
1490
1491# CHECK:      [0,0]     DeeeeeeeER.    .    .    .    .    . .   ld2	{ v1.16b, v2.16b }, [x27], x28
1492# CHECK-NEXT: [0,1]     .D======eeeeeeeER   .    .    .    . .   ld2	{ v1.b, v2.b }[0], [x27], #2
1493# CHECK-NEXT: [0,2]     . D============eeeeeeeER .    .    . .   ld2	{ v1.b, v2.b }[8], [x27], #2
1494# CHECK-NEXT: [0,3]     .  D==================eeeeeeeER    . .   ld2	{ v1.b, v2.b }[0], [x27], x28
1495# CHECK-NEXT: [0,4]     .   D========================eeeeeeeER   ld2	{ v1.b, v2.b }[8], [x27], x28
1496
1497# CHECK:      Average Wait times (based on the timeline view):
1498# CHECK-NEXT: [0]: Executions
1499# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1500# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1501# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1502
1503# CHECK:            [0]    [1]    [2]    [3]
1504# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld2	{ v1.16b, v2.16b }, [x27], x28
1505# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld2	{ v1.b, v2.b }[0], [x27], #2
1506# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld2	{ v1.b, v2.b }[8], [x27], #2
1507# CHECK-NEXT: 3.     1     19.0   0.0    0.0       ld2	{ v1.b, v2.b }[0], [x27], x28
1508# CHECK-NEXT: 4.     1     25.0   0.0    0.0       ld2	{ v1.b, v2.b }[8], [x27], x28
1509# CHECK-NEXT:        1     13.0   0.2    0.0       <total>
1510
1511# CHECK:      [22] Code Region - G23
1512
1513# CHECK:      Iterations:        100
1514# CHECK-NEXT: Instructions:      500
1515# CHECK-NEXT: Total Cycles:      3503
1516# CHECK-NEXT: Total uOps:        2000
1517
1518# CHECK:      Dispatch Width:    4
1519# CHECK-NEXT: uOps Per Cycle:    0.57
1520# CHECK-NEXT: IPC:               0.14
1521# CHECK-NEXT: Block RThroughput: 5.0
1522
1523# CHECK:      Timeline view:
1524# CHECK-NEXT:                     0123456789          01234567
1525# CHECK-NEXT: Index     0123456789          0123456789
1526
1527# CHECK:      [0,0]     DeeeeeeeER.    .    .    .    .    . .   ld2	{ v1.h, v2.h }[0], [x27], #4
1528# CHECK-NEXT: [0,1]     .D======eeeeeeeER   .    .    .    . .   ld2	{ v1.h, v2.h }[4], [x27], #4
1529# CHECK-NEXT: [0,2]     . D============eeeeeeeER .    .    . .   ld2	{ v1.h, v2.h }[0], [x27], x28
1530# CHECK-NEXT: [0,3]     .  D==================eeeeeeeER    . .   ld2	{ v1.h, v2.h }[4], [x27], x28
1531# CHECK-NEXT: [0,4]     .   D========================eeeeeeeER   ld2	{ v1.s, v2.s }[0], [x27], #8
1532
1533# CHECK:      Average Wait times (based on the timeline view):
1534# CHECK-NEXT: [0]: Executions
1535# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1536# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1537# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1538
1539# CHECK:            [0]    [1]    [2]    [3]
1540# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld2	{ v1.h, v2.h }[0], [x27], #4
1541# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld2	{ v1.h, v2.h }[4], [x27], #4
1542# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld2	{ v1.h, v2.h }[0], [x27], x28
1543# CHECK-NEXT: 3.     1     19.0   0.0    0.0       ld2	{ v1.h, v2.h }[4], [x27], x28
1544# CHECK-NEXT: 4.     1     25.0   0.0    0.0       ld2	{ v1.s, v2.s }[0], [x27], #8
1545# CHECK-NEXT:        1     13.0   0.2    0.0       <total>
1546
1547# CHECK:      [23] Code Region - G24
1548
1549# CHECK:      Iterations:        100
1550# CHECK-NEXT: Instructions:      500
1551# CHECK-NEXT: Total Cycles:      2303
1552# CHECK-NEXT: Total uOps:        2000
1553
1554# CHECK:      Dispatch Width:    4
1555# CHECK-NEXT: uOps Per Cycle:    0.87
1556# CHECK-NEXT: IPC:               0.22
1557# CHECK-NEXT: Block RThroughput: 5.0
1558
1559# CHECK:      Timeline view:
1560# CHECK-NEXT:                     0123456789
1561# CHECK-NEXT: Index     0123456789          012345
1562
1563# CHECK:      [0,0]     DeeeeeeeER.    .    .    .   ld2	{ v1.s, v2.s }[0], [x27], x28
1564# CHECK-NEXT: [0,1]     .D======eeeeeeeER   .    .   ld2	{ v1.d, v2.d }[0], [x27], #16
1565# CHECK-NEXT: [0,2]     . D============eeeeeeeER .   ld2	{ v1.d, v2.d }[0], [x27], x28
1566# CHECK-NEXT: [0,3]     .  D============eeeeeeeER.   ld2r	{ v1.1d, v2.1d }, [x27], #16
1567# CHECK-NEXT: [0,4]     .   D============eeeeeeeER   ld2r	{ v1.2d, v2.2d }, [x27], #16
1568
1569# CHECK:      Average Wait times (based on the timeline view):
1570# CHECK-NEXT: [0]: Executions
1571# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1572# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1573# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1574
1575# CHECK:            [0]    [1]    [2]    [3]
1576# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld2	{ v1.s, v2.s }[0], [x27], x28
1577# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld2	{ v1.d, v2.d }[0], [x27], #16
1578# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld2	{ v1.d, v2.d }[0], [x27], x28
1579# CHECK-NEXT: 3.     1     13.0   0.0    0.0       ld2r	{ v1.1d, v2.1d }, [x27], #16
1580# CHECK-NEXT: 4.     1     13.0   0.0    0.0       ld2r	{ v1.2d, v2.2d }, [x27], #16
1581# CHECK-NEXT:        1     9.4    0.2    0.0       <total>
1582
1583# CHECK:      [24] Code Region - G25
1584
1585# CHECK:      Iterations:        100
1586# CHECK-NEXT: Instructions:      500
1587# CHECK-NEXT: Total Cycles:      509
1588# CHECK-NEXT: Total uOps:        2000
1589
1590# CHECK:      Dispatch Width:    4
1591# CHECK-NEXT: uOps Per Cycle:    3.93
1592# CHECK-NEXT: IPC:               0.98
1593# CHECK-NEXT: Block RThroughput: 5.0
1594
1595# CHECK:      Timeline view:
1596# CHECK-NEXT:                     0123
1597# CHECK-NEXT: Index     0123456789
1598
1599# CHECK:      [0,0]     DeeeeeeeER.  .   ld2r	{ v1.2s, v2.2s }, [x27], #8
1600# CHECK-NEXT: [0,1]     .DeeeeeeeER  .   ld2r	{ v1.4h, v2.4h }, [x27], #4
1601# CHECK-NEXT: [0,2]     . DeeeeeeeER .   ld2r	{ v1.4s, v2.4s }, [x27], #8
1602# CHECK-NEXT: [0,3]     .  DeeeeeeeER.   ld2r	{ v1.8b, v2.8b }, [x27], #2
1603# CHECK-NEXT: [0,4]     .   DeeeeeeeER   ld2r	{ v1.8h, v2.8h }, [x27], #4
1604
1605# CHECK:      Average Wait times (based on the timeline view):
1606# CHECK-NEXT: [0]: Executions
1607# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1608# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1609# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1610
1611# CHECK:            [0]    [1]    [2]    [3]
1612# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld2r	{ v1.2s, v2.2s }, [x27], #8
1613# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld2r	{ v1.4h, v2.4h }, [x27], #4
1614# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld2r	{ v1.4s, v2.4s }, [x27], #8
1615# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld2r	{ v1.8b, v2.8b }, [x27], #2
1616# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld2r	{ v1.8h, v2.8h }, [x27], #4
1617# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1618
1619# CHECK:      [25] Code Region - G26
1620
1621# CHECK:      Iterations:        100
1622# CHECK-NEXT: Instructions:      500
1623# CHECK-NEXT: Total Cycles:      509
1624# CHECK-NEXT: Total uOps:        2000
1625
1626# CHECK:      Dispatch Width:    4
1627# CHECK-NEXT: uOps Per Cycle:    3.93
1628# CHECK-NEXT: IPC:               0.98
1629# CHECK-NEXT: Block RThroughput: 5.0
1630
1631# CHECK:      Timeline view:
1632# CHECK-NEXT:                     0123
1633# CHECK-NEXT: Index     0123456789
1634
1635# CHECK:      [0,0]     DeeeeeeeER.  .   ld2r	{ v1.16b, v2.16b }, [x27], #2
1636# CHECK-NEXT: [0,1]     .DeeeeeeeER  .   ld2r	{ v1.1d, v2.1d }, [x27], x28
1637# CHECK-NEXT: [0,2]     . DeeeeeeeER .   ld2r	{ v1.2d, v2.2d }, [x27], x28
1638# CHECK-NEXT: [0,3]     .  DeeeeeeeER.   ld2r	{ v1.2s, v2.2s }, [x27], x28
1639# CHECK-NEXT: [0,4]     .   DeeeeeeeER   ld2r	{ v1.4h, v2.4h }, [x27], x28
1640
1641# CHECK:      Average Wait times (based on the timeline view):
1642# CHECK-NEXT: [0]: Executions
1643# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1644# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1645# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1646
1647# CHECK:            [0]    [1]    [2]    [3]
1648# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld2r	{ v1.16b, v2.16b }, [x27], #2
1649# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld2r	{ v1.1d, v2.1d }, [x27], x28
1650# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld2r	{ v1.2d, v2.2d }, [x27], x28
1651# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld2r	{ v1.2s, v2.2s }, [x27], x28
1652# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld2r	{ v1.4h, v2.4h }, [x27], x28
1653# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1654
1655# CHECK:      [26] Code Region - G27
1656
1657# CHECK:      Iterations:        100
1658# CHECK-NEXT: Instructions:      500
1659# CHECK-NEXT: Total Cycles:      609
1660# CHECK-NEXT: Total uOps:        2100
1661
1662# CHECK:      Dispatch Width:    4
1663# CHECK-NEXT: uOps Per Cycle:    3.45
1664# CHECK-NEXT: IPC:               0.82
1665# CHECK-NEXT: Block RThroughput: 5.5
1666
1667# CHECK:      Timeline view:
1668# CHECK-NEXT:                     01234
1669# CHECK-NEXT: Index     0123456789
1670
1671# CHECK:      [0,0]     DeeeeeeeER.   .   ld2r	{ v1.4s, v2.4s }, [x27], x28
1672# CHECK-NEXT: [0,1]     .DeeeeeeeER   .   ld2r	{ v1.8b, v2.8b }, [x27], x28
1673# CHECK-NEXT: [0,2]     . DeeeeeeeER  .   ld2r	{ v1.8h, v2.8h }, [x27], x28
1674# CHECK-NEXT: [0,3]     .  DeeeeeeeER .   ld2r	{ v1.16b, v2.16b }, [x27], x28
1675# CHECK-NEXT: [0,4]     .   DeeeeeeeeER   ld3	{ v1.2d, v2.2d, v3.2d }, [x27], #48
1676
1677# CHECK:      Average Wait times (based on the timeline view):
1678# CHECK-NEXT: [0]: Executions
1679# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1680# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1681# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1682
1683# CHECK:            [0]    [1]    [2]    [3]
1684# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld2r	{ v1.4s, v2.4s }, [x27], x28
1685# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ld2r	{ v1.8b, v2.8b }, [x27], x28
1686# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ld2r	{ v1.8h, v2.8h }, [x27], x28
1687# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ld2r	{ v1.16b, v2.16b }, [x27], x28
1688# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ld3	{ v1.2d, v2.2d, v3.2d }, [x27], #48
1689# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
1690
1691# CHECK:      [27] Code Region - G28
1692
1693# CHECK:      Iterations:        100
1694# CHECK-NEXT: Instructions:      500
1695# CHECK-NEXT: Total Cycles:      1009
1696# CHECK-NEXT: Total uOps:        2500
1697
1698# CHECK:      Dispatch Width:    4
1699# CHECK-NEXT: uOps Per Cycle:    2.48
1700# CHECK-NEXT: IPC:               0.50
1701# CHECK-NEXT: Block RThroughput: 7.5
1702
1703# CHECK:      Timeline view:
1704# CHECK-NEXT:                     012345678
1705# CHECK-NEXT: Index     0123456789
1706
1707# CHECK:      [0,0]     DeeeeeeeeER    .  .   ld3	{ v1.2s, v2.2s, v3.2s }, [x27], #24
1708# CHECK-NEXT: [0,1]     . DeeeeeeeeER  .  .   ld3	{ v1.4h, v2.4h, v3.4h }, [x27], #24
1709# CHECK-NEXT: [0,2]     .   DeeeeeeeeER.  .   ld3	{ v1.4s, v2.4s, v3.4s }, [x27], #48
1710# CHECK-NEXT: [0,3]     .    .DeeeeeeeeER .   ld3	{ v1.8b, v2.8b, v3.8b }, [x27], #24
1711# CHECK-NEXT: [0,4]     .    .  DeeeeeeeeER   ld3	{ v1.8h, v2.8h, v3.8h }, [x27], #48
1712
1713# CHECK:      Average Wait times (based on the timeline view):
1714# CHECK-NEXT: [0]: Executions
1715# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1716# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1717# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1718
1719# CHECK:            [0]    [1]    [2]    [3]
1720# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3	{ v1.2s, v2.2s, v3.2s }, [x27], #24
1721# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld3	{ v1.4h, v2.4h, v3.4h }, [x27], #24
1722# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld3	{ v1.4s, v2.4s, v3.4s }, [x27], #48
1723# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld3	{ v1.8b, v2.8b, v3.8b }, [x27], #24
1724# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld3	{ v1.8h, v2.8h, v3.8h }, [x27], #48
1725# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
1726
1727# CHECK:      [28] Code Region - G29
1728
1729# CHECK:      Iterations:        100
1730# CHECK-NEXT: Instructions:      500
1731# CHECK-NEXT: Total Cycles:      1009
1732# CHECK-NEXT: Total uOps:        2500
1733
1734# CHECK:      Dispatch Width:    4
1735# CHECK-NEXT: uOps Per Cycle:    2.48
1736# CHECK-NEXT: IPC:               0.50
1737# CHECK-NEXT: Block RThroughput: 7.5
1738
1739# CHECK:      Timeline view:
1740# CHECK-NEXT:                     012345678
1741# CHECK-NEXT: Index     0123456789
1742
1743# CHECK:      [0,0]     DeeeeeeeeER    .  .   ld3	{ v1.16b, v2.16b, v3.16b }, [x27], #48
1744# CHECK-NEXT: [0,1]     . DeeeeeeeeER  .  .   ld3	{ v1.2d, v2.2d, v3.2d }, [x27], x28
1745# CHECK-NEXT: [0,2]     .   DeeeeeeeeER.  .   ld3	{ v1.2s, v2.2s, v3.2s }, [x27], x28
1746# CHECK-NEXT: [0,3]     .    .DeeeeeeeeER .   ld3	{ v1.4h, v2.4h, v3.4h }, [x27], x28
1747# CHECK-NEXT: [0,4]     .    .  DeeeeeeeeER   ld3	{ v1.4s, v2.4s, v3.4s }, [x27], x28
1748
1749# CHECK:      Average Wait times (based on the timeline view):
1750# CHECK-NEXT: [0]: Executions
1751# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1752# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1753# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1754
1755# CHECK:            [0]    [1]    [2]    [3]
1756# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3	{ v1.16b, v2.16b, v3.16b }, [x27], #48
1757# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld3	{ v1.2d, v2.2d, v3.2d }, [x27], x28
1758# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld3	{ v1.2s, v2.2s, v3.2s }, [x27], x28
1759# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld3	{ v1.4h, v2.4h, v3.4h }, [x27], x28
1760# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld3	{ v1.4s, v2.4s, v3.4s }, [x27], x28
1761# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
1762
1763# CHECK:      [29] Code Region - G30
1764
1765# CHECK:      Iterations:        100
1766# CHECK-NEXT: Instructions:      500
1767# CHECK-NEXT: Total Cycles:      2011
1768# CHECK-NEXT: Total uOps:        2500
1769
1770# CHECK:      Dispatch Width:    4
1771# CHECK-NEXT: uOps Per Cycle:    1.24
1772# CHECK-NEXT: IPC:               0.25
1773# CHECK-NEXT: Block RThroughput: 7.5
1774
1775# CHECK:      Timeline view:
1776# CHECK-NEXT:                     0123456789          0
1777# CHECK-NEXT: Index     0123456789          0123456789
1778
1779# CHECK:      [0,0]     DeeeeeeeeER    .    .    .    .   ld3	{ v1.8b, v2.8b, v3.8b }, [x27], x28
1780# CHECK-NEXT: [0,1]     . DeeeeeeeeER  .    .    .    .   ld3	{ v1.8h, v2.8h, v3.8h }, [x27], x28
1781# CHECK-NEXT: [0,2]     .   DeeeeeeeeER.    .    .    .   ld3	{ v1.16b, v2.16b, v3.16b }, [x27], x28
1782# CHECK-NEXT: [0,3]     .    .D======eeeeeeeeER  .    .   ld3	{ v1.b, v2.b, v3.b }[0], [x27], #3
1783# CHECK-NEXT: [0,4]     .    .  D============eeeeeeeeER   ld3	{ v1.b, v2.b, v3.b }[8], [x27], #3
1784
1785# CHECK:      Average Wait times (based on the timeline view):
1786# CHECK-NEXT: [0]: Executions
1787# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1788# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1789# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1790
1791# CHECK:            [0]    [1]    [2]    [3]
1792# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3	{ v1.8b, v2.8b, v3.8b }, [x27], x28
1793# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld3	{ v1.8h, v2.8h, v3.8h }, [x27], x28
1794# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld3	{ v1.16b, v2.16b, v3.16b }, [x27], x28
1795# CHECK-NEXT: 3.     1     7.0    0.0    0.0       ld3	{ v1.b, v2.b, v3.b }[0], [x27], #3
1796# CHECK-NEXT: 4.     1     13.0   0.0    0.0       ld3	{ v1.b, v2.b, v3.b }[8], [x27], #3
1797# CHECK-NEXT:        1     4.6    0.6    0.0       <total>
1798
1799# CHECK:      [30] Code Region - G31
1800
1801# CHECK:      Iterations:        100
1802# CHECK-NEXT: Instructions:      500
1803# CHECK-NEXT: Total Cycles:      4003
1804# CHECK-NEXT: Total uOps:        2500
1805
1806# CHECK:      Dispatch Width:    4
1807# CHECK-NEXT: uOps Per Cycle:    0.62
1808# CHECK-NEXT: IPC:               0.12
1809# CHECK-NEXT: Block RThroughput: 7.5
1810
1811# CHECK:      Timeline view:
1812# CHECK-NEXT:                     0123456789          0123456789
1813# CHECK-NEXT: Index     0123456789          0123456789          012
1814
1815# CHECK:      [0,0]     DeeeeeeeeER    .    .    .    .    .    . .   ld3	{ v1.b, v2.b, v3.b }[0], [x27], x28
1816# CHECK-NEXT: [0,1]     . D======eeeeeeeeER .    .    .    .    . .   ld3	{ v1.b, v2.b, v3.b }[8], [x27], x28
1817# CHECK-NEXT: [0,2]     .   D============eeeeeeeeER   .    .    . .   ld3	{ v1.h, v2.h, v3.h }[0], [x27], #6
1818# CHECK-NEXT: [0,3]     .    .D==================eeeeeeeeER.    . .   ld3	{ v1.h, v2.h, v3.h }[4], [x27], #6
1819# CHECK-NEXT: [0,4]     .    .  D========================eeeeeeeeER   ld3	{ v1.h, v2.h, v3.h }[0], [x27], x28
1820
1821# CHECK:      Average Wait times (based on the timeline view):
1822# CHECK-NEXT: [0]: Executions
1823# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1824# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1825# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1826
1827# CHECK:            [0]    [1]    [2]    [3]
1828# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3	{ v1.b, v2.b, v3.b }[0], [x27], x28
1829# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld3	{ v1.b, v2.b, v3.b }[8], [x27], x28
1830# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld3	{ v1.h, v2.h, v3.h }[0], [x27], #6
1831# CHECK-NEXT: 3.     1     19.0   0.0    0.0       ld3	{ v1.h, v2.h, v3.h }[4], [x27], #6
1832# CHECK-NEXT: 4.     1     25.0   0.0    0.0       ld3	{ v1.h, v2.h, v3.h }[0], [x27], x28
1833# CHECK-NEXT:        1     13.0   0.2    0.0       <total>
1834
1835# CHECK:      [31] Code Region - G32
1836
1837# CHECK:      Iterations:        100
1838# CHECK-NEXT: Instructions:      500
1839# CHECK-NEXT: Total Cycles:      4003
1840# CHECK-NEXT: Total uOps:        2500
1841
1842# CHECK:      Dispatch Width:    4
1843# CHECK-NEXT: uOps Per Cycle:    0.62
1844# CHECK-NEXT: IPC:               0.12
1845# CHECK-NEXT: Block RThroughput: 7.5
1846
1847# CHECK:      Timeline view:
1848# CHECK-NEXT:                     0123456789          0123456789
1849# CHECK-NEXT: Index     0123456789          0123456789          012
1850
1851# CHECK:      [0,0]     DeeeeeeeeER    .    .    .    .    .    . .   ld3	{ v1.h, v2.h, v3.h }[4], [x27], x28
1852# CHECK-NEXT: [0,1]     . D======eeeeeeeeER .    .    .    .    . .   ld3	{ v1.s, v2.s, v3.s }[0], [x27], #12
1853# CHECK-NEXT: [0,2]     .   D============eeeeeeeeER   .    .    . .   ld3	{ v1.s, v2.s, v3.s }[0], [x27], x28
1854# CHECK-NEXT: [0,3]     .    .D==================eeeeeeeeER.    . .   ld3	{ v1.d, v2.d, v3.d }[0], [x27], #24
1855# CHECK-NEXT: [0,4]     .    .  D========================eeeeeeeeER   ld3	{ v1.d, v2.d, v3.d }[0], [x27], x28
1856
1857# CHECK:      Average Wait times (based on the timeline view):
1858# CHECK-NEXT: [0]: Executions
1859# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1860# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1861# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1862
1863# CHECK:            [0]    [1]    [2]    [3]
1864# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3	{ v1.h, v2.h, v3.h }[4], [x27], x28
1865# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld3	{ v1.s, v2.s, v3.s }[0], [x27], #12
1866# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld3	{ v1.s, v2.s, v3.s }[0], [x27], x28
1867# CHECK-NEXT: 3.     1     19.0   0.0    0.0       ld3	{ v1.d, v2.d, v3.d }[0], [x27], #24
1868# CHECK-NEXT: 4.     1     25.0   0.0    0.0       ld3	{ v1.d, v2.d, v3.d }[0], [x27], x28
1869# CHECK-NEXT:        1     13.0   0.2    0.0       <total>
1870
1871# CHECK:      [32] Code Region - G33
1872
1873# CHECK:      Iterations:        100
1874# CHECK-NEXT: Instructions:      500
1875# CHECK-NEXT: Total Cycles:      1009
1876# CHECK-NEXT: Total uOps:        2500
1877
1878# CHECK:      Dispatch Width:    4
1879# CHECK-NEXT: uOps Per Cycle:    2.48
1880# CHECK-NEXT: IPC:               0.50
1881# CHECK-NEXT: Block RThroughput: 7.5
1882
1883# CHECK:      Timeline view:
1884# CHECK-NEXT:                     012345678
1885# CHECK-NEXT: Index     0123456789
1886
1887# CHECK:      [0,0]     DeeeeeeeeER    .  .   ld3r	{ v1.1d, v2.1d, v3.1d }, [x27], #24
1888# CHECK-NEXT: [0,1]     . DeeeeeeeeER  .  .   ld3r	{ v1.2d, v2.2d, v3.2d }, [x27], #24
1889# CHECK-NEXT: [0,2]     .   DeeeeeeeeER.  .   ld3r	{ v1.2s, v2.2s, v3.2s }, [x27], #12
1890# CHECK-NEXT: [0,3]     .    .DeeeeeeeeER .   ld3r	{ v1.4h, v2.4h, v3.4h }, [x27], #6
1891# CHECK-NEXT: [0,4]     .    .  DeeeeeeeeER   ld3r	{ v1.4s, v2.4s, v3.4s }, [x27], #12
1892
1893# CHECK:      Average Wait times (based on the timeline view):
1894# CHECK-NEXT: [0]: Executions
1895# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1896# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1897# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1898
1899# CHECK:            [0]    [1]    [2]    [3]
1900# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3r	{ v1.1d, v2.1d, v3.1d }, [x27], #24
1901# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld3r	{ v1.2d, v2.2d, v3.2d }, [x27], #24
1902# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld3r	{ v1.2s, v2.2s, v3.2s }, [x27], #12
1903# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld3r	{ v1.4h, v2.4h, v3.4h }, [x27], #6
1904# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld3r	{ v1.4s, v2.4s, v3.4s }, [x27], #12
1905# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
1906
1907# CHECK:      [33] Code Region - G34
1908
1909# CHECK:      Iterations:        100
1910# CHECK-NEXT: Instructions:      500
1911# CHECK-NEXT: Total Cycles:      1009
1912# CHECK-NEXT: Total uOps:        2500
1913
1914# CHECK:      Dispatch Width:    4
1915# CHECK-NEXT: uOps Per Cycle:    2.48
1916# CHECK-NEXT: IPC:               0.50
1917# CHECK-NEXT: Block RThroughput: 7.5
1918
1919# CHECK:      Timeline view:
1920# CHECK-NEXT:                     012345678
1921# CHECK-NEXT: Index     0123456789
1922
1923# CHECK:      [0,0]     DeeeeeeeeER    .  .   ld3r	{ v1.8b, v2.8b, v3.8b }, [x27], #3
1924# CHECK-NEXT: [0,1]     . DeeeeeeeeER  .  .   ld3r	{ v1.8h, v2.8h, v3.8h }, [x27], #6
1925# CHECK-NEXT: [0,2]     .   DeeeeeeeeER.  .   ld3r	{ v1.16b, v2.16b, v3.16b }, [x27], #3
1926# CHECK-NEXT: [0,3]     .    .DeeeeeeeeER .   ld3r	{ v1.1d, v2.1d, v3.1d }, [x27], x28
1927# CHECK-NEXT: [0,4]     .    .  DeeeeeeeeER   ld3r	{ v1.2d, v2.2d, v3.2d }, [x27], x28
1928
1929# CHECK:      Average Wait times (based on the timeline view):
1930# CHECK-NEXT: [0]: Executions
1931# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1932# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1933# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1934
1935# CHECK:            [0]    [1]    [2]    [3]
1936# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3r	{ v1.8b, v2.8b, v3.8b }, [x27], #3
1937# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld3r	{ v1.8h, v2.8h, v3.8h }, [x27], #6
1938# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld3r	{ v1.16b, v2.16b, v3.16b }, [x27], #3
1939# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld3r	{ v1.1d, v2.1d, v3.1d }, [x27], x28
1940# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld3r	{ v1.2d, v2.2d, v3.2d }, [x27], x28
1941# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
1942
1943# CHECK:      [34] Code Region - G35
1944
1945# CHECK:      Iterations:        100
1946# CHECK-NEXT: Instructions:      500
1947# CHECK-NEXT: Total Cycles:      1009
1948# CHECK-NEXT: Total uOps:        2500
1949
1950# CHECK:      Dispatch Width:    4
1951# CHECK-NEXT: uOps Per Cycle:    2.48
1952# CHECK-NEXT: IPC:               0.50
1953# CHECK-NEXT: Block RThroughput: 7.5
1954
1955# CHECK:      Timeline view:
1956# CHECK-NEXT:                     012345678
1957# CHECK-NEXT: Index     0123456789
1958
1959# CHECK:      [0,0]     DeeeeeeeeER    .  .   ld3r	{ v1.2s, v2.2s, v3.2s }, [x27], x28
1960# CHECK-NEXT: [0,1]     . DeeeeeeeeER  .  .   ld3r	{ v1.4h, v2.4h, v3.4h }, [x27], x28
1961# CHECK-NEXT: [0,2]     .   DeeeeeeeeER.  .   ld3r	{ v1.4s, v2.4s, v3.4s }, [x27], x28
1962# CHECK-NEXT: [0,3]     .    .DeeeeeeeeER .   ld3r	{ v1.8b, v2.8b, v3.8b }, [x27], x28
1963# CHECK-NEXT: [0,4]     .    .  DeeeeeeeeER   ld3r	{ v1.8h, v2.8h, v3.8h }, [x27], x28
1964
1965# CHECK:      Average Wait times (based on the timeline view):
1966# CHECK-NEXT: [0]: Executions
1967# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
1968# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
1969# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
1970
1971# CHECK:            [0]    [1]    [2]    [3]
1972# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3r	{ v1.2s, v2.2s, v3.2s }, [x27], x28
1973# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld3r	{ v1.4h, v2.4h, v3.4h }, [x27], x28
1974# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld3r	{ v1.4s, v2.4s, v3.4s }, [x27], x28
1975# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld3r	{ v1.8b, v2.8b, v3.8b }, [x27], x28
1976# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld3r	{ v1.8h, v2.8h, v3.8h }, [x27], x28
1977# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
1978
1979# CHECK:      [35] Code Region - G36
1980
1981# CHECK:      Iterations:        100
1982# CHECK-NEXT: Instructions:      500
1983# CHECK-NEXT: Total Cycles:      1410
1984# CHECK-NEXT: Total uOps:        4100
1985
1986# CHECK:      Dispatch Width:    4
1987# CHECK-NEXT: uOps Per Cycle:    2.91
1988# CHECK-NEXT: IPC:               0.35
1989# CHECK-NEXT: Block RThroughput: 10.3
1990
1991# CHECK:      Timeline view:
1992# CHECK-NEXT:                     0123456789
1993# CHECK-NEXT: Index     0123456789          0123
1994
1995# CHECK:      [0,0]     DeeeeeeeeER    .    .  .   ld3r	{ v1.16b, v2.16b, v3.16b }, [x27], x28
1996# CHECK-NEXT: [0,1]     . DeeeeeeeeeeER.    .  .   ld4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
1997# CHECK-NEXT: [0,2]     .    DeeeeeeeeeeER  .  .   ld4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
1998# CHECK-NEXT: [0,3]     .    .  DeeeeeeeeeeER  .   ld4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
1999# CHECK-NEXT: [0,4]     .    .    .DeeeeeeeeeeER   ld4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
2000
2001# CHECK:      Average Wait times (based on the timeline view):
2002# CHECK-NEXT: [0]: Executions
2003# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2004# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2005# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2006
2007# CHECK:            [0]    [1]    [2]    [3]
2008# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld3r	{ v1.16b, v2.16b, v3.16b }, [x27], x28
2009# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
2010# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
2011# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
2012# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
2013# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
2014
2015# CHECK:      [36] Code Region - G37
2016
2017# CHECK:      Iterations:        100
2018# CHECK-NEXT: Instructions:      500
2019# CHECK-NEXT: Total Cycles:      1510
2020# CHECK-NEXT: Total uOps:        4500
2021
2022# CHECK:      Dispatch Width:    4
2023# CHECK-NEXT: uOps Per Cycle:    2.98
2024# CHECK-NEXT: IPC:               0.33
2025# CHECK-NEXT: Block RThroughput: 11.3
2026
2027# CHECK:      Timeline view:
2028# CHECK-NEXT:                     0123456789
2029# CHECK-NEXT: Index     0123456789          01234
2030
2031# CHECK:      [0,0]     DeeeeeeeeeeER  .    .   .   ld4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
2032# CHECK-NEXT: [0,1]     .  DeeeeeeeeeeER    .   .   ld4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
2033# CHECK-NEXT: [0,2]     .    .DeeeeeeeeeeER .   .   ld4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
2034# CHECK-NEXT: [0,3]     .    .   DeeeeeeeeeeER  .   ld4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
2035# CHECK-NEXT: [0,4]     .    .    . DeeeeeeeeeeER   ld4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
2036
2037# CHECK:      Average Wait times (based on the timeline view):
2038# CHECK-NEXT: [0]: Executions
2039# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2040# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2041# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2042
2043# CHECK:            [0]    [1]    [2]    [3]
2044# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
2045# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
2046# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
2047# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
2048# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
2049# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
2050
2051# CHECK:      [37] Code Region - G38
2052
2053# CHECK:      Iterations:        100
2054# CHECK-NEXT: Instructions:      500
2055# CHECK-NEXT: Total Cycles:      1510
2056# CHECK-NEXT: Total uOps:        4500
2057
2058# CHECK:      Dispatch Width:    4
2059# CHECK-NEXT: uOps Per Cycle:    2.98
2060# CHECK-NEXT: IPC:               0.33
2061# CHECK-NEXT: Block RThroughput: 11.3
2062
2063# CHECK:      Timeline view:
2064# CHECK-NEXT:                     0123456789
2065# CHECK-NEXT: Index     0123456789          01234
2066
2067# CHECK:      [0,0]     DeeeeeeeeeeER  .    .   .   ld4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
2068# CHECK-NEXT: [0,1]     .  DeeeeeeeeeeER    .   .   ld4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
2069# CHECK-NEXT: [0,2]     .    .DeeeeeeeeeeER .   .   ld4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
2070# CHECK-NEXT: [0,3]     .    .   DeeeeeeeeeeER  .   ld4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
2071# CHECK-NEXT: [0,4]     .    .    . DeeeeeeeeeeER   ld4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
2072
2073# CHECK:      Average Wait times (based on the timeline view):
2074# CHECK-NEXT: [0]: Executions
2075# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2076# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2077# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2078
2079# CHECK:            [0]    [1]    [2]    [3]
2080# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
2081# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
2082# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
2083# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
2084# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
2085# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
2086
2087# CHECK:      [38] Code Region - G39
2088
2089# CHECK:      Iterations:        100
2090# CHECK-NEXT: Instructions:      500
2091# CHECK-NEXT: Total Cycles:      4003
2092# CHECK-NEXT: Total uOps:        3000
2093
2094# CHECK:      Dispatch Width:    4
2095# CHECK-NEXT: uOps Per Cycle:    0.75
2096# CHECK-NEXT: IPC:               0.12
2097# CHECK-NEXT: Block RThroughput: 7.5
2098
2099# CHECK:      Timeline view:
2100# CHECK-NEXT:                     0123456789          0123456789
2101# CHECK-NEXT: Index     0123456789          0123456789          012
2102
2103# CHECK:      [0,0]     DeeeeeeeeER    .    .    .    .    .    . .   ld4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
2104# CHECK-NEXT: [0,1]     . D======eeeeeeeeER .    .    .    .    . .   ld4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
2105# CHECK-NEXT: [0,2]     .   D============eeeeeeeeER   .    .    . .   ld4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
2106# CHECK-NEXT: [0,3]     .    .D==================eeeeeeeeER.    . .   ld4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
2107# CHECK-NEXT: [0,4]     .    .  D========================eeeeeeeeER   ld4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
2108
2109# CHECK:      Average Wait times (based on the timeline view):
2110# CHECK-NEXT: [0]: Executions
2111# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2112# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2113# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2114
2115# CHECK:            [0]    [1]    [2]    [3]
2116# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
2117# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
2118# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
2119# CHECK-NEXT: 3.     1     19.0   0.0    0.0       ld4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
2120# CHECK-NEXT: 4.     1     25.0   0.0    0.0       ld4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
2121# CHECK-NEXT:        1     13.0   0.2    0.0       <total>
2122
2123# CHECK:      [39] Code Region - G40
2124
2125# CHECK:      Iterations:        100
2126# CHECK-NEXT: Instructions:      500
2127# CHECK-NEXT: Total Cycles:      4003
2128# CHECK-NEXT: Total uOps:        3000
2129
2130# CHECK:      Dispatch Width:    4
2131# CHECK-NEXT: uOps Per Cycle:    0.75
2132# CHECK-NEXT: IPC:               0.12
2133# CHECK-NEXT: Block RThroughput: 7.5
2134
2135# CHECK:      Timeline view:
2136# CHECK-NEXT:                     0123456789          0123456789
2137# CHECK-NEXT: Index     0123456789          0123456789          012
2138
2139# CHECK:      [0,0]     DeeeeeeeeER    .    .    .    .    .    . .   ld4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
2140# CHECK-NEXT: [0,1]     . D======eeeeeeeeER .    .    .    .    . .   ld4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
2141# CHECK-NEXT: [0,2]     .   D============eeeeeeeeER   .    .    . .   ld4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
2142# CHECK-NEXT: [0,3]     .    .D==================eeeeeeeeER.    . .   ld4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
2143# CHECK-NEXT: [0,4]     .    .  D========================eeeeeeeeER   ld4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
2144
2145# CHECK:      Average Wait times (based on the timeline view):
2146# CHECK-NEXT: [0]: Executions
2147# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2148# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2149# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2150
2151# CHECK:            [0]    [1]    [2]    [3]
2152# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
2153# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
2154# CHECK-NEXT: 2.     1     13.0   0.0    0.0       ld4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
2155# CHECK-NEXT: 3.     1     19.0   0.0    0.0       ld4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
2156# CHECK-NEXT: 4.     1     25.0   0.0    0.0       ld4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
2157# CHECK-NEXT:        1     13.0   0.2    0.0       <total>
2158
2159# CHECK:      [40] Code Region - G41
2160
2161# CHECK:      Iterations:        100
2162# CHECK-NEXT: Instructions:      500
2163# CHECK-NEXT: Total Cycles:      2003
2164# CHECK-NEXT: Total uOps:        3000
2165
2166# CHECK:      Dispatch Width:    4
2167# CHECK-NEXT: uOps Per Cycle:    1.50
2168# CHECK-NEXT: IPC:               0.25
2169# CHECK-NEXT: Block RThroughput: 7.5
2170
2171# CHECK:      Timeline view:
2172# CHECK-NEXT:                     0123456789
2173# CHECK-NEXT: Index     0123456789          012
2174
2175# CHECK:      [0,0]     DeeeeeeeeER    .    . .   ld4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
2176# CHECK-NEXT: [0,1]     . D======eeeeeeeeER . .   ld4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
2177# CHECK-NEXT: [0,2]     .   D=====eeeeeeeeER. .   ld4r	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
2178# CHECK-NEXT: [0,3]     .    .D=====eeeeeeeeER.   ld4r	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
2179# CHECK-NEXT: [0,4]     .    .  D====eeeeeeeeER   ld4r	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
2180
2181# CHECK:      Average Wait times (based on the timeline view):
2182# CHECK-NEXT: [0]: Executions
2183# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2184# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2185# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2186
2187# CHECK:            [0]    [1]    [2]    [3]
2188# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
2189# CHECK-NEXT: 1.     1     7.0    0.0    0.0       ld4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
2190# CHECK-NEXT: 2.     1     6.0    0.0    0.0       ld4r	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
2191# CHECK-NEXT: 3.     1     6.0    1.0    0.0       ld4r	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32
2192# CHECK-NEXT: 4.     1     5.0    0.0    0.0       ld4r	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16
2193# CHECK-NEXT:        1     5.0    0.4    0.0       <total>
2194
2195# CHECK:      [41] Code Region - G42
2196
2197# CHECK:      Iterations:        100
2198# CHECK-NEXT: Instructions:      500
2199# CHECK-NEXT: Total Cycles:      1009
2200# CHECK-NEXT: Total uOps:        3000
2201
2202# CHECK:      Dispatch Width:    4
2203# CHECK-NEXT: uOps Per Cycle:    2.97
2204# CHECK-NEXT: IPC:               0.50
2205# CHECK-NEXT: Block RThroughput: 7.5
2206
2207# CHECK:      Timeline view:
2208# CHECK-NEXT:                     012345678
2209# CHECK-NEXT: Index     0123456789
2210
2211# CHECK:      [0,0]     DeeeeeeeeER    .  .   ld4r	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
2212# CHECK-NEXT: [0,1]     . DeeeeeeeeER  .  .   ld4r	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
2213# CHECK-NEXT: [0,2]     .   DeeeeeeeeER.  .   ld4r	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
2214# CHECK-NEXT: [0,3]     .    .DeeeeeeeeER .   ld4r	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
2215# CHECK-NEXT: [0,4]     .    .  DeeeeeeeeER   ld4r	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
2216
2217# CHECK:      Average Wait times (based on the timeline view):
2218# CHECK-NEXT: [0]: Executions
2219# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2220# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2221# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2222
2223# CHECK:            [0]    [1]    [2]    [3]
2224# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld4r	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8
2225# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld4r	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16
2226# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld4r	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4
2227# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld4r	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8
2228# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld4r	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4
2229# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
2230
2231# CHECK:      [42] Code Region - G43
2232
2233# CHECK:      Iterations:        100
2234# CHECK-NEXT: Instructions:      500
2235# CHECK-NEXT: Total Cycles:      1009
2236# CHECK-NEXT: Total uOps:        3000
2237
2238# CHECK:      Dispatch Width:    4
2239# CHECK-NEXT: uOps Per Cycle:    2.97
2240# CHECK-NEXT: IPC:               0.50
2241# CHECK-NEXT: Block RThroughput: 7.5
2242
2243# CHECK:      Timeline view:
2244# CHECK-NEXT:                     012345678
2245# CHECK-NEXT: Index     0123456789
2246
2247# CHECK:      [0,0]     DeeeeeeeeER    .  .   ld4r	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
2248# CHECK-NEXT: [0,1]     . DeeeeeeeeER  .  .   ld4r	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
2249# CHECK-NEXT: [0,2]     .   DeeeeeeeeER.  .   ld4r	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
2250# CHECK-NEXT: [0,3]     .    .DeeeeeeeeER .   ld4r	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
2251# CHECK-NEXT: [0,4]     .    .  DeeeeeeeeER   ld4r	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
2252
2253# CHECK:      Average Wait times (based on the timeline view):
2254# CHECK-NEXT: [0]: Executions
2255# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2256# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2257# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2258
2259# CHECK:            [0]    [1]    [2]    [3]
2260# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld4r	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
2261# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld4r	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
2262# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld4r	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
2263# CHECK-NEXT: 3.     1     1.0    1.0    0.0       ld4r	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
2264# CHECK-NEXT: 4.     1     1.0    1.0    0.0       ld4r	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
2265# CHECK-NEXT:        1     1.0    1.0    0.0       <total>
2266
2267# CHECK:      [43] Code Region - G44
2268
2269# CHECK:      Iterations:        100
2270# CHECK-NEXT: Instructions:      500
2271# CHECK-NEXT: Total Cycles:      807
2272# CHECK-NEXT: Total uOps:        2400
2273
2274# CHECK:      Dispatch Width:    4
2275# CHECK-NEXT: uOps Per Cycle:    2.97
2276# CHECK-NEXT: IPC:               0.62
2277# CHECK-NEXT: Block RThroughput: 6.0
2278
2279# CHECK:      Timeline view:
2280# CHECK-NEXT:                     01234
2281# CHECK-NEXT: Index     0123456789
2282
2283# CHECK:      [0,0]     DeeeeeeeeER   .   ld4r	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
2284# CHECK-NEXT: [0,1]     . DeeeeeeeeER .   ld4r	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
2285# CHECK-NEXT: [0,2]     .   DeeeeeeeeER   ld4r	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
2286# CHECK-NEXT: [0,3]     .    .DeeeeeE-R   ldp	s1, s2, [x27], #248
2287# CHECK-NEXT: [0,4]     .    . DeeeeeER   ldp	d1, d2, [x27], #496
2288
2289# CHECK:      Average Wait times (based on the timeline view):
2290# CHECK-NEXT: [0]: Executions
2291# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2292# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2293# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2294
2295# CHECK:            [0]    [1]    [2]    [3]
2296# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ld4r	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
2297# CHECK-NEXT: 1.     1     1.0    1.0    0.0       ld4r	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
2298# CHECK-NEXT: 2.     1     1.0    1.0    0.0       ld4r	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
2299# CHECK-NEXT: 3.     1     1.0    1.0    1.0       ldp	s1, s2, [x27], #248
2300# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ldp	d1, d2, [x27], #496
2301# CHECK-NEXT:        1     1.0    0.8    0.2       <total>
2302
2303# CHECK:      [44] Code Region - G45
2304
2305# CHECK:      Iterations:        100
2306# CHECK-NEXT: Instructions:      500
2307# CHECK-NEXT: Total Cycles:      506
2308# CHECK-NEXT: Total uOps:        1600
2309
2310# CHECK:      Dispatch Width:    4
2311# CHECK-NEXT: uOps Per Cycle:    3.16
2312# CHECK-NEXT: IPC:               0.99
2313# CHECK-NEXT: Block RThroughput: 4.0
2314
2315# CHECK:      Timeline view:
2316# CHECK-NEXT:                     0
2317# CHECK-NEXT: Index     0123456789
2318
2319# CHECK:      [0,0]     DeeeeeER  .   ldp	q1, q2, [x27], #992
2320# CHECK-NEXT: [0,1]     .DeeeeeER .   ldp	s1, s2, [x27, #248]!
2321# CHECK-NEXT: [0,2]     . DeeeeeER.   ldp	d1, d2, [x27, #496]!
2322# CHECK-NEXT: [0,3]     .  DeeeeeER   ldp	q1, q2, [x27, #992]!
2323# CHECK-NEXT: [0,4]     .   DeeeeER   ldp	w1, w2, [x27], #248
2324
2325# CHECK:      Average Wait times (based on the timeline view):
2326# CHECK-NEXT: [0]: Executions
2327# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2328# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2329# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2330
2331# CHECK:            [0]    [1]    [2]    [3]
2332# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldp	q1, q2, [x27], #992
2333# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ldp	s1, s2, [x27, #248]!
2334# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ldp	d1, d2, [x27, #496]!
2335# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ldp	q1, q2, [x27, #992]!
2336# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ldp	w1, w2, [x27], #248
2337# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
2338
2339# CHECK:      [45] Code Region - G46
2340
2341# CHECK:      Iterations:        100
2342# CHECK-NEXT: Instructions:      500
2343# CHECK-NEXT: Total Cycles:      506
2344# CHECK-NEXT: Total uOps:        1800
2345
2346# CHECK:      Dispatch Width:    4
2347# CHECK-NEXT: uOps Per Cycle:    3.56
2348# CHECK-NEXT: IPC:               0.99
2349# CHECK-NEXT: Block RThroughput: 4.5
2350
2351# CHECK:      Timeline view:
2352# CHECK-NEXT:                     0
2353# CHECK-NEXT: Index     0123456789
2354
2355# CHECK:      [0,0]     DeeeeER   .   ldp	x1, x2, [x27], #496
2356# CHECK-NEXT: [0,1]     .DeeeeER  .   ldp	w1, w2, [x27, #248]!
2357# CHECK-NEXT: [0,2]     . DeeeeER .   ldp	x1, x2, [x27, #496]!
2358# CHECK-NEXT: [0,3]     .  DeeeeER.   ldpsw	x1, x2, [x27], #248
2359# CHECK-NEXT: [0,4]     .   DeeeeER   ldpsw	x1, x2, [x27, #248]!
2360
2361# CHECK:      Average Wait times (based on the timeline view):
2362# CHECK-NEXT: [0]: Executions
2363# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2364# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2365# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2366
2367# CHECK:            [0]    [1]    [2]    [3]
2368# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldp	x1, x2, [x27], #496
2369# CHECK-NEXT: 1.     1     1.0    0.0    0.0       ldp	w1, w2, [x27, #248]!
2370# CHECK-NEXT: 2.     1     1.0    0.0    0.0       ldp	x1, x2, [x27, #496]!
2371# CHECK-NEXT: 3.     1     1.0    0.0    0.0       ldpsw	x1, x2, [x27], #248
2372# CHECK-NEXT: 4.     1     1.0    0.0    0.0       ldpsw	x1, x2, [x27, #248]!
2373# CHECK-NEXT:        1     1.0    0.2    0.0       <total>
2374
2375# CHECK:      [46] Code Region - G47
2376
2377# CHECK:      Iterations:        100
2378# CHECK-NEXT: Instructions:      500
2379# CHECK-NEXT: Total Cycles:      507
2380# CHECK-NEXT: Total uOps:        1000
2381
2382# CHECK:      Dispatch Width:    4
2383# CHECK-NEXT: uOps Per Cycle:    1.97
2384# CHECK-NEXT: IPC:               0.99
2385# CHECK-NEXT: Block RThroughput: 2.5
2386
2387# CHECK:      Timeline view:
2388# CHECK-NEXT:                     01
2389# CHECK-NEXT: Index     0123456789
2390
2391# CHECK:      [0,0]     DeeeeeER  ..   ldr	b1, [x27], #254
2392# CHECK-NEXT: [0,1]     D=eeeeeER ..   ldr	h1, [x27], #254
2393# CHECK-NEXT: [0,2]     .D=eeeeeER..   ldr	s1, [x27], #254
2394# CHECK-NEXT: [0,3]     .D==eeeeeER.   ldr	d1, [x27], #254
2395# CHECK-NEXT: [0,4]     . D==eeeeeER   ldr	q1, [x27], #254
2396
2397# CHECK:      Average Wait times (based on the timeline view):
2398# CHECK-NEXT: [0]: Executions
2399# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2400# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2401# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2402
2403# CHECK:            [0]    [1]    [2]    [3]
2404# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldr	b1, [x27], #254
2405# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ldr	h1, [x27], #254
2406# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ldr	s1, [x27], #254
2407# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ldr	d1, [x27], #254
2408# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ldr	q1, [x27], #254
2409# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2410
2411# CHECK:      [47] Code Region - G48
2412
2413# CHECK:      Iterations:        100
2414# CHECK-NEXT: Instructions:      500
2415# CHECK-NEXT: Total Cycles:      507
2416# CHECK-NEXT: Total uOps:        1000
2417
2418# CHECK:      Dispatch Width:    4
2419# CHECK-NEXT: uOps Per Cycle:    1.97
2420# CHECK-NEXT: IPC:               0.99
2421# CHECK-NEXT: Block RThroughput: 2.5
2422
2423# CHECK:      Timeline view:
2424# CHECK-NEXT:                     01
2425# CHECK-NEXT: Index     0123456789
2426
2427# CHECK:      [0,0]     DeeeeeER  ..   ldr	b1, [x27, #254]!
2428# CHECK-NEXT: [0,1]     D=eeeeeER ..   ldr	h1, [x27, #254]!
2429# CHECK-NEXT: [0,2]     .D=eeeeeER..   ldr	s1, [x27, #254]!
2430# CHECK-NEXT: [0,3]     .D==eeeeeER.   ldr	d1, [x27, #254]!
2431# CHECK-NEXT: [0,4]     . D==eeeeeER   ldr	q1, [x27, #254]!
2432
2433# CHECK:      Average Wait times (based on the timeline view):
2434# CHECK-NEXT: [0]: Executions
2435# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2436# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2437# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2438
2439# CHECK:            [0]    [1]    [2]    [3]
2440# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldr	b1, [x27, #254]!
2441# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ldr	h1, [x27, #254]!
2442# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ldr	s1, [x27, #254]!
2443# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ldr	d1, [x27, #254]!
2444# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ldr	q1, [x27, #254]!
2445# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2446
2447# CHECK:      [48] Code Region - G49
2448
2449# CHECK:      Iterations:        100
2450# CHECK-NEXT: Instructions:      500
2451# CHECK-NEXT: Total Cycles:      506
2452# CHECK-NEXT: Total uOps:        1000
2453
2454# CHECK:      Dispatch Width:    4
2455# CHECK-NEXT: uOps Per Cycle:    1.98
2456# CHECK-NEXT: IPC:               0.99
2457# CHECK-NEXT: Block RThroughput: 2.5
2458
2459# CHECK:      Timeline view:
2460# CHECK-NEXT:                     0
2461# CHECK-NEXT: Index     0123456789
2462
2463# CHECK:      [0,0]     DeeeeER   .   ldr	w1, [x27], #254
2464# CHECK-NEXT: [0,1]     D=eeeeER  .   ldr	x1, [x27], #254
2465# CHECK-NEXT: [0,2]     .D=eeeeER .   ldr	w1, [x27, #254]!
2466# CHECK-NEXT: [0,3]     .D==eeeeER.   ldr	x1, [x27, #254]!
2467# CHECK-NEXT: [0,4]     . D==eeeeER   ldrb	w1, [x27], #254
2468
2469# CHECK:      Average Wait times (based on the timeline view):
2470# CHECK-NEXT: [0]: Executions
2471# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2472# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2473# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2474
2475# CHECK:            [0]    [1]    [2]    [3]
2476# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldr	w1, [x27], #254
2477# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ldr	x1, [x27], #254
2478# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ldr	w1, [x27, #254]!
2479# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ldr	x1, [x27, #254]!
2480# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ldrb	w1, [x27], #254
2481# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2482
2483# CHECK:      [49] Code Region - G50
2484
2485# CHECK:      Iterations:        100
2486# CHECK-NEXT: Instructions:      500
2487# CHECK-NEXT: Total Cycles:      506
2488# CHECK-NEXT: Total uOps:        1000
2489
2490# CHECK:      Dispatch Width:    4
2491# CHECK-NEXT: uOps Per Cycle:    1.98
2492# CHECK-NEXT: IPC:               0.99
2493# CHECK-NEXT: Block RThroughput: 2.5
2494
2495# CHECK:      Timeline view:
2496# CHECK-NEXT:                     0
2497# CHECK-NEXT: Index     0123456789
2498
2499# CHECK:      [0,0]     DeeeeER   .   ldrb	w1, [x27, #254]!
2500# CHECK-NEXT: [0,1]     D=eeeeER  .   ldrh	w1, [x27], #254
2501# CHECK-NEXT: [0,2]     .D=eeeeER .   ldrh	w1, [x27, #254]!
2502# CHECK-NEXT: [0,3]     .D==eeeeER.   ldrsb	w1, [x27], #254
2503# CHECK-NEXT: [0,4]     . D==eeeeER   ldrsb	x1, [x27], #254
2504
2505# CHECK:      Average Wait times (based on the timeline view):
2506# CHECK-NEXT: [0]: Executions
2507# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2508# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2509# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2510
2511# CHECK:            [0]    [1]    [2]    [3]
2512# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldrb	w1, [x27, #254]!
2513# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ldrh	w1, [x27], #254
2514# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ldrh	w1, [x27, #254]!
2515# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ldrsb	w1, [x27], #254
2516# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ldrsb	x1, [x27], #254
2517# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2518
2519# CHECK:      [50] Code Region - G51
2520
2521# CHECK:      Iterations:        100
2522# CHECK-NEXT: Instructions:      500
2523# CHECK-NEXT: Total Cycles:      506
2524# CHECK-NEXT: Total uOps:        1000
2525
2526# CHECK:      Dispatch Width:    4
2527# CHECK-NEXT: uOps Per Cycle:    1.98
2528# CHECK-NEXT: IPC:               0.99
2529# CHECK-NEXT: Block RThroughput: 2.5
2530
2531# CHECK:      Timeline view:
2532# CHECK-NEXT:                     0
2533# CHECK-NEXT: Index     0123456789
2534
2535# CHECK:      [0,0]     DeeeeER   .   ldrsb	w1, [x27, #254]!
2536# CHECK-NEXT: [0,1]     D=eeeeER  .   ldrsb	x1, [x27, #254]!
2537# CHECK-NEXT: [0,2]     .D=eeeeER .   ldrsh	w1, [x27], #254
2538# CHECK-NEXT: [0,3]     .D==eeeeER.   ldrsh	x1, [x27], #254
2539# CHECK-NEXT: [0,4]     . D==eeeeER   ldrsh	w1, [x27, #254]!
2540
2541# CHECK:      Average Wait times (based on the timeline view):
2542# CHECK-NEXT: [0]: Executions
2543# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2544# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2545# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2546
2547# CHECK:            [0]    [1]    [2]    [3]
2548# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldrsb	w1, [x27, #254]!
2549# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ldrsb	x1, [x27, #254]!
2550# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ldrsh	w1, [x27], #254
2551# CHECK-NEXT: 3.     1     3.0    0.0    0.0       ldrsh	x1, [x27], #254
2552# CHECK-NEXT: 4.     1     3.0    0.0    0.0       ldrsh	w1, [x27, #254]!
2553# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2554
2555# CHECK:      [51] Code Region - G52
2556
2557# CHECK:      Iterations:        100
2558# CHECK-NEXT: Instructions:      500
2559# CHECK-NEXT: Total Cycles:      505
2560# CHECK-NEXT: Total uOps:        1000
2561
2562# CHECK:      Dispatch Width:    4
2563# CHECK-NEXT: uOps Per Cycle:    1.98
2564# CHECK-NEXT: IPC:               0.99
2565# CHECK-NEXT: Block RThroughput: 2.5
2566
2567# CHECK:      Timeline view:
2568# CHECK-NEXT: Index     0123456789
2569
2570# CHECK:      [0,0]     DeeeeER  .   ldrsh	x1, [x27, #254]!
2571# CHECK-NEXT: [0,1]     D=eeeeER .   ldrsw	x1, [x27], #254
2572# CHECK-NEXT: [0,2]     .D=eeeeER.   ldrsw	x1, [x27, #254]!
2573# CHECK-NEXT: [0,3]     .D==eeeER.   st1	{ v1.1d }, [x27], #8
2574# CHECK-NEXT: [0,4]     . D==eeeER   st1	{ v1.2d }, [x27], #16
2575
2576# CHECK:      Average Wait times (based on the timeline view):
2577# CHECK-NEXT: [0]: Executions
2578# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2579# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2580# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2581
2582# CHECK:            [0]    [1]    [2]    [3]
2583# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldrsh	x1, [x27, #254]!
2584# CHECK-NEXT: 1.     1     2.0    0.0    0.0       ldrsw	x1, [x27], #254
2585# CHECK-NEXT: 2.     1     2.0    0.0    0.0       ldrsw	x1, [x27, #254]!
2586# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.1d }, [x27], #8
2587# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.2d }, [x27], #16
2588# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2589
2590# CHECK:      [52] Code Region - G53
2591
2592# CHECK:      Iterations:        100
2593# CHECK-NEXT: Instructions:      500
2594# CHECK-NEXT: Total Cycles:      505
2595# CHECK-NEXT: Total uOps:        1000
2596
2597# CHECK:      Dispatch Width:    4
2598# CHECK-NEXT: uOps Per Cycle:    1.98
2599# CHECK-NEXT: IPC:               0.99
2600# CHECK-NEXT: Block RThroughput: 2.5
2601
2602# CHECK:      Timeline view:
2603# CHECK-NEXT: Index     0123456789
2604
2605# CHECK:      [0,0]     DeeeER   .   st1	{ v1.2s }, [x27], #8
2606# CHECK-NEXT: [0,1]     D=eeeER  .   st1	{ v1.4h }, [x27], #8
2607# CHECK-NEXT: [0,2]     .D=eeeER .   st1	{ v1.4s }, [x27], #16
2608# CHECK-NEXT: [0,3]     .D==eeeER.   st1	{ v1.8b }, [x27], #8
2609# CHECK-NEXT: [0,4]     . D==eeeER   st1	{ v1.8h }, [x27], #16
2610
2611# CHECK:      Average Wait times (based on the timeline view):
2612# CHECK-NEXT: [0]: Executions
2613# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2614# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2615# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2616
2617# CHECK:            [0]    [1]    [2]    [3]
2618# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.2s }, [x27], #8
2619# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.4h }, [x27], #8
2620# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.4s }, [x27], #16
2621# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.8b }, [x27], #8
2622# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.8h }, [x27], #16
2623# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2624
2625# CHECK:      [53] Code Region - G54
2626
2627# CHECK:      Iterations:        100
2628# CHECK-NEXT: Instructions:      500
2629# CHECK-NEXT: Total Cycles:      505
2630# CHECK-NEXT: Total uOps:        1000
2631
2632# CHECK:      Dispatch Width:    4
2633# CHECK-NEXT: uOps Per Cycle:    1.98
2634# CHECK-NEXT: IPC:               0.99
2635# CHECK-NEXT: Block RThroughput: 2.5
2636
2637# CHECK:      Timeline view:
2638# CHECK-NEXT: Index     0123456789
2639
2640# CHECK:      [0,0]     DeeeER   .   st1	{ v1.16b }, [x27], #16
2641# CHECK-NEXT: [0,1]     D=eeeER  .   st1	{ v1.1d }, [x27], x28
2642# CHECK-NEXT: [0,2]     .D=eeeER .   st1	{ v1.2d }, [x27], x28
2643# CHECK-NEXT: [0,3]     .D==eeeER.   st1	{ v1.2s }, [x27], x28
2644# CHECK-NEXT: [0,4]     . D==eeeER   st1	{ v1.4h }, [x27], x28
2645
2646# CHECK:      Average Wait times (based on the timeline view):
2647# CHECK-NEXT: [0]: Executions
2648# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2649# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2650# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2651
2652# CHECK:            [0]    [1]    [2]    [3]
2653# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.16b }, [x27], #16
2654# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.1d }, [x27], x28
2655# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.2d }, [x27], x28
2656# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.2s }, [x27], x28
2657# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.4h }, [x27], x28
2658# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2659
2660# CHECK:      [54] Code Region - G55
2661
2662# CHECK:      Iterations:        100
2663# CHECK-NEXT: Instructions:      500
2664# CHECK-NEXT: Total Cycles:      506
2665# CHECK-NEXT: Total uOps:        1000
2666
2667# CHECK:      Dispatch Width:    4
2668# CHECK-NEXT: uOps Per Cycle:    1.98
2669# CHECK-NEXT: IPC:               0.99
2670# CHECK-NEXT: Block RThroughput: 2.5
2671
2672# CHECK:      Timeline view:
2673# CHECK-NEXT:                     0
2674# CHECK-NEXT: Index     0123456789
2675
2676# CHECK:      [0,0]     DeeeER    .   st1	{ v1.4s }, [x27], x28
2677# CHECK-NEXT: [0,1]     D=eeeER   .   st1	{ v1.8b }, [x27], x28
2678# CHECK-NEXT: [0,2]     .D=eeeER  .   st1	{ v1.8h }, [x27], x28
2679# CHECK-NEXT: [0,3]     .D==eeeER .   st1	{ v1.16b }, [x27], x28
2680# CHECK-NEXT: [0,4]     . D==eeeeER   st1	{ v1.1d, v2.1d }, [x27], #16
2681
2682# CHECK:      Average Wait times (based on the timeline view):
2683# CHECK-NEXT: [0]: Executions
2684# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2685# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2686# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2687
2688# CHECK:            [0]    [1]    [2]    [3]
2689# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.4s }, [x27], x28
2690# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.8b }, [x27], x28
2691# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.8h }, [x27], x28
2692# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.16b }, [x27], x28
2693# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.1d, v2.1d }, [x27], #16
2694# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2695
2696# CHECK:      [55] Code Region - G56
2697
2698# CHECK:      Iterations:        100
2699# CHECK-NEXT: Instructions:      500
2700# CHECK-NEXT: Total Cycles:      506
2701# CHECK-NEXT: Total uOps:        1000
2702
2703# CHECK:      Dispatch Width:    4
2704# CHECK-NEXT: uOps Per Cycle:    1.98
2705# CHECK-NEXT: IPC:               0.99
2706# CHECK-NEXT: Block RThroughput: 2.5
2707
2708# CHECK:      Timeline view:
2709# CHECK-NEXT:                     0
2710# CHECK-NEXT: Index     0123456789
2711
2712# CHECK:      [0,0]     DeeeeER   .   st1	{ v1.2d, v2.2d }, [x27], #32
2713# CHECK-NEXT: [0,1]     D=eeeeER  .   st1	{ v1.2s, v2.2s }, [x27], #16
2714# CHECK-NEXT: [0,2]     .D=eeeeER .   st1	{ v1.4h, v2.4h }, [x27], #16
2715# CHECK-NEXT: [0,3]     .D==eeeeER.   st1	{ v1.4s, v2.4s }, [x27], #32
2716# CHECK-NEXT: [0,4]     . D==eeeeER   st1	{ v1.8b, v2.8b }, [x27], #16
2717
2718# CHECK:      Average Wait times (based on the timeline view):
2719# CHECK-NEXT: [0]: Executions
2720# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2721# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2722# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2723
2724# CHECK:            [0]    [1]    [2]    [3]
2725# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.2d, v2.2d }, [x27], #32
2726# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.2s, v2.2s }, [x27], #16
2727# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.4h, v2.4h }, [x27], #16
2728# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.4s, v2.4s }, [x27], #32
2729# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.8b, v2.8b }, [x27], #16
2730# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2731
2732# CHECK:      [56] Code Region - G57
2733
2734# CHECK:      Iterations:        100
2735# CHECK-NEXT: Instructions:      500
2736# CHECK-NEXT: Total Cycles:      506
2737# CHECK-NEXT: Total uOps:        1000
2738
2739# CHECK:      Dispatch Width:    4
2740# CHECK-NEXT: uOps Per Cycle:    1.98
2741# CHECK-NEXT: IPC:               0.99
2742# CHECK-NEXT: Block RThroughput: 2.5
2743
2744# CHECK:      Timeline view:
2745# CHECK-NEXT:                     0
2746# CHECK-NEXT: Index     0123456789
2747
2748# CHECK:      [0,0]     DeeeeER   .   st1	{ v1.8h, v2.8h }, [x27], #32
2749# CHECK-NEXT: [0,1]     D=eeeeER  .   st1	{ v1.16b, v2.16b }, [x27], #32
2750# CHECK-NEXT: [0,2]     .D=eeeeER .   st1	{ v1.1d, v2.1d }, [x27], x28
2751# CHECK-NEXT: [0,3]     .D==eeeeER.   st1	{ v1.2d, v2.2d }, [x27], x28
2752# CHECK-NEXT: [0,4]     . D==eeeeER   st1	{ v1.2s, v2.2s }, [x27], x28
2753
2754# CHECK:      Average Wait times (based on the timeline view):
2755# CHECK-NEXT: [0]: Executions
2756# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2757# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2758# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2759
2760# CHECK:            [0]    [1]    [2]    [3]
2761# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.8h, v2.8h }, [x27], #32
2762# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.16b, v2.16b }, [x27], #32
2763# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.1d, v2.1d }, [x27], x28
2764# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.2d, v2.2d }, [x27], x28
2765# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.2s, v2.2s }, [x27], x28
2766# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2767
2768# CHECK:      [57] Code Region - G58
2769
2770# CHECK:      Iterations:        100
2771# CHECK-NEXT: Instructions:      500
2772# CHECK-NEXT: Total Cycles:      506
2773# CHECK-NEXT: Total uOps:        1000
2774
2775# CHECK:      Dispatch Width:    4
2776# CHECK-NEXT: uOps Per Cycle:    1.98
2777# CHECK-NEXT: IPC:               0.99
2778# CHECK-NEXT: Block RThroughput: 2.5
2779
2780# CHECK:      Timeline view:
2781# CHECK-NEXT:                     0
2782# CHECK-NEXT: Index     0123456789
2783
2784# CHECK:      [0,0]     DeeeeER   .   st1	{ v1.4h, v2.4h }, [x27], x28
2785# CHECK-NEXT: [0,1]     D=eeeeER  .   st1	{ v1.4s, v2.4s }, [x27], x28
2786# CHECK-NEXT: [0,2]     .D=eeeeER .   st1	{ v1.8b, v2.8b }, [x27], x28
2787# CHECK-NEXT: [0,3]     .D==eeeeER.   st1	{ v1.8h, v2.8h }, [x27], x28
2788# CHECK-NEXT: [0,4]     . D==eeeeER   st1	{ v1.16b, v2.16b }, [x27], x28
2789
2790# CHECK:      Average Wait times (based on the timeline view):
2791# CHECK-NEXT: [0]: Executions
2792# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2793# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2794# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2795
2796# CHECK:            [0]    [1]    [2]    [3]
2797# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.4h, v2.4h }, [x27], x28
2798# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.4s, v2.4s }, [x27], x28
2799# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.8b, v2.8b }, [x27], x28
2800# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.8h, v2.8h }, [x27], x28
2801# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.16b, v2.16b }, [x27], x28
2802# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2803
2804# CHECK:      [58] Code Region - G59
2805
2806# CHECK:      Iterations:        100
2807# CHECK-NEXT: Instructions:      500
2808# CHECK-NEXT: Total Cycles:      507
2809# CHECK-NEXT: Total uOps:        1000
2810
2811# CHECK:      Dispatch Width:    4
2812# CHECK-NEXT: uOps Per Cycle:    1.97
2813# CHECK-NEXT: IPC:               0.99
2814# CHECK-NEXT: Block RThroughput: 2.5
2815
2816# CHECK:      Timeline view:
2817# CHECK-NEXT:                     01
2818# CHECK-NEXT: Index     0123456789
2819
2820# CHECK:      [0,0]     DeeeeeER  ..   st1	{ v1.1d, v2.1d, v3.1d }, [x27], #24
2821# CHECK-NEXT: [0,1]     D=eeeeeER ..   st1	{ v1.2d, v2.2d, v3.2d }, [x27], #48
2822# CHECK-NEXT: [0,2]     .D=eeeeeER..   st1	{ v1.2s, v2.2s, v3.2s }, [x27], #24
2823# CHECK-NEXT: [0,3]     .D==eeeeeER.   st1	{ v1.4h, v2.4h, v3.4h }, [x27], #24
2824# CHECK-NEXT: [0,4]     . D==eeeeeER   st1	{ v1.4s, v2.4s, v3.4s }, [x27], #48
2825
2826# CHECK:      Average Wait times (based on the timeline view):
2827# CHECK-NEXT: [0]: Executions
2828# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2829# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2830# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2831
2832# CHECK:            [0]    [1]    [2]    [3]
2833# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.1d, v2.1d, v3.1d }, [x27], #24
2834# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.2d, v2.2d, v3.2d }, [x27], #48
2835# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.2s, v2.2s, v3.2s }, [x27], #24
2836# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.4h, v2.4h, v3.4h }, [x27], #24
2837# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.4s, v2.4s, v3.4s }, [x27], #48
2838# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2839
2840# CHECK:      [59] Code Region - G60
2841
2842# CHECK:      Iterations:        100
2843# CHECK-NEXT: Instructions:      500
2844# CHECK-NEXT: Total Cycles:      507
2845# CHECK-NEXT: Total uOps:        1000
2846
2847# CHECK:      Dispatch Width:    4
2848# CHECK-NEXT: uOps Per Cycle:    1.97
2849# CHECK-NEXT: IPC:               0.99
2850# CHECK-NEXT: Block RThroughput: 2.5
2851
2852# CHECK:      Timeline view:
2853# CHECK-NEXT:                     01
2854# CHECK-NEXT: Index     0123456789
2855
2856# CHECK:      [0,0]     DeeeeeER  ..   st1	{ v1.8b, v2.8b, v3.8b }, [x27], #24
2857# CHECK-NEXT: [0,1]     D=eeeeeER ..   st1	{ v1.8h, v2.8h, v3.8h }, [x27], #48
2858# CHECK-NEXT: [0,2]     .D=eeeeeER..   st1	{ v1.16b, v2.16b, v3.16b }, [x27], #48
2859# CHECK-NEXT: [0,3]     .D==eeeeeER.   st1	{ v1.1d, v2.1d, v3.1d }, [x27], x28
2860# CHECK-NEXT: [0,4]     . D==eeeeeER   st1	{ v1.2d, v2.2d, v3.2d }, [x27], x28
2861
2862# CHECK:      Average Wait times (based on the timeline view):
2863# CHECK-NEXT: [0]: Executions
2864# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2865# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2866# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2867
2868# CHECK:            [0]    [1]    [2]    [3]
2869# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.8b, v2.8b, v3.8b }, [x27], #24
2870# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.8h, v2.8h, v3.8h }, [x27], #48
2871# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.16b, v2.16b, v3.16b }, [x27], #48
2872# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.1d, v2.1d, v3.1d }, [x27], x28
2873# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.2d, v2.2d, v3.2d }, [x27], x28
2874# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2875
2876# CHECK:      [60] Code Region - G61
2877
2878# CHECK:      Iterations:        100
2879# CHECK-NEXT: Instructions:      500
2880# CHECK-NEXT: Total Cycles:      507
2881# CHECK-NEXT: Total uOps:        1000
2882
2883# CHECK:      Dispatch Width:    4
2884# CHECK-NEXT: uOps Per Cycle:    1.97
2885# CHECK-NEXT: IPC:               0.99
2886# CHECK-NEXT: Block RThroughput: 2.5
2887
2888# CHECK:      Timeline view:
2889# CHECK-NEXT:                     01
2890# CHECK-NEXT: Index     0123456789
2891
2892# CHECK:      [0,0]     DeeeeeER  ..   st1	{ v1.2s, v2.2s, v3.2s }, [x27], x28
2893# CHECK-NEXT: [0,1]     D=eeeeeER ..   st1	{ v1.4h, v2.4h, v3.4h }, [x27], x28
2894# CHECK-NEXT: [0,2]     .D=eeeeeER..   st1	{ v1.4s, v2.4s, v3.4s }, [x27], x28
2895# CHECK-NEXT: [0,3]     .D==eeeeeER.   st1	{ v1.8b, v2.8b, v3.8b }, [x27], x28
2896# CHECK-NEXT: [0,4]     . D==eeeeeER   st1	{ v1.8h, v2.8h, v3.8h }, [x27], x28
2897
2898# CHECK:      Average Wait times (based on the timeline view):
2899# CHECK-NEXT: [0]: Executions
2900# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2901# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2902# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2903
2904# CHECK:            [0]    [1]    [2]    [3]
2905# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.2s, v2.2s, v3.2s }, [x27], x28
2906# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.4h, v2.4h, v3.4h }, [x27], x28
2907# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.4s, v2.4s, v3.4s }, [x27], x28
2908# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.8b, v2.8b, v3.8b }, [x27], x28
2909# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.8h, v2.8h, v3.8h }, [x27], x28
2910# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2911
2912# CHECK:      [61] Code Region - G62
2913
2914# CHECK:      Iterations:        100
2915# CHECK-NEXT: Instructions:      500
2916# CHECK-NEXT: Total Cycles:      508
2917# CHECK-NEXT: Total uOps:        1000
2918
2919# CHECK:      Dispatch Width:    4
2920# CHECK-NEXT: uOps Per Cycle:    1.97
2921# CHECK-NEXT: IPC:               0.98
2922# CHECK-NEXT: Block RThroughput: 2.5
2923
2924# CHECK:      Timeline view:
2925# CHECK-NEXT:                     012
2926# CHECK-NEXT: Index     0123456789
2927
2928# CHECK:      [0,0]     DeeeeeER  . .   st1	{ v1.16b, v2.16b, v3.16b }, [x27], x28
2929# CHECK-NEXT: [0,1]     D=eeeeeeER. .   st1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
2930# CHECK-NEXT: [0,2]     .D=eeeeeeER .   st1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
2931# CHECK-NEXT: [0,3]     .D==eeeeeeER.   st1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
2932# CHECK-NEXT: [0,4]     . D==eeeeeeER   st1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
2933
2934# CHECK:      Average Wait times (based on the timeline view):
2935# CHECK-NEXT: [0]: Executions
2936# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2937# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2938# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2939
2940# CHECK:            [0]    [1]    [2]    [3]
2941# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.16b, v2.16b, v3.16b }, [x27], x28
2942# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32
2943# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
2944# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
2945# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
2946# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2947
2948# CHECK:      [62] Code Region - G63
2949
2950# CHECK:      Iterations:        100
2951# CHECK-NEXT: Instructions:      500
2952# CHECK-NEXT: Total Cycles:      508
2953# CHECK-NEXT: Total uOps:        1000
2954
2955# CHECK:      Dispatch Width:    4
2956# CHECK-NEXT: uOps Per Cycle:    1.97
2957# CHECK-NEXT: IPC:               0.98
2958# CHECK-NEXT: Block RThroughput: 2.5
2959
2960# CHECK:      Timeline view:
2961# CHECK-NEXT:                     012
2962# CHECK-NEXT: Index     0123456789
2963
2964# CHECK:      [0,0]     DeeeeeeER . .   st1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
2965# CHECK-NEXT: [0,1]     D=eeeeeeER. .   st1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
2966# CHECK-NEXT: [0,2]     .D=eeeeeeER .   st1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
2967# CHECK-NEXT: [0,3]     .D==eeeeeeER.   st1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
2968# CHECK-NEXT: [0,4]     . D==eeeeeeER   st1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
2969
2970# CHECK:      Average Wait times (based on the timeline view):
2971# CHECK-NEXT: [0]: Executions
2972# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
2973# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
2974# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
2975
2976# CHECK:            [0]    [1]    [2]    [3]
2977# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
2978# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
2979# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
2980# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
2981# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28
2982# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
2983
2984# CHECK:      [63] Code Region - G64
2985
2986# CHECK:      Iterations:        100
2987# CHECK-NEXT: Instructions:      500
2988# CHECK-NEXT: Total Cycles:      508
2989# CHECK-NEXT: Total uOps:        1000
2990
2991# CHECK:      Dispatch Width:    4
2992# CHECK-NEXT: uOps Per Cycle:    1.97
2993# CHECK-NEXT: IPC:               0.98
2994# CHECK-NEXT: Block RThroughput: 2.5
2995
2996# CHECK:      Timeline view:
2997# CHECK-NEXT:                     012
2998# CHECK-NEXT: Index     0123456789
2999
3000# CHECK:      [0,0]     DeeeeeeER . .   st1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
3001# CHECK-NEXT: [0,1]     D=eeeeeeER. .   st1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
3002# CHECK-NEXT: [0,2]     .D=eeeeeeER .   st1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
3003# CHECK-NEXT: [0,3]     .D==eeeeeeER.   st1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
3004# CHECK-NEXT: [0,4]     . D==eeeeeeER   st1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
3005
3006# CHECK:      Average Wait times (based on the timeline view):
3007# CHECK-NEXT: [0]: Executions
3008# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3009# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3010# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3011
3012# CHECK:            [0]    [1]    [2]    [3]
3013# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
3014# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
3015# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
3016# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
3017# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
3018# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3019
3020# CHECK:      [64] Code Region - G65
3021
3022# CHECK:      Iterations:        100
3023# CHECK-NEXT: Instructions:      500
3024# CHECK-NEXT: Total Cycles:      505
3025# CHECK-NEXT: Total uOps:        1000
3026
3027# CHECK:      Dispatch Width:    4
3028# CHECK-NEXT: uOps Per Cycle:    1.98
3029# CHECK-NEXT: IPC:               0.99
3030# CHECK-NEXT: Block RThroughput: 2.5
3031
3032# CHECK:      Timeline view:
3033# CHECK-NEXT: Index     0123456789
3034
3035# CHECK:      [0,0]     DeeeeeeER.   st1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
3036# CHECK-NEXT: [0,1]     D=eeeeeeER   st1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
3037# CHECK-NEXT: [0,2]     .D=eeeE--R   st1	{ v1.b }[0], [x27], #1
3038# CHECK-NEXT: [0,3]     .D==eeeE-R   st1	{ v1.b }[8], [x27], #1
3039# CHECK-NEXT: [0,4]     . D==eeeER   st1	{ v1.b }[0], [x27], x28
3040
3041# CHECK:      Average Wait times (based on the timeline view):
3042# CHECK-NEXT: [0]: Executions
3043# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3044# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3045# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3046
3047# CHECK:            [0]    [1]    [2]    [3]
3048# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
3049# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
3050# CHECK-NEXT: 2.     1     2.0    0.0    2.0       st1	{ v1.b }[0], [x27], #1
3051# CHECK-NEXT: 3.     1     3.0    0.0    1.0       st1	{ v1.b }[8], [x27], #1
3052# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.b }[0], [x27], x28
3053# CHECK-NEXT:        1     2.2    0.2    0.6       <total>
3054
3055# CHECK:      [65] Code Region - G66
3056
3057# CHECK:      Iterations:        100
3058# CHECK-NEXT: Instructions:      500
3059# CHECK-NEXT: Total Cycles:      505
3060# CHECK-NEXT: Total uOps:        1000
3061
3062# CHECK:      Dispatch Width:    4
3063# CHECK-NEXT: uOps Per Cycle:    1.98
3064# CHECK-NEXT: IPC:               0.99
3065# CHECK-NEXT: Block RThroughput: 2.5
3066
3067# CHECK:      Timeline view:
3068# CHECK-NEXT: Index     0123456789
3069
3070# CHECK:      [0,0]     DeeeER   .   st1	{ v1.b }[8], [x27], x28
3071# CHECK-NEXT: [0,1]     D=eeeER  .   st1	{ v1.h }[0], [x27], #2
3072# CHECK-NEXT: [0,2]     .D=eeeER .   st1	{ v1.h }[4], [x27], #2
3073# CHECK-NEXT: [0,3]     .D==eeeER.   st1	{ v1.h }[0], [x27], x28
3074# CHECK-NEXT: [0,4]     . D==eeeER   st1	{ v1.h }[4], [x27], x28
3075
3076# CHECK:      Average Wait times (based on the timeline view):
3077# CHECK-NEXT: [0]: Executions
3078# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3079# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3080# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3081
3082# CHECK:            [0]    [1]    [2]    [3]
3083# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.b }[8], [x27], x28
3084# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.h }[0], [x27], #2
3085# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.h }[4], [x27], #2
3086# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.h }[0], [x27], x28
3087# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st1	{ v1.h }[4], [x27], x28
3088# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3089
3090# CHECK:      [66] Code Region - G67
3091
3092# CHECK:      Iterations:        100
3093# CHECK-NEXT: Instructions:      500
3094# CHECK-NEXT: Total Cycles:      506
3095# CHECK-NEXT: Total uOps:        1000
3096
3097# CHECK:      Dispatch Width:    4
3098# CHECK-NEXT: uOps Per Cycle:    1.98
3099# CHECK-NEXT: IPC:               0.99
3100# CHECK-NEXT: Block RThroughput: 2.5
3101
3102# CHECK:      Timeline view:
3103# CHECK-NEXT:                     0
3104# CHECK-NEXT: Index     0123456789
3105
3106# CHECK:      [0,0]     DeeeER    .   st1	{ v1.s }[0], [x27], #4
3107# CHECK-NEXT: [0,1]     D=eeeER   .   st1	{ v1.s }[0], [x27], x28
3108# CHECK-NEXT: [0,2]     .D=eeeER  .   st1	{ v1.d }[0], [x27], #8
3109# CHECK-NEXT: [0,3]     .D==eeeER .   st1	{ v1.d }[0], [x27], x28
3110# CHECK-NEXT: [0,4]     . D==eeeeER   st2	{ v1.2d, v2.2d }, [x27], #32
3111
3112# CHECK:      Average Wait times (based on the timeline view):
3113# CHECK-NEXT: [0]: Executions
3114# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3115# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3116# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3117
3118# CHECK:            [0]    [1]    [2]    [3]
3119# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st1	{ v1.s }[0], [x27], #4
3120# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st1	{ v1.s }[0], [x27], x28
3121# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st1	{ v1.d }[0], [x27], #8
3122# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st1	{ v1.d }[0], [x27], x28
3123# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st2	{ v1.2d, v2.2d }, [x27], #32
3124# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3125
3126# CHECK:      [67] Code Region - G68
3127
3128# CHECK:      Iterations:        100
3129# CHECK-NEXT: Instructions:      500
3130# CHECK-NEXT: Total Cycles:      506
3131# CHECK-NEXT: Total uOps:        1000
3132
3133# CHECK:      Dispatch Width:    4
3134# CHECK-NEXT: uOps Per Cycle:    1.98
3135# CHECK-NEXT: IPC:               0.99
3136# CHECK-NEXT: Block RThroughput: 2.5
3137
3138# CHECK:      Timeline view:
3139# CHECK-NEXT:                     0
3140# CHECK-NEXT: Index     0123456789
3141
3142# CHECK:      [0,0]     DeeeeER   .   st2	{ v1.2s, v2.2s }, [x27], #16
3143# CHECK-NEXT: [0,1]     D=eeeeER  .   st2	{ v1.4h, v2.4h }, [x27], #16
3144# CHECK-NEXT: [0,2]     .D=eeeeER .   st2	{ v1.4s, v2.4s }, [x27], #32
3145# CHECK-NEXT: [0,3]     .D==eeeeER.   st2	{ v1.8b, v2.8b }, [x27], #16
3146# CHECK-NEXT: [0,4]     . D==eeeeER   st2	{ v1.8h, v2.8h }, [x27], #32
3147
3148# CHECK:      Average Wait times (based on the timeline view):
3149# CHECK-NEXT: [0]: Executions
3150# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3151# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3152# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3153
3154# CHECK:            [0]    [1]    [2]    [3]
3155# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st2	{ v1.2s, v2.2s }, [x27], #16
3156# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st2	{ v1.4h, v2.4h }, [x27], #16
3157# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st2	{ v1.4s, v2.4s }, [x27], #32
3158# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st2	{ v1.8b, v2.8b }, [x27], #16
3159# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st2	{ v1.8h, v2.8h }, [x27], #32
3160# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3161
3162# CHECK:      [68] Code Region - G69
3163
3164# CHECK:      Iterations:        100
3165# CHECK-NEXT: Instructions:      500
3166# CHECK-NEXT: Total Cycles:      506
3167# CHECK-NEXT: Total uOps:        1000
3168
3169# CHECK:      Dispatch Width:    4
3170# CHECK-NEXT: uOps Per Cycle:    1.98
3171# CHECK-NEXT: IPC:               0.99
3172# CHECK-NEXT: Block RThroughput: 2.5
3173
3174# CHECK:      Timeline view:
3175# CHECK-NEXT:                     0
3176# CHECK-NEXT: Index     0123456789
3177
3178# CHECK:      [0,0]     DeeeeER   .   st2	{ v1.16b, v2.16b }, [x27], #32
3179# CHECK-NEXT: [0,1]     D=eeeeER  .   st2	{ v1.2d, v2.2d }, [x27], x28
3180# CHECK-NEXT: [0,2]     .D=eeeeER .   st2	{ v1.2s, v2.2s }, [x27], x28
3181# CHECK-NEXT: [0,3]     .D==eeeeER.   st2	{ v1.4h, v2.4h }, [x27], x28
3182# CHECK-NEXT: [0,4]     . D==eeeeER   st2	{ v1.4s, v2.4s }, [x27], x28
3183
3184# CHECK:      Average Wait times (based on the timeline view):
3185# CHECK-NEXT: [0]: Executions
3186# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3187# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3188# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3189
3190# CHECK:            [0]    [1]    [2]    [3]
3191# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st2	{ v1.16b, v2.16b }, [x27], #32
3192# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st2	{ v1.2d, v2.2d }, [x27], x28
3193# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st2	{ v1.2s, v2.2s }, [x27], x28
3194# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st2	{ v1.4h, v2.4h }, [x27], x28
3195# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st2	{ v1.4s, v2.4s }, [x27], x28
3196# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3197
3198# CHECK:      [69] Code Region - G70
3199
3200# CHECK:      Iterations:        100
3201# CHECK-NEXT: Instructions:      500
3202# CHECK-NEXT: Total Cycles:      506
3203# CHECK-NEXT: Total uOps:        1000
3204
3205# CHECK:      Dispatch Width:    4
3206# CHECK-NEXT: uOps Per Cycle:    1.98
3207# CHECK-NEXT: IPC:               0.99
3208# CHECK-NEXT: Block RThroughput: 2.5
3209
3210# CHECK:      Timeline view:
3211# CHECK-NEXT:                     0
3212# CHECK-NEXT: Index     0123456789
3213
3214# CHECK:      [0,0]     DeeeeER   .   st2	{ v1.8b, v2.8b }, [x27], x28
3215# CHECK-NEXT: [0,1]     D=eeeeER  .   st2	{ v1.8h, v2.8h }, [x27], x28
3216# CHECK-NEXT: [0,2]     .D=eeeeER .   st2	{ v1.16b, v2.16b }, [x27], x28
3217# CHECK-NEXT: [0,3]     .D==eeeeER.   st2	{ v1.b, v2.b }[0], [x27], #2
3218# CHECK-NEXT: [0,4]     . D==eeeeER   st2	{ v1.b, v2.b }[8], [x27], #2
3219
3220# CHECK:      Average Wait times (based on the timeline view):
3221# CHECK-NEXT: [0]: Executions
3222# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3223# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3224# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3225
3226# CHECK:            [0]    [1]    [2]    [3]
3227# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st2	{ v1.8b, v2.8b }, [x27], x28
3228# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st2	{ v1.8h, v2.8h }, [x27], x28
3229# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st2	{ v1.16b, v2.16b }, [x27], x28
3230# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st2	{ v1.b, v2.b }[0], [x27], #2
3231# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st2	{ v1.b, v2.b }[8], [x27], #2
3232# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3233
3234# CHECK:      [70] Code Region - G71
3235
3236# CHECK:      Iterations:        100
3237# CHECK-NEXT: Instructions:      500
3238# CHECK-NEXT: Total Cycles:      506
3239# CHECK-NEXT: Total uOps:        1000
3240
3241# CHECK:      Dispatch Width:    4
3242# CHECK-NEXT: uOps Per Cycle:    1.98
3243# CHECK-NEXT: IPC:               0.99
3244# CHECK-NEXT: Block RThroughput: 2.5
3245
3246# CHECK:      Timeline view:
3247# CHECK-NEXT:                     0
3248# CHECK-NEXT: Index     0123456789
3249
3250# CHECK:      [0,0]     DeeeeER   .   st2	{ v1.b, v2.b }[0], [x27], x28
3251# CHECK-NEXT: [0,1]     D=eeeeER  .   st2	{ v1.b, v2.b }[8], [x27], x28
3252# CHECK-NEXT: [0,2]     .D=eeeeER .   st2	{ v1.h, v2.h }[0], [x27], #4
3253# CHECK-NEXT: [0,3]     .D==eeeeER.   st2	{ v1.h, v2.h }[4], [x27], #4
3254# CHECK-NEXT: [0,4]     . D==eeeeER   st2	{ v1.h, v2.h }[0], [x27], x28
3255
3256# CHECK:      Average Wait times (based on the timeline view):
3257# CHECK-NEXT: [0]: Executions
3258# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3259# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3260# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3261
3262# CHECK:            [0]    [1]    [2]    [3]
3263# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st2	{ v1.b, v2.b }[0], [x27], x28
3264# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st2	{ v1.b, v2.b }[8], [x27], x28
3265# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st2	{ v1.h, v2.h }[0], [x27], #4
3266# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st2	{ v1.h, v2.h }[4], [x27], #4
3267# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st2	{ v1.h, v2.h }[0], [x27], x28
3268# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3269
3270# CHECK:      [71] Code Region - G72
3271
3272# CHECK:      Iterations:        100
3273# CHECK-NEXT: Instructions:      500
3274# CHECK-NEXT: Total Cycles:      506
3275# CHECK-NEXT: Total uOps:        1000
3276
3277# CHECK:      Dispatch Width:    4
3278# CHECK-NEXT: uOps Per Cycle:    1.98
3279# CHECK-NEXT: IPC:               0.99
3280# CHECK-NEXT: Block RThroughput: 2.5
3281
3282# CHECK:      Timeline view:
3283# CHECK-NEXT:                     0
3284# CHECK-NEXT: Index     0123456789
3285
3286# CHECK:      [0,0]     DeeeeER   .   st2	{ v1.h, v2.h }[4], [x27], x28
3287# CHECK-NEXT: [0,1]     D=eeeeER  .   st2	{ v1.s, v2.s }[0], [x27], #8
3288# CHECK-NEXT: [0,2]     .D=eeeeER .   st2	{ v1.s, v2.s }[0], [x27], x28
3289# CHECK-NEXT: [0,3]     .D==eeeeER.   st2	{ v1.d, v2.d }[0], [x27], #16
3290# CHECK-NEXT: [0,4]     . D==eeeeER   st2	{ v1.d, v2.d }[0], [x27], x28
3291
3292# CHECK:      Average Wait times (based on the timeline view):
3293# CHECK-NEXT: [0]: Executions
3294# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3295# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3296# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3297
3298# CHECK:            [0]    [1]    [2]    [3]
3299# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st2	{ v1.h, v2.h }[4], [x27], x28
3300# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st2	{ v1.s, v2.s }[0], [x27], #8
3301# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st2	{ v1.s, v2.s }[0], [x27], x28
3302# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st2	{ v1.d, v2.d }[0], [x27], #16
3303# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st2	{ v1.d, v2.d }[0], [x27], x28
3304# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3305
3306# CHECK:      [72] Code Region - G73
3307
3308# CHECK:      Iterations:        100
3309# CHECK-NEXT: Instructions:      300
3310# CHECK-NEXT: Total Cycles:      307
3311# CHECK-NEXT: Total uOps:        600
3312
3313# CHECK:      Dispatch Width:    4
3314# CHECK-NEXT: uOps Per Cycle:    1.95
3315# CHECK-NEXT: IPC:               0.98
3316# CHECK-NEXT: Block RThroughput: 1.5
3317
3318# CHECK:      Timeline view:
3319# CHECK-NEXT: Index     0123456789
3320
3321# CHECK:      [0,0]     DeeeeeER .   st3	{ v1.2d, v2.2d, v3.2d }, [x27], #48
3322# CHECK-NEXT: [0,1]     D=eeeeeER.   st3	{ v1.2s, v2.2s, v3.2s }, [x27], #24
3323# CHECK-NEXT: [0,2]     .D=eeeeeER   st3	{ v1.4h, v2.4h, v3.4h }, [x27], #24
3324
3325# CHECK:      Average Wait times (based on the timeline view):
3326# CHECK-NEXT: [0]: Executions
3327# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3328# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3329# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3330
3331# CHECK:            [0]    [1]    [2]    [3]
3332# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st3	{ v1.2d, v2.2d, v3.2d }, [x27], #48
3333# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st3	{ v1.2s, v2.2s, v3.2s }, [x27], #24
3334# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st3	{ v1.4h, v2.4h, v3.4h }, [x27], #24
3335# CHECK-NEXT:        1     1.7    0.3    0.0       <total>
3336
3337# CHECK:      [73] Code Region - G74
3338
3339# CHECK:      Iterations:        100
3340# CHECK-NEXT: Instructions:      500
3341# CHECK-NEXT: Total Cycles:      507
3342# CHECK-NEXT: Total uOps:        1000
3343
3344# CHECK:      Dispatch Width:    4
3345# CHECK-NEXT: uOps Per Cycle:    1.97
3346# CHECK-NEXT: IPC:               0.99
3347# CHECK-NEXT: Block RThroughput: 2.5
3348
3349# CHECK:      Timeline view:
3350# CHECK-NEXT:                     01
3351# CHECK-NEXT: Index     0123456789
3352
3353# CHECK:      [0,0]     DeeeeeER  ..   st3	{ v1.4s, v2.4s, v3.4s }, [x27], #48
3354# CHECK-NEXT: [0,1]     D=eeeeeER ..   st3	{ v1.8b, v2.8b, v3.8b }, [x27], #24
3355# CHECK-NEXT: [0,2]     .D=eeeeeER..   st3	{ v1.8h, v2.8h, v3.8h }, [x27], #48
3356# CHECK-NEXT: [0,3]     .D==eeeeeER.   st3	{ v1.16b, v2.16b, v3.16b }, [x27], #48
3357# CHECK-NEXT: [0,4]     . D==eeeeeER   st3	{ v1.2d, v2.2d, v3.2d }, [x27], x28
3358
3359# CHECK:      Average Wait times (based on the timeline view):
3360# CHECK-NEXT: [0]: Executions
3361# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3362# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3363# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3364
3365# CHECK:            [0]    [1]    [2]    [3]
3366# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st3	{ v1.4s, v2.4s, v3.4s }, [x27], #48
3367# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st3	{ v1.8b, v2.8b, v3.8b }, [x27], #24
3368# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st3	{ v1.8h, v2.8h, v3.8h }, [x27], #48
3369# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st3	{ v1.16b, v2.16b, v3.16b }, [x27], #48
3370# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st3	{ v1.2d, v2.2d, v3.2d }, [x27], x28
3371# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3372
3373# CHECK:      [74] Code Region - G75
3374
3375# CHECK:      Iterations:        100
3376# CHECK-NEXT: Instructions:      500
3377# CHECK-NEXT: Total Cycles:      507
3378# CHECK-NEXT: Total uOps:        1000
3379
3380# CHECK:      Dispatch Width:    4
3381# CHECK-NEXT: uOps Per Cycle:    1.97
3382# CHECK-NEXT: IPC:               0.99
3383# CHECK-NEXT: Block RThroughput: 2.5
3384
3385# CHECK:      Timeline view:
3386# CHECK-NEXT:                     01
3387# CHECK-NEXT: Index     0123456789
3388
3389# CHECK:      [0,0]     DeeeeeER  ..   st3	{ v1.2s, v2.2s, v3.2s }, [x27], x28
3390# CHECK-NEXT: [0,1]     D=eeeeeER ..   st3	{ v1.4h, v2.4h, v3.4h }, [x27], x28
3391# CHECK-NEXT: [0,2]     .D=eeeeeER..   st3	{ v1.4s, v2.4s, v3.4s }, [x27], x28
3392# CHECK-NEXT: [0,3]     .D==eeeeeER.   st3	{ v1.8b, v2.8b, v3.8b }, [x27], x28
3393# CHECK-NEXT: [0,4]     . D==eeeeeER   st3	{ v1.8h, v2.8h, v3.8h }, [x27], x28
3394
3395# CHECK:      Average Wait times (based on the timeline view):
3396# CHECK-NEXT: [0]: Executions
3397# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3398# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3399# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3400
3401# CHECK:            [0]    [1]    [2]    [3]
3402# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st3	{ v1.2s, v2.2s, v3.2s }, [x27], x28
3403# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st3	{ v1.4h, v2.4h, v3.4h }, [x27], x28
3404# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st3	{ v1.4s, v2.4s, v3.4s }, [x27], x28
3405# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st3	{ v1.8b, v2.8b, v3.8b }, [x27], x28
3406# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st3	{ v1.8h, v2.8h, v3.8h }, [x27], x28
3407# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3408
3409# CHECK:      [75] Code Region - G76
3410
3411# CHECK:      Iterations:        100
3412# CHECK-NEXT: Instructions:      500
3413# CHECK-NEXT: Total Cycles:      507
3414# CHECK-NEXT: Total uOps:        1000
3415
3416# CHECK:      Dispatch Width:    4
3417# CHECK-NEXT: uOps Per Cycle:    1.97
3418# CHECK-NEXT: IPC:               0.99
3419# CHECK-NEXT: Block RThroughput: 2.5
3420
3421# CHECK:      Timeline view:
3422# CHECK-NEXT:                     01
3423# CHECK-NEXT: Index     0123456789
3424
3425# CHECK:      [0,0]     DeeeeeER  ..   st3	{ v1.16b, v2.16b, v3.16b }, [x27], x28
3426# CHECK-NEXT: [0,1]     D=eeeeeER ..   st3	{ v1.b, v2.b, v3.b }[0], [x27], #3
3427# CHECK-NEXT: [0,2]     .D=eeeeeER..   st3	{ v1.b, v2.b, v3.b }[8], [x27], #3
3428# CHECK-NEXT: [0,3]     .D==eeeeeER.   st3	{ v1.b, v2.b, v3.b }[0], [x27], x28
3429# CHECK-NEXT: [0,4]     . D==eeeeeER   st3	{ v1.b, v2.b, v3.b }[8], [x27], x28
3430
3431# CHECK:      Average Wait times (based on the timeline view):
3432# CHECK-NEXT: [0]: Executions
3433# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3434# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3435# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3436
3437# CHECK:            [0]    [1]    [2]    [3]
3438# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st3	{ v1.16b, v2.16b, v3.16b }, [x27], x28
3439# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st3	{ v1.b, v2.b, v3.b }[0], [x27], #3
3440# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st3	{ v1.b, v2.b, v3.b }[8], [x27], #3
3441# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st3	{ v1.b, v2.b, v3.b }[0], [x27], x28
3442# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st3	{ v1.b, v2.b, v3.b }[8], [x27], x28
3443# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3444
3445# CHECK:      [76] Code Region - G77
3446
3447# CHECK:      Iterations:        100
3448# CHECK-NEXT: Instructions:      500
3449# CHECK-NEXT: Total Cycles:      507
3450# CHECK-NEXT: Total uOps:        1000
3451
3452# CHECK:      Dispatch Width:    4
3453# CHECK-NEXT: uOps Per Cycle:    1.97
3454# CHECK-NEXT: IPC:               0.99
3455# CHECK-NEXT: Block RThroughput: 2.5
3456
3457# CHECK:      Timeline view:
3458# CHECK-NEXT:                     01
3459# CHECK-NEXT: Index     0123456789
3460
3461# CHECK:      [0,0]     DeeeeeER  ..   st3	{ v1.h, v2.h, v3.h }[0], [x27], #6
3462# CHECK-NEXT: [0,1]     D=eeeeeER ..   st3	{ v1.h, v2.h, v3.h }[4], [x27], #6
3463# CHECK-NEXT: [0,2]     .D=eeeeeER..   st3	{ v1.h, v2.h, v3.h }[0], [x27], x28
3464# CHECK-NEXT: [0,3]     .D==eeeeeER.   st3	{ v1.h, v2.h, v3.h }[4], [x27], x28
3465# CHECK-NEXT: [0,4]     . D==eeeeeER   st3	{ v1.s, v2.s, v3.s }[0], [x27], #12
3466
3467# CHECK:      Average Wait times (based on the timeline view):
3468# CHECK-NEXT: [0]: Executions
3469# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3470# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3471# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3472
3473# CHECK:            [0]    [1]    [2]    [3]
3474# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st3	{ v1.h, v2.h, v3.h }[0], [x27], #6
3475# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st3	{ v1.h, v2.h, v3.h }[4], [x27], #6
3476# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st3	{ v1.h, v2.h, v3.h }[0], [x27], x28
3477# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st3	{ v1.h, v2.h, v3.h }[4], [x27], x28
3478# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st3	{ v1.s, v2.s, v3.s }[0], [x27], #12
3479# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3480
3481# CHECK:      [77] Code Region - G78
3482
3483# CHECK:      Iterations:        100
3484# CHECK-NEXT: Instructions:      500
3485# CHECK-NEXT: Total Cycles:      510
3486# CHECK-NEXT: Total uOps:        1000
3487
3488# CHECK:      Dispatch Width:    4
3489# CHECK-NEXT: uOps Per Cycle:    1.96
3490# CHECK-NEXT: IPC:               0.98
3491# CHECK-NEXT: Block RThroughput: 2.5
3492
3493# CHECK:      Timeline view:
3494# CHECK-NEXT:                     01234
3495# CHECK-NEXT: Index     0123456789
3496
3497# CHECK:      [0,0]     DeeeeeER  .   .   st3	{ v1.s, v2.s, v3.s }[0], [x27], x28
3498# CHECK-NEXT: [0,1]     D=eeeeeER .   .   st3	{ v1.d, v2.d, v3.d }[0], [x27], #24
3499# CHECK-NEXT: [0,2]     .D=eeeeeER.   .   st3	{ v1.d, v2.d, v3.d }[0], [x27], x28
3500# CHECK-NEXT: [0,3]     .D==eeeeeeeeER.   st4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
3501# CHECK-NEXT: [0,4]     . D==eeeeeeeeER   st4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
3502
3503# CHECK:      Average Wait times (based on the timeline view):
3504# CHECK-NEXT: [0]: Executions
3505# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3506# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3507# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3508
3509# CHECK:            [0]    [1]    [2]    [3]
3510# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st3	{ v1.s, v2.s, v3.s }[0], [x27], x28
3511# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st3	{ v1.d, v2.d, v3.d }[0], [x27], #24
3512# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st3	{ v1.d, v2.d, v3.d }[0], [x27], x28
3513# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64
3514# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32
3515# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3516
3517# CHECK:      [78] Code Region - G79
3518
3519# CHECK:      Iterations:        100
3520# CHECK-NEXT: Instructions:      500
3521# CHECK-NEXT: Total Cycles:      510
3522# CHECK-NEXT: Total uOps:        1000
3523
3524# CHECK:      Dispatch Width:    4
3525# CHECK-NEXT: uOps Per Cycle:    1.96
3526# CHECK-NEXT: IPC:               0.98
3527# CHECK-NEXT: Block RThroughput: 2.5
3528
3529# CHECK:      Timeline view:
3530# CHECK-NEXT:                     01234
3531# CHECK-NEXT: Index     0123456789
3532
3533# CHECK:      [0,0]     DeeeeeeeeER   .   st4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
3534# CHECK-NEXT: [0,1]     D=eeeeeeeeER  .   st4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
3535# CHECK-NEXT: [0,2]     .D=eeeeeeeeER .   st4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
3536# CHECK-NEXT: [0,3]     .D==eeeeeeeeER.   st4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
3537# CHECK-NEXT: [0,4]     . D==eeeeeeeeER   st4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
3538
3539# CHECK:      Average Wait times (based on the timeline view):
3540# CHECK-NEXT: [0]: Executions
3541# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3542# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3543# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3544
3545# CHECK:            [0]    [1]    [2]    [3]
3546# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32
3547# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64
3548# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32
3549# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64
3550# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64
3551# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3552
3553# CHECK:      [79] Code Region - G80
3554
3555# CHECK:      Iterations:        100
3556# CHECK-NEXT: Instructions:      500
3557# CHECK-NEXT: Total Cycles:      510
3558# CHECK-NEXT: Total uOps:        1000
3559
3560# CHECK:      Dispatch Width:    4
3561# CHECK-NEXT: uOps Per Cycle:    1.96
3562# CHECK-NEXT: IPC:               0.98
3563# CHECK-NEXT: Block RThroughput: 2.5
3564
3565# CHECK:      Timeline view:
3566# CHECK-NEXT:                     01234
3567# CHECK-NEXT: Index     0123456789
3568
3569# CHECK:      [0,0]     DeeeeeeeeER   .   st4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
3570# CHECK-NEXT: [0,1]     D=eeeeeeeeER  .   st4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
3571# CHECK-NEXT: [0,2]     .D=eeeeeeeeER .   st4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
3572# CHECK-NEXT: [0,3]     .D==eeeeeeeeER.   st4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
3573# CHECK-NEXT: [0,4]     . D==eeeeeeeeER   st4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
3574
3575# CHECK:      Average Wait times (based on the timeline view):
3576# CHECK-NEXT: [0]: Executions
3577# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3578# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3579# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3580
3581# CHECK:            [0]    [1]    [2]    [3]
3582# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st4	{ v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28
3583# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st4	{ v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28
3584# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st4	{ v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28
3585# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st4	{ v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28
3586# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st4	{ v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28
3587# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3588
3589# CHECK:      [80] Code Region - G81
3590
3591# CHECK:      Iterations:        100
3592# CHECK-NEXT: Instructions:      500
3593# CHECK-NEXT: Total Cycles:      508
3594# CHECK-NEXT: Total uOps:        1000
3595
3596# CHECK:      Dispatch Width:    4
3597# CHECK-NEXT: uOps Per Cycle:    1.97
3598# CHECK-NEXT: IPC:               0.98
3599# CHECK-NEXT: Block RThroughput: 2.5
3600
3601# CHECK:      Timeline view:
3602# CHECK-NEXT:                     012
3603# CHECK-NEXT: Index     0123456789
3604
3605# CHECK:      [0,0]     DeeeeeeeeER .   st4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
3606# CHECK-NEXT: [0,1]     D=eeeeeeeeER.   st4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
3607# CHECK-NEXT: [0,2]     .D=eeeeeeE-R.   st4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
3608# CHECK-NEXT: [0,3]     .D==eeeeeeER.   st4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
3609# CHECK-NEXT: [0,4]     . D==eeeeeeER   st4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
3610
3611# CHECK:      Average Wait times (based on the timeline view):
3612# CHECK-NEXT: [0]: Executions
3613# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3614# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3615# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3616
3617# CHECK:            [0]    [1]    [2]    [3]
3618# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st4	{ v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28
3619# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st4	{ v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28
3620# CHECK-NEXT: 2.     1     2.0    0.0    1.0       st4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], #4
3621# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], #4
3622# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st4	{ v1.b, v2.b, v3.b, v4.b }[0], [x27], x28
3623# CHECK-NEXT:        1     2.2    0.2    0.2       <total>
3624
3625# CHECK:      [81] Code Region - G82
3626
3627# CHECK:      Iterations:        100
3628# CHECK-NEXT: Instructions:      500
3629# CHECK-NEXT: Total Cycles:      508
3630# CHECK-NEXT: Total uOps:        1000
3631
3632# CHECK:      Dispatch Width:    4
3633# CHECK-NEXT: uOps Per Cycle:    1.97
3634# CHECK-NEXT: IPC:               0.98
3635# CHECK-NEXT: Block RThroughput: 2.5
3636
3637# CHECK:      Timeline view:
3638# CHECK-NEXT:                     012
3639# CHECK-NEXT: Index     0123456789
3640
3641# CHECK:      [0,0]     DeeeeeeER . .   st4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
3642# CHECK-NEXT: [0,1]     D=eeeeeeER. .   st4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
3643# CHECK-NEXT: [0,2]     .D=eeeeeeER .   st4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
3644# CHECK-NEXT: [0,3]     .D==eeeeeeER.   st4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
3645# CHECK-NEXT: [0,4]     . D==eeeeeeER   st4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
3646
3647# CHECK:      Average Wait times (based on the timeline view):
3648# CHECK-NEXT: [0]: Executions
3649# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3650# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3651# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3652
3653# CHECK:            [0]    [1]    [2]    [3]
3654# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st4	{ v1.b, v2.b, v3.b, v4.b }[8], [x27], x28
3655# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], #8
3656# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], #8
3657# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st4	{ v1.h, v2.h, v3.h, v4.h }[0], [x27], x28
3658# CHECK-NEXT: 4.     1     3.0    0.0    0.0       st4	{ v1.h, v2.h, v3.h, v4.h }[4], [x27], x28
3659# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3660
3661# CHECK:      [82] Code Region - G83
3662
3663# CHECK:      Iterations:        100
3664# CHECK-NEXT: Instructions:      400
3665# CHECK-NEXT: Total Cycles:      408
3666# CHECK-NEXT: Total uOps:        800
3667
3668# CHECK:      Dispatch Width:    4
3669# CHECK-NEXT: uOps Per Cycle:    1.96
3670# CHECK-NEXT: IPC:               0.98
3671# CHECK-NEXT: Block RThroughput: 2.0
3672
3673# CHECK:      Timeline view:
3674# CHECK-NEXT:                     01
3675# CHECK-NEXT: Index     0123456789
3676
3677# CHECK:      [0,0]     DeeeeeeER ..   st4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
3678# CHECK-NEXT: [0,1]     D=eeeeeeER..   st4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
3679# CHECK-NEXT: [0,2]     .D=eeeeeeER.   st4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
3680# CHECK-NEXT: [0,3]     .D==eeeeeeER   st4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
3681
3682# CHECK:      Average Wait times (based on the timeline view):
3683# CHECK-NEXT: [0]: Executions
3684# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3685# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3686# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3687
3688# CHECK:            [0]    [1]    [2]    [3]
3689# CHECK-NEXT: 0.     1     1.0    1.0    0.0       st4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], #16
3690# CHECK-NEXT: 1.     1     2.0    0.0    0.0       st4	{ v1.s, v2.s, v3.s, v4.s }[0], [x27], x28
3691# CHECK-NEXT: 2.     1     2.0    0.0    0.0       st4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], #32
3692# CHECK-NEXT: 3.     1     3.0    0.0    0.0       st4	{ v1.d, v2.d, v3.d, v4.d }[0], [x27], x28
3693# CHECK-NEXT:        1     2.0    0.3    0.0       <total>
3694
3695# CHECK:      [83] Code Region - G84
3696
3697# CHECK:      Iterations:        100
3698# CHECK-NEXT: Instructions:      200
3699# CHECK-NEXT: Total Cycles:      403
3700# CHECK-NEXT: Total uOps:        600
3701
3702# CHECK:      Dispatch Width:    4
3703# CHECK-NEXT: uOps Per Cycle:    1.49
3704# CHECK-NEXT: IPC:               0.50
3705# CHECK-NEXT: Block RThroughput: 4.0
3706
3707# CHECK:      Timeline view:
3708# CHECK-NEXT: Index     0123456
3709
3710# CHECK:      [0,0]     DeeER..   stp	s1, s2, [x27], #248
3711# CHECK-NEXT: [0,1]     .D=eeER   stp	d1, d2, [x27], #496
3712
3713# CHECK:      Average Wait times (based on the timeline view):
3714# CHECK-NEXT: [0]: Executions
3715# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3716# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3717# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3718
3719# CHECK:            [0]    [1]    [2]    [3]
3720# CHECK-NEXT: 0.     1     1.0    1.0    0.0       stp	s1, s2, [x27], #248
3721# CHECK-NEXT: 1.     1     2.0    1.0    0.0       stp	d1, d2, [x27], #496
3722# CHECK-NEXT:        1     1.5    1.0    0.0       <total>
3723
3724# CHECK:      [84] Code Region - G85
3725
3726# CHECK:      Iterations:        100
3727# CHECK-NEXT: Instructions:      500
3728# CHECK-NEXT: Total Cycles:      903
3729# CHECK-NEXT: Total uOps:        1400
3730
3731# CHECK:      Dispatch Width:    4
3732# CHECK-NEXT: uOps Per Cycle:    1.55
3733# CHECK-NEXT: IPC:               0.55
3734# CHECK-NEXT: Block RThroughput: 9.0
3735
3736# CHECK:      Timeline view:
3737# CHECK-NEXT:                     01
3738# CHECK-NEXT: Index     0123456789
3739
3740# CHECK:      [0,0]     DeeER.    ..   stp	q1, q2, [x27], #992
3741# CHECK-NEXT: [0,1]     .D=eeER   ..   stp	s1, s2, [x27, #248]!
3742# CHECK-NEXT: [0,2]     . D==eeER ..   stp	d1, d2, [x27, #496]!
3743# CHECK-NEXT: [0,3]     .  D===eeER.   stp	q1, q2, [x27, #992]!
3744# CHECK-NEXT: [0,4]     .   D====eER   stp	w1, w2, [x27], #248
3745
3746# CHECK:      Average Wait times (based on the timeline view):
3747# CHECK-NEXT: [0]: Executions
3748# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3749# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3750# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3751
3752# CHECK:            [0]    [1]    [2]    [3]
3753# CHECK-NEXT: 0.     1     1.0    1.0    0.0       stp	q1, q2, [x27], #992
3754# CHECK-NEXT: 1.     1     2.0    1.0    0.0       stp	s1, s2, [x27, #248]!
3755# CHECK-NEXT: 2.     1     3.0    1.0    0.0       stp	d1, d2, [x27, #496]!
3756# CHECK-NEXT: 3.     1     4.0    1.0    0.0       stp	q1, q2, [x27, #992]!
3757# CHECK-NEXT: 4.     1     5.0    1.0    0.0       stp	w1, w2, [x27], #248
3758# CHECK-NEXT:        1     3.0    1.0    0.0       <total>
3759
3760# CHECK:      [85] Code Region - G86
3761
3762# CHECK:      Iterations:        100
3763# CHECK-NEXT: Instructions:      500
3764# CHECK-NEXT: Total Cycles:      503
3765# CHECK-NEXT: Total uOps:        1000
3766
3767# CHECK:      Dispatch Width:    4
3768# CHECK-NEXT: uOps Per Cycle:    1.99
3769# CHECK-NEXT: IPC:               0.99
3770# CHECK-NEXT: Block RThroughput: 5.0
3771
3772# CHECK:      Timeline view:
3773# CHECK-NEXT: Index     01234567
3774
3775# CHECK:      [0,0]     DeER . .   stp	x1, x2, [x27], #496
3776# CHECK-NEXT: [0,1]     D=eER. .   stp	w1, w2, [x27, #248]!
3777# CHECK-NEXT: [0,2]     .D=eER .   stp	x1, x2, [x27, #496]!
3778# CHECK-NEXT: [0,3]     .D==eER.   str	b1, [x27], #254
3779# CHECK-NEXT: [0,4]     . D==eER   str	h1, [x27], #254
3780
3781# CHECK:      Average Wait times (based on the timeline view):
3782# CHECK-NEXT: [0]: Executions
3783# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3784# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3785# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3786
3787# CHECK:            [0]    [1]    [2]    [3]
3788# CHECK-NEXT: 0.     1     1.0    1.0    0.0       stp	x1, x2, [x27], #496
3789# CHECK-NEXT: 1.     1     2.0    0.0    0.0       stp	w1, w2, [x27, #248]!
3790# CHECK-NEXT: 2.     1     2.0    0.0    0.0       stp	x1, x2, [x27, #496]!
3791# CHECK-NEXT: 3.     1     3.0    0.0    0.0       str	b1, [x27], #254
3792# CHECK-NEXT: 4.     1     3.0    0.0    0.0       str	h1, [x27], #254
3793# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3794
3795# CHECK:      [86] Code Region - G87
3796
3797# CHECK:      Iterations:        100
3798# CHECK-NEXT: Instructions:      500
3799# CHECK-NEXT: Total Cycles:      503
3800# CHECK-NEXT: Total uOps:        1000
3801
3802# CHECK:      Dispatch Width:    4
3803# CHECK-NEXT: uOps Per Cycle:    1.99
3804# CHECK-NEXT: IPC:               0.99
3805# CHECK-NEXT: Block RThroughput: 5.0
3806
3807# CHECK:      Timeline view:
3808# CHECK-NEXT: Index     01234567
3809
3810# CHECK:      [0,0]     DeER . .   str	s1, [x27], #254
3811# CHECK-NEXT: [0,1]     D=eER. .   str	d1, [x27], #254
3812# CHECK-NEXT: [0,2]     .D=eER .   str	q1, [x27], #254
3813# CHECK-NEXT: [0,3]     .D==eER.   str	b1, [x27, #254]!
3814# CHECK-NEXT: [0,4]     . D==eER   str	h1, [x27, #254]!
3815
3816# CHECK:      Average Wait times (based on the timeline view):
3817# CHECK-NEXT: [0]: Executions
3818# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3819# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3820# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3821
3822# CHECK:            [0]    [1]    [2]    [3]
3823# CHECK-NEXT: 0.     1     1.0    1.0    0.0       str	s1, [x27], #254
3824# CHECK-NEXT: 1.     1     2.0    0.0    0.0       str	d1, [x27], #254
3825# CHECK-NEXT: 2.     1     2.0    0.0    0.0       str	q1, [x27], #254
3826# CHECK-NEXT: 3.     1     3.0    0.0    0.0       str	b1, [x27, #254]!
3827# CHECK-NEXT: 4.     1     3.0    0.0    0.0       str	h1, [x27, #254]!
3828# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3829
3830# CHECK:      [87] Code Region - G88
3831
3832# CHECK:      Iterations:        100
3833# CHECK-NEXT: Instructions:      500
3834# CHECK-NEXT: Total Cycles:      503
3835# CHECK-NEXT: Total uOps:        1000
3836
3837# CHECK:      Dispatch Width:    4
3838# CHECK-NEXT: uOps Per Cycle:    1.99
3839# CHECK-NEXT: IPC:               0.99
3840# CHECK-NEXT: Block RThroughput: 5.0
3841
3842# CHECK:      Timeline view:
3843# CHECK-NEXT: Index     01234567
3844
3845# CHECK:      [0,0]     DeER . .   str	s1, [x27, #254]!
3846# CHECK-NEXT: [0,1]     D=eER. .   str	d1, [x27, #254]!
3847# CHECK-NEXT: [0,2]     .D=eER .   str	q1, [x27, #254]!
3848# CHECK-NEXT: [0,3]     .D==eER.   str	w1, [x27], #254
3849# CHECK-NEXT: [0,4]     . D==eER   str	x1, [x27], #254
3850
3851# CHECK:      Average Wait times (based on the timeline view):
3852# CHECK-NEXT: [0]: Executions
3853# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3854# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3855# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3856
3857# CHECK:            [0]    [1]    [2]    [3]
3858# CHECK-NEXT: 0.     1     1.0    1.0    0.0       str	s1, [x27, #254]!
3859# CHECK-NEXT: 1.     1     2.0    0.0    0.0       str	d1, [x27, #254]!
3860# CHECK-NEXT: 2.     1     2.0    0.0    0.0       str	q1, [x27, #254]!
3861# CHECK-NEXT: 3.     1     3.0    0.0    0.0       str	w1, [x27], #254
3862# CHECK-NEXT: 4.     1     3.0    0.0    0.0       str	x1, [x27], #254
3863# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3864
3865# CHECK:      [88] Code Region - G89
3866
3867# CHECK:      Iterations:        100
3868# CHECK-NEXT: Instructions:      500
3869# CHECK-NEXT: Total Cycles:      503
3870# CHECK-NEXT: Total uOps:        1000
3871
3872# CHECK:      Dispatch Width:    4
3873# CHECK-NEXT: uOps Per Cycle:    1.99
3874# CHECK-NEXT: IPC:               0.99
3875# CHECK-NEXT: Block RThroughput: 5.0
3876
3877# CHECK:      Timeline view:
3878# CHECK-NEXT: Index     01234567
3879
3880# CHECK:      [0,0]     DeER . .   str	w1, [x27, #254]!
3881# CHECK-NEXT: [0,1]     D=eER. .   str	x1, [x27, #254]!
3882# CHECK-NEXT: [0,2]     .D=eER .   strb	w1, [x27], #254
3883# CHECK-NEXT: [0,3]     .D==eER.   strb	w1, [x27, #254]!
3884# CHECK-NEXT: [0,4]     . D==eER   strh	w1, [x27], #254
3885
3886# CHECK:      Average Wait times (based on the timeline view):
3887# CHECK-NEXT: [0]: Executions
3888# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3889# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3890# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3891
3892# CHECK:            [0]    [1]    [2]    [3]
3893# CHECK-NEXT: 0.     1     1.0    1.0    0.0       str	w1, [x27, #254]!
3894# CHECK-NEXT: 1.     1     2.0    0.0    0.0       str	x1, [x27, #254]!
3895# CHECK-NEXT: 2.     1     2.0    0.0    0.0       strb	w1, [x27], #254
3896# CHECK-NEXT: 3.     1     3.0    0.0    0.0       strb	w1, [x27, #254]!
3897# CHECK-NEXT: 4.     1     3.0    0.0    0.0       strh	w1, [x27], #254
3898# CHECK-NEXT:        1     2.2    0.2    0.0       <total>
3899
3900# CHECK:      [89] Code Region - G90
3901
3902# CHECK:      Iterations:        100
3903# CHECK-NEXT: Instructions:      100
3904# CHECK-NEXT: Total Cycles:      103
3905# CHECK-NEXT: Total uOps:        200
3906
3907# CHECK:      Dispatch Width:    4
3908# CHECK-NEXT: uOps Per Cycle:    1.94
3909# CHECK-NEXT: IPC:               0.97
3910# CHECK-NEXT: Block RThroughput: 1.0
3911
3912# CHECK:      Timeline view:
3913# CHECK-NEXT: Index     0123
3914
3915# CHECK:      [0,0]     DeER   strh	w1, [x27, #254]!
3916
3917# CHECK:      Average Wait times (based on the timeline view):
3918# CHECK-NEXT: [0]: Executions
3919# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3920# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3921# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3922
3923# CHECK:            [0]    [1]    [2]    [3]
3924# CHECK-NEXT: 0.     1     1.0    1.0    0.0       strh	w1, [x27, #254]!
3925
3926# CHECK:      [90] Code Region - G91
3927
3928# CHECK:      Iterations:        100
3929# CHECK-NEXT: Instructions:      200
3930# CHECK-NEXT: Total Cycles:      110
3931# CHECK-NEXT: Total uOps:        400
3932
3933# CHECK:      Dispatch Width:    4
3934# CHECK-NEXT: uOps Per Cycle:    3.64
3935# CHECK-NEXT: IPC:               1.82
3936# CHECK-NEXT: Block RThroughput: 1.0
3937
3938# CHECK:      Timeline view:
3939# CHECK-NEXT:                     0
3940# CHECK-NEXT: Index     0123456789
3941
3942# CHECK:      [0,0]     DeeeeER   .   ldr	x1, [x27], #254
3943# CHECK-NEXT: [0,1]     D====eeeeER   ldr	x2, [x1], #254
3944
3945# CHECK:      Average Wait times (based on the timeline view):
3946# CHECK-NEXT: [0]: Executions
3947# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
3948# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
3949# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
3950
3951# CHECK:            [0]    [1]    [2]    [3]
3952# CHECK-NEXT: 0.     1     1.0    1.0    0.0       ldr	x1, [x27], #254
3953# CHECK-NEXT: 1.     1     5.0    0.0    0.0       ldr	x2, [x1], #254
3954# CHECK-NEXT:        1     3.0    0.5    0.0       <total>
3955