1# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py 2# RUN: llvm-mca -mtriple=aarch64 -mcpu=neoverse-v1 --instruction-info=0 --resource-pressure=0 --timeline --timeline-max-iterations=1 < %s | FileCheck %s 3 4# LLVM-MCA-BEGIN G01 5ld1 { v1.1d }, [x27], #8 6add x0, x27, 1 7ld1 { v1.2d }, [x27], #16 8add x0, x27, 1 9ld1 { v1.2s }, [x27], #8 10add x0, x27, 1 11ld1 { v1.4h }, [x27], #8 12add x0, x27, 1 13ld1 { v1.4s }, [x27], #16 14add x0, x27, 1 15# LLVM-MCA-END 16 17# LLVM-MCA-BEGIN G02 18ld1 { v1.8b }, [x27], #8 19add x0, x27, 1 20ld1 { v1.8h }, [x27], #16 21add x0, x27, 1 22ld1 { v1.16b }, [x27], #16 23add x0, x27, 1 24ld1 { v1.1d }, [x27], x28 25add x0, x27, 1 26ld1 { v1.2d }, [x27], x28 27add x0, x27, 1 28# LLVM-MCA-END 29 30# LLVM-MCA-BEGIN G03 31ld1 { v1.2s }, [x27], x28 32add x0, x27, 1 33ld1 { v1.4h }, [x27], x28 34add x0, x27, 1 35ld1 { v1.4s }, [x27], x28 36add x0, x27, 1 37ld1 { v1.8b }, [x27], x28 38add x0, x27, 1 39ld1 { v1.8h }, [x27], x28 40add x0, x27, 1 41# LLVM-MCA-END 42 43# LLVM-MCA-BEGIN G04 44ld1 { v1.16b }, [x27], x28 45add x0, x27, 1 46ld1 { v1.1d, v2.1d }, [x27], #16 47add x0, x27, 1 48ld1 { v1.2d, v2.2d }, [x27], #32 49add x0, x27, 1 50ld1 { v1.2s, v2.2s }, [x27], #16 51add x0, x27, 1 52ld1 { v1.4h, v2.4h }, [x27], #16 53add x0, x27, 1 54# LLVM-MCA-END 55 56# LLVM-MCA-BEGIN G05 57ld1 { v1.4s, v2.4s }, [x27], #32 58add x0, x27, 1 59ld1 { v1.8b, v2.8b }, [x27], #16 60add x0, x27, 1 61ld1 { v1.8h, v2.8h }, [x27], #32 62add x0, x27, 1 63ld1 { v1.16b, v2.16b }, [x27], #32 64add x0, x27, 1 65ld1 { v1.1d, v2.1d }, [x27], x28 66add x0, x27, 1 67# LLVM-MCA-END 68 69# LLVM-MCA-BEGIN G06 70ld1 { v1.2d, v2.2d }, [x27], x28 71add x0, x27, 1 72ld1 { v1.2s, v2.2s }, [x27], x28 73add x0, x27, 1 74ld1 { v1.4h, v2.4h }, [x27], x28 75add x0, x27, 1 76ld1 { v1.4s, v2.4s }, [x27], x28 77add x0, x27, 1 78ld1 { v1.8b, v2.8b }, [x27], x28 79add x0, x27, 1 80# LLVM-MCA-END 81 82# LLVM-MCA-BEGIN G07 83ld1 { v1.8h, v2.8h }, [x27], x28 84add x0, x27, 1 85ld1 { v1.16b, v2.16b }, [x27], x28 86add x0, x27, 1 87ld1 { v1.1d, v2.1d, v3.1d }, [x27], #24 88add x0, x27, 1 89ld1 { v1.2d, v2.2d, v3.2d }, [x27], #48 90add x0, x27, 1 91ld1 { v1.2s, v2.2s, v3.2s }, [x27], #24 92add x0, x27, 1 93# LLVM-MCA-END 94 95# LLVM-MCA-BEGIN G08 96ld1 { v1.4h, v2.4h, v3.4h }, [x27], #24 97add x0, x27, 1 98ld1 { v1.4s, v2.4s, v3.4s }, [x27], #48 99add x0, x27, 1 100ld1 { v1.8b, v2.8b, v3.8b }, [x27], #24 101add x0, x27, 1 102ld1 { v1.8h, v2.8h, v3.8h }, [x27], #48 103add x0, x27, 1 104ld1 { v1.16b, v2.16b, v3.16b }, [x27], #48 105add x0, x27, 1 106# LLVM-MCA-END 107 108# LLVM-MCA-BEGIN G09 109ld1 { v1.1d, v2.1d, v3.1d }, [x27], x28 110add x0, x27, 1 111ld1 { v1.2d, v2.2d, v3.2d }, [x27], x28 112add x0, x27, 1 113ld1 { v1.2s, v2.2s, v3.2s }, [x27], x28 114add x0, x27, 1 115ld1 { v1.4h, v2.4h, v3.4h }, [x27], x28 116add x0, x27, 1 117ld1 { v1.4s, v2.4s, v3.4s }, [x27], x28 118add x0, x27, 1 119# LLVM-MCA-END 120 121# LLVM-MCA-BEGIN G10 122ld1 { v1.8b, v2.8b, v3.8b }, [x27], x28 123add x0, x27, 1 124ld1 { v1.8h, v2.8h, v3.8h }, [x27], x28 125add x0, x27, 1 126ld1 { v1.16b, v2.16b, v3.16b }, [x27], x28 127add x0, x27, 1 128ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 129add x0, x27, 1 130ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 131add x0, x27, 1 132# LLVM-MCA-END 133 134# LLVM-MCA-BEGIN G11 135ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 136add x0, x27, 1 137ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 138add x0, x27, 1 139ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 140add x0, x27, 1 141ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 142add x0, x27, 1 143ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 144add x0, x27, 1 145# LLVM-MCA-END 146 147# LLVM-MCA-BEGIN G12 148ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 149add x0, x27, 1 150ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 151add x0, x27, 1 152ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 153add x0, x27, 1 154ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 155add x0, x27, 1 156ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 157add x0, x27, 1 158# LLVM-MCA-END 159 160# LLVM-MCA-BEGIN G13 161ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 162add x0, x27, 1 163ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 164add x0, x27, 1 165ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 166add x0, x27, 1 167ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 168add x0, x27, 1 169ld1 { v1.b }[0], [x27], #1 170add x0, x27, 1 171# LLVM-MCA-END 172 173# LLVM-MCA-BEGIN G14 174ld1 { v1.b }[8], [x27], #1 175add x0, x27, 1 176ld1 { v1.b }[0], [x27], x28 177add x0, x27, 1 178ld1 { v1.b }[8], [x27], x28 179add x0, x27, 1 180ld1 { v1.h }[0], [x27], #2 181add x0, x27, 1 182ld1 { v1.h }[4], [x27], #2 183add x0, x27, 1 184# LLVM-MCA-END 185 186# LLVM-MCA-BEGIN G15 187ld1 { v1.h }[0], [x27], x28 188add x0, x27, 1 189ld1 { v1.h }[4], [x27], x28 190add x0, x27, 1 191ld1 { v1.s }[0], [x27], #4 192add x0, x27, 1 193ld1 { v1.s }[0], [x27], x28 194add x0, x27, 1 195ld1 { v1.d }[0], [x27], #8 196add x0, x27, 1 197# LLVM-MCA-END 198 199# LLVM-MCA-BEGIN G16 200ld1 { v1.d }[0], [x27], x28 201add x0, x27, 1 202ld1r { v1.1d }, [x27], #8 203add x0, x27, 1 204ld1r { v1.2d }, [x27], #8 205add x0, x27, 1 206ld1r { v1.2s }, [x27], #4 207add x0, x27, 1 208ld1r { v1.4h }, [x27], #2 209add x0, x27, 1 210# LLVM-MCA-END 211 212# LLVM-MCA-BEGIN G17 213ld1r { v1.4s }, [x27], #4 214add x0, x27, 1 215ld1r { v1.8b }, [x27], #1 216add x0, x27, 1 217ld1r { v1.8h }, [x27], #2 218add x0, x27, 1 219ld1r { v1.16b }, [x27], #1 220add x0, x27, 1 221ld1r { v1.1d }, [x27], x28 222add x0, x27, 1 223# LLVM-MCA-END 224 225# LLVM-MCA-BEGIN G18 226ld1r { v1.2d }, [x27], x28 227add x0, x27, 1 228ld1r { v1.2s }, [x27], x28 229add x0, x27, 1 230ld1r { v1.4h }, [x27], x28 231add x0, x27, 1 232ld1r { v1.4s }, [x27], x28 233add x0, x27, 1 234ld1r { v1.8b }, [x27], x28 235add x0, x27, 1 236# LLVM-MCA-END 237 238# LLVM-MCA-BEGIN G19 239ld1r { v1.8h }, [x27], x28 240add x0, x27, 1 241ld1r { v1.16b }, [x27], x28 242add x0, x27, 1 243ld2 { v1.2d, v2.2d }, [x27], #32 244add x0, x27, 1 245ld2 { v1.2s, v2.2s }, [x27], #16 246add x0, x27, 1 247ld2 { v1.4h, v2.4h }, [x27], #16 248add x0, x27, 1 249# LLVM-MCA-END 250 251# LLVM-MCA-BEGIN G20 252ld2 { v1.4s, v2.4s }, [x27], #32 253add x0, x27, 1 254ld2 { v1.8b, v2.8b }, [x27], #16 255add x0, x27, 1 256ld2 { v1.8h, v2.8h }, [x27], #32 257add x0, x27, 1 258ld2 { v1.16b, v2.16b }, [x27], #32 259add x0, x27, 1 260ld2 { v1.2d, v2.2d }, [x27], x28 261add x0, x27, 1 262# LLVM-MCA-END 263 264# LLVM-MCA-BEGIN G21 265ld2 { v1.2s, v2.2s }, [x27], x28 266add x0, x27, 1 267ld2 { v1.4h, v2.4h }, [x27], x28 268add x0, x27, 1 269ld2 { v1.4s, v2.4s }, [x27], x28 270add x0, x27, 1 271ld2 { v1.8b, v2.8b }, [x27], x28 272add x0, x27, 1 273ld2 { v1.8h, v2.8h }, [x27], x28 274add x0, x27, 1 275# LLVM-MCA-END 276 277# LLVM-MCA-BEGIN G22 278ld2 { v1.16b, v2.16b }, [x27], x28 279add x0, x27, 1 280ld2 { v1.b, v2.b }[0], [x27], #2 281add x0, x27, 1 282ld2 { v1.b, v2.b }[8], [x27], #2 283add x0, x27, 1 284ld2 { v1.b, v2.b }[0], [x27], x28 285add x0, x27, 1 286ld2 { v1.b, v2.b }[8], [x27], x28 287add x0, x27, 1 288# LLVM-MCA-END 289 290# LLVM-MCA-BEGIN G23 291ld2 { v1.h, v2.h }[0], [x27], #4 292add x0, x27, 1 293ld2 { v1.h, v2.h }[4], [x27], #4 294add x0, x27, 1 295ld2 { v1.h, v2.h }[0], [x27], x28 296add x0, x27, 1 297ld2 { v1.h, v2.h }[4], [x27], x28 298add x0, x27, 1 299ld2 { v1.s, v2.s }[0], [x27], #8 300add x0, x27, 1 301# LLVM-MCA-END 302 303# LLVM-MCA-BEGIN G24 304ld2 { v1.s, v2.s }[0], [x27], x28 305add x0, x27, 1 306ld2 { v1.d, v2.d }[0], [x27], #16 307add x0, x27, 1 308ld2 { v1.d, v2.d }[0], [x27], x28 309add x0, x27, 1 310ld2r { v1.1d, v2.1d }, [x27], #16 311add x0, x27, 1 312ld2r { v1.2d, v2.2d }, [x27], #16 313add x0, x27, 1 314# LLVM-MCA-END 315 316# LLVM-MCA-BEGIN G25 317ld2r { v1.2s, v2.2s }, [x27], #8 318add x0, x27, 1 319ld2r { v1.4h, v2.4h }, [x27], #4 320add x0, x27, 1 321ld2r { v1.4s, v2.4s }, [x27], #8 322add x0, x27, 1 323ld2r { v1.8b, v2.8b }, [x27], #2 324add x0, x27, 1 325ld2r { v1.8h, v2.8h }, [x27], #4 326add x0, x27, 1 327# LLVM-MCA-END 328 329# LLVM-MCA-BEGIN G26 330ld2r { v1.16b, v2.16b }, [x27], #2 331add x0, x27, 1 332ld2r { v1.1d, v2.1d }, [x27], x28 333add x0, x27, 1 334ld2r { v1.2d, v2.2d }, [x27], x28 335add x0, x27, 1 336ld2r { v1.2s, v2.2s }, [x27], x28 337add x0, x27, 1 338ld2r { v1.4h, v2.4h }, [x27], x28 339add x0, x27, 1 340# LLVM-MCA-END 341 342# LLVM-MCA-BEGIN G27 343ld2r { v1.4s, v2.4s }, [x27], x28 344add x0, x27, 1 345ld2r { v1.8b, v2.8b }, [x27], x28 346add x0, x27, 1 347ld2r { v1.8h, v2.8h }, [x27], x28 348add x0, x27, 1 349ld2r { v1.16b, v2.16b }, [x27], x28 350add x0, x27, 1 351ld3 { v1.2d, v2.2d, v3.2d }, [x27], #48 352add x0, x27, 1 353# LLVM-MCA-END 354 355# LLVM-MCA-BEGIN G28 356ld3 { v1.2s, v2.2s, v3.2s }, [x27], #24 357add x0, x27, 1 358ld3 { v1.4h, v2.4h, v3.4h }, [x27], #24 359add x0, x27, 1 360ld3 { v1.4s, v2.4s, v3.4s }, [x27], #48 361add x0, x27, 1 362ld3 { v1.8b, v2.8b, v3.8b }, [x27], #24 363add x0, x27, 1 364ld3 { v1.8h, v2.8h, v3.8h }, [x27], #48 365add x0, x27, 1 366# LLVM-MCA-END 367 368# LLVM-MCA-BEGIN G29 369ld3 { v1.16b, v2.16b, v3.16b }, [x27], #48 370add x0, x27, 1 371ld3 { v1.2d, v2.2d, v3.2d }, [x27], x28 372add x0, x27, 1 373ld3 { v1.2s, v2.2s, v3.2s }, [x27], x28 374add x0, x27, 1 375ld3 { v1.4h, v2.4h, v3.4h }, [x27], x28 376add x0, x27, 1 377ld3 { v1.4s, v2.4s, v3.4s }, [x27], x28 378add x0, x27, 1 379# LLVM-MCA-END 380 381# LLVM-MCA-BEGIN G30 382ld3 { v1.8b, v2.8b, v3.8b }, [x27], x28 383add x0, x27, 1 384ld3 { v1.8h, v2.8h, v3.8h }, [x27], x28 385add x0, x27, 1 386ld3 { v1.16b, v2.16b, v3.16b }, [x27], x28 387add x0, x27, 1 388ld3 { v1.b, v2.b, v3.b }[0], [x27], #3 389add x0, x27, 1 390ld3 { v1.b, v2.b, v3.b }[8], [x27], #3 391add x0, x27, 1 392# LLVM-MCA-END 393 394# LLVM-MCA-BEGIN G31 395ld3 { v1.b, v2.b, v3.b }[0], [x27], x28 396add x0, x27, 1 397ld3 { v1.b, v2.b, v3.b }[8], [x27], x28 398add x0, x27, 1 399ld3 { v1.h, v2.h, v3.h }[0], [x27], #6 400add x0, x27, 1 401ld3 { v1.h, v2.h, v3.h }[4], [x27], #6 402add x0, x27, 1 403ld3 { v1.h, v2.h, v3.h }[0], [x27], x28 404add x0, x27, 1 405# LLVM-MCA-END 406 407# LLVM-MCA-BEGIN G32 408ld3 { v1.h, v2.h, v3.h }[4], [x27], x28 409add x0, x27, 1 410ld3 { v1.s, v2.s, v3.s }[0], [x27], #12 411add x0, x27, 1 412ld3 { v1.s, v2.s, v3.s }[0], [x27], x28 413add x0, x27, 1 414ld3 { v1.d, v2.d, v3.d }[0], [x27], #24 415add x0, x27, 1 416ld3 { v1.d, v2.d, v3.d }[0], [x27], x28 417add x0, x27, 1 418# LLVM-MCA-END 419 420# LLVM-MCA-BEGIN G33 421ld3r { v1.1d, v2.1d, v3.1d }, [x27], #24 422add x0, x27, 1 423ld3r { v1.2d, v2.2d, v3.2d }, [x27], #24 424add x0, x27, 1 425ld3r { v1.2s, v2.2s, v3.2s }, [x27], #12 426add x0, x27, 1 427ld3r { v1.4h, v2.4h, v3.4h }, [x27], #6 428add x0, x27, 1 429ld3r { v1.4s, v2.4s, v3.4s }, [x27], #12 430add x0, x27, 1 431# LLVM-MCA-END 432 433# LLVM-MCA-BEGIN G34 434ld3r { v1.8b, v2.8b, v3.8b }, [x27], #3 435add x0, x27, 1 436ld3r { v1.8h, v2.8h, v3.8h }, [x27], #6 437add x0, x27, 1 438ld3r { v1.16b, v2.16b, v3.16b }, [x27], #3 439add x0, x27, 1 440ld3r { v1.1d, v2.1d, v3.1d }, [x27], x28 441add x0, x27, 1 442ld3r { v1.2d, v2.2d, v3.2d }, [x27], x28 443add x0, x27, 1 444# LLVM-MCA-END 445 446# LLVM-MCA-BEGIN G35 447ld3r { v1.2s, v2.2s, v3.2s }, [x27], x28 448add x0, x27, 1 449ld3r { v1.4h, v2.4h, v3.4h }, [x27], x28 450add x0, x27, 1 451ld3r { v1.4s, v2.4s, v3.4s }, [x27], x28 452add x0, x27, 1 453ld3r { v1.8b, v2.8b, v3.8b }, [x27], x28 454add x0, x27, 1 455ld3r { v1.8h, v2.8h, v3.8h }, [x27], x28 456add x0, x27, 1 457# LLVM-MCA-END 458 459# LLVM-MCA-BEGIN G36 460ld3r { v1.16b, v2.16b, v3.16b }, [x27], x28 461add x0, x27, 1 462ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 463add x0, x27, 1 464ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 465add x0, x27, 1 466ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 467add x0, x27, 1 468ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 469add x0, x27, 1 470# LLVM-MCA-END 471 472# LLVM-MCA-BEGIN G37 473ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 474add x0, x27, 1 475ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 476add x0, x27, 1 477ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 478add x0, x27, 1 479ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 480add x0, x27, 1 481ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 482add x0, x27, 1 483# LLVM-MCA-END 484 485# LLVM-MCA-BEGIN G38 486ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 487add x0, x27, 1 488ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 489add x0, x27, 1 490ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 491add x0, x27, 1 492ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 493add x0, x27, 1 494ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 495add x0, x27, 1 496# LLVM-MCA-END 497 498# LLVM-MCA-BEGIN G39 499ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 500add x0, x27, 1 501ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 502add x0, x27, 1 503ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 504add x0, x27, 1 505ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 506add x0, x27, 1 507ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 508add x0, x27, 1 509# LLVM-MCA-END 510 511# LLVM-MCA-BEGIN G40 512ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 513add x0, x27, 1 514ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 515add x0, x27, 1 516ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 517add x0, x27, 1 518ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 519add x0, x27, 1 520ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 521add x0, x27, 1 522# LLVM-MCA-END 523 524# LLVM-MCA-BEGIN G41 525ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 526add x0, x27, 1 527ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 528add x0, x27, 1 529ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 530add x0, x27, 1 531ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32 532add x0, x27, 1 533ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16 534add x0, x27, 1 535# LLVM-MCA-END 536 537# LLVM-MCA-BEGIN G42 538ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8 539add x0, x27, 1 540ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16 541add x0, x27, 1 542ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4 543add x0, x27, 1 544ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8 545add x0, x27, 1 546ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4 547add x0, x27, 1 548# LLVM-MCA-END 549 550# LLVM-MCA-BEGIN G43 551ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 552add x0, x27, 1 553ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 554add x0, x27, 1 555ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 556add x0, x27, 1 557ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 558add x0, x27, 1 559ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 560add x0, x27, 1 561# LLVM-MCA-END 562 563# LLVM-MCA-BEGIN G44 564ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 565add x0, x27, 1 566ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 567add x0, x27, 1 568ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 569add x0, x27, 1 570ldp s1, s2, [x27], #248 571add x0, x27, 1 572ldp d1, d2, [x27], #496 573add x0, x27, 1 574# LLVM-MCA-END 575 576# LLVM-MCA-BEGIN G45 577ldp q1, q2, [x27], #992 578add x0, x27, 1 579ldp s1, s2, [x27, #248]! 580add x0, x27, 1 581ldp d1, d2, [x27, #496]! 582add x0, x27, 1 583ldp q1, q2, [x27, #992]! 584add x0, x27, 1 585ldp w1, w2, [x27], #248 586add x0, x27, 1 587# LLVM-MCA-END 588 589# LLVM-MCA-BEGIN G46 590ldp x1, x2, [x27], #496 591add x0, x27, 1 592ldp w1, w2, [x27, #248]! 593add x0, x27, 1 594ldp x1, x2, [x27, #496]! 595add x0, x27, 1 596ldpsw x1, x2, [x27], #248 597add x0, x27, 1 598ldpsw x1, x2, [x27, #248]! 599add x0, x27, 1 600# LLVM-MCA-END 601 602# LLVM-MCA-BEGIN G47 603ldr b1, [x27], #254 604add x0, x27, 1 605ldr h1, [x27], #254 606add x0, x27, 1 607ldr s1, [x27], #254 608add x0, x27, 1 609ldr d1, [x27], #254 610add x0, x27, 1 611ldr q1, [x27], #254 612add x0, x27, 1 613# LLVM-MCA-END 614 615# LLVM-MCA-BEGIN G48 616ldr b1, [x27, #254]! 617add x0, x27, 1 618ldr h1, [x27, #254]! 619add x0, x27, 1 620ldr s1, [x27, #254]! 621add x0, x27, 1 622ldr d1, [x27, #254]! 623add x0, x27, 1 624ldr q1, [x27, #254]! 625add x0, x27, 1 626# LLVM-MCA-END 627 628# LLVM-MCA-BEGIN G49 629ldr w1, [x27], #254 630add x0, x27, 1 631ldr x1, [x27], #254 632add x0, x27, 1 633ldr w1, [x27, #254]! 634add x0, x27, 1 635ldr x1, [x27, #254]! 636add x0, x27, 1 637ldrb w1, [x27], #254 638add x0, x27, 1 639# LLVM-MCA-END 640 641# LLVM-MCA-BEGIN G50 642ldrb w1, [x27, #254]! 643add x0, x27, 1 644ldrh w1, [x27], #254 645add x0, x27, 1 646ldrh w1, [x27, #254]! 647add x0, x27, 1 648ldrsb w1, [x27], #254 649add x0, x27, 1 650ldrsb x1, [x27], #254 651add x0, x27, 1 652# LLVM-MCA-END 653 654# LLVM-MCA-BEGIN G51 655ldrsb w1, [x27, #254]! 656add x0, x27, 1 657ldrsb x1, [x27, #254]! 658add x0, x27, 1 659ldrsh w1, [x27], #254 660add x0, x27, 1 661ldrsh x1, [x27], #254 662add x0, x27, 1 663ldrsh w1, [x27, #254]! 664add x0, x27, 1 665# LLVM-MCA-END 666 667# LLVM-MCA-BEGIN G52 668ldrsh x1, [x27, #254]! 669add x0, x27, 1 670ldrsw x1, [x27], #254 671add x0, x27, 1 672ldrsw x1, [x27, #254]! 673add x0, x27, 1 674st1 { v1.1d }, [x27], #8 675add x0, x27, 1 676st1 { v1.2d }, [x27], #16 677add x0, x27, 1 678# LLVM-MCA-END 679 680# LLVM-MCA-BEGIN G53 681st1 { v1.2s }, [x27], #8 682add x0, x27, 1 683st1 { v1.4h }, [x27], #8 684add x0, x27, 1 685st1 { v1.4s }, [x27], #16 686add x0, x27, 1 687st1 { v1.8b }, [x27], #8 688add x0, x27, 1 689st1 { v1.8h }, [x27], #16 690add x0, x27, 1 691# LLVM-MCA-END 692 693# LLVM-MCA-BEGIN G54 694st1 { v1.16b }, [x27], #16 695add x0, x27, 1 696st1 { v1.1d }, [x27], x28 697add x0, x27, 1 698st1 { v1.2d }, [x27], x28 699add x0, x27, 1 700st1 { v1.2s }, [x27], x28 701add x0, x27, 1 702st1 { v1.4h }, [x27], x28 703add x0, x27, 1 704# LLVM-MCA-END 705 706# LLVM-MCA-BEGIN G55 707st1 { v1.4s }, [x27], x28 708add x0, x27, 1 709st1 { v1.8b }, [x27], x28 710add x0, x27, 1 711st1 { v1.8h }, [x27], x28 712add x0, x27, 1 713st1 { v1.16b }, [x27], x28 714add x0, x27, 1 715st1 { v1.1d, v2.1d }, [x27], #16 716add x0, x27, 1 717# LLVM-MCA-END 718 719# LLVM-MCA-BEGIN G56 720st1 { v1.2d, v2.2d }, [x27], #32 721add x0, x27, 1 722st1 { v1.2s, v2.2s }, [x27], #16 723add x0, x27, 1 724st1 { v1.4h, v2.4h }, [x27], #16 725add x0, x27, 1 726st1 { v1.4s, v2.4s }, [x27], #32 727add x0, x27, 1 728st1 { v1.8b, v2.8b }, [x27], #16 729add x0, x27, 1 730# LLVM-MCA-END 731 732# LLVM-MCA-BEGIN G57 733st1 { v1.8h, v2.8h }, [x27], #32 734add x0, x27, 1 735st1 { v1.16b, v2.16b }, [x27], #32 736add x0, x27, 1 737st1 { v1.1d, v2.1d }, [x27], x28 738add x0, x27, 1 739st1 { v1.2d, v2.2d }, [x27], x28 740add x0, x27, 1 741st1 { v1.2s, v2.2s }, [x27], x28 742add x0, x27, 1 743# LLVM-MCA-END 744 745# LLVM-MCA-BEGIN G58 746st1 { v1.4h, v2.4h }, [x27], x28 747add x0, x27, 1 748st1 { v1.4s, v2.4s }, [x27], x28 749add x0, x27, 1 750st1 { v1.8b, v2.8b }, [x27], x28 751add x0, x27, 1 752st1 { v1.8h, v2.8h }, [x27], x28 753add x0, x27, 1 754st1 { v1.16b, v2.16b }, [x27], x28 755add x0, x27, 1 756# LLVM-MCA-END 757 758# LLVM-MCA-BEGIN G59 759st1 { v1.1d, v2.1d, v3.1d }, [x27], #24 760add x0, x27, 1 761st1 { v1.2d, v2.2d, v3.2d }, [x27], #48 762add x0, x27, 1 763st1 { v1.2s, v2.2s, v3.2s }, [x27], #24 764add x0, x27, 1 765st1 { v1.4h, v2.4h, v3.4h }, [x27], #24 766add x0, x27, 1 767st1 { v1.4s, v2.4s, v3.4s }, [x27], #48 768add x0, x27, 1 769# LLVM-MCA-END 770 771# LLVM-MCA-BEGIN G60 772st1 { v1.8b, v2.8b, v3.8b }, [x27], #24 773add x0, x27, 1 774st1 { v1.8h, v2.8h, v3.8h }, [x27], #48 775add x0, x27, 1 776st1 { v1.16b, v2.16b, v3.16b }, [x27], #48 777add x0, x27, 1 778st1 { v1.1d, v2.1d, v3.1d }, [x27], x28 779add x0, x27, 1 780st1 { v1.2d, v2.2d, v3.2d }, [x27], x28 781add x0, x27, 1 782# LLVM-MCA-END 783 784# LLVM-MCA-BEGIN G61 785st1 { v1.2s, v2.2s, v3.2s }, [x27], x28 786add x0, x27, 1 787st1 { v1.4h, v2.4h, v3.4h }, [x27], x28 788add x0, x27, 1 789st1 { v1.4s, v2.4s, v3.4s }, [x27], x28 790add x0, x27, 1 791st1 { v1.8b, v2.8b, v3.8b }, [x27], x28 792add x0, x27, 1 793st1 { v1.8h, v2.8h, v3.8h }, [x27], x28 794add x0, x27, 1 795# LLVM-MCA-END 796 797# LLVM-MCA-BEGIN G62 798st1 { v1.16b, v2.16b, v3.16b }, [x27], x28 799add x0, x27, 1 800st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 801add x0, x27, 1 802st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 803add x0, x27, 1 804st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 805add x0, x27, 1 806st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 807add x0, x27, 1 808# LLVM-MCA-END 809 810# LLVM-MCA-BEGIN G63 811st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 812add x0, x27, 1 813st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 814add x0, x27, 1 815st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 816add x0, x27, 1 817st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 818add x0, x27, 1 819st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 820add x0, x27, 1 821# LLVM-MCA-END 822 823# LLVM-MCA-BEGIN G64 824st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 825add x0, x27, 1 826st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 827add x0, x27, 1 828st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 829add x0, x27, 1 830st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 831add x0, x27, 1 832st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 833add x0, x27, 1 834# LLVM-MCA-END 835 836# LLVM-MCA-BEGIN G65 837st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 838add x0, x27, 1 839st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 840add x0, x27, 1 841st1 { v1.b }[0], [x27], #1 842add x0, x27, 1 843st1 { v1.b }[8], [x27], #1 844add x0, x27, 1 845st1 { v1.b }[0], [x27], x28 846add x0, x27, 1 847# LLVM-MCA-END 848 849# LLVM-MCA-BEGIN G66 850st1 { v1.b }[8], [x27], x28 851add x0, x27, 1 852st1 { v1.h }[0], [x27], #2 853add x0, x27, 1 854st1 { v1.h }[4], [x27], #2 855add x0, x27, 1 856st1 { v1.h }[0], [x27], x28 857add x0, x27, 1 858st1 { v1.h }[4], [x27], x28 859add x0, x27, 1 860# LLVM-MCA-END 861 862# LLVM-MCA-BEGIN G67 863st1 { v1.s }[0], [x27], #4 864add x0, x27, 1 865st1 { v1.s }[0], [x27], x28 866add x0, x27, 1 867st1 { v1.d }[0], [x27], #8 868add x0, x27, 1 869st1 { v1.d }[0], [x27], x28 870add x0, x27, 1 871st2 { v1.2d, v2.2d }, [x27], #32 872add x0, x27, 1 873# LLVM-MCA-END 874 875# LLVM-MCA-BEGIN G68 876st2 { v1.2s, v2.2s }, [x27], #16 877add x0, x27, 1 878st2 { v1.4h, v2.4h }, [x27], #16 879add x0, x27, 1 880st2 { v1.4s, v2.4s }, [x27], #32 881add x0, x27, 1 882st2 { v1.8b, v2.8b }, [x27], #16 883add x0, x27, 1 884st2 { v1.8h, v2.8h }, [x27], #32 885add x0, x27, 1 886# LLVM-MCA-END 887 888# LLVM-MCA-BEGIN G69 889st2 { v1.16b, v2.16b }, [x27], #32 890add x0, x27, 1 891st2 { v1.2d, v2.2d }, [x27], x28 892add x0, x27, 1 893st2 { v1.2s, v2.2s }, [x27], x28 894add x0, x27, 1 895st2 { v1.4h, v2.4h }, [x27], x28 896add x0, x27, 1 897st2 { v1.4s, v2.4s }, [x27], x28 898add x0, x27, 1 899# LLVM-MCA-END 900 901# LLVM-MCA-BEGIN G70 902st2 { v1.8b, v2.8b }, [x27], x28 903add x0, x27, 1 904st2 { v1.8h, v2.8h }, [x27], x28 905add x0, x27, 1 906st2 { v1.16b, v2.16b }, [x27], x28 907add x0, x27, 1 908st2 { v1.b, v2.b }[0], [x27], #2 909add x0, x27, 1 910st2 { v1.b, v2.b }[8], [x27], #2 911add x0, x27, 1 912# LLVM-MCA-END 913 914# LLVM-MCA-BEGIN G71 915st2 { v1.b, v2.b }[0], [x27], x28 916add x0, x27, 1 917st2 { v1.b, v2.b }[8], [x27], x28 918add x0, x27, 1 919st2 { v1.h, v2.h }[0], [x27], #4 920add x0, x27, 1 921st2 { v1.h, v2.h }[4], [x27], #4 922add x0, x27, 1 923st2 { v1.h, v2.h }[0], [x27], x28 924add x0, x27, 1 925# LLVM-MCA-END 926 927# LLVM-MCA-BEGIN G72 928st2 { v1.h, v2.h }[4], [x27], x28 929add x0, x27, 1 930st2 { v1.s, v2.s }[0], [x27], #8 931add x0, x27, 1 932st2 { v1.s, v2.s }[0], [x27], x28 933add x0, x27, 1 934st2 { v1.d, v2.d }[0], [x27], #16 935add x0, x27, 1 936st2 { v1.d, v2.d }[0], [x27], x28 937add x0, x27, 1 938# LLVM-MCA-END 939 940# LLVM-MCA-BEGIN G73 941st3 { v1.2d, v2.2d, v3.2d }, [x27], #48 942add x0, x27, 1 943st3 { v1.2s, v2.2s, v3.2s }, [x27], #24 944add x0, x27, 1 945st3 { v1.4h, v2.4h, v3.4h }, [x27], #24 946add x0, x27, 1 947# LLVM-MCA-END 948 949# LLVM-MCA-BEGIN G74 950st3 { v1.4s, v2.4s, v3.4s }, [x27], #48 951add x0, x27, 1 952st3 { v1.8b, v2.8b, v3.8b }, [x27], #24 953add x0, x27, 1 954st3 { v1.8h, v2.8h, v3.8h }, [x27], #48 955add x0, x27, 1 956st3 { v1.16b, v2.16b, v3.16b }, [x27], #48 957add x0, x27, 1 958st3 { v1.2d, v2.2d, v3.2d }, [x27], x28 959add x0, x27, 1 960# LLVM-MCA-END 961 962# LLVM-MCA-BEGIN G75 963st3 { v1.2s, v2.2s, v3.2s }, [x27], x28 964add x0, x27, 1 965st3 { v1.4h, v2.4h, v3.4h }, [x27], x28 966add x0, x27, 1 967st3 { v1.4s, v2.4s, v3.4s }, [x27], x28 968add x0, x27, 1 969st3 { v1.8b, v2.8b, v3.8b }, [x27], x28 970add x0, x27, 1 971st3 { v1.8h, v2.8h, v3.8h }, [x27], x28 972add x0, x27, 1 973# LLVM-MCA-END 974 975# LLVM-MCA-BEGIN G76 976st3 { v1.16b, v2.16b, v3.16b }, [x27], x28 977add x0, x27, 1 978st3 { v1.b, v2.b, v3.b }[0], [x27], #3 979add x0, x27, 1 980st3 { v1.b, v2.b, v3.b }[8], [x27], #3 981add x0, x27, 1 982st3 { v1.b, v2.b, v3.b }[0], [x27], x28 983add x0, x27, 1 984st3 { v1.b, v2.b, v3.b }[8], [x27], x28 985add x0, x27, 1 986# LLVM-MCA-END 987 988# LLVM-MCA-BEGIN G77 989st3 { v1.h, v2.h, v3.h }[0], [x27], #6 990add x0, x27, 1 991st3 { v1.h, v2.h, v3.h }[4], [x27], #6 992add x0, x27, 1 993st3 { v1.h, v2.h, v3.h }[0], [x27], x28 994add x0, x27, 1 995st3 { v1.h, v2.h, v3.h }[4], [x27], x28 996add x0, x27, 1 997st3 { v1.s, v2.s, v3.s }[0], [x27], #12 998add x0, x27, 1 999# LLVM-MCA-END 1000 1001# LLVM-MCA-BEGIN G78 1002st3 { v1.s, v2.s, v3.s }[0], [x27], x28 1003add x0, x27, 1 1004st3 { v1.d, v2.d, v3.d }[0], [x27], #24 1005add x0, x27, 1 1006st3 { v1.d, v2.d, v3.d }[0], [x27], x28 1007add x0, x27, 1 1008st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 1009add x0, x27, 1 1010st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 1011add x0, x27, 1 1012# LLVM-MCA-END 1013 1014# LLVM-MCA-BEGIN G79 1015st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 1016add x0, x27, 1 1017st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 1018add x0, x27, 1 1019st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 1020add x0, x27, 1 1021st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 1022add x0, x27, 1 1023st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 1024add x0, x27, 1 1025# LLVM-MCA-END 1026 1027# LLVM-MCA-BEGIN G80 1028st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 1029add x0, x27, 1 1030st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 1031add x0, x27, 1 1032st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 1033add x0, x27, 1 1034st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 1035add x0, x27, 1 1036st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 1037add x0, x27, 1 1038# LLVM-MCA-END 1039 1040# LLVM-MCA-BEGIN G81 1041st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 1042add x0, x27, 1 1043st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 1044add x0, x27, 1 1045st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 1046add x0, x27, 1 1047st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 1048add x0, x27, 1 1049st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 1050add x0, x27, 1 1051# LLVM-MCA-END 1052 1053# LLVM-MCA-BEGIN G82 1054st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 1055add x0, x27, 1 1056st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 1057add x0, x27, 1 1058st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 1059add x0, x27, 1 1060st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 1061add x0, x27, 1 1062st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 1063add x0, x27, 1 1064# LLVM-MCA-END 1065 1066# LLVM-MCA-BEGIN G83 1067st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 1068add x0, x27, 1 1069st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 1070add x0, x27, 1 1071st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 1072add x0, x27, 1 1073st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 1074add x0, x27, 1 1075# LLVM-MCA-END 1076 1077# LLVM-MCA-BEGIN G84 1078stp s1, s2, [x27], #248 1079add x0, x27, 1 1080stp d1, d2, [x27], #496 1081add x0, x27, 1 1082# LLVM-MCA-END 1083 1084# LLVM-MCA-BEGIN G85 1085stp q1, q2, [x27], #992 1086add x0, x27, 1 1087stp s1, s2, [x27, #248]! 1088add x0, x27, 1 1089stp d1, d2, [x27, #496]! 1090add x0, x27, 1 1091stp q1, q2, [x27, #992]! 1092add x0, x27, 1 1093stp w1, w2, [x27], #248 1094add x0, x27, 1 1095# LLVM-MCA-END 1096 1097# LLVM-MCA-BEGIN G86 1098stp x1, x2, [x27], #496 1099add x0, x27, 1 1100stp w1, w2, [x27, #248]! 1101add x0, x27, 1 1102stp x1, x2, [x27, #496]! 1103add x0, x27, 1 1104str b1, [x27], #254 1105add x0, x27, 1 1106str h1, [x27], #254 1107add x0, x27, 1 1108# LLVM-MCA-END 1109 1110# LLVM-MCA-BEGIN G87 1111str s1, [x27], #254 1112add x0, x27, 1 1113str d1, [x27], #254 1114add x0, x27, 1 1115str q1, [x27], #254 1116add x0, x27, 1 1117str b1, [x27, #254]! 1118add x0, x27, 1 1119str h1, [x27, #254]! 1120add x0, x27, 1 1121# LLVM-MCA-END 1122 1123# LLVM-MCA-BEGIN G88 1124str s1, [x27, #254]! 1125add x0, x27, 1 1126str d1, [x27, #254]! 1127add x0, x27, 1 1128str q1, [x27, #254]! 1129add x0, x27, 1 1130str w1, [x27], #254 1131add x0, x27, 1 1132str x1, [x27], #254 1133add x0, x27, 1 1134# LLVM-MCA-END 1135 1136# LLVM-MCA-BEGIN G89 1137str w1, [x27, #254]! 1138add x0, x27, 1 1139str x1, [x27, #254]! 1140add x0, x27, 1 1141strb w1, [x27], #254 1142add x0, x27, 1 1143strb w1, [x27, #254]! 1144add x0, x27, 1 1145strh w1, [x27], #254 1146add x0, x27, 1 1147# LLVM-MCA-END 1148 1149# LLVM-MCA-BEGIN G90 1150strh w1, [x27, #254]! 1151add x0, x27, 1 1152# LLVM-MCA-END 1153 1154# LLVM-MCA-BEGIN G91 1155ldr x1, [x27], #254 1156add x0, x27, 1 1157ldr x2, [x1], #254 1158add x0, x27, 1 1159# LLVM-MCA-END 1160 1161# CHECK: [0] Code Region - G01 1162 1163# CHECK: Iterations: 100 1164# CHECK-NEXT: Instructions: 1000 1165# CHECK-NEXT: Total Cycles: 508 1166# CHECK-NEXT: Total uOps: 1500 1167 1168# CHECK: Dispatch Width: 15 1169# CHECK-NEXT: uOps Per Cycle: 2.95 1170# CHECK-NEXT: IPC: 1.97 1171# CHECK-NEXT: Block RThroughput: 2.5 1172 1173# CHECK: Timeline view: 1174# CHECK-NEXT: 012 1175# CHECK-NEXT: Index 0123456789 1176 1177# CHECK: [0,0] DeeeeeeER . . ld1 { v1.1d }, [x27], #8 1178# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1179# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.2d }, [x27], #16 1180# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1181# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.2s }, [x27], #8 1182# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1183# CHECK-NEXT: [0,6] D===eeeeeeER. ld1 { v1.4h }, [x27], #8 1184# CHECK-NEXT: [0,7] D====eE----R. add x0, x27, #1 1185# CHECK-NEXT: [0,8] D====eeeeeeER ld1 { v1.4s }, [x27], #16 1186# CHECK-NEXT: [0,9] D=====eE----R add x0, x27, #1 1187 1188# CHECK: Average Wait times (based on the timeline view): 1189# CHECK-NEXT: [0]: Executions 1190# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1191# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1192# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1193 1194# CHECK: [0] [1] [2] [3] 1195# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.1d }, [x27], #8 1196# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1197# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.2d }, [x27], #16 1198# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1199# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.2s }, [x27], #8 1200# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1201# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1 { v1.4h }, [x27], #8 1202# CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1 1203# CHECK-NEXT: 8. 1 5.0 0.0 0.0 ld1 { v1.4s }, [x27], #16 1204# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 1205# CHECK-NEXT: 1 3.5 0.1 2.0 <total> 1206 1207# CHECK: [1] Code Region - G02 1208 1209# CHECK: Iterations: 100 1210# CHECK-NEXT: Instructions: 1000 1211# CHECK-NEXT: Total Cycles: 508 1212# CHECK-NEXT: Total uOps: 1500 1213 1214# CHECK: Dispatch Width: 15 1215# CHECK-NEXT: uOps Per Cycle: 2.95 1216# CHECK-NEXT: IPC: 1.97 1217# CHECK-NEXT: Block RThroughput: 2.5 1218 1219# CHECK: Timeline view: 1220# CHECK-NEXT: 012 1221# CHECK-NEXT: Index 0123456789 1222 1223# CHECK: [0,0] DeeeeeeER . . ld1 { v1.8b }, [x27], #8 1224# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1225# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.8h }, [x27], #16 1226# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1227# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.16b }, [x27], #16 1228# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1229# CHECK-NEXT: [0,6] D===eeeeeeER. ld1 { v1.1d }, [x27], x28 1230# CHECK-NEXT: [0,7] D====eE----R. add x0, x27, #1 1231# CHECK-NEXT: [0,8] D====eeeeeeER ld1 { v1.2d }, [x27], x28 1232# CHECK-NEXT: [0,9] D=====eE----R add x0, x27, #1 1233 1234# CHECK: Average Wait times (based on the timeline view): 1235# CHECK-NEXT: [0]: Executions 1236# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1237# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1238# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1239 1240# CHECK: [0] [1] [2] [3] 1241# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8b }, [x27], #8 1242# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1243# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.8h }, [x27], #16 1244# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1245# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.16b }, [x27], #16 1246# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1247# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1 { v1.1d }, [x27], x28 1248# CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1 1249# CHECK-NEXT: 8. 1 5.0 0.0 0.0 ld1 { v1.2d }, [x27], x28 1250# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 1251# CHECK-NEXT: 1 3.5 0.1 2.0 <total> 1252 1253# CHECK: [2] Code Region - G03 1254 1255# CHECK: Iterations: 100 1256# CHECK-NEXT: Instructions: 1000 1257# CHECK-NEXT: Total Cycles: 508 1258# CHECK-NEXT: Total uOps: 1500 1259 1260# CHECK: Dispatch Width: 15 1261# CHECK-NEXT: uOps Per Cycle: 2.95 1262# CHECK-NEXT: IPC: 1.97 1263# CHECK-NEXT: Block RThroughput: 2.5 1264 1265# CHECK: Timeline view: 1266# CHECK-NEXT: 012 1267# CHECK-NEXT: Index 0123456789 1268 1269# CHECK: [0,0] DeeeeeeER . . ld1 { v1.2s }, [x27], x28 1270# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1271# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.4h }, [x27], x28 1272# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1273# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.4s }, [x27], x28 1274# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1275# CHECK-NEXT: [0,6] D===eeeeeeER. ld1 { v1.8b }, [x27], x28 1276# CHECK-NEXT: [0,7] D====eE----R. add x0, x27, #1 1277# CHECK-NEXT: [0,8] D====eeeeeeER ld1 { v1.8h }, [x27], x28 1278# CHECK-NEXT: [0,9] D=====eE----R add x0, x27, #1 1279 1280# CHECK: Average Wait times (based on the timeline view): 1281# CHECK-NEXT: [0]: Executions 1282# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1283# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1284# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1285 1286# CHECK: [0] [1] [2] [3] 1287# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2s }, [x27], x28 1288# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1289# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.4h }, [x27], x28 1290# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1291# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.4s }, [x27], x28 1292# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1293# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1 { v1.8b }, [x27], x28 1294# CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1 1295# CHECK-NEXT: 8. 1 5.0 0.0 0.0 ld1 { v1.8h }, [x27], x28 1296# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 1297# CHECK-NEXT: 1 3.5 0.1 2.0 <total> 1298 1299# CHECK: [3] Code Region - G04 1300 1301# CHECK: Iterations: 100 1302# CHECK-NEXT: Instructions: 1000 1303# CHECK-NEXT: Total Cycles: 508 1304# CHECK-NEXT: Total uOps: 1900 1305 1306# CHECK: Dispatch Width: 15 1307# CHECK-NEXT: uOps Per Cycle: 3.74 1308# CHECK-NEXT: IPC: 1.97 1309# CHECK-NEXT: Block RThroughput: 3.0 1310 1311# CHECK: Timeline view: 1312# CHECK-NEXT: 012 1313# CHECK-NEXT: Index 0123456789 1314 1315# CHECK: [0,0] DeeeeeeER . . ld1 { v1.16b }, [x27], x28 1316# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1317# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.1d, v2.1d }, [x27], #16 1318# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1319# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.2d, v2.2d }, [x27], #32 1320# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1321# CHECK-NEXT: [0,6] D===eeeeeeER. ld1 { v1.2s, v2.2s }, [x27], #16 1322# CHECK-NEXT: [0,7] D====eE----R. add x0, x27, #1 1323# CHECK-NEXT: [0,8] .D===eeeeeeER ld1 { v1.4h, v2.4h }, [x27], #16 1324# CHECK-NEXT: [0,9] .D====eE----R add x0, x27, #1 1325 1326# CHECK: Average Wait times (based on the timeline view): 1327# CHECK-NEXT: [0]: Executions 1328# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1329# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1330# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1331 1332# CHECK: [0] [1] [2] [3] 1333# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.16b }, [x27], x28 1334# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1335# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.1d, v2.1d }, [x27], #16 1336# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1337# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.2d, v2.2d }, [x27], #32 1338# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1339# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1 { v1.2s, v2.2s }, [x27], #16 1340# CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1 1341# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.4h, v2.4h }, [x27], #16 1342# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 1343# CHECK-NEXT: 1 3.3 0.1 2.0 <total> 1344 1345# CHECK: [4] Code Region - G05 1346 1347# CHECK: Iterations: 100 1348# CHECK-NEXT: Instructions: 1000 1349# CHECK-NEXT: Total Cycles: 508 1350# CHECK-NEXT: Total uOps: 2000 1351 1352# CHECK: Dispatch Width: 15 1353# CHECK-NEXT: uOps Per Cycle: 3.94 1354# CHECK-NEXT: IPC: 1.97 1355# CHECK-NEXT: Block RThroughput: 3.3 1356 1357# CHECK: Timeline view: 1358# CHECK-NEXT: 012 1359# CHECK-NEXT: Index 0123456789 1360 1361# CHECK: [0,0] DeeeeeeER . . ld1 { v1.4s, v2.4s }, [x27], #32 1362# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1363# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.8b, v2.8b }, [x27], #16 1364# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1365# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.8h, v2.8h }, [x27], #32 1366# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1367# CHECK-NEXT: [0,6] D===eeeeeeER. ld1 { v1.16b, v2.16b }, [x27], #32 1368# CHECK-NEXT: [0,7] .D===eE----R. add x0, x27, #1 1369# CHECK-NEXT: [0,8] .D===eeeeeeER ld1 { v1.1d, v2.1d }, [x27], x28 1370# CHECK-NEXT: [0,9] .D====eE----R add x0, x27, #1 1371 1372# CHECK: Average Wait times (based on the timeline view): 1373# CHECK-NEXT: [0]: Executions 1374# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1375# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1376# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1377 1378# CHECK: [0] [1] [2] [3] 1379# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s }, [x27], #32 1380# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1381# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.8b, v2.8b }, [x27], #16 1382# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1383# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.8h, v2.8h }, [x27], #32 1384# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1385# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1 { v1.16b, v2.16b }, [x27], #32 1386# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 1387# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.1d, v2.1d }, [x27], x28 1388# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 1389# CHECK-NEXT: 1 3.2 0.1 2.0 <total> 1390 1391# CHECK: [5] Code Region - G06 1392 1393# CHECK: Iterations: 100 1394# CHECK-NEXT: Instructions: 1000 1395# CHECK-NEXT: Total Cycles: 508 1396# CHECK-NEXT: Total uOps: 2000 1397 1398# CHECK: Dispatch Width: 15 1399# CHECK-NEXT: uOps Per Cycle: 3.94 1400# CHECK-NEXT: IPC: 1.97 1401# CHECK-NEXT: Block RThroughput: 3.3 1402 1403# CHECK: Timeline view: 1404# CHECK-NEXT: 012 1405# CHECK-NEXT: Index 0123456789 1406 1407# CHECK: [0,0] DeeeeeeER . . ld1 { v1.2d, v2.2d }, [x27], x28 1408# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1409# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.2s, v2.2s }, [x27], x28 1410# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1411# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.4h, v2.4h }, [x27], x28 1412# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1413# CHECK-NEXT: [0,6] D===eeeeeeER. ld1 { v1.4s, v2.4s }, [x27], x28 1414# CHECK-NEXT: [0,7] .D===eE----R. add x0, x27, #1 1415# CHECK-NEXT: [0,8] .D===eeeeeeER ld1 { v1.8b, v2.8b }, [x27], x28 1416# CHECK-NEXT: [0,9] .D====eE----R add x0, x27, #1 1417 1418# CHECK: Average Wait times (based on the timeline view): 1419# CHECK-NEXT: [0]: Executions 1420# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1421# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1422# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1423 1424# CHECK: [0] [1] [2] [3] 1425# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2d, v2.2d }, [x27], x28 1426# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1427# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.2s, v2.2s }, [x27], x28 1428# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1429# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.4h, v2.4h }, [x27], x28 1430# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1431# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1 { v1.4s, v2.4s }, [x27], x28 1432# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 1433# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.8b, v2.8b }, [x27], x28 1434# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 1435# CHECK-NEXT: 1 3.2 0.1 2.0 <total> 1436 1437# CHECK: [6] Code Region - G07 1438 1439# CHECK: Iterations: 100 1440# CHECK-NEXT: Instructions: 1000 1441# CHECK-NEXT: Total Cycles: 508 1442# CHECK-NEXT: Total uOps: 2300 1443 1444# CHECK: Dispatch Width: 15 1445# CHECK-NEXT: uOps Per Cycle: 4.53 1446# CHECK-NEXT: IPC: 1.97 1447# CHECK-NEXT: Block RThroughput: 4.3 1448 1449# CHECK: Timeline view: 1450# CHECK-NEXT: 012 1451# CHECK-NEXT: Index 0123456789 1452 1453# CHECK: [0,0] DeeeeeeER . . ld1 { v1.8h, v2.8h }, [x27], x28 1454# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1455# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.16b, v2.16b }, [x27], x28 1456# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1457# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.1d, v2.1d, v3.1d }, [x27], #24 1458# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1459# CHECK-NEXT: [0,6] .D==eeeeeeER. ld1 { v1.2d, v2.2d, v3.2d }, [x27], #48 1460# CHECK-NEXT: [0,7] .D===eE----R. add x0, x27, #1 1461# CHECK-NEXT: [0,8] .D===eeeeeeER ld1 { v1.2s, v2.2s, v3.2s }, [x27], #24 1462# CHECK-NEXT: [0,9] .D====eE----R add x0, x27, #1 1463 1464# CHECK: Average Wait times (based on the timeline view): 1465# CHECK-NEXT: [0]: Executions 1466# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1467# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1468# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1469 1470# CHECK: [0] [1] [2] [3] 1471# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8h, v2.8h }, [x27], x28 1472# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1473# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.16b, v2.16b }, [x27], x28 1474# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1475# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.1d, v2.1d, v3.1d }, [x27], #24 1476# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1477# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld1 { v1.2d, v2.2d, v3.2d }, [x27], #48 1478# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 1479# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.2s, v2.2s, v3.2s }, [x27], #24 1480# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 1481# CHECK-NEXT: 1 3.1 0.1 2.0 <total> 1482 1483# CHECK: [7] Code Region - G08 1484 1485# CHECK: Iterations: 100 1486# CHECK-NEXT: Instructions: 1000 1487# CHECK-NEXT: Total Cycles: 508 1488# CHECK-NEXT: Total uOps: 2500 1489 1490# CHECK: Dispatch Width: 15 1491# CHECK-NEXT: uOps Per Cycle: 4.92 1492# CHECK-NEXT: IPC: 1.97 1493# CHECK-NEXT: Block RThroughput: 5.0 1494 1495# CHECK: Timeline view: 1496# CHECK-NEXT: 012 1497# CHECK-NEXT: Index 0123456789 1498 1499# CHECK: [0,0] DeeeeeeER . . ld1 { v1.4h, v2.4h, v3.4h }, [x27], #24 1500# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1501# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.4s, v2.4s, v3.4s }, [x27], #48 1502# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1503# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.8b, v2.8b, v3.8b }, [x27], #24 1504# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1505# CHECK-NEXT: [0,6] .D==eeeeeeER. ld1 { v1.8h, v2.8h, v3.8h }, [x27], #48 1506# CHECK-NEXT: [0,7] .D===eE----R. add x0, x27, #1 1507# CHECK-NEXT: [0,8] .D===eeeeeeER ld1 { v1.16b, v2.16b, v3.16b }, [x27], #48 1508# CHECK-NEXT: [0,9] .D====eE----R add x0, x27, #1 1509 1510# CHECK: Average Wait times (based on the timeline view): 1511# CHECK-NEXT: [0]: Executions 1512# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1513# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1514# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1515 1516# CHECK: [0] [1] [2] [3] 1517# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h }, [x27], #24 1518# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1519# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.4s, v2.4s, v3.4s }, [x27], #48 1520# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1521# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.8b, v2.8b, v3.8b }, [x27], #24 1522# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1523# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld1 { v1.8h, v2.8h, v3.8h }, [x27], #48 1524# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 1525# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.16b, v2.16b, v3.16b }, [x27], #48 1526# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 1527# CHECK-NEXT: 1 3.1 0.1 2.0 <total> 1528 1529# CHECK: [8] Code Region - G09 1530 1531# CHECK: Iterations: 100 1532# CHECK-NEXT: Instructions: 1000 1533# CHECK-NEXT: Total Cycles: 508 1534# CHECK-NEXT: Total uOps: 2500 1535 1536# CHECK: Dispatch Width: 15 1537# CHECK-NEXT: uOps Per Cycle: 4.92 1538# CHECK-NEXT: IPC: 1.97 1539# CHECK-NEXT: Block RThroughput: 5.0 1540 1541# CHECK: Timeline view: 1542# CHECK-NEXT: 012 1543# CHECK-NEXT: Index 0123456789 1544 1545# CHECK: [0,0] DeeeeeeER . . ld1 { v1.1d, v2.1d, v3.1d }, [x27], x28 1546# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1547# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.2d, v2.2d, v3.2d }, [x27], x28 1548# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1549# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.2s, v2.2s, v3.2s }, [x27], x28 1550# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1551# CHECK-NEXT: [0,6] .D==eeeeeeER. ld1 { v1.4h, v2.4h, v3.4h }, [x27], x28 1552# CHECK-NEXT: [0,7] .D===eE----R. add x0, x27, #1 1553# CHECK-NEXT: [0,8] .D===eeeeeeER ld1 { v1.4s, v2.4s, v3.4s }, [x27], x28 1554# CHECK-NEXT: [0,9] .D====eE----R add x0, x27, #1 1555 1556# CHECK: Average Wait times (based on the timeline view): 1557# CHECK-NEXT: [0]: Executions 1558# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1559# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1560# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1561 1562# CHECK: [0] [1] [2] [3] 1563# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.1d, v2.1d, v3.1d }, [x27], x28 1564# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1565# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.2d, v2.2d, v3.2d }, [x27], x28 1566# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1567# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.2s, v2.2s, v3.2s }, [x27], x28 1568# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1569# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld1 { v1.4h, v2.4h, v3.4h }, [x27], x28 1570# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 1571# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.4s, v2.4s, v3.4s }, [x27], x28 1572# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 1573# CHECK-NEXT: 1 3.1 0.1 2.0 <total> 1574 1575# CHECK: [9] Code Region - G10 1576 1577# CHECK: Iterations: 100 1578# CHECK-NEXT: Instructions: 1000 1579# CHECK-NEXT: Total Cycles: 608 1580# CHECK-NEXT: Total uOps: 2500 1581 1582# CHECK: Dispatch Width: 15 1583# CHECK-NEXT: uOps Per Cycle: 4.11 1584# CHECK-NEXT: IPC: 1.64 1585# CHECK-NEXT: Block RThroughput: 5.0 1586 1587# CHECK: Timeline view: 1588# CHECK-NEXT: 0123 1589# CHECK-NEXT: Index 0123456789 1590 1591# CHECK: [0,0] DeeeeeeER . . ld1 { v1.8b, v2.8b, v3.8b }, [x27], x28 1592# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1593# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.8h, v2.8h, v3.8h }, [x27], x28 1594# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1595# CHECK-NEXT: [0,4] D==eeeeeeER . ld1 { v1.16b, v2.16b, v3.16b }, [x27], x28 1596# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 1597# CHECK-NEXT: [0,6] .D==eeeeeeER . ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 1598# CHECK-NEXT: [0,7] .D===eE----R . add x0, x27, #1 1599# CHECK-NEXT: [0,8] .D===eeeeeeeER ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 1600# CHECK-NEXT: [0,9] .D====eE-----R add x0, x27, #1 1601 1602# CHECK: Average Wait times (based on the timeline view): 1603# CHECK-NEXT: [0]: Executions 1604# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1605# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1606# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1607 1608# CHECK: [0] [1] [2] [3] 1609# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8b, v2.8b, v3.8b }, [x27], x28 1610# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1611# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.8h, v2.8h, v3.8h }, [x27], x28 1612# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1613# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.16b, v2.16b, v3.16b }, [x27], x28 1614# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 1615# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 1616# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 1617# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 1618# CHECK-NEXT: 9. 1 5.0 0.0 5.0 add x0, x27, #1 1619# CHECK-NEXT: 1 3.1 0.1 2.1 <total> 1620 1621# CHECK: [10] Code Region - G11 1622 1623# CHECK: Iterations: 100 1624# CHECK-NEXT: Instructions: 1000 1625# CHECK-NEXT: Total Cycles: 509 1626# CHECK-NEXT: Total uOps: 2400 1627 1628# CHECK: Dispatch Width: 15 1629# CHECK-NEXT: uOps Per Cycle: 4.72 1630# CHECK-NEXT: IPC: 1.96 1631# CHECK-NEXT: Block RThroughput: 4.7 1632 1633# CHECK: Timeline view: 1634# CHECK-NEXT: 0123 1635# CHECK-NEXT: Index 0123456789 1636 1637# CHECK: [0,0] DeeeeeeER . . ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 1638# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 1639# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 1640# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1641# CHECK-NEXT: [0,4] D==eeeeeeeER . ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 1642# CHECK-NEXT: [0,5] D===eE-----R . add x0, x27, #1 1643# CHECK-NEXT: [0,6] .D==eeeeeeER . ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 1644# CHECK-NEXT: [0,7] .D===eE----R . add x0, x27, #1 1645# CHECK-NEXT: [0,8] .D===eeeeeeeER ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 1646# CHECK-NEXT: [0,9] .D====eE-----R add x0, x27, #1 1647 1648# CHECK: Average Wait times (based on the timeline view): 1649# CHECK-NEXT: [0]: Executions 1650# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1651# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1652# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1653 1654# CHECK: [0] [1] [2] [3] 1655# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 1656# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 1657# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 1658# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1659# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 1660# CHECK-NEXT: 5. 1 4.0 0.0 5.0 add x0, x27, #1 1661# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 1662# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 1663# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 1664# CHECK-NEXT: 9. 1 5.0 0.0 5.0 add x0, x27, #1 1665# CHECK-NEXT: 1 3.1 0.1 2.2 <total> 1666 1667# CHECK: [11] Code Region - G12 1668 1669# CHECK: Iterations: 100 1670# CHECK-NEXT: Instructions: 1000 1671# CHECK-NEXT: Total Cycles: 508 1672# CHECK-NEXT: Total uOps: 2400 1673 1674# CHECK: Dispatch Width: 15 1675# CHECK-NEXT: uOps Per Cycle: 4.72 1676# CHECK-NEXT: IPC: 1.97 1677# CHECK-NEXT: Block RThroughput: 4.7 1678 1679# CHECK: Timeline view: 1680# CHECK-NEXT: 012 1681# CHECK-NEXT: Index 0123456789 1682 1683# CHECK: [0,0] DeeeeeeeER. . ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 1684# CHECK-NEXT: [0,1] D=eE-----R. . add x0, x27, #1 1685# CHECK-NEXT: [0,2] D=eeeeeeER. . ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 1686# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 1687# CHECK-NEXT: [0,4] D==eeeeeeeER. ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 1688# CHECK-NEXT: [0,5] .D==eE-----R. add x0, x27, #1 1689# CHECK-NEXT: [0,6] .D==eeeeeeER. ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 1690# CHECK-NEXT: [0,7] .D===eE----R. add x0, x27, #1 1691# CHECK-NEXT: [0,8] .D===eeeeeeER ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 1692# CHECK-NEXT: [0,9] .D====eE----R add x0, x27, #1 1693 1694# CHECK: Average Wait times (based on the timeline view): 1695# CHECK-NEXT: [0]: Executions 1696# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1697# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1698# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1699 1700# CHECK: [0] [1] [2] [3] 1701# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 1702# CHECK-NEXT: 1. 1 2.0 0.0 5.0 add x0, x27, #1 1703# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 1704# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1705# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 1706# CHECK-NEXT: 5. 1 3.0 0.0 5.0 add x0, x27, #1 1707# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 1708# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 1709# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 1710# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 1711# CHECK-NEXT: 1 3.0 0.1 2.2 <total> 1712 1713# CHECK: [12] Code Region - G13 1714 1715# CHECK: Iterations: 100 1716# CHECK-NEXT: Instructions: 1000 1717# CHECK-NEXT: Total Cycles: 1110 1718# CHECK-NEXT: Total uOps: 2600 1719 1720# CHECK: Dispatch Width: 15 1721# CHECK-NEXT: uOps Per Cycle: 2.34 1722# CHECK-NEXT: IPC: 0.90 1723# CHECK-NEXT: Block RThroughput: 5.0 1724 1725# CHECK: Timeline view: 1726# CHECK-NEXT: 0123456789 1727# CHECK-NEXT: Index 0123456789 0 1728 1729# CHECK: [0,0] DeeeeeeeER. . . ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 1730# CHECK-NEXT: [0,1] D=eE-----R. . . add x0, x27, #1 1731# CHECK-NEXT: [0,2] D=eeeeeeER. . . ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 1732# CHECK-NEXT: [0,3] D==eE----R. . . add x0, x27, #1 1733# CHECK-NEXT: [0,4] D==eeeeeeeER . . ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 1734# CHECK-NEXT: [0,5] .D==eE-----R . . add x0, x27, #1 1735# CHECK-NEXT: [0,6] .D==eeeeeeeER . . ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 1736# CHECK-NEXT: [0,7] .D===eE-----R . . add x0, x27, #1 1737# CHECK-NEXT: [0,8] .D=========eeeeeeeeER ld1 { v1.b }[0], [x27], #1 1738# CHECK-NEXT: [0,9] .D==========eE------R add x0, x27, #1 1739 1740# CHECK: Average Wait times (based on the timeline view): 1741# CHECK-NEXT: [0]: Executions 1742# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1743# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1744# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1745 1746# CHECK: [0] [1] [2] [3] 1747# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 1748# CHECK-NEXT: 1. 1 2.0 0.0 5.0 add x0, x27, #1 1749# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 1750# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1751# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 1752# CHECK-NEXT: 5. 1 3.0 0.0 5.0 add x0, x27, #1 1753# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 1754# CHECK-NEXT: 7. 1 4.0 0.0 5.0 add x0, x27, #1 1755# CHECK-NEXT: 8. 1 10.0 0.0 0.0 ld1 { v1.b }[0], [x27], #1 1756# CHECK-NEXT: 9. 1 11.0 0.0 6.0 add x0, x27, #1 1757# CHECK-NEXT: 1 4.2 0.1 2.5 <total> 1758 1759# CHECK: [13] Code Region - G14 1760 1761# CHECK: Iterations: 100 1762# CHECK-NEXT: Instructions: 1000 1763# CHECK-NEXT: Total Cycles: 4003 1764# CHECK-NEXT: Total uOps: 2000 1765 1766# CHECK: Dispatch Width: 15 1767# CHECK-NEXT: uOps Per Cycle: 0.50 1768# CHECK-NEXT: IPC: 0.25 1769# CHECK-NEXT: Block RThroughput: 2.5 1770 1771# CHECK: Timeline view: 1772# CHECK-NEXT: 0123456789 0123456789 1773# CHECK-NEXT: Index 0123456789 0123456789 012 1774 1775# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld1 { v1.b }[8], [x27], #1 1776# CHECK-NEXT: [0,1] D=eE------R . . . . . . . add x0, x27, #1 1777# CHECK-NEXT: [0,2] D========eeeeeeeeER . . . . . . ld1 { v1.b }[0], [x27], x28 1778# CHECK-NEXT: [0,3] D=========eE------R . . . . . . add x0, x27, #1 1779# CHECK-NEXT: [0,4] D================eeeeeeeeER . . . . ld1 { v1.b }[8], [x27], x28 1780# CHECK-NEXT: [0,5] D=================eE------R . . . . add x0, x27, #1 1781# CHECK-NEXT: [0,6] D========================eeeeeeeeER. . . ld1 { v1.h }[0], [x27], #2 1782# CHECK-NEXT: [0,7] .D========================eE------R. . . add x0, x27, #1 1783# CHECK-NEXT: [0,8] .D===============================eeeeeeeeER ld1 { v1.h }[4], [x27], #2 1784# CHECK-NEXT: [0,9] .D================================eE------R add x0, x27, #1 1785 1786# CHECK: Average Wait times (based on the timeline view): 1787# CHECK-NEXT: [0]: Executions 1788# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1789# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1790# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1791 1792# CHECK: [0] [1] [2] [3] 1793# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.b }[8], [x27], #1 1794# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 1795# CHECK-NEXT: 2. 1 9.0 0.0 0.0 ld1 { v1.b }[0], [x27], x28 1796# CHECK-NEXT: 3. 1 10.0 0.0 6.0 add x0, x27, #1 1797# CHECK-NEXT: 4. 1 17.0 0.0 0.0 ld1 { v1.b }[8], [x27], x28 1798# CHECK-NEXT: 5. 1 18.0 0.0 6.0 add x0, x27, #1 1799# CHECK-NEXT: 6. 1 25.0 0.0 0.0 ld1 { v1.h }[0], [x27], #2 1800# CHECK-NEXT: 7. 1 25.0 0.0 6.0 add x0, x27, #1 1801# CHECK-NEXT: 8. 1 32.0 0.0 0.0 ld1 { v1.h }[4], [x27], #2 1802# CHECK-NEXT: 9. 1 33.0 0.0 6.0 add x0, x27, #1 1803# CHECK-NEXT: 1 17.2 0.1 3.0 <total> 1804 1805# CHECK: [14] Code Region - G15 1806 1807# CHECK: Iterations: 100 1808# CHECK-NEXT: Instructions: 1000 1809# CHECK-NEXT: Total Cycles: 4003 1810# CHECK-NEXT: Total uOps: 2000 1811 1812# CHECK: Dispatch Width: 15 1813# CHECK-NEXT: uOps Per Cycle: 0.50 1814# CHECK-NEXT: IPC: 0.25 1815# CHECK-NEXT: Block RThroughput: 2.5 1816 1817# CHECK: Timeline view: 1818# CHECK-NEXT: 0123456789 0123456789 1819# CHECK-NEXT: Index 0123456789 0123456789 012 1820 1821# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld1 { v1.h }[0], [x27], x28 1822# CHECK-NEXT: [0,1] D=eE------R . . . . . . . add x0, x27, #1 1823# CHECK-NEXT: [0,2] D========eeeeeeeeER . . . . . . ld1 { v1.h }[4], [x27], x28 1824# CHECK-NEXT: [0,3] D=========eE------R . . . . . . add x0, x27, #1 1825# CHECK-NEXT: [0,4] D================eeeeeeeeER . . . . ld1 { v1.s }[0], [x27], #4 1826# CHECK-NEXT: [0,5] D=================eE------R . . . . add x0, x27, #1 1827# CHECK-NEXT: [0,6] D========================eeeeeeeeER. . . ld1 { v1.s }[0], [x27], x28 1828# CHECK-NEXT: [0,7] .D========================eE------R. . . add x0, x27, #1 1829# CHECK-NEXT: [0,8] .D===============================eeeeeeeeER ld1 { v1.d }[0], [x27], #8 1830# CHECK-NEXT: [0,9] .D================================eE------R add x0, x27, #1 1831 1832# CHECK: Average Wait times (based on the timeline view): 1833# CHECK-NEXT: [0]: Executions 1834# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1835# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1836# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1837 1838# CHECK: [0] [1] [2] [3] 1839# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.h }[0], [x27], x28 1840# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 1841# CHECK-NEXT: 2. 1 9.0 0.0 0.0 ld1 { v1.h }[4], [x27], x28 1842# CHECK-NEXT: 3. 1 10.0 0.0 6.0 add x0, x27, #1 1843# CHECK-NEXT: 4. 1 17.0 0.0 0.0 ld1 { v1.s }[0], [x27], #4 1844# CHECK-NEXT: 5. 1 18.0 0.0 6.0 add x0, x27, #1 1845# CHECK-NEXT: 6. 1 25.0 0.0 0.0 ld1 { v1.s }[0], [x27], x28 1846# CHECK-NEXT: 7. 1 25.0 0.0 6.0 add x0, x27, #1 1847# CHECK-NEXT: 8. 1 32.0 0.0 0.0 ld1 { v1.d }[0], [x27], #8 1848# CHECK-NEXT: 9. 1 33.0 0.0 6.0 add x0, x27, #1 1849# CHECK-NEXT: 1 17.2 0.1 3.0 <total> 1850 1851# CHECK: [15] Code Region - G16 1852 1853# CHECK: Iterations: 100 1854# CHECK-NEXT: Instructions: 1000 1855# CHECK-NEXT: Total Cycles: 1203 1856# CHECK-NEXT: Total uOps: 2000 1857 1858# CHECK: Dispatch Width: 15 1859# CHECK-NEXT: uOps Per Cycle: 1.66 1860# CHECK-NEXT: IPC: 0.83 1861# CHECK-NEXT: Block RThroughput: 2.5 1862 1863# CHECK: Timeline view: 1864# CHECK-NEXT: 01234 1865# CHECK-NEXT: Index 0123456789 1866 1867# CHECK: [0,0] DeeeeeeeeER . ld1 { v1.d }[0], [x27], x28 1868# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 1869# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld1r { v1.1d }, [x27], #8 1870# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 1871# CHECK-NEXT: [0,4] D==eeeeeeeeER . ld1r { v1.2d }, [x27], #8 1872# CHECK-NEXT: [0,5] D===eE------R . add x0, x27, #1 1873# CHECK-NEXT: [0,6] D===eeeeeeeeER. ld1r { v1.2s }, [x27], #4 1874# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 1875# CHECK-NEXT: [0,8] .D===eeeeeeeeER ld1r { v1.4h }, [x27], #2 1876# CHECK-NEXT: [0,9] .D====eE------R add x0, x27, #1 1877 1878# CHECK: Average Wait times (based on the timeline view): 1879# CHECK-NEXT: [0]: Executions 1880# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1881# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1882# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1883 1884# CHECK: [0] [1] [2] [3] 1885# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.d }[0], [x27], x28 1886# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 1887# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1r { v1.1d }, [x27], #8 1888# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 1889# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1r { v1.2d }, [x27], #8 1890# CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1 1891# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1r { v1.2s }, [x27], #4 1892# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 1893# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1r { v1.4h }, [x27], #2 1894# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 1895# CHECK-NEXT: 1 3.2 0.1 3.0 <total> 1896 1897# CHECK: [16] Code Region - G17 1898 1899# CHECK: Iterations: 100 1900# CHECK-NEXT: Instructions: 1000 1901# CHECK-NEXT: Total Cycles: 510 1902# CHECK-NEXT: Total uOps: 2000 1903 1904# CHECK: Dispatch Width: 15 1905# CHECK-NEXT: uOps Per Cycle: 3.92 1906# CHECK-NEXT: IPC: 1.96 1907# CHECK-NEXT: Block RThroughput: 2.5 1908 1909# CHECK: Timeline view: 1910# CHECK-NEXT: 01234 1911# CHECK-NEXT: Index 0123456789 1912 1913# CHECK: [0,0] DeeeeeeeeER . ld1r { v1.4s }, [x27], #4 1914# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 1915# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld1r { v1.8b }, [x27], #1 1916# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 1917# CHECK-NEXT: [0,4] D==eeeeeeeeER . ld1r { v1.8h }, [x27], #2 1918# CHECK-NEXT: [0,5] D===eE------R . add x0, x27, #1 1919# CHECK-NEXT: [0,6] D===eeeeeeeeER. ld1r { v1.16b }, [x27], #1 1920# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 1921# CHECK-NEXT: [0,8] .D===eeeeeeeeER ld1r { v1.1d }, [x27], x28 1922# CHECK-NEXT: [0,9] .D====eE------R add x0, x27, #1 1923 1924# CHECK: Average Wait times (based on the timeline view): 1925# CHECK-NEXT: [0]: Executions 1926# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1927# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1928# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1929 1930# CHECK: [0] [1] [2] [3] 1931# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.4s }, [x27], #4 1932# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 1933# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1r { v1.8b }, [x27], #1 1934# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 1935# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1r { v1.8h }, [x27], #2 1936# CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1 1937# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1r { v1.16b }, [x27], #1 1938# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 1939# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1r { v1.1d }, [x27], x28 1940# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 1941# CHECK-NEXT: 1 3.2 0.1 3.0 <total> 1942 1943# CHECK: [17] Code Region - G18 1944 1945# CHECK: Iterations: 100 1946# CHECK-NEXT: Instructions: 1000 1947# CHECK-NEXT: Total Cycles: 510 1948# CHECK-NEXT: Total uOps: 2000 1949 1950# CHECK: Dispatch Width: 15 1951# CHECK-NEXT: uOps Per Cycle: 3.92 1952# CHECK-NEXT: IPC: 1.96 1953# CHECK-NEXT: Block RThroughput: 2.5 1954 1955# CHECK: Timeline view: 1956# CHECK-NEXT: 01234 1957# CHECK-NEXT: Index 0123456789 1958 1959# CHECK: [0,0] DeeeeeeeeER . ld1r { v1.2d }, [x27], x28 1960# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 1961# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld1r { v1.2s }, [x27], x28 1962# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 1963# CHECK-NEXT: [0,4] D==eeeeeeeeER . ld1r { v1.4h }, [x27], x28 1964# CHECK-NEXT: [0,5] D===eE------R . add x0, x27, #1 1965# CHECK-NEXT: [0,6] D===eeeeeeeeER. ld1r { v1.4s }, [x27], x28 1966# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 1967# CHECK-NEXT: [0,8] .D===eeeeeeeeER ld1r { v1.8b }, [x27], x28 1968# CHECK-NEXT: [0,9] .D====eE------R add x0, x27, #1 1969 1970# CHECK: Average Wait times (based on the timeline view): 1971# CHECK-NEXT: [0]: Executions 1972# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1973# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1974# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1975 1976# CHECK: [0] [1] [2] [3] 1977# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.2d }, [x27], x28 1978# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 1979# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1r { v1.2s }, [x27], x28 1980# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 1981# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld1r { v1.4h }, [x27], x28 1982# CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1 1983# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ld1r { v1.4s }, [x27], x28 1984# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 1985# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld1r { v1.8b }, [x27], x28 1986# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 1987# CHECK-NEXT: 1 3.2 0.1 3.0 <total> 1988 1989# CHECK: [18] Code Region - G19 1990 1991# CHECK: Iterations: 100 1992# CHECK-NEXT: Instructions: 1000 1993# CHECK-NEXT: Total Cycles: 510 1994# CHECK-NEXT: Total uOps: 2400 1995 1996# CHECK: Dispatch Width: 15 1997# CHECK-NEXT: uOps Per Cycle: 4.71 1998# CHECK-NEXT: IPC: 1.96 1999# CHECK-NEXT: Block RThroughput: 2.5 2000 2001# CHECK: Timeline view: 2002# CHECK-NEXT: 01234 2003# CHECK-NEXT: Index 0123456789 2004 2005# CHECK: [0,0] DeeeeeeeeER . ld1r { v1.8h }, [x27], x28 2006# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2007# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld1r { v1.16b }, [x27], x28 2008# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2009# CHECK-NEXT: [0,4] D==eeeeeeeeER . ld2 { v1.2d, v2.2d }, [x27], #32 2010# CHECK-NEXT: [0,5] D===eE------R . add x0, x27, #1 2011# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld2 { v1.2s, v2.2s }, [x27], #16 2012# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2013# CHECK-NEXT: [0,8] .D===eeeeeeeeER ld2 { v1.4h, v2.4h }, [x27], #16 2014# CHECK-NEXT: [0,9] .D====eE------R add x0, x27, #1 2015 2016# CHECK: Average Wait times (based on the timeline view): 2017# CHECK-NEXT: [0]: Executions 2018# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2019# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2020# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2021 2022# CHECK: [0] [1] [2] [3] 2023# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.8h }, [x27], x28 2024# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2025# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld1r { v1.16b }, [x27], x28 2026# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2027# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld2 { v1.2d, v2.2d }, [x27], #32 2028# CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1 2029# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld2 { v1.2s, v2.2s }, [x27], #16 2030# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2031# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld2 { v1.4h, v2.4h }, [x27], #16 2032# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 2033# CHECK-NEXT: 1 3.1 0.1 3.0 <total> 2034 2035# CHECK: [19] Code Region - G20 2036 2037# CHECK: Iterations: 100 2038# CHECK-NEXT: Instructions: 1000 2039# CHECK-NEXT: Total Cycles: 510 2040# CHECK-NEXT: Total uOps: 2900 2041 2042# CHECK: Dispatch Width: 15 2043# CHECK-NEXT: uOps Per Cycle: 5.69 2044# CHECK-NEXT: IPC: 1.96 2045# CHECK-NEXT: Block RThroughput: 3.0 2046 2047# CHECK: Timeline view: 2048# CHECK-NEXT: 01234 2049# CHECK-NEXT: Index 0123456789 2050 2051# CHECK: [0,0] DeeeeeeeeER . ld2 { v1.4s, v2.4s }, [x27], #32 2052# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2053# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld2 { v1.8b, v2.8b }, [x27], #16 2054# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2055# CHECK-NEXT: [0,4] .D=eeeeeeeeER . ld2 { v1.8h, v2.8h }, [x27], #32 2056# CHECK-NEXT: [0,5] .D==eE------R . add x0, x27, #1 2057# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld2 { v1.16b, v2.16b }, [x27], #32 2058# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2059# CHECK-NEXT: [0,8] . D==eeeeeeeeER ld2 { v1.2d, v2.2d }, [x27], x28 2060# CHECK-NEXT: [0,9] . D===eE------R add x0, x27, #1 2061 2062# CHECK: Average Wait times (based on the timeline view): 2063# CHECK-NEXT: [0]: Executions 2064# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2065# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2066# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2067 2068# CHECK: [0] [1] [2] [3] 2069# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.4s, v2.4s }, [x27], #32 2070# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2071# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld2 { v1.8b, v2.8b }, [x27], #16 2072# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2073# CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld2 { v1.8h, v2.8h }, [x27], #32 2074# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 2075# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld2 { v1.16b, v2.16b }, [x27], #32 2076# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2077# CHECK-NEXT: 8. 1 3.0 0.0 0.0 ld2 { v1.2d, v2.2d }, [x27], x28 2078# CHECK-NEXT: 9. 1 4.0 0.0 6.0 add x0, x27, #1 2079# CHECK-NEXT: 1 2.7 0.1 3.0 <total> 2080 2081# CHECK: [20] Code Region - G21 2082 2083# CHECK: Iterations: 100 2084# CHECK-NEXT: Instructions: 1000 2085# CHECK-NEXT: Total Cycles: 510 2086# CHECK-NEXT: Total uOps: 2700 2087 2088# CHECK: Dispatch Width: 15 2089# CHECK-NEXT: uOps Per Cycle: 5.29 2090# CHECK-NEXT: IPC: 1.96 2091# CHECK-NEXT: Block RThroughput: 2.5 2092 2093# CHECK: Timeline view: 2094# CHECK-NEXT: 01234 2095# CHECK-NEXT: Index 0123456789 2096 2097# CHECK: [0,0] DeeeeeeeeER . ld2 { v1.2s, v2.2s }, [x27], x28 2098# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2099# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld2 { v1.4h, v2.4h }, [x27], x28 2100# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2101# CHECK-NEXT: [0,4] D==eeeeeeeeER . ld2 { v1.4s, v2.4s }, [x27], x28 2102# CHECK-NEXT: [0,5] .D==eE------R . add x0, x27, #1 2103# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld2 { v1.8b, v2.8b }, [x27], x28 2104# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2105# CHECK-NEXT: [0,8] .D===eeeeeeeeER ld2 { v1.8h, v2.8h }, [x27], x28 2106# CHECK-NEXT: [0,9] .D====eE------R add x0, x27, #1 2107 2108# CHECK: Average Wait times (based on the timeline view): 2109# CHECK-NEXT: [0]: Executions 2110# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2111# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2112# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2113 2114# CHECK: [0] [1] [2] [3] 2115# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.2s, v2.2s }, [x27], x28 2116# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2117# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld2 { v1.4h, v2.4h }, [x27], x28 2118# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2119# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld2 { v1.4s, v2.4s }, [x27], x28 2120# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 2121# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld2 { v1.8b, v2.8b }, [x27], x28 2122# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2123# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld2 { v1.8h, v2.8h }, [x27], x28 2124# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 2125# CHECK-NEXT: 1 3.0 0.1 3.0 <total> 2126 2127# CHECK: [21] Code Region - G22 2128 2129# CHECK: Iterations: 100 2130# CHECK-NEXT: Instructions: 1000 2131# CHECK-NEXT: Total Cycles: 3310 2132# CHECK-NEXT: Total uOps: 2600 2133 2134# CHECK: Dispatch Width: 15 2135# CHECK-NEXT: uOps Per Cycle: 0.79 2136# CHECK-NEXT: IPC: 0.30 2137# CHECK-NEXT: Block RThroughput: 2.5 2138 2139# CHECK: Timeline view: 2140# CHECK-NEXT: 0123456789 0123456789 2141# CHECK-NEXT: Index 0123456789 0123456789 012 2142 2143# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld2 { v1.16b, v2.16b }, [x27], x28 2144# CHECK-NEXT: [0,1] D=eE------R . . . . . . . add x0, x27, #1 2145# CHECK-NEXT: [0,2] D========eeeeeeeeER . . . . . . ld2 { v1.b, v2.b }[0], [x27], #2 2146# CHECK-NEXT: [0,3] D=========eE------R . . . . . . add x0, x27, #1 2147# CHECK-NEXT: [0,4] D================eeeeeeeeER . . . . ld2 { v1.b, v2.b }[8], [x27], #2 2148# CHECK-NEXT: [0,5] .D================eE------R . . . . add x0, x27, #1 2149# CHECK-NEXT: [0,6] .D=======================eeeeeeeeER. . . ld2 { v1.b, v2.b }[0], [x27], x28 2150# CHECK-NEXT: [0,7] .D========================eE------R. . . add x0, x27, #1 2151# CHECK-NEXT: [0,8] .D===============================eeeeeeeeER ld2 { v1.b, v2.b }[8], [x27], x28 2152# CHECK-NEXT: [0,9] .D================================eE------R add x0, x27, #1 2153 2154# CHECK: Average Wait times (based on the timeline view): 2155# CHECK-NEXT: [0]: Executions 2156# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2157# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2158# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2159 2160# CHECK: [0] [1] [2] [3] 2161# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.16b, v2.16b }, [x27], x28 2162# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2163# CHECK-NEXT: 2. 1 9.0 0.0 0.0 ld2 { v1.b, v2.b }[0], [x27], #2 2164# CHECK-NEXT: 3. 1 10.0 0.0 6.0 add x0, x27, #1 2165# CHECK-NEXT: 4. 1 17.0 0.0 0.0 ld2 { v1.b, v2.b }[8], [x27], #2 2166# CHECK-NEXT: 5. 1 17.0 0.0 6.0 add x0, x27, #1 2167# CHECK-NEXT: 6. 1 24.0 0.0 0.0 ld2 { v1.b, v2.b }[0], [x27], x28 2168# CHECK-NEXT: 7. 1 25.0 0.0 6.0 add x0, x27, #1 2169# CHECK-NEXT: 8. 1 32.0 0.0 0.0 ld2 { v1.b, v2.b }[8], [x27], x28 2170# CHECK-NEXT: 9. 1 33.0 0.0 6.0 add x0, x27, #1 2171# CHECK-NEXT: 1 17.0 0.1 3.0 <total> 2172 2173# CHECK: [22] Code Region - G23 2174 2175# CHECK: Iterations: 100 2176# CHECK-NEXT: Instructions: 1000 2177# CHECK-NEXT: Total Cycles: 4003 2178# CHECK-NEXT: Total uOps: 2500 2179 2180# CHECK: Dispatch Width: 15 2181# CHECK-NEXT: uOps Per Cycle: 0.62 2182# CHECK-NEXT: IPC: 0.25 2183# CHECK-NEXT: Block RThroughput: 2.5 2184 2185# CHECK: Timeline view: 2186# CHECK-NEXT: 0123456789 0123456789 2187# CHECK-NEXT: Index 0123456789 0123456789 012 2188 2189# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld2 { v1.h, v2.h }[0], [x27], #4 2190# CHECK-NEXT: [0,1] D=eE------R . . . . . . . add x0, x27, #1 2191# CHECK-NEXT: [0,2] D========eeeeeeeeER . . . . . . ld2 { v1.h, v2.h }[4], [x27], #4 2192# CHECK-NEXT: [0,3] D=========eE------R . . . . . . add x0, x27, #1 2193# CHECK-NEXT: [0,4] D================eeeeeeeeER . . . . ld2 { v1.h, v2.h }[0], [x27], x28 2194# CHECK-NEXT: [0,5] D=================eE------R . . . . add x0, x27, #1 2195# CHECK-NEXT: [0,6] .D=======================eeeeeeeeER. . . ld2 { v1.h, v2.h }[4], [x27], x28 2196# CHECK-NEXT: [0,7] .D========================eE------R. . . add x0, x27, #1 2197# CHECK-NEXT: [0,8] .D===============================eeeeeeeeER ld2 { v1.s, v2.s }[0], [x27], #8 2198# CHECK-NEXT: [0,9] .D================================eE------R add x0, x27, #1 2199 2200# CHECK: Average Wait times (based on the timeline view): 2201# CHECK-NEXT: [0]: Executions 2202# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2203# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2204# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2205 2206# CHECK: [0] [1] [2] [3] 2207# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.h, v2.h }[0], [x27], #4 2208# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2209# CHECK-NEXT: 2. 1 9.0 0.0 0.0 ld2 { v1.h, v2.h }[4], [x27], #4 2210# CHECK-NEXT: 3. 1 10.0 0.0 6.0 add x0, x27, #1 2211# CHECK-NEXT: 4. 1 17.0 0.0 0.0 ld2 { v1.h, v2.h }[0], [x27], x28 2212# CHECK-NEXT: 5. 1 18.0 0.0 6.0 add x0, x27, #1 2213# CHECK-NEXT: 6. 1 24.0 0.0 0.0 ld2 { v1.h, v2.h }[4], [x27], x28 2214# CHECK-NEXT: 7. 1 25.0 0.0 6.0 add x0, x27, #1 2215# CHECK-NEXT: 8. 1 32.0 0.0 0.0 ld2 { v1.s, v2.s }[0], [x27], #8 2216# CHECK-NEXT: 9. 1 33.0 0.0 6.0 add x0, x27, #1 2217# CHECK-NEXT: 1 17.1 0.1 3.0 <total> 2218 2219# CHECK: [23] Code Region - G24 2220 2221# CHECK: Iterations: 100 2222# CHECK-NEXT: Instructions: 1000 2223# CHECK-NEXT: Total Cycles: 2603 2224# CHECK-NEXT: Total uOps: 2500 2225 2226# CHECK: Dispatch Width: 15 2227# CHECK-NEXT: uOps Per Cycle: 0.96 2228# CHECK-NEXT: IPC: 0.38 2229# CHECK-NEXT: Block RThroughput: 2.5 2230 2231# CHECK: Timeline view: 2232# CHECK-NEXT: 0123456789 2233# CHECK-NEXT: Index 0123456789 012345678 2234 2235# CHECK: [0,0] DeeeeeeeeER . . . . ld2 { v1.s, v2.s }[0], [x27], x28 2236# CHECK-NEXT: [0,1] D=eE------R . . . . add x0, x27, #1 2237# CHECK-NEXT: [0,2] D========eeeeeeeeER . . . ld2 { v1.d, v2.d }[0], [x27], #16 2238# CHECK-NEXT: [0,3] D=========eE------R . . . add x0, x27, #1 2239# CHECK-NEXT: [0,4] D================eeeeeeeeER . ld2 { v1.d, v2.d }[0], [x27], x28 2240# CHECK-NEXT: [0,5] D=================eE------R . add x0, x27, #1 2241# CHECK-NEXT: [0,6] .D================eeeeeeeeER. ld2r { v1.1d, v2.1d }, [x27], #16 2242# CHECK-NEXT: [0,7] .D=================eE------R. add x0, x27, #1 2243# CHECK-NEXT: [0,8] .D=================eeeeeeeeER ld2r { v1.2d, v2.2d }, [x27], #16 2244# CHECK-NEXT: [0,9] .D==================eE------R add x0, x27, #1 2245 2246# CHECK: Average Wait times (based on the timeline view): 2247# CHECK-NEXT: [0]: Executions 2248# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2249# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2250# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2251 2252# CHECK: [0] [1] [2] [3] 2253# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.s, v2.s }[0], [x27], x28 2254# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2255# CHECK-NEXT: 2. 1 9.0 0.0 0.0 ld2 { v1.d, v2.d }[0], [x27], #16 2256# CHECK-NEXT: 3. 1 10.0 0.0 6.0 add x0, x27, #1 2257# CHECK-NEXT: 4. 1 17.0 0.0 0.0 ld2 { v1.d, v2.d }[0], [x27], x28 2258# CHECK-NEXT: 5. 1 18.0 0.0 6.0 add x0, x27, #1 2259# CHECK-NEXT: 6. 1 17.0 0.0 0.0 ld2r { v1.1d, v2.1d }, [x27], #16 2260# CHECK-NEXT: 7. 1 18.0 0.0 6.0 add x0, x27, #1 2261# CHECK-NEXT: 8. 1 18.0 0.0 0.0 ld2r { v1.2d, v2.2d }, [x27], #16 2262# CHECK-NEXT: 9. 1 19.0 0.0 6.0 add x0, x27, #1 2263# CHECK-NEXT: 1 12.9 0.1 3.0 <total> 2264 2265# CHECK: [24] Code Region - G25 2266 2267# CHECK: Iterations: 100 2268# CHECK-NEXT: Instructions: 1000 2269# CHECK-NEXT: Total Cycles: 510 2270# CHECK-NEXT: Total uOps: 2500 2271 2272# CHECK: Dispatch Width: 15 2273# CHECK-NEXT: uOps Per Cycle: 4.90 2274# CHECK-NEXT: IPC: 1.96 2275# CHECK-NEXT: Block RThroughput: 2.5 2276 2277# CHECK: Timeline view: 2278# CHECK-NEXT: 01234 2279# CHECK-NEXT: Index 0123456789 2280 2281# CHECK: [0,0] DeeeeeeeeER . ld2r { v1.2s, v2.2s }, [x27], #8 2282# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2283# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld2r { v1.4h, v2.4h }, [x27], #4 2284# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2285# CHECK-NEXT: [0,4] D==eeeeeeeeER . ld2r { v1.4s, v2.4s }, [x27], #8 2286# CHECK-NEXT: [0,5] D===eE------R . add x0, x27, #1 2287# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld2r { v1.8b, v2.8b }, [x27], #2 2288# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2289# CHECK-NEXT: [0,8] .D===eeeeeeeeER ld2r { v1.8h, v2.8h }, [x27], #4 2290# CHECK-NEXT: [0,9] .D====eE------R add x0, x27, #1 2291 2292# CHECK: Average Wait times (based on the timeline view): 2293# CHECK-NEXT: [0]: Executions 2294# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2295# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2296# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2297 2298# CHECK: [0] [1] [2] [3] 2299# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.2s, v2.2s }, [x27], #8 2300# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2301# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld2r { v1.4h, v2.4h }, [x27], #4 2302# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2303# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld2r { v1.4s, v2.4s }, [x27], #8 2304# CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1 2305# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld2r { v1.8b, v2.8b }, [x27], #2 2306# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2307# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld2r { v1.8h, v2.8h }, [x27], #4 2308# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 2309# CHECK-NEXT: 1 3.1 0.1 3.0 <total> 2310 2311# CHECK: [25] Code Region - G26 2312 2313# CHECK: Iterations: 100 2314# CHECK-NEXT: Instructions: 1000 2315# CHECK-NEXT: Total Cycles: 510 2316# CHECK-NEXT: Total uOps: 2500 2317 2318# CHECK: Dispatch Width: 15 2319# CHECK-NEXT: uOps Per Cycle: 4.90 2320# CHECK-NEXT: IPC: 1.96 2321# CHECK-NEXT: Block RThroughput: 2.5 2322 2323# CHECK: Timeline view: 2324# CHECK-NEXT: 01234 2325# CHECK-NEXT: Index 0123456789 2326 2327# CHECK: [0,0] DeeeeeeeeER . ld2r { v1.16b, v2.16b }, [x27], #2 2328# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2329# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld2r { v1.1d, v2.1d }, [x27], x28 2330# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2331# CHECK-NEXT: [0,4] D==eeeeeeeeER . ld2r { v1.2d, v2.2d }, [x27], x28 2332# CHECK-NEXT: [0,5] D===eE------R . add x0, x27, #1 2333# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld2r { v1.2s, v2.2s }, [x27], x28 2334# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2335# CHECK-NEXT: [0,8] .D===eeeeeeeeER ld2r { v1.4h, v2.4h }, [x27], x28 2336# CHECK-NEXT: [0,9] .D====eE------R add x0, x27, #1 2337 2338# CHECK: Average Wait times (based on the timeline view): 2339# CHECK-NEXT: [0]: Executions 2340# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2341# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2342# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2343 2344# CHECK: [0] [1] [2] [3] 2345# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.16b, v2.16b }, [x27], #2 2346# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2347# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld2r { v1.1d, v2.1d }, [x27], x28 2348# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2349# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld2r { v1.2d, v2.2d }, [x27], x28 2350# CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1 2351# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld2r { v1.2s, v2.2s }, [x27], x28 2352# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2353# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld2r { v1.4h, v2.4h }, [x27], x28 2354# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 2355# CHECK-NEXT: 1 3.1 0.1 3.0 <total> 2356 2357# CHECK: [26] Code Region - G27 2358 2359# CHECK: Iterations: 100 2360# CHECK-NEXT: Instructions: 1000 2361# CHECK-NEXT: Total Cycles: 510 2362# CHECK-NEXT: Total uOps: 2800 2363 2364# CHECK: Dispatch Width: 15 2365# CHECK-NEXT: uOps Per Cycle: 5.49 2366# CHECK-NEXT: IPC: 1.96 2367# CHECK-NEXT: Block RThroughput: 2.8 2368 2369# CHECK: Timeline view: 2370# CHECK-NEXT: 01234 2371# CHECK-NEXT: Index 0123456789 2372 2373# CHECK: [0,0] DeeeeeeeeER . ld2r { v1.4s, v2.4s }, [x27], x28 2374# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2375# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld2r { v1.8b, v2.8b }, [x27], x28 2376# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2377# CHECK-NEXT: [0,4] D==eeeeeeeeER . ld2r { v1.8h, v2.8h }, [x27], x28 2378# CHECK-NEXT: [0,5] D===eE------R . add x0, x27, #1 2379# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld2r { v1.16b, v2.16b }, [x27], x28 2380# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2381# CHECK-NEXT: [0,8] .D===eeeeeeeeER ld3 { v1.2d, v2.2d, v3.2d }, [x27], #48 2382# CHECK-NEXT: [0,9] .D====eE------R add x0, x27, #1 2383 2384# CHECK: Average Wait times (based on the timeline view): 2385# CHECK-NEXT: [0]: Executions 2386# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2387# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2388# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2389 2390# CHECK: [0] [1] [2] [3] 2391# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.4s, v2.4s }, [x27], x28 2392# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2393# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld2r { v1.8b, v2.8b }, [x27], x28 2394# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2395# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ld2r { v1.8h, v2.8h }, [x27], x28 2396# CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1 2397# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld2r { v1.16b, v2.16b }, [x27], x28 2398# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2399# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ld3 { v1.2d, v2.2d, v3.2d }, [x27], #48 2400# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 2401# CHECK-NEXT: 1 3.1 0.1 3.0 <total> 2402 2403# CHECK: [27] Code Region - G28 2404 2405# CHECK: Iterations: 100 2406# CHECK-NEXT: Instructions: 1000 2407# CHECK-NEXT: Total Cycles: 510 2408# CHECK-NEXT: Total uOps: 3700 2409 2410# CHECK: Dispatch Width: 15 2411# CHECK-NEXT: uOps Per Cycle: 7.25 2412# CHECK-NEXT: IPC: 1.96 2413# CHECK-NEXT: Block RThroughput: 4.0 2414 2415# CHECK: Timeline view: 2416# CHECK-NEXT: 01234 2417# CHECK-NEXT: Index 0123456789 2418 2419# CHECK: [0,0] DeeeeeeeeER . ld3 { v1.2s, v2.2s, v3.2s }, [x27], #24 2420# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2421# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld3 { v1.4h, v2.4h, v3.4h }, [x27], #24 2422# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2423# CHECK-NEXT: [0,4] .D=eeeeeeeeER . ld3 { v1.4s, v2.4s, v3.4s }, [x27], #48 2424# CHECK-NEXT: [0,5] .D==eE------R . add x0, x27, #1 2425# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld3 { v1.8b, v2.8b, v3.8b }, [x27], #24 2426# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2427# CHECK-NEXT: [0,8] . D==eeeeeeeeER ld3 { v1.8h, v2.8h, v3.8h }, [x27], #48 2428# CHECK-NEXT: [0,9] . D===eE------R add x0, x27, #1 2429 2430# CHECK: Average Wait times (based on the timeline view): 2431# CHECK-NEXT: [0]: Executions 2432# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2433# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2434# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2435 2436# CHECK: [0] [1] [2] [3] 2437# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.2s, v2.2s, v3.2s }, [x27], #24 2438# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2439# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld3 { v1.4h, v2.4h, v3.4h }, [x27], #24 2440# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2441# CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld3 { v1.4s, v2.4s, v3.4s }, [x27], #48 2442# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 2443# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld3 { v1.8b, v2.8b, v3.8b }, [x27], #24 2444# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2445# CHECK-NEXT: 8. 1 3.0 0.0 0.0 ld3 { v1.8h, v2.8h, v3.8h }, [x27], #48 2446# CHECK-NEXT: 9. 1 4.0 0.0 6.0 add x0, x27, #1 2447# CHECK-NEXT: 1 2.7 0.1 3.0 <total> 2448 2449# CHECK: [28] Code Region - G29 2450 2451# CHECK: Iterations: 100 2452# CHECK-NEXT: Instructions: 1000 2453# CHECK-NEXT: Total Cycles: 510 2454# CHECK-NEXT: Total uOps: 3800 2455 2456# CHECK: Dispatch Width: 15 2457# CHECK-NEXT: uOps Per Cycle: 7.45 2458# CHECK-NEXT: IPC: 1.96 2459# CHECK-NEXT: Block RThroughput: 4.3 2460 2461# CHECK: Timeline view: 2462# CHECK-NEXT: 01234 2463# CHECK-NEXT: Index 0123456789 2464 2465# CHECK: [0,0] DeeeeeeeeER . ld3 { v1.16b, v2.16b, v3.16b }, [x27], #48 2466# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2467# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld3 { v1.2d, v2.2d, v3.2d }, [x27], x28 2468# CHECK-NEXT: [0,3] .D=eE------R . add x0, x27, #1 2469# CHECK-NEXT: [0,4] .D=eeeeeeeeER . ld3 { v1.2s, v2.2s, v3.2s }, [x27], x28 2470# CHECK-NEXT: [0,5] .D==eE------R . add x0, x27, #1 2471# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld3 { v1.4h, v2.4h, v3.4h }, [x27], x28 2472# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2473# CHECK-NEXT: [0,8] . D==eeeeeeeeER ld3 { v1.4s, v2.4s, v3.4s }, [x27], x28 2474# CHECK-NEXT: [0,9] . D===eE------R add x0, x27, #1 2475 2476# CHECK: Average Wait times (based on the timeline view): 2477# CHECK-NEXT: [0]: Executions 2478# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2479# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2480# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2481 2482# CHECK: [0] [1] [2] [3] 2483# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.16b, v2.16b, v3.16b }, [x27], #48 2484# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2485# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld3 { v1.2d, v2.2d, v3.2d }, [x27], x28 2486# CHECK-NEXT: 3. 1 2.0 0.0 6.0 add x0, x27, #1 2487# CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld3 { v1.2s, v2.2s, v3.2s }, [x27], x28 2488# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 2489# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld3 { v1.4h, v2.4h, v3.4h }, [x27], x28 2490# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2491# CHECK-NEXT: 8. 1 3.0 0.0 0.0 ld3 { v1.4s, v2.4s, v3.4s }, [x27], x28 2492# CHECK-NEXT: 9. 1 4.0 0.0 6.0 add x0, x27, #1 2493# CHECK-NEXT: 1 2.6 0.1 3.0 <total> 2494 2495# CHECK: [29] Code Region - G30 2496 2497# CHECK: Iterations: 100 2498# CHECK-NEXT: Instructions: 1000 2499# CHECK-NEXT: Total Cycles: 1910 2500# CHECK-NEXT: Total uOps: 3700 2501 2502# CHECK: Dispatch Width: 15 2503# CHECK-NEXT: uOps Per Cycle: 1.94 2504# CHECK-NEXT: IPC: 0.52 2505# CHECK-NEXT: Block RThroughput: 4.0 2506 2507# CHECK: Timeline view: 2508# CHECK-NEXT: 0123456789 2509# CHECK-NEXT: Index 0123456789 012345678 2510 2511# CHECK: [0,0] DeeeeeeeeER . . . . ld3 { v1.8b, v2.8b, v3.8b }, [x27], x28 2512# CHECK-NEXT: [0,1] D=eE------R . . . . add x0, x27, #1 2513# CHECK-NEXT: [0,2] D=eeeeeeeeER . . . . ld3 { v1.8h, v2.8h, v3.8h }, [x27], x28 2514# CHECK-NEXT: [0,3] D==eE------R . . . . add x0, x27, #1 2515# CHECK-NEXT: [0,4] .D=eeeeeeeeER . . . . ld3 { v1.16b, v2.16b, v3.16b }, [x27], x28 2516# CHECK-NEXT: [0,5] .D==eE------R . . . . add x0, x27, #1 2517# CHECK-NEXT: [0,6] .D=========eeeeeeeeER . . ld3 { v1.b, v2.b, v3.b }[0], [x27], #3 2518# CHECK-NEXT: [0,7] .D==========eE------R . . add x0, x27, #1 2519# CHECK-NEXT: [0,8] . D================eeeeeeeeER ld3 { v1.b, v2.b, v3.b }[8], [x27], #3 2520# CHECK-NEXT: [0,9] . D=================eE------R add x0, x27, #1 2521 2522# CHECK: Average Wait times (based on the timeline view): 2523# CHECK-NEXT: [0]: Executions 2524# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2525# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2526# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2527 2528# CHECK: [0] [1] [2] [3] 2529# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.8b, v2.8b, v3.8b }, [x27], x28 2530# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2531# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld3 { v1.8h, v2.8h, v3.8h }, [x27], x28 2532# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2533# CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld3 { v1.16b, v2.16b, v3.16b }, [x27], x28 2534# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 2535# CHECK-NEXT: 6. 1 10.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[0], [x27], #3 2536# CHECK-NEXT: 7. 1 11.0 0.0 6.0 add x0, x27, #1 2537# CHECK-NEXT: 8. 1 17.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[8], [x27], #3 2538# CHECK-NEXT: 9. 1 18.0 0.0 6.0 add x0, x27, #1 2539# CHECK-NEXT: 1 6.9 0.1 3.0 <total> 2540 2541# CHECK: [30] Code Region - G31 2542 2543# CHECK: Iterations: 100 2544# CHECK-NEXT: Instructions: 1000 2545# CHECK-NEXT: Total Cycles: 4003 2546# CHECK-NEXT: Total uOps: 3500 2547 2548# CHECK: Dispatch Width: 15 2549# CHECK-NEXT: uOps Per Cycle: 0.87 2550# CHECK-NEXT: IPC: 0.25 2551# CHECK-NEXT: Block RThroughput: 3.8 2552 2553# CHECK: Timeline view: 2554# CHECK-NEXT: 0123456789 0123456789 2555# CHECK-NEXT: Index 0123456789 0123456789 012 2556 2557# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld3 { v1.b, v2.b, v3.b }[0], [x27], x28 2558# CHECK-NEXT: [0,1] D=eE------R . . . . . . . add x0, x27, #1 2559# CHECK-NEXT: [0,2] D========eeeeeeeeER . . . . . . ld3 { v1.b, v2.b, v3.b }[8], [x27], x28 2560# CHECK-NEXT: [0,3] D=========eE------R . . . . . . add x0, x27, #1 2561# CHECK-NEXT: [0,4] .D===============eeeeeeeeER . . . . ld3 { v1.h, v2.h, v3.h }[0], [x27], #6 2562# CHECK-NEXT: [0,5] .D================eE------R . . . . add x0, x27, #1 2563# CHECK-NEXT: [0,6] .D=======================eeeeeeeeER. . . ld3 { v1.h, v2.h, v3.h }[4], [x27], #6 2564# CHECK-NEXT: [0,7] .D========================eE------R. . . add x0, x27, #1 2565# CHECK-NEXT: [0,8] . D==============================eeeeeeeeER ld3 { v1.h, v2.h, v3.h }[0], [x27], x28 2566# CHECK-NEXT: [0,9] . D===============================eE------R add x0, x27, #1 2567 2568# CHECK: Average Wait times (based on the timeline view): 2569# CHECK-NEXT: [0]: Executions 2570# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2571# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2572# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2573 2574# CHECK: [0] [1] [2] [3] 2575# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.b, v2.b, v3.b }[0], [x27], x28 2576# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2577# CHECK-NEXT: 2. 1 9.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[8], [x27], x28 2578# CHECK-NEXT: 3. 1 10.0 0.0 6.0 add x0, x27, #1 2579# CHECK-NEXT: 4. 1 16.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[0], [x27], #6 2580# CHECK-NEXT: 5. 1 17.0 0.0 6.0 add x0, x27, #1 2581# CHECK-NEXT: 6. 1 24.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[4], [x27], #6 2582# CHECK-NEXT: 7. 1 25.0 0.0 6.0 add x0, x27, #1 2583# CHECK-NEXT: 8. 1 31.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[0], [x27], x28 2584# CHECK-NEXT: 9. 1 32.0 0.0 6.0 add x0, x27, #1 2585# CHECK-NEXT: 1 16.7 0.1 3.0 <total> 2586 2587# CHECK: [31] Code Region - G32 2588 2589# CHECK: Iterations: 100 2590# CHECK-NEXT: Instructions: 1000 2591# CHECK-NEXT: Total Cycles: 4003 2592# CHECK-NEXT: Total uOps: 3500 2593 2594# CHECK: Dispatch Width: 15 2595# CHECK-NEXT: uOps Per Cycle: 0.87 2596# CHECK-NEXT: IPC: 0.25 2597# CHECK-NEXT: Block RThroughput: 3.8 2598 2599# CHECK: Timeline view: 2600# CHECK-NEXT: 0123456789 0123456789 2601# CHECK-NEXT: Index 0123456789 0123456789 012 2602 2603# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld3 { v1.h, v2.h, v3.h }[4], [x27], x28 2604# CHECK-NEXT: [0,1] D=eE------R . . . . . . . add x0, x27, #1 2605# CHECK-NEXT: [0,2] D========eeeeeeeeER . . . . . . ld3 { v1.s, v2.s, v3.s }[0], [x27], #12 2606# CHECK-NEXT: [0,3] D=========eE------R . . . . . . add x0, x27, #1 2607# CHECK-NEXT: [0,4] .D===============eeeeeeeeER . . . . ld3 { v1.s, v2.s, v3.s }[0], [x27], x28 2608# CHECK-NEXT: [0,5] .D================eE------R . . . . add x0, x27, #1 2609# CHECK-NEXT: [0,6] .D=======================eeeeeeeeER. . . ld3 { v1.d, v2.d, v3.d }[0], [x27], #24 2610# CHECK-NEXT: [0,7] .D========================eE------R. . . add x0, x27, #1 2611# CHECK-NEXT: [0,8] . D==============================eeeeeeeeER ld3 { v1.d, v2.d, v3.d }[0], [x27], x28 2612# CHECK-NEXT: [0,9] . D===============================eE------R add x0, x27, #1 2613 2614# CHECK: Average Wait times (based on the timeline view): 2615# CHECK-NEXT: [0]: Executions 2616# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2617# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2618# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2619 2620# CHECK: [0] [1] [2] [3] 2621# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.h, v2.h, v3.h }[4], [x27], x28 2622# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2623# CHECK-NEXT: 2. 1 9.0 0.0 0.0 ld3 { v1.s, v2.s, v3.s }[0], [x27], #12 2624# CHECK-NEXT: 3. 1 10.0 0.0 6.0 add x0, x27, #1 2625# CHECK-NEXT: 4. 1 16.0 0.0 0.0 ld3 { v1.s, v2.s, v3.s }[0], [x27], x28 2626# CHECK-NEXT: 5. 1 17.0 0.0 6.0 add x0, x27, #1 2627# CHECK-NEXT: 6. 1 24.0 0.0 0.0 ld3 { v1.d, v2.d, v3.d }[0], [x27], #24 2628# CHECK-NEXT: 7. 1 25.0 0.0 6.0 add x0, x27, #1 2629# CHECK-NEXT: 8. 1 31.0 0.0 0.0 ld3 { v1.d, v2.d, v3.d }[0], [x27], x28 2630# CHECK-NEXT: 9. 1 32.0 0.0 6.0 add x0, x27, #1 2631# CHECK-NEXT: 1 16.7 0.1 3.0 <total> 2632 2633# CHECK: [32] Code Region - G33 2634 2635# CHECK: Iterations: 100 2636# CHECK-NEXT: Instructions: 1000 2637# CHECK-NEXT: Total Cycles: 510 2638# CHECK-NEXT: Total uOps: 3500 2639 2640# CHECK: Dispatch Width: 15 2641# CHECK-NEXT: uOps Per Cycle: 6.86 2642# CHECK-NEXT: IPC: 1.96 2643# CHECK-NEXT: Block RThroughput: 3.8 2644 2645# CHECK: Timeline view: 2646# CHECK-NEXT: 01234 2647# CHECK-NEXT: Index 0123456789 2648 2649# CHECK: [0,0] DeeeeeeeeER . ld3r { v1.1d, v2.1d, v3.1d }, [x27], #24 2650# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2651# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld3r { v1.2d, v2.2d, v3.2d }, [x27], #24 2652# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2653# CHECK-NEXT: [0,4] .D=eeeeeeeeER . ld3r { v1.2s, v2.2s, v3.2s }, [x27], #12 2654# CHECK-NEXT: [0,5] .D==eE------R . add x0, x27, #1 2655# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld3r { v1.4h, v2.4h, v3.4h }, [x27], #6 2656# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2657# CHECK-NEXT: [0,8] . D==eeeeeeeeER ld3r { v1.4s, v2.4s, v3.4s }, [x27], #12 2658# CHECK-NEXT: [0,9] . D===eE------R add x0, x27, #1 2659 2660# CHECK: Average Wait times (based on the timeline view): 2661# CHECK-NEXT: [0]: Executions 2662# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2663# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2664# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2665 2666# CHECK: [0] [1] [2] [3] 2667# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.1d, v2.1d, v3.1d }, [x27], #24 2668# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2669# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld3r { v1.2d, v2.2d, v3.2d }, [x27], #24 2670# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2671# CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld3r { v1.2s, v2.2s, v3.2s }, [x27], #12 2672# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 2673# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld3r { v1.4h, v2.4h, v3.4h }, [x27], #6 2674# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2675# CHECK-NEXT: 8. 1 3.0 0.0 0.0 ld3r { v1.4s, v2.4s, v3.4s }, [x27], #12 2676# CHECK-NEXT: 9. 1 4.0 0.0 6.0 add x0, x27, #1 2677# CHECK-NEXT: 1 2.7 0.1 3.0 <total> 2678 2679# CHECK: [33] Code Region - G34 2680 2681# CHECK: Iterations: 100 2682# CHECK-NEXT: Instructions: 1000 2683# CHECK-NEXT: Total Cycles: 510 2684# CHECK-NEXT: Total uOps: 3500 2685 2686# CHECK: Dispatch Width: 15 2687# CHECK-NEXT: uOps Per Cycle: 6.86 2688# CHECK-NEXT: IPC: 1.96 2689# CHECK-NEXT: Block RThroughput: 3.8 2690 2691# CHECK: Timeline view: 2692# CHECK-NEXT: 01234 2693# CHECK-NEXT: Index 0123456789 2694 2695# CHECK: [0,0] DeeeeeeeeER . ld3r { v1.8b, v2.8b, v3.8b }, [x27], #3 2696# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2697# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld3r { v1.8h, v2.8h, v3.8h }, [x27], #6 2698# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2699# CHECK-NEXT: [0,4] .D=eeeeeeeeER . ld3r { v1.16b, v2.16b, v3.16b }, [x27], #3 2700# CHECK-NEXT: [0,5] .D==eE------R . add x0, x27, #1 2701# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld3r { v1.1d, v2.1d, v3.1d }, [x27], x28 2702# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2703# CHECK-NEXT: [0,8] . D==eeeeeeeeER ld3r { v1.2d, v2.2d, v3.2d }, [x27], x28 2704# CHECK-NEXT: [0,9] . D===eE------R add x0, x27, #1 2705 2706# CHECK: Average Wait times (based on the timeline view): 2707# CHECK-NEXT: [0]: Executions 2708# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2709# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2710# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2711 2712# CHECK: [0] [1] [2] [3] 2713# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.8b, v2.8b, v3.8b }, [x27], #3 2714# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2715# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld3r { v1.8h, v2.8h, v3.8h }, [x27], #6 2716# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2717# CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld3r { v1.16b, v2.16b, v3.16b }, [x27], #3 2718# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 2719# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld3r { v1.1d, v2.1d, v3.1d }, [x27], x28 2720# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2721# CHECK-NEXT: 8. 1 3.0 0.0 0.0 ld3r { v1.2d, v2.2d, v3.2d }, [x27], x28 2722# CHECK-NEXT: 9. 1 4.0 0.0 6.0 add x0, x27, #1 2723# CHECK-NEXT: 1 2.7 0.1 3.0 <total> 2724 2725# CHECK: [34] Code Region - G35 2726 2727# CHECK: Iterations: 100 2728# CHECK-NEXT: Instructions: 1000 2729# CHECK-NEXT: Total Cycles: 510 2730# CHECK-NEXT: Total uOps: 3500 2731 2732# CHECK: Dispatch Width: 15 2733# CHECK-NEXT: uOps Per Cycle: 6.86 2734# CHECK-NEXT: IPC: 1.96 2735# CHECK-NEXT: Block RThroughput: 3.8 2736 2737# CHECK: Timeline view: 2738# CHECK-NEXT: 01234 2739# CHECK-NEXT: Index 0123456789 2740 2741# CHECK: [0,0] DeeeeeeeeER . ld3r { v1.2s, v2.2s, v3.2s }, [x27], x28 2742# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2743# CHECK-NEXT: [0,2] D=eeeeeeeeER . ld3r { v1.4h, v2.4h, v3.4h }, [x27], x28 2744# CHECK-NEXT: [0,3] D==eE------R . add x0, x27, #1 2745# CHECK-NEXT: [0,4] .D=eeeeeeeeER . ld3r { v1.4s, v2.4s, v3.4s }, [x27], x28 2746# CHECK-NEXT: [0,5] .D==eE------R . add x0, x27, #1 2747# CHECK-NEXT: [0,6] .D==eeeeeeeeER. ld3r { v1.8b, v2.8b, v3.8b }, [x27], x28 2748# CHECK-NEXT: [0,7] .D===eE------R. add x0, x27, #1 2749# CHECK-NEXT: [0,8] . D==eeeeeeeeER ld3r { v1.8h, v2.8h, v3.8h }, [x27], x28 2750# CHECK-NEXT: [0,9] . D===eE------R add x0, x27, #1 2751 2752# CHECK: Average Wait times (based on the timeline view): 2753# CHECK-NEXT: [0]: Executions 2754# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2755# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2756# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2757 2758# CHECK: [0] [1] [2] [3] 2759# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.2s, v2.2s, v3.2s }, [x27], x28 2760# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2761# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ld3r { v1.4h, v2.4h, v3.4h }, [x27], x28 2762# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 2763# CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld3r { v1.4s, v2.4s, v3.4s }, [x27], x28 2764# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 2765# CHECK-NEXT: 6. 1 3.0 0.0 0.0 ld3r { v1.8b, v2.8b, v3.8b }, [x27], x28 2766# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 2767# CHECK-NEXT: 8. 1 3.0 0.0 0.0 ld3r { v1.8h, v2.8h, v3.8h }, [x27], x28 2768# CHECK-NEXT: 9. 1 4.0 0.0 6.0 add x0, x27, #1 2769# CHECK-NEXT: 1 2.7 0.1 3.0 <total> 2770 2771# CHECK: [35] Code Region - G36 2772 2773# CHECK: Iterations: 100 2774# CHECK-NEXT: Instructions: 1000 2775# CHECK-NEXT: Total Cycles: 611 2776# CHECK-NEXT: Total uOps: 4500 2777 2778# CHECK: Dispatch Width: 15 2779# CHECK-NEXT: uOps Per Cycle: 7.36 2780# CHECK-NEXT: IPC: 1.64 2781# CHECK-NEXT: Block RThroughput: 5.3 2782 2783# CHECK: Timeline view: 2784# CHECK-NEXT: 0123456 2785# CHECK-NEXT: Index 0123456789 2786 2787# CHECK: [0,0] DeeeeeeeeER .. ld3r { v1.16b, v2.16b, v3.16b }, [x27], x28 2788# CHECK-NEXT: [0,1] D=eE------R .. add x0, x27, #1 2789# CHECK-NEXT: [0,2] .DeeeeeeeeeER .. ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 2790# CHECK-NEXT: [0,3] .D=eE-------R .. add x0, x27, #1 2791# CHECK-NEXT: [0,4] . DeeeeeeeeER .. ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 2792# CHECK-NEXT: [0,5] . D=eE------R .. add x0, x27, #1 2793# CHECK-NEXT: [0,6] . DeeeeeeeeER .. ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 2794# CHECK-NEXT: [0,7] . D=eE------R .. add x0, x27, #1 2795# CHECK-NEXT: [0,8] . D=eeeeeeeeeER ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 2796# CHECK-NEXT: [0,9] . D==eE-------R add x0, x27, #1 2797 2798# CHECK: Average Wait times (based on the timeline view): 2799# CHECK-NEXT: [0]: Executions 2800# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2801# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2802# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2803 2804# CHECK: [0] [1] [2] [3] 2805# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.16b, v2.16b, v3.16b }, [x27], x28 2806# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2807# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 2808# CHECK-NEXT: 3. 1 2.0 0.0 7.0 add x0, x27, #1 2809# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 2810# CHECK-NEXT: 5. 1 2.0 0.0 6.0 add x0, x27, #1 2811# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 2812# CHECK-NEXT: 7. 1 2.0 0.0 6.0 add x0, x27, #1 2813# CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 2814# CHECK-NEXT: 9. 1 3.0 0.0 7.0 add x0, x27, #1 2815# CHECK-NEXT: 1 1.7 0.2 3.2 <total> 2816 2817# CHECK: [36] Code Region - G37 2818 2819# CHECK: Iterations: 100 2820# CHECK-NEXT: Instructions: 1000 2821# CHECK-NEXT: Total Cycles: 610 2822# CHECK-NEXT: Total uOps: 4800 2823 2824# CHECK: Dispatch Width: 15 2825# CHECK-NEXT: uOps Per Cycle: 7.87 2826# CHECK-NEXT: IPC: 1.64 2827# CHECK-NEXT: Block RThroughput: 6.0 2828 2829# CHECK: Timeline view: 2830# CHECK-NEXT: 012345 2831# CHECK-NEXT: Index 0123456789 2832 2833# CHECK: [0,0] DeeeeeeeeER . ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 2834# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 2835# CHECK-NEXT: [0,2] .DeeeeeeeeeER . ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 2836# CHECK-NEXT: [0,3] .D=eE-------R . add x0, x27, #1 2837# CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 2838# CHECK-NEXT: [0,5] . D=eE-------R . add x0, x27, #1 2839# CHECK-NEXT: [0,6] . DeeeeeeeeeER. ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 2840# CHECK-NEXT: [0,7] . D=eE-------R. add x0, x27, #1 2841# CHECK-NEXT: [0,8] . D=eeeeeeeeER ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 2842# CHECK-NEXT: [0,9] . D==eE------R add x0, x27, #1 2843 2844# CHECK: Average Wait times (based on the timeline view): 2845# CHECK-NEXT: [0]: Executions 2846# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2847# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2848# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2849 2850# CHECK: [0] [1] [2] [3] 2851# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 2852# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2853# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 2854# CHECK-NEXT: 3. 1 2.0 0.0 7.0 add x0, x27, #1 2855# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 2856# CHECK-NEXT: 5. 1 2.0 0.0 7.0 add x0, x27, #1 2857# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 2858# CHECK-NEXT: 7. 1 2.0 0.0 7.0 add x0, x27, #1 2859# CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 2860# CHECK-NEXT: 9. 1 3.0 0.0 6.0 add x0, x27, #1 2861# CHECK-NEXT: 1 1.7 0.2 3.3 <total> 2862 2863# CHECK: [37] Code Region - G38 2864 2865# CHECK: Iterations: 100 2866# CHECK-NEXT: Instructions: 1000 2867# CHECK-NEXT: Total Cycles: 660 2868# CHECK-NEXT: Total uOps: 4800 2869 2870# CHECK: Dispatch Width: 15 2871# CHECK-NEXT: uOps Per Cycle: 7.27 2872# CHECK-NEXT: IPC: 1.52 2873# CHECK-NEXT: Block RThroughput: 6.0 2874 2875# CHECK: Timeline view: 2876# CHECK-NEXT: 0123456 2877# CHECK-NEXT: Index 0123456789 2878 2879# CHECK: [0,0] DeeeeeeeeER .. ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 2880# CHECK-NEXT: [0,1] D=eE------R .. add x0, x27, #1 2881# CHECK-NEXT: [0,2] .DeeeeeeeeeER .. ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 2882# CHECK-NEXT: [0,3] .D=eE-------R .. add x0, x27, #1 2883# CHECK-NEXT: [0,4] . DeeeeeeeeER .. ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 2884# CHECK-NEXT: [0,5] . D=eE------R .. add x0, x27, #1 2885# CHECK-NEXT: [0,6] . DeeeeeeeeeER.. ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 2886# CHECK-NEXT: [0,7] . D=eE-------R.. add x0, x27, #1 2887# CHECK-NEXT: [0,8] . D=eeeeeeeeeER ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 2888# CHECK-NEXT: [0,9] . D==eE-------R add x0, x27, #1 2889 2890# CHECK: Average Wait times (based on the timeline view): 2891# CHECK-NEXT: [0]: Executions 2892# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2893# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2894# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2895 2896# CHECK: [0] [1] [2] [3] 2897# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 2898# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2899# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 2900# CHECK-NEXT: 3. 1 2.0 0.0 7.0 add x0, x27, #1 2901# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 2902# CHECK-NEXT: 5. 1 2.0 0.0 6.0 add x0, x27, #1 2903# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 2904# CHECK-NEXT: 7. 1 2.0 0.0 7.0 add x0, x27, #1 2905# CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 2906# CHECK-NEXT: 9. 1 3.0 0.0 7.0 add x0, x27, #1 2907# CHECK-NEXT: 1 1.7 0.2 3.3 <total> 2908 2909# CHECK: [38] Code Region - G39 2910 2911# CHECK: Iterations: 100 2912# CHECK-NEXT: Instructions: 1000 2913# CHECK-NEXT: Total Cycles: 4003 2914# CHECK-NEXT: Total uOps: 4500 2915 2916# CHECK: Dispatch Width: 15 2917# CHECK-NEXT: uOps Per Cycle: 1.12 2918# CHECK-NEXT: IPC: 0.25 2919# CHECK-NEXT: Block RThroughput: 5.0 2920 2921# CHECK: Timeline view: 2922# CHECK-NEXT: 0123456789 0123456789 2923# CHECK-NEXT: Index 0123456789 0123456789 012 2924 2925# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 2926# CHECK-NEXT: [0,1] D=eE------R . . . . . . . add x0, x27, #1 2927# CHECK-NEXT: [0,2] .D=======eeeeeeeeER . . . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 2928# CHECK-NEXT: [0,3] .D========eE------R . . . . . . add x0, x27, #1 2929# CHECK-NEXT: [0,4] . D==============eeeeeeeeER . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 2930# CHECK-NEXT: [0,5] . D===============eE------R . . . . add x0, x27, #1 2931# CHECK-NEXT: [0,6] . D=====================eeeeeeeeER. . . ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 2932# CHECK-NEXT: [0,7] . D======================eE------R. . . add x0, x27, #1 2933# CHECK-NEXT: [0,8] . D============================eeeeeeeeER ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 2934# CHECK-NEXT: [0,9] . D=============================eE------R add x0, x27, #1 2935 2936# CHECK: Average Wait times (based on the timeline view): 2937# CHECK-NEXT: [0]: Executions 2938# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2939# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2940# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2941 2942# CHECK: [0] [1] [2] [3] 2943# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 2944# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2945# CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 2946# CHECK-NEXT: 3. 1 9.0 0.0 6.0 add x0, x27, #1 2947# CHECK-NEXT: 4. 1 15.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 2948# CHECK-NEXT: 5. 1 16.0 0.0 6.0 add x0, x27, #1 2949# CHECK-NEXT: 6. 1 22.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 2950# CHECK-NEXT: 7. 1 23.0 0.0 6.0 add x0, x27, #1 2951# CHECK-NEXT: 8. 1 29.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 2952# CHECK-NEXT: 9. 1 30.0 0.0 6.0 add x0, x27, #1 2953# CHECK-NEXT: 1 15.5 0.1 3.0 <total> 2954 2955# CHECK: [39] Code Region - G40 2956 2957# CHECK: Iterations: 100 2958# CHECK-NEXT: Instructions: 1000 2959# CHECK-NEXT: Total Cycles: 4003 2960# CHECK-NEXT: Total uOps: 4500 2961 2962# CHECK: Dispatch Width: 15 2963# CHECK-NEXT: uOps Per Cycle: 1.12 2964# CHECK-NEXT: IPC: 0.25 2965# CHECK-NEXT: Block RThroughput: 5.0 2966 2967# CHECK: Timeline view: 2968# CHECK-NEXT: 0123456789 0123456789 2969# CHECK-NEXT: Index 0123456789 0123456789 012 2970 2971# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 2972# CHECK-NEXT: [0,1] D=eE------R . . . . . . . add x0, x27, #1 2973# CHECK-NEXT: [0,2] .D=======eeeeeeeeER . . . . . . ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 2974# CHECK-NEXT: [0,3] .D========eE------R . . . . . . add x0, x27, #1 2975# CHECK-NEXT: [0,4] . D==============eeeeeeeeER . . . . ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 2976# CHECK-NEXT: [0,5] . D===============eE------R . . . . add x0, x27, #1 2977# CHECK-NEXT: [0,6] . D=====================eeeeeeeeER. . . ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 2978# CHECK-NEXT: [0,7] . D======================eE------R. . . add x0, x27, #1 2979# CHECK-NEXT: [0,8] . D============================eeeeeeeeER ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 2980# CHECK-NEXT: [0,9] . D=============================eE------R add x0, x27, #1 2981 2982# CHECK: Average Wait times (based on the timeline view): 2983# CHECK-NEXT: [0]: Executions 2984# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2985# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2986# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2987 2988# CHECK: [0] [1] [2] [3] 2989# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 2990# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 2991# CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 2992# CHECK-NEXT: 3. 1 9.0 0.0 6.0 add x0, x27, #1 2993# CHECK-NEXT: 4. 1 15.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 2994# CHECK-NEXT: 5. 1 16.0 0.0 6.0 add x0, x27, #1 2995# CHECK-NEXT: 6. 1 22.0 0.0 0.0 ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 2996# CHECK-NEXT: 7. 1 23.0 0.0 6.0 add x0, x27, #1 2997# CHECK-NEXT: 8. 1 29.0 0.0 0.0 ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 2998# CHECK-NEXT: 9. 1 30.0 0.0 6.0 add x0, x27, #1 2999# CHECK-NEXT: 1 15.5 0.1 3.0 <total> 3000 3001# CHECK: [40] Code Region - G41 3002 3003# CHECK: Iterations: 100 3004# CHECK-NEXT: Instructions: 1000 3005# CHECK-NEXT: Total Cycles: 1903 3006# CHECK-NEXT: Total uOps: 4500 3007 3008# CHECK: Dispatch Width: 15 3009# CHECK-NEXT: uOps Per Cycle: 2.36 3010# CHECK-NEXT: IPC: 0.53 3011# CHECK-NEXT: Block RThroughput: 5.0 3012 3013# CHECK: Timeline view: 3014# CHECK-NEXT: 0123456789 3015# CHECK-NEXT: Index 0123456789 01 3016 3017# CHECK: [0,0] DeeeeeeeeER . .. ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 3018# CHECK-NEXT: [0,1] D=eE------R . .. add x0, x27, #1 3019# CHECK-NEXT: [0,2] .D=======eeeeeeeeER .. ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 3020# CHECK-NEXT: [0,3] .D========eE------R .. add x0, x27, #1 3021# CHECK-NEXT: [0,4] . D=======eeeeeeeeER.. ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 3022# CHECK-NEXT: [0,5] . D========eE------R.. add x0, x27, #1 3023# CHECK-NEXT: [0,6] . D=======eeeeeeeeER. ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32 3024# CHECK-NEXT: [0,7] . D========eE------R. add x0, x27, #1 3025# CHECK-NEXT: [0,8] . D=======eeeeeeeeER ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16 3026# CHECK-NEXT: [0,9] . D========eE------R add x0, x27, #1 3027 3028# CHECK: Average Wait times (based on the timeline view): 3029# CHECK-NEXT: [0]: Executions 3030# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3031# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3032# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3033 3034# CHECK: [0] [1] [2] [3] 3035# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 3036# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 3037# CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 3038# CHECK-NEXT: 3. 1 9.0 0.0 6.0 add x0, x27, #1 3039# CHECK-NEXT: 4. 1 8.0 0.0 0.0 ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 3040# CHECK-NEXT: 5. 1 9.0 0.0 6.0 add x0, x27, #1 3041# CHECK-NEXT: 6. 1 8.0 0.0 0.0 ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32 3042# CHECK-NEXT: 7. 1 9.0 0.0 6.0 add x0, x27, #1 3043# CHECK-NEXT: 8. 1 8.0 0.0 0.0 ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16 3044# CHECK-NEXT: 9. 1 9.0 0.0 6.0 add x0, x27, #1 3045# CHECK-NEXT: 1 7.1 0.1 3.0 <total> 3046 3047# CHECK: [41] Code Region - G42 3048 3049# CHECK: Iterations: 100 3050# CHECK-NEXT: Instructions: 1000 3051# CHECK-NEXT: Total Cycles: 510 3052# CHECK-NEXT: Total uOps: 4500 3053 3054# CHECK: Dispatch Width: 15 3055# CHECK-NEXT: uOps Per Cycle: 8.82 3056# CHECK-NEXT: IPC: 1.96 3057# CHECK-NEXT: Block RThroughput: 5.0 3058 3059# CHECK: Timeline view: 3060# CHECK-NEXT: 01234 3061# CHECK-NEXT: Index 0123456789 3062 3063# CHECK: [0,0] DeeeeeeeeER . ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8 3064# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 3065# CHECK-NEXT: [0,2] .DeeeeeeeeER . ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16 3066# CHECK-NEXT: [0,3] .D=eE------R . add x0, x27, #1 3067# CHECK-NEXT: [0,4] . DeeeeeeeeER . ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4 3068# CHECK-NEXT: [0,5] . D=eE------R . add x0, x27, #1 3069# CHECK-NEXT: [0,6] . DeeeeeeeeER. ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8 3070# CHECK-NEXT: [0,7] . D=eE------R. add x0, x27, #1 3071# CHECK-NEXT: [0,8] . DeeeeeeeeER ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4 3072# CHECK-NEXT: [0,9] . D=eE------R add x0, x27, #1 3073 3074# CHECK: Average Wait times (based on the timeline view): 3075# CHECK-NEXT: [0]: Executions 3076# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3077# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3078# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3079 3080# CHECK: [0] [1] [2] [3] 3081# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8 3082# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 3083# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16 3084# CHECK-NEXT: 3. 1 2.0 0.0 6.0 add x0, x27, #1 3085# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4 3086# CHECK-NEXT: 5. 1 2.0 0.0 6.0 add x0, x27, #1 3087# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8 3088# CHECK-NEXT: 7. 1 2.0 0.0 6.0 add x0, x27, #1 3089# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4 3090# CHECK-NEXT: 9. 1 2.0 0.0 6.0 add x0, x27, #1 3091# CHECK-NEXT: 1 1.5 0.1 3.0 <total> 3092 3093# CHECK: [42] Code Region - G43 3094 3095# CHECK: Iterations: 100 3096# CHECK-NEXT: Instructions: 1000 3097# CHECK-NEXT: Total Cycles: 510 3098# CHECK-NEXT: Total uOps: 4500 3099 3100# CHECK: Dispatch Width: 15 3101# CHECK-NEXT: uOps Per Cycle: 8.82 3102# CHECK-NEXT: IPC: 1.96 3103# CHECK-NEXT: Block RThroughput: 5.0 3104 3105# CHECK: Timeline view: 3106# CHECK-NEXT: 01234 3107# CHECK-NEXT: Index 0123456789 3108 3109# CHECK: [0,0] DeeeeeeeeER . ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 3110# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 3111# CHECK-NEXT: [0,2] .DeeeeeeeeER . ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 3112# CHECK-NEXT: [0,3] .D=eE------R . add x0, x27, #1 3113# CHECK-NEXT: [0,4] . DeeeeeeeeER . ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 3114# CHECK-NEXT: [0,5] . D=eE------R . add x0, x27, #1 3115# CHECK-NEXT: [0,6] . DeeeeeeeeER. ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 3116# CHECK-NEXT: [0,7] . D=eE------R. add x0, x27, #1 3117# CHECK-NEXT: [0,8] . DeeeeeeeeER ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 3118# CHECK-NEXT: [0,9] . D=eE------R add x0, x27, #1 3119 3120# CHECK: Average Wait times (based on the timeline view): 3121# CHECK-NEXT: [0]: Executions 3122# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3123# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3124# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3125 3126# CHECK: [0] [1] [2] [3] 3127# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 3128# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 3129# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 3130# CHECK-NEXT: 3. 1 2.0 0.0 6.0 add x0, x27, #1 3131# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 3132# CHECK-NEXT: 5. 1 2.0 0.0 6.0 add x0, x27, #1 3133# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 3134# CHECK-NEXT: 7. 1 2.0 0.0 6.0 add x0, x27, #1 3135# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 3136# CHECK-NEXT: 9. 1 2.0 0.0 6.0 add x0, x27, #1 3137# CHECK-NEXT: 1 1.5 0.1 3.0 <total> 3138 3139# CHECK: [43] Code Region - G44 3140 3141# CHECK: Iterations: 100 3142# CHECK-NEXT: Instructions: 1000 3143# CHECK-NEXT: Total Cycles: 508 3144# CHECK-NEXT: Total uOps: 3300 3145 3146# CHECK: Dispatch Width: 15 3147# CHECK-NEXT: uOps Per Cycle: 6.50 3148# CHECK-NEXT: IPC: 1.97 3149# CHECK-NEXT: Block RThroughput: 3.7 3150 3151# CHECK: Timeline view: 3152# CHECK-NEXT: 012 3153# CHECK-NEXT: Index 0123456789 3154 3155# CHECK: [0,0] DeeeeeeeeER . ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 3156# CHECK-NEXT: [0,1] D=eE------R . add x0, x27, #1 3157# CHECK-NEXT: [0,2] .DeeeeeeeeER. ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 3158# CHECK-NEXT: [0,3] .D=eE------R. add x0, x27, #1 3159# CHECK-NEXT: [0,4] . DeeeeeeeeER ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 3160# CHECK-NEXT: [0,5] . D=eE------R add x0, x27, #1 3161# CHECK-NEXT: [0,6] . D=eeeeeeE-R ldp s1, s2, [x27], #248 3162# CHECK-NEXT: [0,7] . D==eE-----R add x0, x27, #1 3163# CHECK-NEXT: [0,8] . D==eeeeeeER ldp d1, d2, [x27], #496 3164# CHECK-NEXT: [0,9] . D===eE----R add x0, x27, #1 3165 3166# CHECK: Average Wait times (based on the timeline view): 3167# CHECK-NEXT: [0]: Executions 3168# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3169# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3170# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3171 3172# CHECK: [0] [1] [2] [3] 3173# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 3174# CHECK-NEXT: 1. 1 2.0 0.0 6.0 add x0, x27, #1 3175# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 3176# CHECK-NEXT: 3. 1 2.0 0.0 6.0 add x0, x27, #1 3177# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 3178# CHECK-NEXT: 5. 1 2.0 0.0 6.0 add x0, x27, #1 3179# CHECK-NEXT: 6. 1 2.0 0.0 1.0 ldp s1, s2, [x27], #248 3180# CHECK-NEXT: 7. 1 3.0 0.0 5.0 add x0, x27, #1 3181# CHECK-NEXT: 8. 1 3.0 0.0 0.0 ldp d1, d2, [x27], #496 3182# CHECK-NEXT: 9. 1 4.0 0.0 4.0 add x0, x27, #1 3183# CHECK-NEXT: 1 2.1 0.1 2.8 <total> 3184 3185# CHECK: [44] Code Region - G45 3186 3187# CHECK: Iterations: 100 3188# CHECK-NEXT: Instructions: 1000 3189# CHECK-NEXT: Total Cycles: 507 3190# CHECK-NEXT: Total uOps: 1700 3191 3192# CHECK: Dispatch Width: 15 3193# CHECK-NEXT: uOps Per Cycle: 3.35 3194# CHECK-NEXT: IPC: 1.97 3195# CHECK-NEXT: Block RThroughput: 2.5 3196 3197# CHECK: Timeline view: 3198# CHECK-NEXT: 01 3199# CHECK-NEXT: Index 0123456789 3200 3201# CHECK: [0,0] DeeeeeeER .. ldp q1, q2, [x27], #992 3202# CHECK-NEXT: [0,1] D=eE----R .. add x0, x27, #1 3203# CHECK-NEXT: [0,2] D=eeeeeeER.. ldp s1, s2, [x27, #248]! 3204# CHECK-NEXT: [0,3] D==eE----R.. add x0, x27, #1 3205# CHECK-NEXT: [0,4] D==eeeeeeER. ldp d1, d2, [x27, #496]! 3206# CHECK-NEXT: [0,5] D===eE----R. add x0, x27, #1 3207# CHECK-NEXT: [0,6] D===eeeeeeER ldp q1, q2, [x27, #992]! 3208# CHECK-NEXT: [0,7] D====eE----R add x0, x27, #1 3209# CHECK-NEXT: [0,8] .D===eeeeE-R ldp w1, w2, [x27], #248 3210# CHECK-NEXT: [0,9] .D====eE---R add x0, x27, #1 3211 3212# CHECK: Average Wait times (based on the timeline view): 3213# CHECK-NEXT: [0]: Executions 3214# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3215# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3216# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3217 3218# CHECK: [0] [1] [2] [3] 3219# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldp q1, q2, [x27], #992 3220# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 3221# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ldp s1, s2, [x27, #248]! 3222# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 3223# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ldp d1, d2, [x27, #496]! 3224# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 3225# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ldp q1, q2, [x27, #992]! 3226# CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1 3227# CHECK-NEXT: 8. 1 4.0 0.0 1.0 ldp w1, w2, [x27], #248 3228# CHECK-NEXT: 9. 1 5.0 0.0 3.0 add x0, x27, #1 3229# CHECK-NEXT: 1 3.3 0.1 2.0 <total> 3230 3231# CHECK: [45] Code Region - G46 3232 3233# CHECK: Iterations: 100 3234# CHECK-NEXT: Instructions: 1000 3235# CHECK-NEXT: Total Cycles: 507 3236# CHECK-NEXT: Total uOps: 1900 3237 3238# CHECK: Dispatch Width: 15 3239# CHECK-NEXT: uOps Per Cycle: 3.75 3240# CHECK-NEXT: IPC: 1.97 3241# CHECK-NEXT: Block RThroughput: 3.0 3242 3243# CHECK: Timeline view: 3244# CHECK-NEXT: 01 3245# CHECK-NEXT: Index 0123456789 3246 3247# CHECK: [0,0] DeeeeER .. ldp x1, x2, [x27], #496 3248# CHECK-NEXT: [0,1] D=eE--R .. add x0, x27, #1 3249# CHECK-NEXT: [0,2] D=eeeeER .. ldp w1, w2, [x27, #248]! 3250# CHECK-NEXT: [0,3] D==eE--R .. add x0, x27, #1 3251# CHECK-NEXT: [0,4] D==eeeeER .. ldp x1, x2, [x27, #496]! 3252# CHECK-NEXT: [0,5] D===eE--R .. add x0, x27, #1 3253# CHECK-NEXT: [0,6] D===eeeeeER. ldpsw x1, x2, [x27], #248 3254# CHECK-NEXT: [0,7] D====eE---R. add x0, x27, #1 3255# CHECK-NEXT: [0,8] .D===eeeeeER ldpsw x1, x2, [x27, #248]! 3256# CHECK-NEXT: [0,9] .D====eE---R add x0, x27, #1 3257 3258# CHECK: Average Wait times (based on the timeline view): 3259# CHECK-NEXT: [0]: Executions 3260# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3261# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3262# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3263 3264# CHECK: [0] [1] [2] [3] 3265# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldp x1, x2, [x27], #496 3266# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3267# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ldp w1, w2, [x27, #248]! 3268# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 3269# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ldp x1, x2, [x27, #496]! 3270# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 3271# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ldpsw x1, x2, [x27], #248 3272# CHECK-NEXT: 7. 1 5.0 0.0 3.0 add x0, x27, #1 3273# CHECK-NEXT: 8. 1 4.0 0.0 0.0 ldpsw x1, x2, [x27, #248]! 3274# CHECK-NEXT: 9. 1 5.0 0.0 3.0 add x0, x27, #1 3275# CHECK-NEXT: 1 3.3 0.1 1.2 <total> 3276 3277# CHECK: [46] Code Region - G47 3278 3279# CHECK: Iterations: 100 3280# CHECK-NEXT: Instructions: 1000 3281# CHECK-NEXT: Total Cycles: 508 3282# CHECK-NEXT: Total uOps: 1500 3283 3284# CHECK: Dispatch Width: 15 3285# CHECK-NEXT: uOps Per Cycle: 2.95 3286# CHECK-NEXT: IPC: 1.97 3287# CHECK-NEXT: Block RThroughput: 2.5 3288 3289# CHECK: Timeline view: 3290# CHECK-NEXT: 012 3291# CHECK-NEXT: Index 0123456789 3292 3293# CHECK: [0,0] DeeeeeeER . . ldr b1, [x27], #254 3294# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 3295# CHECK-NEXT: [0,2] D=eeeeeeER. . ldr h1, [x27], #254 3296# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 3297# CHECK-NEXT: [0,4] D==eeeeeeER . ldr s1, [x27], #254 3298# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 3299# CHECK-NEXT: [0,6] D===eeeeeeER. ldr d1, [x27], #254 3300# CHECK-NEXT: [0,7] D====eE----R. add x0, x27, #1 3301# CHECK-NEXT: [0,8] D====eeeeeeER ldr q1, [x27], #254 3302# CHECK-NEXT: [0,9] D=====eE----R add x0, x27, #1 3303 3304# CHECK: Average Wait times (based on the timeline view): 3305# CHECK-NEXT: [0]: Executions 3306# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3307# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3308# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3309 3310# CHECK: [0] [1] [2] [3] 3311# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr b1, [x27], #254 3312# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 3313# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ldr h1, [x27], #254 3314# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 3315# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ldr s1, [x27], #254 3316# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 3317# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ldr d1, [x27], #254 3318# CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1 3319# CHECK-NEXT: 8. 1 5.0 0.0 0.0 ldr q1, [x27], #254 3320# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 3321# CHECK-NEXT: 1 3.5 0.1 2.0 <total> 3322 3323# CHECK: [47] Code Region - G48 3324 3325# CHECK: Iterations: 100 3326# CHECK-NEXT: Instructions: 1000 3327# CHECK-NEXT: Total Cycles: 508 3328# CHECK-NEXT: Total uOps: 1500 3329 3330# CHECK: Dispatch Width: 15 3331# CHECK-NEXT: uOps Per Cycle: 2.95 3332# CHECK-NEXT: IPC: 1.97 3333# CHECK-NEXT: Block RThroughput: 2.5 3334 3335# CHECK: Timeline view: 3336# CHECK-NEXT: 012 3337# CHECK-NEXT: Index 0123456789 3338 3339# CHECK: [0,0] DeeeeeeER . . ldr b1, [x27, #254]! 3340# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 3341# CHECK-NEXT: [0,2] D=eeeeeeER. . ldr h1, [x27, #254]! 3342# CHECK-NEXT: [0,3] D==eE----R. . add x0, x27, #1 3343# CHECK-NEXT: [0,4] D==eeeeeeER . ldr s1, [x27, #254]! 3344# CHECK-NEXT: [0,5] D===eE----R . add x0, x27, #1 3345# CHECK-NEXT: [0,6] D===eeeeeeER. ldr d1, [x27, #254]! 3346# CHECK-NEXT: [0,7] D====eE----R. add x0, x27, #1 3347# CHECK-NEXT: [0,8] D====eeeeeeER ldr q1, [x27, #254]! 3348# CHECK-NEXT: [0,9] D=====eE----R add x0, x27, #1 3349 3350# CHECK: Average Wait times (based on the timeline view): 3351# CHECK-NEXT: [0]: Executions 3352# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3353# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3354# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3355 3356# CHECK: [0] [1] [2] [3] 3357# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr b1, [x27, #254]! 3358# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 3359# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ldr h1, [x27, #254]! 3360# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 3361# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ldr s1, [x27, #254]! 3362# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 3363# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ldr d1, [x27, #254]! 3364# CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1 3365# CHECK-NEXT: 8. 1 5.0 0.0 0.0 ldr q1, [x27, #254]! 3366# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 3367# CHECK-NEXT: 1 3.5 0.1 2.0 <total> 3368 3369# CHECK: [48] Code Region - G49 3370 3371# CHECK: Iterations: 100 3372# CHECK-NEXT: Instructions: 1000 3373# CHECK-NEXT: Total Cycles: 506 3374# CHECK-NEXT: Total uOps: 1500 3375 3376# CHECK: Dispatch Width: 15 3377# CHECK-NEXT: uOps Per Cycle: 2.96 3378# CHECK-NEXT: IPC: 1.98 3379# CHECK-NEXT: Block RThroughput: 2.5 3380 3381# CHECK: Timeline view: 3382# CHECK-NEXT: 0 3383# CHECK-NEXT: Index 0123456789 3384 3385# CHECK: [0,0] DeeeeER . ldr w1, [x27], #254 3386# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 3387# CHECK-NEXT: [0,2] D=eeeeER . ldr x1, [x27], #254 3388# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 3389# CHECK-NEXT: [0,4] D==eeeeER . ldr w1, [x27, #254]! 3390# CHECK-NEXT: [0,5] D===eE--R . add x0, x27, #1 3391# CHECK-NEXT: [0,6] D===eeeeER. ldr x1, [x27, #254]! 3392# CHECK-NEXT: [0,7] D====eE--R. add x0, x27, #1 3393# CHECK-NEXT: [0,8] D====eeeeER ldrb w1, [x27], #254 3394# CHECK-NEXT: [0,9] D=====eE--R add x0, x27, #1 3395 3396# CHECK: Average Wait times (based on the timeline view): 3397# CHECK-NEXT: [0]: Executions 3398# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3399# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3400# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3401 3402# CHECK: [0] [1] [2] [3] 3403# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr w1, [x27], #254 3404# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3405# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ldr x1, [x27], #254 3406# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 3407# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ldr w1, [x27, #254]! 3408# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 3409# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ldr x1, [x27, #254]! 3410# CHECK-NEXT: 7. 1 5.0 0.0 2.0 add x0, x27, #1 3411# CHECK-NEXT: 8. 1 5.0 0.0 0.0 ldrb w1, [x27], #254 3412# CHECK-NEXT: 9. 1 6.0 0.0 2.0 add x0, x27, #1 3413# CHECK-NEXT: 1 3.5 0.1 1.0 <total> 3414 3415# CHECK: [49] Code Region - G50 3416 3417# CHECK: Iterations: 100 3418# CHECK-NEXT: Instructions: 1000 3419# CHECK-NEXT: Total Cycles: 506 3420# CHECK-NEXT: Total uOps: 1500 3421 3422# CHECK: Dispatch Width: 15 3423# CHECK-NEXT: uOps Per Cycle: 2.96 3424# CHECK-NEXT: IPC: 1.98 3425# CHECK-NEXT: Block RThroughput: 2.5 3426 3427# CHECK: Timeline view: 3428# CHECK-NEXT: 0 3429# CHECK-NEXT: Index 0123456789 3430 3431# CHECK: [0,0] DeeeeER . ldrb w1, [x27, #254]! 3432# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 3433# CHECK-NEXT: [0,2] D=eeeeER . ldrh w1, [x27], #254 3434# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 3435# CHECK-NEXT: [0,4] D==eeeeER . ldrh w1, [x27, #254]! 3436# CHECK-NEXT: [0,5] D===eE--R . add x0, x27, #1 3437# CHECK-NEXT: [0,6] D===eeeeER. ldrsb w1, [x27], #254 3438# CHECK-NEXT: [0,7] D====eE--R. add x0, x27, #1 3439# CHECK-NEXT: [0,8] D====eeeeER ldrsb x1, [x27], #254 3440# CHECK-NEXT: [0,9] D=====eE--R add x0, x27, #1 3441 3442# CHECK: Average Wait times (based on the timeline view): 3443# CHECK-NEXT: [0]: Executions 3444# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3445# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3446# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3447 3448# CHECK: [0] [1] [2] [3] 3449# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrb w1, [x27, #254]! 3450# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3451# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ldrh w1, [x27], #254 3452# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 3453# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ldrh w1, [x27, #254]! 3454# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 3455# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ldrsb w1, [x27], #254 3456# CHECK-NEXT: 7. 1 5.0 0.0 2.0 add x0, x27, #1 3457# CHECK-NEXT: 8. 1 5.0 0.0 0.0 ldrsb x1, [x27], #254 3458# CHECK-NEXT: 9. 1 6.0 0.0 2.0 add x0, x27, #1 3459# CHECK-NEXT: 1 3.5 0.1 1.0 <total> 3460 3461# CHECK: [50] Code Region - G51 3462 3463# CHECK: Iterations: 100 3464# CHECK-NEXT: Instructions: 1000 3465# CHECK-NEXT: Total Cycles: 506 3466# CHECK-NEXT: Total uOps: 1500 3467 3468# CHECK: Dispatch Width: 15 3469# CHECK-NEXT: uOps Per Cycle: 2.96 3470# CHECK-NEXT: IPC: 1.98 3471# CHECK-NEXT: Block RThroughput: 2.5 3472 3473# CHECK: Timeline view: 3474# CHECK-NEXT: 0 3475# CHECK-NEXT: Index 0123456789 3476 3477# CHECK: [0,0] DeeeeER . ldrsb w1, [x27, #254]! 3478# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 3479# CHECK-NEXT: [0,2] D=eeeeER . ldrsb x1, [x27, #254]! 3480# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 3481# CHECK-NEXT: [0,4] D==eeeeER . ldrsh w1, [x27], #254 3482# CHECK-NEXT: [0,5] D===eE--R . add x0, x27, #1 3483# CHECK-NEXT: [0,6] D===eeeeER. ldrsh x1, [x27], #254 3484# CHECK-NEXT: [0,7] D====eE--R. add x0, x27, #1 3485# CHECK-NEXT: [0,8] D====eeeeER ldrsh w1, [x27, #254]! 3486# CHECK-NEXT: [0,9] D=====eE--R add x0, x27, #1 3487 3488# CHECK: Average Wait times (based on the timeline view): 3489# CHECK-NEXT: [0]: Executions 3490# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3491# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3492# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3493 3494# CHECK: [0] [1] [2] [3] 3495# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrsb w1, [x27, #254]! 3496# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3497# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ldrsb x1, [x27, #254]! 3498# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 3499# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ldrsh w1, [x27], #254 3500# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 3501# CHECK-NEXT: 6. 1 4.0 0.0 0.0 ldrsh x1, [x27], #254 3502# CHECK-NEXT: 7. 1 5.0 0.0 2.0 add x0, x27, #1 3503# CHECK-NEXT: 8. 1 5.0 0.0 0.0 ldrsh w1, [x27, #254]! 3504# CHECK-NEXT: 9. 1 6.0 0.0 2.0 add x0, x27, #1 3505# CHECK-NEXT: 1 3.5 0.1 1.0 <total> 3506 3507# CHECK: [51] Code Region - G52 3508 3509# CHECK: Iterations: 100 3510# CHECK-NEXT: Instructions: 1000 3511# CHECK-NEXT: Total Cycles: 504 3512# CHECK-NEXT: Total uOps: 1700 3513 3514# CHECK: Dispatch Width: 15 3515# CHECK-NEXT: uOps Per Cycle: 3.37 3516# CHECK-NEXT: IPC: 1.98 3517# CHECK-NEXT: Block RThroughput: 2.5 3518 3519# CHECK: Timeline view: 3520# CHECK-NEXT: Index 012345678 3521 3522# CHECK: [0,0] DeeeeER . ldrsh x1, [x27, #254]! 3523# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 3524# CHECK-NEXT: [0,2] D=eeeeER. ldrsw x1, [x27], #254 3525# CHECK-NEXT: [0,3] D==eE--R. add x0, x27, #1 3526# CHECK-NEXT: [0,4] D==eeeeER ldrsw x1, [x27, #254]! 3527# CHECK-NEXT: [0,5] D===eE--R add x0, x27, #1 3528# CHECK-NEXT: [0,6] D===eeE-R st1 { v1.1d }, [x27], #8 3529# CHECK-NEXT: [0,7] D====eE-R add x0, x27, #1 3530# CHECK-NEXT: [0,8] .D===eeER st1 { v1.2d }, [x27], #16 3531# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 3532 3533# CHECK: Average Wait times (based on the timeline view): 3534# CHECK-NEXT: [0]: Executions 3535# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3536# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3537# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3538 3539# CHECK: [0] [1] [2] [3] 3540# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrsh x1, [x27, #254]! 3541# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3542# CHECK-NEXT: 2. 1 2.0 0.0 0.0 ldrsw x1, [x27], #254 3543# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 3544# CHECK-NEXT: 4. 1 3.0 0.0 0.0 ldrsw x1, [x27, #254]! 3545# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 3546# CHECK-NEXT: 6. 1 4.0 0.0 1.0 st1 { v1.1d }, [x27], #8 3547# CHECK-NEXT: 7. 1 5.0 0.0 1.0 add x0, x27, #1 3548# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.2d }, [x27], #16 3549# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3550# CHECK-NEXT: 1 3.3 0.1 0.8 <total> 3551 3552# CHECK: [52] Code Region - G53 3553 3554# CHECK: Iterations: 100 3555# CHECK-NEXT: Instructions: 1000 3556# CHECK-NEXT: Total Cycles: 504 3557# CHECK-NEXT: Total uOps: 2000 3558 3559# CHECK: Dispatch Width: 15 3560# CHECK-NEXT: uOps Per Cycle: 3.97 3561# CHECK-NEXT: IPC: 1.98 3562# CHECK-NEXT: Block RThroughput: 2.5 3563 3564# CHECK: Timeline view: 3565# CHECK-NEXT: Index 012345678 3566 3567# CHECK: [0,0] DeeER. . st1 { v1.2s }, [x27], #8 3568# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3569# CHECK-NEXT: [0,2] D=eeER . st1 { v1.4h }, [x27], #8 3570# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3571# CHECK-NEXT: [0,4] D==eeER . st1 { v1.4s }, [x27], #16 3572# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 3573# CHECK-NEXT: [0,6] D===eeER. st1 { v1.8b }, [x27], #8 3574# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 3575# CHECK-NEXT: [0,8] .D===eeER st1 { v1.8h }, [x27], #16 3576# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 3577 3578# CHECK: Average Wait times (based on the timeline view): 3579# CHECK-NEXT: [0]: Executions 3580# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3581# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3582# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3583 3584# CHECK: [0] [1] [2] [3] 3585# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2s }, [x27], #8 3586# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3587# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.4h }, [x27], #8 3588# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3589# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st1 { v1.4s }, [x27], #16 3590# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 3591# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st1 { v1.8b }, [x27], #8 3592# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 3593# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.8h }, [x27], #16 3594# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3595# CHECK-NEXT: 1 3.2 0.1 0.0 <total> 3596 3597# CHECK: [53] Code Region - G54 3598 3599# CHECK: Iterations: 100 3600# CHECK-NEXT: Instructions: 1000 3601# CHECK-NEXT: Total Cycles: 504 3602# CHECK-NEXT: Total uOps: 2000 3603 3604# CHECK: Dispatch Width: 15 3605# CHECK-NEXT: uOps Per Cycle: 3.97 3606# CHECK-NEXT: IPC: 1.98 3607# CHECK-NEXT: Block RThroughput: 2.5 3608 3609# CHECK: Timeline view: 3610# CHECK-NEXT: Index 012345678 3611 3612# CHECK: [0,0] DeeER. . st1 { v1.16b }, [x27], #16 3613# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3614# CHECK-NEXT: [0,2] D=eeER . st1 { v1.1d }, [x27], x28 3615# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3616# CHECK-NEXT: [0,4] D==eeER . st1 { v1.2d }, [x27], x28 3617# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 3618# CHECK-NEXT: [0,6] D===eeER. st1 { v1.2s }, [x27], x28 3619# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 3620# CHECK-NEXT: [0,8] .D===eeER st1 { v1.4h }, [x27], x28 3621# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 3622 3623# CHECK: Average Wait times (based on the timeline view): 3624# CHECK-NEXT: [0]: Executions 3625# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3626# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3627# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3628 3629# CHECK: [0] [1] [2] [3] 3630# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.16b }, [x27], #16 3631# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3632# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.1d }, [x27], x28 3633# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3634# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st1 { v1.2d }, [x27], x28 3635# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 3636# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st1 { v1.2s }, [x27], x28 3637# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 3638# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.4h }, [x27], x28 3639# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3640# CHECK-NEXT: 1 3.2 0.1 0.0 <total> 3641 3642# CHECK: [54] Code Region - G55 3643 3644# CHECK: Iterations: 100 3645# CHECK-NEXT: Instructions: 1000 3646# CHECK-NEXT: Total Cycles: 504 3647# CHECK-NEXT: Total uOps: 2000 3648 3649# CHECK: Dispatch Width: 15 3650# CHECK-NEXT: uOps Per Cycle: 3.97 3651# CHECK-NEXT: IPC: 1.98 3652# CHECK-NEXT: Block RThroughput: 2.5 3653 3654# CHECK: Timeline view: 3655# CHECK-NEXT: Index 012345678 3656 3657# CHECK: [0,0] DeeER. . st1 { v1.4s }, [x27], x28 3658# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3659# CHECK-NEXT: [0,2] D=eeER . st1 { v1.8b }, [x27], x28 3660# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3661# CHECK-NEXT: [0,4] D==eeER . st1 { v1.8h }, [x27], x28 3662# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 3663# CHECK-NEXT: [0,6] D===eeER. st1 { v1.16b }, [x27], x28 3664# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 3665# CHECK-NEXT: [0,8] .D===eeER st1 { v1.1d, v2.1d }, [x27], #16 3666# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 3667 3668# CHECK: Average Wait times (based on the timeline view): 3669# CHECK-NEXT: [0]: Executions 3670# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3671# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3672# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3673 3674# CHECK: [0] [1] [2] [3] 3675# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4s }, [x27], x28 3676# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3677# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.8b }, [x27], x28 3678# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3679# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st1 { v1.8h }, [x27], x28 3680# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 3681# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st1 { v1.16b }, [x27], x28 3682# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 3683# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.1d, v2.1d }, [x27], #16 3684# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3685# CHECK-NEXT: 1 3.2 0.1 0.0 <total> 3686 3687# CHECK: [55] Code Region - G56 3688 3689# CHECK: Iterations: 100 3690# CHECK-NEXT: Instructions: 1000 3691# CHECK-NEXT: Total Cycles: 504 3692# CHECK-NEXT: Total uOps: 2400 3693 3694# CHECK: Dispatch Width: 15 3695# CHECK-NEXT: uOps Per Cycle: 4.76 3696# CHECK-NEXT: IPC: 1.98 3697# CHECK-NEXT: Block RThroughput: 3.5 3698 3699# CHECK: Timeline view: 3700# CHECK-NEXT: Index 012345678 3701 3702# CHECK: [0,0] DeeER. . st1 { v1.2d, v2.2d }, [x27], #32 3703# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3704# CHECK-NEXT: [0,2] D=eeER . st1 { v1.2s, v2.2s }, [x27], #16 3705# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3706# CHECK-NEXT: [0,4] D==eeER . st1 { v1.4h, v2.4h }, [x27], #16 3707# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 3708# CHECK-NEXT: [0,6] .D==eeER. st1 { v1.4s, v2.4s }, [x27], #32 3709# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 3710# CHECK-NEXT: [0,8] .D===eeER st1 { v1.8b, v2.8b }, [x27], #16 3711# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 3712 3713# CHECK: Average Wait times (based on the timeline view): 3714# CHECK-NEXT: [0]: Executions 3715# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3716# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3717# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3718 3719# CHECK: [0] [1] [2] [3] 3720# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2d, v2.2d }, [x27], #32 3721# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3722# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.2s, v2.2s }, [x27], #16 3723# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3724# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st1 { v1.4h, v2.4h }, [x27], #16 3725# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 3726# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st1 { v1.4s, v2.4s }, [x27], #32 3727# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 3728# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.8b, v2.8b }, [x27], #16 3729# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3730# CHECK-NEXT: 1 3.1 0.1 0.0 <total> 3731 3732# CHECK: [56] Code Region - G57 3733 3734# CHECK: Iterations: 100 3735# CHECK-NEXT: Instructions: 1000 3736# CHECK-NEXT: Total Cycles: 504 3737# CHECK-NEXT: Total uOps: 2600 3738 3739# CHECK: Dispatch Width: 15 3740# CHECK-NEXT: uOps Per Cycle: 5.16 3741# CHECK-NEXT: IPC: 1.98 3742# CHECK-NEXT: Block RThroughput: 4.0 3743 3744# CHECK: Timeline view: 3745# CHECK-NEXT: Index 012345678 3746 3747# CHECK: [0,0] DeeER. . st1 { v1.8h, v2.8h }, [x27], #32 3748# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3749# CHECK-NEXT: [0,2] D=eeER . st1 { v1.16b, v2.16b }, [x27], #32 3750# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3751# CHECK-NEXT: [0,4] D==eeER . st1 { v1.1d, v2.1d }, [x27], x28 3752# CHECK-NEXT: [0,5] .D==eER . add x0, x27, #1 3753# CHECK-NEXT: [0,6] .D==eeER. st1 { v1.2d, v2.2d }, [x27], x28 3754# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 3755# CHECK-NEXT: [0,8] .D===eeER st1 { v1.2s, v2.2s }, [x27], x28 3756# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 3757 3758# CHECK: Average Wait times (based on the timeline view): 3759# CHECK-NEXT: [0]: Executions 3760# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3761# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3762# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3763 3764# CHECK: [0] [1] [2] [3] 3765# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8h, v2.8h }, [x27], #32 3766# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3767# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.16b, v2.16b }, [x27], #32 3768# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3769# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st1 { v1.1d, v2.1d }, [x27], x28 3770# CHECK-NEXT: 5. 1 3.0 0.0 0.0 add x0, x27, #1 3771# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st1 { v1.2d, v2.2d }, [x27], x28 3772# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 3773# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.2s, v2.2s }, [x27], x28 3774# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3775# CHECK-NEXT: 1 3.0 0.1 0.0 <total> 3776 3777# CHECK: [57] Code Region - G58 3778 3779# CHECK: Iterations: 100 3780# CHECK-NEXT: Instructions: 1000 3781# CHECK-NEXT: Total Cycles: 504 3782# CHECK-NEXT: Total uOps: 2600 3783 3784# CHECK: Dispatch Width: 15 3785# CHECK-NEXT: uOps Per Cycle: 5.16 3786# CHECK-NEXT: IPC: 1.98 3787# CHECK-NEXT: Block RThroughput: 4.0 3788 3789# CHECK: Timeline view: 3790# CHECK-NEXT: Index 012345678 3791 3792# CHECK: [0,0] DeeER. . st1 { v1.4h, v2.4h }, [x27], x28 3793# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3794# CHECK-NEXT: [0,2] D=eeER . st1 { v1.4s, v2.4s }, [x27], x28 3795# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3796# CHECK-NEXT: [0,4] D==eeER . st1 { v1.8b, v2.8b }, [x27], x28 3797# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 3798# CHECK-NEXT: [0,6] .D==eeER. st1 { v1.8h, v2.8h }, [x27], x28 3799# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 3800# CHECK-NEXT: [0,8] .D===eeER st1 { v1.16b, v2.16b }, [x27], x28 3801# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 3802 3803# CHECK: Average Wait times (based on the timeline view): 3804# CHECK-NEXT: [0]: Executions 3805# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3806# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3807# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3808 3809# CHECK: [0] [1] [2] [3] 3810# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4h, v2.4h }, [x27], x28 3811# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3812# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.4s, v2.4s }, [x27], x28 3813# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3814# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st1 { v1.8b, v2.8b }, [x27], x28 3815# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 3816# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st1 { v1.8h, v2.8h }, [x27], x28 3817# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 3818# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.16b, v2.16b }, [x27], x28 3819# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3820# CHECK-NEXT: 1 3.1 0.1 0.0 <total> 3821 3822# CHECK: [58] Code Region - G59 3823 3824# CHECK: Iterations: 100 3825# CHECK-NEXT: Instructions: 1000 3826# CHECK-NEXT: Total Cycles: 703 3827# CHECK-NEXT: Total uOps: 3400 3828 3829# CHECK: Dispatch Width: 15 3830# CHECK-NEXT: uOps Per Cycle: 4.84 3831# CHECK-NEXT: IPC: 1.42 3832# CHECK-NEXT: Block RThroughput: 6.0 3833 3834# CHECK: Timeline view: 3835# CHECK-NEXT: Index 0123456789 3836 3837# CHECK: [0,0] DeeER. . st1 { v1.1d, v2.1d, v3.1d }, [x27], #24 3838# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3839# CHECK-NEXT: [0,2] D=eeER . st1 { v1.2d, v2.2d, v3.2d }, [x27], #48 3840# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3841# CHECK-NEXT: [0,4] .D=eeER . st1 { v1.2s, v2.2s, v3.2s }, [x27], #24 3842# CHECK-NEXT: [0,5] .D==eER . add x0, x27, #1 3843# CHECK-NEXT: [0,6] .D===eeER. st1 { v1.4h, v2.4h, v3.4h }, [x27], #24 3844# CHECK-NEXT: [0,7] .D====eER. add x0, x27, #1 3845# CHECK-NEXT: [0,8] . D===eeER st1 { v1.4s, v2.4s, v3.4s }, [x27], #48 3846# CHECK-NEXT: [0,9] . D====eER add x0, x27, #1 3847 3848# CHECK: Average Wait times (based on the timeline view): 3849# CHECK-NEXT: [0]: Executions 3850# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3851# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3852# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3853 3854# CHECK: [0] [1] [2] [3] 3855# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.1d, v2.1d, v3.1d }, [x27], #24 3856# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3857# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.2d, v2.2d, v3.2d }, [x27], #48 3858# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3859# CHECK-NEXT: 4. 1 2.0 0.0 0.0 st1 { v1.2s, v2.2s, v3.2s }, [x27], #24 3860# CHECK-NEXT: 5. 1 3.0 0.0 0.0 add x0, x27, #1 3861# CHECK-NEXT: 6. 1 4.0 1.0 0.0 st1 { v1.4h, v2.4h, v3.4h }, [x27], #24 3862# CHECK-NEXT: 7. 1 5.0 0.0 0.0 add x0, x27, #1 3863# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.4s, v2.4s, v3.4s }, [x27], #48 3864# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3865# CHECK-NEXT: 1 3.1 0.2 0.0 <total> 3866 3867# CHECK: [59] Code Region - G60 3868 3869# CHECK: Iterations: 100 3870# CHECK-NEXT: Instructions: 1000 3871# CHECK-NEXT: Total Cycles: 703 3872# CHECK-NEXT: Total uOps: 3600 3873 3874# CHECK: Dispatch Width: 15 3875# CHECK-NEXT: uOps Per Cycle: 5.12 3876# CHECK-NEXT: IPC: 1.42 3877# CHECK-NEXT: Block RThroughput: 6.5 3878 3879# CHECK: Timeline view: 3880# CHECK-NEXT: Index 0123456789 3881 3882# CHECK: [0,0] DeeER. . st1 { v1.8b, v2.8b, v3.8b }, [x27], #24 3883# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3884# CHECK-NEXT: [0,2] D=eeER . st1 { v1.8h, v2.8h, v3.8h }, [x27], #48 3885# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3886# CHECK-NEXT: [0,4] .D=eeER . st1 { v1.16b, v2.16b, v3.16b }, [x27], #48 3887# CHECK-NEXT: [0,5] .D==eER . add x0, x27, #1 3888# CHECK-NEXT: [0,6] .D===eeER. st1 { v1.1d, v2.1d, v3.1d }, [x27], x28 3889# CHECK-NEXT: [0,7] .D====eER. add x0, x27, #1 3890# CHECK-NEXT: [0,8] . D===eeER st1 { v1.2d, v2.2d, v3.2d }, [x27], x28 3891# CHECK-NEXT: [0,9] . D====eER add x0, x27, #1 3892 3893# CHECK: Average Wait times (based on the timeline view): 3894# CHECK-NEXT: [0]: Executions 3895# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3896# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3897# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3898 3899# CHECK: [0] [1] [2] [3] 3900# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8b, v2.8b, v3.8b }, [x27], #24 3901# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3902# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.8h, v2.8h, v3.8h }, [x27], #48 3903# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3904# CHECK-NEXT: 4. 1 2.0 0.0 0.0 st1 { v1.16b, v2.16b, v3.16b }, [x27], #48 3905# CHECK-NEXT: 5. 1 3.0 0.0 0.0 add x0, x27, #1 3906# CHECK-NEXT: 6. 1 4.0 1.0 0.0 st1 { v1.1d, v2.1d, v3.1d }, [x27], x28 3907# CHECK-NEXT: 7. 1 5.0 0.0 0.0 add x0, x27, #1 3908# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.2d, v2.2d, v3.2d }, [x27], x28 3909# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3910# CHECK-NEXT: 1 3.1 0.2 0.0 <total> 3911 3912# CHECK: [60] Code Region - G61 3913 3914# CHECK: Iterations: 100 3915# CHECK-NEXT: Instructions: 1000 3916# CHECK-NEXT: Total Cycles: 703 3917# CHECK-NEXT: Total uOps: 3400 3918 3919# CHECK: Dispatch Width: 15 3920# CHECK-NEXT: uOps Per Cycle: 4.84 3921# CHECK-NEXT: IPC: 1.42 3922# CHECK-NEXT: Block RThroughput: 6.0 3923 3924# CHECK: Timeline view: 3925# CHECK-NEXT: Index 0123456789 3926 3927# CHECK: [0,0] DeeER. . st1 { v1.2s, v2.2s, v3.2s }, [x27], x28 3928# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3929# CHECK-NEXT: [0,2] D=eeER . st1 { v1.4h, v2.4h, v3.4h }, [x27], x28 3930# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3931# CHECK-NEXT: [0,4] .D=eeER . st1 { v1.4s, v2.4s, v3.4s }, [x27], x28 3932# CHECK-NEXT: [0,5] .D==eER . add x0, x27, #1 3933# CHECK-NEXT: [0,6] .D==eeER . st1 { v1.8b, v2.8b, v3.8b }, [x27], x28 3934# CHECK-NEXT: [0,7] .D===eER . add x0, x27, #1 3935# CHECK-NEXT: [0,8] . D===eeER st1 { v1.8h, v2.8h, v3.8h }, [x27], x28 3936# CHECK-NEXT: [0,9] . D====eER add x0, x27, #1 3937 3938# CHECK: Average Wait times (based on the timeline view): 3939# CHECK-NEXT: [0]: Executions 3940# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3941# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3942# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3943 3944# CHECK: [0] [1] [2] [3] 3945# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2s, v2.2s, v3.2s }, [x27], x28 3946# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3947# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.4h, v2.4h, v3.4h }, [x27], x28 3948# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3949# CHECK-NEXT: 4. 1 2.0 0.0 0.0 st1 { v1.4s, v2.4s, v3.4s }, [x27], x28 3950# CHECK-NEXT: 5. 1 3.0 0.0 0.0 add x0, x27, #1 3951# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st1 { v1.8b, v2.8b, v3.8b }, [x27], x28 3952# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 3953# CHECK-NEXT: 8. 1 4.0 1.0 0.0 st1 { v1.8h, v2.8h, v3.8h }, [x27], x28 3954# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3955# CHECK-NEXT: 1 2.9 0.2 0.0 <total> 3956 3957# CHECK: [61] Code Region - G62 3958 3959# CHECK: Iterations: 100 3960# CHECK-NEXT: Instructions: 1000 3961# CHECK-NEXT: Total Cycles: 704 3962# CHECK-NEXT: Total uOps: 3600 3963 3964# CHECK: Dispatch Width: 15 3965# CHECK-NEXT: uOps Per Cycle: 5.11 3966# CHECK-NEXT: IPC: 1.42 3967# CHECK-NEXT: Block RThroughput: 6.5 3968 3969# CHECK: Timeline view: 3970# CHECK-NEXT: 0 3971# CHECK-NEXT: Index 0123456789 3972 3973# CHECK: [0,0] DeeER. . st1 { v1.16b, v2.16b, v3.16b }, [x27], x28 3974# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3975# CHECK-NEXT: [0,2] D=eeER . st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 3976# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 3977# CHECK-NEXT: [0,4] .D==eeER . st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 3978# CHECK-NEXT: [0,5] .D===eER . add x0, x27, #1 3979# CHECK-NEXT: [0,6] .D===eeER . st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 3980# CHECK-NEXT: [0,7] . D===eER . add x0, x27, #1 3981# CHECK-NEXT: [0,8] . D====eeER st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 3982# CHECK-NEXT: [0,9] . D=====eER add x0, x27, #1 3983 3984# CHECK: Average Wait times (based on the timeline view): 3985# CHECK-NEXT: [0]: Executions 3986# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3987# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3988# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3989 3990# CHECK: [0] [1] [2] [3] 3991# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.16b, v2.16b, v3.16b }, [x27], x28 3992# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3993# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 3994# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3995# CHECK-NEXT: 4. 1 3.0 1.0 0.0 st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 3996# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 3997# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 3998# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 3999# CHECK-NEXT: 8. 1 5.0 1.0 0.0 st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 4000# CHECK-NEXT: 9. 1 6.0 0.0 0.0 add x0, x27, #1 4001# CHECK-NEXT: 1 3.4 0.3 0.0 <total> 4002 4003# CHECK: [62] Code Region - G63 4004 4005# CHECK: Iterations: 100 4006# CHECK-NEXT: Instructions: 1000 4007# CHECK-NEXT: Total Cycles: 804 4008# CHECK-NEXT: Total uOps: 4200 4009 4010# CHECK: Dispatch Width: 15 4011# CHECK-NEXT: uOps Per Cycle: 5.22 4012# CHECK-NEXT: IPC: 1.24 4013# CHECK-NEXT: Block RThroughput: 8.0 4014 4015# CHECK: Timeline view: 4016# CHECK-NEXT: 01 4017# CHECK-NEXT: Index 0123456789 4018 4019# CHECK: [0,0] DeeER. .. st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 4020# CHECK-NEXT: [0,1] D=eER. .. add x0, x27, #1 4021# CHECK-NEXT: [0,2] D=eeER .. st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 4022# CHECK-NEXT: [0,3] .D=eER .. add x0, x27, #1 4023# CHECK-NEXT: [0,4] .D==eeER .. st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 4024# CHECK-NEXT: [0,5] .D===eER .. add x0, x27, #1 4025# CHECK-NEXT: [0,6] . D==eeER .. st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 4026# CHECK-NEXT: [0,7] . D===eER .. add x0, x27, #1 4027# CHECK-NEXT: [0,8] . D=====eeER st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 4028# CHECK-NEXT: [0,9] . D=====eER add x0, x27, #1 4029 4030# CHECK: Average Wait times (based on the timeline view): 4031# CHECK-NEXT: [0]: Executions 4032# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4033# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4034# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4035 4036# CHECK: [0] [1] [2] [3] 4037# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 4038# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 4039# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 4040# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 4041# CHECK-NEXT: 4. 1 3.0 1.0 0.0 st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 4042# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 4043# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 4044# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 4045# CHECK-NEXT: 8. 1 6.0 2.0 0.0 st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 4046# CHECK-NEXT: 9. 1 6.0 0.0 0.0 add x0, x27, #1 4047# CHECK-NEXT: 1 3.3 0.4 0.0 <total> 4048 4049# CHECK: [63] Code Region - G64 4050 4051# CHECK: Iterations: 100 4052# CHECK-NEXT: Instructions: 1000 4053# CHECK-NEXT: Total Cycles: 703 4054# CHECK-NEXT: Total uOps: 3800 4055 4056# CHECK: Dispatch Width: 15 4057# CHECK-NEXT: uOps Per Cycle: 5.41 4058# CHECK-NEXT: IPC: 1.42 4059# CHECK-NEXT: Block RThroughput: 7.0 4060 4061# CHECK: Timeline view: 4062# CHECK-NEXT: Index 0123456789 4063 4064# CHECK: [0,0] DeeER. . st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 4065# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 4066# CHECK-NEXT: [0,2] D=eeER . st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 4067# CHECK-NEXT: [0,3] .D=eER . add x0, x27, #1 4068# CHECK-NEXT: [0,4] .D==eeER . st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 4069# CHECK-NEXT: [0,5] .D===eER . add x0, x27, #1 4070# CHECK-NEXT: [0,6] . D==eeER. st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 4071# CHECK-NEXT: [0,7] . D===eER. add x0, x27, #1 4072# CHECK-NEXT: [0,8] . D===eeER st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 4073# CHECK-NEXT: [0,9] . D===eER add x0, x27, #1 4074 4075# CHECK: Average Wait times (based on the timeline view): 4076# CHECK-NEXT: [0]: Executions 4077# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4078# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4079# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4080 4081# CHECK: [0] [1] [2] [3] 4082# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 4083# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 4084# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 4085# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 4086# CHECK-NEXT: 4. 1 3.0 1.0 0.0 st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 4087# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 4088# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 4089# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 4090# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 4091# CHECK-NEXT: 9. 1 4.0 0.0 0.0 add x0, x27, #1 4092# CHECK-NEXT: 1 2.9 0.2 0.0 <total> 4093 4094# CHECK: [64] Code Region - G65 4095 4096# CHECK: Iterations: 100 4097# CHECK-NEXT: Instructions: 1000 4098# CHECK-NEXT: Total Cycles: 706 4099# CHECK-NEXT: Total uOps: 3200 4100 4101# CHECK: Dispatch Width: 15 4102# CHECK-NEXT: uOps Per Cycle: 4.53 4103# CHECK-NEXT: IPC: 1.42 4104# CHECK-NEXT: Block RThroughput: 5.5 4105 4106# CHECK: Timeline view: 4107# CHECK-NEXT: 012 4108# CHECK-NEXT: Index 0123456789 4109 4110# CHECK: [0,0] DeeER. . . st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 4111# CHECK-NEXT: [0,1] D=eER. . . add x0, x27, #1 4112# CHECK-NEXT: [0,2] .DeeER . . st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 4113# CHECK-NEXT: [0,3] .D=eER . . add x0, x27, #1 4114# CHECK-NEXT: [0,4] .D===eeeeER . st1 { v1.b }[0], [x27], #1 4115# CHECK-NEXT: [0,5] .D====eE--R . add x0, x27, #1 4116# CHECK-NEXT: [0,6] . D===eeeeER. st1 { v1.b }[8], [x27], #1 4117# CHECK-NEXT: [0,7] . D====eE--R. add x0, x27, #1 4118# CHECK-NEXT: [0,8] . D====eeeeER st1 { v1.b }[0], [x27], x28 4119# CHECK-NEXT: [0,9] . D=====eE--R add x0, x27, #1 4120 4121# CHECK: Average Wait times (based on the timeline view): 4122# CHECK-NEXT: [0]: Executions 4123# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4124# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4125# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4126 4127# CHECK: [0] [1] [2] [3] 4128# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 4129# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 4130# CHECK-NEXT: 2. 1 1.0 0.0 0.0 st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 4131# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 4132# CHECK-NEXT: 4. 1 4.0 2.0 0.0 st1 { v1.b }[0], [x27], #1 4133# CHECK-NEXT: 5. 1 5.0 0.0 2.0 add x0, x27, #1 4134# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st1 { v1.b }[8], [x27], #1 4135# CHECK-NEXT: 7. 1 5.0 0.0 2.0 add x0, x27, #1 4136# CHECK-NEXT: 8. 1 5.0 0.0 0.0 st1 { v1.b }[0], [x27], x28 4137# CHECK-NEXT: 9. 1 6.0 0.0 2.0 add x0, x27, #1 4138# CHECK-NEXT: 1 3.5 0.3 0.6 <total> 4139 4140# CHECK: [65] Code Region - G66 4141 4142# CHECK: Iterations: 100 4143# CHECK-NEXT: Instructions: 1000 4144# CHECK-NEXT: Total Cycles: 506 4145# CHECK-NEXT: Total uOps: 2000 4146 4147# CHECK: Dispatch Width: 15 4148# CHECK-NEXT: uOps Per Cycle: 3.95 4149# CHECK-NEXT: IPC: 1.98 4150# CHECK-NEXT: Block RThroughput: 2.5 4151 4152# CHECK: Timeline view: 4153# CHECK-NEXT: 0 4154# CHECK-NEXT: Index 0123456789 4155 4156# CHECK: [0,0] DeeeeER . st1 { v1.b }[8], [x27], x28 4157# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 4158# CHECK-NEXT: [0,2] D=eeeeER . st1 { v1.h }[0], [x27], #2 4159# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4160# CHECK-NEXT: [0,4] D==eeeeER . st1 { v1.h }[4], [x27], #2 4161# CHECK-NEXT: [0,5] D===eE--R . add x0, x27, #1 4162# CHECK-NEXT: [0,6] D===eeeeER. st1 { v1.h }[0], [x27], x28 4163# CHECK-NEXT: [0,7] .D===eE--R. add x0, x27, #1 4164# CHECK-NEXT: [0,8] .D===eeeeER st1 { v1.h }[4], [x27], x28 4165# CHECK-NEXT: [0,9] .D====eE--R add x0, x27, #1 4166 4167# CHECK: Average Wait times (based on the timeline view): 4168# CHECK-NEXT: [0]: Executions 4169# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4170# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4171# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4172 4173# CHECK: [0] [1] [2] [3] 4174# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.b }[8], [x27], x28 4175# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4176# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.h }[0], [x27], #2 4177# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4178# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st1 { v1.h }[4], [x27], #2 4179# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4180# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st1 { v1.h }[0], [x27], x28 4181# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4182# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st1 { v1.h }[4], [x27], x28 4183# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4184# CHECK-NEXT: 1 3.2 0.1 1.0 <total> 4185 4186# CHECK: [66] Code Region - G67 4187 4188# CHECK: Iterations: 100 4189# CHECK-NEXT: Instructions: 1000 4190# CHECK-NEXT: Total Cycles: 506 4191# CHECK-NEXT: Total uOps: 2200 4192 4193# CHECK: Dispatch Width: 15 4194# CHECK-NEXT: uOps Per Cycle: 4.35 4195# CHECK-NEXT: IPC: 1.98 4196# CHECK-NEXT: Block RThroughput: 3.0 4197 4198# CHECK: Timeline view: 4199# CHECK-NEXT: 0 4200# CHECK-NEXT: Index 0123456789 4201 4202# CHECK: [0,0] DeeeeER . st1 { v1.s }[0], [x27], #4 4203# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 4204# CHECK-NEXT: [0,2] D=eeeeER . st1 { v1.s }[0], [x27], x28 4205# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4206# CHECK-NEXT: [0,4] D==eeeeER . st1 { v1.d }[0], [x27], #8 4207# CHECK-NEXT: [0,5] D===eE--R . add x0, x27, #1 4208# CHECK-NEXT: [0,6] D===eeeeER. st1 { v1.d }[0], [x27], x28 4209# CHECK-NEXT: [0,7] .D===eE--R. add x0, x27, #1 4210# CHECK-NEXT: [0,8] .D===eeeeER st2 { v1.2d, v2.2d }, [x27], #32 4211# CHECK-NEXT: [0,9] .D====eE--R add x0, x27, #1 4212 4213# CHECK: Average Wait times (based on the timeline view): 4214# CHECK-NEXT: [0]: Executions 4215# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4216# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4217# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4218 4219# CHECK: [0] [1] [2] [3] 4220# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.s }[0], [x27], #4 4221# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4222# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st1 { v1.s }[0], [x27], x28 4223# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4224# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st1 { v1.d }[0], [x27], #8 4225# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4226# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st1 { v1.d }[0], [x27], x28 4227# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4228# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st2 { v1.2d, v2.2d }, [x27], #32 4229# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4230# CHECK-NEXT: 1 3.2 0.1 1.0 <total> 4231 4232# CHECK: [67] Code Region - G68 4233 4234# CHECK: Iterations: 100 4235# CHECK-NEXT: Instructions: 1000 4236# CHECK-NEXT: Total Cycles: 506 4237# CHECK-NEXT: Total uOps: 2400 4238 4239# CHECK: Dispatch Width: 15 4240# CHECK-NEXT: uOps Per Cycle: 4.74 4241# CHECK-NEXT: IPC: 1.98 4242# CHECK-NEXT: Block RThroughput: 3.5 4243 4244# CHECK: Timeline view: 4245# CHECK-NEXT: 0 4246# CHECK-NEXT: Index 0123456789 4247 4248# CHECK: [0,0] DeeeeER . st2 { v1.2s, v2.2s }, [x27], #16 4249# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 4250# CHECK-NEXT: [0,2] D=eeeeER . st2 { v1.4h, v2.4h }, [x27], #16 4251# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4252# CHECK-NEXT: [0,4] D==eeeeER . st2 { v1.4s, v2.4s }, [x27], #32 4253# CHECK-NEXT: [0,5] D===eE--R . add x0, x27, #1 4254# CHECK-NEXT: [0,6] .D==eeeeER. st2 { v1.8b, v2.8b }, [x27], #16 4255# CHECK-NEXT: [0,7] .D===eE--R. add x0, x27, #1 4256# CHECK-NEXT: [0,8] .D===eeeeER st2 { v1.8h, v2.8h }, [x27], #32 4257# CHECK-NEXT: [0,9] .D====eE--R add x0, x27, #1 4258 4259# CHECK: Average Wait times (based on the timeline view): 4260# CHECK-NEXT: [0]: Executions 4261# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4262# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4263# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4264 4265# CHECK: [0] [1] [2] [3] 4266# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.2s, v2.2s }, [x27], #16 4267# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4268# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st2 { v1.4h, v2.4h }, [x27], #16 4269# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4270# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st2 { v1.4s, v2.4s }, [x27], #32 4271# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4272# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st2 { v1.8b, v2.8b }, [x27], #16 4273# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4274# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st2 { v1.8h, v2.8h }, [x27], #32 4275# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4276# CHECK-NEXT: 1 3.1 0.1 1.0 <total> 4277 4278# CHECK: [68] Code Region - G69 4279 4280# CHECK: Iterations: 100 4281# CHECK-NEXT: Instructions: 1000 4282# CHECK-NEXT: Total Cycles: 506 4283# CHECK-NEXT: Total uOps: 2600 4284 4285# CHECK: Dispatch Width: 15 4286# CHECK-NEXT: uOps Per Cycle: 5.14 4287# CHECK-NEXT: IPC: 1.98 4288# CHECK-NEXT: Block RThroughput: 4.0 4289 4290# CHECK: Timeline view: 4291# CHECK-NEXT: 0 4292# CHECK-NEXT: Index 0123456789 4293 4294# CHECK: [0,0] DeeeeER . st2 { v1.16b, v2.16b }, [x27], #32 4295# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 4296# CHECK-NEXT: [0,2] D=eeeeER . st2 { v1.2d, v2.2d }, [x27], x28 4297# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4298# CHECK-NEXT: [0,4] D==eeeeER . st2 { v1.2s, v2.2s }, [x27], x28 4299# CHECK-NEXT: [0,5] .D==eE--R . add x0, x27, #1 4300# CHECK-NEXT: [0,6] .D==eeeeER. st2 { v1.4h, v2.4h }, [x27], x28 4301# CHECK-NEXT: [0,7] .D===eE--R. add x0, x27, #1 4302# CHECK-NEXT: [0,8] .D===eeeeER st2 { v1.4s, v2.4s }, [x27], x28 4303# CHECK-NEXT: [0,9] .D====eE--R add x0, x27, #1 4304 4305# CHECK: Average Wait times (based on the timeline view): 4306# CHECK-NEXT: [0]: Executions 4307# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4308# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4309# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4310 4311# CHECK: [0] [1] [2] [3] 4312# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.16b, v2.16b }, [x27], #32 4313# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4314# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st2 { v1.2d, v2.2d }, [x27], x28 4315# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4316# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st2 { v1.2s, v2.2s }, [x27], x28 4317# CHECK-NEXT: 5. 1 3.0 0.0 2.0 add x0, x27, #1 4318# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st2 { v1.4h, v2.4h }, [x27], x28 4319# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4320# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st2 { v1.4s, v2.4s }, [x27], x28 4321# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4322# CHECK-NEXT: 1 3.0 0.1 1.0 <total> 4323 4324# CHECK: [69] Code Region - G70 4325 4326# CHECK: Iterations: 100 4327# CHECK-NEXT: Instructions: 1000 4328# CHECK-NEXT: Total Cycles: 506 4329# CHECK-NEXT: Total uOps: 2400 4330 4331# CHECK: Dispatch Width: 15 4332# CHECK-NEXT: uOps Per Cycle: 4.74 4333# CHECK-NEXT: IPC: 1.98 4334# CHECK-NEXT: Block RThroughput: 3.5 4335 4336# CHECK: Timeline view: 4337# CHECK-NEXT: 0 4338# CHECK-NEXT: Index 0123456789 4339 4340# CHECK: [0,0] DeeeeER . st2 { v1.8b, v2.8b }, [x27], x28 4341# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 4342# CHECK-NEXT: [0,2] D=eeeeER . st2 { v1.8h, v2.8h }, [x27], x28 4343# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4344# CHECK-NEXT: [0,4] D==eeeeER . st2 { v1.16b, v2.16b }, [x27], x28 4345# CHECK-NEXT: [0,5] .D==eE--R . add x0, x27, #1 4346# CHECK-NEXT: [0,6] .D==eeeeER. st2 { v1.b, v2.b }[0], [x27], #2 4347# CHECK-NEXT: [0,7] .D===eE--R. add x0, x27, #1 4348# CHECK-NEXT: [0,8] .D===eeeeER st2 { v1.b, v2.b }[8], [x27], #2 4349# CHECK-NEXT: [0,9] .D====eE--R add x0, x27, #1 4350 4351# CHECK: Average Wait times (based on the timeline view): 4352# CHECK-NEXT: [0]: Executions 4353# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4354# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4355# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4356 4357# CHECK: [0] [1] [2] [3] 4358# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.8b, v2.8b }, [x27], x28 4359# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4360# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st2 { v1.8h, v2.8h }, [x27], x28 4361# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4362# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st2 { v1.16b, v2.16b }, [x27], x28 4363# CHECK-NEXT: 5. 1 3.0 0.0 2.0 add x0, x27, #1 4364# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st2 { v1.b, v2.b }[0], [x27], #2 4365# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4366# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st2 { v1.b, v2.b }[8], [x27], #2 4367# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4368# CHECK-NEXT: 1 3.0 0.1 1.0 <total> 4369 4370# CHECK: [70] Code Region - G71 4371 4372# CHECK: Iterations: 100 4373# CHECK-NEXT: Instructions: 1000 4374# CHECK-NEXT: Total Cycles: 506 4375# CHECK-NEXT: Total uOps: 2000 4376 4377# CHECK: Dispatch Width: 15 4378# CHECK-NEXT: uOps Per Cycle: 3.95 4379# CHECK-NEXT: IPC: 1.98 4380# CHECK-NEXT: Block RThroughput: 2.5 4381 4382# CHECK: Timeline view: 4383# CHECK-NEXT: 0 4384# CHECK-NEXT: Index 0123456789 4385 4386# CHECK: [0,0] DeeeeER . st2 { v1.b, v2.b }[0], [x27], x28 4387# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 4388# CHECK-NEXT: [0,2] D=eeeeER . st2 { v1.b, v2.b }[8], [x27], x28 4389# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4390# CHECK-NEXT: [0,4] D==eeeeER . st2 { v1.h, v2.h }[0], [x27], #4 4391# CHECK-NEXT: [0,5] D===eE--R . add x0, x27, #1 4392# CHECK-NEXT: [0,6] D===eeeeER. st2 { v1.h, v2.h }[4], [x27], #4 4393# CHECK-NEXT: [0,7] .D===eE--R. add x0, x27, #1 4394# CHECK-NEXT: [0,8] .D===eeeeER st2 { v1.h, v2.h }[0], [x27], x28 4395# CHECK-NEXT: [0,9] .D====eE--R add x0, x27, #1 4396 4397# CHECK: Average Wait times (based on the timeline view): 4398# CHECK-NEXT: [0]: Executions 4399# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4400# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4401# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4402 4403# CHECK: [0] [1] [2] [3] 4404# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.b, v2.b }[0], [x27], x28 4405# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4406# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st2 { v1.b, v2.b }[8], [x27], x28 4407# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4408# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st2 { v1.h, v2.h }[0], [x27], #4 4409# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4410# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st2 { v1.h, v2.h }[4], [x27], #4 4411# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4412# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st2 { v1.h, v2.h }[0], [x27], x28 4413# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4414# CHECK-NEXT: 1 3.2 0.1 1.0 <total> 4415 4416# CHECK: [71] Code Region - G72 4417 4418# CHECK: Iterations: 100 4419# CHECK-NEXT: Instructions: 1000 4420# CHECK-NEXT: Total Cycles: 506 4421# CHECK-NEXT: Total uOps: 2000 4422 4423# CHECK: Dispatch Width: 15 4424# CHECK-NEXT: uOps Per Cycle: 3.95 4425# CHECK-NEXT: IPC: 1.98 4426# CHECK-NEXT: Block RThroughput: 2.5 4427 4428# CHECK: Timeline view: 4429# CHECK-NEXT: 0 4430# CHECK-NEXT: Index 0123456789 4431 4432# CHECK: [0,0] DeeeeER . st2 { v1.h, v2.h }[4], [x27], x28 4433# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 4434# CHECK-NEXT: [0,2] D=eeeeER . st2 { v1.s, v2.s }[0], [x27], #8 4435# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4436# CHECK-NEXT: [0,4] D==eeeeER . st2 { v1.s, v2.s }[0], [x27], x28 4437# CHECK-NEXT: [0,5] D===eE--R . add x0, x27, #1 4438# CHECK-NEXT: [0,6] D===eeeeER. st2 { v1.d, v2.d }[0], [x27], #16 4439# CHECK-NEXT: [0,7] .D===eE--R. add x0, x27, #1 4440# CHECK-NEXT: [0,8] .D===eeeeER st2 { v1.d, v2.d }[0], [x27], x28 4441# CHECK-NEXT: [0,9] .D====eE--R add x0, x27, #1 4442 4443# CHECK: Average Wait times (based on the timeline view): 4444# CHECK-NEXT: [0]: Executions 4445# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4446# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4447# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4448 4449# CHECK: [0] [1] [2] [3] 4450# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[4], [x27], x28 4451# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4452# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st2 { v1.s, v2.s }[0], [x27], #8 4453# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4454# CHECK-NEXT: 4. 1 3.0 0.0 0.0 st2 { v1.s, v2.s }[0], [x27], x28 4455# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4456# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st2 { v1.d, v2.d }[0], [x27], #16 4457# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4458# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st2 { v1.d, v2.d }[0], [x27], x28 4459# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4460# CHECK-NEXT: 1 3.2 0.1 1.0 <total> 4461 4462# CHECK: [72] Code Region - G73 4463 4464# CHECK: Iterations: 100 4465# CHECK-NEXT: Instructions: 600 4466# CHECK-NEXT: Total Cycles: 406 4467# CHECK-NEXT: Total uOps: 2000 4468 4469# CHECK: Dispatch Width: 15 4470# CHECK-NEXT: uOps Per Cycle: 4.93 4471# CHECK-NEXT: IPC: 1.48 4472# CHECK-NEXT: Block RThroughput: 3.5 4473 4474# CHECK: Timeline view: 4475# CHECK-NEXT: Index 0123456789 4476 4477# CHECK: [0,0] DeeeeeER . st3 { v1.2d, v2.2d, v3.2d }, [x27], #48 4478# CHECK-NEXT: [0,1] D=eE---R . add x0, x27, #1 4479# CHECK-NEXT: [0,2] D=eeeeER . st3 { v1.2s, v2.2s, v3.2s }, [x27], #24 4480# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4481# CHECK-NEXT: [0,4] .D==eeeeER st3 { v1.4h, v2.4h, v3.4h }, [x27], #24 4482# CHECK-NEXT: [0,5] .D===eE--R add x0, x27, #1 4483 4484# CHECK: Average Wait times (based on the timeline view): 4485# CHECK-NEXT: [0]: Executions 4486# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4487# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4488# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4489 4490# CHECK: [0] [1] [2] [3] 4491# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.2d, v2.2d, v3.2d }, [x27], #48 4492# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 4493# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st3 { v1.2s, v2.2s, v3.2s }, [x27], #24 4494# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4495# CHECK-NEXT: 4. 1 3.0 1.0 0.0 st3 { v1.4h, v2.4h, v3.4h }, [x27], #24 4496# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4497# CHECK-NEXT: 1 2.5 0.3 1.2 <total> 4498 4499# CHECK: [73] Code Region - G74 4500 4501# CHECK: Iterations: 100 4502# CHECK-NEXT: Instructions: 1000 4503# CHECK-NEXT: Total Cycles: 707 4504# CHECK-NEXT: Total uOps: 3800 4505 4506# CHECK: Dispatch Width: 15 4507# CHECK-NEXT: uOps Per Cycle: 5.37 4508# CHECK-NEXT: IPC: 1.41 4509# CHECK-NEXT: Block RThroughput: 7.0 4510 4511# CHECK: Timeline view: 4512# CHECK-NEXT: 0123 4513# CHECK-NEXT: Index 0123456789 4514 4515# CHECK: [0,0] DeeeeeER . . st3 { v1.4s, v2.4s, v3.4s }, [x27], #48 4516# CHECK-NEXT: [0,1] D=eE---R . . add x0, x27, #1 4517# CHECK-NEXT: [0,2] D=eeeeER . . st3 { v1.8b, v2.8b, v3.8b }, [x27], #24 4518# CHECK-NEXT: [0,3] D==eE--R . . add x0, x27, #1 4519# CHECK-NEXT: [0,4] .D==eeeeeER . st3 { v1.8h, v2.8h, v3.8h }, [x27], #48 4520# CHECK-NEXT: [0,5] .D===eE---R . add x0, x27, #1 4521# CHECK-NEXT: [0,6] .D===eeeeeER . st3 { v1.16b, v2.16b, v3.16b }, [x27], #48 4522# CHECK-NEXT: [0,7] . D===eE---R . add x0, x27, #1 4523# CHECK-NEXT: [0,8] . D====eeeeeER st3 { v1.2d, v2.2d, v3.2d }, [x27], x28 4524# CHECK-NEXT: [0,9] . D=====eE---R add x0, x27, #1 4525 4526# CHECK: Average Wait times (based on the timeline view): 4527# CHECK-NEXT: [0]: Executions 4528# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4529# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4530# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4531 4532# CHECK: [0] [1] [2] [3] 4533# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.4s, v2.4s, v3.4s }, [x27], #48 4534# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 4535# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st3 { v1.8b, v2.8b, v3.8b }, [x27], #24 4536# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4537# CHECK-NEXT: 4. 1 3.0 1.0 0.0 st3 { v1.8h, v2.8h, v3.8h }, [x27], #48 4538# CHECK-NEXT: 5. 1 4.0 0.0 3.0 add x0, x27, #1 4539# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st3 { v1.16b, v2.16b, v3.16b }, [x27], #48 4540# CHECK-NEXT: 7. 1 4.0 0.0 3.0 add x0, x27, #1 4541# CHECK-NEXT: 8. 1 5.0 1.0 0.0 st3 { v1.2d, v2.2d, v3.2d }, [x27], x28 4542# CHECK-NEXT: 9. 1 6.0 0.0 3.0 add x0, x27, #1 4543# CHECK-NEXT: 1 3.4 0.3 1.4 <total> 4544 4545# CHECK: [74] Code Region - G75 4546 4547# CHECK: Iterations: 100 4548# CHECK-NEXT: Instructions: 1000 4549# CHECK-NEXT: Total Cycles: 706 4550# CHECK-NEXT: Total uOps: 3400 4551 4552# CHECK: Dispatch Width: 15 4553# CHECK-NEXT: uOps Per Cycle: 4.82 4554# CHECK-NEXT: IPC: 1.42 4555# CHECK-NEXT: Block RThroughput: 6.0 4556 4557# CHECK: Timeline view: 4558# CHECK-NEXT: 012 4559# CHECK-NEXT: Index 0123456789 4560 4561# CHECK: [0,0] DeeeeER . . st3 { v1.2s, v2.2s, v3.2s }, [x27], x28 4562# CHECK-NEXT: [0,1] D=eE--R . . add x0, x27, #1 4563# CHECK-NEXT: [0,2] D=eeeeER . . st3 { v1.4h, v2.4h, v3.4h }, [x27], x28 4564# CHECK-NEXT: [0,3] D==eE--R . . add x0, x27, #1 4565# CHECK-NEXT: [0,4] .D=eeeeeER. . st3 { v1.4s, v2.4s, v3.4s }, [x27], x28 4566# CHECK-NEXT: [0,5] .D==eE---R. . add x0, x27, #1 4567# CHECK-NEXT: [0,6] .D==eeeeER. . st3 { v1.8b, v2.8b, v3.8b }, [x27], x28 4568# CHECK-NEXT: [0,7] .D===eE--R. . add x0, x27, #1 4569# CHECK-NEXT: [0,8] . D===eeeeeER st3 { v1.8h, v2.8h, v3.8h }, [x27], x28 4570# CHECK-NEXT: [0,9] . D====eE---R add x0, x27, #1 4571 4572# CHECK: Average Wait times (based on the timeline view): 4573# CHECK-NEXT: [0]: Executions 4574# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4575# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4576# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4577 4578# CHECK: [0] [1] [2] [3] 4579# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.2s, v2.2s, v3.2s }, [x27], x28 4580# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4581# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st3 { v1.4h, v2.4h, v3.4h }, [x27], x28 4582# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4583# CHECK-NEXT: 4. 1 2.0 0.0 0.0 st3 { v1.4s, v2.4s, v3.4s }, [x27], x28 4584# CHECK-NEXT: 5. 1 3.0 0.0 3.0 add x0, x27, #1 4585# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st3 { v1.8b, v2.8b, v3.8b }, [x27], x28 4586# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4587# CHECK-NEXT: 8. 1 4.0 1.0 0.0 st3 { v1.8h, v2.8h, v3.8h }, [x27], x28 4588# CHECK-NEXT: 9. 1 5.0 0.0 3.0 add x0, x27, #1 4589# CHECK-NEXT: 1 2.9 0.2 1.2 <total> 4590 4591# CHECK: [75] Code Region - G76 4592 4593# CHECK: Iterations: 100 4594# CHECK-NEXT: Instructions: 1000 4595# CHECK-NEXT: Total Cycles: 606 4596# CHECK-NEXT: Total uOps: 3200 4597 4598# CHECK: Dispatch Width: 15 4599# CHECK-NEXT: uOps Per Cycle: 5.28 4600# CHECK-NEXT: IPC: 1.65 4601# CHECK-NEXT: Block RThroughput: 5.5 4602 4603# CHECK: Timeline view: 4604# CHECK-NEXT: 01 4605# CHECK-NEXT: Index 0123456789 4606 4607# CHECK: [0,0] DeeeeeER .. st3 { v1.16b, v2.16b, v3.16b }, [x27], x28 4608# CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1 4609# CHECK-NEXT: [0,2] D=eeeeER .. st3 { v1.b, v2.b, v3.b }[0], [x27], #3 4610# CHECK-NEXT: [0,3] D==eE--R .. add x0, x27, #1 4611# CHECK-NEXT: [0,4] .D==eeeeER.. st3 { v1.b, v2.b, v3.b }[8], [x27], #3 4612# CHECK-NEXT: [0,5] .D===eE--R.. add x0, x27, #1 4613# CHECK-NEXT: [0,6] .D===eeeeER. st3 { v1.b, v2.b, v3.b }[0], [x27], x28 4614# CHECK-NEXT: [0,7] .D====eE--R. add x0, x27, #1 4615# CHECK-NEXT: [0,8] . D===eeeeER st3 { v1.b, v2.b, v3.b }[8], [x27], x28 4616# CHECK-NEXT: [0,9] . D====eE--R add x0, x27, #1 4617 4618# CHECK: Average Wait times (based on the timeline view): 4619# CHECK-NEXT: [0]: Executions 4620# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4621# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4622# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4623 4624# CHECK: [0] [1] [2] [3] 4625# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.16b, v2.16b, v3.16b }, [x27], x28 4626# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 4627# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st3 { v1.b, v2.b, v3.b }[0], [x27], #3 4628# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4629# CHECK-NEXT: 4. 1 3.0 1.0 0.0 st3 { v1.b, v2.b, v3.b }[8], [x27], #3 4630# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4631# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st3 { v1.b, v2.b, v3.b }[0], [x27], x28 4632# CHECK-NEXT: 7. 1 5.0 0.0 2.0 add x0, x27, #1 4633# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st3 { v1.b, v2.b, v3.b }[8], [x27], x28 4634# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4635# CHECK-NEXT: 1 3.3 0.2 1.1 <total> 4636 4637# CHECK: [76] Code Region - G77 4638 4639# CHECK: Iterations: 100 4640# CHECK-NEXT: Instructions: 1000 4641# CHECK-NEXT: Total Cycles: 506 4642# CHECK-NEXT: Total uOps: 3000 4643 4644# CHECK: Dispatch Width: 15 4645# CHECK-NEXT: uOps Per Cycle: 5.93 4646# CHECK-NEXT: IPC: 1.98 4647# CHECK-NEXT: Block RThroughput: 5.0 4648 4649# CHECK: Timeline view: 4650# CHECK-NEXT: 0 4651# CHECK-NEXT: Index 0123456789 4652 4653# CHECK: [0,0] DeeeeER . st3 { v1.h, v2.h, v3.h }[0], [x27], #6 4654# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 4655# CHECK-NEXT: [0,2] D=eeeeER . st3 { v1.h, v2.h, v3.h }[4], [x27], #6 4656# CHECK-NEXT: [0,3] D==eE--R . add x0, x27, #1 4657# CHECK-NEXT: [0,4] .D=eeeeER . st3 { v1.h, v2.h, v3.h }[0], [x27], x28 4658# CHECK-NEXT: [0,5] .D==eE--R . add x0, x27, #1 4659# CHECK-NEXT: [0,6] .D==eeeeER. st3 { v1.h, v2.h, v3.h }[4], [x27], x28 4660# CHECK-NEXT: [0,7] .D===eE--R. add x0, x27, #1 4661# CHECK-NEXT: [0,8] . D==eeeeER st3 { v1.s, v2.s, v3.s }[0], [x27], #12 4662# CHECK-NEXT: [0,9] . D===eE--R add x0, x27, #1 4663 4664# CHECK: Average Wait times (based on the timeline view): 4665# CHECK-NEXT: [0]: Executions 4666# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4667# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4668# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4669 4670# CHECK: [0] [1] [2] [3] 4671# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[0], [x27], #6 4672# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4673# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st3 { v1.h, v2.h, v3.h }[4], [x27], #6 4674# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4675# CHECK-NEXT: 4. 1 2.0 0.0 0.0 st3 { v1.h, v2.h, v3.h }[0], [x27], x28 4676# CHECK-NEXT: 5. 1 3.0 0.0 2.0 add x0, x27, #1 4677# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st3 { v1.h, v2.h, v3.h }[4], [x27], x28 4678# CHECK-NEXT: 7. 1 4.0 0.0 2.0 add x0, x27, #1 4679# CHECK-NEXT: 8. 1 3.0 0.0 0.0 st3 { v1.s, v2.s, v3.s }[0], [x27], #12 4680# CHECK-NEXT: 9. 1 4.0 0.0 2.0 add x0, x27, #1 4681# CHECK-NEXT: 1 2.7 0.1 1.0 <total> 4682 4683# CHECK: [77] Code Region - G78 4684 4685# CHECK: Iterations: 100 4686# CHECK-NEXT: Instructions: 1000 4687# CHECK-NEXT: Total Cycles: 706 4688# CHECK-NEXT: Total uOps: 3600 4689 4690# CHECK: Dispatch Width: 15 4691# CHECK-NEXT: uOps Per Cycle: 5.10 4692# CHECK-NEXT: IPC: 1.42 4693# CHECK-NEXT: Block RThroughput: 6.5 4694 4695# CHECK: Timeline view: 4696# CHECK-NEXT: 012 4697# CHECK-NEXT: Index 0123456789 4698 4699# CHECK: [0,0] DeeeeER . . st3 { v1.s, v2.s, v3.s }[0], [x27], x28 4700# CHECK-NEXT: [0,1] D=eE--R . . add x0, x27, #1 4701# CHECK-NEXT: [0,2] D=eeeeER . . st3 { v1.d, v2.d, v3.d }[0], [x27], #24 4702# CHECK-NEXT: [0,3] D==eE--R . . add x0, x27, #1 4703# CHECK-NEXT: [0,4] .D=eeeeER . . st3 { v1.d, v2.d, v3.d }[0], [x27], x28 4704# CHECK-NEXT: [0,5] .D==eE--R . . add x0, x27, #1 4705# CHECK-NEXT: [0,6] .D==eeeeER. . st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 4706# CHECK-NEXT: [0,7] . D==eE--R. . add x0, x27, #1 4707# CHECK-NEXT: [0,8] . D==eeeeeeER st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 4708# CHECK-NEXT: [0,9] . D===eE----R add x0, x27, #1 4709 4710# CHECK: Average Wait times (based on the timeline view): 4711# CHECK-NEXT: [0]: Executions 4712# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4713# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4714# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4715 4716# CHECK: [0] [1] [2] [3] 4717# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.s, v2.s, v3.s }[0], [x27], x28 4718# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4719# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st3 { v1.d, v2.d, v3.d }[0], [x27], #24 4720# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4721# CHECK-NEXT: 4. 1 2.0 0.0 0.0 st3 { v1.d, v2.d, v3.d }[0], [x27], x28 4722# CHECK-NEXT: 5. 1 3.0 0.0 2.0 add x0, x27, #1 4723# CHECK-NEXT: 6. 1 3.0 0.0 0.0 st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 4724# CHECK-NEXT: 7. 1 3.0 0.0 2.0 add x0, x27, #1 4725# CHECK-NEXT: 8. 1 3.0 0.0 0.0 st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 4726# CHECK-NEXT: 9. 1 4.0 0.0 4.0 add x0, x27, #1 4727# CHECK-NEXT: 1 2.6 0.1 1.2 <total> 4728 4729# CHECK: [78] Code Region - G79 4730 4731# CHECK: Iterations: 100 4732# CHECK-NEXT: Instructions: 1000 4733# CHECK-NEXT: Total Cycles: 1205 4734# CHECK-NEXT: Total uOps: 5800 4735 4736# CHECK: Dispatch Width: 15 4737# CHECK-NEXT: uOps Per Cycle: 4.81 4738# CHECK-NEXT: IPC: 0.83 4739# CHECK-NEXT: Block RThroughput: 12.0 4740 4741# CHECK: Timeline view: 4742# CHECK-NEXT: 0123456 4743# CHECK-NEXT: Index 0123456789 4744 4745# CHECK: [0,0] DeeeeeeER . .. st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 4746# CHECK-NEXT: [0,1] D=eE----R . .. add x0, x27, #1 4747# CHECK-NEXT: [0,2] .DeeeeeeeER .. st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 4748# CHECK-NEXT: [0,3] .D=eE-----R .. add x0, x27, #1 4749# CHECK-NEXT: [0,4] . D=eeeeeeER .. st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 4750# CHECK-NEXT: [0,5] . D==eE----R .. add x0, x27, #1 4751# CHECK-NEXT: [0,6] . D===eeeeeeeER. st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 4752# CHECK-NEXT: [0,7] . D====eE-----R. add x0, x27, #1 4753# CHECK-NEXT: [0,8] . D===eeeeeeeER st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 4754# CHECK-NEXT: [0,9] . D====eE-----R add x0, x27, #1 4755 4756# CHECK: Average Wait times (based on the timeline view): 4757# CHECK-NEXT: [0]: Executions 4758# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4759# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4760# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4761 4762# CHECK: [0] [1] [2] [3] 4763# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 4764# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 4765# CHECK-NEXT: 2. 1 1.0 0.0 0.0 st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 4766# CHECK-NEXT: 3. 1 2.0 0.0 5.0 add x0, x27, #1 4767# CHECK-NEXT: 4. 1 2.0 1.0 0.0 st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 4768# CHECK-NEXT: 5. 1 3.0 0.0 4.0 add x0, x27, #1 4769# CHECK-NEXT: 6. 1 4.0 2.0 0.0 st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 4770# CHECK-NEXT: 7. 1 5.0 0.0 5.0 add x0, x27, #1 4771# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 4772# CHECK-NEXT: 9. 1 5.0 0.0 5.0 add x0, x27, #1 4773# CHECK-NEXT: 1 2.9 0.4 2.3 <total> 4774 4775# CHECK: [79] Code Region - G80 4776 4777# CHECK: Iterations: 100 4778# CHECK-NEXT: Instructions: 1000 4779# CHECK-NEXT: Total Cycles: 1006 4780# CHECK-NEXT: Total uOps: 4800 4781 4782# CHECK: Dispatch Width: 15 4783# CHECK-NEXT: uOps Per Cycle: 4.77 4784# CHECK-NEXT: IPC: 0.99 4785# CHECK-NEXT: Block RThroughput: 9.5 4786 4787# CHECK: Timeline view: 4788# CHECK-NEXT: 012345 4789# CHECK-NEXT: Index 0123456789 4790 4791# CHECK: [0,0] DeeeeER . . st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 4792# CHECK-NEXT: [0,1] D=eE--R . . add x0, x27, #1 4793# CHECK-NEXT: [0,2] .DeeeeeeER. . st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 4794# CHECK-NEXT: [0,3] .D=eE----R. . add x0, x27, #1 4795# CHECK-NEXT: [0,4] .D===eeeeeeER . st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 4796# CHECK-NEXT: [0,5] . D===eE----R . add x0, x27, #1 4797# CHECK-NEXT: [0,6] . D===eeeeeeeER. st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 4798# CHECK-NEXT: [0,7] . D====eE-----R. add x0, x27, #1 4799# CHECK-NEXT: [0,8] . D====eeeeeeER st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 4800# CHECK-NEXT: [0,9] . D=====eE----R add x0, x27, #1 4801 4802# CHECK: Average Wait times (based on the timeline view): 4803# CHECK-NEXT: [0]: Executions 4804# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4805# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4806# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4807 4808# CHECK: [0] [1] [2] [3] 4809# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 4810# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 4811# CHECK-NEXT: 2. 1 1.0 0.0 0.0 st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 4812# CHECK-NEXT: 3. 1 2.0 0.0 4.0 add x0, x27, #1 4813# CHECK-NEXT: 4. 1 4.0 2.0 0.0 st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 4814# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 4815# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 4816# CHECK-NEXT: 7. 1 5.0 0.0 5.0 add x0, x27, #1 4817# CHECK-NEXT: 8. 1 5.0 1.0 0.0 st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 4818# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 4819# CHECK-NEXT: 1 3.4 0.4 1.9 <total> 4820 4821# CHECK: [80] Code Region - G81 4822 4823# CHECK: Iterations: 100 4824# CHECK-NEXT: Instructions: 1000 4825# CHECK-NEXT: Total Cycles: 807 4826# CHECK-NEXT: Total uOps: 5200 4827 4828# CHECK: Dispatch Width: 15 4829# CHECK-NEXT: uOps Per Cycle: 6.44 4830# CHECK-NEXT: IPC: 1.24 4831# CHECK-NEXT: Block RThroughput: 6.0 4832 4833# CHECK: Timeline view: 4834# CHECK-NEXT: 01234 4835# CHECK-NEXT: Index 0123456789 4836 4837# CHECK: [0,0] DeeeeeeeER. . st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 4838# CHECK-NEXT: [0,1] D=eE-----R. . add x0, x27, #1 4839# CHECK-NEXT: [0,2] .DeeeeeeeER . st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 4840# CHECK-NEXT: [0,3] .D=eE-----R . add x0, x27, #1 4841# CHECK-NEXT: [0,4] . DeeeeeeER . st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 4842# CHECK-NEXT: [0,5] . D=eE----R . add x0, x27, #1 4843# CHECK-NEXT: [0,6] . D===eeeeeeER. st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 4844# CHECK-NEXT: [0,7] . D===eE----R. add x0, x27, #1 4845# CHECK-NEXT: [0,8] . D===eeeeeeER st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 4846# CHECK-NEXT: [0,9] . D====eE----R add x0, x27, #1 4847 4848# CHECK: Average Wait times (based on the timeline view): 4849# CHECK-NEXT: [0]: Executions 4850# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4851# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4852# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4853 4854# CHECK: [0] [1] [2] [3] 4855# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 4856# CHECK-NEXT: 1. 1 2.0 0.0 5.0 add x0, x27, #1 4857# CHECK-NEXT: 2. 1 1.0 0.0 0.0 st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 4858# CHECK-NEXT: 3. 1 2.0 0.0 5.0 add x0, x27, #1 4859# CHECK-NEXT: 4. 1 1.0 0.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 4860# CHECK-NEXT: 5. 1 2.0 0.0 4.0 add x0, x27, #1 4861# CHECK-NEXT: 6. 1 4.0 2.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 4862# CHECK-NEXT: 7. 1 4.0 0.0 4.0 add x0, x27, #1 4863# CHECK-NEXT: 8. 1 4.0 0.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 4864# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 4865# CHECK-NEXT: 1 2.6 0.3 2.2 <total> 4866 4867# CHECK: [81] Code Region - G82 4868 4869# CHECK: Iterations: 100 4870# CHECK-NEXT: Instructions: 1000 4871# CHECK-NEXT: Total Cycles: 508 4872# CHECK-NEXT: Total uOps: 4000 4873 4874# CHECK: Dispatch Width: 15 4875# CHECK-NEXT: uOps Per Cycle: 7.87 4876# CHECK-NEXT: IPC: 1.97 4877# CHECK-NEXT: Block RThroughput: 5.0 4878 4879# CHECK: Timeline view: 4880# CHECK-NEXT: 012 4881# CHECK-NEXT: Index 0123456789 4882 4883# CHECK: [0,0] DeeeeeeER . . st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 4884# CHECK-NEXT: [0,1] D=eE----R . . add x0, x27, #1 4885# CHECK-NEXT: [0,2] D=eeeeeeER. . st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 4886# CHECK-NEXT: [0,3] .D=eE----R. . add x0, x27, #1 4887# CHECK-NEXT: [0,4] .D=eeeeeeER . st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 4888# CHECK-NEXT: [0,5] .D==eE----R . add x0, x27, #1 4889# CHECK-NEXT: [0,6] . D=eeeeeeER. st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 4890# CHECK-NEXT: [0,7] . D==eE----R. add x0, x27, #1 4891# CHECK-NEXT: [0,8] . D==eeeeeeER st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 4892# CHECK-NEXT: [0,9] . D==eE----R add x0, x27, #1 4893 4894# CHECK: Average Wait times (based on the timeline view): 4895# CHECK-NEXT: [0]: Executions 4896# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4897# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4898# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4899 4900# CHECK: [0] [1] [2] [3] 4901# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 4902# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 4903# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 4904# CHECK-NEXT: 3. 1 2.0 0.0 4.0 add x0, x27, #1 4905# CHECK-NEXT: 4. 1 2.0 0.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 4906# CHECK-NEXT: 5. 1 3.0 0.0 4.0 add x0, x27, #1 4907# CHECK-NEXT: 6. 1 2.0 0.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 4908# CHECK-NEXT: 7. 1 3.0 0.0 4.0 add x0, x27, #1 4909# CHECK-NEXT: 8. 1 3.0 0.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 4910# CHECK-NEXT: 9. 1 3.0 0.0 4.0 add x0, x27, #1 4911# CHECK-NEXT: 1 2.3 0.1 2.0 <total> 4912 4913# CHECK: [82] Code Region - G83 4914 4915# CHECK: Iterations: 100 4916# CHECK-NEXT: Instructions: 800 4917# CHECK-NEXT: Total Cycles: 506 4918# CHECK-NEXT: Total uOps: 2800 4919 4920# CHECK: Dispatch Width: 15 4921# CHECK-NEXT: uOps Per Cycle: 5.53 4922# CHECK-NEXT: IPC: 1.58 4923# CHECK-NEXT: Block RThroughput: 2.0 4924 4925# CHECK: Timeline view: 4926# CHECK-NEXT: 0 4927# CHECK-NEXT: Index 0123456789 4928 4929# CHECK: [0,0] DeeeeeeER . st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 4930# CHECK-NEXT: [0,1] D=eE----R . add x0, x27, #1 4931# CHECK-NEXT: [0,2] D=eeeeeeER. st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 4932# CHECK-NEXT: [0,3] .D=eE----R. add x0, x27, #1 4933# CHECK-NEXT: [0,4] .D==eeeeER. st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 4934# CHECK-NEXT: [0,5] .D===eE--R. add x0, x27, #1 4935# CHECK-NEXT: [0,6] .D===eeeeER st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 4936# CHECK-NEXT: [0,7] .D====eE--R add x0, x27, #1 4937 4938# CHECK: Average Wait times (based on the timeline view): 4939# CHECK-NEXT: [0]: Executions 4940# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4941# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4942# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4943 4944# CHECK: [0] [1] [2] [3] 4945# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 4946# CHECK-NEXT: 1. 1 2.0 0.0 4.0 add x0, x27, #1 4947# CHECK-NEXT: 2. 1 2.0 0.0 0.0 st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 4948# CHECK-NEXT: 3. 1 2.0 0.0 4.0 add x0, x27, #1 4949# CHECK-NEXT: 4. 1 3.0 1.0 0.0 st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 4950# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4951# CHECK-NEXT: 6. 1 4.0 0.0 0.0 st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 4952# CHECK-NEXT: 7. 1 5.0 0.0 2.0 add x0, x27, #1 4953# CHECK-NEXT: 1 2.9 0.3 1.5 <total> 4954 4955# CHECK: [83] Code Region - G84 4956 4957# CHECK: Iterations: 100 4958# CHECK-NEXT: Instructions: 400 4959# CHECK-NEXT: Total Cycles: 204 4960# CHECK-NEXT: Total uOps: 800 4961 4962# CHECK: Dispatch Width: 15 4963# CHECK-NEXT: uOps Per Cycle: 3.92 4964# CHECK-NEXT: IPC: 1.96 4965# CHECK-NEXT: Block RThroughput: 1.0 4966 4967# CHECK: Timeline view: 4968# CHECK-NEXT: Index 012345 4969 4970# CHECK: [0,0] DeeER. stp s1, s2, [x27], #248 4971# CHECK-NEXT: [0,1] D=eER. add x0, x27, #1 4972# CHECK-NEXT: [0,2] D=eeER stp d1, d2, [x27], #496 4973# CHECK-NEXT: [0,3] D==eER add x0, x27, #1 4974 4975# CHECK: Average Wait times (based on the timeline view): 4976# CHECK-NEXT: [0]: Executions 4977# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4978# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4979# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4980 4981# CHECK: [0] [1] [2] [3] 4982# CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp s1, s2, [x27], #248 4983# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 4984# CHECK-NEXT: 2. 1 2.0 0.0 0.0 stp d1, d2, [x27], #496 4985# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 4986# CHECK-NEXT: 1 2.0 0.3 0.0 <total> 4987 4988# CHECK: [84] Code Region - G85 4989 4990# CHECK: Iterations: 100 4991# CHECK-NEXT: Instructions: 1000 4992# CHECK-NEXT: Total Cycles: 504 4993# CHECK-NEXT: Total uOps: 2200 4994 4995# CHECK: Dispatch Width: 15 4996# CHECK-NEXT: uOps Per Cycle: 4.37 4997# CHECK-NEXT: IPC: 1.98 4998# CHECK-NEXT: Block RThroughput: 3.5 4999 5000# CHECK: Timeline view: 5001# CHECK-NEXT: Index 012345678 5002 5003# CHECK: [0,0] DeeER. . stp q1, q2, [x27], #992 5004# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 5005# CHECK-NEXT: [0,2] D=eeER . stp s1, s2, [x27, #248]! 5006# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 5007# CHECK-NEXT: [0,4] D==eeER . stp d1, d2, [x27, #496]! 5008# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 5009# CHECK-NEXT: [0,6] .D==eeER. stp q1, q2, [x27, #992]! 5010# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 5011# CHECK-NEXT: [0,8] .D===eER. stp w1, w2, [x27], #248 5012# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 5013 5014# CHECK: Average Wait times (based on the timeline view): 5015# CHECK-NEXT: [0]: Executions 5016# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5017# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5018# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5019 5020# CHECK: [0] [1] [2] [3] 5021# CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp q1, q2, [x27], #992 5022# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 5023# CHECK-NEXT: 2. 1 2.0 0.0 0.0 stp s1, s2, [x27, #248]! 5024# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 5025# CHECK-NEXT: 4. 1 3.0 0.0 0.0 stp d1, d2, [x27, #496]! 5026# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 5027# CHECK-NEXT: 6. 1 3.0 0.0 0.0 stp q1, q2, [x27, #992]! 5028# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 5029# CHECK-NEXT: 8. 1 4.0 0.0 0.0 stp w1, w2, [x27], #248 5030# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 5031# CHECK-NEXT: 1 3.1 0.1 0.0 <total> 5032 5033# CHECK: [85] Code Region - G86 5034 5035# CHECK: Iterations: 100 5036# CHECK-NEXT: Instructions: 1000 5037# CHECK-NEXT: Total Cycles: 504 5038# CHECK-NEXT: Total uOps: 2000 5039 5040# CHECK: Dispatch Width: 15 5041# CHECK-NEXT: uOps Per Cycle: 3.97 5042# CHECK-NEXT: IPC: 1.98 5043# CHECK-NEXT: Block RThroughput: 2.5 5044 5045# CHECK: Timeline view: 5046# CHECK-NEXT: Index 012345678 5047 5048# CHECK: [0,0] DeER . . stp x1, x2, [x27], #496 5049# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 5050# CHECK-NEXT: [0,2] D=eER. . stp w1, w2, [x27, #248]! 5051# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 5052# CHECK-NEXT: [0,4] D==eER . stp x1, x2, [x27, #496]! 5053# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 5054# CHECK-NEXT: [0,6] D===eeER. str b1, [x27], #254 5055# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 5056# CHECK-NEXT: [0,8] .D===eeER str h1, [x27], #254 5057# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 5058 5059# CHECK: Average Wait times (based on the timeline view): 5060# CHECK-NEXT: [0]: Executions 5061# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5062# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5063# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5064 5065# CHECK: [0] [1] [2] [3] 5066# CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp x1, x2, [x27], #496 5067# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 5068# CHECK-NEXT: 2. 1 2.0 0.0 0.0 stp w1, w2, [x27, #248]! 5069# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 5070# CHECK-NEXT: 4. 1 3.0 0.0 0.0 stp x1, x2, [x27, #496]! 5071# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 5072# CHECK-NEXT: 6. 1 4.0 0.0 0.0 str b1, [x27], #254 5073# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 5074# CHECK-NEXT: 8. 1 4.0 0.0 0.0 str h1, [x27], #254 5075# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 5076# CHECK-NEXT: 1 3.2 0.1 0.0 <total> 5077 5078# CHECK: [86] Code Region - G87 5079 5080# CHECK: Iterations: 100 5081# CHECK-NEXT: Instructions: 1000 5082# CHECK-NEXT: Total Cycles: 504 5083# CHECK-NEXT: Total uOps: 2000 5084 5085# CHECK: Dispatch Width: 15 5086# CHECK-NEXT: uOps Per Cycle: 3.97 5087# CHECK-NEXT: IPC: 1.98 5088# CHECK-NEXT: Block RThroughput: 2.5 5089 5090# CHECK: Timeline view: 5091# CHECK-NEXT: Index 012345678 5092 5093# CHECK: [0,0] DeeER. . str s1, [x27], #254 5094# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 5095# CHECK-NEXT: [0,2] D=eeER . str d1, [x27], #254 5096# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 5097# CHECK-NEXT: [0,4] D==eeER . str q1, [x27], #254 5098# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 5099# CHECK-NEXT: [0,6] D===eeER. str b1, [x27, #254]! 5100# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 5101# CHECK-NEXT: [0,8] .D===eeER str h1, [x27, #254]! 5102# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 5103 5104# CHECK: Average Wait times (based on the timeline view): 5105# CHECK-NEXT: [0]: Executions 5106# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5107# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5108# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5109 5110# CHECK: [0] [1] [2] [3] 5111# CHECK-NEXT: 0. 1 1.0 1.0 0.0 str s1, [x27], #254 5112# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 5113# CHECK-NEXT: 2. 1 2.0 0.0 0.0 str d1, [x27], #254 5114# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 5115# CHECK-NEXT: 4. 1 3.0 0.0 0.0 str q1, [x27], #254 5116# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 5117# CHECK-NEXT: 6. 1 4.0 0.0 0.0 str b1, [x27, #254]! 5118# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 5119# CHECK-NEXT: 8. 1 4.0 0.0 0.0 str h1, [x27, #254]! 5120# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 5121# CHECK-NEXT: 1 3.2 0.1 0.0 <total> 5122 5123# CHECK: [87] Code Region - G88 5124 5125# CHECK: Iterations: 100 5126# CHECK-NEXT: Instructions: 1000 5127# CHECK-NEXT: Total Cycles: 504 5128# CHECK-NEXT: Total uOps: 2000 5129 5130# CHECK: Dispatch Width: 15 5131# CHECK-NEXT: uOps Per Cycle: 3.97 5132# CHECK-NEXT: IPC: 1.98 5133# CHECK-NEXT: Block RThroughput: 2.5 5134 5135# CHECK: Timeline view: 5136# CHECK-NEXT: Index 012345678 5137 5138# CHECK: [0,0] DeeER. . str s1, [x27, #254]! 5139# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 5140# CHECK-NEXT: [0,2] D=eeER . str d1, [x27, #254]! 5141# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 5142# CHECK-NEXT: [0,4] D==eeER . str q1, [x27, #254]! 5143# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 5144# CHECK-NEXT: [0,6] D===eER . str w1, [x27], #254 5145# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 5146# CHECK-NEXT: [0,8] .D===eER. str x1, [x27], #254 5147# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 5148 5149# CHECK: Average Wait times (based on the timeline view): 5150# CHECK-NEXT: [0]: Executions 5151# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5152# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5153# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5154 5155# CHECK: [0] [1] [2] [3] 5156# CHECK-NEXT: 0. 1 1.0 1.0 0.0 str s1, [x27, #254]! 5157# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 5158# CHECK-NEXT: 2. 1 2.0 0.0 0.0 str d1, [x27, #254]! 5159# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 5160# CHECK-NEXT: 4. 1 3.0 0.0 0.0 str q1, [x27, #254]! 5161# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 5162# CHECK-NEXT: 6. 1 4.0 0.0 0.0 str w1, [x27], #254 5163# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 5164# CHECK-NEXT: 8. 1 4.0 0.0 0.0 str x1, [x27], #254 5165# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 5166# CHECK-NEXT: 1 3.2 0.1 0.0 <total> 5167 5168# CHECK: [88] Code Region - G89 5169 5170# CHECK: Iterations: 100 5171# CHECK-NEXT: Instructions: 1000 5172# CHECK-NEXT: Total Cycles: 504 5173# CHECK-NEXT: Total uOps: 2000 5174 5175# CHECK: Dispatch Width: 15 5176# CHECK-NEXT: uOps Per Cycle: 3.97 5177# CHECK-NEXT: IPC: 1.98 5178# CHECK-NEXT: Block RThroughput: 2.5 5179 5180# CHECK: Timeline view: 5181# CHECK-NEXT: Index 012345678 5182 5183# CHECK: [0,0] DeER . . str w1, [x27, #254]! 5184# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 5185# CHECK-NEXT: [0,2] D=eER. . str x1, [x27, #254]! 5186# CHECK-NEXT: [0,3] D==eER . add x0, x27, #1 5187# CHECK-NEXT: [0,4] D==eER . strb w1, [x27], #254 5188# CHECK-NEXT: [0,5] D===eER . add x0, x27, #1 5189# CHECK-NEXT: [0,6] D===eER . strb w1, [x27, #254]! 5190# CHECK-NEXT: [0,7] .D===eER. add x0, x27, #1 5191# CHECK-NEXT: [0,8] .D===eER. strh w1, [x27], #254 5192# CHECK-NEXT: [0,9] .D====eER add x0, x27, #1 5193 5194# CHECK: Average Wait times (based on the timeline view): 5195# CHECK-NEXT: [0]: Executions 5196# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5197# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5198# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5199 5200# CHECK: [0] [1] [2] [3] 5201# CHECK-NEXT: 0. 1 1.0 1.0 0.0 str w1, [x27, #254]! 5202# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 5203# CHECK-NEXT: 2. 1 2.0 0.0 0.0 str x1, [x27, #254]! 5204# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 5205# CHECK-NEXT: 4. 1 3.0 0.0 0.0 strb w1, [x27], #254 5206# CHECK-NEXT: 5. 1 4.0 0.0 0.0 add x0, x27, #1 5207# CHECK-NEXT: 6. 1 4.0 0.0 0.0 strb w1, [x27, #254]! 5208# CHECK-NEXT: 7. 1 4.0 0.0 0.0 add x0, x27, #1 5209# CHECK-NEXT: 8. 1 4.0 0.0 0.0 strh w1, [x27], #254 5210# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 5211# CHECK-NEXT: 1 3.2 0.1 0.0 <total> 5212 5213# CHECK: [89] Code Region - G90 5214 5215# CHECK: Iterations: 100 5216# CHECK-NEXT: Instructions: 200 5217# CHECK-NEXT: Total Cycles: 104 5218# CHECK-NEXT: Total uOps: 400 5219 5220# CHECK: Dispatch Width: 15 5221# CHECK-NEXT: uOps Per Cycle: 3.85 5222# CHECK-NEXT: IPC: 1.92 5223# CHECK-NEXT: Block RThroughput: 0.5 5224 5225# CHECK: Timeline view: 5226# CHECK-NEXT: Index 01234 5227 5228# CHECK: [0,0] DeER. strh w1, [x27, #254]! 5229# CHECK-NEXT: [0,1] D=eER add x0, x27, #1 5230 5231# CHECK: Average Wait times (based on the timeline view): 5232# CHECK-NEXT: [0]: Executions 5233# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5234# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5235# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5236 5237# CHECK: [0] [1] [2] [3] 5238# CHECK-NEXT: 0. 1 1.0 1.0 0.0 strh w1, [x27, #254]! 5239# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 5240# CHECK-NEXT: 1 1.5 0.5 0.0 <total> 5241 5242# CHECK: [90] Code Region - G91 5243 5244# CHECK: Iterations: 100 5245# CHECK-NEXT: Instructions: 400 5246# CHECK-NEXT: Total Cycles: 110 5247# CHECK-NEXT: Total uOps: 600 5248 5249# CHECK: Dispatch Width: 15 5250# CHECK-NEXT: uOps Per Cycle: 5.45 5251# CHECK-NEXT: IPC: 3.64 5252# CHECK-NEXT: Block RThroughput: 1.0 5253 5254# CHECK: Timeline view: 5255# CHECK-NEXT: 0 5256# CHECK-NEXT: Index 0123456789 5257 5258# CHECK: [0,0] DeeeeER . ldr x1, [x27], #254 5259# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 5260# CHECK-NEXT: [0,2] D====eeeeER ldr x2, [x1], #254 5261# CHECK-NEXT: [0,3] D=eE------R add x0, x27, #1 5262 5263# CHECK: Average Wait times (based on the timeline view): 5264# CHECK-NEXT: [0]: Executions 5265# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5266# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5267# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5268 5269# CHECK: [0] [1] [2] [3] 5270# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr x1, [x27], #254 5271# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 5272# CHECK-NEXT: 2. 1 5.0 0.0 0.0 ldr x2, [x1], #254 5273# CHECK-NEXT: 3. 1 2.0 0.0 6.0 add x0, x27, #1 5274# CHECK-NEXT: 1 2.5 0.3 2.0 <total> 5275