1# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py 2# RUN: llvm-mca -mtriple=aarch64 -mcpu=cortex-a57 --instruction-info=0 --resource-pressure=0 --timeline --timeline-max-iterations=1 < %s | FileCheck %s 3 4# LLVM-MCA-BEGIN G01 5ld1 { v1.1d }, [x27], #8 6add x0, x27, 1 7ld1 { v1.2d }, [x27], #16 8add x0, x27, 1 9ld1 { v1.2s }, [x27], #8 10add x0, x27, 1 11ld1 { v1.4h }, [x27], #8 12add x0, x27, 1 13ld1 { v1.4s }, [x27], #16 14add x0, x27, 1 15# LLVM-MCA-END 16 17# LLVM-MCA-BEGIN G02 18ld1 { v1.8b }, [x27], #8 19add x0, x27, 1 20ld1 { v1.8h }, [x27], #16 21add x0, x27, 1 22ld1 { v1.16b }, [x27], #16 23add x0, x27, 1 24ld1 { v1.1d }, [x27], x28 25add x0, x27, 1 26ld1 { v1.2d }, [x27], x28 27add x0, x27, 1 28# LLVM-MCA-END 29 30# LLVM-MCA-BEGIN G03 31ld1 { v1.2s }, [x27], x28 32add x0, x27, 1 33ld1 { v1.4h }, [x27], x28 34add x0, x27, 1 35ld1 { v1.4s }, [x27], x28 36add x0, x27, 1 37ld1 { v1.8b }, [x27], x28 38add x0, x27, 1 39ld1 { v1.8h }, [x27], x28 40add x0, x27, 1 41# LLVM-MCA-END 42 43# LLVM-MCA-BEGIN G04 44ld1 { v1.16b }, [x27], x28 45add x0, x27, 1 46ld1 { v1.1d, v2.1d }, [x27], #16 47add x0, x27, 1 48ld1 { v1.2d, v2.2d }, [x27], #32 49add x0, x27, 1 50ld1 { v1.2s, v2.2s }, [x27], #16 51add x0, x27, 1 52ld1 { v1.4h, v2.4h }, [x27], #16 53add x0, x27, 1 54# LLVM-MCA-END 55 56# LLVM-MCA-BEGIN G05 57ld1 { v1.4s, v2.4s }, [x27], #32 58add x0, x27, 1 59ld1 { v1.8b, v2.8b }, [x27], #16 60add x0, x27, 1 61ld1 { v1.8h, v2.8h }, [x27], #32 62add x0, x27, 1 63ld1 { v1.16b, v2.16b }, [x27], #32 64add x0, x27, 1 65ld1 { v1.1d, v2.1d }, [x27], x28 66add x0, x27, 1 67# LLVM-MCA-END 68 69# LLVM-MCA-BEGIN G06 70ld1 { v1.2d, v2.2d }, [x27], x28 71add x0, x27, 1 72ld1 { v1.2s, v2.2s }, [x27], x28 73add x0, x27, 1 74ld1 { v1.4h, v2.4h }, [x27], x28 75add x0, x27, 1 76ld1 { v1.4s, v2.4s }, [x27], x28 77add x0, x27, 1 78ld1 { v1.8b, v2.8b }, [x27], x28 79add x0, x27, 1 80# LLVM-MCA-END 81 82# LLVM-MCA-BEGIN G07 83ld1 { v1.8h, v2.8h }, [x27], x28 84add x0, x27, 1 85ld1 { v1.16b, v2.16b }, [x27], x28 86add x0, x27, 1 87ld1 { v1.1d, v2.1d, v3.1d }, [x27], #24 88add x0, x27, 1 89ld1 { v1.2d, v2.2d, v3.2d }, [x27], #48 90add x0, x27, 1 91ld1 { v1.2s, v2.2s, v3.2s }, [x27], #24 92add x0, x27, 1 93# LLVM-MCA-END 94 95# LLVM-MCA-BEGIN G08 96ld1 { v1.4h, v2.4h, v3.4h }, [x27], #24 97add x0, x27, 1 98ld1 { v1.4s, v2.4s, v3.4s }, [x27], #48 99add x0, x27, 1 100ld1 { v1.8b, v2.8b, v3.8b }, [x27], #24 101add x0, x27, 1 102ld1 { v1.8h, v2.8h, v3.8h }, [x27], #48 103add x0, x27, 1 104ld1 { v1.16b, v2.16b, v3.16b }, [x27], #48 105add x0, x27, 1 106# LLVM-MCA-END 107 108# LLVM-MCA-BEGIN G09 109ld1 { v1.1d, v2.1d, v3.1d }, [x27], x28 110add x0, x27, 1 111ld1 { v1.2d, v2.2d, v3.2d }, [x27], x28 112add x0, x27, 1 113ld1 { v1.2s, v2.2s, v3.2s }, [x27], x28 114add x0, x27, 1 115ld1 { v1.4h, v2.4h, v3.4h }, [x27], x28 116add x0, x27, 1 117ld1 { v1.4s, v2.4s, v3.4s }, [x27], x28 118add x0, x27, 1 119# LLVM-MCA-END 120 121# LLVM-MCA-BEGIN G10 122ld1 { v1.8b, v2.8b, v3.8b }, [x27], x28 123add x0, x27, 1 124ld1 { v1.8h, v2.8h, v3.8h }, [x27], x28 125add x0, x27, 1 126ld1 { v1.16b, v2.16b, v3.16b }, [x27], x28 127add x0, x27, 1 128ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 129add x0, x27, 1 130ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 131add x0, x27, 1 132# LLVM-MCA-END 133 134# LLVM-MCA-BEGIN G11 135ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 136add x0, x27, 1 137ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 138add x0, x27, 1 139ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 140add x0, x27, 1 141ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 142add x0, x27, 1 143ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 144add x0, x27, 1 145# LLVM-MCA-END 146 147# LLVM-MCA-BEGIN G12 148ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 149add x0, x27, 1 150ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 151add x0, x27, 1 152ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 153add x0, x27, 1 154ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 155add x0, x27, 1 156ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 157add x0, x27, 1 158# LLVM-MCA-END 159 160# LLVM-MCA-BEGIN G13 161ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 162add x0, x27, 1 163ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 164add x0, x27, 1 165ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 166add x0, x27, 1 167ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 168add x0, x27, 1 169ld1 { v1.b }[0], [x27], #1 170add x0, x27, 1 171# LLVM-MCA-END 172 173# LLVM-MCA-BEGIN G14 174ld1 { v1.b }[8], [x27], #1 175add x0, x27, 1 176ld1 { v1.b }[0], [x27], x28 177add x0, x27, 1 178ld1 { v1.b }[8], [x27], x28 179add x0, x27, 1 180ld1 { v1.h }[0], [x27], #2 181add x0, x27, 1 182ld1 { v1.h }[4], [x27], #2 183add x0, x27, 1 184# LLVM-MCA-END 185 186# LLVM-MCA-BEGIN G15 187ld1 { v1.h }[0], [x27], x28 188add x0, x27, 1 189ld1 { v1.h }[4], [x27], x28 190add x0, x27, 1 191ld1 { v1.s }[0], [x27], #4 192add x0, x27, 1 193ld1 { v1.s }[0], [x27], x28 194add x0, x27, 1 195ld1 { v1.d }[0], [x27], #8 196add x0, x27, 1 197# LLVM-MCA-END 198 199# LLVM-MCA-BEGIN G16 200ld1 { v1.d }[0], [x27], x28 201add x0, x27, 1 202ld1r { v1.1d }, [x27], #8 203add x0, x27, 1 204ld1r { v1.2d }, [x27], #8 205add x0, x27, 1 206ld1r { v1.2s }, [x27], #4 207add x0, x27, 1 208ld1r { v1.4h }, [x27], #2 209add x0, x27, 1 210# LLVM-MCA-END 211 212# LLVM-MCA-BEGIN G17 213ld1r { v1.4s }, [x27], #4 214add x0, x27, 1 215ld1r { v1.8b }, [x27], #1 216add x0, x27, 1 217ld1r { v1.8h }, [x27], #2 218add x0, x27, 1 219ld1r { v1.16b }, [x27], #1 220add x0, x27, 1 221ld1r { v1.1d }, [x27], x28 222add x0, x27, 1 223# LLVM-MCA-END 224 225# LLVM-MCA-BEGIN G18 226ld1r { v1.2d }, [x27], x28 227add x0, x27, 1 228ld1r { v1.2s }, [x27], x28 229add x0, x27, 1 230ld1r { v1.4h }, [x27], x28 231add x0, x27, 1 232ld1r { v1.4s }, [x27], x28 233add x0, x27, 1 234ld1r { v1.8b }, [x27], x28 235add x0, x27, 1 236# LLVM-MCA-END 237 238# LLVM-MCA-BEGIN G19 239ld1r { v1.8h }, [x27], x28 240add x0, x27, 1 241ld1r { v1.16b }, [x27], x28 242add x0, x27, 1 243ld2 { v1.2d, v2.2d }, [x27], #32 244add x0, x27, 1 245ld2 { v1.2s, v2.2s }, [x27], #16 246add x0, x27, 1 247ld2 { v1.4h, v2.4h }, [x27], #16 248add x0, x27, 1 249# LLVM-MCA-END 250 251# LLVM-MCA-BEGIN G20 252ld2 { v1.4s, v2.4s }, [x27], #32 253add x0, x27, 1 254ld2 { v1.8b, v2.8b }, [x27], #16 255add x0, x27, 1 256ld2 { v1.8h, v2.8h }, [x27], #32 257add x0, x27, 1 258ld2 { v1.16b, v2.16b }, [x27], #32 259add x0, x27, 1 260ld2 { v1.2d, v2.2d }, [x27], x28 261add x0, x27, 1 262# LLVM-MCA-END 263 264# LLVM-MCA-BEGIN G21 265ld2 { v1.2s, v2.2s }, [x27], x28 266add x0, x27, 1 267ld2 { v1.4h, v2.4h }, [x27], x28 268add x0, x27, 1 269ld2 { v1.4s, v2.4s }, [x27], x28 270add x0, x27, 1 271ld2 { v1.8b, v2.8b }, [x27], x28 272add x0, x27, 1 273ld2 { v1.8h, v2.8h }, [x27], x28 274add x0, x27, 1 275# LLVM-MCA-END 276 277# LLVM-MCA-BEGIN G22 278ld2 { v1.16b, v2.16b }, [x27], x28 279add x0, x27, 1 280ld2 { v1.b, v2.b }[0], [x27], #2 281add x0, x27, 1 282ld2 { v1.b, v2.b }[8], [x27], #2 283add x0, x27, 1 284ld2 { v1.b, v2.b }[0], [x27], x28 285add x0, x27, 1 286ld2 { v1.b, v2.b }[8], [x27], x28 287add x0, x27, 1 288# LLVM-MCA-END 289 290# LLVM-MCA-BEGIN G23 291ld2 { v1.h, v2.h }[0], [x27], #4 292add x0, x27, 1 293ld2 { v1.h, v2.h }[4], [x27], #4 294add x0, x27, 1 295ld2 { v1.h, v2.h }[0], [x27], x28 296add x0, x27, 1 297ld2 { v1.h, v2.h }[4], [x27], x28 298add x0, x27, 1 299ld2 { v1.s, v2.s }[0], [x27], #8 300add x0, x27, 1 301# LLVM-MCA-END 302 303# LLVM-MCA-BEGIN G24 304ld2 { v1.s, v2.s }[0], [x27], x28 305add x0, x27, 1 306ld2 { v1.d, v2.d }[0], [x27], #16 307add x0, x27, 1 308ld2 { v1.d, v2.d }[0], [x27], x28 309add x0, x27, 1 310ld2r { v1.1d, v2.1d }, [x27], #16 311add x0, x27, 1 312ld2r { v1.2d, v2.2d }, [x27], #16 313add x0, x27, 1 314# LLVM-MCA-END 315 316# LLVM-MCA-BEGIN G25 317ld2r { v1.2s, v2.2s }, [x27], #8 318add x0, x27, 1 319ld2r { v1.4h, v2.4h }, [x27], #4 320add x0, x27, 1 321ld2r { v1.4s, v2.4s }, [x27], #8 322add x0, x27, 1 323ld2r { v1.8b, v2.8b }, [x27], #2 324add x0, x27, 1 325ld2r { v1.8h, v2.8h }, [x27], #4 326add x0, x27, 1 327# LLVM-MCA-END 328 329# LLVM-MCA-BEGIN G26 330ld2r { v1.16b, v2.16b }, [x27], #2 331add x0, x27, 1 332ld2r { v1.1d, v2.1d }, [x27], x28 333add x0, x27, 1 334ld2r { v1.2d, v2.2d }, [x27], x28 335add x0, x27, 1 336ld2r { v1.2s, v2.2s }, [x27], x28 337add x0, x27, 1 338ld2r { v1.4h, v2.4h }, [x27], x28 339add x0, x27, 1 340# LLVM-MCA-END 341 342# LLVM-MCA-BEGIN G27 343ld2r { v1.4s, v2.4s }, [x27], x28 344add x0, x27, 1 345ld2r { v1.8b, v2.8b }, [x27], x28 346add x0, x27, 1 347ld2r { v1.8h, v2.8h }, [x27], x28 348add x0, x27, 1 349ld2r { v1.16b, v2.16b }, [x27], x28 350add x0, x27, 1 351ld3 { v1.2d, v2.2d, v3.2d }, [x27], #48 352add x0, x27, 1 353# LLVM-MCA-END 354 355# LLVM-MCA-BEGIN G28 356ld3 { v1.2s, v2.2s, v3.2s }, [x27], #24 357add x0, x27, 1 358ld3 { v1.4h, v2.4h, v3.4h }, [x27], #24 359add x0, x27, 1 360ld3 { v1.4s, v2.4s, v3.4s }, [x27], #48 361add x0, x27, 1 362ld3 { v1.8b, v2.8b, v3.8b }, [x27], #24 363add x0, x27, 1 364ld3 { v1.8h, v2.8h, v3.8h }, [x27], #48 365add x0, x27, 1 366# LLVM-MCA-END 367 368# LLVM-MCA-BEGIN G29 369ld3 { v1.16b, v2.16b, v3.16b }, [x27], #48 370add x0, x27, 1 371ld3 { v1.2d, v2.2d, v3.2d }, [x27], x28 372add x0, x27, 1 373ld3 { v1.2s, v2.2s, v3.2s }, [x27], x28 374add x0, x27, 1 375ld3 { v1.4h, v2.4h, v3.4h }, [x27], x28 376add x0, x27, 1 377ld3 { v1.4s, v2.4s, v3.4s }, [x27], x28 378add x0, x27, 1 379# LLVM-MCA-END 380 381# LLVM-MCA-BEGIN G30 382ld3 { v1.8b, v2.8b, v3.8b }, [x27], x28 383add x0, x27, 1 384ld3 { v1.8h, v2.8h, v3.8h }, [x27], x28 385add x0, x27, 1 386ld3 { v1.16b, v2.16b, v3.16b }, [x27], x28 387add x0, x27, 1 388ld3 { v1.b, v2.b, v3.b }[0], [x27], #3 389add x0, x27, 1 390ld3 { v1.b, v2.b, v3.b }[8], [x27], #3 391add x0, x27, 1 392# LLVM-MCA-END 393 394# LLVM-MCA-BEGIN G31 395ld3 { v1.b, v2.b, v3.b }[0], [x27], x28 396add x0, x27, 1 397ld3 { v1.b, v2.b, v3.b }[8], [x27], x28 398add x0, x27, 1 399ld3 { v1.h, v2.h, v3.h }[0], [x27], #6 400add x0, x27, 1 401ld3 { v1.h, v2.h, v3.h }[4], [x27], #6 402add x0, x27, 1 403ld3 { v1.h, v2.h, v3.h }[0], [x27], x28 404add x0, x27, 1 405# LLVM-MCA-END 406 407# LLVM-MCA-BEGIN G32 408ld3 { v1.h, v2.h, v3.h }[4], [x27], x28 409add x0, x27, 1 410ld3 { v1.s, v2.s, v3.s }[0], [x27], #12 411add x0, x27, 1 412ld3 { v1.s, v2.s, v3.s }[0], [x27], x28 413add x0, x27, 1 414ld3 { v1.d, v2.d, v3.d }[0], [x27], #24 415add x0, x27, 1 416ld3 { v1.d, v2.d, v3.d }[0], [x27], x28 417add x0, x27, 1 418# LLVM-MCA-END 419 420# LLVM-MCA-BEGIN G33 421ld3r { v1.1d, v2.1d, v3.1d }, [x27], #24 422add x0, x27, 1 423ld3r { v1.2d, v2.2d, v3.2d }, [x27], #24 424add x0, x27, 1 425ld3r { v1.2s, v2.2s, v3.2s }, [x27], #12 426add x0, x27, 1 427ld3r { v1.4h, v2.4h, v3.4h }, [x27], #6 428add x0, x27, 1 429ld3r { v1.4s, v2.4s, v3.4s }, [x27], #12 430add x0, x27, 1 431# LLVM-MCA-END 432 433# LLVM-MCA-BEGIN G34 434ld3r { v1.8b, v2.8b, v3.8b }, [x27], #3 435add x0, x27, 1 436ld3r { v1.8h, v2.8h, v3.8h }, [x27], #6 437add x0, x27, 1 438ld3r { v1.16b, v2.16b, v3.16b }, [x27], #3 439add x0, x27, 1 440ld3r { v1.1d, v2.1d, v3.1d }, [x27], x28 441add x0, x27, 1 442ld3r { v1.2d, v2.2d, v3.2d }, [x27], x28 443add x0, x27, 1 444# LLVM-MCA-END 445 446# LLVM-MCA-BEGIN G35 447ld3r { v1.2s, v2.2s, v3.2s }, [x27], x28 448add x0, x27, 1 449ld3r { v1.4h, v2.4h, v3.4h }, [x27], x28 450add x0, x27, 1 451ld3r { v1.4s, v2.4s, v3.4s }, [x27], x28 452add x0, x27, 1 453ld3r { v1.8b, v2.8b, v3.8b }, [x27], x28 454add x0, x27, 1 455ld3r { v1.8h, v2.8h, v3.8h }, [x27], x28 456add x0, x27, 1 457# LLVM-MCA-END 458 459# LLVM-MCA-BEGIN G36 460ld3r { v1.16b, v2.16b, v3.16b }, [x27], x28 461add x0, x27, 1 462ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 463add x0, x27, 1 464ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 465add x0, x27, 1 466ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 467add x0, x27, 1 468ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 469add x0, x27, 1 470# LLVM-MCA-END 471 472# LLVM-MCA-BEGIN G37 473ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 474add x0, x27, 1 475ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 476add x0, x27, 1 477ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 478add x0, x27, 1 479ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 480add x0, x27, 1 481ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 482add x0, x27, 1 483# LLVM-MCA-END 484 485# LLVM-MCA-BEGIN G38 486ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 487add x0, x27, 1 488ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 489add x0, x27, 1 490ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 491add x0, x27, 1 492ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 493add x0, x27, 1 494ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 495add x0, x27, 1 496# LLVM-MCA-END 497 498# LLVM-MCA-BEGIN G39 499ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 500add x0, x27, 1 501ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 502add x0, x27, 1 503ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 504add x0, x27, 1 505ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 506add x0, x27, 1 507ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 508add x0, x27, 1 509# LLVM-MCA-END 510 511# LLVM-MCA-BEGIN G40 512ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 513add x0, x27, 1 514ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 515add x0, x27, 1 516ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 517add x0, x27, 1 518ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 519add x0, x27, 1 520ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 521add x0, x27, 1 522# LLVM-MCA-END 523 524# LLVM-MCA-BEGIN G41 525ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 526add x0, x27, 1 527ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 528add x0, x27, 1 529ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 530add x0, x27, 1 531ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32 532add x0, x27, 1 533ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16 534add x0, x27, 1 535# LLVM-MCA-END 536 537# LLVM-MCA-BEGIN G42 538ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8 539add x0, x27, 1 540ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16 541add x0, x27, 1 542ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4 543add x0, x27, 1 544ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8 545add x0, x27, 1 546ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4 547add x0, x27, 1 548# LLVM-MCA-END 549 550# LLVM-MCA-BEGIN G43 551ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 552add x0, x27, 1 553ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 554add x0, x27, 1 555ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 556add x0, x27, 1 557ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 558add x0, x27, 1 559ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 560add x0, x27, 1 561# LLVM-MCA-END 562 563# LLVM-MCA-BEGIN G44 564ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 565add x0, x27, 1 566ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 567add x0, x27, 1 568ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 569add x0, x27, 1 570ldp s1, s2, [x27], #248 571add x0, x27, 1 572ldp d1, d2, [x27], #496 573add x0, x27, 1 574# LLVM-MCA-END 575 576# LLVM-MCA-BEGIN G45 577ldp q1, q2, [x27], #992 578add x0, x27, 1 579ldp s1, s2, [x27, #248]! 580add x0, x27, 1 581ldp d1, d2, [x27, #496]! 582add x0, x27, 1 583ldp q1, q2, [x27, #992]! 584add x0, x27, 1 585ldp w1, w2, [x27], #248 586add x0, x27, 1 587# LLVM-MCA-END 588 589# LLVM-MCA-BEGIN G46 590ldp x1, x2, [x27], #496 591add x0, x27, 1 592ldp w1, w2, [x27, #248]! 593add x0, x27, 1 594ldp x1, x2, [x27, #496]! 595add x0, x27, 1 596ldpsw x1, x2, [x27], #248 597add x0, x27, 1 598ldpsw x1, x2, [x27, #248]! 599add x0, x27, 1 600# LLVM-MCA-END 601 602# LLVM-MCA-BEGIN G47 603ldr b1, [x27], #254 604add x0, x27, 1 605ldr h1, [x27], #254 606add x0, x27, 1 607ldr s1, [x27], #254 608add x0, x27, 1 609ldr d1, [x27], #254 610add x0, x27, 1 611ldr q1, [x27], #254 612add x0, x27, 1 613# LLVM-MCA-END 614 615# LLVM-MCA-BEGIN G48 616ldr b1, [x27, #254]! 617add x0, x27, 1 618ldr h1, [x27, #254]! 619add x0, x27, 1 620ldr s1, [x27, #254]! 621add x0, x27, 1 622ldr d1, [x27, #254]! 623add x0, x27, 1 624ldr q1, [x27, #254]! 625add x0, x27, 1 626# LLVM-MCA-END 627 628# LLVM-MCA-BEGIN G49 629ldr w1, [x27], #254 630add x0, x27, 1 631ldr x1, [x27], #254 632add x0, x27, 1 633ldr w1, [x27, #254]! 634add x0, x27, 1 635ldr x1, [x27, #254]! 636add x0, x27, 1 637ldrb w1, [x27], #254 638add x0, x27, 1 639# LLVM-MCA-END 640 641# LLVM-MCA-BEGIN G50 642ldrb w1, [x27, #254]! 643add x0, x27, 1 644ldrh w1, [x27], #254 645add x0, x27, 1 646ldrh w1, [x27, #254]! 647add x0, x27, 1 648ldrsb w1, [x27], #254 649add x0, x27, 1 650ldrsb x1, [x27], #254 651add x0, x27, 1 652# LLVM-MCA-END 653 654# LLVM-MCA-BEGIN G51 655ldrsb w1, [x27, #254]! 656add x0, x27, 1 657ldrsb x1, [x27, #254]! 658add x0, x27, 1 659ldrsh w1, [x27], #254 660add x0, x27, 1 661ldrsh x1, [x27], #254 662add x0, x27, 1 663ldrsh w1, [x27, #254]! 664add x0, x27, 1 665# LLVM-MCA-END 666 667# LLVM-MCA-BEGIN G52 668ldrsh x1, [x27, #254]! 669add x0, x27, 1 670ldrsw x1, [x27], #254 671add x0, x27, 1 672ldrsw x1, [x27, #254]! 673add x0, x27, 1 674st1 { v1.1d }, [x27], #8 675add x0, x27, 1 676st1 { v1.2d }, [x27], #16 677add x0, x27, 1 678# LLVM-MCA-END 679 680# LLVM-MCA-BEGIN G53 681st1 { v1.2s }, [x27], #8 682add x0, x27, 1 683st1 { v1.4h }, [x27], #8 684add x0, x27, 1 685st1 { v1.4s }, [x27], #16 686add x0, x27, 1 687st1 { v1.8b }, [x27], #8 688add x0, x27, 1 689st1 { v1.8h }, [x27], #16 690add x0, x27, 1 691# LLVM-MCA-END 692 693# LLVM-MCA-BEGIN G54 694st1 { v1.16b }, [x27], #16 695add x0, x27, 1 696st1 { v1.1d }, [x27], x28 697add x0, x27, 1 698st1 { v1.2d }, [x27], x28 699add x0, x27, 1 700st1 { v1.2s }, [x27], x28 701add x0, x27, 1 702st1 { v1.4h }, [x27], x28 703add x0, x27, 1 704# LLVM-MCA-END 705 706# LLVM-MCA-BEGIN G55 707st1 { v1.4s }, [x27], x28 708add x0, x27, 1 709st1 { v1.8b }, [x27], x28 710add x0, x27, 1 711st1 { v1.8h }, [x27], x28 712add x0, x27, 1 713st1 { v1.16b }, [x27], x28 714add x0, x27, 1 715st1 { v1.1d, v2.1d }, [x27], #16 716add x0, x27, 1 717# LLVM-MCA-END 718 719# LLVM-MCA-BEGIN G56 720st1 { v1.2d, v2.2d }, [x27], #32 721add x0, x27, 1 722st1 { v1.2s, v2.2s }, [x27], #16 723add x0, x27, 1 724st1 { v1.4h, v2.4h }, [x27], #16 725add x0, x27, 1 726st1 { v1.4s, v2.4s }, [x27], #32 727add x0, x27, 1 728st1 { v1.8b, v2.8b }, [x27], #16 729add x0, x27, 1 730# LLVM-MCA-END 731 732# LLVM-MCA-BEGIN G57 733st1 { v1.8h, v2.8h }, [x27], #32 734add x0, x27, 1 735st1 { v1.16b, v2.16b }, [x27], #32 736add x0, x27, 1 737st1 { v1.1d, v2.1d }, [x27], x28 738add x0, x27, 1 739st1 { v1.2d, v2.2d }, [x27], x28 740add x0, x27, 1 741st1 { v1.2s, v2.2s }, [x27], x28 742add x0, x27, 1 743# LLVM-MCA-END 744 745# LLVM-MCA-BEGIN G58 746st1 { v1.4h, v2.4h }, [x27], x28 747add x0, x27, 1 748st1 { v1.4s, v2.4s }, [x27], x28 749add x0, x27, 1 750st1 { v1.8b, v2.8b }, [x27], x28 751add x0, x27, 1 752st1 { v1.8h, v2.8h }, [x27], x28 753add x0, x27, 1 754st1 { v1.16b, v2.16b }, [x27], x28 755add x0, x27, 1 756# LLVM-MCA-END 757 758# LLVM-MCA-BEGIN G59 759st1 { v1.1d, v2.1d, v3.1d }, [x27], #24 760add x0, x27, 1 761st1 { v1.2d, v2.2d, v3.2d }, [x27], #48 762add x0, x27, 1 763st1 { v1.2s, v2.2s, v3.2s }, [x27], #24 764add x0, x27, 1 765st1 { v1.4h, v2.4h, v3.4h }, [x27], #24 766add x0, x27, 1 767st1 { v1.4s, v2.4s, v3.4s }, [x27], #48 768add x0, x27, 1 769# LLVM-MCA-END 770 771# LLVM-MCA-BEGIN G60 772st1 { v1.8b, v2.8b, v3.8b }, [x27], #24 773add x0, x27, 1 774st1 { v1.8h, v2.8h, v3.8h }, [x27], #48 775add x0, x27, 1 776st1 { v1.16b, v2.16b, v3.16b }, [x27], #48 777add x0, x27, 1 778st1 { v1.1d, v2.1d, v3.1d }, [x27], x28 779add x0, x27, 1 780st1 { v1.2d, v2.2d, v3.2d }, [x27], x28 781add x0, x27, 1 782# LLVM-MCA-END 783 784# LLVM-MCA-BEGIN G61 785st1 { v1.2s, v2.2s, v3.2s }, [x27], x28 786add x0, x27, 1 787st1 { v1.4h, v2.4h, v3.4h }, [x27], x28 788add x0, x27, 1 789st1 { v1.4s, v2.4s, v3.4s }, [x27], x28 790add x0, x27, 1 791st1 { v1.8b, v2.8b, v3.8b }, [x27], x28 792add x0, x27, 1 793st1 { v1.8h, v2.8h, v3.8h }, [x27], x28 794add x0, x27, 1 795# LLVM-MCA-END 796 797# LLVM-MCA-BEGIN G62 798st1 { v1.16b, v2.16b, v3.16b }, [x27], x28 799add x0, x27, 1 800st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 801add x0, x27, 1 802st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 803add x0, x27, 1 804st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 805add x0, x27, 1 806st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 807add x0, x27, 1 808# LLVM-MCA-END 809 810# LLVM-MCA-BEGIN G63 811st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 812add x0, x27, 1 813st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 814add x0, x27, 1 815st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 816add x0, x27, 1 817st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 818add x0, x27, 1 819st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 820add x0, x27, 1 821# LLVM-MCA-END 822 823# LLVM-MCA-BEGIN G64 824st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 825add x0, x27, 1 826st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 827add x0, x27, 1 828st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 829add x0, x27, 1 830st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 831add x0, x27, 1 832st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 833add x0, x27, 1 834# LLVM-MCA-END 835 836# LLVM-MCA-BEGIN G65 837st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 838add x0, x27, 1 839st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 840add x0, x27, 1 841st1 { v1.b }[0], [x27], #1 842add x0, x27, 1 843st1 { v1.b }[8], [x27], #1 844add x0, x27, 1 845st1 { v1.b }[0], [x27], x28 846add x0, x27, 1 847# LLVM-MCA-END 848 849# LLVM-MCA-BEGIN G66 850st1 { v1.b }[8], [x27], x28 851add x0, x27, 1 852st1 { v1.h }[0], [x27], #2 853add x0, x27, 1 854st1 { v1.h }[4], [x27], #2 855add x0, x27, 1 856st1 { v1.h }[0], [x27], x28 857add x0, x27, 1 858st1 { v1.h }[4], [x27], x28 859add x0, x27, 1 860# LLVM-MCA-END 861 862# LLVM-MCA-BEGIN G67 863st1 { v1.s }[0], [x27], #4 864add x0, x27, 1 865st1 { v1.s }[0], [x27], x28 866add x0, x27, 1 867st1 { v1.d }[0], [x27], #8 868add x0, x27, 1 869st1 { v1.d }[0], [x27], x28 870add x0, x27, 1 871st2 { v1.2d, v2.2d }, [x27], #32 872add x0, x27, 1 873# LLVM-MCA-END 874 875# LLVM-MCA-BEGIN G68 876st2 { v1.2s, v2.2s }, [x27], #16 877add x0, x27, 1 878st2 { v1.4h, v2.4h }, [x27], #16 879add x0, x27, 1 880st2 { v1.4s, v2.4s }, [x27], #32 881add x0, x27, 1 882st2 { v1.8b, v2.8b }, [x27], #16 883add x0, x27, 1 884st2 { v1.8h, v2.8h }, [x27], #32 885add x0, x27, 1 886# LLVM-MCA-END 887 888# LLVM-MCA-BEGIN G69 889st2 { v1.16b, v2.16b }, [x27], #32 890add x0, x27, 1 891st2 { v1.2d, v2.2d }, [x27], x28 892add x0, x27, 1 893st2 { v1.2s, v2.2s }, [x27], x28 894add x0, x27, 1 895st2 { v1.4h, v2.4h }, [x27], x28 896add x0, x27, 1 897st2 { v1.4s, v2.4s }, [x27], x28 898add x0, x27, 1 899# LLVM-MCA-END 900 901# LLVM-MCA-BEGIN G70 902st2 { v1.8b, v2.8b }, [x27], x28 903add x0, x27, 1 904st2 { v1.8h, v2.8h }, [x27], x28 905add x0, x27, 1 906st2 { v1.16b, v2.16b }, [x27], x28 907add x0, x27, 1 908st2 { v1.b, v2.b }[0], [x27], #2 909add x0, x27, 1 910st2 { v1.b, v2.b }[8], [x27], #2 911add x0, x27, 1 912# LLVM-MCA-END 913 914# LLVM-MCA-BEGIN G71 915st2 { v1.b, v2.b }[0], [x27], x28 916add x0, x27, 1 917st2 { v1.b, v2.b }[8], [x27], x28 918add x0, x27, 1 919st2 { v1.h, v2.h }[0], [x27], #4 920add x0, x27, 1 921st2 { v1.h, v2.h }[4], [x27], #4 922add x0, x27, 1 923st2 { v1.h, v2.h }[0], [x27], x28 924add x0, x27, 1 925# LLVM-MCA-END 926 927# LLVM-MCA-BEGIN G72 928st2 { v1.h, v2.h }[4], [x27], x28 929add x0, x27, 1 930st2 { v1.s, v2.s }[0], [x27], #8 931add x0, x27, 1 932st2 { v1.s, v2.s }[0], [x27], x28 933add x0, x27, 1 934st2 { v1.d, v2.d }[0], [x27], #16 935add x0, x27, 1 936st2 { v1.d, v2.d }[0], [x27], x28 937add x0, x27, 1 938# LLVM-MCA-END 939 940# LLVM-MCA-BEGIN G73 941st3 { v1.2d, v2.2d, v3.2d }, [x27], #48 942add x0, x27, 1 943st3 { v1.2s, v2.2s, v3.2s }, [x27], #24 944add x0, x27, 1 945st3 { v1.4h, v2.4h, v3.4h }, [x27], #24 946add x0, x27, 1 947# LLVM-MCA-END 948 949# LLVM-MCA-BEGIN G74 950st3 { v1.4s, v2.4s, v3.4s }, [x27], #48 951add x0, x27, 1 952st3 { v1.8b, v2.8b, v3.8b }, [x27], #24 953add x0, x27, 1 954st3 { v1.8h, v2.8h, v3.8h }, [x27], #48 955add x0, x27, 1 956st3 { v1.16b, v2.16b, v3.16b }, [x27], #48 957add x0, x27, 1 958st3 { v1.2d, v2.2d, v3.2d }, [x27], x28 959add x0, x27, 1 960# LLVM-MCA-END 961 962# LLVM-MCA-BEGIN G75 963st3 { v1.2s, v2.2s, v3.2s }, [x27], x28 964add x0, x27, 1 965st3 { v1.4h, v2.4h, v3.4h }, [x27], x28 966add x0, x27, 1 967st3 { v1.4s, v2.4s, v3.4s }, [x27], x28 968add x0, x27, 1 969st3 { v1.8b, v2.8b, v3.8b }, [x27], x28 970add x0, x27, 1 971st3 { v1.8h, v2.8h, v3.8h }, [x27], x28 972add x0, x27, 1 973# LLVM-MCA-END 974 975# LLVM-MCA-BEGIN G76 976st3 { v1.16b, v2.16b, v3.16b }, [x27], x28 977add x0, x27, 1 978st3 { v1.b, v2.b, v3.b }[0], [x27], #3 979add x0, x27, 1 980st3 { v1.b, v2.b, v3.b }[8], [x27], #3 981add x0, x27, 1 982st3 { v1.b, v2.b, v3.b }[0], [x27], x28 983add x0, x27, 1 984st3 { v1.b, v2.b, v3.b }[8], [x27], x28 985add x0, x27, 1 986# LLVM-MCA-END 987 988# LLVM-MCA-BEGIN G77 989st3 { v1.h, v2.h, v3.h }[0], [x27], #6 990add x0, x27, 1 991st3 { v1.h, v2.h, v3.h }[4], [x27], #6 992add x0, x27, 1 993st3 { v1.h, v2.h, v3.h }[0], [x27], x28 994add x0, x27, 1 995st3 { v1.h, v2.h, v3.h }[4], [x27], x28 996add x0, x27, 1 997st3 { v1.s, v2.s, v3.s }[0], [x27], #12 998add x0, x27, 1 999# LLVM-MCA-END 1000 1001# LLVM-MCA-BEGIN G78 1002st3 { v1.s, v2.s, v3.s }[0], [x27], x28 1003add x0, x27, 1 1004st3 { v1.d, v2.d, v3.d }[0], [x27], #24 1005add x0, x27, 1 1006st3 { v1.d, v2.d, v3.d }[0], [x27], x28 1007add x0, x27, 1 1008st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 1009add x0, x27, 1 1010st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 1011add x0, x27, 1 1012# LLVM-MCA-END 1013 1014# LLVM-MCA-BEGIN G79 1015st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 1016add x0, x27, 1 1017st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 1018add x0, x27, 1 1019st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 1020add x0, x27, 1 1021st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 1022add x0, x27, 1 1023st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 1024add x0, x27, 1 1025# LLVM-MCA-END 1026 1027# LLVM-MCA-BEGIN G80 1028st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 1029add x0, x27, 1 1030st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 1031add x0, x27, 1 1032st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 1033add x0, x27, 1 1034st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 1035add x0, x27, 1 1036st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 1037add x0, x27, 1 1038# LLVM-MCA-END 1039 1040# LLVM-MCA-BEGIN G81 1041st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 1042add x0, x27, 1 1043st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 1044add x0, x27, 1 1045st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 1046add x0, x27, 1 1047st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 1048add x0, x27, 1 1049st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 1050add x0, x27, 1 1051# LLVM-MCA-END 1052 1053# LLVM-MCA-BEGIN G82 1054st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 1055add x0, x27, 1 1056st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 1057add x0, x27, 1 1058st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 1059add x0, x27, 1 1060st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 1061add x0, x27, 1 1062st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 1063add x0, x27, 1 1064# LLVM-MCA-END 1065 1066# LLVM-MCA-BEGIN G83 1067st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 1068add x0, x27, 1 1069st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 1070add x0, x27, 1 1071st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 1072add x0, x27, 1 1073st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 1074add x0, x27, 1 1075# LLVM-MCA-END 1076 1077# LLVM-MCA-BEGIN G84 1078stp s1, s2, [x27], #248 1079add x0, x27, 1 1080stp d1, d2, [x27], #496 1081add x0, x27, 1 1082# LLVM-MCA-END 1083 1084# LLVM-MCA-BEGIN G85 1085stp q1, q2, [x27], #992 1086add x0, x27, 1 1087stp s1, s2, [x27, #248]! 1088add x0, x27, 1 1089stp d1, d2, [x27, #496]! 1090add x0, x27, 1 1091stp q1, q2, [x27, #992]! 1092add x0, x27, 1 1093stp w1, w2, [x27], #248 1094add x0, x27, 1 1095# LLVM-MCA-END 1096 1097# LLVM-MCA-BEGIN G86 1098stp x1, x2, [x27], #496 1099add x0, x27, 1 1100stp w1, w2, [x27, #248]! 1101add x0, x27, 1 1102stp x1, x2, [x27, #496]! 1103add x0, x27, 1 1104str b1, [x27], #254 1105add x0, x27, 1 1106str h1, [x27], #254 1107add x0, x27, 1 1108# LLVM-MCA-END 1109 1110# LLVM-MCA-BEGIN G87 1111str s1, [x27], #254 1112add x0, x27, 1 1113str d1, [x27], #254 1114add x0, x27, 1 1115str q1, [x27], #254 1116add x0, x27, 1 1117str b1, [x27, #254]! 1118add x0, x27, 1 1119str h1, [x27, #254]! 1120add x0, x27, 1 1121# LLVM-MCA-END 1122 1123# LLVM-MCA-BEGIN G88 1124str s1, [x27, #254]! 1125add x0, x27, 1 1126str d1, [x27, #254]! 1127add x0, x27, 1 1128str q1, [x27, #254]! 1129add x0, x27, 1 1130str w1, [x27], #254 1131add x0, x27, 1 1132str x1, [x27], #254 1133add x0, x27, 1 1134# LLVM-MCA-END 1135 1136# LLVM-MCA-BEGIN G89 1137str w1, [x27, #254]! 1138add x0, x27, 1 1139str x1, [x27, #254]! 1140add x0, x27, 1 1141strb w1, [x27], #254 1142add x0, x27, 1 1143strb w1, [x27, #254]! 1144add x0, x27, 1 1145strh w1, [x27], #254 1146add x0, x27, 1 1147# LLVM-MCA-END 1148 1149# LLVM-MCA-BEGIN G90 1150strh w1, [x27, #254]! 1151add x0, x27, 1 1152# LLVM-MCA-END 1153 1154# LLVM-MCA-BEGIN G91 1155ldr x1, [x27], #254 1156add x0, x27, 1 1157ldr x2, [x1], #254 1158add x0, x27, 1 1159# LLVM-MCA-END 1160 1161# CHECK: [0] Code Region - G01 1162 1163# CHECK: Iterations: 100 1164# CHECK-NEXT: Instructions: 1000 1165# CHECK-NEXT: Total Cycles: 507 1166# CHECK-NEXT: Total uOps: 1500 1167 1168# CHECK: Dispatch Width: 3 1169# CHECK-NEXT: uOps Per Cycle: 2.96 1170# CHECK-NEXT: IPC: 1.97 1171# CHECK-NEXT: Block RThroughput: 5.0 1172 1173# CHECK: Timeline view: 1174# CHECK-NEXT: 01 1175# CHECK-NEXT: Index 0123456789 1176 1177# CHECK: [0,0] DeeeeeER .. ld1 { v1.1d }, [x27], #8 1178# CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1 1179# CHECK-NEXT: [0,2] .DeeeeeER .. ld1 { v1.2d }, [x27], #16 1180# CHECK-NEXT: [0,3] .D=eE---R .. add x0, x27, #1 1181# CHECK-NEXT: [0,4] . DeeeeeER.. ld1 { v1.2s }, [x27], #8 1182# CHECK-NEXT: [0,5] . D=eE---R.. add x0, x27, #1 1183# CHECK-NEXT: [0,6] . DeeeeeER. ld1 { v1.4h }, [x27], #8 1184# CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1 1185# CHECK-NEXT: [0,8] . DeeeeeER ld1 { v1.4s }, [x27], #16 1186# CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1 1187 1188# CHECK: Average Wait times (based on the timeline view): 1189# CHECK-NEXT: [0]: Executions 1190# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1191# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1192# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1193 1194# CHECK: [0] [1] [2] [3] 1195# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.1d }, [x27], #8 1196# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 1197# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1 { v1.2d }, [x27], #16 1198# CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1 1199# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.2s }, [x27], #8 1200# CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1 1201# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld1 { v1.4h }, [x27], #8 1202# CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1 1203# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ld1 { v1.4s }, [x27], #16 1204# CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1 1205# CHECK-NEXT: 1 1.5 0.1 1.5 <total> 1206 1207# CHECK: [1] Code Region - G02 1208 1209# CHECK: Iterations: 100 1210# CHECK-NEXT: Instructions: 1000 1211# CHECK-NEXT: Total Cycles: 507 1212# CHECK-NEXT: Total uOps: 1500 1213 1214# CHECK: Dispatch Width: 3 1215# CHECK-NEXT: uOps Per Cycle: 2.96 1216# CHECK-NEXT: IPC: 1.97 1217# CHECK-NEXT: Block RThroughput: 5.0 1218 1219# CHECK: Timeline view: 1220# CHECK-NEXT: 01 1221# CHECK-NEXT: Index 0123456789 1222 1223# CHECK: [0,0] DeeeeeER .. ld1 { v1.8b }, [x27], #8 1224# CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1 1225# CHECK-NEXT: [0,2] .DeeeeeER .. ld1 { v1.8h }, [x27], #16 1226# CHECK-NEXT: [0,3] .D=eE---R .. add x0, x27, #1 1227# CHECK-NEXT: [0,4] . DeeeeeER.. ld1 { v1.16b }, [x27], #16 1228# CHECK-NEXT: [0,5] . D=eE---R.. add x0, x27, #1 1229# CHECK-NEXT: [0,6] . DeeeeeER. ld1 { v1.1d }, [x27], x28 1230# CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1 1231# CHECK-NEXT: [0,8] . DeeeeeER ld1 { v1.2d }, [x27], x28 1232# CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1 1233 1234# CHECK: Average Wait times (based on the timeline view): 1235# CHECK-NEXT: [0]: Executions 1236# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1237# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1238# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1239 1240# CHECK: [0] [1] [2] [3] 1241# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8b }, [x27], #8 1242# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 1243# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1 { v1.8h }, [x27], #16 1244# CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1 1245# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.16b }, [x27], #16 1246# CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1 1247# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld1 { v1.1d }, [x27], x28 1248# CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1 1249# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ld1 { v1.2d }, [x27], x28 1250# CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1 1251# CHECK-NEXT: 1 1.5 0.1 1.5 <total> 1252 1253# CHECK: [2] Code Region - G03 1254 1255# CHECK: Iterations: 100 1256# CHECK-NEXT: Instructions: 1000 1257# CHECK-NEXT: Total Cycles: 507 1258# CHECK-NEXT: Total uOps: 1500 1259 1260# CHECK: Dispatch Width: 3 1261# CHECK-NEXT: uOps Per Cycle: 2.96 1262# CHECK-NEXT: IPC: 1.97 1263# CHECK-NEXT: Block RThroughput: 5.0 1264 1265# CHECK: Timeline view: 1266# CHECK-NEXT: 01 1267# CHECK-NEXT: Index 0123456789 1268 1269# CHECK: [0,0] DeeeeeER .. ld1 { v1.2s }, [x27], x28 1270# CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1 1271# CHECK-NEXT: [0,2] .DeeeeeER .. ld1 { v1.4h }, [x27], x28 1272# CHECK-NEXT: [0,3] .D=eE---R .. add x0, x27, #1 1273# CHECK-NEXT: [0,4] . DeeeeeER.. ld1 { v1.4s }, [x27], x28 1274# CHECK-NEXT: [0,5] . D=eE---R.. add x0, x27, #1 1275# CHECK-NEXT: [0,6] . DeeeeeER. ld1 { v1.8b }, [x27], x28 1276# CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1 1277# CHECK-NEXT: [0,8] . DeeeeeER ld1 { v1.8h }, [x27], x28 1278# CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1 1279 1280# CHECK: Average Wait times (based on the timeline view): 1281# CHECK-NEXT: [0]: Executions 1282# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1283# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1284# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1285 1286# CHECK: [0] [1] [2] [3] 1287# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2s }, [x27], x28 1288# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 1289# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1 { v1.4h }, [x27], x28 1290# CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1 1291# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.4s }, [x27], x28 1292# CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1 1293# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld1 { v1.8b }, [x27], x28 1294# CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1 1295# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ld1 { v1.8h }, [x27], x28 1296# CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1 1297# CHECK-NEXT: 1 1.5 0.1 1.5 <total> 1298 1299# CHECK: [3] Code Region - G04 1300 1301# CHECK: Iterations: 100 1302# CHECK-NEXT: Instructions: 1000 1303# CHECK-NEXT: Total Cycles: 607 1304# CHECK-NEXT: Total uOps: 1600 1305 1306# CHECK: Dispatch Width: 3 1307# CHECK-NEXT: uOps Per Cycle: 2.64 1308# CHECK-NEXT: IPC: 1.65 1309# CHECK-NEXT: Block RThroughput: 6.0 1310 1311# CHECK: Timeline view: 1312# CHECK-NEXT: 012 1313# CHECK-NEXT: Index 0123456789 1314 1315# CHECK: [0,0] DeeeeeER . . ld1 { v1.16b }, [x27], x28 1316# CHECK-NEXT: [0,1] D=eE---R . . add x0, x27, #1 1317# CHECK-NEXT: [0,2] .DeeeeeER . . ld1 { v1.1d, v2.1d }, [x27], #16 1318# CHECK-NEXT: [0,3] .D=eE---R . . add x0, x27, #1 1319# CHECK-NEXT: [0,4] . DeeeeeeER . ld1 { v1.2d, v2.2d }, [x27], #32 1320# CHECK-NEXT: [0,5] . DeE----R . add x0, x27, #1 1321# CHECK-NEXT: [0,6] . D=eeeeeER. ld1 { v1.2s, v2.2s }, [x27], #16 1322# CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1 1323# CHECK-NEXT: [0,8] . D=eeeeeER ld1 { v1.4h, v2.4h }, [x27], #16 1324# CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1 1325 1326# CHECK: Average Wait times (based on the timeline view): 1327# CHECK-NEXT: [0]: Executions 1328# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1329# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1330# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1331 1332# CHECK: [0] [1] [2] [3] 1333# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.16b }, [x27], x28 1334# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 1335# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1 { v1.1d, v2.1d }, [x27], #16 1336# CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1 1337# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.2d, v2.2d }, [x27], #32 1338# CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1 1339# CHECK-NEXT: 6. 1 2.0 1.0 0.0 ld1 { v1.2s, v2.2s }, [x27], #16 1340# CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1 1341# CHECK-NEXT: 8. 1 2.0 0.0 0.0 ld1 { v1.4h, v2.4h }, [x27], #16 1342# CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1 1343# CHECK-NEXT: 1 1.6 0.2 1.6 <total> 1344 1345# CHECK: [4] Code Region - G05 1346 1347# CHECK: Iterations: 100 1348# CHECK-NEXT: Instructions: 1000 1349# CHECK-NEXT: Total Cycles: 807 1350# CHECK-NEXT: Total uOps: 1800 1351 1352# CHECK: Dispatch Width: 3 1353# CHECK-NEXT: uOps Per Cycle: 2.23 1354# CHECK-NEXT: IPC: 1.24 1355# CHECK-NEXT: Block RThroughput: 8.0 1356 1357# CHECK: Timeline view: 1358# CHECK-NEXT: 01234 1359# CHECK-NEXT: Index 0123456789 1360 1361# CHECK: [0,0] DeeeeeeER . . ld1 { v1.4s, v2.4s }, [x27], #32 1362# CHECK-NEXT: [0,1] .DeE----R . . add x0, x27, #1 1363# CHECK-NEXT: [0,2] .D=eeeeeER. . ld1 { v1.8b, v2.8b }, [x27], #16 1364# CHECK-NEXT: [0,3] . D=eE---R. . add x0, x27, #1 1365# CHECK-NEXT: [0,4] . DeeeeeeER . ld1 { v1.8h, v2.8h }, [x27], #32 1366# CHECK-NEXT: [0,5] . DeE----R . add x0, x27, #1 1367# CHECK-NEXT: [0,6] . DeeeeeeER. ld1 { v1.16b, v2.16b }, [x27], #32 1368# CHECK-NEXT: [0,7] . .DeE----R. add x0, x27, #1 1369# CHECK-NEXT: [0,8] . .D=eeeeeER ld1 { v1.1d, v2.1d }, [x27], x28 1370# CHECK-NEXT: [0,9] . . D=eE---R add x0, x27, #1 1371 1372# CHECK: Average Wait times (based on the timeline view): 1373# CHECK-NEXT: [0]: Executions 1374# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1375# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1376# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1377 1378# CHECK: [0] [1] [2] [3] 1379# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s }, [x27], #32 1380# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 1381# CHECK-NEXT: 2. 1 2.0 1.0 0.0 ld1 { v1.8b, v2.8b }, [x27], #16 1382# CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1 1383# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1 { v1.8h, v2.8h }, [x27], #32 1384# CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1 1385# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1 { v1.16b, v2.16b }, [x27], #32 1386# CHECK-NEXT: 7. 1 1.0 0.0 4.0 add x0, x27, #1 1387# CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld1 { v1.1d, v2.1d }, [x27], x28 1388# CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1 1389# CHECK-NEXT: 1 1.4 0.4 1.8 <total> 1390 1391# CHECK: [5] Code Region - G06 1392 1393# CHECK: Iterations: 100 1394# CHECK-NEXT: Instructions: 1000 1395# CHECK-NEXT: Total Cycles: 707 1396# CHECK-NEXT: Total uOps: 1700 1397 1398# CHECK: Dispatch Width: 3 1399# CHECK-NEXT: uOps Per Cycle: 2.40 1400# CHECK-NEXT: IPC: 1.41 1401# CHECK-NEXT: Block RThroughput: 7.0 1402 1403# CHECK: Timeline view: 1404# CHECK-NEXT: 0123 1405# CHECK-NEXT: Index 0123456789 1406 1407# CHECK: [0,0] DeeeeeeER . . ld1 { v1.2d, v2.2d }, [x27], x28 1408# CHECK-NEXT: [0,1] .DeE----R . . add x0, x27, #1 1409# CHECK-NEXT: [0,2] .D=eeeeeER. . ld1 { v1.2s, v2.2s }, [x27], x28 1410# CHECK-NEXT: [0,3] . D=eE---R. . add x0, x27, #1 1411# CHECK-NEXT: [0,4] . D=eeeeeER . ld1 { v1.4h, v2.4h }, [x27], x28 1412# CHECK-NEXT: [0,5] . D=eE---R . add x0, x27, #1 1413# CHECK-NEXT: [0,6] . DeeeeeeER. ld1 { v1.4s, v2.4s }, [x27], x28 1414# CHECK-NEXT: [0,7] . DeE----R. add x0, x27, #1 1415# CHECK-NEXT: [0,8] . D=eeeeeER ld1 { v1.8b, v2.8b }, [x27], x28 1416# CHECK-NEXT: [0,9] . .D=eE---R add x0, x27, #1 1417 1418# CHECK: Average Wait times (based on the timeline view): 1419# CHECK-NEXT: [0]: Executions 1420# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1421# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1422# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1423 1424# CHECK: [0] [1] [2] [3] 1425# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2d, v2.2d }, [x27], x28 1426# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 1427# CHECK-NEXT: 2. 1 2.0 1.0 0.0 ld1 { v1.2s, v2.2s }, [x27], x28 1428# CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1 1429# CHECK-NEXT: 4. 1 2.0 0.0 0.0 ld1 { v1.4h, v2.4h }, [x27], x28 1430# CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1 1431# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ld1 { v1.4s, v2.4s }, [x27], x28 1432# CHECK-NEXT: 7. 1 1.0 0.0 4.0 add x0, x27, #1 1433# CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld1 { v1.8b, v2.8b }, [x27], x28 1434# CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1 1435# CHECK-NEXT: 1 1.6 0.3 1.7 <total> 1436 1437# CHECK: [6] Code Region - G07 1438 1439# CHECK: Iterations: 100 1440# CHECK-NEXT: Instructions: 1000 1441# CHECK-NEXT: Total Cycles: 1107 1442# CHECK-NEXT: Total uOps: 2100 1443 1444# CHECK: Dispatch Width: 3 1445# CHECK-NEXT: uOps Per Cycle: 1.90 1446# CHECK-NEXT: IPC: 0.90 1447# CHECK-NEXT: Block RThroughput: 11.0 1448 1449# CHECK: Timeline view: 1450# CHECK-NEXT: 01234567 1451# CHECK-NEXT: Index 0123456789 1452 1453# CHECK: [0,0] DeeeeeeER . . . ld1 { v1.8h, v2.8h }, [x27], x28 1454# CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1 1455# CHECK-NEXT: [0,2] . DeeeeeeER . . ld1 { v1.16b, v2.16b }, [x27], x28 1456# CHECK-NEXT: [0,3] . DeE----R . . add x0, x27, #1 1457# CHECK-NEXT: [0,4] . DeeeeeeER . . ld1 { v1.1d, v2.1d, v3.1d }, [x27], #24 1458# CHECK-NEXT: [0,5] . DeE----R . . add x0, x27, #1 1459# CHECK-NEXT: [0,6] . .DeeeeeeeER . ld1 { v1.2d, v2.2d, v3.2d }, [x27], #48 1460# CHECK-NEXT: [0,7] . . DeE-----R . add x0, x27, #1 1461# CHECK-NEXT: [0,8] . . D=eeeeeeER ld1 { v1.2s, v2.2s, v3.2s }, [x27], #24 1462# CHECK-NEXT: [0,9] . . D=eE----R add x0, x27, #1 1463 1464# CHECK: Average Wait times (based on the timeline view): 1465# CHECK-NEXT: [0]: Executions 1466# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1467# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1468# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1469 1470# CHECK: [0] [1] [2] [3] 1471# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8h, v2.8h }, [x27], x28 1472# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 1473# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.16b, v2.16b }, [x27], x28 1474# CHECK-NEXT: 3. 1 1.0 0.0 4.0 add x0, x27, #1 1475# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld1 { v1.1d, v2.1d, v3.1d }, [x27], #24 1476# CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1 1477# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1 { v1.2d, v2.2d, v3.2d }, [x27], #48 1478# CHECK-NEXT: 7. 1 1.0 0.0 5.0 add x0, x27, #1 1479# CHECK-NEXT: 8. 1 2.0 2.0 0.0 ld1 { v1.2s, v2.2s, v3.2s }, [x27], #24 1480# CHECK-NEXT: 9. 1 2.0 0.0 4.0 add x0, x27, #1 1481# CHECK-NEXT: 1 1.2 0.6 2.1 <total> 1482 1483# CHECK: [7] Code Region - G08 1484 1485# CHECK: Iterations: 100 1486# CHECK-NEXT: Instructions: 1000 1487# CHECK-NEXT: Total Cycles: 1307 1488# CHECK-NEXT: Total uOps: 2300 1489 1490# CHECK: Dispatch Width: 3 1491# CHECK-NEXT: uOps Per Cycle: 1.76 1492# CHECK-NEXT: IPC: 0.77 1493# CHECK-NEXT: Block RThroughput: 13.0 1494 1495# CHECK: Timeline view: 1496# CHECK-NEXT: 0123456789 1497# CHECK-NEXT: Index 0123456789 1498 1499# CHECK: [0,0] DeeeeeeER . . . ld1 { v1.4h, v2.4h, v3.4h }, [x27], #24 1500# CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1 1501# CHECK-NEXT: [0,2] . DeeeeeeeER . . ld1 { v1.4s, v2.4s, v3.4s }, [x27], #48 1502# CHECK-NEXT: [0,3] . DeE-----R . . add x0, x27, #1 1503# CHECK-NEXT: [0,4] . D=eeeeeeER . . ld1 { v1.8b, v2.8b, v3.8b }, [x27], #24 1504# CHECK-NEXT: [0,5] . D=eE----R . . add x0, x27, #1 1505# CHECK-NEXT: [0,6] . .D=eeeeeeeER . ld1 { v1.8h, v2.8h, v3.8h }, [x27], #48 1506# CHECK-NEXT: [0,7] . . D=eE-----R . add x0, x27, #1 1507# CHECK-NEXT: [0,8] . . D==eeeeeeeER ld1 { v1.16b, v2.16b, v3.16b }, [x27], #48 1508# CHECK-NEXT: [0,9] . . D==eE-----R add x0, x27, #1 1509 1510# CHECK: Average Wait times (based on the timeline view): 1511# CHECK-NEXT: [0]: Executions 1512# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1513# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1514# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1515 1516# CHECK: [0] [1] [2] [3] 1517# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h }, [x27], #24 1518# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 1519# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s }, [x27], #48 1520# CHECK-NEXT: 3. 1 1.0 0.0 5.0 add x0, x27, #1 1521# CHECK-NEXT: 4. 1 2.0 2.0 0.0 ld1 { v1.8b, v2.8b, v3.8b }, [x27], #24 1522# CHECK-NEXT: 5. 1 2.0 0.0 4.0 add x0, x27, #1 1523# CHECK-NEXT: 6. 1 2.0 1.0 0.0 ld1 { v1.8h, v2.8h, v3.8h }, [x27], #48 1524# CHECK-NEXT: 7. 1 2.0 0.0 5.0 add x0, x27, #1 1525# CHECK-NEXT: 8. 1 3.0 2.0 0.0 ld1 { v1.16b, v2.16b, v3.16b }, [x27], #48 1526# CHECK-NEXT: 9. 1 3.0 0.0 5.0 add x0, x27, #1 1527# CHECK-NEXT: 1 1.8 0.7 2.3 <total> 1528 1529# CHECK: [8] Code Region - G09 1530 1531# CHECK: Iterations: 100 1532# CHECK-NEXT: Instructions: 1000 1533# CHECK-NEXT: Total Cycles: 1207 1534# CHECK-NEXT: Total uOps: 2200 1535 1536# CHECK: Dispatch Width: 3 1537# CHECK-NEXT: uOps Per Cycle: 1.82 1538# CHECK-NEXT: IPC: 0.83 1539# CHECK-NEXT: Block RThroughput: 12.0 1540 1541# CHECK: Timeline view: 1542# CHECK-NEXT: 012345678 1543# CHECK-NEXT: Index 0123456789 1544 1545# CHECK: [0,0] DeeeeeeER . . . ld1 { v1.1d, v2.1d, v3.1d }, [x27], x28 1546# CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1 1547# CHECK-NEXT: [0,2] . DeeeeeeeER . . ld1 { v1.2d, v2.2d, v3.2d }, [x27], x28 1548# CHECK-NEXT: [0,3] . DeE-----R . . add x0, x27, #1 1549# CHECK-NEXT: [0,4] . D=eeeeeeER . . ld1 { v1.2s, v2.2s, v3.2s }, [x27], x28 1550# CHECK-NEXT: [0,5] . D=eE----R . . add x0, x27, #1 1551# CHECK-NEXT: [0,6] . .D=eeeeeeER . ld1 { v1.4h, v2.4h, v3.4h }, [x27], x28 1552# CHECK-NEXT: [0,7] . . D=eE----R . add x0, x27, #1 1553# CHECK-NEXT: [0,8] . . D=eeeeeeeER ld1 { v1.4s, v2.4s, v3.4s }, [x27], x28 1554# CHECK-NEXT: [0,9] . . D=eE-----R add x0, x27, #1 1555 1556# CHECK: Average Wait times (based on the timeline view): 1557# CHECK-NEXT: [0]: Executions 1558# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1559# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1560# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1561 1562# CHECK: [0] [1] [2] [3] 1563# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.1d, v2.1d, v3.1d }, [x27], x28 1564# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 1565# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.2d, v2.2d, v3.2d }, [x27], x28 1566# CHECK-NEXT: 3. 1 1.0 0.0 5.0 add x0, x27, #1 1567# CHECK-NEXT: 4. 1 2.0 2.0 0.0 ld1 { v1.2s, v2.2s, v3.2s }, [x27], x28 1568# CHECK-NEXT: 5. 1 2.0 0.0 4.0 add x0, x27, #1 1569# CHECK-NEXT: 6. 1 2.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h }, [x27], x28 1570# CHECK-NEXT: 7. 1 2.0 0.0 4.0 add x0, x27, #1 1571# CHECK-NEXT: 8. 1 2.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s }, [x27], x28 1572# CHECK-NEXT: 9. 1 2.0 0.0 5.0 add x0, x27, #1 1573# CHECK-NEXT: 1 1.6 0.6 2.2 <total> 1574 1575# CHECK: [9] Code Region - G10 1576 1577# CHECK: Iterations: 100 1578# CHECK-NEXT: Instructions: 1000 1579# CHECK-NEXT: Total Cycles: 1407 1580# CHECK-NEXT: Total uOps: 2400 1581 1582# CHECK: Dispatch Width: 3 1583# CHECK-NEXT: uOps Per Cycle: 1.71 1584# CHECK-NEXT: IPC: 0.71 1585# CHECK-NEXT: Block RThroughput: 14.0 1586 1587# CHECK: Timeline view: 1588# CHECK-NEXT: 0123456789 1589# CHECK-NEXT: Index 0123456789 0 1590 1591# CHECK: [0,0] DeeeeeeER . . . ld1 { v1.8b, v2.8b, v3.8b }, [x27], x28 1592# CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1 1593# CHECK-NEXT: [0,2] . DeeeeeeeER . . ld1 { v1.8h, v2.8h, v3.8h }, [x27], x28 1594# CHECK-NEXT: [0,3] . DeE-----R . . add x0, x27, #1 1595# CHECK-NEXT: [0,4] . D=eeeeeeeER. . ld1 { v1.16b, v2.16b, v3.16b }, [x27], x28 1596# CHECK-NEXT: [0,5] . D=eE-----R. . add x0, x27, #1 1597# CHECK-NEXT: [0,6] . .D==eeeeeeER . ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 1598# CHECK-NEXT: [0,7] . . D==eE----R . add x0, x27, #1 1599# CHECK-NEXT: [0,8] . . D==eeeeeeeeER ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 1600# CHECK-NEXT: [0,9] . . D==eE------R add x0, x27, #1 1601 1602# CHECK: Average Wait times (based on the timeline view): 1603# CHECK-NEXT: [0]: Executions 1604# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1605# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1606# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1607 1608# CHECK: [0] [1] [2] [3] 1609# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.8b, v2.8b, v3.8b }, [x27], x28 1610# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 1611# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.8h, v2.8h, v3.8h }, [x27], x28 1612# CHECK-NEXT: 3. 1 1.0 0.0 5.0 add x0, x27, #1 1613# CHECK-NEXT: 4. 1 2.0 2.0 0.0 ld1 { v1.16b, v2.16b, v3.16b }, [x27], x28 1614# CHECK-NEXT: 5. 1 2.0 0.0 5.0 add x0, x27, #1 1615# CHECK-NEXT: 6. 1 3.0 2.0 0.0 ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 1616# CHECK-NEXT: 7. 1 3.0 0.0 4.0 add x0, x27, #1 1617# CHECK-NEXT: 8. 1 3.0 1.0 0.0 ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 1618# CHECK-NEXT: 9. 1 3.0 0.0 6.0 add x0, x27, #1 1619# CHECK-NEXT: 1 2.0 0.7 2.4 <total> 1620 1621# CHECK: [10] Code Region - G11 1622 1623# CHECK: Iterations: 100 1624# CHECK-NEXT: Instructions: 1000 1625# CHECK-NEXT: Total Cycles: 1407 1626# CHECK-NEXT: Total uOps: 2400 1627 1628# CHECK: Dispatch Width: 3 1629# CHECK-NEXT: uOps Per Cycle: 1.71 1630# CHECK-NEXT: IPC: 0.71 1631# CHECK-NEXT: Block RThroughput: 14.0 1632 1633# CHECK: Timeline view: 1634# CHECK-NEXT: 0123456789 1635# CHECK-NEXT: Index 0123456789 0 1636 1637# CHECK: [0,0] DeeeeeeER . . . ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 1638# CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1 1639# CHECK-NEXT: [0,2] . DeeeeeeER . . ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 1640# CHECK-NEXT: [0,3] . DeE----R . . add x0, x27, #1 1641# CHECK-NEXT: [0,4] . DeeeeeeeeER. . ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 1642# CHECK-NEXT: [0,5] . DeE------R. . add x0, x27, #1 1643# CHECK-NEXT: [0,6] . .D==eeeeeeER . ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 1644# CHECK-NEXT: [0,7] . . D==eE----R . add x0, x27, #1 1645# CHECK-NEXT: [0,8] . . D==eeeeeeeeER ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 1646# CHECK-NEXT: [0,9] . . D==eE------R add x0, x27, #1 1647 1648# CHECK: Average Wait times (based on the timeline view): 1649# CHECK-NEXT: [0]: Executions 1650# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1651# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1652# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1653 1654# CHECK: [0] [1] [2] [3] 1655# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 1656# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 1657# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 1658# CHECK-NEXT: 3. 1 1.0 0.0 4.0 add x0, x27, #1 1659# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 1660# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 1661# CHECK-NEXT: 6. 1 3.0 3.0 0.0 ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 1662# CHECK-NEXT: 7. 1 3.0 0.0 4.0 add x0, x27, #1 1663# CHECK-NEXT: 8. 1 3.0 1.0 0.0 ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 1664# CHECK-NEXT: 9. 1 3.0 0.0 6.0 add x0, x27, #1 1665# CHECK-NEXT: 1 1.8 0.7 2.4 <total> 1666 1667# CHECK: [11] Code Region - G12 1668 1669# CHECK: Iterations: 100 1670# CHECK-NEXT: Instructions: 1000 1671# CHECK-NEXT: Total Cycles: 1407 1672# CHECK-NEXT: Total uOps: 2400 1673 1674# CHECK: Dispatch Width: 3 1675# CHECK-NEXT: uOps Per Cycle: 1.71 1676# CHECK-NEXT: IPC: 0.71 1677# CHECK-NEXT: Block RThroughput: 14.0 1678 1679# CHECK: Timeline view: 1680# CHECK-NEXT: 0123456789 1681# CHECK-NEXT: Index 0123456789 0 1682 1683# CHECK: [0,0] DeeeeeeeeER . . ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 1684# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 1685# CHECK-NEXT: [0,2] . D==eeeeeeER . . ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 1686# CHECK-NEXT: [0,3] . D==eE----R . . add x0, x27, #1 1687# CHECK-NEXT: [0,4] . D==eeeeeeeeER . ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 1688# CHECK-NEXT: [0,5] . D==eE------R . add x0, x27, #1 1689# CHECK-NEXT: [0,6] . .D====eeeeeeER . ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 1690# CHECK-NEXT: [0,7] . . D====eE----R . add x0, x27, #1 1691# CHECK-NEXT: [0,8] . . D====eeeeeeER ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 1692# CHECK-NEXT: [0,9] . . D====eE----R add x0, x27, #1 1693 1694# CHECK: Average Wait times (based on the timeline view): 1695# CHECK-NEXT: [0]: Executions 1696# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1697# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1698# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1699 1700# CHECK: [0] [1] [2] [3] 1701# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 1702# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 1703# CHECK-NEXT: 2. 1 3.0 3.0 0.0 ld1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 1704# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1705# CHECK-NEXT: 4. 1 3.0 1.0 0.0 ld1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 1706# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 1707# CHECK-NEXT: 6. 1 5.0 3.0 0.0 ld1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 1708# CHECK-NEXT: 7. 1 5.0 0.0 4.0 add x0, x27, #1 1709# CHECK-NEXT: 8. 1 5.0 1.0 0.0 ld1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 1710# CHECK-NEXT: 9. 1 5.0 0.0 4.0 add x0, x27, #1 1711# CHECK-NEXT: 1 3.4 0.9 2.4 <total> 1712 1713# CHECK: [12] Code Region - G13 1714 1715# CHECK: Iterations: 100 1716# CHECK-NEXT: Instructions: 1000 1717# CHECK-NEXT: Total Cycles: 1910 1718# CHECK-NEXT: Total uOps: 2600 1719 1720# CHECK: Dispatch Width: 3 1721# CHECK-NEXT: uOps Per Cycle: 1.36 1722# CHECK-NEXT: IPC: 0.52 1723# CHECK-NEXT: Block RThroughput: 15.0 1724 1725# CHECK: Timeline view: 1726# CHECK-NEXT: 0123456789 1727# CHECK-NEXT: Index 0123456789 012345678 1728 1729# CHECK: [0,0] DeeeeeeeeER . . . . ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 1730# CHECK-NEXT: [0,1] .DeE------R . . . . add x0, x27, #1 1731# CHECK-NEXT: [0,2] . D==eeeeeeER . . . . ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 1732# CHECK-NEXT: [0,3] . D==eE----R . . . . add x0, x27, #1 1733# CHECK-NEXT: [0,4] . D==eeeeeeeeER . . . ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 1734# CHECK-NEXT: [0,5] . D==eE------R . . . add x0, x27, #1 1735# CHECK-NEXT: [0,6] . .D====eeeeeeeeER . . ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 1736# CHECK-NEXT: [0,7] . . D====eE------R . . add x0, x27, #1 1737# CHECK-NEXT: [0,8] . . D==========eeeeeeeeER ld1 { v1.b }[0], [x27], #1 1738# CHECK-NEXT: [0,9] . . D==========eE------R add x0, x27, #1 1739 1740# CHECK: Average Wait times (based on the timeline view): 1741# CHECK-NEXT: [0]: Executions 1742# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1743# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1744# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1745 1746# CHECK: [0] [1] [2] [3] 1747# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 1748# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 1749# CHECK-NEXT: 2. 1 3.0 3.0 0.0 ld1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 1750# CHECK-NEXT: 3. 1 3.0 0.0 4.0 add x0, x27, #1 1751# CHECK-NEXT: 4. 1 3.0 1.0 0.0 ld1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 1752# CHECK-NEXT: 5. 1 3.0 0.0 6.0 add x0, x27, #1 1753# CHECK-NEXT: 6. 1 5.0 3.0 0.0 ld1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 1754# CHECK-NEXT: 7. 1 5.0 0.0 6.0 add x0, x27, #1 1755# CHECK-NEXT: 8. 1 11.0 0.0 0.0 ld1 { v1.b }[0], [x27], #1 1756# CHECK-NEXT: 9. 1 11.0 0.0 6.0 add x0, x27, #1 1757# CHECK-NEXT: 1 4.6 0.8 2.8 <total> 1758 1759# CHECK: [13] Code Region - G14 1760 1761# CHECK: Iterations: 100 1762# CHECK-NEXT: Instructions: 1000 1763# CHECK-NEXT: Total Cycles: 4003 1764# CHECK-NEXT: Total uOps: 2000 1765 1766# CHECK: Dispatch Width: 3 1767# CHECK-NEXT: uOps Per Cycle: 0.50 1768# CHECK-NEXT: IPC: 0.25 1769# CHECK-NEXT: Block RThroughput: 6.7 1770 1771# CHECK: Timeline view: 1772# CHECK-NEXT: 0123456789 0123456789 1773# CHECK-NEXT: Index 0123456789 0123456789 012 1774 1775# CHECK: [0,0] DeeeeeeeeER . . . . . . . ld1 { v1.b }[8], [x27], #1 1776# CHECK-NEXT: [0,1] .DeE------R . . . . . . . add x0, x27, #1 1777# CHECK-NEXT: [0,2] . D======eeeeeeeeER . . . . . . ld1 { v1.b }[0], [x27], x28 1778# CHECK-NEXT: [0,3] . D======eE------R . . . . . . add x0, x27, #1 1779# CHECK-NEXT: [0,4] . D============eeeeeeeeER . . . . ld1 { v1.b }[8], [x27], x28 1780# CHECK-NEXT: [0,5] . D============eE------R . . . . add x0, x27, #1 1781# CHECK-NEXT: [0,6] . .D==================eeeeeeeeER. . . ld1 { v1.h }[0], [x27], #2 1782# CHECK-NEXT: [0,7] . . D==================eE------R. . . add x0, x27, #1 1783# CHECK-NEXT: [0,8] . . D========================eeeeeeeeER ld1 { v1.h }[4], [x27], #2 1784# CHECK-NEXT: [0,9] . . D========================eE------R add x0, x27, #1 1785 1786# CHECK: Average Wait times (based on the timeline view): 1787# CHECK-NEXT: [0]: Executions 1788# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1789# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1790# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1791 1792# CHECK: [0] [1] [2] [3] 1793# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.b }[8], [x27], #1 1794# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 1795# CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld1 { v1.b }[0], [x27], x28 1796# CHECK-NEXT: 3. 1 7.0 0.0 6.0 add x0, x27, #1 1797# CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld1 { v1.b }[8], [x27], x28 1798# CHECK-NEXT: 5. 1 13.0 0.0 6.0 add x0, x27, #1 1799# CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld1 { v1.h }[0], [x27], #2 1800# CHECK-NEXT: 7. 1 19.0 0.0 6.0 add x0, x27, #1 1801# CHECK-NEXT: 8. 1 25.0 0.0 0.0 ld1 { v1.h }[4], [x27], #2 1802# CHECK-NEXT: 9. 1 25.0 0.0 6.0 add x0, x27, #1 1803# CHECK-NEXT: 1 13.0 0.1 3.0 <total> 1804 1805# CHECK: [14] Code Region - G15 1806 1807# CHECK: Iterations: 100 1808# CHECK-NEXT: Instructions: 1000 1809# CHECK-NEXT: Total Cycles: 3703 1810# CHECK-NEXT: Total uOps: 1900 1811 1812# CHECK: Dispatch Width: 3 1813# CHECK-NEXT: uOps Per Cycle: 0.51 1814# CHECK-NEXT: IPC: 0.27 1815# CHECK-NEXT: Block RThroughput: 6.3 1816 1817# CHECK: Timeline view: 1818# CHECK-NEXT: 0123456789 0123456789 1819# CHECK-NEXT: Index 0123456789 0123456789 1820 1821# CHECK: [0,0] DeeeeeeeeER . . . . . . ld1 { v1.h }[0], [x27], x28 1822# CHECK-NEXT: [0,1] .DeE------R . . . . . . add x0, x27, #1 1823# CHECK-NEXT: [0,2] . D======eeeeeeeeER . . . . . ld1 { v1.h }[4], [x27], x28 1824# CHECK-NEXT: [0,3] . D======eE------R . . . . . add x0, x27, #1 1825# CHECK-NEXT: [0,4] . D============eeeeeeeeER . . . ld1 { v1.s }[0], [x27], #4 1826# CHECK-NEXT: [0,5] . D============eE------R . . . add x0, x27, #1 1827# CHECK-NEXT: [0,6] . .D==================eeeeeeeeER. . ld1 { v1.s }[0], [x27], x28 1828# CHECK-NEXT: [0,7] . . D==================eE------R. . add x0, x27, #1 1829# CHECK-NEXT: [0,8] . . D=========================eeeeeER ld1 { v1.d }[0], [x27], #8 1830# CHECK-NEXT: [0,9] . . D=========================eE---R add x0, x27, #1 1831 1832# CHECK: Average Wait times (based on the timeline view): 1833# CHECK-NEXT: [0]: Executions 1834# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1835# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1836# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1837 1838# CHECK: [0] [1] [2] [3] 1839# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.h }[0], [x27], x28 1840# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 1841# CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld1 { v1.h }[4], [x27], x28 1842# CHECK-NEXT: 3. 1 7.0 0.0 6.0 add x0, x27, #1 1843# CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld1 { v1.s }[0], [x27], #4 1844# CHECK-NEXT: 5. 1 13.0 0.0 6.0 add x0, x27, #1 1845# CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld1 { v1.s }[0], [x27], x28 1846# CHECK-NEXT: 7. 1 19.0 0.0 6.0 add x0, x27, #1 1847# CHECK-NEXT: 8. 1 26.0 0.0 0.0 ld1 { v1.d }[0], [x27], #8 1848# CHECK-NEXT: 9. 1 26.0 0.0 3.0 add x0, x27, #1 1849# CHECK-NEXT: 1 13.2 0.1 2.7 <total> 1850 1851# CHECK: [15] Code Region - G16 1852 1853# CHECK: Iterations: 100 1854# CHECK-NEXT: Instructions: 1000 1855# CHECK-NEXT: Total Cycles: 1205 1856# CHECK-NEXT: Total uOps: 1800 1857 1858# CHECK: Dispatch Width: 3 1859# CHECK-NEXT: uOps Per Cycle: 1.49 1860# CHECK-NEXT: IPC: 0.83 1861# CHECK-NEXT: Block RThroughput: 6.0 1862 1863# CHECK: Timeline view: 1864# CHECK-NEXT: 0123456 1865# CHECK-NEXT: Index 0123456789 1866 1867# CHECK: [0,0] DeeeeeER . .. ld1 { v1.d }[0], [x27], x28 1868# CHECK-NEXT: [0,1] D=eE---R . .. add x0, x27, #1 1869# CHECK-NEXT: [0,2] .DeeeeeER . .. ld1r { v1.1d }, [x27], #8 1870# CHECK-NEXT: [0,3] .D=eE---R . .. add x0, x27, #1 1871# CHECK-NEXT: [0,4] . DeeeeeeeeER .. ld1r { v1.2d }, [x27], #8 1872# CHECK-NEXT: [0,5] . DeE------R .. add x0, x27, #1 1873# CHECK-NEXT: [0,6] . DeeeeeeeeER.. ld1r { v1.2s }, [x27], #4 1874# CHECK-NEXT: [0,7] . DeE------R.. add x0, x27, #1 1875# CHECK-NEXT: [0,8] . .DeeeeeeeeER ld1r { v1.4h }, [x27], #2 1876# CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1 1877 1878# CHECK: Average Wait times (based on the timeline view): 1879# CHECK-NEXT: [0]: Executions 1880# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1881# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1882# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1883 1884# CHECK: [0] [1] [2] [3] 1885# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1 { v1.d }[0], [x27], x28 1886# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 1887# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ld1r { v1.1d }, [x27], #8 1888# CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1 1889# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld1r { v1.2d }, [x27], #8 1890# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 1891# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1r { v1.2s }, [x27], #4 1892# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 1893# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld1r { v1.4h }, [x27], #2 1894# CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1 1895# CHECK-NEXT: 1 1.2 0.3 2.4 <total> 1896 1897# CHECK: [16] Code Region - G17 1898 1899# CHECK: Iterations: 100 1900# CHECK-NEXT: Instructions: 1000 1901# CHECK-NEXT: Total Cycles: 908 1902# CHECK-NEXT: Total uOps: 1900 1903 1904# CHECK: Dispatch Width: 3 1905# CHECK-NEXT: uOps Per Cycle: 2.09 1906# CHECK-NEXT: IPC: 1.10 1907# CHECK-NEXT: Block RThroughput: 6.3 1908 1909# CHECK: Timeline view: 1910# CHECK-NEXT: 0123456 1911# CHECK-NEXT: Index 0123456789 1912 1913# CHECK: [0,0] DeeeeeeeeER .. ld1r { v1.4s }, [x27], #4 1914# CHECK-NEXT: [0,1] .DeE------R .. add x0, x27, #1 1915# CHECK-NEXT: [0,2] . DeeeeeeeeER .. ld1r { v1.8b }, [x27], #1 1916# CHECK-NEXT: [0,3] . DeE------R .. add x0, x27, #1 1917# CHECK-NEXT: [0,4] . DeeeeeeeeER.. ld1r { v1.8h }, [x27], #2 1918# CHECK-NEXT: [0,5] . DeE------R.. add x0, x27, #1 1919# CHECK-NEXT: [0,6] . .DeeeeeeeeER ld1r { v1.16b }, [x27], #1 1920# CHECK-NEXT: [0,7] . . DeE------R add x0, x27, #1 1921# CHECK-NEXT: [0,8] . . DeeeeeE--R ld1r { v1.1d }, [x27], x28 1922# CHECK-NEXT: [0,9] . . DeE-----R add x0, x27, #1 1923 1924# CHECK: Average Wait times (based on the timeline view): 1925# CHECK-NEXT: [0]: Executions 1926# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1927# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1928# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1929 1930# CHECK: [0] [1] [2] [3] 1931# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.4s }, [x27], #4 1932# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 1933# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1r { v1.8b }, [x27], #1 1934# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 1935# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld1r { v1.8h }, [x27], #2 1936# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 1937# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1r { v1.16b }, [x27], #1 1938# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 1939# CHECK-NEXT: 8. 1 1.0 0.0 2.0 ld1r { v1.1d }, [x27], x28 1940# CHECK-NEXT: 9. 1 1.0 0.0 5.0 add x0, x27, #1 1941# CHECK-NEXT: 1 1.0 0.4 3.1 <total> 1942 1943# CHECK: [17] Code Region - G18 1944 1945# CHECK: Iterations: 100 1946# CHECK-NEXT: Instructions: 1000 1947# CHECK-NEXT: Total Cycles: 1009 1948# CHECK-NEXT: Total uOps: 2000 1949 1950# CHECK: Dispatch Width: 3 1951# CHECK-NEXT: uOps Per Cycle: 1.98 1952# CHECK-NEXT: IPC: 0.99 1953# CHECK-NEXT: Block RThroughput: 6.7 1954 1955# CHECK: Timeline view: 1956# CHECK-NEXT: 012345678 1957# CHECK-NEXT: Index 0123456789 1958 1959# CHECK: [0,0] DeeeeeeeeER . . ld1r { v1.2d }, [x27], x28 1960# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 1961# CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld1r { v1.2s }, [x27], x28 1962# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 1963# CHECK-NEXT: [0,4] . DeeeeeeeeER. . ld1r { v1.4h }, [x27], x28 1964# CHECK-NEXT: [0,5] . DeE------R. . add x0, x27, #1 1965# CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld1r { v1.4s }, [x27], x28 1966# CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1 1967# CHECK-NEXT: [0,8] . . DeeeeeeeeER ld1r { v1.8b }, [x27], x28 1968# CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1 1969 1970# CHECK: Average Wait times (based on the timeline view): 1971# CHECK-NEXT: [0]: Executions 1972# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 1973# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 1974# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 1975 1976# CHECK: [0] [1] [2] [3] 1977# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.2d }, [x27], x28 1978# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 1979# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1r { v1.2s }, [x27], x28 1980# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 1981# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld1r { v1.4h }, [x27], x28 1982# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 1983# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld1r { v1.4s }, [x27], x28 1984# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 1985# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld1r { v1.8b }, [x27], x28 1986# CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1 1987# CHECK-NEXT: 1 1.0 0.5 3.0 <total> 1988 1989# CHECK: [18] Code Region - G19 1990 1991# CHECK: Iterations: 100 1992# CHECK-NEXT: Instructions: 1000 1993# CHECK-NEXT: Total Cycles: 1009 1994# CHECK-NEXT: Total uOps: 2000 1995 1996# CHECK: Dispatch Width: 3 1997# CHECK-NEXT: uOps Per Cycle: 1.98 1998# CHECK-NEXT: IPC: 0.99 1999# CHECK-NEXT: Block RThroughput: 6.7 2000 2001# CHECK: Timeline view: 2002# CHECK-NEXT: 012345678 2003# CHECK-NEXT: Index 0123456789 2004 2005# CHECK: [0,0] DeeeeeeeeER . . ld1r { v1.8h }, [x27], x28 2006# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 2007# CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld1r { v1.16b }, [x27], x28 2008# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 2009# CHECK-NEXT: [0,4] . DeeeeeeER . . ld2 { v1.2d, v2.2d }, [x27], #32 2010# CHECK-NEXT: [0,5] . DeE----R . . add x0, x27, #1 2011# CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld2 { v1.2s, v2.2s }, [x27], #16 2012# CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1 2013# CHECK-NEXT: [0,8] . . DeeeeeeeeER ld2 { v1.4h, v2.4h }, [x27], #16 2014# CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1 2015 2016# CHECK: Average Wait times (based on the timeline view): 2017# CHECK-NEXT: [0]: Executions 2018# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2019# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2020# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2021 2022# CHECK: [0] [1] [2] [3] 2023# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld1r { v1.8h }, [x27], x28 2024# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 2025# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld1r { v1.16b }, [x27], x28 2026# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 2027# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2 { v1.2d, v2.2d }, [x27], #32 2028# CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1 2029# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2 { v1.2s, v2.2s }, [x27], #16 2030# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 2031# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld2 { v1.4h, v2.4h }, [x27], #16 2032# CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1 2033# CHECK-NEXT: 1 1.0 0.5 2.8 <total> 2034 2035# CHECK: [19] Code Region - G20 2036 2037# CHECK: Iterations: 100 2038# CHECK-NEXT: Instructions: 1000 2039# CHECK-NEXT: Total Cycles: 1008 2040# CHECK-NEXT: Total uOps: 2600 2041 2042# CHECK: Dispatch Width: 3 2043# CHECK-NEXT: uOps Per Cycle: 2.58 2044# CHECK-NEXT: IPC: 0.99 2045# CHECK-NEXT: Block RThroughput: 9.0 2046 2047# CHECK: Timeline view: 2048# CHECK-NEXT: 01234567 2049# CHECK-NEXT: Index 0123456789 2050 2051# CHECK: [0,0] DeeeeeeeeeER . . ld2 { v1.4s, v2.4s }, [x27], #32 2052# CHECK-NEXT: [0,1] .DeE-------R . . add x0, x27, #1 2053# CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld2 { v1.8b, v2.8b }, [x27], #16 2054# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 2055# CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld2 { v1.8h, v2.8h }, [x27], #32 2056# CHECK-NEXT: [0,5] . DeE-------R . add x0, x27, #1 2057# CHECK-NEXT: [0,6] . .DeeeeeeeeeER ld2 { v1.16b, v2.16b }, [x27], #32 2058# CHECK-NEXT: [0,7] . . DeE-------R add x0, x27, #1 2059# CHECK-NEXT: [0,8] . . DeeeeeeE-R ld2 { v1.2d, v2.2d }, [x27], x28 2060# CHECK-NEXT: [0,9] . . DeE-----R add x0, x27, #1 2061 2062# CHECK: Average Wait times (based on the timeline view): 2063# CHECK-NEXT: [0]: Executions 2064# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2065# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2066# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2067 2068# CHECK: [0] [1] [2] [3] 2069# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.4s, v2.4s }, [x27], #32 2070# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2071# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld2 { v1.8b, v2.8b }, [x27], #16 2072# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 2073# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2 { v1.8h, v2.8h }, [x27], #32 2074# CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1 2075# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2 { v1.16b, v2.16b }, [x27], #32 2076# CHECK-NEXT: 7. 1 1.0 0.0 7.0 add x0, x27, #1 2077# CHECK-NEXT: 8. 1 1.0 1.0 1.0 ld2 { v1.2d, v2.2d }, [x27], x28 2078# CHECK-NEXT: 9. 1 1.0 0.0 5.0 add x0, x27, #1 2079# CHECK-NEXT: 1 1.0 0.5 3.3 <total> 2080 2081# CHECK: [20] Code Region - G21 2082 2083# CHECK: Iterations: 100 2084# CHECK-NEXT: Instructions: 1000 2085# CHECK-NEXT: Total Cycles: 1010 2086# CHECK-NEXT: Total uOps: 2400 2087 2088# CHECK: Dispatch Width: 3 2089# CHECK-NEXT: uOps Per Cycle: 2.38 2090# CHECK-NEXT: IPC: 0.99 2091# CHECK-NEXT: Block RThroughput: 8.0 2092 2093# CHECK: Timeline view: 2094# CHECK-NEXT: 0123456789 2095# CHECK-NEXT: Index 0123456789 2096 2097# CHECK: [0,0] DeeeeeeeeER . . ld2 { v1.2s, v2.2s }, [x27], x28 2098# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 2099# CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld2 { v1.4h, v2.4h }, [x27], x28 2100# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 2101# CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld2 { v1.4s, v2.4s }, [x27], x28 2102# CHECK-NEXT: [0,5] . DeE-------R . add x0, x27, #1 2103# CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld2 { v1.8b, v2.8b }, [x27], x28 2104# CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1 2105# CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld2 { v1.8h, v2.8h }, [x27], x28 2106# CHECK-NEXT: [0,9] . . DeE-------R add x0, x27, #1 2107 2108# CHECK: Average Wait times (based on the timeline view): 2109# CHECK-NEXT: [0]: Executions 2110# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2111# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2112# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2113 2114# CHECK: [0] [1] [2] [3] 2115# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.2s, v2.2s }, [x27], x28 2116# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 2117# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld2 { v1.4h, v2.4h }, [x27], x28 2118# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 2119# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2 { v1.4s, v2.4s }, [x27], x28 2120# CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1 2121# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2 { v1.8b, v2.8b }, [x27], x28 2122# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 2123# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld2 { v1.8h, v2.8h }, [x27], x28 2124# CHECK-NEXT: 9. 1 1.0 0.0 7.0 add x0, x27, #1 2125# CHECK-NEXT: 1 1.0 0.5 3.2 <total> 2126 2127# CHECK: [21] Code Region - G22 2128 2129# CHECK: Iterations: 100 2130# CHECK-NEXT: Instructions: 1000 2131# CHECK-NEXT: Total Cycles: 3410 2132# CHECK-NEXT: Total uOps: 2600 2133 2134# CHECK: Dispatch Width: 3 2135# CHECK-NEXT: uOps Per Cycle: 0.76 2136# CHECK-NEXT: IPC: 0.29 2137# CHECK-NEXT: Block RThroughput: 8.7 2138 2139# CHECK: Timeline view: 2140# CHECK-NEXT: 0123456789 0123456789 2141# CHECK-NEXT: Index 0123456789 0123456789 0123 2142 2143# CHECK: [0,0] DeeeeeeeeeER . . . . . . . ld2 { v1.16b, v2.16b }, [x27], x28 2144# CHECK-NEXT: [0,1] .DeE-------R . . . . . . . add x0, x27, #1 2145# CHECK-NEXT: [0,2] . D=======eeeeeeeeER. . . . . . ld2 { v1.b, v2.b }[0], [x27], #2 2146# CHECK-NEXT: [0,3] . D=======eE------R. . . . . . add x0, x27, #1 2147# CHECK-NEXT: [0,4] . D=============eeeeeeeeER . . . . ld2 { v1.b, v2.b }[8], [x27], #2 2148# CHECK-NEXT: [0,5] . D=============eE------R . . . . add x0, x27, #1 2149# CHECK-NEXT: [0,6] . .D===================eeeeeeeeER . . ld2 { v1.b, v2.b }[0], [x27], x28 2150# CHECK-NEXT: [0,7] . . D===================eE------R . . add x0, x27, #1 2151# CHECK-NEXT: [0,8] . . D=========================eeeeeeeeER ld2 { v1.b, v2.b }[8], [x27], x28 2152# CHECK-NEXT: [0,9] . . D=========================eE------R add x0, x27, #1 2153 2154# CHECK: Average Wait times (based on the timeline view): 2155# CHECK-NEXT: [0]: Executions 2156# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2157# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2158# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2159 2160# CHECK: [0] [1] [2] [3] 2161# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.16b, v2.16b }, [x27], x28 2162# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2163# CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld2 { v1.b, v2.b }[0], [x27], #2 2164# CHECK-NEXT: 3. 1 8.0 0.0 6.0 add x0, x27, #1 2165# CHECK-NEXT: 4. 1 14.0 0.0 0.0 ld2 { v1.b, v2.b }[8], [x27], #2 2166# CHECK-NEXT: 5. 1 14.0 0.0 6.0 add x0, x27, #1 2167# CHECK-NEXT: 6. 1 20.0 0.0 0.0 ld2 { v1.b, v2.b }[0], [x27], x28 2168# CHECK-NEXT: 7. 1 20.0 0.0 6.0 add x0, x27, #1 2169# CHECK-NEXT: 8. 1 26.0 0.0 0.0 ld2 { v1.b, v2.b }[8], [x27], x28 2170# CHECK-NEXT: 9. 1 26.0 0.0 6.0 add x0, x27, #1 2171# CHECK-NEXT: 1 13.8 0.1 3.1 <total> 2172 2173# CHECK: [22] Code Region - G23 2174 2175# CHECK: Iterations: 100 2176# CHECK-NEXT: Instructions: 1000 2177# CHECK-NEXT: Total Cycles: 3803 2178# CHECK-NEXT: Total uOps: 2400 2179 2180# CHECK: Dispatch Width: 3 2181# CHECK-NEXT: uOps Per Cycle: 0.63 2182# CHECK-NEXT: IPC: 0.26 2183# CHECK-NEXT: Block RThroughput: 8.0 2184 2185# CHECK: Timeline view: 2186# CHECK-NEXT: 0123456789 0123456789 2187# CHECK-NEXT: Index 0123456789 0123456789 0 2188 2189# CHECK: [0,0] DeeeeeeeeER . . . . . . ld2 { v1.h, v2.h }[0], [x27], #4 2190# CHECK-NEXT: [0,1] .DeE------R . . . . . . add x0, x27, #1 2191# CHECK-NEXT: [0,2] . D======eeeeeeeeER . . . . . ld2 { v1.h, v2.h }[4], [x27], #4 2192# CHECK-NEXT: [0,3] . D======eE------R . . . . . add x0, x27, #1 2193# CHECK-NEXT: [0,4] . D============eeeeeeeeER . . . ld2 { v1.h, v2.h }[0], [x27], x28 2194# CHECK-NEXT: [0,5] . D============eE------R . . . add x0, x27, #1 2195# CHECK-NEXT: [0,6] . .D==================eeeeeeeeER. . ld2 { v1.h, v2.h }[4], [x27], x28 2196# CHECK-NEXT: [0,7] . . D==================eE------R. . add x0, x27, #1 2197# CHECK-NEXT: [0,8] . . D========================eeeeeeER ld2 { v1.s, v2.s }[0], [x27], #8 2198# CHECK-NEXT: [0,9] . . D========================eE----R add x0, x27, #1 2199 2200# CHECK: Average Wait times (based on the timeline view): 2201# CHECK-NEXT: [0]: Executions 2202# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2203# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2204# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2205 2206# CHECK: [0] [1] [2] [3] 2207# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.h, v2.h }[0], [x27], #4 2208# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 2209# CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld2 { v1.h, v2.h }[4], [x27], #4 2210# CHECK-NEXT: 3. 1 7.0 0.0 6.0 add x0, x27, #1 2211# CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld2 { v1.h, v2.h }[0], [x27], x28 2212# CHECK-NEXT: 5. 1 13.0 0.0 6.0 add x0, x27, #1 2213# CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld2 { v1.h, v2.h }[4], [x27], x28 2214# CHECK-NEXT: 7. 1 19.0 0.0 6.0 add x0, x27, #1 2215# CHECK-NEXT: 8. 1 25.0 0.0 0.0 ld2 { v1.s, v2.s }[0], [x27], #8 2216# CHECK-NEXT: 9. 1 25.0 0.0 4.0 add x0, x27, #1 2217# CHECK-NEXT: 1 13.0 0.1 2.8 <total> 2218 2219# CHECK: [23] Code Region - G24 2220 2221# CHECK: Iterations: 100 2222# CHECK-NEXT: Instructions: 1000 2223# CHECK-NEXT: Total Cycles: 2403 2224# CHECK-NEXT: Total uOps: 2000 2225 2226# CHECK: Dispatch Width: 3 2227# CHECK-NEXT: uOps Per Cycle: 0.83 2228# CHECK-NEXT: IPC: 0.42 2229# CHECK-NEXT: Block RThroughput: 6.7 2230 2231# CHECK: Timeline view: 2232# CHECK-NEXT: 0123456789 2233# CHECK-NEXT: Index 0123456789 0123456 2234 2235# CHECK: [0,0] DeeeeeeER . . . .. ld2 { v1.s, v2.s }[0], [x27], x28 2236# CHECK-NEXT: [0,1] .DeE----R . . . .. add x0, x27, #1 2237# CHECK-NEXT: [0,2] . D====eeeeeeeeER . .. ld2 { v1.d, v2.d }[0], [x27], #16 2238# CHECK-NEXT: [0,3] . D====eE------R . .. add x0, x27, #1 2239# CHECK-NEXT: [0,4] . D==========eeeeeeeeER.. ld2 { v1.d, v2.d }[0], [x27], x28 2240# CHECK-NEXT: [0,5] . D==========eE------R.. add x0, x27, #1 2241# CHECK-NEXT: [0,6] . D==========eeeeeE--R.. ld2r { v1.1d, v2.1d }, [x27], #16 2242# CHECK-NEXT: [0,7] . .D==========eE-----R.. add x0, x27, #1 2243# CHECK-NEXT: [0,8] . . D=========eeeeeeeeER ld2r { v1.2d, v2.2d }, [x27], #16 2244# CHECK-NEXT: [0,9] . . D=========eE------R add x0, x27, #1 2245 2246# CHECK: Average Wait times (based on the timeline view): 2247# CHECK-NEXT: [0]: Executions 2248# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2249# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2250# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2251 2252# CHECK: [0] [1] [2] [3] 2253# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2 { v1.s, v2.s }[0], [x27], x28 2254# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 2255# CHECK-NEXT: 2. 1 5.0 0.0 0.0 ld2 { v1.d, v2.d }[0], [x27], #16 2256# CHECK-NEXT: 3. 1 5.0 0.0 6.0 add x0, x27, #1 2257# CHECK-NEXT: 4. 1 11.0 0.0 0.0 ld2 { v1.d, v2.d }[0], [x27], x28 2258# CHECK-NEXT: 5. 1 11.0 0.0 6.0 add x0, x27, #1 2259# CHECK-NEXT: 6. 1 11.0 0.0 2.0 ld2r { v1.1d, v2.1d }, [x27], #16 2260# CHECK-NEXT: 7. 1 11.0 0.0 5.0 add x0, x27, #1 2261# CHECK-NEXT: 8. 1 10.0 0.0 0.0 ld2r { v1.2d, v2.2d }, [x27], #16 2262# CHECK-NEXT: 9. 1 10.0 0.0 6.0 add x0, x27, #1 2263# CHECK-NEXT: 1 7.6 0.1 2.9 <total> 2264 2265# CHECK: [24] Code Region - G25 2266 2267# CHECK: Iterations: 100 2268# CHECK-NEXT: Instructions: 1000 2269# CHECK-NEXT: Total Cycles: 1009 2270# CHECK-NEXT: Total uOps: 2200 2271 2272# CHECK: Dispatch Width: 3 2273# CHECK-NEXT: uOps Per Cycle: 2.18 2274# CHECK-NEXT: IPC: 0.99 2275# CHECK-NEXT: Block RThroughput: 7.3 2276 2277# CHECK: Timeline view: 2278# CHECK-NEXT: 012345678 2279# CHECK-NEXT: Index 0123456789 2280 2281# CHECK: [0,0] DeeeeeeeeER . . ld2r { v1.2s, v2.2s }, [x27], #8 2282# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 2283# CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld2r { v1.4h, v2.4h }, [x27], #4 2284# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 2285# CHECK-NEXT: [0,4] . DeeeeeeeeER. . ld2r { v1.4s, v2.4s }, [x27], #8 2286# CHECK-NEXT: [0,5] . DeE------R. . add x0, x27, #1 2287# CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld2r { v1.8b, v2.8b }, [x27], #2 2288# CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1 2289# CHECK-NEXT: [0,8] . . DeeeeeeeeER ld2r { v1.8h, v2.8h }, [x27], #4 2290# CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1 2291 2292# CHECK: Average Wait times (based on the timeline view): 2293# CHECK-NEXT: [0]: Executions 2294# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2295# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2296# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2297 2298# CHECK: [0] [1] [2] [3] 2299# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.2s, v2.2s }, [x27], #8 2300# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 2301# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld2r { v1.4h, v2.4h }, [x27], #4 2302# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 2303# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2r { v1.4s, v2.4s }, [x27], #8 2304# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 2305# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2r { v1.8b, v2.8b }, [x27], #2 2306# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 2307# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld2r { v1.8h, v2.8h }, [x27], #4 2308# CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1 2309# CHECK-NEXT: 1 1.0 0.5 3.0 <total> 2310 2311# CHECK: [25] Code Region - G26 2312 2313# CHECK: Iterations: 100 2314# CHECK-NEXT: Instructions: 1000 2315# CHECK-NEXT: Total Cycles: 909 2316# CHECK-NEXT: Total uOps: 2100 2317 2318# CHECK: Dispatch Width: 3 2319# CHECK-NEXT: uOps Per Cycle: 2.31 2320# CHECK-NEXT: IPC: 1.10 2321# CHECK-NEXT: Block RThroughput: 7.0 2322 2323# CHECK: Timeline view: 2324# CHECK-NEXT: 01234567 2325# CHECK-NEXT: Index 0123456789 2326 2327# CHECK: [0,0] DeeeeeeeeER . . ld2r { v1.16b, v2.16b }, [x27], #2 2328# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 2329# CHECK-NEXT: [0,2] . DeeeeeE-R . . ld2r { v1.1d, v2.1d }, [x27], x28 2330# CHECK-NEXT: [0,3] . D=eE----R . . add x0, x27, #1 2331# CHECK-NEXT: [0,4] . DeeeeeeeeER . . ld2r { v1.2d, v2.2d }, [x27], x28 2332# CHECK-NEXT: [0,5] . DeE------R . . add x0, x27, #1 2333# CHECK-NEXT: [0,6] . DeeeeeeeeER . ld2r { v1.2s, v2.2s }, [x27], x28 2334# CHECK-NEXT: [0,7] . .DeE------R . add x0, x27, #1 2335# CHECK-NEXT: [0,8] . . DeeeeeeeeER ld2r { v1.4h, v2.4h }, [x27], x28 2336# CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1 2337 2338# CHECK: Average Wait times (based on the timeline view): 2339# CHECK-NEXT: [0]: Executions 2340# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2341# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2342# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2343 2344# CHECK: [0] [1] [2] [3] 2345# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.16b, v2.16b }, [x27], #2 2346# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 2347# CHECK-NEXT: 2. 1 1.0 1.0 1.0 ld2r { v1.1d, v2.1d }, [x27], x28 2348# CHECK-NEXT: 3. 1 2.0 0.0 4.0 add x0, x27, #1 2349# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ld2r { v1.2d, v2.2d }, [x27], x28 2350# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 2351# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2r { v1.2s, v2.2s }, [x27], x28 2352# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 2353# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld2r { v1.4h, v2.4h }, [x27], x28 2354# CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1 2355# CHECK-NEXT: 1 1.1 0.4 2.9 <total> 2356 2357# CHECK: [26] Code Region - G27 2358 2359# CHECK: Iterations: 100 2360# CHECK-NEXT: Instructions: 1000 2361# CHECK-NEXT: Total Cycles: 1009 2362# CHECK-NEXT: Total uOps: 2500 2363 2364# CHECK: Dispatch Width: 3 2365# CHECK-NEXT: uOps Per Cycle: 2.48 2366# CHECK-NEXT: IPC: 0.99 2367# CHECK-NEXT: Block RThroughput: 8.3 2368 2369# CHECK: Timeline view: 2370# CHECK-NEXT: 012345678 2371# CHECK-NEXT: Index 0123456789 2372 2373# CHECK: [0,0] DeeeeeeeeER . . ld2r { v1.4s, v2.4s }, [x27], x28 2374# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 2375# CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld2r { v1.8b, v2.8b }, [x27], x28 2376# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 2377# CHECK-NEXT: [0,4] . DeeeeeeeeER. . ld2r { v1.8h, v2.8h }, [x27], x28 2378# CHECK-NEXT: [0,5] . DeE------R. . add x0, x27, #1 2379# CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld2r { v1.16b, v2.16b }, [x27], x28 2380# CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1 2381# CHECK-NEXT: [0,8] . . DeeeeeeeeER ld3 { v1.2d, v2.2d, v3.2d }, [x27], #48 2382# CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1 2383 2384# CHECK: Average Wait times (based on the timeline view): 2385# CHECK-NEXT: [0]: Executions 2386# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2387# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2388# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2389 2390# CHECK: [0] [1] [2] [3] 2391# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld2r { v1.4s, v2.4s }, [x27], x28 2392# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 2393# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld2r { v1.8b, v2.8b }, [x27], x28 2394# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 2395# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld2r { v1.8h, v2.8h }, [x27], x28 2396# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 2397# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld2r { v1.16b, v2.16b }, [x27], x28 2398# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 2399# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3 { v1.2d, v2.2d, v3.2d }, [x27], #48 2400# CHECK-NEXT: 9. 1 1.0 0.0 6.0 add x0, x27, #1 2401# CHECK-NEXT: 1 1.0 0.5 3.0 <total> 2402 2403# CHECK: [27] Code Region - G28 2404 2405# CHECK: Iterations: 100 2406# CHECK-NEXT: Instructions: 1000 2407# CHECK-NEXT: Total Cycles: 1210 2408# CHECK-NEXT: Total uOps: 3600 2409 2410# CHECK: Dispatch Width: 3 2411# CHECK-NEXT: uOps Per Cycle: 2.98 2412# CHECK-NEXT: IPC: 0.83 2413# CHECK-NEXT: Block RThroughput: 12.0 2414 2415# CHECK: Timeline view: 2416# CHECK-NEXT: 0123456789 2417# CHECK-NEXT: Index 0123456789 01 2418 2419# CHECK: [0,0] DeeeeeeeeeER . .. ld3 { v1.2s, v2.2s, v3.2s }, [x27], #24 2420# CHECK-NEXT: [0,1] .DeE-------R . .. add x0, x27, #1 2421# CHECK-NEXT: [0,2] . DeeeeeeeeeER . .. ld3 { v1.4h, v2.4h, v3.4h }, [x27], #24 2422# CHECK-NEXT: [0,3] . DeE-------R . .. add x0, x27, #1 2423# CHECK-NEXT: [0,4] . DeeeeeeeeeeER .. ld3 { v1.4s, v2.4s, v3.4s }, [x27], #48 2424# CHECK-NEXT: [0,5] . .DeE-------R .. add x0, x27, #1 2425# CHECK-NEXT: [0,6] . . DeeeeeeeeeER .. ld3 { v1.8b, v2.8b, v3.8b }, [x27], #24 2426# CHECK-NEXT: [0,7] . . DeE-------R .. add x0, x27, #1 2427# CHECK-NEXT: [0,8] . . DeeeeeeeeeeER ld3 { v1.8h, v2.8h, v3.8h }, [x27], #48 2428# CHECK-NEXT: [0,9] . . .DeE-------R add x0, x27, #1 2429 2430# CHECK: Average Wait times (based on the timeline view): 2431# CHECK-NEXT: [0]: Executions 2432# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2433# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2434# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2435 2436# CHECK: [0] [1] [2] [3] 2437# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.2s, v2.2s, v3.2s }, [x27], #24 2438# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2439# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3 { v1.4h, v2.4h, v3.4h }, [x27], #24 2440# CHECK-NEXT: 3. 1 1.0 0.0 7.0 add x0, x27, #1 2441# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3 { v1.4s, v2.4s, v3.4s }, [x27], #48 2442# CHECK-NEXT: 5. 1 1.0 1.0 7.0 add x0, x27, #1 2443# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld3 { v1.8b, v2.8b, v3.8b }, [x27], #24 2444# CHECK-NEXT: 7. 1 1.0 0.0 7.0 add x0, x27, #1 2445# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3 { v1.8h, v2.8h, v3.8h }, [x27], #48 2446# CHECK-NEXT: 9. 1 1.0 1.0 7.0 add x0, x27, #1 2447# CHECK-NEXT: 1 1.0 0.7 3.5 <total> 2448 2449# CHECK: [28] Code Region - G29 2450 2451# CHECK: Iterations: 100 2452# CHECK-NEXT: Instructions: 1000 2453# CHECK-NEXT: Total Cycles: 1410 2454# CHECK-NEXT: Total uOps: 3600 2455 2456# CHECK: Dispatch Width: 3 2457# CHECK-NEXT: uOps Per Cycle: 2.55 2458# CHECK-NEXT: IPC: 0.71 2459# CHECK-NEXT: Block RThroughput: 14.0 2460 2461# CHECK: Timeline view: 2462# CHECK-NEXT: 0123456789 2463# CHECK-NEXT: Index 0123456789 0123 2464 2465# CHECK: [0,0] DeeeeeeeeeeER . . . ld3 { v1.16b, v2.16b, v3.16b }, [x27], #48 2466# CHECK-NEXT: [0,1] . DeE-------R . . . add x0, x27, #1 2467# CHECK-NEXT: [0,2] . DeeeeeeeeER . . . ld3 { v1.2d, v2.2d, v3.2d }, [x27], x28 2468# CHECK-NEXT: [0,3] . DeE------R . . . add x0, x27, #1 2469# CHECK-NEXT: [0,4] . D==eeeeeeeeeER . . ld3 { v1.2s, v2.2s, v3.2s }, [x27], x28 2470# CHECK-NEXT: [0,5] . .D==eE-------R . . add x0, x27, #1 2471# CHECK-NEXT: [0,6] . . D==eeeeeeeeeER . ld3 { v1.4h, v2.4h, v3.4h }, [x27], x28 2472# CHECK-NEXT: [0,7] . . D==eE-------R . add x0, x27, #1 2473# CHECK-NEXT: [0,8] . . D==eeeeeeeeeeER ld3 { v1.4s, v2.4s, v3.4s }, [x27], x28 2474# CHECK-NEXT: [0,9] . . .D=eE--------R add x0, x27, #1 2475 2476# CHECK: Average Wait times (based on the timeline view): 2477# CHECK-NEXT: [0]: Executions 2478# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2479# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2480# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2481 2482# CHECK: [0] [1] [2] [3] 2483# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.16b, v2.16b, v3.16b }, [x27], #48 2484# CHECK-NEXT: 1. 1 1.0 1.0 7.0 add x0, x27, #1 2485# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3 { v1.2d, v2.2d, v3.2d }, [x27], x28 2486# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 2487# CHECK-NEXT: 4. 1 3.0 3.0 0.0 ld3 { v1.2s, v2.2s, v3.2s }, [x27], x28 2488# CHECK-NEXT: 5. 1 3.0 0.0 7.0 add x0, x27, #1 2489# CHECK-NEXT: 6. 1 3.0 1.0 0.0 ld3 { v1.4h, v2.4h, v3.4h }, [x27], x28 2490# CHECK-NEXT: 7. 1 3.0 0.0 7.0 add x0, x27, #1 2491# CHECK-NEXT: 8. 1 3.0 1.0 0.0 ld3 { v1.4s, v2.4s, v3.4s }, [x27], x28 2492# CHECK-NEXT: 9. 1 2.0 0.0 8.0 add x0, x27, #1 2493# CHECK-NEXT: 1 2.1 0.8 3.5 <total> 2494 2495# CHECK: [29] Code Region - G30 2496 2497# CHECK: Iterations: 100 2498# CHECK-NEXT: Instructions: 1000 2499# CHECK-NEXT: Total Cycles: 2511 2500# CHECK-NEXT: Total uOps: 3600 2501 2502# CHECK: Dispatch Width: 3 2503# CHECK-NEXT: uOps Per Cycle: 1.43 2504# CHECK-NEXT: IPC: 0.40 2505# CHECK-NEXT: Block RThroughput: 12.0 2506 2507# CHECK: Timeline view: 2508# CHECK-NEXT: 0123456789 012345 2509# CHECK-NEXT: Index 0123456789 0123456789 2510 2511# CHECK: [0,0] DeeeeeeeeeER . . . . . ld3 { v1.8b, v2.8b, v3.8b }, [x27], x28 2512# CHECK-NEXT: [0,1] .DeE-------R . . . . . add x0, x27, #1 2513# CHECK-NEXT: [0,2] . DeeeeeeeeeeER. . . . . ld3 { v1.8h, v2.8h, v3.8h }, [x27], x28 2514# CHECK-NEXT: [0,3] . DeE-------R. . . . . add x0, x27, #1 2515# CHECK-NEXT: [0,4] . DeeeeeeeeeeER . . . . ld3 { v1.16b, v2.16b, v3.16b }, [x27], x28 2516# CHECK-NEXT: [0,5] . . DeE-------R . . . . add x0, x27, #1 2517# CHECK-NEXT: [0,6] . . D=======eeeeeeeeeER . . ld3 { v1.b, v2.b, v3.b }[0], [x27], #3 2518# CHECK-NEXT: [0,7] . . D=======eE-------R . . add x0, x27, #1 2519# CHECK-NEXT: [0,8] . . D==============eeeeeeeeeER ld3 { v1.b, v2.b, v3.b }[8], [x27], #3 2520# CHECK-NEXT: [0,9] . . .D==============eE-------R add x0, x27, #1 2521 2522# CHECK: Average Wait times (based on the timeline view): 2523# CHECK-NEXT: [0]: Executions 2524# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2525# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2526# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2527 2528# CHECK: [0] [1] [2] [3] 2529# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.8b, v2.8b, v3.8b }, [x27], x28 2530# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2531# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3 { v1.8h, v2.8h, v3.8h }, [x27], x28 2532# CHECK-NEXT: 3. 1 1.0 1.0 7.0 add x0, x27, #1 2533# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3 { v1.16b, v2.16b, v3.16b }, [x27], x28 2534# CHECK-NEXT: 5. 1 1.0 1.0 7.0 add x0, x27, #1 2535# CHECK-NEXT: 6. 1 8.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[0], [x27], #3 2536# CHECK-NEXT: 7. 1 8.0 0.0 7.0 add x0, x27, #1 2537# CHECK-NEXT: 8. 1 15.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[8], [x27], #3 2538# CHECK-NEXT: 9. 1 15.0 0.0 7.0 add x0, x27, #1 2539# CHECK-NEXT: 1 5.2 0.5 3.5 <total> 2540 2541# CHECK: [30] Code Region - G31 2542 2543# CHECK: Iterations: 100 2544# CHECK-NEXT: Instructions: 1000 2545# CHECK-NEXT: Total Cycles: 4503 2546# CHECK-NEXT: Total uOps: 3000 2547 2548# CHECK: Dispatch Width: 3 2549# CHECK-NEXT: uOps Per Cycle: 0.67 2550# CHECK-NEXT: IPC: 0.22 2551# CHECK-NEXT: Block RThroughput: 10.0 2552 2553# CHECK: Timeline view: 2554# CHECK-NEXT: 0123456789 0123456789 2555# CHECK-NEXT: Index 0123456789 0123456789 01234567 2556 2557# CHECK: [0,0] DeeeeeeeeeER . . . . . . . . ld3 { v1.b, v2.b, v3.b }[0], [x27], x28 2558# CHECK-NEXT: [0,1] .DeE-------R . . . . . . . . add x0, x27, #1 2559# CHECK-NEXT: [0,2] . D=======eeeeeeeeeER . . . . . . ld3 { v1.b, v2.b, v3.b }[8], [x27], x28 2560# CHECK-NEXT: [0,3] . D=======eE-------R . . . . . . add x0, x27, #1 2561# CHECK-NEXT: [0,4] . D==============eeeeeeeeeER. . . . . ld3 { v1.h, v2.h, v3.h }[0], [x27], #6 2562# CHECK-NEXT: [0,5] . D==============eE-------R. . . . . add x0, x27, #1 2563# CHECK-NEXT: [0,6] . .D=====================eeeeeeeeeER . . . ld3 { v1.h, v2.h, v3.h }[4], [x27], #6 2564# CHECK-NEXT: [0,7] . . D=====================eE-------R . . . add x0, x27, #1 2565# CHECK-NEXT: [0,8] . . D============================eeeeeeeeeER ld3 { v1.h, v2.h, v3.h }[0], [x27], x28 2566# CHECK-NEXT: [0,9] . . D============================eE-------R add x0, x27, #1 2567 2568# CHECK: Average Wait times (based on the timeline view): 2569# CHECK-NEXT: [0]: Executions 2570# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2571# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2572# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2573 2574# CHECK: [0] [1] [2] [3] 2575# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.b, v2.b, v3.b }[0], [x27], x28 2576# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2577# CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld3 { v1.b, v2.b, v3.b }[8], [x27], x28 2578# CHECK-NEXT: 3. 1 8.0 0.0 7.0 add x0, x27, #1 2579# CHECK-NEXT: 4. 1 15.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[0], [x27], #6 2580# CHECK-NEXT: 5. 1 15.0 0.0 7.0 add x0, x27, #1 2581# CHECK-NEXT: 6. 1 22.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[4], [x27], #6 2582# CHECK-NEXT: 7. 1 22.0 0.0 7.0 add x0, x27, #1 2583# CHECK-NEXT: 8. 1 29.0 0.0 0.0 ld3 { v1.h, v2.h, v3.h }[0], [x27], x28 2584# CHECK-NEXT: 9. 1 29.0 0.0 7.0 add x0, x27, #1 2585# CHECK-NEXT: 1 15.0 0.1 3.5 <total> 2586 2587# CHECK: [31] Code Region - G32 2588 2589# CHECK: Iterations: 100 2590# CHECK-NEXT: Instructions: 1000 2591# CHECK-NEXT: Total Cycles: 3703 2592# CHECK-NEXT: Total uOps: 2400 2593 2594# CHECK: Dispatch Width: 3 2595# CHECK-NEXT: uOps Per Cycle: 0.65 2596# CHECK-NEXT: IPC: 0.27 2597# CHECK-NEXT: Block RThroughput: 8.0 2598 2599# CHECK: Timeline view: 2600# CHECK-NEXT: 0123456789 0123456789 2601# CHECK-NEXT: Index 0123456789 0123456789 2602 2603# CHECK: [0,0] DeeeeeeeeeER . . . . . . ld3 { v1.h, v2.h, v3.h }[4], [x27], x28 2604# CHECK-NEXT: [0,1] .DeE-------R . . . . . . add x0, x27, #1 2605# CHECK-NEXT: [0,2] . D=======eeeeeeeeER. . . . . ld3 { v1.s, v2.s, v3.s }[0], [x27], #12 2606# CHECK-NEXT: [0,3] . D=======eE------R. . . . . add x0, x27, #1 2607# CHECK-NEXT: [0,4] . D=============eeeeeeeeER . . . ld3 { v1.s, v2.s, v3.s }[0], [x27], x28 2608# CHECK-NEXT: [0,5] . D=============eE------R . . . add x0, x27, #1 2609# CHECK-NEXT: [0,6] . .D===================eeeeeeER . . ld3 { v1.d, v2.d, v3.d }[0], [x27], #24 2610# CHECK-NEXT: [0,7] . . D===================eE----R . . add x0, x27, #1 2611# CHECK-NEXT: [0,8] . . D=======================eeeeeeER ld3 { v1.d, v2.d, v3.d }[0], [x27], x28 2612# CHECK-NEXT: [0,9] . . D=======================eE----R add x0, x27, #1 2613 2614# CHECK: Average Wait times (based on the timeline view): 2615# CHECK-NEXT: [0]: Executions 2616# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2617# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2618# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2619 2620# CHECK: [0] [1] [2] [3] 2621# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3 { v1.h, v2.h, v3.h }[4], [x27], x28 2622# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2623# CHECK-NEXT: 2. 1 8.0 0.0 0.0 ld3 { v1.s, v2.s, v3.s }[0], [x27], #12 2624# CHECK-NEXT: 3. 1 8.0 0.0 6.0 add x0, x27, #1 2625# CHECK-NEXT: 4. 1 14.0 0.0 0.0 ld3 { v1.s, v2.s, v3.s }[0], [x27], x28 2626# CHECK-NEXT: 5. 1 14.0 0.0 6.0 add x0, x27, #1 2627# CHECK-NEXT: 6. 1 20.0 0.0 0.0 ld3 { v1.d, v2.d, v3.d }[0], [x27], #24 2628# CHECK-NEXT: 7. 1 20.0 0.0 4.0 add x0, x27, #1 2629# CHECK-NEXT: 8. 1 24.0 0.0 0.0 ld3 { v1.d, v2.d, v3.d }[0], [x27], x28 2630# CHECK-NEXT: 9. 1 24.0 0.0 4.0 add x0, x27, #1 2631# CHECK-NEXT: 1 13.4 0.1 2.7 <total> 2632 2633# CHECK: [32] Code Region - G33 2634 2635# CHECK: Iterations: 100 2636# CHECK-NEXT: Instructions: 1000 2637# CHECK-NEXT: Total Cycles: 1110 2638# CHECK-NEXT: Total uOps: 2700 2639 2640# CHECK: Dispatch Width: 3 2641# CHECK-NEXT: uOps Per Cycle: 2.43 2642# CHECK-NEXT: IPC: 0.90 2643# CHECK-NEXT: Block RThroughput: 9.0 2644 2645# CHECK: Timeline view: 2646# CHECK-NEXT: 0123456789 2647# CHECK-NEXT: Index 0123456789 0 2648 2649# CHECK: [0,0] DeeeeeeER . . . ld3r { v1.1d, v2.1d, v3.1d }, [x27], #24 2650# CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1 2651# CHECK-NEXT: [0,2] . DeeeeeeeeeER . . ld3r { v1.2d, v2.2d, v3.2d }, [x27], #24 2652# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 2653# CHECK-NEXT: [0,4] . DeeeeeeeeER . ld3r { v1.2s, v2.2s, v3.2s }, [x27], #12 2654# CHECK-NEXT: [0,5] . .DeE------R . add x0, x27, #1 2655# CHECK-NEXT: [0,6] . . DeeeeeeeeER . ld3r { v1.4h, v2.4h, v3.4h }, [x27], #6 2656# CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1 2657# CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld3r { v1.4s, v2.4s, v3.4s }, [x27], #12 2658# CHECK-NEXT: [0,9] . . DeE-------R add x0, x27, #1 2659 2660# CHECK: Average Wait times (based on the timeline view): 2661# CHECK-NEXT: [0]: Executions 2662# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2663# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2664# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2665 2666# CHECK: [0] [1] [2] [3] 2667# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.1d, v2.1d, v3.1d }, [x27], #24 2668# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 2669# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3r { v1.2d, v2.2d, v3.2d }, [x27], #24 2670# CHECK-NEXT: 3. 1 1.0 1.0 6.0 add x0, x27, #1 2671# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3r { v1.2s, v2.2s, v3.2s }, [x27], #12 2672# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 2673# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld3r { v1.4h, v2.4h, v3.4h }, [x27], #6 2674# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 2675# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3r { v1.4s, v2.4s, v3.4s }, [x27], #12 2676# CHECK-NEXT: 9. 1 1.0 0.0 7.0 add x0, x27, #1 2677# CHECK-NEXT: 1 1.0 0.6 2.9 <total> 2678 2679# CHECK: [33] Code Region - G34 2680 2681# CHECK: Iterations: 100 2682# CHECK-NEXT: Instructions: 1000 2683# CHECK-NEXT: Total Cycles: 1109 2684# CHECK-NEXT: Total uOps: 2800 2685 2686# CHECK: Dispatch Width: 3 2687# CHECK-NEXT: uOps Per Cycle: 2.52 2688# CHECK-NEXT: IPC: 0.90 2689# CHECK-NEXT: Block RThroughput: 9.3 2690 2691# CHECK: Timeline view: 2692# CHECK-NEXT: 0123456789 2693# CHECK-NEXT: Index 0123456789 2694 2695# CHECK: [0,0] DeeeeeeeeER . . ld3r { v1.8b, v2.8b, v3.8b }, [x27], #3 2696# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 2697# CHECK-NEXT: [0,2] . DeeeeeeeeeER . . ld3r { v1.8h, v2.8h, v3.8h }, [x27], #6 2698# CHECK-NEXT: [0,3] . DeE-------R . . add x0, x27, #1 2699# CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld3r { v1.16b, v2.16b, v3.16b }, [x27], #3 2700# CHECK-NEXT: [0,5] . DeE-------R . add x0, x27, #1 2701# CHECK-NEXT: [0,6] . .DeeeeeeE-R . ld3r { v1.1d, v2.1d, v3.1d }, [x27], x28 2702# CHECK-NEXT: [0,7] . . DeE-----R . add x0, x27, #1 2703# CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld3r { v1.2d, v2.2d, v3.2d }, [x27], x28 2704# CHECK-NEXT: [0,9] . . DeE------R add x0, x27, #1 2705 2706# CHECK: Average Wait times (based on the timeline view): 2707# CHECK-NEXT: [0]: Executions 2708# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2709# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2710# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2711 2712# CHECK: [0] [1] [2] [3] 2713# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.8b, v2.8b, v3.8b }, [x27], #3 2714# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 2715# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3r { v1.8h, v2.8h, v3.8h }, [x27], #6 2716# CHECK-NEXT: 3. 1 1.0 0.0 7.0 add x0, x27, #1 2717# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3r { v1.16b, v2.16b, v3.16b }, [x27], #3 2718# CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1 2719# CHECK-NEXT: 6. 1 1.0 1.0 1.0 ld3r { v1.1d, v2.1d, v3.1d }, [x27], x28 2720# CHECK-NEXT: 7. 1 1.0 0.0 5.0 add x0, x27, #1 2721# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3r { v1.2d, v2.2d, v3.2d }, [x27], x28 2722# CHECK-NEXT: 9. 1 1.0 1.0 6.0 add x0, x27, #1 2723# CHECK-NEXT: 1 1.0 0.6 3.2 <total> 2724 2725# CHECK: [34] Code Region - G35 2726 2727# CHECK: Iterations: 100 2728# CHECK-NEXT: Instructions: 1000 2729# CHECK-NEXT: Total Cycles: 1010 2730# CHECK-NEXT: Total uOps: 2700 2731 2732# CHECK: Dispatch Width: 3 2733# CHECK-NEXT: uOps Per Cycle: 2.67 2734# CHECK-NEXT: IPC: 0.99 2735# CHECK-NEXT: Block RThroughput: 9.0 2736 2737# CHECK: Timeline view: 2738# CHECK-NEXT: 0123456789 2739# CHECK-NEXT: Index 0123456789 2740 2741# CHECK: [0,0] DeeeeeeeeER . . ld3r { v1.2s, v2.2s, v3.2s }, [x27], x28 2742# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 2743# CHECK-NEXT: [0,2] . DeeeeeeeeER . . ld3r { v1.4h, v2.4h, v3.4h }, [x27], x28 2744# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 2745# CHECK-NEXT: [0,4] . DeeeeeeeeeER . ld3r { v1.4s, v2.4s, v3.4s }, [x27], x28 2746# CHECK-NEXT: [0,5] . DeE-------R . add x0, x27, #1 2747# CHECK-NEXT: [0,6] . .DeeeeeeeeER . ld3r { v1.8b, v2.8b, v3.8b }, [x27], x28 2748# CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1 2749# CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld3r { v1.8h, v2.8h, v3.8h }, [x27], x28 2750# CHECK-NEXT: [0,9] . . DeE-------R add x0, x27, #1 2751 2752# CHECK: Average Wait times (based on the timeline view): 2753# CHECK-NEXT: [0]: Executions 2754# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2755# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2756# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2757 2758# CHECK: [0] [1] [2] [3] 2759# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.2s, v2.2s, v3.2s }, [x27], x28 2760# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 2761# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld3r { v1.4h, v2.4h, v3.4h }, [x27], x28 2762# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 2763# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld3r { v1.4s, v2.4s, v3.4s }, [x27], x28 2764# CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1 2765# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld3r { v1.8b, v2.8b, v3.8b }, [x27], x28 2766# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 2767# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld3r { v1.8h, v2.8h, v3.8h }, [x27], x28 2768# CHECK-NEXT: 9. 1 1.0 0.0 7.0 add x0, x27, #1 2769# CHECK-NEXT: 1 1.0 0.5 3.2 <total> 2770 2771# CHECK: [35] Code Region - G36 2772 2773# CHECK: Iterations: 100 2774# CHECK-NEXT: Instructions: 1000 2775# CHECK-NEXT: Total Cycles: 1311 2776# CHECK-NEXT: Total uOps: 3400 2777 2778# CHECK: Dispatch Width: 3 2779# CHECK-NEXT: uOps Per Cycle: 2.59 2780# CHECK-NEXT: IPC: 0.76 2781# CHECK-NEXT: Block RThroughput: 13.0 2782 2783# CHECK: Timeline view: 2784# CHECK-NEXT: 0123456789 2785# CHECK-NEXT: Index 0123456789 0123 2786 2787# CHECK: [0,0] DeeeeeeeeeER . . . ld3r { v1.16b, v2.16b, v3.16b }, [x27], x28 2788# CHECK-NEXT: [0,1] .DeE-------R . . . add x0, x27, #1 2789# CHECK-NEXT: [0,2] . DeeeeeeeeER . . . ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 2790# CHECK-NEXT: [0,3] . DeE------R . . . add x0, x27, #1 2791# CHECK-NEXT: [0,4] . D==eeeeeeeeeER . . ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 2792# CHECK-NEXT: [0,5] . D==eE-------R . . add x0, x27, #1 2793# CHECK-NEXT: [0,6] . .D==eeeeeeeeeER. . ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 2794# CHECK-NEXT: [0,7] . . D==eE-------R. . add x0, x27, #1 2795# CHECK-NEXT: [0,8] . . D==eeeeeeeeeeeER ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 2796# CHECK-NEXT: [0,9] . . .DeE---------R add x0, x27, #1 2797 2798# CHECK: Average Wait times (based on the timeline view): 2799# CHECK-NEXT: [0]: Executions 2800# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2801# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2802# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2803 2804# CHECK: [0] [1] [2] [3] 2805# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld3r { v1.16b, v2.16b, v3.16b }, [x27], x28 2806# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2807# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 2808# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 2809# CHECK-NEXT: 4. 1 3.0 3.0 0.0 ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 2810# CHECK-NEXT: 5. 1 3.0 0.0 7.0 add x0, x27, #1 2811# CHECK-NEXT: 6. 1 3.0 1.0 0.0 ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 2812# CHECK-NEXT: 7. 1 3.0 0.0 7.0 add x0, x27, #1 2813# CHECK-NEXT: 8. 1 3.0 1.0 0.0 ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 2814# CHECK-NEXT: 9. 1 1.0 0.0 9.0 add x0, x27, #1 2815# CHECK-NEXT: 1 2.0 0.7 3.6 <total> 2816 2817# CHECK: [36] Code Region - G37 2818 2819# CHECK: Iterations: 100 2820# CHECK-NEXT: Instructions: 1000 2821# CHECK-NEXT: Total Cycles: 1610 2822# CHECK-NEXT: Total uOps: 3800 2823 2824# CHECK: Dispatch Width: 3 2825# CHECK-NEXT: uOps Per Cycle: 2.36 2826# CHECK-NEXT: IPC: 0.62 2827# CHECK-NEXT: Block RThroughput: 16.0 2828 2829# CHECK: Timeline view: 2830# CHECK-NEXT: 0123456789 2831# CHECK-NEXT: Index 0123456789 012345 2832 2833# CHECK: [0,0] DeeeeeeeeeER . . . ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 2834# CHECK-NEXT: [0,1] .DeE-------R . . . add x0, x27, #1 2835# CHECK-NEXT: [0,2] . DeeeeeeeeeeeER . . ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 2836# CHECK-NEXT: [0,3] . DeE-------R . . add x0, x27, #1 2837# CHECK-NEXT: [0,4] . .DeeeeeeeeeeeER. . ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 2838# CHECK-NEXT: [0,5] . . DeE-------R. . add x0, x27, #1 2839# CHECK-NEXT: [0,6] . . DeeeeeeeeER . ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 2840# CHECK-NEXT: [0,7] . . .DeE------R . add x0, x27, #1 2841# CHECK-NEXT: [0,8] . . . D==eeeeeeeeeER ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 2842# CHECK-NEXT: [0,9] . . . D==eE-------R add x0, x27, #1 2843 2844# CHECK: Average Wait times (based on the timeline view): 2845# CHECK-NEXT: [0]: Executions 2846# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2847# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2848# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2849 2850# CHECK: [0] [1] [2] [3] 2851# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 2852# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2853# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 2854# CHECK-NEXT: 3. 1 1.0 1.0 7.0 add x0, x27, #1 2855# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 2856# CHECK-NEXT: 5. 1 1.0 1.0 7.0 add x0, x27, #1 2857# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 2858# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 2859# CHECK-NEXT: 8. 1 3.0 3.0 0.0 ld4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 2860# CHECK-NEXT: 9. 1 3.0 0.0 7.0 add x0, x27, #1 2861# CHECK-NEXT: 1 1.4 0.9 3.4 <total> 2862 2863# CHECK: [37] Code Region - G38 2864 2865# CHECK: Iterations: 100 2866# CHECK-NEXT: Instructions: 1000 2867# CHECK-NEXT: Total Cycles: 1610 2868# CHECK-NEXT: Total uOps: 4200 2869 2870# CHECK: Dispatch Width: 3 2871# CHECK-NEXT: uOps Per Cycle: 2.61 2872# CHECK-NEXT: IPC: 0.62 2873# CHECK-NEXT: Block RThroughput: 16.0 2874 2875# CHECK: Timeline view: 2876# CHECK-NEXT: 0123456789 2877# CHECK-NEXT: Index 0123456789 012345 2878 2879# CHECK: [0,0] DeeeeeeeeeER . . . ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 2880# CHECK-NEXT: [0,1] .DeE-------R . . . add x0, x27, #1 2881# CHECK-NEXT: [0,2] . DeeeeeeeeeeeER . . ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 2882# CHECK-NEXT: [0,3] . DeE-------R . . add x0, x27, #1 2883# CHECK-NEXT: [0,4] . .DeeeeeeeeeER . . ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 2884# CHECK-NEXT: [0,5] . . DeE-------R . . add x0, x27, #1 2885# CHECK-NEXT: [0,6] . . DeeeeeeeeeeeER . ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 2886# CHECK-NEXT: [0,7] . . .DeE-------R . add x0, x27, #1 2887# CHECK-NEXT: [0,8] . . . DeeeeeeeeeeeER ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 2888# CHECK-NEXT: [0,9] . . . DeE-------R add x0, x27, #1 2889 2890# CHECK: Average Wait times (based on the timeline view): 2891# CHECK-NEXT: [0]: Executions 2892# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2893# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2894# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2895 2896# CHECK: [0] [1] [2] [3] 2897# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 2898# CHECK-NEXT: 1. 1 1.0 0.0 7.0 add x0, x27, #1 2899# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 2900# CHECK-NEXT: 3. 1 1.0 1.0 7.0 add x0, x27, #1 2901# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 2902# CHECK-NEXT: 5. 1 1.0 0.0 7.0 add x0, x27, #1 2903# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 2904# CHECK-NEXT: 7. 1 1.0 1.0 7.0 add x0, x27, #1 2905# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 2906# CHECK-NEXT: 9. 1 1.0 1.0 7.0 add x0, x27, #1 2907# CHECK-NEXT: 1 1.0 0.8 3.5 <total> 2908 2909# CHECK: [38] Code Region - G39 2910 2911# CHECK: Iterations: 100 2912# CHECK-NEXT: Instructions: 1000 2913# CHECK-NEXT: Total Cycles: 4503 2914# CHECK-NEXT: Total uOps: 3500 2915 2916# CHECK: Dispatch Width: 3 2917# CHECK-NEXT: uOps Per Cycle: 0.78 2918# CHECK-NEXT: IPC: 0.22 2919# CHECK-NEXT: Block RThroughput: 11.7 2920 2921# CHECK: Timeline view: 2922# CHECK-NEXT: 0123456789 0123456789 2923# CHECK-NEXT: Index 0123456789 0123456789 01234567 2924 2925# CHECK: [0,0] DeeeeeeeeeER . . . . . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 2926# CHECK-NEXT: [0,1] . DeE------R . . . . . . . . add x0, x27, #1 2927# CHECK-NEXT: [0,2] . D======eeeeeeeeeER . . . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 2928# CHECK-NEXT: [0,3] . D=====eE-------R . . . . . . add x0, x27, #1 2929# CHECK-NEXT: [0,4] . .D============eeeeeeeeeER. . . . . ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 2930# CHECK-NEXT: [0,5] . . D===========eE-------R. . . . . add x0, x27, #1 2931# CHECK-NEXT: [0,6] . . D==================eeeeeeeeeER . . . ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 2932# CHECK-NEXT: [0,7] . . .D=================eE-------R . . . add x0, x27, #1 2933# CHECK-NEXT: [0,8] . . . D========================eeeeeeeeeER ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 2934# CHECK-NEXT: [0,9] . . . D=======================eE-------R add x0, x27, #1 2935 2936# CHECK: Average Wait times (based on the timeline view): 2937# CHECK-NEXT: [0]: Executions 2938# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2939# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2940# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2941 2942# CHECK: [0] [1] [2] [3] 2943# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 2944# CHECK-NEXT: 1. 1 1.0 1.0 6.0 add x0, x27, #1 2945# CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 2946# CHECK-NEXT: 3. 1 6.0 0.0 7.0 add x0, x27, #1 2947# CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 2948# CHECK-NEXT: 5. 1 12.0 0.0 7.0 add x0, x27, #1 2949# CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 2950# CHECK-NEXT: 7. 1 18.0 0.0 7.0 add x0, x27, #1 2951# CHECK-NEXT: 8. 1 25.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 2952# CHECK-NEXT: 9. 1 24.0 0.0 7.0 add x0, x27, #1 2953# CHECK-NEXT: 1 12.6 0.2 3.4 <total> 2954 2955# CHECK: [39] Code Region - G40 2956 2957# CHECK: Iterations: 100 2958# CHECK-NEXT: Instructions: 1000 2959# CHECK-NEXT: Total Cycles: 4303 2960# CHECK-NEXT: Total uOps: 3100 2961 2962# CHECK: Dispatch Width: 3 2963# CHECK-NEXT: uOps Per Cycle: 0.72 2964# CHECK-NEXT: IPC: 0.23 2965# CHECK-NEXT: Block RThroughput: 10.3 2966 2967# CHECK: Timeline view: 2968# CHECK-NEXT: 0123456789 0123456789 2969# CHECK-NEXT: Index 0123456789 0123456789 012345 2970 2971# CHECK: [0,0] DeeeeeeeeeER . . . . . . . ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 2972# CHECK-NEXT: [0,1] . DeE------R . . . . . . . add x0, x27, #1 2973# CHECK-NEXT: [0,2] . D======eeeeeeeeeER . . . . . ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 2974# CHECK-NEXT: [0,3] . D=====eE-------R . . . . . add x0, x27, #1 2975# CHECK-NEXT: [0,4] . .D============eeeeeeeeeER. . . . ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 2976# CHECK-NEXT: [0,5] . . D===========eE-------R. . . . add x0, x27, #1 2977# CHECK-NEXT: [0,6] . . D==================eeeeeeeeER . . ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 2978# CHECK-NEXT: [0,7] . . D==================eE------R . . add x0, x27, #1 2979# CHECK-NEXT: [0,8] . . .D========================eeeeeeeeER ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 2980# CHECK-NEXT: [0,9] . . . D========================eE------R add x0, x27, #1 2981 2982# CHECK: Average Wait times (based on the timeline view): 2983# CHECK-NEXT: [0]: Executions 2984# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 2985# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 2986# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 2987 2988# CHECK: [0] [1] [2] [3] 2989# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 2990# CHECK-NEXT: 1. 1 1.0 1.0 6.0 add x0, x27, #1 2991# CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 2992# CHECK-NEXT: 3. 1 6.0 0.0 7.0 add x0, x27, #1 2993# CHECK-NEXT: 4. 1 13.0 0.0 0.0 ld4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 2994# CHECK-NEXT: 5. 1 12.0 0.0 7.0 add x0, x27, #1 2995# CHECK-NEXT: 6. 1 19.0 0.0 0.0 ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 2996# CHECK-NEXT: 7. 1 19.0 0.0 6.0 add x0, x27, #1 2997# CHECK-NEXT: 8. 1 25.0 0.0 0.0 ld4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 2998# CHECK-NEXT: 9. 1 25.0 0.0 6.0 add x0, x27, #1 2999# CHECK-NEXT: 1 12.8 0.2 3.2 <total> 3000 3001# CHECK: [40] Code Region - G41 3002 3003# CHECK: Iterations: 100 3004# CHECK-NEXT: Instructions: 1000 3005# CHECK-NEXT: Total Cycles: 2303 3006# CHECK-NEXT: Total uOps: 3100 3007 3008# CHECK: Dispatch Width: 3 3009# CHECK-NEXT: uOps Per Cycle: 1.35 3010# CHECK-NEXT: IPC: 0.43 3011# CHECK-NEXT: Block RThroughput: 10.3 3012 3013# CHECK: Timeline view: 3014# CHECK-NEXT: 0123456789 3015# CHECK-NEXT: Index 0123456789 012345 3016 3017# CHECK: [0,0] DeeeeeeeeeER . . . ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 3018# CHECK-NEXT: [0,1] . DeE------R . . . add x0, x27, #1 3019# CHECK-NEXT: [0,2] . D======eeeeeeeeeER . ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 3020# CHECK-NEXT: [0,3] . D=====eE-------R . add x0, x27, #1 3021# CHECK-NEXT: [0,4] . .D=====eeeeeeE-R . ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 3022# CHECK-NEXT: [0,5] . . D=====eE-----R . add x0, x27, #1 3023# CHECK-NEXT: [0,6] . . D=====eeeeeeeeeER. ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32 3024# CHECK-NEXT: [0,7] . . D====eE-------R. add x0, x27, #1 3025# CHECK-NEXT: [0,8] . . .D====eeeeeeeeER ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16 3026# CHECK-NEXT: [0,9] . . . D====eE------R add x0, x27, #1 3027 3028# CHECK: Average Wait times (based on the timeline view): 3029# CHECK-NEXT: [0]: Executions 3030# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3031# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3032# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3033 3034# CHECK: [0] [1] [2] [3] 3035# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 3036# CHECK-NEXT: 1. 1 1.0 1.0 6.0 add x0, x27, #1 3037# CHECK-NEXT: 2. 1 7.0 0.0 0.0 ld4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 3038# CHECK-NEXT: 3. 1 6.0 0.0 7.0 add x0, x27, #1 3039# CHECK-NEXT: 4. 1 6.0 1.0 1.0 ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 3040# CHECK-NEXT: 5. 1 6.0 0.0 5.0 add x0, x27, #1 3041# CHECK-NEXT: 6. 1 6.0 1.0 0.0 ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #32 3042# CHECK-NEXT: 7. 1 5.0 0.0 7.0 add x0, x27, #1 3043# CHECK-NEXT: 8. 1 5.0 1.0 0.0 ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #16 3044# CHECK-NEXT: 9. 1 5.0 0.0 6.0 add x0, x27, #1 3045# CHECK-NEXT: 1 4.8 0.5 3.2 <total> 3046 3047# CHECK: [41] Code Region - G42 3048 3049# CHECK: Iterations: 100 3050# CHECK-NEXT: Instructions: 1000 3051# CHECK-NEXT: Total Cycles: 1309 3052# CHECK-NEXT: Total uOps: 3100 3053 3054# CHECK: Dispatch Width: 3 3055# CHECK-NEXT: uOps Per Cycle: 2.37 3056# CHECK-NEXT: IPC: 0.76 3057# CHECK-NEXT: Block RThroughput: 10.3 3058 3059# CHECK: Timeline view: 3060# CHECK-NEXT: 0123456789 3061# CHECK-NEXT: Index 0123456789 01 3062 3063# CHECK: [0,0] DeeeeeeeeER . .. ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8 3064# CHECK-NEXT: [0,1] .DeE------R . .. add x0, x27, #1 3065# CHECK-NEXT: [0,2] . DeeeeeeeeeER . .. ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16 3066# CHECK-NEXT: [0,3] . DeE------R . .. add x0, x27, #1 3067# CHECK-NEXT: [0,4] . DeeeeeeeeER .. ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4 3068# CHECK-NEXT: [0,5] . .DeE------R .. add x0, x27, #1 3069# CHECK-NEXT: [0,6] . . DeeeeeeeeeER .. ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8 3070# CHECK-NEXT: [0,7] . . DeE------R .. add x0, x27, #1 3071# CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4 3072# CHECK-NEXT: [0,9] . . . DeE------R add x0, x27, #1 3073 3074# CHECK: Average Wait times (based on the timeline view): 3075# CHECK-NEXT: [0]: Executions 3076# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3077# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3078# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3079 3080# CHECK: [0] [1] [2] [3] 3081# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #8 3082# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 3083# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #16 3084# CHECK-NEXT: 3. 1 1.0 1.0 6.0 add x0, x27, #1 3085# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #4 3086# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 3087# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #8 3088# CHECK-NEXT: 7. 1 1.0 1.0 6.0 add x0, x27, #1 3089# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #4 3090# CHECK-NEXT: 9. 1 1.0 1.0 6.0 add x0, x27, #1 3091# CHECK-NEXT: 1 1.0 0.8 3.0 <total> 3092 3093# CHECK: [42] Code Region - G43 3094 3095# CHECK: Iterations: 100 3096# CHECK-NEXT: Instructions: 1000 3097# CHECK-NEXT: Total Cycles: 1209 3098# CHECK-NEXT: Total uOps: 2900 3099 3100# CHECK: Dispatch Width: 3 3101# CHECK-NEXT: uOps Per Cycle: 2.40 3102# CHECK-NEXT: IPC: 0.83 3103# CHECK-NEXT: Block RThroughput: 9.7 3104 3105# CHECK: Timeline view: 3106# CHECK-NEXT: 0123456789 3107# CHECK-NEXT: Index 0123456789 0 3108 3109# CHECK: [0,0] DeeeeeeER . . . ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 3110# CHECK-NEXT: [0,1] .DeE----R . . . add x0, x27, #1 3111# CHECK-NEXT: [0,2] . DeeeeeeeeeER . . ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 3112# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 3113# CHECK-NEXT: [0,4] . DeeeeeeeeER . ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 3114# CHECK-NEXT: [0,5] . .DeE------R . add x0, x27, #1 3115# CHECK-NEXT: [0,6] . . DeeeeeeeeER . ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 3116# CHECK-NEXT: [0,7] . . DeE------R . add x0, x27, #1 3117# CHECK-NEXT: [0,8] . . DeeeeeeeeeER ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 3118# CHECK-NEXT: [0,9] . . .DeE------R add x0, x27, #1 3119 3120# CHECK: Average Wait times (based on the timeline view): 3121# CHECK-NEXT: [0]: Executions 3122# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3123# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3124# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3125 3126# CHECK: [0] [1] [2] [3] 3127# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 3128# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 3129# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4r { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 3130# CHECK-NEXT: 3. 1 1.0 1.0 6.0 add x0, x27, #1 3131# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4r { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 3132# CHECK-NEXT: 5. 1 1.0 0.0 6.0 add x0, x27, #1 3133# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ld4r { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 3134# CHECK-NEXT: 7. 1 1.0 0.0 6.0 add x0, x27, #1 3135# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ld4r { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 3136# CHECK-NEXT: 9. 1 1.0 1.0 6.0 add x0, x27, #1 3137# CHECK-NEXT: 1 1.0 0.7 2.8 <total> 3138 3139# CHECK: [43] Code Region - G44 3140 3141# CHECK: Iterations: 100 3142# CHECK-NEXT: Instructions: 1000 3143# CHECK-NEXT: Total Cycles: 1206 3144# CHECK-NEXT: Total uOps: 2700 3145 3146# CHECK: Dispatch Width: 3 3147# CHECK-NEXT: uOps Per Cycle: 2.24 3148# CHECK-NEXT: IPC: 0.83 3149# CHECK-NEXT: Block RThroughput: 9.0 3150 3151# CHECK: Timeline view: 3152# CHECK-NEXT: 01234567 3153# CHECK-NEXT: Index 0123456789 3154 3155# CHECK: [0,0] DeeeeeeeeER . . ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 3156# CHECK-NEXT: [0,1] .DeE------R . . add x0, x27, #1 3157# CHECK-NEXT: [0,2] . DeeeeeeeeeER . . ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 3158# CHECK-NEXT: [0,3] . DeE------R . . add x0, x27, #1 3159# CHECK-NEXT: [0,4] . DeeeeeeeeeER. ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 3160# CHECK-NEXT: [0,5] . . DeE------R. add x0, x27, #1 3161# CHECK-NEXT: [0,6] . . DeeeeeE-R. ldp s1, s2, [x27], #248 3162# CHECK-NEXT: [0,7] . . DeE----R. add x0, x27, #1 3163# CHECK-NEXT: [0,8] . . DeeeeeER ldp d1, d2, [x27], #496 3164# CHECK-NEXT: [0,9] . . .DeE---R add x0, x27, #1 3165 3166# CHECK: Average Wait times (based on the timeline view): 3167# CHECK-NEXT: [0]: Executions 3168# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3169# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3170# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3171 3172# CHECK: [0] [1] [2] [3] 3173# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ld4r { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 3174# CHECK-NEXT: 1. 1 1.0 0.0 6.0 add x0, x27, #1 3175# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ld4r { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 3176# CHECK-NEXT: 3. 1 1.0 1.0 6.0 add x0, x27, #1 3177# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ld4r { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 3178# CHECK-NEXT: 5. 1 1.0 1.0 6.0 add x0, x27, #1 3179# CHECK-NEXT: 6. 1 1.0 1.0 1.0 ldp s1, s2, [x27], #248 3180# CHECK-NEXT: 7. 1 1.0 0.0 4.0 add x0, x27, #1 3181# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ldp d1, d2, [x27], #496 3182# CHECK-NEXT: 9. 1 1.0 0.0 3.0 add x0, x27, #1 3183# CHECK-NEXT: 1 1.0 0.7 2.6 <total> 3184 3185# CHECK: [44] Code Region - G45 3186 3187# CHECK: Iterations: 100 3188# CHECK-NEXT: Instructions: 1000 3189# CHECK-NEXT: Total Cycles: 1005 3190# CHECK-NEXT: Total uOps: 2200 3191 3192# CHECK: Dispatch Width: 3 3193# CHECK-NEXT: uOps Per Cycle: 2.19 3194# CHECK-NEXT: IPC: 1.00 3195# CHECK-NEXT: Block RThroughput: 7.3 3196 3197# CHECK: Timeline view: 3198# CHECK-NEXT: 01234 3199# CHECK-NEXT: Index 0123456789 3200 3201# CHECK: [0,0] DeeeeeeER . . ldp q1, q2, [x27], #992 3202# CHECK-NEXT: [0,1] .DeE----R . . add x0, x27, #1 3203# CHECK-NEXT: [0,2] . DeeeeeER. . ldp s1, s2, [x27, #248]! 3204# CHECK-NEXT: [0,3] . DeE---R. . add x0, x27, #1 3205# CHECK-NEXT: [0,4] . DeeeeeER . ldp d1, d2, [x27, #496]! 3206# CHECK-NEXT: [0,5] . DeE---R . add x0, x27, #1 3207# CHECK-NEXT: [0,6] . .DeeeeeeER ldp q1, q2, [x27, #992]! 3208# CHECK-NEXT: [0,7] . . DeE----R add x0, x27, #1 3209# CHECK-NEXT: [0,8] . . DeeeeER ldp w1, w2, [x27], #248 3210# CHECK-NEXT: [0,9] . . DeE--R add x0, x27, #1 3211 3212# CHECK: Average Wait times (based on the timeline view): 3213# CHECK-NEXT: [0]: Executions 3214# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3215# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3216# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3217 3218# CHECK: [0] [1] [2] [3] 3219# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldp q1, q2, [x27], #992 3220# CHECK-NEXT: 1. 1 1.0 0.0 4.0 add x0, x27, #1 3221# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ldp s1, s2, [x27, #248]! 3222# CHECK-NEXT: 3. 1 1.0 0.0 3.0 add x0, x27, #1 3223# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ldp d1, d2, [x27, #496]! 3224# CHECK-NEXT: 5. 1 1.0 0.0 3.0 add x0, x27, #1 3225# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ldp q1, q2, [x27, #992]! 3226# CHECK-NEXT: 7. 1 1.0 0.0 4.0 add x0, x27, #1 3227# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ldp w1, w2, [x27], #248 3228# CHECK-NEXT: 9. 1 1.0 0.0 2.0 add x0, x27, #1 3229# CHECK-NEXT: 1 1.0 0.5 1.6 <total> 3230 3231# CHECK: [45] Code Region - G46 3232 3233# CHECK: Iterations: 100 3234# CHECK-NEXT: Instructions: 1000 3235# CHECK-NEXT: Total Cycles: 1006 3236# CHECK-NEXT: Total uOps: 2400 3237 3238# CHECK: Dispatch Width: 3 3239# CHECK-NEXT: uOps Per Cycle: 2.39 3240# CHECK-NEXT: IPC: 0.99 3241# CHECK-NEXT: Block RThroughput: 8.0 3242 3243# CHECK: Timeline view: 3244# CHECK-NEXT: 012345 3245# CHECK-NEXT: Index 0123456789 3246 3247# CHECK: [0,0] DeeeeER . . ldp x1, x2, [x27], #496 3248# CHECK-NEXT: [0,1] .DeE--R . . add x0, x27, #1 3249# CHECK-NEXT: [0,2] . DeeeeER . . ldp w1, w2, [x27, #248]! 3250# CHECK-NEXT: [0,3] . DeE--R . . add x0, x27, #1 3251# CHECK-NEXT: [0,4] . DeeeeER . ldp x1, x2, [x27, #496]! 3252# CHECK-NEXT: [0,5] . DeE--R . add x0, x27, #1 3253# CHECK-NEXT: [0,6] . .DeeeeeER . ldpsw x1, x2, [x27], #248 3254# CHECK-NEXT: [0,7] . . DeE---R . add x0, x27, #1 3255# CHECK-NEXT: [0,8] . . DeeeeeER ldpsw x1, x2, [x27, #248]! 3256# CHECK-NEXT: [0,9] . . DeE---R add x0, x27, #1 3257 3258# CHECK: Average Wait times (based on the timeline view): 3259# CHECK-NEXT: [0]: Executions 3260# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3261# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3262# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3263 3264# CHECK: [0] [1] [2] [3] 3265# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldp x1, x2, [x27], #496 3266# CHECK-NEXT: 1. 1 1.0 0.0 2.0 add x0, x27, #1 3267# CHECK-NEXT: 2. 1 1.0 1.0 0.0 ldp w1, w2, [x27, #248]! 3268# CHECK-NEXT: 3. 1 1.0 0.0 2.0 add x0, x27, #1 3269# CHECK-NEXT: 4. 1 1.0 1.0 0.0 ldp x1, x2, [x27, #496]! 3270# CHECK-NEXT: 5. 1 1.0 0.0 2.0 add x0, x27, #1 3271# CHECK-NEXT: 6. 1 1.0 1.0 0.0 ldpsw x1, x2, [x27], #248 3272# CHECK-NEXT: 7. 1 1.0 0.0 3.0 add x0, x27, #1 3273# CHECK-NEXT: 8. 1 1.0 1.0 0.0 ldpsw x1, x2, [x27, #248]! 3274# CHECK-NEXT: 9. 1 1.0 0.0 3.0 add x0, x27, #1 3275# CHECK-NEXT: 1 1.0 0.5 1.2 <total> 3276 3277# CHECK: [46] Code Region - G47 3278 3279# CHECK: Iterations: 100 3280# CHECK-NEXT: Instructions: 1000 3281# CHECK-NEXT: Total Cycles: 2504 3282# CHECK-NEXT: Total uOps: 1500 3283 3284# CHECK: Dispatch Width: 3 3285# CHECK-NEXT: uOps Per Cycle: 0.60 3286# CHECK-NEXT: IPC: 0.40 3287# CHECK-NEXT: Block RThroughput: 5.0 3288 3289# CHECK: Timeline view: 3290# CHECK-NEXT: 0123456789 3291# CHECK-NEXT: Index 0123456789 012345678 3292 3293# CHECK: [0,0] DeeeeeER . . . . . ldr b1, [x27], #254 3294# CHECK-NEXT: [0,1] D=====eER . . . . . add x0, x27, #1 3295# CHECK-NEXT: [0,2] .D====eeeeeER . . . . ldr h1, [x27], #254 3296# CHECK-NEXT: [0,3] .D=========eER . . . . add x0, x27, #1 3297# CHECK-NEXT: [0,4] . D========eeeeeER . . . ldr s1, [x27], #254 3298# CHECK-NEXT: [0,5] . D=============eER . . . add x0, x27, #1 3299# CHECK-NEXT: [0,6] . D============eeeeeER . . ldr d1, [x27], #254 3300# CHECK-NEXT: [0,7] . D=================eER . . add x0, x27, #1 3301# CHECK-NEXT: [0,8] . D================eeeeeER. ldr q1, [x27], #254 3302# CHECK-NEXT: [0,9] . D=====================eER add x0, x27, #1 3303 3304# CHECK: Average Wait times (based on the timeline view): 3305# CHECK-NEXT: [0]: Executions 3306# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3307# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3308# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3309 3310# CHECK: [0] [1] [2] [3] 3311# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr b1, [x27], #254 3312# CHECK-NEXT: 1. 1 6.0 0.0 0.0 add x0, x27, #1 3313# CHECK-NEXT: 2. 1 5.0 0.0 0.0 ldr h1, [x27], #254 3314# CHECK-NEXT: 3. 1 10.0 0.0 0.0 add x0, x27, #1 3315# CHECK-NEXT: 4. 1 9.0 0.0 0.0 ldr s1, [x27], #254 3316# CHECK-NEXT: 5. 1 14.0 0.0 0.0 add x0, x27, #1 3317# CHECK-NEXT: 6. 1 13.0 0.0 0.0 ldr d1, [x27], #254 3318# CHECK-NEXT: 7. 1 18.0 0.0 0.0 add x0, x27, #1 3319# CHECK-NEXT: 8. 1 17.0 0.0 0.0 ldr q1, [x27], #254 3320# CHECK-NEXT: 9. 1 22.0 0.0 0.0 add x0, x27, #1 3321# CHECK-NEXT: 1 11.5 0.1 0.0 <total> 3322 3323# CHECK: [47] Code Region - G48 3324 3325# CHECK: Iterations: 100 3326# CHECK-NEXT: Instructions: 1000 3327# CHECK-NEXT: Total Cycles: 507 3328# CHECK-NEXT: Total uOps: 1500 3329 3330# CHECK: Dispatch Width: 3 3331# CHECK-NEXT: uOps Per Cycle: 2.96 3332# CHECK-NEXT: IPC: 1.97 3333# CHECK-NEXT: Block RThroughput: 5.0 3334 3335# CHECK: Timeline view: 3336# CHECK-NEXT: 01 3337# CHECK-NEXT: Index 0123456789 3338 3339# CHECK: [0,0] DeeeeeER .. ldr b1, [x27, #254]! 3340# CHECK-NEXT: [0,1] D=eE---R .. add x0, x27, #1 3341# CHECK-NEXT: [0,2] .DeeeeeER .. ldr h1, [x27, #254]! 3342# CHECK-NEXT: [0,3] .D=eE---R .. add x0, x27, #1 3343# CHECK-NEXT: [0,4] . DeeeeeER.. ldr s1, [x27, #254]! 3344# CHECK-NEXT: [0,5] . D=eE---R.. add x0, x27, #1 3345# CHECK-NEXT: [0,6] . DeeeeeER. ldr d1, [x27, #254]! 3346# CHECK-NEXT: [0,7] . D=eE---R. add x0, x27, #1 3347# CHECK-NEXT: [0,8] . DeeeeeER ldr q1, [x27, #254]! 3348# CHECK-NEXT: [0,9] . D=eE---R add x0, x27, #1 3349 3350# CHECK: Average Wait times (based on the timeline view): 3351# CHECK-NEXT: [0]: Executions 3352# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3353# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3354# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3355 3356# CHECK: [0] [1] [2] [3] 3357# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr b1, [x27, #254]! 3358# CHECK-NEXT: 1. 1 2.0 0.0 3.0 add x0, x27, #1 3359# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldr h1, [x27, #254]! 3360# CHECK-NEXT: 3. 1 2.0 0.0 3.0 add x0, x27, #1 3361# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldr s1, [x27, #254]! 3362# CHECK-NEXT: 5. 1 2.0 0.0 3.0 add x0, x27, #1 3363# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ldr d1, [x27, #254]! 3364# CHECK-NEXT: 7. 1 2.0 0.0 3.0 add x0, x27, #1 3365# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ldr q1, [x27, #254]! 3366# CHECK-NEXT: 9. 1 2.0 0.0 3.0 add x0, x27, #1 3367# CHECK-NEXT: 1 1.5 0.1 1.5 <total> 3368 3369# CHECK: [48] Code Region - G49 3370 3371# CHECK: Iterations: 100 3372# CHECK-NEXT: Instructions: 1000 3373# CHECK-NEXT: Total Cycles: 506 3374# CHECK-NEXT: Total uOps: 1500 3375 3376# CHECK: Dispatch Width: 3 3377# CHECK-NEXT: uOps Per Cycle: 2.96 3378# CHECK-NEXT: IPC: 1.98 3379# CHECK-NEXT: Block RThroughput: 5.0 3380 3381# CHECK: Timeline view: 3382# CHECK-NEXT: 0 3383# CHECK-NEXT: Index 0123456789 3384 3385# CHECK: [0,0] DeeeeER . ldr w1, [x27], #254 3386# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 3387# CHECK-NEXT: [0,2] .DeeeeER . ldr x1, [x27], #254 3388# CHECK-NEXT: [0,3] .D=eE--R . add x0, x27, #1 3389# CHECK-NEXT: [0,4] . DeeeeER . ldr w1, [x27, #254]! 3390# CHECK-NEXT: [0,5] . D=eE--R . add x0, x27, #1 3391# CHECK-NEXT: [0,6] . DeeeeER. ldr x1, [x27, #254]! 3392# CHECK-NEXT: [0,7] . D=eE--R. add x0, x27, #1 3393# CHECK-NEXT: [0,8] . DeeeeER ldrb w1, [x27], #254 3394# CHECK-NEXT: [0,9] . D=eE--R add x0, x27, #1 3395 3396# CHECK: Average Wait times (based on the timeline view): 3397# CHECK-NEXT: [0]: Executions 3398# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3399# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3400# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3401 3402# CHECK: [0] [1] [2] [3] 3403# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr w1, [x27], #254 3404# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3405# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldr x1, [x27], #254 3406# CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1 3407# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldr w1, [x27, #254]! 3408# CHECK-NEXT: 5. 1 2.0 0.0 2.0 add x0, x27, #1 3409# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ldr x1, [x27, #254]! 3410# CHECK-NEXT: 7. 1 2.0 0.0 2.0 add x0, x27, #1 3411# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ldrb w1, [x27], #254 3412# CHECK-NEXT: 9. 1 2.0 0.0 2.0 add x0, x27, #1 3413# CHECK-NEXT: 1 1.5 0.1 1.0 <total> 3414 3415# CHECK: [49] Code Region - G50 3416 3417# CHECK: Iterations: 100 3418# CHECK-NEXT: Instructions: 1000 3419# CHECK-NEXT: Total Cycles: 506 3420# CHECK-NEXT: Total uOps: 1500 3421 3422# CHECK: Dispatch Width: 3 3423# CHECK-NEXT: uOps Per Cycle: 2.96 3424# CHECK-NEXT: IPC: 1.98 3425# CHECK-NEXT: Block RThroughput: 5.0 3426 3427# CHECK: Timeline view: 3428# CHECK-NEXT: 0 3429# CHECK-NEXT: Index 0123456789 3430 3431# CHECK: [0,0] DeeeeER . ldrb w1, [x27, #254]! 3432# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 3433# CHECK-NEXT: [0,2] .DeeeeER . ldrh w1, [x27], #254 3434# CHECK-NEXT: [0,3] .D=eE--R . add x0, x27, #1 3435# CHECK-NEXT: [0,4] . DeeeeER . ldrh w1, [x27, #254]! 3436# CHECK-NEXT: [0,5] . D=eE--R . add x0, x27, #1 3437# CHECK-NEXT: [0,6] . DeeeeER. ldrsb w1, [x27], #254 3438# CHECK-NEXT: [0,7] . D=eE--R. add x0, x27, #1 3439# CHECK-NEXT: [0,8] . DeeeeER ldrsb x1, [x27], #254 3440# CHECK-NEXT: [0,9] . D=eE--R add x0, x27, #1 3441 3442# CHECK: Average Wait times (based on the timeline view): 3443# CHECK-NEXT: [0]: Executions 3444# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3445# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3446# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3447 3448# CHECK: [0] [1] [2] [3] 3449# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrb w1, [x27, #254]! 3450# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3451# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldrh w1, [x27], #254 3452# CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1 3453# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldrh w1, [x27, #254]! 3454# CHECK-NEXT: 5. 1 2.0 0.0 2.0 add x0, x27, #1 3455# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ldrsb w1, [x27], #254 3456# CHECK-NEXT: 7. 1 2.0 0.0 2.0 add x0, x27, #1 3457# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ldrsb x1, [x27], #254 3458# CHECK-NEXT: 9. 1 2.0 0.0 2.0 add x0, x27, #1 3459# CHECK-NEXT: 1 1.5 0.1 1.0 <total> 3460 3461# CHECK: [50] Code Region - G51 3462 3463# CHECK: Iterations: 100 3464# CHECK-NEXT: Instructions: 1000 3465# CHECK-NEXT: Total Cycles: 506 3466# CHECK-NEXT: Total uOps: 1500 3467 3468# CHECK: Dispatch Width: 3 3469# CHECK-NEXT: uOps Per Cycle: 2.96 3470# CHECK-NEXT: IPC: 1.98 3471# CHECK-NEXT: Block RThroughput: 5.0 3472 3473# CHECK: Timeline view: 3474# CHECK-NEXT: 0 3475# CHECK-NEXT: Index 0123456789 3476 3477# CHECK: [0,0] DeeeeER . ldrsb w1, [x27, #254]! 3478# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 3479# CHECK-NEXT: [0,2] .DeeeeER . ldrsb x1, [x27, #254]! 3480# CHECK-NEXT: [0,3] .D=eE--R . add x0, x27, #1 3481# CHECK-NEXT: [0,4] . DeeeeER . ldrsh w1, [x27], #254 3482# CHECK-NEXT: [0,5] . D=eE--R . add x0, x27, #1 3483# CHECK-NEXT: [0,6] . DeeeeER. ldrsh x1, [x27], #254 3484# CHECK-NEXT: [0,7] . D=eE--R. add x0, x27, #1 3485# CHECK-NEXT: [0,8] . DeeeeER ldrsh w1, [x27, #254]! 3486# CHECK-NEXT: [0,9] . D=eE--R add x0, x27, #1 3487 3488# CHECK: Average Wait times (based on the timeline view): 3489# CHECK-NEXT: [0]: Executions 3490# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3491# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3492# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3493 3494# CHECK: [0] [1] [2] [3] 3495# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrsb w1, [x27, #254]! 3496# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3497# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldrsb x1, [x27, #254]! 3498# CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1 3499# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldrsh w1, [x27], #254 3500# CHECK-NEXT: 5. 1 2.0 0.0 2.0 add x0, x27, #1 3501# CHECK-NEXT: 6. 1 1.0 0.0 0.0 ldrsh x1, [x27], #254 3502# CHECK-NEXT: 7. 1 2.0 0.0 2.0 add x0, x27, #1 3503# CHECK-NEXT: 8. 1 1.0 0.0 0.0 ldrsh w1, [x27, #254]! 3504# CHECK-NEXT: 9. 1 2.0 0.0 2.0 add x0, x27, #1 3505# CHECK-NEXT: 1 1.5 0.1 1.0 <total> 3506 3507# CHECK: [51] Code Region - G52 3508 3509# CHECK: Iterations: 100 3510# CHECK-NEXT: Instructions: 1000 3511# CHECK-NEXT: Total Cycles: 603 3512# CHECK-NEXT: Total uOps: 1600 3513 3514# CHECK: Dispatch Width: 3 3515# CHECK-NEXT: uOps Per Cycle: 2.65 3516# CHECK-NEXT: IPC: 1.66 3517# CHECK-NEXT: Block RThroughput: 5.3 3518 3519# CHECK: Timeline view: 3520# CHECK-NEXT: Index 012345678 3521 3522# CHECK: [0,0] DeeeeER . ldrsh x1, [x27, #254]! 3523# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 3524# CHECK-NEXT: [0,2] .DeeeeER. ldrsw x1, [x27], #254 3525# CHECK-NEXT: [0,3] .D=eE--R. add x0, x27, #1 3526# CHECK-NEXT: [0,4] . DeeeeER ldrsw x1, [x27, #254]! 3527# CHECK-NEXT: [0,5] . D=eE--R add x0, x27, #1 3528# CHECK-NEXT: [0,6] . DeE--R st1 { v1.1d }, [x27], #8 3529# CHECK-NEXT: [0,7] . D=eE-R add x0, x27, #1 3530# CHECK-NEXT: [0,8] . DeeER st1 { v1.2d }, [x27], #16 3531# CHECK-NEXT: [0,9] . DeER add x0, x27, #1 3532 3533# CHECK: Average Wait times (based on the timeline view): 3534# CHECK-NEXT: [0]: Executions 3535# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3536# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3537# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3538 3539# CHECK: [0] [1] [2] [3] 3540# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldrsh x1, [x27, #254]! 3541# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 3542# CHECK-NEXT: 2. 1 1.0 0.0 0.0 ldrsw x1, [x27], #254 3543# CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1 3544# CHECK-NEXT: 4. 1 1.0 0.0 0.0 ldrsw x1, [x27, #254]! 3545# CHECK-NEXT: 5. 1 2.0 0.0 2.0 add x0, x27, #1 3546# CHECK-NEXT: 6. 1 1.0 0.0 2.0 st1 { v1.1d }, [x27], #8 3547# CHECK-NEXT: 7. 1 2.0 0.0 1.0 add x0, x27, #1 3548# CHECK-NEXT: 8. 1 1.0 0.0 0.0 st1 { v1.2d }, [x27], #16 3549# CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1 3550# CHECK-NEXT: 1 1.4 0.1 0.9 <total> 3551 3552# CHECK: [52] Code Region - G53 3553 3554# CHECK: Iterations: 100 3555# CHECK-NEXT: Instructions: 1000 3556# CHECK-NEXT: Total Cycles: 703 3557# CHECK-NEXT: Total uOps: 1700 3558 3559# CHECK: Dispatch Width: 3 3560# CHECK-NEXT: uOps Per Cycle: 2.42 3561# CHECK-NEXT: IPC: 1.42 3562# CHECK-NEXT: Block RThroughput: 7.0 3563 3564# CHECK: Timeline view: 3565# CHECK-NEXT: Index 0123456789 3566 3567# CHECK: [0,0] DeER . . st1 { v1.2s }, [x27], #8 3568# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 3569# CHECK-NEXT: [0,2] .DeER. . st1 { v1.4h }, [x27], #8 3570# CHECK-NEXT: [0,3] .D=eER . add x0, x27, #1 3571# CHECK-NEXT: [0,4] . DeeER . st1 { v1.4s }, [x27], #16 3572# CHECK-NEXT: [0,5] . DeER . add x0, x27, #1 3573# CHECK-NEXT: [0,6] . D=eER . st1 { v1.8b }, [x27], #8 3574# CHECK-NEXT: [0,7] . D=eER. add x0, x27, #1 3575# CHECK-NEXT: [0,8] . DeeER st1 { v1.8h }, [x27], #16 3576# CHECK-NEXT: [0,9] . .DeER add x0, x27, #1 3577 3578# CHECK: Average Wait times (based on the timeline view): 3579# CHECK-NEXT: [0]: Executions 3580# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3581# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3582# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3583 3584# CHECK: [0] [1] [2] [3] 3585# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2s }, [x27], #8 3586# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 3587# CHECK-NEXT: 2. 1 1.0 0.0 0.0 st1 { v1.4h }, [x27], #8 3588# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 3589# CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.4s }, [x27], #16 3590# CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1 3591# CHECK-NEXT: 6. 1 2.0 1.0 0.0 st1 { v1.8b }, [x27], #8 3592# CHECK-NEXT: 7. 1 2.0 0.0 0.0 add x0, x27, #1 3593# CHECK-NEXT: 8. 1 1.0 0.0 0.0 st1 { v1.8h }, [x27], #16 3594# CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1 3595# CHECK-NEXT: 1 1.4 0.2 0.0 <total> 3596 3597# CHECK: [53] Code Region - G54 3598 3599# CHECK: Iterations: 100 3600# CHECK-NEXT: Instructions: 1000 3601# CHECK-NEXT: Total Cycles: 704 3602# CHECK-NEXT: Total uOps: 1700 3603 3604# CHECK: Dispatch Width: 3 3605# CHECK-NEXT: uOps Per Cycle: 2.41 3606# CHECK-NEXT: IPC: 1.42 3607# CHECK-NEXT: Block RThroughput: 7.0 3608 3609# CHECK: Timeline view: 3610# CHECK-NEXT: 0 3611# CHECK-NEXT: Index 0123456789 3612 3613# CHECK: [0,0] DeeER. . st1 { v1.16b }, [x27], #16 3614# CHECK-NEXT: [0,1] .DeER. . add x0, x27, #1 3615# CHECK-NEXT: [0,2] .D=eER . st1 { v1.1d }, [x27], x28 3616# CHECK-NEXT: [0,3] . D=eER . add x0, x27, #1 3617# CHECK-NEXT: [0,4] . DeeER . st1 { v1.2d }, [x27], x28 3618# CHECK-NEXT: [0,5] . DeER . add x0, x27, #1 3619# CHECK-NEXT: [0,6] . D=eER . st1 { v1.2s }, [x27], x28 3620# CHECK-NEXT: [0,7] . D=eER. add x0, x27, #1 3621# CHECK-NEXT: [0,8] . D=eER. st1 { v1.4h }, [x27], x28 3622# CHECK-NEXT: [0,9] . .D=eER add x0, x27, #1 3623 3624# CHECK: Average Wait times (based on the timeline view): 3625# CHECK-NEXT: [0]: Executions 3626# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3627# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3628# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3629 3630# CHECK: [0] [1] [2] [3] 3631# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.16b }, [x27], #16 3632# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 3633# CHECK-NEXT: 2. 1 2.0 1.0 0.0 st1 { v1.1d }, [x27], x28 3634# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 3635# CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.2d }, [x27], x28 3636# CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1 3637# CHECK-NEXT: 6. 1 2.0 1.0 0.0 st1 { v1.2s }, [x27], x28 3638# CHECK-NEXT: 7. 1 2.0 0.0 0.0 add x0, x27, #1 3639# CHECK-NEXT: 8. 1 2.0 0.0 0.0 st1 { v1.4h }, [x27], x28 3640# CHECK-NEXT: 9. 1 2.0 0.0 0.0 add x0, x27, #1 3641# CHECK-NEXT: 1 1.6 0.3 0.0 <total> 3642 3643# CHECK: [54] Code Region - G55 3644 3645# CHECK: Iterations: 100 3646# CHECK-NEXT: Instructions: 1000 3647# CHECK-NEXT: Total Cycles: 903 3648# CHECK-NEXT: Total uOps: 1900 3649 3650# CHECK: Dispatch Width: 3 3651# CHECK-NEXT: uOps Per Cycle: 2.10 3652# CHECK-NEXT: IPC: 1.11 3653# CHECK-NEXT: Block RThroughput: 9.0 3654 3655# CHECK: Timeline view: 3656# CHECK-NEXT: 01 3657# CHECK-NEXT: Index 0123456789 3658 3659# CHECK: [0,0] DeeER. .. st1 { v1.4s }, [x27], x28 3660# CHECK-NEXT: [0,1] .DeER. .. add x0, x27, #1 3661# CHECK-NEXT: [0,2] .D=eER .. st1 { v1.8b }, [x27], x28 3662# CHECK-NEXT: [0,3] . D=eER .. add x0, x27, #1 3663# CHECK-NEXT: [0,4] . DeeER .. st1 { v1.8h }, [x27], x28 3664# CHECK-NEXT: [0,5] . DeER .. add x0, x27, #1 3665# CHECK-NEXT: [0,6] . DeeER.. st1 { v1.16b }, [x27], x28 3666# CHECK-NEXT: [0,7] . .DeER.. add x0, x27, #1 3667# CHECK-NEXT: [0,8] . . DeeER st1 { v1.1d, v2.1d }, [x27], #16 3668# CHECK-NEXT: [0,9] . . DeER add x0, x27, #1 3669 3670# CHECK: Average Wait times (based on the timeline view): 3671# CHECK-NEXT: [0]: Executions 3672# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3673# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3674# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3675 3676# CHECK: [0] [1] [2] [3] 3677# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4s }, [x27], x28 3678# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 3679# CHECK-NEXT: 2. 1 2.0 1.0 0.0 st1 { v1.8b }, [x27], x28 3680# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 3681# CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.8h }, [x27], x28 3682# CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1 3683# CHECK-NEXT: 6. 1 1.0 1.0 0.0 st1 { v1.16b }, [x27], x28 3684# CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1 3685# CHECK-NEXT: 8. 1 1.0 1.0 0.0 st1 { v1.1d, v2.1d }, [x27], #16 3686# CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1 3687# CHECK-NEXT: 1 1.2 0.4 0.0 <total> 3688 3689# CHECK: [55] Code Region - G56 3690 3691# CHECK: Iterations: 100 3692# CHECK-NEXT: Instructions: 1000 3693# CHECK-NEXT: Total Cycles: 1403 3694# CHECK-NEXT: Total uOps: 2400 3695 3696# CHECK: Dispatch Width: 3 3697# CHECK-NEXT: uOps Per Cycle: 1.71 3698# CHECK-NEXT: IPC: 0.71 3699# CHECK-NEXT: Block RThroughput: 14.0 3700 3701# CHECK: Timeline view: 3702# CHECK-NEXT: 0123456 3703# CHECK-NEXT: Index 0123456789 3704 3705# CHECK: [0,0] DeeeeER . .. st1 { v1.2d, v2.2d }, [x27], #32 3706# CHECK-NEXT: [0,1] .DeE--R . .. add x0, x27, #1 3707# CHECK-NEXT: [0,2] . D==eeER . .. st1 { v1.2s, v2.2s }, [x27], #16 3708# CHECK-NEXT: [0,3] . D==eER . .. add x0, x27, #1 3709# CHECK-NEXT: [0,4] . D==eeER .. st1 { v1.4h, v2.4h }, [x27], #16 3710# CHECK-NEXT: [0,5] . D==eER .. add x0, x27, #1 3711# CHECK-NEXT: [0,6] . .D==eeeeER.. st1 { v1.4s, v2.4s }, [x27], #32 3712# CHECK-NEXT: [0,7] . . D==eE--R.. add x0, x27, #1 3713# CHECK-NEXT: [0,8] . . D====eeER st1 { v1.8b, v2.8b }, [x27], #16 3714# CHECK-NEXT: [0,9] . . D====eER add x0, x27, #1 3715 3716# CHECK: Average Wait times (based on the timeline view): 3717# CHECK-NEXT: [0]: Executions 3718# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3719# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3720# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3721 3722# CHECK: [0] [1] [2] [3] 3723# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2d, v2.2d }, [x27], #32 3724# CHECK-NEXT: 1. 1 1.0 0.0 2.0 add x0, x27, #1 3725# CHECK-NEXT: 2. 1 3.0 3.0 0.0 st1 { v1.2s, v2.2s }, [x27], #16 3726# CHECK-NEXT: 3. 1 3.0 0.0 0.0 add x0, x27, #1 3727# CHECK-NEXT: 4. 1 3.0 1.0 0.0 st1 { v1.4h, v2.4h }, [x27], #16 3728# CHECK-NEXT: 5. 1 3.0 0.0 0.0 add x0, x27, #1 3729# CHECK-NEXT: 6. 1 3.0 1.0 0.0 st1 { v1.4s, v2.4s }, [x27], #32 3730# CHECK-NEXT: 7. 1 3.0 0.0 2.0 add x0, x27, #1 3731# CHECK-NEXT: 8. 1 5.0 3.0 0.0 st1 { v1.8b, v2.8b }, [x27], #16 3732# CHECK-NEXT: 9. 1 5.0 0.0 0.0 add x0, x27, #1 3733# CHECK-NEXT: 1 3.0 0.9 0.4 <total> 3734 3735# CHECK: [56] Code Region - G57 3736 3737# CHECK: Iterations: 100 3738# CHECK-NEXT: Instructions: 1000 3739# CHECK-NEXT: Total Cycles: 1603 3740# CHECK-NEXT: Total uOps: 2600 3741 3742# CHECK: Dispatch Width: 3 3743# CHECK-NEXT: uOps Per Cycle: 1.62 3744# CHECK-NEXT: IPC: 0.62 3745# CHECK-NEXT: Block RThroughput: 16.0 3746 3747# CHECK: Timeline view: 3748# CHECK-NEXT: 012345678 3749# CHECK-NEXT: Index 0123456789 3750 3751# CHECK: [0,0] DeeeeER . . . st1 { v1.8h, v2.8h }, [x27], #32 3752# CHECK-NEXT: [0,1] .DeE--R . . . add x0, x27, #1 3753# CHECK-NEXT: [0,2] . D==eeeeER . . st1 { v1.16b, v2.16b }, [x27], #32 3754# CHECK-NEXT: [0,3] . D==eE--R . . add x0, x27, #1 3755# CHECK-NEXT: [0,4] . D====eeER . . st1 { v1.1d, v2.1d }, [x27], x28 3756# CHECK-NEXT: [0,5] . D====eER . . add x0, x27, #1 3757# CHECK-NEXT: [0,6] . .D====eeeeER . st1 { v1.2d, v2.2d }, [x27], x28 3758# CHECK-NEXT: [0,7] . . D====eE--R . add x0, x27, #1 3759# CHECK-NEXT: [0,8] . . D======eeER st1 { v1.2s, v2.2s }, [x27], x28 3760# CHECK-NEXT: [0,9] . . D======eER add x0, x27, #1 3761 3762# CHECK: Average Wait times (based on the timeline view): 3763# CHECK-NEXT: [0]: Executions 3764# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3765# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3766# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3767 3768# CHECK: [0] [1] [2] [3] 3769# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8h, v2.8h }, [x27], #32 3770# CHECK-NEXT: 1. 1 1.0 0.0 2.0 add x0, x27, #1 3771# CHECK-NEXT: 2. 1 3.0 3.0 0.0 st1 { v1.16b, v2.16b }, [x27], #32 3772# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 3773# CHECK-NEXT: 4. 1 5.0 3.0 0.0 st1 { v1.1d, v2.1d }, [x27], x28 3774# CHECK-NEXT: 5. 1 5.0 0.0 0.0 add x0, x27, #1 3775# CHECK-NEXT: 6. 1 5.0 1.0 0.0 st1 { v1.2d, v2.2d }, [x27], x28 3776# CHECK-NEXT: 7. 1 5.0 0.0 2.0 add x0, x27, #1 3777# CHECK-NEXT: 8. 1 7.0 3.0 0.0 st1 { v1.2s, v2.2s }, [x27], x28 3778# CHECK-NEXT: 9. 1 7.0 0.0 0.0 add x0, x27, #1 3779# CHECK-NEXT: 1 4.2 1.1 0.6 <total> 3780 3781# CHECK: [57] Code Region - G58 3782 3783# CHECK: Iterations: 100 3784# CHECK-NEXT: Instructions: 1000 3785# CHECK-NEXT: Total Cycles: 1603 3786# CHECK-NEXT: Total uOps: 2600 3787 3788# CHECK: Dispatch Width: 3 3789# CHECK-NEXT: uOps Per Cycle: 1.62 3790# CHECK-NEXT: IPC: 0.62 3791# CHECK-NEXT: Block RThroughput: 16.0 3792 3793# CHECK: Timeline view: 3794# CHECK-NEXT: 012345678 3795# CHECK-NEXT: Index 0123456789 3796 3797# CHECK: [0,0] DeeER. . . . st1 { v1.4h, v2.4h }, [x27], x28 3798# CHECK-NEXT: [0,1] .DeER. . . . add x0, x27, #1 3799# CHECK-NEXT: [0,2] . DeeeeER . . . st1 { v1.4s, v2.4s }, [x27], x28 3800# CHECK-NEXT: [0,3] . DeE--R . . . add x0, x27, #1 3801# CHECK-NEXT: [0,4] . D==eeER . . st1 { v1.8b, v2.8b }, [x27], x28 3802# CHECK-NEXT: [0,5] . D==eER . . add x0, x27, #1 3803# CHECK-NEXT: [0,6] . .D==eeeeER. . st1 { v1.8h, v2.8h }, [x27], x28 3804# CHECK-NEXT: [0,7] . . D==eE--R. . add x0, x27, #1 3805# CHECK-NEXT: [0,8] . . D====eeeeER st1 { v1.16b, v2.16b }, [x27], x28 3806# CHECK-NEXT: [0,9] . . D====eE--R add x0, x27, #1 3807 3808# CHECK: Average Wait times (based on the timeline view): 3809# CHECK-NEXT: [0]: Executions 3810# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3811# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3812# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3813 3814# CHECK: [0] [1] [2] [3] 3815# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4h, v2.4h }, [x27], x28 3816# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 3817# CHECK-NEXT: 2. 1 1.0 1.0 0.0 st1 { v1.4s, v2.4s }, [x27], x28 3818# CHECK-NEXT: 3. 1 1.0 0.0 2.0 add x0, x27, #1 3819# CHECK-NEXT: 4. 1 3.0 3.0 0.0 st1 { v1.8b, v2.8b }, [x27], x28 3820# CHECK-NEXT: 5. 1 3.0 0.0 0.0 add x0, x27, #1 3821# CHECK-NEXT: 6. 1 3.0 1.0 0.0 st1 { v1.8h, v2.8h }, [x27], x28 3822# CHECK-NEXT: 7. 1 3.0 0.0 2.0 add x0, x27, #1 3823# CHECK-NEXT: 8. 1 5.0 3.0 0.0 st1 { v1.16b, v2.16b }, [x27], x28 3824# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 3825# CHECK-NEXT: 1 2.6 0.9 0.6 <total> 3826 3827# CHECK: [58] Code Region - G59 3828 3829# CHECK: Iterations: 100 3830# CHECK-NEXT: Instructions: 1000 3831# CHECK-NEXT: Total Cycles: 2103 3832# CHECK-NEXT: Total uOps: 3100 3833 3834# CHECK: Dispatch Width: 3 3835# CHECK-NEXT: uOps Per Cycle: 1.47 3836# CHECK-NEXT: IPC: 0.48 3837# CHECK-NEXT: Block RThroughput: 21.0 3838 3839# CHECK: Timeline view: 3840# CHECK-NEXT: 0123456789 3841# CHECK-NEXT: Index 0123456789 0123 3842 3843# CHECK: [0,0] DeeeER . . . . st1 { v1.1d, v2.1d, v3.1d }, [x27], #24 3844# CHECK-NEXT: [0,1] .DeE-R . . . . add x0, x27, #1 3845# CHECK-NEXT: [0,2] . D=eeeeeeER . . . st1 { v1.2d, v2.2d, v3.2d }, [x27], #48 3846# CHECK-NEXT: [0,3] . DeE----R . . . add x0, x27, #1 3847# CHECK-NEXT: [0,4] . D====eeeER. . . st1 { v1.2s, v2.2s, v3.2s }, [x27], #24 3848# CHECK-NEXT: [0,5] . .D====eE-R. . . add x0, x27, #1 3849# CHECK-NEXT: [0,6] . . D=====eeeER . . st1 { v1.4h, v2.4h, v3.4h }, [x27], #24 3850# CHECK-NEXT: [0,7] . . D=====eE-R . . add x0, x27, #1 3851# CHECK-NEXT: [0,8] . . D======eeeeeeER st1 { v1.4s, v2.4s, v3.4s }, [x27], #48 3852# CHECK-NEXT: [0,9] . . .D=====eE----R add x0, x27, #1 3853 3854# CHECK: Average Wait times (based on the timeline view): 3855# CHECK-NEXT: [0]: Executions 3856# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3857# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3858# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3859 3860# CHECK: [0] [1] [2] [3] 3861# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.1d, v2.1d, v3.1d }, [x27], #24 3862# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 3863# CHECK-NEXT: 2. 1 2.0 2.0 0.0 st1 { v1.2d, v2.2d, v3.2d }, [x27], #48 3864# CHECK-NEXT: 3. 1 1.0 0.0 4.0 add x0, x27, #1 3865# CHECK-NEXT: 4. 1 5.0 5.0 0.0 st1 { v1.2s, v2.2s, v3.2s }, [x27], #24 3866# CHECK-NEXT: 5. 1 5.0 0.0 1.0 add x0, x27, #1 3867# CHECK-NEXT: 6. 1 6.0 2.0 0.0 st1 { v1.4h, v2.4h, v3.4h }, [x27], #24 3868# CHECK-NEXT: 7. 1 6.0 0.0 1.0 add x0, x27, #1 3869# CHECK-NEXT: 8. 1 7.0 2.0 0.0 st1 { v1.4s, v2.4s, v3.4s }, [x27], #48 3870# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 3871# CHECK-NEXT: 1 4.0 1.2 1.1 <total> 3872 3873# CHECK: [59] Code Region - G60 3874 3875# CHECK: Iterations: 100 3876# CHECK-NEXT: Instructions: 1000 3877# CHECK-NEXT: Total Cycles: 2403 3878# CHECK-NEXT: Total uOps: 3400 3879 3880# CHECK: Dispatch Width: 3 3881# CHECK-NEXT: uOps Per Cycle: 1.41 3882# CHECK-NEXT: IPC: 0.42 3883# CHECK-NEXT: Block RThroughput: 24.0 3884 3885# CHECK: Timeline view: 3886# CHECK-NEXT: 0123456789 3887# CHECK-NEXT: Index 0123456789 0123456 3888 3889# CHECK: [0,0] DeeeER . . . .. st1 { v1.8b, v2.8b, v3.8b }, [x27], #24 3890# CHECK-NEXT: [0,1] .DeE-R . . . .. add x0, x27, #1 3891# CHECK-NEXT: [0,2] . D=eeeeeeER . . .. st1 { v1.8h, v2.8h, v3.8h }, [x27], #48 3892# CHECK-NEXT: [0,3] . DeE----R . . .. add x0, x27, #1 3893# CHECK-NEXT: [0,4] . D====eeeeeeER . .. st1 { v1.16b, v2.16b, v3.16b }, [x27], #48 3894# CHECK-NEXT: [0,5] . . D===eE----R . .. add x0, x27, #1 3895# CHECK-NEXT: [0,6] . . D=======eeeER .. st1 { v1.1d, v2.1d, v3.1d }, [x27], x28 3896# CHECK-NEXT: [0,7] . . D=======eE-R .. add x0, x27, #1 3897# CHECK-NEXT: [0,8] . . D========eeeeeeER st1 { v1.2d, v2.2d, v3.2d }, [x27], x28 3898# CHECK-NEXT: [0,9] . . . D=======eE----R add x0, x27, #1 3899 3900# CHECK: Average Wait times (based on the timeline view): 3901# CHECK-NEXT: [0]: Executions 3902# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3903# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3904# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3905 3906# CHECK: [0] [1] [2] [3] 3907# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8b, v2.8b, v3.8b }, [x27], #24 3908# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 3909# CHECK-NEXT: 2. 1 2.0 2.0 0.0 st1 { v1.8h, v2.8h, v3.8h }, [x27], #48 3910# CHECK-NEXT: 3. 1 1.0 0.0 4.0 add x0, x27, #1 3911# CHECK-NEXT: 4. 1 5.0 5.0 0.0 st1 { v1.16b, v2.16b, v3.16b }, [x27], #48 3912# CHECK-NEXT: 5. 1 4.0 0.0 4.0 add x0, x27, #1 3913# CHECK-NEXT: 6. 1 8.0 5.0 0.0 st1 { v1.1d, v2.1d, v3.1d }, [x27], x28 3914# CHECK-NEXT: 7. 1 8.0 0.0 1.0 add x0, x27, #1 3915# CHECK-NEXT: 8. 1 9.0 2.0 0.0 st1 { v1.2d, v2.2d, v3.2d }, [x27], x28 3916# CHECK-NEXT: 9. 1 8.0 0.0 4.0 add x0, x27, #1 3917# CHECK-NEXT: 1 4.7 1.5 1.4 <total> 3918 3919# CHECK: [60] Code Region - G61 3920 3921# CHECK: Iterations: 100 3922# CHECK-NEXT: Instructions: 1000 3923# CHECK-NEXT: Total Cycles: 2103 3924# CHECK-NEXT: Total uOps: 3100 3925 3926# CHECK: Dispatch Width: 3 3927# CHECK-NEXT: uOps Per Cycle: 1.47 3928# CHECK-NEXT: IPC: 0.48 3929# CHECK-NEXT: Block RThroughput: 21.0 3930 3931# CHECK: Timeline view: 3932# CHECK-NEXT: 0123456789 3933# CHECK-NEXT: Index 0123456789 0123 3934 3935# CHECK: [0,0] DeeeER . . . . st1 { v1.2s, v2.2s, v3.2s }, [x27], x28 3936# CHECK-NEXT: [0,1] .DeE-R . . . . add x0, x27, #1 3937# CHECK-NEXT: [0,2] . D=eeeER . . . . st1 { v1.4h, v2.4h, v3.4h }, [x27], x28 3938# CHECK-NEXT: [0,3] . D=eE-R . . . . add x0, x27, #1 3939# CHECK-NEXT: [0,4] . D==eeeeeeER. . . st1 { v1.4s, v2.4s, v3.4s }, [x27], x28 3940# CHECK-NEXT: [0,5] . .D=eE----R. . . add x0, x27, #1 3941# CHECK-NEXT: [0,6] . . D=====eeeER . . st1 { v1.8b, v2.8b, v3.8b }, [x27], x28 3942# CHECK-NEXT: [0,7] . . D=====eE-R . . add x0, x27, #1 3943# CHECK-NEXT: [0,8] . . D======eeeeeeER st1 { v1.8h, v2.8h, v3.8h }, [x27], x28 3944# CHECK-NEXT: [0,9] . . .D=====eE----R add x0, x27, #1 3945 3946# CHECK: Average Wait times (based on the timeline view): 3947# CHECK-NEXT: [0]: Executions 3948# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3949# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3950# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3951 3952# CHECK: [0] [1] [2] [3] 3953# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2s, v2.2s, v3.2s }, [x27], x28 3954# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 3955# CHECK-NEXT: 2. 1 2.0 2.0 0.0 st1 { v1.4h, v2.4h, v3.4h }, [x27], x28 3956# CHECK-NEXT: 3. 1 2.0 0.0 1.0 add x0, x27, #1 3957# CHECK-NEXT: 4. 1 3.0 2.0 0.0 st1 { v1.4s, v2.4s, v3.4s }, [x27], x28 3958# CHECK-NEXT: 5. 1 2.0 0.0 4.0 add x0, x27, #1 3959# CHECK-NEXT: 6. 1 6.0 5.0 0.0 st1 { v1.8b, v2.8b, v3.8b }, [x27], x28 3960# CHECK-NEXT: 7. 1 6.0 0.0 1.0 add x0, x27, #1 3961# CHECK-NEXT: 8. 1 7.0 2.0 0.0 st1 { v1.8h, v2.8h, v3.8h }, [x27], x28 3962# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 3963# CHECK-NEXT: 1 3.6 1.2 1.1 <total> 3964 3965# CHECK: [61] Code Region - G62 3966 3967# CHECK: Iterations: 100 3968# CHECK-NEXT: Instructions: 1000 3969# CHECK-NEXT: Total Cycles: 2603 3970# CHECK-NEXT: Total uOps: 3600 3971 3972# CHECK: Dispatch Width: 3 3973# CHECK-NEXT: uOps Per Cycle: 1.38 3974# CHECK-NEXT: IPC: 0.38 3975# CHECK-NEXT: Block RThroughput: 26.0 3976 3977# CHECK: Timeline view: 3978# CHECK-NEXT: 0123456789 3979# CHECK-NEXT: Index 0123456789 012345678 3980 3981# CHECK: [0,0] DeeeeeeER . . . . . st1 { v1.16b, v2.16b, v3.16b }, [x27], x28 3982# CHECK-NEXT: [0,1] . DeE---R . . . . . add x0, x27, #1 3983# CHECK-NEXT: [0,2] . D===eeeeER . . . . st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 3984# CHECK-NEXT: [0,3] . D===eE--R . . . . add x0, x27, #1 3985# CHECK-NEXT: [0,4] . D=====eeeeeeeeER . . st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 3986# CHECK-NEXT: [0,5] . . D===eE------R . . add x0, x27, #1 3987# CHECK-NEXT: [0,6] . . D=========eeeeER. . st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 3988# CHECK-NEXT: [0,7] . . D=========eE--R. . add x0, x27, #1 3989# CHECK-NEXT: [0,8] . . .D===========eeeeER st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 3990# CHECK-NEXT: [0,9] . . . D===========eE--R add x0, x27, #1 3991 3992# CHECK: Average Wait times (based on the timeline view): 3993# CHECK-NEXT: [0]: Executions 3994# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 3995# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 3996# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 3997 3998# CHECK: [0] [1] [2] [3] 3999# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.16b, v2.16b, v3.16b }, [x27], x28 4000# CHECK-NEXT: 1. 1 1.0 1.0 3.0 add x0, x27, #1 4001# CHECK-NEXT: 2. 1 4.0 4.0 0.0 st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], #32 4002# CHECK-NEXT: 3. 1 4.0 0.0 2.0 add x0, x27, #1 4003# CHECK-NEXT: 4. 1 6.0 3.0 0.0 st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 4004# CHECK-NEXT: 5. 1 4.0 0.0 6.0 add x0, x27, #1 4005# CHECK-NEXT: 6. 1 10.0 7.0 0.0 st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 4006# CHECK-NEXT: 7. 1 10.0 0.0 2.0 add x0, x27, #1 4007# CHECK-NEXT: 8. 1 12.0 3.0 0.0 st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 4008# CHECK-NEXT: 9. 1 12.0 0.0 2.0 add x0, x27, #1 4009# CHECK-NEXT: 1 6.4 1.9 1.5 <total> 4010 4011# CHECK: [62] Code Region - G63 4012 4013# CHECK: Iterations: 100 4014# CHECK-NEXT: Instructions: 1000 4015# CHECK-NEXT: Total Cycles: 3203 4016# CHECK-NEXT: Total uOps: 4200 4017 4018# CHECK: Dispatch Width: 3 4019# CHECK-NEXT: uOps Per Cycle: 1.31 4020# CHECK-NEXT: IPC: 0.31 4021# CHECK-NEXT: Block RThroughput: 32.0 4022 4023# CHECK: Timeline view: 4024# CHECK-NEXT: 0123456789 01234 4025# CHECK-NEXT: Index 0123456789 0123456789 4026 4027# CHECK: [0,0] DeeeeeeeeER . . . . . st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 4028# CHECK-NEXT: [0,1] . DeE----R . . . . . add x0, x27, #1 4029# CHECK-NEXT: [0,2] . D====eeeeER. . . . . st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 4030# CHECK-NEXT: [0,3] . D====eE--R. . . . . add x0, x27, #1 4031# CHECK-NEXT: [0,4] . .D======eeeeeeeeER . . . st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 4032# CHECK-NEXT: [0,5] . . D====eE------R . . . add x0, x27, #1 4033# CHECK-NEXT: [0,6] . . D==========eeeeeeeeER . st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 4034# CHECK-NEXT: [0,7] . . . D========eE------R . add x0, x27, #1 4035# CHECK-NEXT: [0,8] . . . D==============eeeeER st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 4036# CHECK-NEXT: [0,9] . . . D==============eE--R add x0, x27, #1 4037 4038# CHECK: Average Wait times (based on the timeline view): 4039# CHECK-NEXT: [0]: Executions 4040# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4041# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4042# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4043 4044# CHECK: [0] [1] [2] [3] 4045# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 4046# CHECK-NEXT: 1. 1 1.0 1.0 4.0 add x0, x27, #1 4047# CHECK-NEXT: 2. 1 5.0 5.0 0.0 st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 4048# CHECK-NEXT: 3. 1 5.0 0.0 2.0 add x0, x27, #1 4049# CHECK-NEXT: 4. 1 7.0 3.0 0.0 st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 4050# CHECK-NEXT: 5. 1 5.0 0.0 6.0 add x0, x27, #1 4051# CHECK-NEXT: 6. 1 11.0 7.0 0.0 st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 4052# CHECK-NEXT: 7. 1 9.0 0.0 6.0 add x0, x27, #1 4053# CHECK-NEXT: 8. 1 15.0 7.0 0.0 st1 { v1.1d, v2.1d, v3.1d, v4.1d }, [x27], x28 4054# CHECK-NEXT: 9. 1 15.0 0.0 2.0 add x0, x27, #1 4055# CHECK-NEXT: 1 7.4 2.4 2.0 <total> 4056 4057# CHECK: [63] Code Region - G64 4058 4059# CHECK: Iterations: 100 4060# CHECK-NEXT: Instructions: 1000 4061# CHECK-NEXT: Total Cycles: 2803 4062# CHECK-NEXT: Total uOps: 3800 4063 4064# CHECK: Dispatch Width: 3 4065# CHECK-NEXT: uOps Per Cycle: 1.36 4066# CHECK-NEXT: IPC: 0.36 4067# CHECK-NEXT: Block RThroughput: 28.0 4068 4069# CHECK: Timeline view: 4070# CHECK-NEXT: 0123456789 0 4071# CHECK-NEXT: Index 0123456789 0123456789 4072 4073# CHECK: [0,0] DeeeeeeeeER . . . . st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 4074# CHECK-NEXT: [0,1] . DeE----R . . . . add x0, x27, #1 4075# CHECK-NEXT: [0,2] . D====eeeeER. . . . st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 4076# CHECK-NEXT: [0,3] . D====eE--R. . . . add x0, x27, #1 4077# CHECK-NEXT: [0,4] . .D======eeeeER . . . st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 4078# CHECK-NEXT: [0,5] . . D======eE--R . . . add x0, x27, #1 4079# CHECK-NEXT: [0,6] . . D========eeeeeeeeER . st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 4080# CHECK-NEXT: [0,7] . . .D======eE------R . add x0, x27, #1 4081# CHECK-NEXT: [0,8] . . . D============eeeeER st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 4082# CHECK-NEXT: [0,9] . . . D============eE--R add x0, x27, #1 4083 4084# CHECK: Average Wait times (based on the timeline view): 4085# CHECK-NEXT: [0]: Executions 4086# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4087# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4088# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4089 4090# CHECK: [0] [1] [2] [3] 4091# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 4092# CHECK-NEXT: 1. 1 1.0 1.0 4.0 add x0, x27, #1 4093# CHECK-NEXT: 2. 1 5.0 5.0 0.0 st1 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 4094# CHECK-NEXT: 3. 1 5.0 0.0 2.0 add x0, x27, #1 4095# CHECK-NEXT: 4. 1 7.0 3.0 0.0 st1 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 4096# CHECK-NEXT: 5. 1 7.0 0.0 2.0 add x0, x27, #1 4097# CHECK-NEXT: 6. 1 9.0 3.0 0.0 st1 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 4098# CHECK-NEXT: 7. 1 7.0 0.0 6.0 add x0, x27, #1 4099# CHECK-NEXT: 8. 1 13.0 7.0 0.0 st1 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 4100# CHECK-NEXT: 9. 1 13.0 0.0 2.0 add x0, x27, #1 4101# CHECK-NEXT: 1 6.8 2.0 1.6 <total> 4102 4103# CHECK: [64] Code Region - G65 4104 4105# CHECK: Iterations: 100 4106# CHECK-NEXT: Instructions: 1000 4107# CHECK-NEXT: Total Cycles: 1904 4108# CHECK-NEXT: Total uOps: 2900 4109 4110# CHECK: Dispatch Width: 3 4111# CHECK-NEXT: uOps Per Cycle: 1.52 4112# CHECK-NEXT: IPC: 0.53 4113# CHECK-NEXT: Block RThroughput: 19.0 4114 4115# CHECK: Timeline view: 4116# CHECK-NEXT: 0123456789 4117# CHECK-NEXT: Index 0123456789 012 4118 4119# CHECK: [0,0] DeeeeeeeeER . . . st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 4120# CHECK-NEXT: [0,1] . DeE----R . . . add x0, x27, #1 4121# CHECK-NEXT: [0,2] . D====eeeeeeeeER . . st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 4122# CHECK-NEXT: [0,3] . . D==eE------R . . add x0, x27, #1 4123# CHECK-NEXT: [0,4] . . D=========eER. . st1 { v1.b }[0], [x27], #1 4124# CHECK-NEXT: [0,5] . . D=========eER . add x0, x27, #1 4125# CHECK-NEXT: [0,6] . . D=========eER . st1 { v1.b }[8], [x27], #1 4126# CHECK-NEXT: [0,7] . . D=========eER. add x0, x27, #1 4127# CHECK-NEXT: [0,8] . . D=========eER. st1 { v1.b }[0], [x27], x28 4128# CHECK-NEXT: [0,9] . . D=========eER add x0, x27, #1 4129 4130# CHECK: Average Wait times (based on the timeline view): 4131# CHECK-NEXT: [0]: Executions 4132# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4133# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4134# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4135 4136# CHECK: [0] [1] [2] [3] 4137# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 4138# CHECK-NEXT: 1. 1 1.0 1.0 4.0 add x0, x27, #1 4139# CHECK-NEXT: 2. 1 5.0 5.0 0.0 st1 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 4140# CHECK-NEXT: 3. 1 3.0 0.0 6.0 add x0, x27, #1 4141# CHECK-NEXT: 4. 1 10.0 7.0 0.0 st1 { v1.b }[0], [x27], #1 4142# CHECK-NEXT: 5. 1 10.0 0.0 0.0 add x0, x27, #1 4143# CHECK-NEXT: 6. 1 10.0 0.0 0.0 st1 { v1.b }[8], [x27], #1 4144# CHECK-NEXT: 7. 1 10.0 0.0 0.0 add x0, x27, #1 4145# CHECK-NEXT: 8. 1 10.0 0.0 0.0 st1 { v1.b }[0], [x27], x28 4146# CHECK-NEXT: 9. 1 10.0 0.0 0.0 add x0, x27, #1 4147# CHECK-NEXT: 1 7.0 1.4 1.0 <total> 4148 4149# CHECK: [65] Code Region - G66 4150 4151# CHECK: Iterations: 100 4152# CHECK-NEXT: Instructions: 1000 4153# CHECK-NEXT: Total Cycles: 504 4154# CHECK-NEXT: Total uOps: 1500 4155 4156# CHECK: Dispatch Width: 3 4157# CHECK-NEXT: uOps Per Cycle: 2.98 4158# CHECK-NEXT: IPC: 1.98 4159# CHECK-NEXT: Block RThroughput: 5.0 4160 4161# CHECK: Timeline view: 4162# CHECK-NEXT: Index 012345678 4163 4164# CHECK: [0,0] DeER . . st1 { v1.b }[8], [x27], x28 4165# CHECK-NEXT: [0,1] D=eER. . add x0, x27, #1 4166# CHECK-NEXT: [0,2] .DeER. . st1 { v1.h }[0], [x27], #2 4167# CHECK-NEXT: [0,3] .D=eER . add x0, x27, #1 4168# CHECK-NEXT: [0,4] . DeER . st1 { v1.h }[4], [x27], #2 4169# CHECK-NEXT: [0,5] . D=eER . add x0, x27, #1 4170# CHECK-NEXT: [0,6] . DeER . st1 { v1.h }[0], [x27], x28 4171# CHECK-NEXT: [0,7] . D=eER. add x0, x27, #1 4172# CHECK-NEXT: [0,8] . DeER. st1 { v1.h }[4], [x27], x28 4173# CHECK-NEXT: [0,9] . D=eER add x0, x27, #1 4174 4175# CHECK: Average Wait times (based on the timeline view): 4176# CHECK-NEXT: [0]: Executions 4177# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4178# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4179# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4180 4181# CHECK: [0] [1] [2] [3] 4182# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.b }[8], [x27], x28 4183# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 4184# CHECK-NEXT: 2. 1 1.0 0.0 0.0 st1 { v1.h }[0], [x27], #2 4185# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 4186# CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.h }[4], [x27], #2 4187# CHECK-NEXT: 5. 1 2.0 0.0 0.0 add x0, x27, #1 4188# CHECK-NEXT: 6. 1 1.0 0.0 0.0 st1 { v1.h }[0], [x27], x28 4189# CHECK-NEXT: 7. 1 2.0 0.0 0.0 add x0, x27, #1 4190# CHECK-NEXT: 8. 1 1.0 0.0 0.0 st1 { v1.h }[4], [x27], x28 4191# CHECK-NEXT: 9. 1 2.0 0.0 0.0 add x0, x27, #1 4192# CHECK-NEXT: 1 1.5 0.1 0.0 <total> 4193 4194# CHECK: [66] Code Region - G67 4195 4196# CHECK: Iterations: 100 4197# CHECK-NEXT: Instructions: 1000 4198# CHECK-NEXT: Total Cycles: 805 4199# CHECK-NEXT: Total uOps: 2000 4200 4201# CHECK: Dispatch Width: 3 4202# CHECK-NEXT: uOps Per Cycle: 2.48 4203# CHECK-NEXT: IPC: 1.24 4204# CHECK-NEXT: Block RThroughput: 8.0 4205 4206# CHECK: Timeline view: 4207# CHECK-NEXT: 012 4208# CHECK-NEXT: Index 0123456789 4209 4210# CHECK: [0,0] DeER . . . st1 { v1.s }[0], [x27], #4 4211# CHECK-NEXT: [0,1] D=eER. . . add x0, x27, #1 4212# CHECK-NEXT: [0,2] .DeER. . . st1 { v1.s }[0], [x27], x28 4213# CHECK-NEXT: [0,3] .D=eER . . add x0, x27, #1 4214# CHECK-NEXT: [0,4] . DeeeER . . st1 { v1.d }[0], [x27], #8 4215# CHECK-NEXT: [0,5] . DeE-R . . add x0, x27, #1 4216# CHECK-NEXT: [0,6] . DeeeER. . st1 { v1.d }[0], [x27], x28 4217# CHECK-NEXT: [0,7] . DeE-R. . add x0, x27, #1 4218# CHECK-NEXT: [0,8] . .DeeeeER st2 { v1.2d, v2.2d }, [x27], #32 4219# CHECK-NEXT: [0,9] . . DeE--R add x0, x27, #1 4220 4221# CHECK: Average Wait times (based on the timeline view): 4222# CHECK-NEXT: [0]: Executions 4223# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4224# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4225# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4226 4227# CHECK: [0] [1] [2] [3] 4228# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st1 { v1.s }[0], [x27], #4 4229# CHECK-NEXT: 1. 1 2.0 0.0 0.0 add x0, x27, #1 4230# CHECK-NEXT: 2. 1 1.0 0.0 0.0 st1 { v1.s }[0], [x27], x28 4231# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 4232# CHECK-NEXT: 4. 1 1.0 0.0 0.0 st1 { v1.d }[0], [x27], #8 4233# CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1 4234# CHECK-NEXT: 6. 1 1.0 1.0 0.0 st1 { v1.d }[0], [x27], x28 4235# CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1 4236# CHECK-NEXT: 8. 1 1.0 1.0 0.0 st2 { v1.2d, v2.2d }, [x27], #32 4237# CHECK-NEXT: 9. 1 1.0 0.0 2.0 add x0, x27, #1 4238# CHECK-NEXT: 1 1.2 0.3 0.4 <total> 4239 4240# CHECK: [67] Code Region - G68 4241 4242# CHECK: Iterations: 100 4243# CHECK-NEXT: Instructions: 1000 4244# CHECK-NEXT: Total Cycles: 1403 4245# CHECK-NEXT: Total uOps: 3100 4246 4247# CHECK: Dispatch Width: 3 4248# CHECK-NEXT: uOps Per Cycle: 2.21 4249# CHECK-NEXT: IPC: 0.71 4250# CHECK-NEXT: Block RThroughput: 14.0 4251 4252# CHECK: Timeline view: 4253# CHECK-NEXT: 0123456 4254# CHECK-NEXT: Index 0123456789 4255 4256# CHECK: [0,0] DeeeER . .. st2 { v1.2s, v2.2s }, [x27], #16 4257# CHECK-NEXT: [0,1] .DeE-R . .. add x0, x27, #1 4258# CHECK-NEXT: [0,2] . DeeeER . .. st2 { v1.4h, v2.4h }, [x27], #16 4259# CHECK-NEXT: [0,3] . DeE-R . .. add x0, x27, #1 4260# CHECK-NEXT: [0,4] . DeeeeER .. st2 { v1.4s, v2.4s }, [x27], #32 4261# CHECK-NEXT: [0,5] . .DeE-R .. add x0, x27, #1 4262# CHECK-NEXT: [0,6] . . D=eeeER .. st2 { v1.8b, v2.8b }, [x27], #16 4263# CHECK-NEXT: [0,7] . . D=eE-R .. add x0, x27, #1 4264# CHECK-NEXT: [0,8] . . D=eeeeER st2 { v1.8h, v2.8h }, [x27], #32 4265# CHECK-NEXT: [0,9] . . .DeE--R add x0, x27, #1 4266 4267# CHECK: Average Wait times (based on the timeline view): 4268# CHECK-NEXT: [0]: Executions 4269# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4270# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4271# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4272 4273# CHECK: [0] [1] [2] [3] 4274# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.2s, v2.2s }, [x27], #16 4275# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 4276# CHECK-NEXT: 2. 1 1.0 1.0 0.0 st2 { v1.4h, v2.4h }, [x27], #16 4277# CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1 4278# CHECK-NEXT: 4. 1 1.0 1.0 0.0 st2 { v1.4s, v2.4s }, [x27], #32 4279# CHECK-NEXT: 5. 1 1.0 1.0 1.0 add x0, x27, #1 4280# CHECK-NEXT: 6. 1 2.0 2.0 0.0 st2 { v1.8b, v2.8b }, [x27], #16 4281# CHECK-NEXT: 7. 1 2.0 0.0 1.0 add x0, x27, #1 4282# CHECK-NEXT: 8. 1 2.0 1.0 0.0 st2 { v1.8h, v2.8h }, [x27], #32 4283# CHECK-NEXT: 9. 1 1.0 0.0 2.0 add x0, x27, #1 4284# CHECK-NEXT: 1 1.3 0.7 0.6 <total> 4285 4286# CHECK: [68] Code Region - G69 4287 4288# CHECK: Iterations: 100 4289# CHECK-NEXT: Instructions: 1000 4290# CHECK-NEXT: Total Cycles: 1603 4291# CHECK-NEXT: Total uOps: 3200 4292 4293# CHECK: Dispatch Width: 3 4294# CHECK-NEXT: uOps Per Cycle: 2.00 4295# CHECK-NEXT: IPC: 0.62 4296# CHECK-NEXT: Block RThroughput: 16.0 4297 4298# CHECK: Timeline view: 4299# CHECK-NEXT: 012345678 4300# CHECK-NEXT: Index 0123456789 4301 4302# CHECK: [0,0] DeeeeER . . . st2 { v1.16b, v2.16b }, [x27], #32 4303# CHECK-NEXT: [0,1] . DeE-R . . . add x0, x27, #1 4304# CHECK-NEXT: [0,2] . D=eeeeER . . st2 { v1.2d, v2.2d }, [x27], x28 4305# CHECK-NEXT: [0,3] . D=eE--R . . add x0, x27, #1 4306# CHECK-NEXT: [0,4] . D===eeeER . . st2 { v1.2s, v2.2s }, [x27], x28 4307# CHECK-NEXT: [0,5] . .D===eE-R . . add x0, x27, #1 4308# CHECK-NEXT: [0,6] . . D===eeeER . st2 { v1.4h, v2.4h }, [x27], x28 4309# CHECK-NEXT: [0,7] . . D===eE-R . add x0, x27, #1 4310# CHECK-NEXT: [0,8] . . D===eeeeER st2 { v1.4s, v2.4s }, [x27], x28 4311# CHECK-NEXT: [0,9] . . .D==eE--R add x0, x27, #1 4312 4313# CHECK: Average Wait times (based on the timeline view): 4314# CHECK-NEXT: [0]: Executions 4315# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4316# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4317# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4318 4319# CHECK: [0] [1] [2] [3] 4320# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.16b, v2.16b }, [x27], #32 4321# CHECK-NEXT: 1. 1 1.0 1.0 1.0 add x0, x27, #1 4322# CHECK-NEXT: 2. 1 2.0 2.0 0.0 st2 { v1.2d, v2.2d }, [x27], x28 4323# CHECK-NEXT: 3. 1 2.0 0.0 2.0 add x0, x27, #1 4324# CHECK-NEXT: 4. 1 4.0 3.0 0.0 st2 { v1.2s, v2.2s }, [x27], x28 4325# CHECK-NEXT: 5. 1 4.0 0.0 1.0 add x0, x27, #1 4326# CHECK-NEXT: 6. 1 4.0 1.0 0.0 st2 { v1.4h, v2.4h }, [x27], x28 4327# CHECK-NEXT: 7. 1 4.0 0.0 1.0 add x0, x27, #1 4328# CHECK-NEXT: 8. 1 4.0 1.0 0.0 st2 { v1.4s, v2.4s }, [x27], x28 4329# CHECK-NEXT: 9. 1 3.0 0.0 2.0 add x0, x27, #1 4330# CHECK-NEXT: 1 2.9 0.9 0.7 <total> 4331 4332# CHECK: [69] Code Region - G70 4333 4334# CHECK: Iterations: 100 4335# CHECK-NEXT: Instructions: 1000 4336# CHECK-NEXT: Total Cycles: 1205 4337# CHECK-NEXT: Total uOps: 2900 4338 4339# CHECK: Dispatch Width: 3 4340# CHECK-NEXT: uOps Per Cycle: 2.41 4341# CHECK-NEXT: IPC: 0.83 4342# CHECK-NEXT: Block RThroughput: 12.0 4343 4344# CHECK: Timeline view: 4345# CHECK-NEXT: 0123456 4346# CHECK-NEXT: Index 0123456789 4347 4348# CHECK: [0,0] DeeeER . .. st2 { v1.8b, v2.8b }, [x27], x28 4349# CHECK-NEXT: [0,1] .DeE-R . .. add x0, x27, #1 4350# CHECK-NEXT: [0,2] . DeeeeER . .. st2 { v1.8h, v2.8h }, [x27], x28 4351# CHECK-NEXT: [0,3] . DeE-R . .. add x0, x27, #1 4352# CHECK-NEXT: [0,4] . D=eeeeER .. st2 { v1.16b, v2.16b }, [x27], x28 4353# CHECK-NEXT: [0,5] . . DeE--R .. add x0, x27, #1 4354# CHECK-NEXT: [0,6] . . D==eeeER. st2 { v1.b, v2.b }[0], [x27], #2 4355# CHECK-NEXT: [0,7] . . D==eE-R. add x0, x27, #1 4356# CHECK-NEXT: [0,8] . . D=eeeER st2 { v1.b, v2.b }[8], [x27], #2 4357# CHECK-NEXT: [0,9] . . .D=eE-R add x0, x27, #1 4358 4359# CHECK: Average Wait times (based on the timeline view): 4360# CHECK-NEXT: [0]: Executions 4361# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4362# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4363# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4364 4365# CHECK: [0] [1] [2] [3] 4366# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.8b, v2.8b }, [x27], x28 4367# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 4368# CHECK-NEXT: 2. 1 1.0 1.0 0.0 st2 { v1.8h, v2.8h }, [x27], x28 4369# CHECK-NEXT: 3. 1 1.0 1.0 1.0 add x0, x27, #1 4370# CHECK-NEXT: 4. 1 2.0 2.0 0.0 st2 { v1.16b, v2.16b }, [x27], x28 4371# CHECK-NEXT: 5. 1 1.0 0.0 2.0 add x0, x27, #1 4372# CHECK-NEXT: 6. 1 3.0 3.0 0.0 st2 { v1.b, v2.b }[0], [x27], #2 4373# CHECK-NEXT: 7. 1 3.0 0.0 1.0 add x0, x27, #1 4374# CHECK-NEXT: 8. 1 2.0 0.0 0.0 st2 { v1.b, v2.b }[8], [x27], #2 4375# CHECK-NEXT: 9. 1 2.0 0.0 1.0 add x0, x27, #1 4376# CHECK-NEXT: 1 1.7 0.8 0.6 <total> 4377 4378# CHECK: [70] Code Region - G71 4379 4380# CHECK: Iterations: 100 4381# CHECK-NEXT: Instructions: 1000 4382# CHECK-NEXT: Total Cycles: 1004 4383# CHECK-NEXT: Total uOps: 2000 4384 4385# CHECK: Dispatch Width: 3 4386# CHECK-NEXT: uOps Per Cycle: 1.99 4387# CHECK-NEXT: IPC: 1.00 4388# CHECK-NEXT: Block RThroughput: 6.7 4389 4390# CHECK: Timeline view: 4391# CHECK-NEXT: 0123 4392# CHECK-NEXT: Index 0123456789 4393 4394# CHECK: [0,0] DeeeER . . st2 { v1.b, v2.b }[0], [x27], x28 4395# CHECK-NEXT: [0,1] .DeE-R . . add x0, x27, #1 4396# CHECK-NEXT: [0,2] . DeeeER . . st2 { v1.b, v2.b }[8], [x27], x28 4397# CHECK-NEXT: [0,3] . DeE-R . . add x0, x27, #1 4398# CHECK-NEXT: [0,4] . DeeeER. . st2 { v1.h, v2.h }[0], [x27], #4 4399# CHECK-NEXT: [0,5] . DeE-R. . add x0, x27, #1 4400# CHECK-NEXT: [0,6] . .DeeeER . st2 { v1.h, v2.h }[4], [x27], #4 4401# CHECK-NEXT: [0,7] . . DeE-R . add x0, x27, #1 4402# CHECK-NEXT: [0,8] . . DeeeER st2 { v1.h, v2.h }[0], [x27], x28 4403# CHECK-NEXT: [0,9] . . DeE-R add x0, x27, #1 4404 4405# CHECK: Average Wait times (based on the timeline view): 4406# CHECK-NEXT: [0]: Executions 4407# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4408# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4409# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4410 4411# CHECK: [0] [1] [2] [3] 4412# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.b, v2.b }[0], [x27], x28 4413# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 4414# CHECK-NEXT: 2. 1 1.0 1.0 0.0 st2 { v1.b, v2.b }[8], [x27], x28 4415# CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1 4416# CHECK-NEXT: 4. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[0], [x27], #4 4417# CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1 4418# CHECK-NEXT: 6. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[4], [x27], #4 4419# CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1 4420# CHECK-NEXT: 8. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[0], [x27], x28 4421# CHECK-NEXT: 9. 1 1.0 0.0 1.0 add x0, x27, #1 4422# CHECK-NEXT: 1 1.0 0.5 0.5 <total> 4423 4424# CHECK: [71] Code Region - G72 4425 4426# CHECK: Iterations: 100 4427# CHECK-NEXT: Instructions: 1000 4428# CHECK-NEXT: Total Cycles: 1003 4429# CHECK-NEXT: Total uOps: 2000 4430 4431# CHECK: Dispatch Width: 3 4432# CHECK-NEXT: uOps Per Cycle: 1.99 4433# CHECK-NEXT: IPC: 1.00 4434# CHECK-NEXT: Block RThroughput: 7.0 4435 4436# CHECK: Timeline view: 4437# CHECK-NEXT: 012 4438# CHECK-NEXT: Index 0123456789 4439 4440# CHECK: [0,0] DeeeER . . st2 { v1.h, v2.h }[4], [x27], x28 4441# CHECK-NEXT: [0,1] .DeE-R . . add x0, x27, #1 4442# CHECK-NEXT: [0,2] . DeeeER . . st2 { v1.s, v2.s }[0], [x27], #8 4443# CHECK-NEXT: [0,3] . DeE-R . . add x0, x27, #1 4444# CHECK-NEXT: [0,4] . DeeeER. . st2 { v1.s, v2.s }[0], [x27], x28 4445# CHECK-NEXT: [0,5] . DeE-R. . add x0, x27, #1 4446# CHECK-NEXT: [0,6] . .DeeER . st2 { v1.d, v2.d }[0], [x27], #16 4447# CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1 4448# CHECK-NEXT: [0,8] . . DeeER st2 { v1.d, v2.d }[0], [x27], x28 4449# CHECK-NEXT: [0,9] . . DeER add x0, x27, #1 4450 4451# CHECK: Average Wait times (based on the timeline view): 4452# CHECK-NEXT: [0]: Executions 4453# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4454# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4455# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4456 4457# CHECK: [0] [1] [2] [3] 4458# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st2 { v1.h, v2.h }[4], [x27], x28 4459# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 4460# CHECK-NEXT: 2. 1 1.0 1.0 0.0 st2 { v1.s, v2.s }[0], [x27], #8 4461# CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1 4462# CHECK-NEXT: 4. 1 1.0 1.0 0.0 st2 { v1.s, v2.s }[0], [x27], x28 4463# CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1 4464# CHECK-NEXT: 6. 1 1.0 1.0 0.0 st2 { v1.d, v2.d }[0], [x27], #16 4465# CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1 4466# CHECK-NEXT: 8. 1 1.0 1.0 0.0 st2 { v1.d, v2.d }[0], [x27], x28 4467# CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1 4468# CHECK-NEXT: 1 1.0 0.5 0.3 <total> 4469 4470# CHECK: [72] Code Region - G73 4471 4472# CHECK: Iterations: 100 4473# CHECK-NEXT: Instructions: 600 4474# CHECK-NEXT: Total Cycles: 1203 4475# CHECK-NEXT: Total uOps: 2200 4476 4477# CHECK: Dispatch Width: 3 4478# CHECK-NEXT: uOps Per Cycle: 1.83 4479# CHECK-NEXT: IPC: 0.50 4480# CHECK-NEXT: Block RThroughput: 12.0 4481 4482# CHECK: Timeline view: 4483# CHECK-NEXT: 01234 4484# CHECK-NEXT: Index 0123456789 4485 4486# CHECK: [0,0] DeeeeeeER . . st3 { v1.2d, v2.2d, v3.2d }, [x27], #48 4487# CHECK-NEXT: [0,1] . DeE---R . . add x0, x27, #1 4488# CHECK-NEXT: [0,2] . D===eeeER . st3 { v1.2s, v2.2s, v3.2s }, [x27], #24 4489# CHECK-NEXT: [0,3] . D==eE-R . add x0, x27, #1 4490# CHECK-NEXT: [0,4] . .D===eeeER st3 { v1.4h, v2.4h, v3.4h }, [x27], #24 4491# CHECK-NEXT: [0,5] . . D==eE-R add x0, x27, #1 4492 4493# CHECK: Average Wait times (based on the timeline view): 4494# CHECK-NEXT: [0]: Executions 4495# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4496# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4497# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4498 4499# CHECK: [0] [1] [2] [3] 4500# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.2d, v2.2d, v3.2d }, [x27], #48 4501# CHECK-NEXT: 1. 1 1.0 1.0 3.0 add x0, x27, #1 4502# CHECK-NEXT: 2. 1 4.0 4.0 0.0 st3 { v1.2s, v2.2s, v3.2s }, [x27], #24 4503# CHECK-NEXT: 3. 1 3.0 0.0 1.0 add x0, x27, #1 4504# CHECK-NEXT: 4. 1 4.0 2.0 0.0 st3 { v1.4h, v2.4h, v3.4h }, [x27], #24 4505# CHECK-NEXT: 5. 1 3.0 0.0 1.0 add x0, x27, #1 4506# CHECK-NEXT: 1 2.7 1.3 0.8 <total> 4507 4508# CHECK: [73] Code Region - G74 4509 4510# CHECK: Iterations: 100 4511# CHECK-NEXT: Instructions: 1000 4512# CHECK-NEXT: Total Cycles: 2703 4513# CHECK-NEXT: Total uOps: 5100 4514 4515# CHECK: Dispatch Width: 3 4516# CHECK-NEXT: uOps Per Cycle: 1.89 4517# CHECK-NEXT: IPC: 0.37 4518# CHECK-NEXT: Block RThroughput: 27.0 4519 4520# CHECK: Timeline view: 4521# CHECK-NEXT: 0123456789 4522# CHECK-NEXT: Index 0123456789 0123456789 4523 4524# CHECK: [0,0] DeeeeeeER . . . . . st3 { v1.4s, v2.4s, v3.4s }, [x27], #48 4525# CHECK-NEXT: [0,1] . DeE--R . . . . . add x0, x27, #1 4526# CHECK-NEXT: [0,2] . D==eeeER . . . . st3 { v1.8b, v2.8b, v3.8b }, [x27], #24 4527# CHECK-NEXT: [0,3] . .D=eE-R . . . . add x0, x27, #1 4528# CHECK-NEXT: [0,4] . . D==eeeeeeER . . . st3 { v1.8h, v2.8h, v3.8h }, [x27], #48 4529# CHECK-NEXT: [0,5] . . DeE----R . . . add x0, x27, #1 4530# CHECK-NEXT: [0,6] . . .D====eeeeeeER . . st3 { v1.16b, v2.16b, v3.16b }, [x27], #48 4531# CHECK-NEXT: [0,7] . . . D==eE----R . . add x0, x27, #1 4532# CHECK-NEXT: [0,8] . . . D======eeeeeeER st3 { v1.2d, v2.2d, v3.2d }, [x27], x28 4533# CHECK-NEXT: [0,9] . . . . D=====eE----R add x0, x27, #1 4534 4535# CHECK: Average Wait times (based on the timeline view): 4536# CHECK-NEXT: [0]: Executions 4537# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4538# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4539# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4540 4541# CHECK: [0] [1] [2] [3] 4542# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.4s, v2.4s, v3.4s }, [x27], #48 4543# CHECK-NEXT: 1. 1 1.0 1.0 2.0 add x0, x27, #1 4544# CHECK-NEXT: 2. 1 3.0 3.0 0.0 st3 { v1.8b, v2.8b, v3.8b }, [x27], #24 4545# CHECK-NEXT: 3. 1 2.0 0.0 1.0 add x0, x27, #1 4546# CHECK-NEXT: 4. 1 3.0 2.0 0.0 st3 { v1.8h, v2.8h, v3.8h }, [x27], #48 4547# CHECK-NEXT: 5. 1 1.0 0.0 4.0 add x0, x27, #1 4548# CHECK-NEXT: 6. 1 5.0 5.0 0.0 st3 { v1.16b, v2.16b, v3.16b }, [x27], #48 4549# CHECK-NEXT: 7. 1 3.0 0.0 4.0 add x0, x27, #1 4550# CHECK-NEXT: 8. 1 7.0 5.0 0.0 st3 { v1.2d, v2.2d, v3.2d }, [x27], x28 4551# CHECK-NEXT: 9. 1 6.0 0.0 4.0 add x0, x27, #1 4552# CHECK-NEXT: 1 3.2 1.7 1.5 <total> 4553 4554# CHECK: [74] Code Region - G75 4555 4556# CHECK: Iterations: 100 4557# CHECK-NEXT: Instructions: 1000 4558# CHECK-NEXT: Total Cycles: 2103 4559# CHECK-NEXT: Total uOps: 4500 4560 4561# CHECK: Dispatch Width: 3 4562# CHECK-NEXT: uOps Per Cycle: 2.14 4563# CHECK-NEXT: IPC: 0.48 4564# CHECK-NEXT: Block RThroughput: 21.0 4565 4566# CHECK: Timeline view: 4567# CHECK-NEXT: 0123456789 4568# CHECK-NEXT: Index 0123456789 0123 4569 4570# CHECK: [0,0] DeeeER . . . . st3 { v1.2s, v2.2s, v3.2s }, [x27], x28 4571# CHECK-NEXT: [0,1] . DeER . . . . add x0, x27, #1 4572# CHECK-NEXT: [0,2] . DeeeER . . . . st3 { v1.4h, v2.4h, v3.4h }, [x27], x28 4573# CHECK-NEXT: [0,3] . DeER . . . . add x0, x27, #1 4574# CHECK-NEXT: [0,4] . .DeeeeeeER. . . st3 { v1.4s, v2.4s, v3.4s }, [x27], x28 4575# CHECK-NEXT: [0,5] . . DeE--R. . . add x0, x27, #1 4576# CHECK-NEXT: [0,6] . . D==eeeER . . st3 { v1.8b, v2.8b, v3.8b }, [x27], x28 4577# CHECK-NEXT: [0,7] . . . D=eE-R . . add x0, x27, #1 4578# CHECK-NEXT: [0,8] . . . D==eeeeeeER st3 { v1.8h, v2.8h, v3.8h }, [x27], x28 4579# CHECK-NEXT: [0,9] . . . .DeE----R add x0, x27, #1 4580 4581# CHECK: Average Wait times (based on the timeline view): 4582# CHECK-NEXT: [0]: Executions 4583# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4584# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4585# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4586 4587# CHECK: [0] [1] [2] [3] 4588# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.2s, v2.2s, v3.2s }, [x27], x28 4589# CHECK-NEXT: 1. 1 1.0 1.0 0.0 add x0, x27, #1 4590# CHECK-NEXT: 2. 1 1.0 1.0 0.0 st3 { v1.4h, v2.4h, v3.4h }, [x27], x28 4591# CHECK-NEXT: 3. 1 1.0 1.0 0.0 add x0, x27, #1 4592# CHECK-NEXT: 4. 1 1.0 1.0 0.0 st3 { v1.4s, v2.4s, v3.4s }, [x27], x28 4593# CHECK-NEXT: 5. 1 1.0 1.0 2.0 add x0, x27, #1 4594# CHECK-NEXT: 6. 1 3.0 3.0 0.0 st3 { v1.8b, v2.8b, v3.8b }, [x27], x28 4595# CHECK-NEXT: 7. 1 2.0 0.0 1.0 add x0, x27, #1 4596# CHECK-NEXT: 8. 1 3.0 2.0 0.0 st3 { v1.8h, v2.8h, v3.8h }, [x27], x28 4597# CHECK-NEXT: 9. 1 1.0 0.0 4.0 add x0, x27, #1 4598# CHECK-NEXT: 1 1.5 1.1 0.7 <total> 4599 4600# CHECK: [75] Code Region - G76 4601 4602# CHECK: Iterations: 100 4603# CHECK-NEXT: Instructions: 1000 4604# CHECK-NEXT: Total Cycles: 1204 4605# CHECK-NEXT: Total uOps: 2800 4606 4607# CHECK: Dispatch Width: 3 4608# CHECK-NEXT: uOps Per Cycle: 2.33 4609# CHECK-NEXT: IPC: 0.83 4610# CHECK-NEXT: Block RThroughput: 10.0 4611 4612# CHECK: Timeline view: 4613# CHECK-NEXT: 012345 4614# CHECK-NEXT: Index 0123456789 4615 4616# CHECK: [0,0] DeeeeeeER . . st3 { v1.16b, v2.16b, v3.16b }, [x27], x28 4617# CHECK-NEXT: [0,1] . DeE--R . . add x0, x27, #1 4618# CHECK-NEXT: [0,2] . D==eeeER . st3 { v1.b, v2.b, v3.b }[0], [x27], #3 4619# CHECK-NEXT: [0,3] . D==eE-R . add x0, x27, #1 4620# CHECK-NEXT: [0,4] . .D=eeeER . st3 { v1.b, v2.b, v3.b }[8], [x27], #3 4621# CHECK-NEXT: [0,5] . . D=eE-R . add x0, x27, #1 4622# CHECK-NEXT: [0,6] . . DeeeER . st3 { v1.b, v2.b, v3.b }[0], [x27], x28 4623# CHECK-NEXT: [0,7] . . DeE-R . add x0, x27, #1 4624# CHECK-NEXT: [0,8] . . DeeeER st3 { v1.b, v2.b, v3.b }[8], [x27], x28 4625# CHECK-NEXT: [0,9] . . .DeE-R add x0, x27, #1 4626 4627# CHECK: Average Wait times (based on the timeline view): 4628# CHECK-NEXT: [0]: Executions 4629# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4630# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4631# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4632 4633# CHECK: [0] [1] [2] [3] 4634# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.16b, v2.16b, v3.16b }, [x27], x28 4635# CHECK-NEXT: 1. 1 1.0 1.0 2.0 add x0, x27, #1 4636# CHECK-NEXT: 2. 1 3.0 3.0 0.0 st3 { v1.b, v2.b, v3.b }[0], [x27], #3 4637# CHECK-NEXT: 3. 1 3.0 0.0 1.0 add x0, x27, #1 4638# CHECK-NEXT: 4. 1 2.0 0.0 0.0 st3 { v1.b, v2.b, v3.b }[8], [x27], #3 4639# CHECK-NEXT: 5. 1 2.0 0.0 1.0 add x0, x27, #1 4640# CHECK-NEXT: 6. 1 1.0 0.0 0.0 st3 { v1.b, v2.b, v3.b }[0], [x27], x28 4641# CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1 4642# CHECK-NEXT: 8. 1 1.0 1.0 0.0 st3 { v1.b, v2.b, v3.b }[8], [x27], x28 4643# CHECK-NEXT: 9. 1 1.0 0.0 1.0 add x0, x27, #1 4644# CHECK-NEXT: 1 1.6 0.6 0.6 <total> 4645 4646# CHECK: [76] Code Region - G77 4647 4648# CHECK: Iterations: 100 4649# CHECK-NEXT: Instructions: 1000 4650# CHECK-NEXT: Total Cycles: 1004 4651# CHECK-NEXT: Total uOps: 2100 4652 4653# CHECK: Dispatch Width: 3 4654# CHECK-NEXT: uOps Per Cycle: 2.09 4655# CHECK-NEXT: IPC: 1.00 4656# CHECK-NEXT: Block RThroughput: 7.0 4657 4658# CHECK: Timeline view: 4659# CHECK-NEXT: 0123 4660# CHECK-NEXT: Index 0123456789 4661 4662# CHECK: [0,0] DeeeER . . st3 { v1.h, v2.h, v3.h }[0], [x27], #6 4663# CHECK-NEXT: [0,1] .DeE-R . . add x0, x27, #1 4664# CHECK-NEXT: [0,2] . DeeeER . . st3 { v1.h, v2.h, v3.h }[4], [x27], #6 4665# CHECK-NEXT: [0,3] . DeE-R . . add x0, x27, #1 4666# CHECK-NEXT: [0,4] . DeeeER. . st3 { v1.h, v2.h, v3.h }[0], [x27], x28 4667# CHECK-NEXT: [0,5] . DeE-R. . add x0, x27, #1 4668# CHECK-NEXT: [0,6] . .DeeeER . st3 { v1.h, v2.h, v3.h }[4], [x27], x28 4669# CHECK-NEXT: [0,7] . . DeE-R . add x0, x27, #1 4670# CHECK-NEXT: [0,8] . . DeeeER st3 { v1.s, v2.s, v3.s }[0], [x27], #12 4671# CHECK-NEXT: [0,9] . . DeE-R add x0, x27, #1 4672 4673# CHECK: Average Wait times (based on the timeline view): 4674# CHECK-NEXT: [0]: Executions 4675# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4676# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4677# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4678 4679# CHECK: [0] [1] [2] [3] 4680# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[0], [x27], #6 4681# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 4682# CHECK-NEXT: 2. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[4], [x27], #6 4683# CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1 4684# CHECK-NEXT: 4. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[0], [x27], x28 4685# CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1 4686# CHECK-NEXT: 6. 1 1.0 1.0 0.0 st3 { v1.h, v2.h, v3.h }[4], [x27], x28 4687# CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1 4688# CHECK-NEXT: 8. 1 1.0 1.0 0.0 st3 { v1.s, v2.s, v3.s }[0], [x27], #12 4689# CHECK-NEXT: 9. 1 1.0 0.0 1.0 add x0, x27, #1 4690# CHECK-NEXT: 1 1.0 0.5 0.5 <total> 4691 4692# CHECK: [77] Code Region - G78 4693 4694# CHECK: Iterations: 100 4695# CHECK-NEXT: Instructions: 1000 4696# CHECK-NEXT: Total Cycles: 1903 4697# CHECK-NEXT: Total uOps: 3300 4698 4699# CHECK: Dispatch Width: 3 4700# CHECK-NEXT: uOps Per Cycle: 1.73 4701# CHECK-NEXT: IPC: 0.53 4702# CHECK-NEXT: Block RThroughput: 19.0 4703 4704# CHECK: Timeline view: 4705# CHECK-NEXT: 0123456789 4706# CHECK-NEXT: Index 0123456789 01 4707 4708# CHECK: [0,0] DeeeER . . .. st3 { v1.s, v2.s, v3.s }[0], [x27], x28 4709# CHECK-NEXT: [0,1] .DeE-R . . .. add x0, x27, #1 4710# CHECK-NEXT: [0,2] . D=eeeER . . .. st3 { v1.d, v2.d, v3.d }[0], [x27], #24 4711# CHECK-NEXT: [0,3] . D=eE-R . . .. add x0, x27, #1 4712# CHECK-NEXT: [0,4] . D=eeeER . .. st3 { v1.d, v2.d, v3.d }[0], [x27], x28 4713# CHECK-NEXT: [0,5] . D=eE-R . .. add x0, x27, #1 4714# CHECK-NEXT: [0,6] . .D=eeeeeeeeER .. st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 4715# CHECK-NEXT: [0,7] . . DeE-----R .. add x0, x27, #1 4716# CHECK-NEXT: [0,8] . . D=====eeeeER st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 4717# CHECK-NEXT: [0,9] . . . D====eE--R add x0, x27, #1 4718 4719# CHECK: Average Wait times (based on the timeline view): 4720# CHECK-NEXT: [0]: Executions 4721# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4722# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4723# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4724 4725# CHECK: [0] [1] [2] [3] 4726# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st3 { v1.s, v2.s, v3.s }[0], [x27], x28 4727# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 4728# CHECK-NEXT: 2. 1 2.0 2.0 0.0 st3 { v1.d, v2.d, v3.d }[0], [x27], #24 4729# CHECK-NEXT: 3. 1 2.0 0.0 1.0 add x0, x27, #1 4730# CHECK-NEXT: 4. 1 2.0 1.0 0.0 st3 { v1.d, v2.d, v3.d }[0], [x27], x28 4731# CHECK-NEXT: 5. 1 2.0 0.0 1.0 add x0, x27, #1 4732# CHECK-NEXT: 6. 1 2.0 1.0 0.0 st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], #64 4733# CHECK-NEXT: 7. 1 1.0 1.0 5.0 add x0, x27, #1 4734# CHECK-NEXT: 8. 1 6.0 6.0 0.0 st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], #32 4735# CHECK-NEXT: 9. 1 5.0 0.0 2.0 add x0, x27, #1 4736# CHECK-NEXT: 1 2.4 1.2 1.0 <total> 4737 4738# CHECK: [78] Code Region - G79 4739 4740# CHECK: Iterations: 100 4741# CHECK-NEXT: Instructions: 1000 4742# CHECK-NEXT: Total Cycles: 3203 4743# CHECK-NEXT: Total uOps: 5800 4744 4745# CHECK: Dispatch Width: 3 4746# CHECK-NEXT: uOps Per Cycle: 1.81 4747# CHECK-NEXT: IPC: 0.31 4748# CHECK-NEXT: Block RThroughput: 32.0 4749 4750# CHECK: Timeline view: 4751# CHECK-NEXT: 0123456789 01234 4752# CHECK-NEXT: Index 0123456789 0123456789 4753 4754# CHECK: [0,0] DeeeeER . . . . . . st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 4755# CHECK-NEXT: [0,1] . DeE-R . . . . . . add x0, x27, #1 4756# CHECK-NEXT: [0,2] . D=eeeeeeeeER. . . . . st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 4757# CHECK-NEXT: [0,3] . . DeE----R. . . . . add x0, x27, #1 4758# CHECK-NEXT: [0,4] . . D====eeeeER . . . . st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 4759# CHECK-NEXT: [0,5] . . D===eE--R . . . . add x0, x27, #1 4760# CHECK-NEXT: [0,6] . . .D=====eeeeeeeeER . . st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 4761# CHECK-NEXT: [0,7] . . . D==eE------R . . add x0, x27, #1 4762# CHECK-NEXT: [0,8] . . . .D========eeeeeeeeER st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 4763# CHECK-NEXT: [0,9] . . . . D=====eE------R add x0, x27, #1 4764 4765# CHECK: Average Wait times (based on the timeline view): 4766# CHECK-NEXT: [0]: Executions 4767# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4768# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4769# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4770 4771# CHECK: [0] [1] [2] [3] 4772# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], #32 4773# CHECK-NEXT: 1. 1 1.0 1.0 1.0 add x0, x27, #1 4774# CHECK-NEXT: 2. 1 2.0 2.0 0.0 st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], #64 4775# CHECK-NEXT: 3. 1 1.0 1.0 4.0 add x0, x27, #1 4776# CHECK-NEXT: 4. 1 5.0 5.0 0.0 st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], #32 4777# CHECK-NEXT: 5. 1 4.0 0.0 2.0 add x0, x27, #1 4778# CHECK-NEXT: 6. 1 6.0 3.0 0.0 st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], #64 4779# CHECK-NEXT: 7. 1 3.0 0.0 6.0 add x0, x27, #1 4780# CHECK-NEXT: 8. 1 9.0 7.0 0.0 st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], #64 4781# CHECK-NEXT: 9. 1 6.0 0.0 6.0 add x0, x27, #1 4782# CHECK-NEXT: 1 3.8 2.0 1.9 <total> 4783 4784# CHECK: [79] Code Region - G80 4785 4786# CHECK: Iterations: 100 4787# CHECK-NEXT: Instructions: 1000 4788# CHECK-NEXT: Total Cycles: 2803 4789# CHECK-NEXT: Total uOps: 4800 4790 4791# CHECK: Dispatch Width: 3 4792# CHECK-NEXT: uOps Per Cycle: 1.71 4793# CHECK-NEXT: IPC: 0.36 4794# CHECK-NEXT: Block RThroughput: 28.0 4795 4796# CHECK: Timeline view: 4797# CHECK-NEXT: 0123456789 0 4798# CHECK-NEXT: Index 0123456789 0123456789 4799 4800# CHECK: [0,0] DeeeeeeeeER . . . . st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 4801# CHECK-NEXT: [0,1] . DeE----R . . . . add x0, x27, #1 4802# CHECK-NEXT: [0,2] . D====eeeeER. . . . st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 4803# CHECK-NEXT: [0,3] . .D===eE--R. . . . add x0, x27, #1 4804# CHECK-NEXT: [0,4] . . D=====eeeeER . . . st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 4805# CHECK-NEXT: [0,5] . . D====eE--R . . . add x0, x27, #1 4806# CHECK-NEXT: [0,6] . . D======eeeeeeeeER . st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 4807# CHECK-NEXT: [0,7] . . . D===eE------R . add x0, x27, #1 4808# CHECK-NEXT: [0,8] . . . D=========eeeeER st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 4809# CHECK-NEXT: [0,9] . . . . D========eE--R add x0, x27, #1 4810 4811# CHECK: Average Wait times (based on the timeline view): 4812# CHECK-NEXT: [0]: Executions 4813# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4814# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4815# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4816 4817# CHECK: [0] [1] [2] [3] 4818# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.2d, v2.2d, v3.2d, v4.2d }, [x27], x28 4819# CHECK-NEXT: 1. 1 1.0 1.0 4.0 add x0, x27, #1 4820# CHECK-NEXT: 2. 1 5.0 5.0 0.0 st4 { v1.2s, v2.2s, v3.2s, v4.2s }, [x27], x28 4821# CHECK-NEXT: 3. 1 4.0 0.0 2.0 add x0, x27, #1 4822# CHECK-NEXT: 4. 1 6.0 3.0 0.0 st4 { v1.4h, v2.4h, v3.4h, v4.4h }, [x27], x28 4823# CHECK-NEXT: 5. 1 5.0 0.0 2.0 add x0, x27, #1 4824# CHECK-NEXT: 6. 1 7.0 3.0 0.0 st4 { v1.4s, v2.4s, v3.4s, v4.4s }, [x27], x28 4825# CHECK-NEXT: 7. 1 4.0 0.0 6.0 add x0, x27, #1 4826# CHECK-NEXT: 8. 1 10.0 7.0 0.0 st4 { v1.8b, v2.8b, v3.8b, v4.8b }, [x27], x28 4827# CHECK-NEXT: 9. 1 9.0 0.0 2.0 add x0, x27, #1 4828# CHECK-NEXT: 1 5.2 2.0 1.6 <total> 4829 4830# CHECK: [80] Code Region - G81 4831 4832# CHECK: Iterations: 100 4833# CHECK-NEXT: Instructions: 1000 4834# CHECK-NEXT: Total Cycles: 1905 4835# CHECK-NEXT: Total uOps: 4000 4836 4837# CHECK: Dispatch Width: 3 4838# CHECK-NEXT: uOps Per Cycle: 2.10 4839# CHECK-NEXT: IPC: 0.52 4840# CHECK-NEXT: Block RThroughput: 19.0 4841 4842# CHECK: Timeline view: 4843# CHECK-NEXT: 0123456789 4844# CHECK-NEXT: Index 0123456789 0123 4845 4846# CHECK: [0,0] DeeeeeeeeER . . . st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 4847# CHECK-NEXT: [0,1] . DeE---R . . . add x0, x27, #1 4848# CHECK-NEXT: [0,2] . D===eeeeeeeeER . . st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 4849# CHECK-NEXT: [0,3] . . DeE------R . . add x0, x27, #1 4850# CHECK-NEXT: [0,4] . . D======eeeER . st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 4851# CHECK-NEXT: [0,5] . . .D======eE-R . add x0, x27, #1 4852# CHECK-NEXT: [0,6] . . . D=====eeeER. st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 4853# CHECK-NEXT: [0,7] . . . D=====eE-R. add x0, x27, #1 4854# CHECK-NEXT: [0,8] . . . D====eeeER st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 4855# CHECK-NEXT: [0,9] . . . D====eE-R add x0, x27, #1 4856 4857# CHECK: Average Wait times (based on the timeline view): 4858# CHECK-NEXT: [0]: Executions 4859# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4860# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4861# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4862 4863# CHECK: [0] [1] [2] [3] 4864# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.8h, v2.8h, v3.8h, v4.8h }, [x27], x28 4865# CHECK-NEXT: 1. 1 1.0 1.0 3.0 add x0, x27, #1 4866# CHECK-NEXT: 2. 1 4.0 4.0 0.0 st4 { v1.16b, v2.16b, v3.16b, v4.16b }, [x27], x28 4867# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 4868# CHECK-NEXT: 4. 1 7.0 7.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], #4 4869# CHECK-NEXT: 5. 1 7.0 0.0 1.0 add x0, x27, #1 4870# CHECK-NEXT: 6. 1 6.0 0.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], #4 4871# CHECK-NEXT: 7. 1 6.0 0.0 1.0 add x0, x27, #1 4872# CHECK-NEXT: 8. 1 5.0 0.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[0], [x27], x28 4873# CHECK-NEXT: 9. 1 5.0 0.0 1.0 add x0, x27, #1 4874# CHECK-NEXT: 1 4.3 1.3 1.2 <total> 4875 4876# CHECK: [81] Code Region - G82 4877 4878# CHECK: Iterations: 100 4879# CHECK-NEXT: Instructions: 1000 4880# CHECK-NEXT: Total Cycles: 1004 4881# CHECK-NEXT: Total uOps: 2000 4882 4883# CHECK: Dispatch Width: 3 4884# CHECK-NEXT: uOps Per Cycle: 1.99 4885# CHECK-NEXT: IPC: 1.00 4886# CHECK-NEXT: Block RThroughput: 6.7 4887 4888# CHECK: Timeline view: 4889# CHECK-NEXT: 0123 4890# CHECK-NEXT: Index 0123456789 4891 4892# CHECK: [0,0] DeeeER . . st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 4893# CHECK-NEXT: [0,1] .DeE-R . . add x0, x27, #1 4894# CHECK-NEXT: [0,2] . DeeeER . . st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 4895# CHECK-NEXT: [0,3] . DeE-R . . add x0, x27, #1 4896# CHECK-NEXT: [0,4] . DeeeER. . st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 4897# CHECK-NEXT: [0,5] . DeE-R. . add x0, x27, #1 4898# CHECK-NEXT: [0,6] . .DeeeER . st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 4899# CHECK-NEXT: [0,7] . . DeE-R . add x0, x27, #1 4900# CHECK-NEXT: [0,8] . . DeeeER st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 4901# CHECK-NEXT: [0,9] . . DeE-R add x0, x27, #1 4902 4903# CHECK: Average Wait times (based on the timeline view): 4904# CHECK-NEXT: [0]: Executions 4905# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4906# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4907# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4908 4909# CHECK: [0] [1] [2] [3] 4910# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.b, v2.b, v3.b, v4.b }[8], [x27], x28 4911# CHECK-NEXT: 1. 1 1.0 0.0 1.0 add x0, x27, #1 4912# CHECK-NEXT: 2. 1 1.0 1.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], #8 4913# CHECK-NEXT: 3. 1 1.0 0.0 1.0 add x0, x27, #1 4914# CHECK-NEXT: 4. 1 1.0 1.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], #8 4915# CHECK-NEXT: 5. 1 1.0 0.0 1.0 add x0, x27, #1 4916# CHECK-NEXT: 6. 1 1.0 1.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[0], [x27], x28 4917# CHECK-NEXT: 7. 1 1.0 0.0 1.0 add x0, x27, #1 4918# CHECK-NEXT: 8. 1 1.0 1.0 0.0 st4 { v1.h, v2.h, v3.h, v4.h }[4], [x27], x28 4919# CHECK-NEXT: 9. 1 1.0 0.0 1.0 add x0, x27, #1 4920# CHECK-NEXT: 1 1.0 0.5 0.5 <total> 4921 4922# CHECK: [82] Code Region - G83 4923 4924# CHECK: Iterations: 100 4925# CHECK-NEXT: Instructions: 800 4926# CHECK-NEXT: Total Cycles: 1204 4927# CHECK-NEXT: Total uOps: 2200 4928 4929# CHECK: Dispatch Width: 3 4930# CHECK-NEXT: uOps Per Cycle: 1.83 4931# CHECK-NEXT: IPC: 0.66 4932# CHECK-NEXT: Block RThroughput: 12.0 4933 4934# CHECK: Timeline view: 4935# CHECK-NEXT: 012345 4936# CHECK-NEXT: Index 0123456789 4937 4938# CHECK: [0,0] DeeeeER . . st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 4939# CHECK-NEXT: [0,1] .DeE--R . . add x0, x27, #1 4940# CHECK-NEXT: [0,2] . D==eeeeER . st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 4941# CHECK-NEXT: [0,3] . D==eE--R . add x0, x27, #1 4942# CHECK-NEXT: [0,4] . D====eeeER . st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 4943# CHECK-NEXT: [0,5] . D====eE-R . add x0, x27, #1 4944# CHECK-NEXT: [0,6] . .D====eeeER st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 4945# CHECK-NEXT: [0,7] . . D====eE-R add x0, x27, #1 4946 4947# CHECK: Average Wait times (based on the timeline view): 4948# CHECK-NEXT: [0]: Executions 4949# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4950# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4951# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4952 4953# CHECK: [0] [1] [2] [3] 4954# CHECK-NEXT: 0. 1 1.0 1.0 0.0 st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], #16 4955# CHECK-NEXT: 1. 1 1.0 0.0 2.0 add x0, x27, #1 4956# CHECK-NEXT: 2. 1 3.0 3.0 0.0 st4 { v1.s, v2.s, v3.s, v4.s }[0], [x27], x28 4957# CHECK-NEXT: 3. 1 3.0 0.0 2.0 add x0, x27, #1 4958# CHECK-NEXT: 4. 1 5.0 3.0 0.0 st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], #32 4959# CHECK-NEXT: 5. 1 5.0 0.0 1.0 add x0, x27, #1 4960# CHECK-NEXT: 6. 1 5.0 1.0 0.0 st4 { v1.d, v2.d, v3.d, v4.d }[0], [x27], x28 4961# CHECK-NEXT: 7. 1 5.0 0.0 1.0 add x0, x27, #1 4962# CHECK-NEXT: 1 3.5 1.0 0.8 <total> 4963 4964# CHECK: [83] Code Region - G84 4965 4966# CHECK: Iterations: 100 4967# CHECK-NEXT: Instructions: 400 4968# CHECK-NEXT: Total Cycles: 403 4969# CHECK-NEXT: Total uOps: 900 4970 4971# CHECK: Dispatch Width: 3 4972# CHECK-NEXT: uOps Per Cycle: 2.23 4973# CHECK-NEXT: IPC: 0.99 4974# CHECK-NEXT: Block RThroughput: 3.0 4975 4976# CHECK: Timeline view: 4977# CHECK-NEXT: Index 0123456 4978 4979# CHECK: [0,0] DeER .. stp s1, s2, [x27], #248 4980# CHECK-NEXT: [0,1] .DeER.. add x0, x27, #1 4981# CHECK-NEXT: [0,2] . DeeER stp d1, d2, [x27], #496 4982# CHECK-NEXT: [0,3] . DeER add x0, x27, #1 4983 4984# CHECK: Average Wait times (based on the timeline view): 4985# CHECK-NEXT: [0]: Executions 4986# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 4987# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 4988# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 4989 4990# CHECK: [0] [1] [2] [3] 4991# CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp s1, s2, [x27], #248 4992# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 4993# CHECK-NEXT: 2. 1 1.0 1.0 0.0 stp d1, d2, [x27], #496 4994# CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1 4995# CHECK-NEXT: 1 1.0 0.5 0.0 <total> 4996 4997# CHECK: [84] Code Region - G85 4998 4999# CHECK: Iterations: 100 5000# CHECK-NEXT: Instructions: 1000 5001# CHECK-NEXT: Total Cycles: 1207 5002# CHECK-NEXT: Total uOps: 2800 5003 5004# CHECK: Dispatch Width: 3 5005# CHECK-NEXT: uOps Per Cycle: 2.32 5006# CHECK-NEXT: IPC: 0.83 5007# CHECK-NEXT: Block RThroughput: 12.0 5008 5009# CHECK: Timeline view: 5010# CHECK-NEXT: 0123456 5011# CHECK-NEXT: Index 0123456789 5012 5013# CHECK: [0,0] DeeeeER . .. stp q1, q2, [x27], #992 5014# CHECK-NEXT: [0,1] . DeE-R . .. add x0, x27, #1 5015# CHECK-NEXT: [0,2] . D=eER . .. stp s1, s2, [x27, #248]! 5016# CHECK-NEXT: [0,3] . D=eER . .. add x0, x27, #1 5017# CHECK-NEXT: [0,4] . D=eeER .. stp d1, d2, [x27, #496]! 5018# CHECK-NEXT: [0,5] . .D=eER .. add x0, x27, #1 5019# CHECK-NEXT: [0,6] . . D=eeeeER.. stp q1, q2, [x27, #992]! 5020# CHECK-NEXT: [0,7] . . DeE--R.. add x0, x27, #1 5021# CHECK-NEXT: [0,8] . . D==eER. stp w1, w2, [x27], #248 5022# CHECK-NEXT: [0,9] . . .D==eER add x0, x27, #1 5023 5024# CHECK: Average Wait times (based on the timeline view): 5025# CHECK-NEXT: [0]: Executions 5026# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5027# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5028# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5029 5030# CHECK: [0] [1] [2] [3] 5031# CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp q1, q2, [x27], #992 5032# CHECK-NEXT: 1. 1 1.0 1.0 1.0 add x0, x27, #1 5033# CHECK-NEXT: 2. 1 2.0 2.0 0.0 stp s1, s2, [x27, #248]! 5034# CHECK-NEXT: 3. 1 2.0 0.0 0.0 add x0, x27, #1 5035# CHECK-NEXT: 4. 1 2.0 1.0 0.0 stp d1, d2, [x27, #496]! 5036# CHECK-NEXT: 5. 1 2.0 0.0 0.0 add x0, x27, #1 5037# CHECK-NEXT: 6. 1 2.0 1.0 0.0 stp q1, q2, [x27, #992]! 5038# CHECK-NEXT: 7. 1 1.0 0.0 2.0 add x0, x27, #1 5039# CHECK-NEXT: 8. 1 3.0 3.0 0.0 stp w1, w2, [x27], #248 5040# CHECK-NEXT: 9. 1 3.0 0.0 0.0 add x0, x27, #1 5041# CHECK-NEXT: 1 1.9 0.9 0.3 <total> 5042 5043# CHECK: [85] Code Region - G86 5044 5045# CHECK: Iterations: 100 5046# CHECK-NEXT: Instructions: 1000 5047# CHECK-NEXT: Total Cycles: 1003 5048# CHECK-NEXT: Total uOps: 2200 5049 5050# CHECK: Dispatch Width: 3 5051# CHECK-NEXT: uOps Per Cycle: 2.19 5052# CHECK-NEXT: IPC: 1.00 5053# CHECK-NEXT: Block RThroughput: 7.5 5054 5055# CHECK: Timeline view: 5056# CHECK-NEXT: 012 5057# CHECK-NEXT: Index 0123456789 5058 5059# CHECK: [0,0] DeeER. . . stp x1, x2, [x27], #496 5060# CHECK-NEXT: [0,1] .DeER. . . add x0, x27, #1 5061# CHECK-NEXT: [0,2] . DeER . . stp w1, w2, [x27, #248]! 5062# CHECK-NEXT: [0,3] . DeER . . add x0, x27, #1 5063# CHECK-NEXT: [0,4] . DeeER . . stp x1, x2, [x27, #496]! 5064# CHECK-NEXT: [0,5] . DeER . . add x0, x27, #1 5065# CHECK-NEXT: [0,6] . .DeER. . str b1, [x27], #254 5066# CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1 5067# CHECK-NEXT: [0,8] . . DeER. str h1, [x27], #254 5068# CHECK-NEXT: [0,9] . . DeER add x0, x27, #1 5069 5070# CHECK: Average Wait times (based on the timeline view): 5071# CHECK-NEXT: [0]: Executions 5072# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5073# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5074# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5075 5076# CHECK: [0] [1] [2] [3] 5077# CHECK-NEXT: 0. 1 1.0 1.0 0.0 stp x1, x2, [x27], #496 5078# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 5079# CHECK-NEXT: 2. 1 1.0 1.0 0.0 stp w1, w2, [x27, #248]! 5080# CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1 5081# CHECK-NEXT: 4. 1 1.0 1.0 0.0 stp x1, x2, [x27, #496]! 5082# CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1 5083# CHECK-NEXT: 6. 1 1.0 1.0 0.0 str b1, [x27], #254 5084# CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1 5085# CHECK-NEXT: 8. 1 1.0 1.0 0.0 str h1, [x27], #254 5086# CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1 5087# CHECK-NEXT: 1 1.0 0.5 0.0 <total> 5088 5089# CHECK: [86] Code Region - G87 5090 5091# CHECK: Iterations: 100 5092# CHECK-NEXT: Instructions: 1000 5093# CHECK-NEXT: Total Cycles: 1003 5094# CHECK-NEXT: Total uOps: 2100 5095 5096# CHECK: Dispatch Width: 3 5097# CHECK-NEXT: uOps Per Cycle: 2.09 5098# CHECK-NEXT: IPC: 1.00 5099# CHECK-NEXT: Block RThroughput: 7.5 5100 5101# CHECK: Timeline view: 5102# CHECK-NEXT: 012 5103# CHECK-NEXT: Index 0123456789 5104 5105# CHECK: [0,0] DeER . . . str s1, [x27], #254 5106# CHECK-NEXT: [0,1] .DeER. . . add x0, x27, #1 5107# CHECK-NEXT: [0,2] . DeER . . str d1, [x27], #254 5108# CHECK-NEXT: [0,3] . DeER . . add x0, x27, #1 5109# CHECK-NEXT: [0,4] . DeeER . . str q1, [x27], #254 5110# CHECK-NEXT: [0,5] . DeER . . add x0, x27, #1 5111# CHECK-NEXT: [0,6] . .DeER. . str b1, [x27, #254]! 5112# CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1 5113# CHECK-NEXT: [0,8] . . DeER. str h1, [x27, #254]! 5114# CHECK-NEXT: [0,9] . . DeER add x0, x27, #1 5115 5116# CHECK: Average Wait times (based on the timeline view): 5117# CHECK-NEXT: [0]: Executions 5118# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5119# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5120# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5121 5122# CHECK: [0] [1] [2] [3] 5123# CHECK-NEXT: 0. 1 1.0 1.0 0.0 str s1, [x27], #254 5124# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 5125# CHECK-NEXT: 2. 1 1.0 1.0 0.0 str d1, [x27], #254 5126# CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1 5127# CHECK-NEXT: 4. 1 1.0 1.0 0.0 str q1, [x27], #254 5128# CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1 5129# CHECK-NEXT: 6. 1 1.0 1.0 0.0 str b1, [x27, #254]! 5130# CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1 5131# CHECK-NEXT: 8. 1 1.0 1.0 0.0 str h1, [x27, #254]! 5132# CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1 5133# CHECK-NEXT: 1 1.0 0.5 0.0 <total> 5134 5135# CHECK: [87] Code Region - G88 5136 5137# CHECK: Iterations: 100 5138# CHECK-NEXT: Instructions: 1000 5139# CHECK-NEXT: Total Cycles: 1003 5140# CHECK-NEXT: Total uOps: 2100 5141 5142# CHECK: Dispatch Width: 3 5143# CHECK-NEXT: uOps Per Cycle: 2.09 5144# CHECK-NEXT: IPC: 1.00 5145# CHECK-NEXT: Block RThroughput: 7.5 5146 5147# CHECK: Timeline view: 5148# CHECK-NEXT: 012 5149# CHECK-NEXT: Index 0123456789 5150 5151# CHECK: [0,0] DeER . . . str s1, [x27, #254]! 5152# CHECK-NEXT: [0,1] .DeER. . . add x0, x27, #1 5153# CHECK-NEXT: [0,2] . DeER . . str d1, [x27, #254]! 5154# CHECK-NEXT: [0,3] . DeER . . add x0, x27, #1 5155# CHECK-NEXT: [0,4] . DeeER . . str q1, [x27, #254]! 5156# CHECK-NEXT: [0,5] . DeER . . add x0, x27, #1 5157# CHECK-NEXT: [0,6] . .DeER. . str w1, [x27], #254 5158# CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1 5159# CHECK-NEXT: [0,8] . . DeER. str x1, [x27], #254 5160# CHECK-NEXT: [0,9] . . DeER add x0, x27, #1 5161 5162# CHECK: Average Wait times (based on the timeline view): 5163# CHECK-NEXT: [0]: Executions 5164# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5165# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5166# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5167 5168# CHECK: [0] [1] [2] [3] 5169# CHECK-NEXT: 0. 1 1.0 1.0 0.0 str s1, [x27, #254]! 5170# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 5171# CHECK-NEXT: 2. 1 1.0 1.0 0.0 str d1, [x27, #254]! 5172# CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1 5173# CHECK-NEXT: 4. 1 1.0 1.0 0.0 str q1, [x27, #254]! 5174# CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1 5175# CHECK-NEXT: 6. 1 1.0 1.0 0.0 str w1, [x27], #254 5176# CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1 5177# CHECK-NEXT: 8. 1 1.0 1.0 0.0 str x1, [x27], #254 5178# CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1 5179# CHECK-NEXT: 1 1.0 0.5 0.0 <total> 5180 5181# CHECK: [88] Code Region - G89 5182 5183# CHECK: Iterations: 100 5184# CHECK-NEXT: Instructions: 1000 5185# CHECK-NEXT: Total Cycles: 1003 5186# CHECK-NEXT: Total uOps: 2000 5187 5188# CHECK: Dispatch Width: 3 5189# CHECK-NEXT: uOps Per Cycle: 1.99 5190# CHECK-NEXT: IPC: 1.00 5191# CHECK-NEXT: Block RThroughput: 7.5 5192 5193# CHECK: Timeline view: 5194# CHECK-NEXT: 012 5195# CHECK-NEXT: Index 0123456789 5196 5197# CHECK: [0,0] DeER . . . str w1, [x27, #254]! 5198# CHECK-NEXT: [0,1] .DeER. . . add x0, x27, #1 5199# CHECK-NEXT: [0,2] . DeER . . str x1, [x27, #254]! 5200# CHECK-NEXT: [0,3] . DeER . . add x0, x27, #1 5201# CHECK-NEXT: [0,4] . DeER . . strb w1, [x27], #254 5202# CHECK-NEXT: [0,5] . DeER . . add x0, x27, #1 5203# CHECK-NEXT: [0,6] . .DeER. . strb w1, [x27, #254]! 5204# CHECK-NEXT: [0,7] . . DeER . add x0, x27, #1 5205# CHECK-NEXT: [0,8] . . DeER. strh w1, [x27], #254 5206# CHECK-NEXT: [0,9] . . DeER add x0, x27, #1 5207 5208# CHECK: Average Wait times (based on the timeline view): 5209# CHECK-NEXT: [0]: Executions 5210# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5211# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5212# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5213 5214# CHECK: [0] [1] [2] [3] 5215# CHECK-NEXT: 0. 1 1.0 1.0 0.0 str w1, [x27, #254]! 5216# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 5217# CHECK-NEXT: 2. 1 1.0 1.0 0.0 str x1, [x27, #254]! 5218# CHECK-NEXT: 3. 1 1.0 0.0 0.0 add x0, x27, #1 5219# CHECK-NEXT: 4. 1 1.0 1.0 0.0 strb w1, [x27], #254 5220# CHECK-NEXT: 5. 1 1.0 0.0 0.0 add x0, x27, #1 5221# CHECK-NEXT: 6. 1 1.0 1.0 0.0 strb w1, [x27, #254]! 5222# CHECK-NEXT: 7. 1 1.0 0.0 0.0 add x0, x27, #1 5223# CHECK-NEXT: 8. 1 1.0 1.0 0.0 strh w1, [x27], #254 5224# CHECK-NEXT: 9. 1 1.0 0.0 0.0 add x0, x27, #1 5225# CHECK-NEXT: 1 1.0 0.5 0.0 <total> 5226 5227# CHECK: [89] Code Region - G90 5228 5229# CHECK: Iterations: 100 5230# CHECK-NEXT: Instructions: 200 5231# CHECK-NEXT: Total Cycles: 203 5232# CHECK-NEXT: Total uOps: 400 5233 5234# CHECK: Dispatch Width: 3 5235# CHECK-NEXT: uOps Per Cycle: 1.97 5236# CHECK-NEXT: IPC: 0.99 5237# CHECK-NEXT: Block RThroughput: 1.5 5238 5239# CHECK: Timeline view: 5240# CHECK-NEXT: Index 01234 5241 5242# CHECK: [0,0] DeER. strh w1, [x27, #254]! 5243# CHECK-NEXT: [0,1] .DeER add x0, x27, #1 5244 5245# CHECK: Average Wait times (based on the timeline view): 5246# CHECK-NEXT: [0]: Executions 5247# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5248# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5249# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5250 5251# CHECK: [0] [1] [2] [3] 5252# CHECK-NEXT: 0. 1 1.0 1.0 0.0 strh w1, [x27, #254]! 5253# CHECK-NEXT: 1. 1 1.0 0.0 0.0 add x0, x27, #1 5254# CHECK-NEXT: 1 1.0 0.5 0.0 <total> 5255 5256# CHECK: [90] Code Region - G91 5257 5258# CHECK: Iterations: 100 5259# CHECK-NEXT: Instructions: 400 5260# CHECK-NEXT: Total Cycles: 210 5261# CHECK-NEXT: Total uOps: 600 5262 5263# CHECK: Dispatch Width: 3 5264# CHECK-NEXT: uOps Per Cycle: 2.86 5265# CHECK-NEXT: IPC: 1.90 5266# CHECK-NEXT: Block RThroughput: 2.0 5267 5268# CHECK: Timeline view: 5269# CHECK-NEXT: 0 5270# CHECK-NEXT: Index 0123456789 5271 5272# CHECK: [0,0] DeeeeER . ldr x1, [x27], #254 5273# CHECK-NEXT: [0,1] D=eE--R . add x0, x27, #1 5274# CHECK-NEXT: [0,2] .D===eeeeER ldr x2, [x1], #254 5275# CHECK-NEXT: [0,3] .DeE------R add x0, x27, #1 5276 5277# CHECK: Average Wait times (based on the timeline view): 5278# CHECK-NEXT: [0]: Executions 5279# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue 5280# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready 5281# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage 5282 5283# CHECK: [0] [1] [2] [3] 5284# CHECK-NEXT: 0. 1 1.0 1.0 0.0 ldr x1, [x27], #254 5285# CHECK-NEXT: 1. 1 2.0 0.0 2.0 add x0, x27, #1 5286# CHECK-NEXT: 2. 1 4.0 0.0 0.0 ldr x2, [x1], #254 5287# CHECK-NEXT: 3. 1 1.0 0.0 6.0 add x0, x27, #1 5288# CHECK-NEXT: 1 2.0 0.3 2.0 <total> 5289