xref: /llvm-project/llvm/test/tools/llvm-mca/X86/Atom/zero-idioms.s (revision 8ea579203da0e2b2f3e9e04ea4b63b20248c52f3)
1# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=atom -timeline -register-file-stats -iterations=1 < %s | FileCheck %s
3
# General-purpose register forms: SUB and XOR with the same register as both
# source and destination, in 32-bit and 64-bit operand sizes. The result of
# each is zero regardless of the previous register contents.
# All four write (part of) RAX; the expected timeline further down shows them
# dispatching on consecutive cycles, one after another.
4subl  %eax, %eax
5subq  %rax, %rax
6xorl  %eax, %eax
7xorq  %rax, %rax
8
# MMX signed compare-greater-than of a register against itself (byte, dword,
# word element sizes). "x > x" is false for every element, so the result is
# all zeros. The qword variant is kept only as a comment because the assembler
# rejects it with MMX operands.
9pcmpgtb   %mm2, %mm2
10pcmpgtd   %mm2, %mm2
11# pcmpgtq   %mm2, %mm2 # invalid operand for instruction
12pcmpgtw   %mm2, %mm2
13
# XMM signed compare-greater-than of a register against itself, covering all
# four element sizes (byte, dword, qword, word). Unlike the MMX group, the
# qword form assembles here.
14pcmpgtb   %xmm2, %xmm2
15pcmpgtd   %xmm2, %xmm2
16pcmpgtq   %xmm2, %xmm2
17pcmpgtw   %xmm2, %xmm2
18
# Packed integer subtract (wrap-around) of a register from itself: first the
# four MMX element sizes, then the same four on XMM.
# In the expected instruction-info table of this file the two psubq forms are
# the only entries with latency 2 and reciprocal throughput 1.00; every other
# instruction in the test is listed with latency 1 / 0.50.
19psubb   %mm2, %mm2
20psubd   %mm2, %mm2
21psubq   %mm2, %mm2
22psubw   %mm2, %mm2
23psubb   %xmm2, %xmm2
24psubd   %xmm2, %xmm2
25psubq   %xmm2, %xmm2
26psubw   %xmm2, %xmm2
27
# Packed subtract with signed saturation, register minus itself (byte and word
# elements, MMX then XMM). x - x is zero, so saturation never applies.
28psubsb   %mm2, %mm2
29psubsw   %mm2, %mm2
30psubsb   %xmm2, %xmm2
31psubsw   %xmm2, %xmm2
32
# Packed subtract with unsigned saturation, register minus itself (byte and
# word elements, MMX then XMM). As with the signed variants, the result is
# zero for any input.
33psubusb   %mm2, %mm2
34psubusw   %mm2, %mm2
35psubusb   %xmm2, %xmm2
36psubusw   %xmm2, %xmm2
37
# AND-NOT of a register with itself ((~x) & x == 0): packed-single and
# packed-double FP forms, then the integer form on MMX and XMM.
# vpandn is the only three-operand (VEX-encoded) instruction in this file.
# NOTE(review): it is an AVX instruction while the test runs with -mcpu=atom;
# it still appears in the expected output below, so llvm-mca evidently accepts
# it here -- confirm this is intentional before changing it.
38andnps  %xmm0, %xmm0
39andnpd  %xmm1, %xmm1
40pandn   %mm2, %mm2
41pandn   %xmm2, %xmm2
42vpandn  %xmm3, %xmm3, %xmm3
43
# Vector XOR of a register with itself: packed-single and packed-double FP
# forms, then the integer form on MMX and XMM. These are the last four
# instructions of the 36 counted in the expected summary.
44xorps  %xmm0, %xmm0
45xorpd  %xmm1, %xmm1
46pxor   %mm2, %mm2
47pxor   %xmm2, %xmm2
48
49# CHECK:      Iterations:        1
50# CHECK-NEXT: Instructions:      36
51# CHECK-NEXT: Total Cycles:      26
52# CHECK-NEXT: Total uOps:        36
53
54# CHECK:      Dispatch Width:    2
55# CHECK-NEXT: uOps Per Cycle:    1.38
56# CHECK-NEXT: IPC:               1.38
57# CHECK-NEXT: Block RThroughput: 19.0
58
59# CHECK:      Instruction Info:
60# CHECK-NEXT: [1]: #uOps
61# CHECK-NEXT: [2]: Latency
62# CHECK-NEXT: [3]: RThroughput
63# CHECK-NEXT: [4]: MayLoad
64# CHECK-NEXT: [5]: MayStore
65# CHECK-NEXT: [6]: HasSideEffects (U)
66
67# CHECK:      [1]    [2]    [3]    [4]    [5]    [6]    Instructions:
68# CHECK-NEXT:  1      1     0.50                        subl	%eax, %eax
69# CHECK-NEXT:  1      1     0.50                        subq	%rax, %rax
70# CHECK-NEXT:  1      1     0.50                        xorl	%eax, %eax
71# CHECK-NEXT:  1      1     0.50                        xorq	%rax, %rax
72# CHECK-NEXT:  1      1     0.50                        pcmpgtb	%mm2, %mm2
73# CHECK-NEXT:  1      1     0.50                        pcmpgtd	%mm2, %mm2
74# CHECK-NEXT:  1      1     0.50                        pcmpgtw	%mm2, %mm2
75# CHECK-NEXT:  1      1     0.50                        pcmpgtb	%xmm2, %xmm2
76# CHECK-NEXT:  1      1     0.50                        pcmpgtd	%xmm2, %xmm2
77# CHECK-NEXT:  1      1     0.50                        pcmpgtq	%xmm2, %xmm2
78# CHECK-NEXT:  1      1     0.50                        pcmpgtw	%xmm2, %xmm2
79# CHECK-NEXT:  1      1     0.50                        psubb	%mm2, %mm2
80# CHECK-NEXT:  1      1     0.50                        psubd	%mm2, %mm2
81# CHECK-NEXT:  1      2     1.00                        psubq	%mm2, %mm2
82# CHECK-NEXT:  1      1     0.50                        psubw	%mm2, %mm2
83# CHECK-NEXT:  1      1     0.50                        psubb	%xmm2, %xmm2
84# CHECK-NEXT:  1      1     0.50                        psubd	%xmm2, %xmm2
85# CHECK-NEXT:  1      2     1.00                        psubq	%xmm2, %xmm2
86# CHECK-NEXT:  1      1     0.50                        psubw	%xmm2, %xmm2
87# CHECK-NEXT:  1      1     0.50                        psubsb	%mm2, %mm2
88# CHECK-NEXT:  1      1     0.50                        psubsw	%mm2, %mm2
89# CHECK-NEXT:  1      1     0.50                        psubsb	%xmm2, %xmm2
90# CHECK-NEXT:  1      1     0.50                        psubsw	%xmm2, %xmm2
91# CHECK-NEXT:  1      1     0.50                        psubusb	%mm2, %mm2
92# CHECK-NEXT:  1      1     0.50                        psubusw	%mm2, %mm2
93# CHECK-NEXT:  1      1     0.50                        psubusb	%xmm2, %xmm2
94# CHECK-NEXT:  1      1     0.50                        psubusw	%xmm2, %xmm2
95# CHECK-NEXT:  1      1     0.50                        andnps	%xmm0, %xmm0
96# CHECK-NEXT:  1      1     0.50                        andnpd	%xmm1, %xmm1
97# CHECK-NEXT:  1      1     0.50                        pandn	%mm2, %mm2
98# CHECK-NEXT:  1      1     0.50                        pandn	%xmm2, %xmm2
99# CHECK-NEXT:  1      1     0.50                        vpandn	%xmm3, %xmm3, %xmm3
100# CHECK-NEXT:  1      1     0.50                        xorps	%xmm0, %xmm0
101# CHECK-NEXT:  1      1     0.50                        xorpd	%xmm1, %xmm1
102# CHECK-NEXT:  1      1     0.50                        pxor	%mm2, %mm2
103# CHECK-NEXT:  1      1     0.50                        pxor	%xmm2, %xmm2
104
105# CHECK:      Register File statistics:
106# CHECK-NEXT: Total number of mappings created:    40
107# CHECK-NEXT: Max number of mappings used:         3
108
109# CHECK:      Resources:
110# CHECK-NEXT: [0]   - AtomPort0
111# CHECK-NEXT: [1]   - AtomPort1
112
113# CHECK:      Resource pressure per iteration:
114# CHECK-NEXT: [0]    [1]
115# CHECK-NEXT: 20.00  18.00
116
117# CHECK:      Resource pressure by instruction:
118# CHECK-NEXT: [0]    [1]    Instructions:
119# CHECK-NEXT:  -     1.00   subl	%eax, %eax
120# CHECK-NEXT: 1.00    -     subq	%rax, %rax
121# CHECK-NEXT:  -     1.00   xorl	%eax, %eax
122# CHECK-NEXT: 1.00    -     xorq	%rax, %rax
123# CHECK-NEXT:  -     1.00   pcmpgtb	%mm2, %mm2
124# CHECK-NEXT: 1.00    -     pcmpgtd	%mm2, %mm2
125# CHECK-NEXT:  -     1.00   pcmpgtw	%mm2, %mm2
126# CHECK-NEXT: 1.00    -     pcmpgtb	%xmm2, %xmm2
127# CHECK-NEXT:  -     1.00   pcmpgtd	%xmm2, %xmm2
128# CHECK-NEXT: 1.00    -     pcmpgtq	%xmm2, %xmm2
129# CHECK-NEXT:  -     1.00   pcmpgtw	%xmm2, %xmm2
130# CHECK-NEXT: 1.00    -     psubb	%mm2, %mm2
131# CHECK-NEXT:  -     1.00   psubd	%mm2, %mm2
132# CHECK-NEXT: 2.00    -     psubq	%mm2, %mm2
133# CHECK-NEXT:  -     1.00   psubw	%mm2, %mm2
134# CHECK-NEXT: 1.00    -     psubb	%xmm2, %xmm2
135# CHECK-NEXT:  -     1.00   psubd	%xmm2, %xmm2
136# CHECK-NEXT: 2.00    -     psubq	%xmm2, %xmm2
137# CHECK-NEXT:  -     1.00   psubw	%xmm2, %xmm2
138# CHECK-NEXT: 1.00    -     psubsb	%mm2, %mm2
139# CHECK-NEXT:  -     1.00   psubsw	%mm2, %mm2
140# CHECK-NEXT: 1.00    -     psubsb	%xmm2, %xmm2
141# CHECK-NEXT:  -     1.00   psubsw	%xmm2, %xmm2
142# CHECK-NEXT: 1.00    -     psubusb	%mm2, %mm2
143# CHECK-NEXT:  -     1.00   psubusw	%mm2, %mm2
144# CHECK-NEXT: 1.00    -     psubusb	%xmm2, %xmm2
145# CHECK-NEXT:  -     1.00   psubusw	%xmm2, %xmm2
146# CHECK-NEXT: 1.00    -     andnps	%xmm0, %xmm0
147# CHECK-NEXT:  -     1.00   andnpd	%xmm1, %xmm1
148# CHECK-NEXT: 1.00    -     pandn	%mm2, %mm2
149# CHECK-NEXT:  -     1.00   pandn	%xmm2, %xmm2
150# CHECK-NEXT: 1.00    -     vpandn	%xmm3, %xmm3, %xmm3
151# CHECK-NEXT:  -     1.00   xorps	%xmm0, %xmm0
152# CHECK-NEXT: 1.00    -     xorpd	%xmm1, %xmm1
153# CHECK-NEXT:  -     1.00   pxor	%mm2, %mm2
154# CHECK-NEXT: 1.00    -     pxor	%xmm2, %xmm2
155
156# CHECK:      Timeline view:
157# CHECK-NEXT:                     0123456789
158# CHECK-NEXT: Index     0123456789          012345
159
160# CHECK:      [0,0]     DE   .    .    .    .    .   subl	%eax, %eax
161# CHECK-NEXT: [0,1]     .DE  .    .    .    .    .   subq	%rax, %rax
162# CHECK-NEXT: [0,2]     . DE .    .    .    .    .   xorl	%eax, %eax
163# CHECK-NEXT: [0,3]     .  DE.    .    .    .    .   xorq	%rax, %rax
164# CHECK-NEXT: [0,4]     .  DE.    .    .    .    .   pcmpgtb	%mm2, %mm2
165# CHECK-NEXT: [0,5]     .   DE    .    .    .    .   pcmpgtd	%mm2, %mm2
166# CHECK-NEXT: [0,6]     .    DE   .    .    .    .   pcmpgtw	%mm2, %mm2
167# CHECK-NEXT: [0,7]     .    DE   .    .    .    .   pcmpgtb	%xmm2, %xmm2
168# CHECK-NEXT: [0,8]     .    .DE  .    .    .    .   pcmpgtd	%xmm2, %xmm2
169# CHECK-NEXT: [0,9]     .    . DE .    .    .    .   pcmpgtq	%xmm2, %xmm2
170# CHECK-NEXT: [0,10]    .    .  DE.    .    .    .   pcmpgtw	%xmm2, %xmm2
171# CHECK-NEXT: [0,11]    .    .  DE.    .    .    .   psubb	%mm2, %mm2
172# CHECK-NEXT: [0,12]    .    .   DE    .    .    .   psubd	%mm2, %mm2
173# CHECK-NEXT: [0,13]    .    .    DeE  .    .    .   psubq	%mm2, %mm2
174# CHECK-NEXT: [0,14]    .    .    . DE .    .    .   psubw	%mm2, %mm2
175# CHECK-NEXT: [0,15]    .    .    . DE .    .    .   psubb	%xmm2, %xmm2
176# CHECK-NEXT: [0,16]    .    .    .  DE.    .    .   psubd	%xmm2, %xmm2
177# CHECK-NEXT: [0,17]    .    .    .   DeE   .    .   psubq	%xmm2, %xmm2
178# CHECK-NEXT: [0,18]    .    .    .    .DE  .    .   psubw	%xmm2, %xmm2
179# CHECK-NEXT: [0,19]    .    .    .    .DE  .    .   psubsb	%mm2, %mm2
180# CHECK-NEXT: [0,20]    .    .    .    . DE .    .   psubsw	%mm2, %mm2
181# CHECK-NEXT: [0,21]    .    .    .    . DE .    .   psubsb	%xmm2, %xmm2
182# CHECK-NEXT: [0,22]    .    .    .    .  DE.    .   psubsw	%xmm2, %xmm2
183# CHECK-NEXT: [0,23]    .    .    .    .  DE.    .   psubusb	%mm2, %mm2
184# CHECK-NEXT: [0,24]    .    .    .    .   DE    .   psubusw	%mm2, %mm2
185# CHECK-NEXT: [0,25]    .    .    .    .   DE    .   psubusb	%xmm2, %xmm2
186# CHECK-NEXT: [0,26]    .    .    .    .    DE   .   psubusw	%xmm2, %xmm2
187# CHECK-NEXT: [0,27]    .    .    .    .    DE   .   andnps	%xmm0, %xmm0
188# CHECK-NEXT: [0,28]    .    .    .    .    .DE  .   andnpd	%xmm1, %xmm1
189# CHECK-NEXT: [0,29]    .    .    .    .    .DE  .   pandn	%mm2, %mm2
190# CHECK-NEXT: [0,30]    .    .    .    .    . DE .   pandn	%xmm2, %xmm2
191# CHECK-NEXT: [0,31]    .    .    .    .    . DE .   vpandn	%xmm3, %xmm3, %xmm3
192# CHECK-NEXT: [0,32]    .    .    .    .    .  DE.   xorps	%xmm0, %xmm0
193# CHECK-NEXT: [0,33]    .    .    .    .    .  DE.   xorpd	%xmm1, %xmm1
194# CHECK-NEXT: [0,34]    .    .    .    .    .   DE   pxor	%mm2, %mm2
195# CHECK-NEXT: [0,35]    .    .    .    .    .   DE   pxor	%xmm2, %xmm2
196
197# CHECK:      Average Wait times (based on the timeline view):
198# CHECK-NEXT: [0]: Executions
199# CHECK-NEXT: [1]: Average time spent waiting in a scheduler's queue
200# CHECK-NEXT: [2]: Average time spent waiting in a scheduler's queue while ready
201# CHECK-NEXT: [3]: Average time elapsed from WB until retire stage
202
203# CHECK:            [0]    [1]    [2]    [3]
204# CHECK-NEXT: 0.     1     0.0    0.0    0.0       subl	%eax, %eax
205# CHECK-NEXT: 1.     1     0.0    0.0    0.0       subq	%rax, %rax
206# CHECK-NEXT: 2.     1     0.0    0.0    0.0       xorl	%eax, %eax
207# CHECK-NEXT: 3.     1     0.0    0.0    0.0       xorq	%rax, %rax
208# CHECK-NEXT: 4.     1     0.0    0.0    0.0       pcmpgtb	%mm2, %mm2
209# CHECK-NEXT: 5.     1     0.0    0.0    0.0       pcmpgtd	%mm2, %mm2
210# CHECK-NEXT: 6.     1     0.0    0.0    0.0       pcmpgtw	%mm2, %mm2
211# CHECK-NEXT: 7.     1     0.0    0.0    0.0       pcmpgtb	%xmm2, %xmm2
212# CHECK-NEXT: 8.     1     0.0    0.0    0.0       pcmpgtd	%xmm2, %xmm2
213# CHECK-NEXT: 9.     1     0.0    0.0    0.0       pcmpgtq	%xmm2, %xmm2
214# CHECK-NEXT: 10.    1     0.0    0.0    0.0       pcmpgtw	%xmm2, %xmm2
215# CHECK-NEXT: 11.    1     0.0    0.0    0.0       psubb	%mm2, %mm2
216# CHECK-NEXT: 12.    1     0.0    0.0    0.0       psubd	%mm2, %mm2
217# CHECK-NEXT: 13.    1     0.0    0.0    0.0       psubq	%mm2, %mm2
218# CHECK-NEXT: 14.    1     0.0    0.0    0.0       psubw	%mm2, %mm2
219# CHECK-NEXT: 15.    1     0.0    0.0    0.0       psubb	%xmm2, %xmm2
220# CHECK-NEXT: 16.    1     0.0    0.0    0.0       psubd	%xmm2, %xmm2
221# CHECK-NEXT: 17.    1     0.0    0.0    0.0       psubq	%xmm2, %xmm2
222# CHECK-NEXT: 18.    1     0.0    0.0    0.0       psubw	%xmm2, %xmm2
223# CHECK-NEXT: 19.    1     0.0    0.0    0.0       psubsb	%mm2, %mm2
224# CHECK-NEXT: 20.    1     0.0    0.0    0.0       psubsw	%mm2, %mm2
225# CHECK-NEXT: 21.    1     0.0    0.0    0.0       psubsb	%xmm2, %xmm2
226# CHECK-NEXT: 22.    1     0.0    0.0    0.0       psubsw	%xmm2, %xmm2
227# CHECK-NEXT: 23.    1     0.0    0.0    0.0       psubusb	%mm2, %mm2
228# CHECK-NEXT: 24.    1     0.0    0.0    0.0       psubusw	%mm2, %mm2
229# CHECK-NEXT: 25.    1     0.0    0.0    0.0       psubusb	%xmm2, %xmm2
230# CHECK-NEXT: 26.    1     0.0    0.0    0.0       psubusw	%xmm2, %xmm2
231# CHECK-NEXT: 27.    1     0.0    0.0    0.0       andnps	%xmm0, %xmm0
232# CHECK-NEXT: 28.    1     0.0    0.0    0.0       andnpd	%xmm1, %xmm1
233# CHECK-NEXT: 29.    1     0.0    0.0    0.0       pandn	%mm2, %mm2
234# CHECK-NEXT: 30.    1     0.0    0.0    0.0       pandn	%xmm2, %xmm2
235# CHECK-NEXT: 31.    1     0.0    0.0    0.0       vpandn	%xmm3, %xmm3, %xmm3
236# CHECK-NEXT: 32.    1     0.0    0.0    0.0       xorps	%xmm0, %xmm0
237# CHECK-NEXT: 33.    1     0.0    0.0    0.0       xorpd	%xmm1, %xmm1
238# CHECK-NEXT: 34.    1     0.0    0.0    0.0       pxor	%mm2, %mm2
239# CHECK-NEXT: 35.    1     0.0    0.0    0.0       pxor	%xmm2, %xmm2
240# CHECK-NEXT:        1     0.0    0.0    0.0       <total>
241