xref: /freebsd/lib/libpmc/pmu-events/arch/x86/skylakex/skx-metrics.json (revision 92b14858b44dc4b3b57154a10e9de1b39d791e41)
1959826caSMatt Macy[
2959826caSMatt Macy    {
3*92b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots where the processor's Frontend undersupplies its Backend",
4*92b14858SMatt Macy        "MetricExpr": "IDQ_UOPS_NOT_DELIVERED.CORE / (4 * cycles)",
5*92b14858SMatt Macy        "MetricGroup": "TopdownL1",
6*92b14858SMatt Macy        "MetricName": "Frontend_Bound",
7*92b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots where the processor's Frontend undersupplies its Backend. Frontend denotes the first part of the processor core responsible to fetch operations that are executed later on by the Backend part. Within the Frontend; a branch predictor predicts the next address to fetch; cache-lines are fetched from the memory subsystem; parsed into instructions; and lastly decoded into micro-ops (uops). Ideally the Frontend can issue 4 uops every cycle to the Backend. Frontend Bound denotes unutilized issue-slots when there is no Backend stall; i.e. bubbles where Frontend delivered no uops while Backend could have accepted them. For example; stalls due to instruction-cache misses would be categorized under Frontend Bound."
8*92b14858SMatt Macy    },
9*92b14858SMatt Macy    {
10*92b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots where the processor's Frontend undersupplies its Backend. SMT version; use when SMT is enabled and measuring per logical CPU.",
11*92b14858SMatt Macy        "MetricExpr": "IDQ_UOPS_NOT_DELIVERED.CORE / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )))",
12*92b14858SMatt Macy        "MetricGroup": "TopdownL1_SMT",
13*92b14858SMatt Macy        "MetricName": "Frontend_Bound_SMT",
14*92b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots where the processor's Frontend undersupplies its Backend. Frontend denotes the first part of the processor core responsible to fetch operations that are executed later on by the Backend part. Within the Frontend; a branch predictor predicts the next address to fetch; cache-lines are fetched from the memory subsystem; parsed into instructions; and lastly decoded into micro-ops (uops). Ideally the Frontend can issue 4 uops every cycle to the Backend. Frontend Bound denotes unutilized issue-slots when there is no Backend stall; i.e. bubbles where Frontend delivered no uops while Backend could have accepted them. For example; stalls due to instruction-cache misses would be categorized under Frontend Bound. SMT version; use when SMT is enabled and measuring per logical CPU."
15*92b14858SMatt Macy    },
16*92b14858SMatt Macy    {
17*92b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots wasted due to incorrect speculations",
18*92b14858SMatt Macy        "MetricExpr": "( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * INT_MISC.RECOVERY_CYCLES ) / (4 * cycles)",
19*92b14858SMatt Macy        "MetricGroup": "TopdownL1",
20*92b14858SMatt Macy        "MetricName": "Bad_Speculation",
21*92b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots wasted due to incorrect speculations. This include slots used to issue uops that do not eventually get retired and slots for which the issue-pipeline was blocked due to recovery from earlier incorrect speculation. For example; wasted work due to miss-predicted branches are categorized under Bad Speculation category. Incorrect data speculation followed by Memory Ordering Nukes is another example."
22*92b14858SMatt Macy    },
23*92b14858SMatt Macy    {
24*92b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots wasted due to incorrect speculations. SMT version; use when SMT is enabled and measuring per logical CPU.",
25*92b14858SMatt Macy        "MetricExpr": "( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * (( INT_MISC.RECOVERY_CYCLES_ANY / 2 )) ) / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )))",
26*92b14858SMatt Macy        "MetricGroup": "TopdownL1_SMT",
27*92b14858SMatt Macy        "MetricName": "Bad_Speculation_SMT",
28*92b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots wasted due to incorrect speculations. This include slots used to issue uops that do not eventually get retired and slots for which the issue-pipeline was blocked due to recovery from earlier incorrect speculation. For example; wasted work due to miss-predicted branches are categorized under Bad Speculation category. Incorrect data speculation followed by Memory Ordering Nukes is another example. SMT version; use when SMT is enabled and measuring per logical CPU."
29*92b14858SMatt Macy    },
30*92b14858SMatt Macy    {
31*92b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots where no uops are being delivered due to a lack of required resources for accepting new uops in the Backend",
32*92b14858SMatt Macy        "MetricExpr": "1 - ( (IDQ_UOPS_NOT_DELIVERED.CORE / (4 * cycles)) + (( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * INT_MISC.RECOVERY_CYCLES ) / (4 * cycles)) + (UOPS_RETIRED.RETIRE_SLOTS / (4 * cycles)) )",
33*92b14858SMatt Macy        "MetricGroup": "TopdownL1",
34*92b14858SMatt Macy        "MetricName": "Backend_Bound",
35*92b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots where no uops are being delivered due to a lack of required resources for accepting new uops in the Backend. Backend is the portion of the processor core where the out-of-order scheduler dispatches ready uops into their respective execution units; and once completed these uops get retired according to program order. For example; stalls due to data-cache misses or stalls due to the divider unit being overloaded are both categorized under Backend Bound. Backend Bound is further divided into two main categories: Memory Bound and Core Bound."
36*92b14858SMatt Macy    },
37*92b14858SMatt Macy    {
38*92b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots where no uops are being delivered due to a lack of required resources for accepting new uops in the Backend. SMT version; use when SMT is enabled and measuring per logical CPU.",
39*92b14858SMatt Macy        "MetricExpr": "1 - ( (IDQ_UOPS_NOT_DELIVERED.CORE / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )))) + (( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * (( INT_MISC.RECOVERY_CYCLES_ANY / 2 )) ) / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )))) + (UOPS_RETIRED.RETIRE_SLOTS / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )))) )",
40*92b14858SMatt Macy        "MetricGroup": "TopdownL1_SMT",
41*92b14858SMatt Macy        "MetricName": "Backend_Bound_SMT",
42*92b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots where no uops are being delivered due to a lack of required resources for accepting new uops in the Backend. Backend is the portion of the processor core where the out-of-order scheduler dispatches ready uops into their respective execution units; and once completed these uops get retired according to program order. For example; stalls due to data-cache misses or stalls due to the divider unit being overloaded are both categorized under Backend Bound. Backend Bound is further divided into two main categories: Memory Bound and Core Bound. SMT version; use when SMT is enabled and measuring per logical CPU."
43*92b14858SMatt Macy    },
44*92b14858SMatt Macy    {
45*92b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots utilized by useful work i.e. issued uops that eventually get retired",
46*92b14858SMatt Macy        "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / (4 * cycles)",
47*92b14858SMatt Macy        "MetricGroup": "TopdownL1",
48*92b14858SMatt Macy        "MetricName": "Retiring",
49*92b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots utilized by useful work i.e. issued uops that eventually get retired. Ideally; all pipeline slots would be attributed to the Retiring category.  Retiring of 100% would indicate the maximum 4 uops retired per cycle has been achieved.  Maximizing Retiring typically increases the Instruction-Per-Cycle metric. Note that a high Retiring value does not necessary mean there is no room for more performance.  For example; Microcode assists are categorized under Retiring. They hurt performance and can often be avoided. "
50*92b14858SMatt Macy    },
51*92b14858SMatt Macy    {
52*92b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots utilized by useful work i.e. issued uops that eventually get retired. SMT version; use when SMT is enabled and measuring per logical CPU.",
53*92b14858SMatt Macy        "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )))",
54*92b14858SMatt Macy        "MetricGroup": "TopdownL1_SMT",
55*92b14858SMatt Macy        "MetricName": "Retiring_SMT",
56*92b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots utilized by useful work i.e. issued uops that eventually get retired. Ideally; all pipeline slots would be attributed to the Retiring category.  Retiring of 100% would indicate the maximum 4 uops retired per cycle has been achieved.  Maximizing Retiring typically increases the Instruction-Per-Cycle metric. Note that a high Retiring value does not necessary mean there is no room for more performance.  For example; Microcode assists are categorized under Retiring. They hurt performance and can often be avoided. SMT version; use when SMT is enabled and measuring per logical CPU."
57*92b14858SMatt Macy    },
58*92b14858SMatt Macy    {
59*92b14858SMatt Macy        "BriefDescription": "Instructions Per Cycle (per Logical Processor)",
60959826caSMatt Macy        "MetricExpr": "INST_RETIRED.ANY / CPU_CLK_UNHALTED.THREAD",
61959826caSMatt Macy        "MetricGroup": "TopDownL1",
62959826caSMatt Macy        "MetricName": "IPC"
63959826caSMatt Macy    },
64959826caSMatt Macy    {
65959826caSMatt Macy        "BriefDescription": "Uops Per Instruction",
66959826caSMatt Macy        "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / INST_RETIRED.ANY",
67*92b14858SMatt Macy        "MetricGroup": "Pipeline;Retire",
68959826caSMatt Macy        "MetricName": "UPI"
69959826caSMatt Macy    },
70959826caSMatt Macy    {
71*92b14858SMatt Macy        "BriefDescription": "Instruction per taken branch",
72*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / BR_INST_RETIRED.NEAR_TAKEN",
73*92b14858SMatt Macy        "MetricGroup": "Branches;Fetch_BW;PGO",
74*92b14858SMatt Macy        "MetricName": "IpTB"
75*92b14858SMatt Macy    },
76*92b14858SMatt Macy    {
77*92b14858SMatt Macy        "BriefDescription": "Branch instructions per taken branch. ",
78*92b14858SMatt Macy        "MetricExpr": "BR_INST_RETIRED.ALL_BRANCHES / BR_INST_RETIRED.NEAR_TAKEN",
79*92b14858SMatt Macy        "MetricGroup": "Branches;PGO",
80*92b14858SMatt Macy        "MetricName": "BpTB"
81*92b14858SMatt Macy    },
82*92b14858SMatt Macy    {
83*92b14858SMatt Macy        "BriefDescription": "Rough Estimation of fraction of fetched lines bytes that were likely (includes speculatively fetches) consumed by program instructions",
84959826caSMatt Macy        "MetricExpr": "min( 1 , UOPS_ISSUED.ANY / ( (UOPS_RETIRED.RETIRE_SLOTS / INST_RETIRED.ANY) * 64 * ( ICACHE_64B.IFTAG_HIT + ICACHE_64B.IFTAG_MISS ) / 4.1 ) )",
85*92b14858SMatt Macy        "MetricGroup": "PGO;IcMiss",
86959826caSMatt Macy        "MetricName": "IFetch_Line_Utilization"
87959826caSMatt Macy    },
88959826caSMatt Macy    {
89*92b14858SMatt Macy        "BriefDescription": "Fraction of Uops delivered by the DSB (aka Decoded ICache; or Uop Cache)",
90*92b14858SMatt Macy        "MetricExpr": "IDQ.DSB_UOPS / (IDQ.DSB_UOPS + IDQ.MITE_UOPS + IDQ.MS_UOPS)",
91*92b14858SMatt Macy        "MetricGroup": "DSB;Fetch_BW",
92959826caSMatt Macy        "MetricName": "DSB_Coverage"
93959826caSMatt Macy    },
94959826caSMatt Macy    {
95*92b14858SMatt Macy        "BriefDescription": "Cycles Per Instruction (per Logical Processor)",
96959826caSMatt Macy        "MetricExpr": "1 / (INST_RETIRED.ANY / cycles)",
97959826caSMatt Macy        "MetricGroup": "Pipeline;Summary",
98959826caSMatt Macy        "MetricName": "CPI"
99959826caSMatt Macy    },
100959826caSMatt Macy    {
101*92b14858SMatt Macy        "BriefDescription": "Per-Logical Processor actual clocks when the Logical Processor is active.",
102959826caSMatt Macy        "MetricExpr": "CPU_CLK_UNHALTED.THREAD",
103959826caSMatt Macy        "MetricGroup": "Summary",
104959826caSMatt Macy        "MetricName": "CLKS"
105959826caSMatt Macy    },
106959826caSMatt Macy    {
107*92b14858SMatt Macy        "BriefDescription": "Total issue-pipeline slots (per-Physical Core)",
108*92b14858SMatt Macy        "MetricExpr": "4 * cycles",
109959826caSMatt Macy        "MetricGroup": "TopDownL1",
110959826caSMatt Macy        "MetricName": "SLOTS"
111959826caSMatt Macy    },
112959826caSMatt Macy    {
113*92b14858SMatt Macy        "BriefDescription": "Total issue-pipeline slots (per-Physical Core)",
114*92b14858SMatt Macy        "MetricExpr": "4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))",
115*92b14858SMatt Macy        "MetricGroup": "TopDownL1_SMT",
116*92b14858SMatt Macy        "MetricName": "SLOTS_SMT"
117*92b14858SMatt Macy    },
118*92b14858SMatt Macy    {
119*92b14858SMatt Macy        "BriefDescription": "Instructions per Load (lower number means higher occurance rate)",
120*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / MEM_INST_RETIRED.ALL_LOADS",
121*92b14858SMatt Macy        "MetricGroup": "Instruction_Type",
122*92b14858SMatt Macy        "MetricName": "IpL"
123*92b14858SMatt Macy    },
124*92b14858SMatt Macy    {
125*92b14858SMatt Macy        "BriefDescription": "Instructions per Store (lower number means higher occurance rate)",
126*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / MEM_INST_RETIRED.ALL_STORES",
127*92b14858SMatt Macy        "MetricGroup": "Instruction_Type",
128*92b14858SMatt Macy        "MetricName": "IpS"
129*92b14858SMatt Macy    },
130*92b14858SMatt Macy    {
131*92b14858SMatt Macy        "BriefDescription": "Instructions per Branch (lower number means higher occurance rate)",
132*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / BR_INST_RETIRED.ALL_BRANCHES",
133*92b14858SMatt Macy        "MetricGroup": "Branches;Instruction_Type",
134*92b14858SMatt Macy        "MetricName": "IpB"
135*92b14858SMatt Macy    },
136*92b14858SMatt Macy    {
137*92b14858SMatt Macy        "BriefDescription": "Instruction per (near) call (lower number means higher occurance rate)",
138*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / BR_INST_RETIRED.NEAR_CALL",
139*92b14858SMatt Macy        "MetricGroup": "Branches",
140*92b14858SMatt Macy        "MetricName": "IpCall"
141*92b14858SMatt Macy    },
142*92b14858SMatt Macy    {
143959826caSMatt Macy        "BriefDescription": "Total number of retired Instructions",
144959826caSMatt Macy        "MetricExpr": "INST_RETIRED.ANY",
145959826caSMatt Macy        "MetricGroup": "Summary",
146959826caSMatt Macy        "MetricName": "Instructions"
147959826caSMatt Macy    },
148959826caSMatt Macy    {
149959826caSMatt Macy        "BriefDescription": "Instructions Per Cycle (per physical core)",
150*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / cycles",
151959826caSMatt Macy        "MetricGroup": "SMT",
152959826caSMatt Macy        "MetricName": "CoreIPC"
153959826caSMatt Macy    },
154959826caSMatt Macy    {
155*92b14858SMatt Macy        "BriefDescription": "Instructions Per Cycle (per physical core)",
156*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))",
157*92b14858SMatt Macy        "MetricGroup": "SMT",
158*92b14858SMatt Macy        "MetricName": "CoreIPC_SMT"
159*92b14858SMatt Macy    },
160*92b14858SMatt Macy    {
161*92b14858SMatt Macy        "BriefDescription": "Floating Point Operations Per Cycle",
162*92b14858SMatt Macy        "MetricExpr": "(( 1 * ( FP_ARITH_INST_RETIRED.SCALAR_SINGLE + FP_ARITH_INST_RETIRED.SCALAR_DOUBLE ) + 2 * FP_ARITH_INST_RETIRED.128B_PACKED_DOUBLE + 4 * ( FP_ARITH_INST_RETIRED.128B_PACKED_SINGLE + FP_ARITH_INST_RETIRED.256B_PACKED_DOUBLE ) + 8 * ( FP_ARITH_INST_RETIRED.256B_PACKED_SINGLE + FP_ARITH_INST_RETIRED.512B_PACKED_DOUBLE ) + 16 * FP_ARITH_INST_RETIRED.512B_PACKED_SINGLE )) / cycles",
163*92b14858SMatt Macy        "MetricGroup": "FLOPS",
164*92b14858SMatt Macy        "MetricName": "FLOPc"
165*92b14858SMatt Macy    },
166*92b14858SMatt Macy    {
167*92b14858SMatt Macy        "BriefDescription": "Floating Point Operations Per Cycle",
168*92b14858SMatt Macy        "MetricExpr": "(( 1 * ( FP_ARITH_INST_RETIRED.SCALAR_SINGLE + FP_ARITH_INST_RETIRED.SCALAR_DOUBLE ) + 2 * FP_ARITH_INST_RETIRED.128B_PACKED_DOUBLE + 4 * ( FP_ARITH_INST_RETIRED.128B_PACKED_SINGLE + FP_ARITH_INST_RETIRED.256B_PACKED_DOUBLE ) + 8 * ( FP_ARITH_INST_RETIRED.256B_PACKED_SINGLE + FP_ARITH_INST_RETIRED.512B_PACKED_DOUBLE ) + 16 * FP_ARITH_INST_RETIRED.512B_PACKED_SINGLE )) / (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))",
169*92b14858SMatt Macy        "MetricGroup": "FLOPS_SMT",
170*92b14858SMatt Macy        "MetricName": "FLOPc_SMT"
171*92b14858SMatt Macy    },
172*92b14858SMatt Macy    {
173959826caSMatt Macy        "BriefDescription": "Instruction-Level-Parallelism (average number of uops executed when there is at least 1 uop executed)",
174959826caSMatt Macy        "MetricExpr": "UOPS_EXECUTED.THREAD / (( UOPS_EXECUTED.CORE_CYCLES_GE_1 / 2 ) if #SMT_on else UOPS_EXECUTED.CORE_CYCLES_GE_1)",
175*92b14858SMatt Macy        "MetricGroup": "Pipeline",
176959826caSMatt Macy        "MetricName": "ILP"
177959826caSMatt Macy    },
178959826caSMatt Macy    {
179*92b14858SMatt Macy        "BriefDescription": "Branch Misprediction Cost: Fraction of TopDown slots wasted per non-speculative branch misprediction (jeclear)",
180*92b14858SMatt Macy        "MetricExpr": "( ((BR_MISP_RETIRED.ALL_BRANCHES / ( BR_MISP_RETIRED.ALL_BRANCHES + MACHINE_CLEARS.COUNT )) * (( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * INT_MISC.RECOVERY_CYCLES ) / (4 * cycles))) + (4 * IDQ_UOPS_NOT_DELIVERED.CYCLES_0_UOPS_DELIV.CORE / (4 * cycles)) * (( INT_MISC.CLEAR_RESTEER_CYCLES + 9 * BACLEARS.ANY ) / cycles) / (4 * IDQ_UOPS_NOT_DELIVERED.CYCLES_0_UOPS_DELIV.CORE / (4 * cycles)) ) * (4 * cycles) / BR_MISP_RETIRED.ALL_BRANCHES",
181*92b14858SMatt Macy        "MetricGroup": "BrMispredicts",
182*92b14858SMatt Macy        "MetricName": "Branch_Misprediction_Cost"
183959826caSMatt Macy    },
184959826caSMatt Macy    {
185*92b14858SMatt Macy        "BriefDescription": "Branch Misprediction Cost: Fraction of TopDown slots wasted per non-speculative branch misprediction (jeclear)",
186*92b14858SMatt Macy        "MetricExpr": "( ((BR_MISP_RETIRED.ALL_BRANCHES / ( BR_MISP_RETIRED.ALL_BRANCHES + MACHINE_CLEARS.COUNT )) * (( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * (( INT_MISC.RECOVERY_CYCLES_ANY / 2 )) ) / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))))) + (4 * IDQ_UOPS_NOT_DELIVERED.CYCLES_0_UOPS_DELIV.CORE / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )))) * (( INT_MISC.CLEAR_RESTEER_CYCLES + 9 * BACLEARS.ANY ) / cycles) / (4 * IDQ_UOPS_NOT_DELIVERED.CYCLES_0_UOPS_DELIV.CORE / (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )))) ) * (4 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))) / BR_MISP_RETIRED.ALL_BRANCHES",
187*92b14858SMatt Macy        "MetricGroup": "BrMispredicts_SMT",
188*92b14858SMatt Macy        "MetricName": "Branch_Misprediction_Cost_SMT"
189*92b14858SMatt Macy    },
190*92b14858SMatt Macy    {
191*92b14858SMatt Macy        "BriefDescription": "Number of Instructions per non-speculative Branch Misprediction (JEClear)",
192*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / BR_MISP_RETIRED.ALL_BRANCHES",
193*92b14858SMatt Macy        "MetricGroup": "BrMispredicts",
194*92b14858SMatt Macy        "MetricName": "IpMispredict"
195*92b14858SMatt Macy    },
196*92b14858SMatt Macy    {
197*92b14858SMatt Macy        "BriefDescription": "Core actual clocks when any Logical Processor is active on the Physical Core",
198*92b14858SMatt Macy        "MetricExpr": "( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )",
199959826caSMatt Macy        "MetricGroup": "SMT",
200959826caSMatt Macy        "MetricName": "CORE_CLKS"
201959826caSMatt Macy    },
202959826caSMatt Macy    {
203*92b14858SMatt Macy        "BriefDescription": "Actual Average Latency for L1 data-cache miss demand loads (in core cycles)",
204*92b14858SMatt Macy        "MetricExpr": "L1D_PEND_MISS.PENDING / ( MEM_LOAD_RETIRED.L1_MISS + MEM_LOAD_RETIRED.FB_HIT )",
205959826caSMatt Macy        "MetricGroup": "Memory_Bound;Memory_Lat",
206959826caSMatt Macy        "MetricName": "Load_Miss_Real_Latency"
207959826caSMatt Macy    },
208959826caSMatt Macy    {
209*92b14858SMatt Macy        "BriefDescription": "Memory-Level-Parallelism (average number of L1 miss demand load when there is at least one such miss. Per-Logical Processor)",
210*92b14858SMatt Macy        "MetricExpr": "L1D_PEND_MISS.PENDING / L1D_PEND_MISS.PENDING_CYCLES",
211959826caSMatt Macy        "MetricGroup": "Memory_Bound;Memory_BW",
212959826caSMatt Macy        "MetricName": "MLP"
213959826caSMatt Macy    },
214959826caSMatt Macy    {
215959826caSMatt Macy        "BriefDescription": "Utilization of the core's Page Walker(s) serving STLB misses triggered by instruction/Load/Store accesses",
216*92b14858SMatt Macy        "MetricExpr": "( ITLB_MISSES.WALK_PENDING + DTLB_LOAD_MISSES.WALK_PENDING + DTLB_STORE_MISSES.WALK_PENDING + EPT.WALK_PENDING ) / ( 2 * cycles )",
217959826caSMatt Macy        "MetricGroup": "TLB",
218*92b14858SMatt Macy        "MetricName": "Page_Walks_Utilization",
219*92b14858SMatt Macy        "MetricConstraint": "NO_NMI_WATCHDOG"
220*92b14858SMatt Macy    },
221*92b14858SMatt Macy    {
222*92b14858SMatt Macy        "BriefDescription": "Utilization of the core's Page Walker(s) serving STLB misses triggered by instruction/Load/Store accesses",
223*92b14858SMatt Macy        "MetricExpr": "( ITLB_MISSES.WALK_PENDING + DTLB_LOAD_MISSES.WALK_PENDING + DTLB_STORE_MISSES.WALK_PENDING + EPT.WALK_PENDING ) / ( 2 * (( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )) )",
224*92b14858SMatt Macy        "MetricGroup": "TLB_SMT",
225*92b14858SMatt Macy        "MetricName": "Page_Walks_Utilization_SMT"
226*92b14858SMatt Macy    },
227*92b14858SMatt Macy    {
228*92b14858SMatt Macy        "BriefDescription": "Average data fill bandwidth to the L1 data cache [GB / sec]",
229*92b14858SMatt Macy        "MetricExpr": "64 * L1D.REPLACEMENT / 1000000000 / duration_time",
230*92b14858SMatt Macy        "MetricGroup": "Memory_BW",
231*92b14858SMatt Macy        "MetricName": "L1D_Cache_Fill_BW"
232*92b14858SMatt Macy    },
233*92b14858SMatt Macy    {
234*92b14858SMatt Macy        "BriefDescription": "Average data fill bandwidth to the L2 cache [GB / sec]",
235*92b14858SMatt Macy        "MetricExpr": "64 * L2_LINES_IN.ALL / 1000000000 / duration_time",
236*92b14858SMatt Macy        "MetricGroup": "Memory_BW",
237*92b14858SMatt Macy        "MetricName": "L2_Cache_Fill_BW"
238*92b14858SMatt Macy    },
239*92b14858SMatt Macy    {
240*92b14858SMatt Macy        "BriefDescription": "Average per-core data fill bandwidth to the L3 cache [GB / sec]",
241*92b14858SMatt Macy        "MetricExpr": "64 * LONGEST_LAT_CACHE.MISS / 1000000000 / duration_time",
242*92b14858SMatt Macy        "MetricGroup": "Memory_BW",
243*92b14858SMatt Macy        "MetricName": "L3_Cache_Fill_BW"
244*92b14858SMatt Macy    },
245*92b14858SMatt Macy    {
246*92b14858SMatt Macy        "BriefDescription": "Average per-core data fill bandwidth to the L3 cache [GB / sec]",
247*92b14858SMatt Macy        "MetricExpr": "64 * OFFCORE_REQUESTS.ALL_REQUESTS / 1000000000 / duration_time",
248*92b14858SMatt Macy        "MetricGroup": "Memory_BW",
249*92b14858SMatt Macy        "MetricName": "L3_Cache_Access_BW"
250*92b14858SMatt Macy    },
251*92b14858SMatt Macy    {
252*92b14858SMatt Macy        "BriefDescription": "L1 cache true misses per kilo instruction for retired demand loads",
253*92b14858SMatt Macy        "MetricExpr": "1000 * MEM_LOAD_RETIRED.L1_MISS / INST_RETIRED.ANY",
254*92b14858SMatt Macy        "MetricGroup": "Cache_Misses",
255*92b14858SMatt Macy        "MetricName": "L1MPKI"
256*92b14858SMatt Macy    },
257*92b14858SMatt Macy    {
258*92b14858SMatt Macy        "BriefDescription": "L2 cache true misses per kilo instruction for retired demand loads",
259*92b14858SMatt Macy        "MetricExpr": "1000 * MEM_LOAD_RETIRED.L2_MISS / INST_RETIRED.ANY",
260*92b14858SMatt Macy        "MetricGroup": "Cache_Misses",
261*92b14858SMatt Macy        "MetricName": "L2MPKI"
262*92b14858SMatt Macy    },
263*92b14858SMatt Macy    {
264*92b14858SMatt Macy        "BriefDescription": "L2 cache misses per kilo instruction for all request types (including speculative)",
265*92b14858SMatt Macy        "MetricExpr": "1000 * L2_RQSTS.MISS / INST_RETIRED.ANY",
266*92b14858SMatt Macy        "MetricGroup": "Cache_Misses",
267*92b14858SMatt Macy        "MetricName": "L2MPKI_All"
268*92b14858SMatt Macy    },
269*92b14858SMatt Macy    {
270*92b14858SMatt Macy        "BriefDescription": "L2 cache hits per kilo instruction for all request types (including speculative)",
271*92b14858SMatt Macy        "MetricExpr": "1000 * ( L2_RQSTS.REFERENCES - L2_RQSTS.MISS ) / INST_RETIRED.ANY",
272*92b14858SMatt Macy        "MetricGroup": "Cache_Misses",
273*92b14858SMatt Macy        "MetricName": "L2HPKI_All"
274*92b14858SMatt Macy    },
275*92b14858SMatt Macy    {
276*92b14858SMatt Macy        "BriefDescription": "L3 cache true misses per kilo instruction for retired demand loads",
277*92b14858SMatt Macy        "MetricExpr": "1000 * MEM_LOAD_RETIRED.L3_MISS / INST_RETIRED.ANY",
278*92b14858SMatt Macy        "MetricGroup": "Cache_Misses",
279*92b14858SMatt Macy        "MetricName": "L3MPKI"
280*92b14858SMatt Macy    },
281*92b14858SMatt Macy    {
282*92b14858SMatt Macy        "BriefDescription": "Rate of silent evictions from the L2 cache per Kilo instruction where the evicted lines are dropped (no writeback to L3 or memory)",
283*92b14858SMatt Macy        "MetricExpr": "1000 * L2_LINES_OUT.SILENT / INST_RETIRED.ANY",
284*92b14858SMatt Macy        "MetricGroup": "",
285*92b14858SMatt Macy        "MetricName": "L2_Evictions_Silent_PKI"
286*92b14858SMatt Macy    },
287*92b14858SMatt Macy    {
288*92b14858SMatt Macy        "BriefDescription": "Rate of non silent evictions from the L2 cache per Kilo instruction",
289*92b14858SMatt Macy        "MetricExpr": "1000 * L2_LINES_OUT.NON_SILENT / INST_RETIRED.ANY",
290*92b14858SMatt Macy        "MetricGroup": "",
291*92b14858SMatt Macy        "MetricName": "L2_Evictions_NonSilent_PKI"
292959826caSMatt Macy    },
293959826caSMatt Macy    {
294959826caSMatt Macy        "BriefDescription": "Average CPU Utilization",
295959826caSMatt Macy        "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC / msr@tsc@",
296959826caSMatt Macy        "MetricGroup": "Summary",
297959826caSMatt Macy        "MetricName": "CPU_Utilization"
298959826caSMatt Macy    },
299959826caSMatt Macy    {
300959826caSMatt Macy        "BriefDescription": "Giga Floating Point Operations Per Second",
301*92b14858SMatt Macy        "MetricExpr": "( (( 1 * ( FP_ARITH_INST_RETIRED.SCALAR_SINGLE + FP_ARITH_INST_RETIRED.SCALAR_DOUBLE ) + 2 * FP_ARITH_INST_RETIRED.128B_PACKED_DOUBLE + 4 * ( FP_ARITH_INST_RETIRED.128B_PACKED_SINGLE + FP_ARITH_INST_RETIRED.256B_PACKED_DOUBLE ) + 8 * ( FP_ARITH_INST_RETIRED.256B_PACKED_SINGLE + FP_ARITH_INST_RETIRED.512B_PACKED_DOUBLE ) + 16 * FP_ARITH_INST_RETIRED.512B_PACKED_SINGLE )) / 1000000000 ) / duration_time",
302959826caSMatt Macy        "MetricGroup": "FLOPS;Summary",
303959826caSMatt Macy        "MetricName": "GFLOPs"
304959826caSMatt Macy    },
305959826caSMatt Macy    {
306959826caSMatt Macy        "BriefDescription": "Average Frequency Utilization relative nominal frequency",
307959826caSMatt Macy        "MetricExpr": "CPU_CLK_UNHALTED.THREAD / CPU_CLK_UNHALTED.REF_TSC",
308959826caSMatt Macy        "MetricGroup": "Power",
309959826caSMatt Macy        "MetricName": "Turbo_Utilization"
310959826caSMatt Macy    },
311959826caSMatt Macy    {
312*92b14858SMatt Macy        "BriefDescription": "Fraction of cycles where both hardware Logical Processors were active",
313959826caSMatt Macy        "MetricExpr": "1 - CPU_CLK_THREAD_UNHALTED.ONE_THREAD_ACTIVE / ( CPU_CLK_THREAD_UNHALTED.REF_XCLK_ANY / 2 ) if #SMT_on else 0",
314959826caSMatt Macy        "MetricGroup": "SMT;Summary",
315959826caSMatt Macy        "MetricName": "SMT_2T_Utilization"
316959826caSMatt Macy    },
317959826caSMatt Macy    {
318959826caSMatt Macy        "BriefDescription": "Fraction of cycles spent in Kernel mode",
319*92b14858SMatt Macy        "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:k / CPU_CLK_UNHALTED.REF_TSC",
320959826caSMatt Macy        "MetricGroup": "Summary",
321959826caSMatt Macy        "MetricName": "Kernel_Utilization"
322959826caSMatt Macy    },
323959826caSMatt Macy    {
324*92b14858SMatt Macy        "BriefDescription": "Average external Memory Bandwidth Use for reads and writes [GB / sec]",
325*92b14858SMatt Macy        "MetricExpr": "( 64 * ( uncore_imc@cas_count_read@ + uncore_imc@cas_count_write@ ) / 1000000000 ) / duration_time",
326*92b14858SMatt Macy        "MetricGroup": "Memory_BW",
327*92b14858SMatt Macy        "MetricName": "DRAM_BW_Use"
328*92b14858SMatt Macy    },
329*92b14858SMatt Macy    {
330*92b14858SMatt Macy        "BriefDescription": "Average latency of data read request to external memory (in nanoseconds). Accounts for demand loads and L1/L2 prefetches",
331*92b14858SMatt Macy        "MetricExpr": "1000000000 * ( cha@event\\=0x36\\\\\\,umask\\=0x21@ / cha@event\\=0x35\\\\\\,umask\\=0x21@ ) / ( cha_0@event\\=0x0@ / duration_time )",
332*92b14858SMatt Macy        "MetricGroup": "Memory_Lat",
333*92b14858SMatt Macy        "MetricName": "DRAM_Read_Latency"
334*92b14858SMatt Macy    },
335*92b14858SMatt Macy    {
336*92b14858SMatt Macy        "BriefDescription": "Average number of parallel data read requests to external memory. Accounts for demand loads and L1/L2 prefetches",
337*92b14858SMatt Macy        "MetricExpr": "cha@event\\=0x36\\\\\\,umask\\=0x21@ / cha@event\\=0x36\\\\\\,umask\\=0x21\\\\\\,thresh\\=1@",
338*92b14858SMatt Macy        "MetricGroup": "Memory_BW",
339*92b14858SMatt Macy        "MetricName": "DRAM_Parallel_Reads"
340*92b14858SMatt Macy    },
341*92b14858SMatt Macy    {
342*92b14858SMatt Macy        "BriefDescription": "Socket actual clocks when any core is active on that socket",
343*92b14858SMatt Macy        "MetricExpr": "cha_0@event\\=0x0@",
344*92b14858SMatt Macy        "MetricGroup": "",
345*92b14858SMatt Macy        "MetricName": "Socket_CLKS"
346*92b14858SMatt Macy    },
347*92b14858SMatt Macy    {
348*92b14858SMatt Macy        "BriefDescription": "Instructions per Far Branch ( Far Branches apply upon transition from application to operating system, handling interrupts, exceptions. )",
349*92b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / ( BR_INST_RETIRED.FAR_BRANCH / 2 )",
350*92b14858SMatt Macy        "MetricGroup": "",
351*92b14858SMatt Macy        "MetricName": "IpFarBranch"
352*92b14858SMatt Macy    },
353*92b14858SMatt Macy    {
354959826caSMatt Macy        "BriefDescription": "C3 residency percent per core",
355959826caSMatt Macy        "MetricExpr": "(cstate_core@c3\\-residency@ / msr@tsc@) * 100",
356959826caSMatt Macy        "MetricGroup": "Power",
357959826caSMatt Macy        "MetricName": "C3_Core_Residency"
358959826caSMatt Macy    },
359959826caSMatt Macy    {
360959826caSMatt Macy        "BriefDescription": "C6 residency percent per core",
361959826caSMatt Macy        "MetricExpr": "(cstate_core@c6\\-residency@ / msr@tsc@) * 100",
362959826caSMatt Macy        "MetricGroup": "Power",
363959826caSMatt Macy        "MetricName": "C6_Core_Residency"
364959826caSMatt Macy    },
365959826caSMatt Macy    {
366959826caSMatt Macy        "BriefDescription": "C7 residency percent per core",
367959826caSMatt Macy        "MetricExpr": "(cstate_core@c7\\-residency@ / msr@tsc@) * 100",
368959826caSMatt Macy        "MetricGroup": "Power",
369959826caSMatt Macy        "MetricName": "C7_Core_Residency"
370959826caSMatt Macy    },
371959826caSMatt Macy    {
372959826caSMatt Macy        "BriefDescription": "C2 residency percent per package",
373959826caSMatt Macy        "MetricExpr": "(cstate_pkg@c2\\-residency@ / msr@tsc@) * 100",
374959826caSMatt Macy        "MetricGroup": "Power",
375959826caSMatt Macy        "MetricName": "C2_Pkg_Residency"
376959826caSMatt Macy    },
377959826caSMatt Macy    {
378959826caSMatt Macy        "BriefDescription": "C3 residency percent per package",
379959826caSMatt Macy        "MetricExpr": "(cstate_pkg@c3\\-residency@ / msr@tsc@) * 100",
380959826caSMatt Macy        "MetricGroup": "Power",
381959826caSMatt Macy        "MetricName": "C3_Pkg_Residency"
382959826caSMatt Macy    },
383959826caSMatt Macy    {
384959826caSMatt Macy        "BriefDescription": "C6 residency percent per package",
385959826caSMatt Macy        "MetricExpr": "(cstate_pkg@c6\\-residency@ / msr@tsc@) * 100",
386959826caSMatt Macy        "MetricGroup": "Power",
387959826caSMatt Macy        "MetricName": "C6_Pkg_Residency"
388959826caSMatt Macy    },
389959826caSMatt Macy    {
390959826caSMatt Macy        "BriefDescription": "C7 residency percent per package",
391959826caSMatt Macy        "MetricExpr": "(cstate_pkg@c7\\-residency@ / msr@tsc@) * 100",
392959826caSMatt Macy        "MetricGroup": "Power",
393959826caSMatt Macy        "MetricName": "C7_Pkg_Residency"
394959826caSMatt Macy    }
395959826caSMatt Macy]
396