xref: /freebsd/lib/libpmc/pmu-events/arch/x86/ivybridge/ivb-metrics.json (revision 18054d0220cfc8df9c9568c437bd6fbb59d53c3c)
1959826caSMatt Macy[
2959826caSMatt Macy    {
392b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots where the processor's Frontend undersupplies its Backend",
4*18054d02SAlexander Motin        "MetricExpr": "IDQ_UOPS_NOT_DELIVERED.CORE / (4 * CPU_CLK_UNHALTED.THREAD)",
592b14858SMatt Macy        "MetricGroup": "TopdownL1",
692b14858SMatt Macy        "MetricName": "Frontend_Bound",
7*18054d02SAlexander Motin        "PublicDescription": "This category represents fraction of slots where the processor's Frontend undersupplies its Backend. Frontend denotes the first part of the processor core responsible to fetch operations that are executed later on by the Backend part. Within the Frontend; a branch predictor predicts the next address to fetch; cache-lines are fetched from the memory subsystem; parsed into instructions; and lastly decoded into micro-operations (uops). Ideally the Frontend can issue Machine_Width uops every cycle to the Backend. Frontend Bound denotes unutilized issue-slots when there is no Backend stall; i.e. bubbles where Frontend delivered no uops while Backend could have accepted them. For example; stalls due to instruction-cache misses would be categorized under Frontend Bound."
892b14858SMatt Macy    },
992b14858SMatt Macy    {
1092b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots where the processor's Frontend undersupplies its Backend. SMT version; use when SMT is enabled and measuring per logical CPU.",
11*18054d02SAlexander Motin        "MetricExpr": "IDQ_UOPS_NOT_DELIVERED.CORE / (4 * ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))",
1292b14858SMatt Macy        "MetricGroup": "TopdownL1_SMT",
1392b14858SMatt Macy        "MetricName": "Frontend_Bound_SMT",
14*18054d02SAlexander Motin        "PublicDescription": "This category represents fraction of slots where the processor's Frontend undersupplies its Backend. Frontend denotes the first part of the processor core responsible to fetch operations that are executed later on by the Backend part. Within the Frontend; a branch predictor predicts the next address to fetch; cache-lines are fetched from the memory subsystem; parsed into instructions; and lastly decoded into micro-operations (uops). Ideally the Frontend can issue Machine_Width uops every cycle to the Backend. Frontend Bound denotes unutilized issue-slots when there is no Backend stall; i.e. bubbles where Frontend delivered no uops while Backend could have accepted them. For example; stalls due to instruction-cache misses would be categorized under Frontend Bound. SMT version; use when SMT is enabled and measuring per logical CPU."
1592b14858SMatt Macy    },
1692b14858SMatt Macy    {
1792b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots wasted due to incorrect speculations",
18*18054d02SAlexander Motin        "MetricExpr": "( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * INT_MISC.RECOVERY_CYCLES ) / (4 * CPU_CLK_UNHALTED.THREAD)",
1992b14858SMatt Macy        "MetricGroup": "TopdownL1",
2092b14858SMatt Macy        "MetricName": "Bad_Speculation",
2192b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots wasted due to incorrect speculations. This include slots used to issue uops that do not eventually get retired and slots for which the issue-pipeline was blocked due to recovery from earlier incorrect speculation. For example; wasted work due to miss-predicted branches are categorized under Bad Speculation category. Incorrect data speculation followed by Memory Ordering Nukes is another example."
2292b14858SMatt Macy    },
2392b14858SMatt Macy    {
2492b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots wasted due to incorrect speculations. SMT version; use when SMT is enabled and measuring per logical CPU.",
25*18054d02SAlexander Motin        "MetricExpr": "( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * ( INT_MISC.RECOVERY_CYCLES_ANY / 2 ) ) / (4 * ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))",
2692b14858SMatt Macy        "MetricGroup": "TopdownL1_SMT",
2792b14858SMatt Macy        "MetricName": "Bad_Speculation_SMT",
2892b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots wasted due to incorrect speculations. This include slots used to issue uops that do not eventually get retired and slots for which the issue-pipeline was blocked due to recovery from earlier incorrect speculation. For example; wasted work due to miss-predicted branches are categorized under Bad Speculation category. Incorrect data speculation followed by Memory Ordering Nukes is another example. SMT version; use when SMT is enabled and measuring per logical CPU."
2992b14858SMatt Macy    },
3092b14858SMatt Macy    {
3192b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots where no uops are being delivered due to a lack of required resources for accepting new uops in the Backend",
32*18054d02SAlexander Motin        "MetricConstraint": "NO_NMI_WATCHDOG",
33*18054d02SAlexander Motin        "MetricExpr": "1 - ( (IDQ_UOPS_NOT_DELIVERED.CORE / (4 * CPU_CLK_UNHALTED.THREAD)) + (( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * INT_MISC.RECOVERY_CYCLES ) / (4 * CPU_CLK_UNHALTED.THREAD)) + (UOPS_RETIRED.RETIRE_SLOTS / (4 * CPU_CLK_UNHALTED.THREAD)) )",
3492b14858SMatt Macy        "MetricGroup": "TopdownL1",
3592b14858SMatt Macy        "MetricName": "Backend_Bound",
3692b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots where no uops are being delivered due to a lack of required resources for accepting new uops in the Backend. Backend is the portion of the processor core where the out-of-order scheduler dispatches ready uops into their respective execution units; and once completed these uops get retired according to program order. For example; stalls due to data-cache misses or stalls due to the divider unit being overloaded are both categorized under Backend Bound. Backend Bound is further divided into two main categories: Memory Bound and Core Bound."
3792b14858SMatt Macy    },
3892b14858SMatt Macy    {
3992b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots where no uops are being delivered due to a lack of required resources for accepting new uops in the Backend. SMT version; use when SMT is enabled and measuring per logical CPU.",
40*18054d02SAlexander Motin        "MetricExpr": "1 - ( (IDQ_UOPS_NOT_DELIVERED.CORE / (4 * ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))) + (( UOPS_ISSUED.ANY - UOPS_RETIRED.RETIRE_SLOTS + 4 * ( INT_MISC.RECOVERY_CYCLES_ANY / 2 ) ) / (4 * ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))) + (UOPS_RETIRED.RETIRE_SLOTS / (4 * ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))) )",
4192b14858SMatt Macy        "MetricGroup": "TopdownL1_SMT",
4292b14858SMatt Macy        "MetricName": "Backend_Bound_SMT",
4392b14858SMatt Macy        "PublicDescription": "This category represents fraction of slots where no uops are being delivered due to a lack of required resources for accepting new uops in the Backend. Backend is the portion of the processor core where the out-of-order scheduler dispatches ready uops into their respective execution units; and once completed these uops get retired according to program order. For example; stalls due to data-cache misses or stalls due to the divider unit being overloaded are both categorized under Backend Bound. Backend Bound is further divided into two main categories: Memory Bound and Core Bound. SMT version; use when SMT is enabled and measuring per logical CPU."
4492b14858SMatt Macy    },
4592b14858SMatt Macy    {
4692b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots utilized by useful work i.e. issued uops that eventually get retired",
47*18054d02SAlexander Motin        "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / (4 * CPU_CLK_UNHALTED.THREAD)",
4892b14858SMatt Macy        "MetricGroup": "TopdownL1",
4992b14858SMatt Macy        "MetricName": "Retiring",
50*18054d02SAlexander Motin        "PublicDescription": "This category represents fraction of slots utilized by useful work i.e. issued uops that eventually get retired. Ideally; all pipeline slots would be attributed to the Retiring category.  Retiring of 100% would indicate the maximum Pipeline_Width throughput was achieved.  Maximizing Retiring typically increases the Instructions-per-cycle (see IPC metric). Note that a high Retiring value does not necessary mean there is no room for more performance.  For example; Heavy-operations or Microcode Assists are categorized under Retiring. They often indicate suboptimal performance and can often be optimized or avoided. "
5192b14858SMatt Macy    },
5292b14858SMatt Macy    {
5392b14858SMatt Macy        "BriefDescription": "This category represents fraction of slots utilized by useful work i.e. issued uops that eventually get retired. SMT version; use when SMT is enabled and measuring per logical CPU.",
54*18054d02SAlexander Motin        "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / (4 * ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) ))",
5592b14858SMatt Macy        "MetricGroup": "TopdownL1_SMT",
5692b14858SMatt Macy        "MetricName": "Retiring_SMT",
57*18054d02SAlexander Motin        "PublicDescription": "This category represents fraction of slots utilized by useful work i.e. issued uops that eventually get retired. Ideally; all pipeline slots would be attributed to the Retiring category.  Retiring of 100% would indicate the maximum Pipeline_Width throughput was achieved.  Maximizing Retiring typically increases the Instructions-per-cycle (see IPC metric). Note that a high Retiring value does not necessary mean there is no room for more performance.  For example; Heavy-operations or Microcode Assists are categorized under Retiring. They often indicate suboptimal performance and can often be optimized or avoided. SMT version; use when SMT is enabled and measuring per logical CPU."
5892b14858SMatt Macy    },
5992b14858SMatt Macy    {
6092b14858SMatt Macy        "BriefDescription": "Instructions Per Cycle (per Logical Processor)",
61959826caSMatt Macy        "MetricExpr": "INST_RETIRED.ANY / CPU_CLK_UNHALTED.THREAD",
62*18054d02SAlexander Motin        "MetricGroup": "Ret;Summary",
63959826caSMatt Macy        "MetricName": "IPC"
64959826caSMatt Macy    },
65959826caSMatt Macy    {
66959826caSMatt Macy        "BriefDescription": "Uops Per Instruction",
67959826caSMatt Macy        "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / INST_RETIRED.ANY",
68*18054d02SAlexander Motin        "MetricGroup": "Pipeline;Ret;Retire",
69959826caSMatt Macy        "MetricName": "UPI"
70959826caSMatt Macy    },
71959826caSMatt Macy    {
7292b14858SMatt Macy        "BriefDescription": "Instruction per taken branch",
73*18054d02SAlexander Motin        "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / BR_INST_RETIRED.NEAR_TAKEN",
74*18054d02SAlexander Motin        "MetricGroup": "Branches;Fed;FetchBW",
75*18054d02SAlexander Motin        "MetricName": "UpTB"
76959826caSMatt Macy    },
77959826caSMatt Macy    {
7892b14858SMatt Macy        "BriefDescription": "Cycles Per Instruction (per Logical Processor)",
79*18054d02SAlexander Motin        "MetricExpr": "1 / (INST_RETIRED.ANY / CPU_CLK_UNHALTED.THREAD)",
80*18054d02SAlexander Motin        "MetricGroup": "Pipeline;Mem",
81959826caSMatt Macy        "MetricName": "CPI"
82959826caSMatt Macy    },
83959826caSMatt Macy    {
8492b14858SMatt Macy        "BriefDescription": "Per-Logical Processor actual clocks when the Logical Processor is active.",
85959826caSMatt Macy        "MetricExpr": "CPU_CLK_UNHALTED.THREAD",
86*18054d02SAlexander Motin        "MetricGroup": "Pipeline",
87959826caSMatt Macy        "MetricName": "CLKS"
88959826caSMatt Macy    },
89959826caSMatt Macy    {
90*18054d02SAlexander Motin        "BriefDescription": "Total issue-pipeline slots (per-Physical Core till ICL; per-Logical Processor ICL onward)",
91*18054d02SAlexander Motin        "MetricExpr": "4 * CPU_CLK_UNHALTED.THREAD",
92*18054d02SAlexander Motin        "MetricGroup": "TmaL1",
93959826caSMatt Macy        "MetricName": "SLOTS"
94959826caSMatt Macy    },
95959826caSMatt Macy    {
96*18054d02SAlexander Motin        "BriefDescription": "Total issue-pipeline slots (per-Physical Core till ICL; per-Logical Processor ICL onward)",
97*18054d02SAlexander Motin        "MetricExpr": "4 * ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )",
98*18054d02SAlexander Motin        "MetricGroup": "TmaL1_SMT",
9992b14858SMatt Macy        "MetricName": "SLOTS_SMT"
10092b14858SMatt Macy    },
10192b14858SMatt Macy    {
102*18054d02SAlexander Motin        "BriefDescription": "The ratio of Executed- by Issued-Uops",
103*18054d02SAlexander Motin        "MetricExpr": "UOPS_EXECUTED.THREAD / UOPS_ISSUED.ANY",
104*18054d02SAlexander Motin        "MetricGroup": "Cor;Pipeline",
105*18054d02SAlexander Motin        "MetricName": "Execute_per_Issue",
106*18054d02SAlexander Motin        "PublicDescription": "The ratio of Executed- by Issued-Uops. Ratio > 1 suggests high rate of uop micro-fusions. Ratio < 1 suggest high rate of \"execute\" at rename stage."
10792b14858SMatt Macy    },
10892b14858SMatt Macy    {
109*18054d02SAlexander Motin        "BriefDescription": "Instructions Per Cycle across hyper-threads (per physical core)",
110*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY / CPU_CLK_UNHALTED.THREAD",
111*18054d02SAlexander Motin        "MetricGroup": "Ret;SMT;TmaL1",
112959826caSMatt Macy        "MetricName": "CoreIPC"
113959826caSMatt Macy    },
114959826caSMatt Macy    {
115*18054d02SAlexander Motin        "BriefDescription": "Instructions Per Cycle across hyper-threads (per physical core)",
116*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY / ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )",
117*18054d02SAlexander Motin        "MetricGroup": "Ret;SMT;TmaL1_SMT",
11892b14858SMatt Macy        "MetricName": "CoreIPC_SMT"
11992b14858SMatt Macy    },
12092b14858SMatt Macy    {
12192b14858SMatt Macy        "BriefDescription": "Floating Point Operations Per Cycle",
122*18054d02SAlexander Motin        "MetricExpr": "( 1 * ( FP_COMP_OPS_EXE.SSE_SCALAR_SINGLE + FP_COMP_OPS_EXE.SSE_SCALAR_DOUBLE ) + 2 * FP_COMP_OPS_EXE.SSE_PACKED_DOUBLE + 4 * ( FP_COMP_OPS_EXE.SSE_PACKED_SINGLE + SIMD_FP_256.PACKED_DOUBLE ) + 8 * SIMD_FP_256.PACKED_SINGLE ) / CPU_CLK_UNHALTED.THREAD",
123*18054d02SAlexander Motin        "MetricGroup": "Ret;Flops",
12492b14858SMatt Macy        "MetricName": "FLOPc"
12592b14858SMatt Macy    },
12692b14858SMatt Macy    {
12792b14858SMatt Macy        "BriefDescription": "Floating Point Operations Per Cycle",
128*18054d02SAlexander Motin        "MetricExpr": "( 1 * ( FP_COMP_OPS_EXE.SSE_SCALAR_SINGLE + FP_COMP_OPS_EXE.SSE_SCALAR_DOUBLE ) + 2 * FP_COMP_OPS_EXE.SSE_PACKED_DOUBLE + 4 * ( FP_COMP_OPS_EXE.SSE_PACKED_SINGLE + SIMD_FP_256.PACKED_DOUBLE ) + 8 * SIMD_FP_256.PACKED_SINGLE ) / ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )",
129*18054d02SAlexander Motin        "MetricGroup": "Ret;Flops_SMT",
13092b14858SMatt Macy        "MetricName": "FLOPc_SMT"
13192b14858SMatt Macy    },
13292b14858SMatt Macy    {
133959826caSMatt Macy        "BriefDescription": "Instruction-Level-Parallelism (average number of uops executed when there is at least 1 uop executed)",
134959826caSMatt Macy        "MetricExpr": "UOPS_EXECUTED.THREAD / (( cpu@UOPS_EXECUTED.CORE\\,cmask\\=1@ / 2 ) if #SMT_on else UOPS_EXECUTED.CYCLES_GE_1_UOP_EXEC)",
135*18054d02SAlexander Motin        "MetricGroup": "Backend;Cor;Pipeline;PortsUtil",
136959826caSMatt Macy        "MetricName": "ILP"
137959826caSMatt Macy    },
138959826caSMatt Macy    {
13992b14858SMatt Macy        "BriefDescription": "Number of Instructions per non-speculative Branch Misprediction (JEClear)",
14092b14858SMatt Macy        "MetricExpr": "INST_RETIRED.ANY / BR_MISP_RETIRED.ALL_BRANCHES",
141*18054d02SAlexander Motin        "MetricGroup": "Bad;BadSpec;BrMispredicts",
14292b14858SMatt Macy        "MetricName": "IpMispredict"
143959826caSMatt Macy    },
144959826caSMatt Macy    {
14592b14858SMatt Macy        "BriefDescription": "Core actual clocks when any Logical Processor is active on the Physical Core",
14692b14858SMatt Macy        "MetricExpr": "( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )",
147959826caSMatt Macy        "MetricGroup": "SMT",
148959826caSMatt Macy        "MetricName": "CORE_CLKS"
149959826caSMatt Macy    },
150959826caSMatt Macy    {
151*18054d02SAlexander Motin        "BriefDescription": "Instructions per Load (lower number means higher occurrence rate)",
152*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY / MEM_UOPS_RETIRED.ALL_LOADS",
153*18054d02SAlexander Motin        "MetricGroup": "InsType",
154*18054d02SAlexander Motin        "MetricName": "IpLoad"
155*18054d02SAlexander Motin    },
156*18054d02SAlexander Motin    {
157*18054d02SAlexander Motin        "BriefDescription": "Instructions per Store (lower number means higher occurrence rate)",
158*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY / MEM_UOPS_RETIRED.ALL_STORES",
159*18054d02SAlexander Motin        "MetricGroup": "InsType",
160*18054d02SAlexander Motin        "MetricName": "IpStore"
161*18054d02SAlexander Motin    },
162*18054d02SAlexander Motin    {
163*18054d02SAlexander Motin        "BriefDescription": "Instructions per Branch (lower number means higher occurrence rate)",
164*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY / BR_INST_RETIRED.ALL_BRANCHES",
165*18054d02SAlexander Motin        "MetricGroup": "Branches;Fed;InsType",
166*18054d02SAlexander Motin        "MetricName": "IpBranch"
167*18054d02SAlexander Motin    },
168*18054d02SAlexander Motin    {
169*18054d02SAlexander Motin        "BriefDescription": "Instructions per (near) call (lower number means higher occurrence rate)",
170*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY / BR_INST_RETIRED.NEAR_CALL",
171*18054d02SAlexander Motin        "MetricGroup": "Branches;Fed;PGO",
172*18054d02SAlexander Motin        "MetricName": "IpCall"
173*18054d02SAlexander Motin    },
174*18054d02SAlexander Motin    {
175*18054d02SAlexander Motin        "BriefDescription": "Instruction per taken branch",
176*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY / BR_INST_RETIRED.NEAR_TAKEN",
177*18054d02SAlexander Motin        "MetricGroup": "Branches;Fed;FetchBW;Frontend;PGO",
178*18054d02SAlexander Motin        "MetricName": "IpTB"
179*18054d02SAlexander Motin    },
180*18054d02SAlexander Motin    {
181*18054d02SAlexander Motin        "BriefDescription": "Branch instructions per taken branch. ",
182*18054d02SAlexander Motin        "MetricExpr": "BR_INST_RETIRED.ALL_BRANCHES / BR_INST_RETIRED.NEAR_TAKEN",
183*18054d02SAlexander Motin        "MetricGroup": "Branches;Fed;PGO",
184*18054d02SAlexander Motin        "MetricName": "BpTkBranch"
185*18054d02SAlexander Motin    },
186*18054d02SAlexander Motin    {
187*18054d02SAlexander Motin        "BriefDescription": "Instructions per FP Arithmetic instruction (lower number means higher occurrence rate)",
188*18054d02SAlexander Motin        "MetricExpr": "1 / ( ((FP_COMP_OPS_EXE.SSE_SCALAR_SINGLE + FP_COMP_OPS_EXE.SSE_SCALAR_DOUBLE) / UOPS_EXECUTED.THREAD) + ((FP_COMP_OPS_EXE.SSE_PACKED_DOUBLE + FP_COMP_OPS_EXE.SSE_PACKED_SINGLE + SIMD_FP_256.PACKED_SINGLE + SIMD_FP_256.PACKED_DOUBLE) / UOPS_EXECUTED.THREAD) )",
189*18054d02SAlexander Motin        "MetricGroup": "Flops;InsType",
190*18054d02SAlexander Motin        "MetricName": "IpArith",
191*18054d02SAlexander Motin        "PublicDescription": "Instructions per FP Arithmetic instruction (lower number means higher occurrence rate). May undercount due to FMA double counting. Approximated prior to BDW."
192*18054d02SAlexander Motin    },
193*18054d02SAlexander Motin    {
194*18054d02SAlexander Motin        "BriefDescription": "Total number of retired Instructions, Sample with: INST_RETIRED.PREC_DIST",
195*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY",
196*18054d02SAlexander Motin        "MetricGroup": "Summary;TmaL1",
197*18054d02SAlexander Motin        "MetricName": "Instructions"
198*18054d02SAlexander Motin    },
199*18054d02SAlexander Motin    {
200*18054d02SAlexander Motin        "BriefDescription": "Fraction of Uops delivered by the DSB (aka Decoded ICache; or Uop Cache)",
201*18054d02SAlexander Motin        "MetricExpr": "IDQ.DSB_UOPS / (( IDQ.DSB_UOPS + LSD.UOPS + IDQ.MITE_UOPS + IDQ.MS_UOPS ) )",
202*18054d02SAlexander Motin        "MetricGroup": "DSB;Fed;FetchBW",
203*18054d02SAlexander Motin        "MetricName": "DSB_Coverage"
204*18054d02SAlexander Motin    },
205*18054d02SAlexander Motin    {
206*18054d02SAlexander Motin        "BriefDescription": "Actual Average Latency for L1 data-cache miss demand load instructions (in core cycles)",
207959826caSMatt Macy        "MetricExpr": "L1D_PEND_MISS.PENDING / ( MEM_LOAD_UOPS_RETIRED.L1_MISS + mem_load_uops_retired.hit_lfb )",
208*18054d02SAlexander Motin        "MetricGroup": "Mem;MemoryBound;MemoryLat",
209*18054d02SAlexander Motin        "MetricName": "Load_Miss_Real_Latency",
210*18054d02SAlexander Motin        "PublicDescription": "Actual Average Latency for L1 data-cache miss demand load instructions (in core cycles). Latency may be overestimated for multi-load instructions - e.g. repeat strings."
211959826caSMatt Macy    },
212959826caSMatt Macy    {
21392b14858SMatt Macy        "BriefDescription": "Memory-Level-Parallelism (average number of L1 miss demand load when there is at least one such miss. Per-Logical Processor)",
21492b14858SMatt Macy        "MetricExpr": "L1D_PEND_MISS.PENDING / L1D_PEND_MISS.PENDING_CYCLES",
215*18054d02SAlexander Motin        "MetricGroup": "Mem;MemoryBound;MemoryBW",
216959826caSMatt Macy        "MetricName": "MLP"
217959826caSMatt Macy    },
218959826caSMatt Macy    {
21992b14858SMatt Macy        "BriefDescription": "Average data fill bandwidth to the L1 data cache [GB / sec]",
22092b14858SMatt Macy        "MetricExpr": "64 * L1D.REPLACEMENT / 1000000000 / duration_time",
221*18054d02SAlexander Motin        "MetricGroup": "Mem;MemoryBW",
22292b14858SMatt Macy        "MetricName": "L1D_Cache_Fill_BW"
22392b14858SMatt Macy    },
22492b14858SMatt Macy    {
22592b14858SMatt Macy        "BriefDescription": "Average data fill bandwidth to the L2 cache [GB / sec]",
22692b14858SMatt Macy        "MetricExpr": "64 * L2_LINES_IN.ALL / 1000000000 / duration_time",
227*18054d02SAlexander Motin        "MetricGroup": "Mem;MemoryBW",
22892b14858SMatt Macy        "MetricName": "L2_Cache_Fill_BW"
22992b14858SMatt Macy    },
23092b14858SMatt Macy    {
23192b14858SMatt Macy        "BriefDescription": "Average per-core data fill bandwidth to the L3 cache [GB / sec]",
23292b14858SMatt Macy        "MetricExpr": "64 * LONGEST_LAT_CACHE.MISS / 1000000000 / duration_time",
233*18054d02SAlexander Motin        "MetricGroup": "Mem;MemoryBW",
23492b14858SMatt Macy        "MetricName": "L3_Cache_Fill_BW"
23592b14858SMatt Macy    },
23692b14858SMatt Macy    {
23792b14858SMatt Macy        "BriefDescription": "L1 cache true misses per kilo instruction for retired demand loads",
23892b14858SMatt Macy        "MetricExpr": "1000 * MEM_LOAD_UOPS_RETIRED.L1_MISS / INST_RETIRED.ANY",
239*18054d02SAlexander Motin        "MetricGroup": "Mem;CacheMisses",
24092b14858SMatt Macy        "MetricName": "L1MPKI"
24192b14858SMatt Macy    },
24292b14858SMatt Macy    {
24392b14858SMatt Macy        "BriefDescription": "L2 cache true misses per kilo instruction for retired demand loads",
24492b14858SMatt Macy        "MetricExpr": "1000 * MEM_LOAD_UOPS_RETIRED.L2_MISS / INST_RETIRED.ANY",
245*18054d02SAlexander Motin        "MetricGroup": "Mem;Backend;CacheMisses",
24692b14858SMatt Macy        "MetricName": "L2MPKI"
24792b14858SMatt Macy    },
24892b14858SMatt Macy    {
24992b14858SMatt Macy        "BriefDescription": "L3 cache true misses per kilo instruction for retired demand loads",
25092b14858SMatt Macy        "MetricExpr": "1000 * MEM_LOAD_UOPS_RETIRED.LLC_MISS / INST_RETIRED.ANY",
251*18054d02SAlexander Motin        "MetricGroup": "Mem;CacheMisses",
25292b14858SMatt Macy        "MetricName": "L3MPKI"
25392b14858SMatt Macy    },
25492b14858SMatt Macy    {
255*18054d02SAlexander Motin        "BriefDescription": "Utilization of the core's Page Walker(s) serving STLB misses triggered by instruction/Load/Store accesses",
256*18054d02SAlexander Motin        "MetricConstraint": "NO_NMI_WATCHDOG",
257*18054d02SAlexander Motin        "MetricExpr": "( ITLB_MISSES.WALK_DURATION + DTLB_LOAD_MISSES.WALK_DURATION + DTLB_STORE_MISSES.WALK_DURATION ) / CPU_CLK_UNHALTED.THREAD",
258*18054d02SAlexander Motin        "MetricGroup": "Mem;MemoryTLB",
259*18054d02SAlexander Motin        "MetricName": "Page_Walks_Utilization"
260*18054d02SAlexander Motin    },
261*18054d02SAlexander Motin    {
262*18054d02SAlexander Motin        "BriefDescription": "Utilization of the core's Page Walker(s) serving STLB misses triggered by instruction/Load/Store accesses",
263*18054d02SAlexander Motin        "MetricExpr": "( ITLB_MISSES.WALK_DURATION + DTLB_LOAD_MISSES.WALK_DURATION + DTLB_STORE_MISSES.WALK_DURATION ) / ( ( CPU_CLK_UNHALTED.THREAD / 2 ) * ( 1 + CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / CPU_CLK_UNHALTED.REF_XCLK ) )",
264*18054d02SAlexander Motin        "MetricGroup": "Mem;MemoryTLB_SMT",
265*18054d02SAlexander Motin        "MetricName": "Page_Walks_Utilization_SMT"
266*18054d02SAlexander Motin    },
267*18054d02SAlexander Motin    {
268959826caSMatt Macy        "BriefDescription": "Average CPU Utilization",
269959826caSMatt Macy        "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC / msr@tsc@",
270*18054d02SAlexander Motin        "MetricGroup": "HPC;Summary",
271959826caSMatt Macy        "MetricName": "CPU_Utilization"
272959826caSMatt Macy    },
273959826caSMatt Macy    {
274*18054d02SAlexander Motin        "BriefDescription": "Measured Average Frequency for unhalted processors [GHz]",
275*18054d02SAlexander Motin        "MetricExpr": "(CPU_CLK_UNHALTED.THREAD / CPU_CLK_UNHALTED.REF_TSC) * msr@tsc@ / 1000000000 / duration_time",
276*18054d02SAlexander Motin        "MetricGroup": "Summary;Power",
277*18054d02SAlexander Motin        "MetricName": "Average_Frequency"
278*18054d02SAlexander Motin    },
279*18054d02SAlexander Motin    {
280959826caSMatt Macy        "BriefDescription": "Giga Floating Point Operations Per Second",
281*18054d02SAlexander Motin        "MetricExpr": "( ( 1 * ( FP_COMP_OPS_EXE.SSE_SCALAR_SINGLE + FP_COMP_OPS_EXE.SSE_SCALAR_DOUBLE ) + 2 * FP_COMP_OPS_EXE.SSE_PACKED_DOUBLE + 4 * ( FP_COMP_OPS_EXE.SSE_PACKED_SINGLE + SIMD_FP_256.PACKED_DOUBLE ) + 8 * SIMD_FP_256.PACKED_SINGLE ) / 1000000000 ) / duration_time",
282*18054d02SAlexander Motin        "MetricGroup": "Cor;Flops;HPC",
283959826caSMatt Macy        "MetricName": "GFLOPs"
284959826caSMatt Macy    },
285959826caSMatt Macy    {
286959826caSMatt Macy        "BriefDescription": "Average Frequency Utilization relative nominal frequency",
287959826caSMatt Macy        "MetricExpr": "CPU_CLK_UNHALTED.THREAD / CPU_CLK_UNHALTED.REF_TSC",
288959826caSMatt Macy        "MetricGroup": "Power",
289959826caSMatt Macy        "MetricName": "Turbo_Utilization"
290959826caSMatt Macy    },
291959826caSMatt Macy    {
29292b14858SMatt Macy        "BriefDescription": "Fraction of cycles where both hardware Logical Processors were active",
293*18054d02SAlexander Motin        "MetricExpr": "1 - CPU_CLK_UNHALTED.ONE_THREAD_ACTIVE / ( CPU_CLK_UNHALTED.REF_XCLK_ANY / 2 ) if #SMT_on else 0",
294*18054d02SAlexander Motin        "MetricGroup": "SMT",
295959826caSMatt Macy        "MetricName": "SMT_2T_Utilization"
296959826caSMatt Macy    },
297959826caSMatt Macy    {
298*18054d02SAlexander Motin        "BriefDescription": "Fraction of cycles spent in the Operating System (OS) Kernel mode",
299*18054d02SAlexander Motin        "MetricExpr": "CPU_CLK_UNHALTED.THREAD_P:k / CPU_CLK_UNHALTED.THREAD",
300*18054d02SAlexander Motin        "MetricGroup": "OS",
301959826caSMatt Macy        "MetricName": "Kernel_Utilization"
302959826caSMatt Macy    },
303959826caSMatt Macy    {
304*18054d02SAlexander Motin        "BriefDescription": "Cycles Per Instruction for the Operating System (OS) Kernel mode",
305*18054d02SAlexander Motin        "MetricExpr": "CPU_CLK_UNHALTED.THREAD_P:k / INST_RETIRED.ANY_P:k",
306*18054d02SAlexander Motin        "MetricGroup": "OS",
307*18054d02SAlexander Motin        "MetricName": "Kernel_CPI"
308*18054d02SAlexander Motin    },
309*18054d02SAlexander Motin    {
31092b14858SMatt Macy        "BriefDescription": "Average external Memory Bandwidth Use for reads and writes [GB / sec]",
31192b14858SMatt Macy        "MetricExpr": "64 * ( arb@event\\=0x81\\,umask\\=0x1@ + arb@event\\=0x84\\,umask\\=0x1@ ) / 1000000 / duration_time / 1000",
312*18054d02SAlexander Motin        "MetricGroup": "HPC;Mem;MemoryBW;SoC",
31392b14858SMatt Macy        "MetricName": "DRAM_BW_Use"
31492b14858SMatt Macy    },
31592b14858SMatt Macy    {
316*18054d02SAlexander Motin        "BriefDescription": "Average latency of all requests to external memory (in Uncore cycles)",
317*18054d02SAlexander Motin        "MetricExpr": "UNC_ARB_TRK_OCCUPANCY.ALL / arb@event\\=0x81\\,umask\\=0x1@",
318*18054d02SAlexander Motin        "MetricGroup": "Mem;SoC",
319*18054d02SAlexander Motin        "MetricName": "MEM_Request_Latency"
320*18054d02SAlexander Motin    },
321*18054d02SAlexander Motin    {
322*18054d02SAlexander Motin        "BriefDescription": "Average number of parallel requests to external memory. Accounts for all requests",
323*18054d02SAlexander Motin        "MetricExpr": "UNC_ARB_TRK_OCCUPANCY.ALL / arb@event\\=0x81\\,umask\\=0x1@",
324*18054d02SAlexander Motin        "MetricGroup": "Mem;SoC",
325*18054d02SAlexander Motin        "MetricName": "MEM_Parallel_Requests"
326*18054d02SAlexander Motin    },
327*18054d02SAlexander Motin    {
328*18054d02SAlexander Motin        "BriefDescription": "Instructions per Far Branch ( Far Branches apply upon transition from application to operating system, handling interrupts, exceptions) [lower number means higher occurrence rate]",
329*18054d02SAlexander Motin        "MetricExpr": "INST_RETIRED.ANY / BR_INST_RETIRED.FAR_BRANCH:u",
330*18054d02SAlexander Motin        "MetricGroup": "Branches;OS",
331*18054d02SAlexander Motin        "MetricName": "IpFarBranch"
332*18054d02SAlexander Motin    },
333*18054d02SAlexander Motin    {
334959826caSMatt Macy        "BriefDescription": "C3 residency percent per core",
335959826caSMatt Macy        "MetricExpr": "(cstate_core@c3\\-residency@ / msr@tsc@) * 100",
336959826caSMatt Macy        "MetricGroup": "Power",
337959826caSMatt Macy        "MetricName": "C3_Core_Residency"
338959826caSMatt Macy    },
339959826caSMatt Macy    {
340959826caSMatt Macy        "BriefDescription": "C6 residency percent per core",
341959826caSMatt Macy        "MetricExpr": "(cstate_core@c6\\-residency@ / msr@tsc@) * 100",
342959826caSMatt Macy        "MetricGroup": "Power",
343959826caSMatt Macy        "MetricName": "C6_Core_Residency"
344959826caSMatt Macy    },
345959826caSMatt Macy    {
346959826caSMatt Macy        "BriefDescription": "C7 residency percent per core",
347959826caSMatt Macy        "MetricExpr": "(cstate_core@c7\\-residency@ / msr@tsc@) * 100",
348959826caSMatt Macy        "MetricGroup": "Power",
349959826caSMatt Macy        "MetricName": "C7_Core_Residency"
350959826caSMatt Macy    },
351959826caSMatt Macy    {
352959826caSMatt Macy        "BriefDescription": "C2 residency percent per package",
353959826caSMatt Macy        "MetricExpr": "(cstate_pkg@c2\\-residency@ / msr@tsc@) * 100",
354959826caSMatt Macy        "MetricGroup": "Power",
355959826caSMatt Macy        "MetricName": "C2_Pkg_Residency"
356959826caSMatt Macy    },
357959826caSMatt Macy    {
358959826caSMatt Macy        "BriefDescription": "C3 residency percent per package",
359959826caSMatt Macy        "MetricExpr": "(cstate_pkg@c3\\-residency@ / msr@tsc@) * 100",
360959826caSMatt Macy        "MetricGroup": "Power",
361959826caSMatt Macy        "MetricName": "C3_Pkg_Residency"
362959826caSMatt Macy    },
363959826caSMatt Macy    {
364959826caSMatt Macy        "BriefDescription": "C6 residency percent per package",
365959826caSMatt Macy        "MetricExpr": "(cstate_pkg@c6\\-residency@ / msr@tsc@) * 100",
366959826caSMatt Macy        "MetricGroup": "Power",
367959826caSMatt Macy        "MetricName": "C6_Pkg_Residency"
368959826caSMatt Macy    },
369959826caSMatt Macy    {
370959826caSMatt Macy        "BriefDescription": "C7 residency percent per package",
371959826caSMatt Macy        "MetricExpr": "(cstate_pkg@c7\\-residency@ / msr@tsc@) * 100",
372959826caSMatt Macy        "MetricGroup": "Power",
373959826caSMatt Macy        "MetricName": "C7_Pkg_Residency"
374959826caSMatt Macy    }
375959826caSMatt Macy]
376