|
| 1 | +[ |
| 2 | + { |
| 3 | + "BriefDescription": "Instructions Per Cycle (per logical thread)", |
| 4 | + "MetricExpr": "INST_RETIRED.ANY / CPU_CLK_UNHALTED.THREAD", |
| 5 | + "MetricGroup": "TopDownL1", |
| 6 | + "MetricName": "IPC" |
| 7 | + }, |
| 8 | + { |
| 9 | + "BriefDescription": "Uops Per Instruction", |
| 10 | + "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / INST_RETIRED.ANY", |
| 11 | + "MetricGroup": "Pipeline", |
| 12 | + "MetricName": "UPI" |
| 13 | + }, |
| 14 | + { |
| 15 | + "BriefDescription": "Rough Estimation of fraction of fetched lines bytes that were likely consumed by program instructions", |
| 16 | + "MetricExpr": "min( 1 , UOPS_ISSUED.ANY / ((UOPS_RETIRED.RETIRE_SLOTS / INST_RETIRED.ANY) * 64 * ( ICACHE_64B.IFTAG_HIT + ICACHE_64B.IFTAG_MISS ) / 4.1) )", |
| 17 | + "MetricGroup": "Frontend", |
| 18 | + "MetricName": "IFetch_Line_Utilization" |
| 19 | + }, |
| 20 | + { |
| 21 | + "BriefDescription": "Fraction of Uops delivered by the DSB (aka Decoded Icache; or Uop Cache)", |
| 22 | + "MetricExpr": "IDQ.DSB_UOPS / ( IDQ.DSB_UOPS + LSD.UOPS + IDQ.MITE_UOPS + IDQ.MS_UOPS )", |
| 23 | + "MetricGroup": "DSB; Frontend_Bandwidth", |
| 24 | + "MetricName": "DSB_Coverage" |
| 25 | + }, |
| 26 | + { |
| 27 | + "BriefDescription": "Cycles Per Instruction (threaded)", |
| 28 | + "MetricExpr": "1 / (INST_RETIRED.ANY / cycles)", |
| 29 | + "MetricGroup": "Pipeline;Summary", |
| 30 | + "MetricName": "CPI" |
| 31 | + }, |
| 32 | + { |
| 33 | + "BriefDescription": "Per-thread actual clocks when the logical processor is active. This is called 'Clockticks' in VTune.", |
| 34 | + "MetricExpr": "CPU_CLK_UNHALTED.THREAD", |
| 35 | + "MetricGroup": "Summary", |
| 36 | + "MetricName": "CLKS" |
| 37 | + }, |
| 38 | + { |
| 39 | + "BriefDescription": "Total issue-pipeline slots", |
| 40 | + "MetricExpr": "4*(( CPU_CLK_UNHALTED.THREAD_ANY / 2 ) if #SMT_on else cycles)", |
| 41 | + "MetricGroup": "TopDownL1", |
| 42 | + "MetricName": "SLOTS" |
| 43 | + }, |
| 44 | + { |
| 45 | + "BriefDescription": "Total number of retired Instructions", |
| 46 | + "MetricExpr": "INST_RETIRED.ANY", |
| 47 | + "MetricGroup": "Summary", |
| 48 | + "MetricName": "Instructions" |
| 49 | + }, |
| 50 | + { |
| 51 | + "BriefDescription": "Instructions Per Cycle (per physical core)", |
| 52 | + "MetricExpr": "INST_RETIRED.ANY / (( CPU_CLK_UNHALTED.THREAD_ANY / 2 ) if #SMT_on else cycles)", |
| 53 | + "MetricGroup": "SMT", |
| 54 | + "MetricName": "CoreIPC" |
| 55 | + }, |
| 56 | + { |
| 57 | + "BriefDescription": "Instruction-Level-Parallelism (average number of uops executed when there is at least 1 uop executed)", |
| 58 | + "MetricExpr": "UOPS_EXECUTED.THREAD / (( UOPS_EXECUTED.CORE_CYCLES_GE_1 / 2) if #SMT_on else UOPS_EXECUTED.CORE_CYCLES_GE_1)", |
| 59 | + "MetricGroup": "Pipeline;Ports_Utilization", |
| 60 | + "MetricName": "ILP" |
| 61 | + }, |
| 62 | + { |
| 63 | + "BriefDescription": "Average Branch Address Clear Cost (fraction of cycles)", |
| 64 | + "MetricExpr": "2* (( RS_EVENTS.EMPTY_CYCLES - ICACHE_16B.IFDATA_STALL - ICACHE_64B.IFTAG_STALL ) / RS_EVENTS.EMPTY_END)", |
| 65 | + "MetricGroup": "Unknown_Branches", |
| 66 | + "MetricName": "BAClear_Cost" |
| 67 | + }, |
| 68 | + { |
| 69 | + "BriefDescription": "Core actual clocks when any thread is active on the physical core", |
| 70 | + "MetricExpr": "( CPU_CLK_UNHALTED.THREAD_ANY / 2 ) if #SMT_on else CPU_CLK_UNHALTED.THREAD", |
| 71 | + "MetricGroup": "SMT", |
| 72 | + "MetricName": "CORE_CLKS" |
| 73 | + }, |
| 74 | + { |
| 75 | + "BriefDescription": "Actual Average Latency for L1 data-cache miss demand loads", |
| 76 | + "MetricExpr": "L1D_PEND_MISS.PENDING / ( MEM_LOAD_RETIRED.L1_MISS_PS + MEM_LOAD_RETIRED.FB_HIT_PS )", |
| 77 | + "MetricGroup": "Memory_Bound;Memory_Lat", |
| 78 | + "MetricName": "Load_Miss_Real_Latency" |
| 79 | + }, |
| 80 | + { |
| 81 | + "BriefDescription": "Memory-Level-Parallelism (average number of L1 miss demand load when there is at least 1 such miss)", |
| 82 | + "MetricExpr": "L1D_PEND_MISS.PENDING / (( L1D_PEND_MISS.PENDING_CYCLES_ANY / 2) if #SMT_on else L1D_PEND_MISS.PENDING_CYCLES)", |
| 83 | + "MetricGroup": "Memory_Bound;Memory_BW", |
| 84 | + "MetricName": "MLP" |
| 85 | + }, |
| 86 | + { |
| 87 | + "BriefDescription": "Utilization of the core's Page Walker(s) serving STLB misses triggered by instruction/Load/Store accesses", |
| 88 | + "MetricExpr": "( ITLB_MISSES.WALK_PENDING + DTLB_LOAD_MISSES.WALK_PENDING + DTLB_STORE_MISSES.WALK_PENDING + EPT.WALK_PENDING ) / ( 2 * (( CPU_CLK_UNHALTED.THREAD_ANY / 2 ) if #SMT_on else cycles) )", |
| 89 | + "MetricGroup": "TLB", |
| 90 | + "MetricName": "Page_Walks_Utilization" |
| 91 | + }, |
| 92 | + { |
| 93 | + "BriefDescription": "Average CPU Utilization", |
| 94 | + "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC / msr@tsc@", |
| 95 | + "MetricGroup": "Summary", |
| 96 | + "MetricName": "CPU_Utilization" |
| 97 | + }, |
| 98 | + { |
| 99 | + "BriefDescription": "Giga Floating Point Operations Per Second", |
| 100 | + "MetricExpr": "(( 1*( FP_ARITH_INST_RETIRED.SCALAR_SINGLE + FP_ARITH_INST_RETIRED.SCALAR_DOUBLE ) + 2* FP_ARITH_INST_RETIRED.128B_PACKED_DOUBLE + 4*( FP_ARITH_INST_RETIRED.128B_PACKED_SINGLE + FP_ARITH_INST_RETIRED.256B_PACKED_DOUBLE ) + 8* FP_ARITH_INST_RETIRED.256B_PACKED_SINGLE )) / 1000000000 / duration_time", |
| 101 | + "MetricGroup": "FLOPS;Summary", |
| 102 | + "MetricName": "GFLOPs" |
| 103 | + }, |
| 104 | + { |
| 105 | + "BriefDescription": "Average Frequency Utilization relative nominal frequency", |
| 106 | + "MetricExpr": "CPU_CLK_UNHALTED.THREAD / CPU_CLK_UNHALTED.REF_TSC", |
| 107 | + "MetricGroup": "Power", |
| 108 | + "MetricName": "Turbo_Utilization" |
| 109 | + }, |
| 110 | + { |
| 111 | + "BriefDescription": "Fraction of cycles where both hardware threads were active", |
| 112 | + "MetricExpr": "1 - CPU_CLK_THREAD_UNHALTED.ONE_THREAD_ACTIVE / ( CPU_CLK_THREAD_UNHALTED.REF_XCLK_ANY / 2 ) if #SMT_on else 0", |
| 113 | + "MetricGroup": "SMT;Summary", |
| 114 | + "MetricName": "SMT_2T_Utilization" |
| 115 | + }, |
| 116 | + { |
| 117 | + "BriefDescription": "Fraction of cycles spent in Kernel mode", |
| 118 | + "MetricExpr": "CPU_CLK_UNHALTED.REF_TSC:u / CPU_CLK_UNHALTED.REF_TSC", |
| 119 | + "MetricGroup": "Summary", |
| 120 | + "MetricName": "Kernel_Utilization" |
| 121 | + }, |
| 122 | + { |
| 123 | + "BriefDescription": "C3 residency percent per core", |
| 124 | + "MetricExpr": "(cstate_core@c3\\-residency@ / msr@tsc@) * 100", |
| 125 | + "MetricGroup": "Power", |
| 126 | + "MetricName": "C3_Core_Residency" |
| 127 | + }, |
| 128 | + { |
| 129 | + "BriefDescription": "C6 residency percent per core", |
| 130 | + "MetricExpr": "(cstate_core@c6\\-residency@ / msr@tsc@) * 100", |
| 131 | + "MetricGroup": "Power", |
| 132 | + "MetricName": "C6_Core_Residency" |
| 133 | + }, |
| 134 | + { |
| 135 | + "BriefDescription": "C7 residency percent per core", |
| 136 | + "MetricExpr": "(cstate_core@c7\\-residency@ / msr@tsc@) * 100", |
| 137 | + "MetricGroup": "Power", |
| 138 | + "MetricName": "C7_Core_Residency" |
| 139 | + }, |
| 140 | + { |
| 141 | + "BriefDescription": "C2 residency percent per package", |
| 142 | + "MetricExpr": "(cstate_pkg@c2\\-residency@ / msr@tsc@) * 100", |
| 143 | + "MetricGroup": "Power", |
| 144 | + "MetricName": "C2_Pkg_Residency" |
| 145 | + }, |
| 146 | + { |
| 147 | + "BriefDescription": "C3 residency percent per package", |
| 148 | + "MetricExpr": "(cstate_pkg@c3\\-residency@ / msr@tsc@) * 100", |
| 149 | + "MetricGroup": "Power", |
| 150 | + "MetricName": "C3_Pkg_Residency" |
| 151 | + }, |
| 152 | + { |
| 153 | + "BriefDescription": "C6 residency percent per package", |
| 154 | + "MetricExpr": "(cstate_pkg@c6\\-residency@ / msr@tsc@) * 100", |
| 155 | + "MetricGroup": "Power", |
| 156 | + "MetricName": "C6_Pkg_Residency" |
| 157 | + }, |
| 158 | + { |
| 159 | + "BriefDescription": "C7 residency percent per package", |
| 160 | + "MetricExpr": "(cstate_pkg@c7\\-residency@ / msr@tsc@) * 100", |
| 161 | + "MetricGroup": "Power", |
| 162 | + "MetricName": "C7_Pkg_Residency" |
| 163 | + } |
| 164 | +] |
0 commit comments