at v6.3-rc1 299 lines 8.3 kB view raw
1/* SPDX-License-Identifier: GPL-2.0 */ 2#ifndef __PERF_STATS_H 3#define __PERF_STATS_H 4 5#include <linux/types.h> 6#include <stdio.h> 7#include <sys/types.h> 8#include <sys/resource.h> 9#include "cpumap.h" 10#include "rblist.h" 11#include "counts.h" 12 13struct perf_cpu_map; 14struct perf_stat_config; 15struct timespec; 16 17struct stats { 18 double n, mean, M2; 19 u64 max, min; 20}; 21 22enum perf_stat_evsel_id { 23 PERF_STAT_EVSEL_ID__NONE = 0, 24 PERF_STAT_EVSEL_ID__CYCLES_IN_TX, 25 PERF_STAT_EVSEL_ID__TRANSACTION_START, 26 PERF_STAT_EVSEL_ID__ELISION_START, 27 PERF_STAT_EVSEL_ID__CYCLES_IN_TX_CP, 28 PERF_STAT_EVSEL_ID__TOPDOWN_TOTAL_SLOTS, 29 PERF_STAT_EVSEL_ID__TOPDOWN_SLOTS_ISSUED, 30 PERF_STAT_EVSEL_ID__TOPDOWN_SLOTS_RETIRED, 31 PERF_STAT_EVSEL_ID__TOPDOWN_FETCH_BUBBLES, 32 PERF_STAT_EVSEL_ID__TOPDOWN_RECOVERY_BUBBLES, 33 PERF_STAT_EVSEL_ID__TOPDOWN_RETIRING, 34 PERF_STAT_EVSEL_ID__TOPDOWN_BAD_SPEC, 35 PERF_STAT_EVSEL_ID__TOPDOWN_FE_BOUND, 36 PERF_STAT_EVSEL_ID__TOPDOWN_BE_BOUND, 37 PERF_STAT_EVSEL_ID__TOPDOWN_HEAVY_OPS, 38 PERF_STAT_EVSEL_ID__TOPDOWN_BR_MISPREDICT, 39 PERF_STAT_EVSEL_ID__TOPDOWN_FETCH_LAT, 40 PERF_STAT_EVSEL_ID__TOPDOWN_MEM_BOUND, 41 PERF_STAT_EVSEL_ID__SMI_NUM, 42 PERF_STAT_EVSEL_ID__APERF, 43 PERF_STAT_EVSEL_ID__MAX, 44}; 45 46/* hold aggregated event info */ 47struct perf_stat_aggr { 48 /* aggregated values */ 49 struct perf_counts_values counts; 50 /* number of entries (CPUs) aggregated */ 51 int nr; 52 /* whether any entry has failed to read/process event */ 53 bool failed; 54 /* to mark this data is processed already */ 55 bool used; 56}; 57 58/* per-evsel event stats */ 59struct perf_stat_evsel { 60 /* used for repeated runs */ 61 struct stats res_stats; 62 /* evsel id for quick check */ 63 enum perf_stat_evsel_id id; 64 /* number of allocated 'aggr' */ 65 int nr_aggr; 66 /* aggregated event values */ 67 struct perf_stat_aggr *aggr; 68 /* used for group read */ 69 u64 *group_data; 70}; 71 72enum aggr_mode { 73 AGGR_NONE, 74 AGGR_GLOBAL, 75 AGGR_SOCKET, 76 AGGR_DIE, 77 AGGR_CORE, 78 AGGR_THREAD, 79 AGGR_UNSET, 80 AGGR_NODE, 81 AGGR_MAX 82}; 83 84enum { 85 CTX_BIT_USER = 1 << 0, 86 CTX_BIT_KERNEL = 1 << 1, 87 CTX_BIT_HV = 1 << 2, 88 CTX_BIT_HOST = 1 << 3, 89 CTX_BIT_IDLE = 1 << 4, 90 CTX_BIT_MAX = 1 << 5, 91}; 92 93#define NUM_CTX CTX_BIT_MAX 94 95enum stat_type { 96 STAT_NONE = 0, 97 STAT_NSECS, 98 STAT_CYCLES, 99 STAT_STALLED_CYCLES_FRONT, 100 STAT_STALLED_CYCLES_BACK, 101 STAT_BRANCHES, 102 STAT_CACHEREFS, 103 STAT_L1_DCACHE, 104 STAT_L1_ICACHE, 105 STAT_LL_CACHE, 106 STAT_ITLB_CACHE, 107 STAT_DTLB_CACHE, 108 STAT_CYCLES_IN_TX, 109 STAT_TRANSACTION, 110 STAT_ELISION, 111 STAT_TOPDOWN_TOTAL_SLOTS, 112 STAT_TOPDOWN_SLOTS_ISSUED, 113 STAT_TOPDOWN_SLOTS_RETIRED, 114 STAT_TOPDOWN_FETCH_BUBBLES, 115 STAT_TOPDOWN_RECOVERY_BUBBLES, 116 STAT_TOPDOWN_RETIRING, 117 STAT_TOPDOWN_BAD_SPEC, 118 STAT_TOPDOWN_FE_BOUND, 119 STAT_TOPDOWN_BE_BOUND, 120 STAT_TOPDOWN_HEAVY_OPS, 121 STAT_TOPDOWN_BR_MISPREDICT, 122 STAT_TOPDOWN_FETCH_LAT, 123 STAT_TOPDOWN_MEM_BOUND, 124 STAT_SMI_NUM, 125 STAT_APERF, 126 STAT_MAX 127}; 128 129struct runtime_stat { 130 struct rblist value_list; 131}; 132 133struct rusage_stats { 134 struct stats ru_utime_usec_stat; 135 struct stats ru_stime_usec_stat; 136}; 137 138typedef struct aggr_cpu_id (*aggr_get_id_t)(struct perf_stat_config *config, struct perf_cpu cpu); 139 140struct perf_stat_config { 141 enum aggr_mode aggr_mode; 142 bool scale; 143 bool no_inherit; 144 bool identifier; 145 bool csv_output; 146 bool json_output; 147 bool interval_clear; 148 bool metric_only; 149 bool null_run; 150 bool ru_display; 151 bool big_num; 152 bool no_merge; 153 bool hybrid_merge; 154 bool walltime_run_table; 155 bool all_kernel; 156 bool all_user; 157 bool percore_show_thread; 158 bool summary; 159 bool no_csv_summary; 160 bool metric_no_group; 161 bool metric_no_merge; 162 bool stop_read_counter; 163 bool iostat_run; 164 char *user_requested_cpu_list; 165 bool system_wide; 166 FILE *output; 167 unsigned int interval; 168 unsigned int timeout; 169 int initial_delay; 170 unsigned int unit_width; 171 unsigned int metric_only_len; 172 int times; 173 int run_count; 174 int print_free_counters_hint; 175 int print_mixed_hw_group_error; 176 const char *csv_sep; 177 struct stats *walltime_nsecs_stats; 178 struct rusage ru_data; 179 struct rusage_stats *ru_stats; 180 struct cpu_aggr_map *aggr_map; 181 aggr_get_id_t aggr_get_id; 182 struct cpu_aggr_map *cpus_aggr_map; 183 u64 *walltime_run; 184 struct rblist metric_events; 185 int ctl_fd; 186 int ctl_fd_ack; 187 bool ctl_fd_close; 188 const char *cgroup_list; 189 unsigned int topdown_level; 190}; 191 192void perf_stat__set_big_num(int set); 193void perf_stat__set_no_csv_summary(int set); 194 195void update_stats(struct stats *stats, u64 val); 196double avg_stats(struct stats *stats); 197double stddev_stats(struct stats *stats); 198double rel_stddev_stats(double stddev, double avg); 199 200static inline void init_stats(struct stats *stats) 201{ 202 stats->n = 0.0; 203 stats->mean = 0.0; 204 stats->M2 = 0.0; 205 stats->min = (u64) -1; 206 stats->max = 0; 207} 208 209static inline void init_rusage_stats(struct rusage_stats *ru_stats) { 210 init_stats(&ru_stats->ru_utime_usec_stat); 211 init_stats(&ru_stats->ru_stime_usec_stat); 212} 213 214static inline void update_rusage_stats(struct rusage_stats *ru_stats, struct rusage* rusage) { 215 const u64 us_to_ns = 1000; 216 const u64 s_to_ns = 1000000000; 217 update_stats(&ru_stats->ru_utime_usec_stat, 218 (rusage->ru_utime.tv_usec * us_to_ns + rusage->ru_utime.tv_sec * s_to_ns)); 219 update_stats(&ru_stats->ru_stime_usec_stat, 220 (rusage->ru_stime.tv_usec * us_to_ns + rusage->ru_stime.tv_sec * s_to_ns)); 221} 222 223struct evsel; 224struct evlist; 225 226bool __perf_stat_evsel__is(struct evsel *evsel, enum perf_stat_evsel_id id); 227 228#define perf_stat_evsel__is(evsel, id) \ 229 __perf_stat_evsel__is(evsel, PERF_STAT_EVSEL_ID__ ## id) 230 231extern struct runtime_stat rt_stat; 232extern struct stats walltime_nsecs_stats; 233extern struct rusage_stats ru_stats; 234 235typedef void (*print_metric_t)(struct perf_stat_config *config, 236 void *ctx, const char *color, const char *unit, 237 const char *fmt, double val); 238typedef void (*new_line_t)(struct perf_stat_config *config, void *ctx); 239 240void runtime_stat__init(struct runtime_stat *st); 241void runtime_stat__exit(struct runtime_stat *st); 242void perf_stat__init_shadow_stats(void); 243void perf_stat__reset_shadow_stats(void); 244void perf_stat__reset_shadow_per_stat(struct runtime_stat *st); 245void perf_stat__update_shadow_stats(struct evsel *counter, u64 count, 246 int map_idx, struct runtime_stat *st); 247struct perf_stat_output_ctx { 248 void *ctx; 249 print_metric_t print_metric; 250 new_line_t new_line; 251 bool force_header; 252}; 253 254void perf_stat__print_shadow_stats(struct perf_stat_config *config, 255 struct evsel *evsel, 256 double avg, int map_idx, 257 struct perf_stat_output_ctx *out, 258 struct rblist *metric_events, 259 struct runtime_stat *st); 260 261int evlist__alloc_stats(struct perf_stat_config *config, 262 struct evlist *evlist, bool alloc_raw); 263void evlist__free_stats(struct evlist *evlist); 264void evlist__reset_stats(struct evlist *evlist); 265void evlist__reset_prev_raw_counts(struct evlist *evlist); 266void evlist__copy_prev_raw_counts(struct evlist *evlist); 267void evlist__save_aggr_prev_raw_counts(struct evlist *evlist); 268 269int evlist__alloc_aggr_stats(struct evlist *evlist, int nr_aggr); 270void evlist__reset_aggr_stats(struct evlist *evlist); 271 272int perf_stat_process_counter(struct perf_stat_config *config, 273 struct evsel *counter); 274void perf_stat_merge_counters(struct perf_stat_config *config, struct evlist *evlist); 275void perf_stat_process_percore(struct perf_stat_config *config, struct evlist *evlist); 276void perf_stat_process_shadow_stats(struct perf_stat_config *config, struct evlist *evlist); 277 278struct perf_tool; 279union perf_event; 280struct perf_session; 281struct target; 282 283int perf_event__process_stat_event(struct perf_session *session, 284 union perf_event *event); 285 286size_t perf_event__fprintf_stat(union perf_event *event, FILE *fp); 287size_t perf_event__fprintf_stat_round(union perf_event *event, FILE *fp); 288size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp); 289 290int create_perf_stat_counter(struct evsel *evsel, 291 struct perf_stat_config *config, 292 struct target *target, 293 int cpu_map_idx); 294void evlist__print_counters(struct evlist *evlist, struct perf_stat_config *config, 295 struct target *_target, struct timespec *ts, int argc, const char **argv); 296 297struct metric_expr; 298double test_generic_metric(struct metric_expr *mexp, int map_idx, struct runtime_stat *st); 299#endif