at v6.3-rc6 298 lines 8.3 kB view raw
1/* SPDX-License-Identifier: GPL-2.0 */ 2#ifndef __PERF_STATS_H 3#define __PERF_STATS_H 4 5#include <linux/types.h> 6#include <stdio.h> 7#include <sys/types.h> 8#include <sys/resource.h> 9#include "cpumap.h" 10#include "rblist.h" 11#include "counts.h" 12 13struct perf_cpu_map; 14struct perf_stat_config; 15struct timespec; 16 17struct stats { 18 double n, mean, M2; 19 u64 max, min; 20}; 21 22enum perf_stat_evsel_id { 23 PERF_STAT_EVSEL_ID__NONE = 0, 24 PERF_STAT_EVSEL_ID__CYCLES_IN_TX, 25 PERF_STAT_EVSEL_ID__TRANSACTION_START, 26 PERF_STAT_EVSEL_ID__ELISION_START, 27 PERF_STAT_EVSEL_ID__CYCLES_IN_TX_CP, 28 PERF_STAT_EVSEL_ID__TOPDOWN_TOTAL_SLOTS, 29 PERF_STAT_EVSEL_ID__TOPDOWN_SLOTS_ISSUED, 30 PERF_STAT_EVSEL_ID__TOPDOWN_SLOTS_RETIRED, 31 PERF_STAT_EVSEL_ID__TOPDOWN_FETCH_BUBBLES, 32 PERF_STAT_EVSEL_ID__TOPDOWN_RECOVERY_BUBBLES, 33 PERF_STAT_EVSEL_ID__TOPDOWN_RETIRING, 34 PERF_STAT_EVSEL_ID__TOPDOWN_BAD_SPEC, 35 PERF_STAT_EVSEL_ID__TOPDOWN_FE_BOUND, 36 PERF_STAT_EVSEL_ID__TOPDOWN_BE_BOUND, 37 PERF_STAT_EVSEL_ID__TOPDOWN_HEAVY_OPS, 38 PERF_STAT_EVSEL_ID__TOPDOWN_BR_MISPREDICT, 39 PERF_STAT_EVSEL_ID__TOPDOWN_FETCH_LAT, 40 PERF_STAT_EVSEL_ID__TOPDOWN_MEM_BOUND, 41 PERF_STAT_EVSEL_ID__SMI_NUM, 42 PERF_STAT_EVSEL_ID__APERF, 43 PERF_STAT_EVSEL_ID__MAX, 44}; 45 46/* hold aggregated event info */ 47struct perf_stat_aggr { 48 /* aggregated values */ 49 struct perf_counts_values counts; 50 /* number of entries (CPUs) aggregated */ 51 int nr; 52 /* whether any entry has failed to read/process event */ 53 bool failed; 54 /* to mark this data is processed already */ 55 bool used; 56}; 57 58/* per-evsel event stats */ 59struct perf_stat_evsel { 60 /* used for repeated runs */ 61 struct stats res_stats; 62 /* evsel id for quick check */ 63 enum perf_stat_evsel_id id; 64 /* number of allocated 'aggr' */ 65 int nr_aggr; 66 /* aggregated event values */ 67 struct perf_stat_aggr *aggr; 68 /* used for group read */ 69 u64 *group_data; 70}; 71 72enum aggr_mode { 73 AGGR_NONE, 74 AGGR_GLOBAL, 75 AGGR_SOCKET, 76 AGGR_DIE, 77 AGGR_CORE, 78 AGGR_THREAD, 79 AGGR_UNSET, 80 AGGR_NODE, 81 AGGR_MAX 82}; 83 84enum { 85 CTX_BIT_USER = 1 << 0, 86 CTX_BIT_KERNEL = 1 << 1, 87 CTX_BIT_HV = 1 << 2, 88 CTX_BIT_HOST = 1 << 3, 89 CTX_BIT_IDLE = 1 << 4, 90 CTX_BIT_MAX = 1 << 5, 91}; 92 93#define NUM_CTX CTX_BIT_MAX 94 95enum stat_type { 96 STAT_NONE = 0, 97 STAT_NSECS, 98 STAT_CYCLES, 99 STAT_STALLED_CYCLES_FRONT, 100 STAT_STALLED_CYCLES_BACK, 101 STAT_BRANCHES, 102 STAT_CACHEREFS, 103 STAT_L1_DCACHE, 104 STAT_L1_ICACHE, 105 STAT_LL_CACHE, 106 STAT_ITLB_CACHE, 107 STAT_DTLB_CACHE, 108 STAT_CYCLES_IN_TX, 109 STAT_TRANSACTION, 110 STAT_ELISION, 111 STAT_TOPDOWN_TOTAL_SLOTS, 112 STAT_TOPDOWN_SLOTS_ISSUED, 113 STAT_TOPDOWN_SLOTS_RETIRED, 114 STAT_TOPDOWN_FETCH_BUBBLES, 115 STAT_TOPDOWN_RECOVERY_BUBBLES, 116 STAT_TOPDOWN_RETIRING, 117 STAT_TOPDOWN_BAD_SPEC, 118 STAT_TOPDOWN_FE_BOUND, 119 STAT_TOPDOWN_BE_BOUND, 120 STAT_TOPDOWN_HEAVY_OPS, 121 STAT_TOPDOWN_BR_MISPREDICT, 122 STAT_TOPDOWN_FETCH_LAT, 123 STAT_TOPDOWN_MEM_BOUND, 124 STAT_SMI_NUM, 125 STAT_APERF, 126 STAT_MAX 127}; 128 129struct runtime_stat { 130 struct rblist value_list; 131}; 132 133struct rusage_stats { 134 struct stats ru_utime_usec_stat; 135 struct stats ru_stime_usec_stat; 136}; 137 138typedef struct aggr_cpu_id (*aggr_get_id_t)(struct perf_stat_config *config, struct perf_cpu cpu); 139 140struct perf_stat_config { 141 enum aggr_mode aggr_mode; 142 bool scale; 143 bool no_inherit; 144 bool identifier; 145 bool csv_output; 146 bool json_output; 147 bool interval_clear; 148 bool metric_only; 149 bool null_run; 150 bool ru_display; 151 bool big_num; 152 bool no_merge; 153 bool hybrid_merge; 154 bool walltime_run_table; 155 bool all_kernel; 156 bool all_user; 157 bool percore_show_thread; 158 bool summary; 159 bool no_csv_summary; 160 bool metric_no_group; 161 bool metric_no_merge; 162 bool stop_read_counter; 163 bool iostat_run; 164 char *user_requested_cpu_list; 165 bool system_wide; 166 FILE *output; 167 unsigned int interval; 168 unsigned int timeout; 169 unsigned int unit_width; 170 unsigned int metric_only_len; 171 int times; 172 int run_count; 173 int print_free_counters_hint; 174 int print_mixed_hw_group_error; 175 const char *csv_sep; 176 struct stats *walltime_nsecs_stats; 177 struct rusage ru_data; 178 struct rusage_stats *ru_stats; 179 struct cpu_aggr_map *aggr_map; 180 aggr_get_id_t aggr_get_id; 181 struct cpu_aggr_map *cpus_aggr_map; 182 u64 *walltime_run; 183 struct rblist metric_events; 184 int ctl_fd; 185 int ctl_fd_ack; 186 bool ctl_fd_close; 187 const char *cgroup_list; 188 unsigned int topdown_level; 189}; 190 191void perf_stat__set_big_num(int set); 192void perf_stat__set_no_csv_summary(int set); 193 194void update_stats(struct stats *stats, u64 val); 195double avg_stats(struct stats *stats); 196double stddev_stats(struct stats *stats); 197double rel_stddev_stats(double stddev, double avg); 198 199static inline void init_stats(struct stats *stats) 200{ 201 stats->n = 0.0; 202 stats->mean = 0.0; 203 stats->M2 = 0.0; 204 stats->min = (u64) -1; 205 stats->max = 0; 206} 207 208static inline void init_rusage_stats(struct rusage_stats *ru_stats) { 209 init_stats(&ru_stats->ru_utime_usec_stat); 210 init_stats(&ru_stats->ru_stime_usec_stat); 211} 212 213static inline void update_rusage_stats(struct rusage_stats *ru_stats, struct rusage* rusage) { 214 const u64 us_to_ns = 1000; 215 const u64 s_to_ns = 1000000000; 216 update_stats(&ru_stats->ru_utime_usec_stat, 217 (rusage->ru_utime.tv_usec * us_to_ns + rusage->ru_utime.tv_sec * s_to_ns)); 218 update_stats(&ru_stats->ru_stime_usec_stat, 219 (rusage->ru_stime.tv_usec * us_to_ns + rusage->ru_stime.tv_sec * s_to_ns)); 220} 221 222struct evsel; 223struct evlist; 224 225bool __perf_stat_evsel__is(struct evsel *evsel, enum perf_stat_evsel_id id); 226 227#define perf_stat_evsel__is(evsel, id) \ 228 __perf_stat_evsel__is(evsel, PERF_STAT_EVSEL_ID__ ## id) 229 230extern struct runtime_stat rt_stat; 231extern struct stats walltime_nsecs_stats; 232extern struct rusage_stats ru_stats; 233 234typedef void (*print_metric_t)(struct perf_stat_config *config, 235 void *ctx, const char *color, const char *unit, 236 const char *fmt, double val); 237typedef void (*new_line_t)(struct perf_stat_config *config, void *ctx); 238 239void runtime_stat__init(struct runtime_stat *st); 240void runtime_stat__exit(struct runtime_stat *st); 241void perf_stat__init_shadow_stats(void); 242void perf_stat__reset_shadow_stats(void); 243void perf_stat__reset_shadow_per_stat(struct runtime_stat *st); 244void perf_stat__update_shadow_stats(struct evsel *counter, u64 count, 245 int map_idx, struct runtime_stat *st); 246struct perf_stat_output_ctx { 247 void *ctx; 248 print_metric_t print_metric; 249 new_line_t new_line; 250 bool force_header; 251}; 252 253void perf_stat__print_shadow_stats(struct perf_stat_config *config, 254 struct evsel *evsel, 255 double avg, int map_idx, 256 struct perf_stat_output_ctx *out, 257 struct rblist *metric_events, 258 struct runtime_stat *st); 259 260int evlist__alloc_stats(struct perf_stat_config *config, 261 struct evlist *evlist, bool alloc_raw); 262void evlist__free_stats(struct evlist *evlist); 263void evlist__reset_stats(struct evlist *evlist); 264void evlist__reset_prev_raw_counts(struct evlist *evlist); 265void evlist__copy_prev_raw_counts(struct evlist *evlist); 266void evlist__save_aggr_prev_raw_counts(struct evlist *evlist); 267 268int evlist__alloc_aggr_stats(struct evlist *evlist, int nr_aggr); 269void evlist__reset_aggr_stats(struct evlist *evlist); 270 271int perf_stat_process_counter(struct perf_stat_config *config, 272 struct evsel *counter); 273void perf_stat_merge_counters(struct perf_stat_config *config, struct evlist *evlist); 274void perf_stat_process_percore(struct perf_stat_config *config, struct evlist *evlist); 275void perf_stat_process_shadow_stats(struct perf_stat_config *config, struct evlist *evlist); 276 277struct perf_tool; 278union perf_event; 279struct perf_session; 280struct target; 281 282int perf_event__process_stat_event(struct perf_session *session, 283 union perf_event *event); 284 285size_t perf_event__fprintf_stat(union perf_event *event, FILE *fp); 286size_t perf_event__fprintf_stat_round(union perf_event *event, FILE *fp); 287size_t perf_event__fprintf_stat_config(union perf_event *event, FILE *fp); 288 289int create_perf_stat_counter(struct evsel *evsel, 290 struct perf_stat_config *config, 291 struct target *target, 292 int cpu_map_idx); 293void evlist__print_counters(struct evlist *evlist, struct perf_stat_config *config, 294 struct target *_target, struct timespec *ts, int argc, const char **argv); 295 296struct metric_expr; 297double test_generic_metric(struct metric_expr *mexp, int map_idx, struct runtime_stat *st); 298#endif