| 1 | #include <stdlib.h> |
| 2 | #include <stdio.h> |
| 3 | #include <inttypes.h> |
| 4 | #include <linux/string.h> |
| 5 | #include <linux/time64.h> |
| 6 | #include <math.h> |
| 7 | #include <perf/cpumap.h> |
| 8 | #include "color.h" |
| 9 | #include "counts.h" |
| 10 | #include "debug.h" |
| 11 | #include "evlist.h" |
| 12 | #include "evsel.h" |
| 13 | #include "stat.h" |
| 14 | #include "top.h" |
| 15 | #include "thread_map.h" |
| 16 | #include "cpumap.h" |
| 17 | #include "string2.h" |
| 18 | #include <linux/ctype.h> |
| 19 | #include "cgroup.h" |
| 20 | #include <api/fs/fs.h> |
| 21 | #include "util.h" |
| 22 | #include "iostat.h" |
| 23 | #include "pmu.h" |
| 24 | #include "pmus.h" |
| 25 | #include "tool_pmu.h" |
| 26 | |
/* Text printed in place of a counter value that could not be obtained. */
#define CNTR_NOT_SUPPORTED	"<not supported>"
#define CNTR_NOT_COUNTED	"<not counted>"

/* Field widths (in characters) used when laying out output columns. */
#define MGROUP_LEN	50
#define METRIC_LEN	38
#define EVNAME_LEN	32
#define COUNTS_LEN	18
#define INTERVAL_LEN	16
#define CGROUP_LEN	16
#define COMM_LEN	16
#define PID_LEN		7
#define CPUS_LEN	4
| 39 | |
| 40 | static int [] = { |
| 41 | [AGGR_CORE] = 18, |
| 42 | [AGGR_CACHE] = 22, |
| 43 | [AGGR_CLUSTER] = 20, |
| 44 | [AGGR_DIE] = 12, |
| 45 | [AGGR_SOCKET] = 6, |
| 46 | [AGGR_NODE] = 6, |
| 47 | [AGGR_NONE] = 6, |
| 48 | [AGGR_THREAD] = 16, |
| 49 | [AGGR_GLOBAL] = 0, |
| 50 | }; |
| 51 | |
| 52 | static const char *[] = { |
| 53 | [AGGR_CORE] = "core,ctrs," , |
| 54 | [AGGR_CACHE] = "cache,ctrs," , |
| 55 | [AGGR_CLUSTER] = "cluster,ctrs," , |
| 56 | [AGGR_DIE] = "die,ctrs," , |
| 57 | [AGGR_SOCKET] = "socket,ctrs," , |
| 58 | [AGGR_NONE] = "cpu," , |
| 59 | [AGGR_THREAD] = "comm-pid," , |
| 60 | [AGGR_NODE] = "node," , |
| 61 | [AGGR_GLOBAL] = "" |
| 62 | }; |
| 63 | |
| 64 | static const char *[] = { |
| 65 | [AGGR_CORE] = "core" , |
| 66 | [AGGR_CACHE] = "cache" , |
| 67 | [AGGR_CLUSTER] = "cluster" , |
| 68 | [AGGR_DIE] = "die" , |
| 69 | [AGGR_SOCKET] = "socket" , |
| 70 | [AGGR_NONE] = "cpu" , |
| 71 | [AGGR_THREAD] = "comm-pid" , |
| 72 | [AGGR_NODE] = "node" , |
| 73 | [AGGR_GLOBAL] = "" |
| 74 | }; |
| 75 | |
| 76 | const char *metric_threshold_classify__color(enum metric_threshold_classify thresh) |
| 77 | { |
| 78 | const char * const colors[] = { |
| 79 | "" , /* unknown */ |
| 80 | PERF_COLOR_RED, /* bad */ |
| 81 | PERF_COLOR_MAGENTA, /* nearly bad */ |
| 82 | PERF_COLOR_YELLOW, /* less good */ |
| 83 | PERF_COLOR_GREEN, /* good */ |
| 84 | }; |
| 85 | static_assert(ARRAY_SIZE(colors) - 1 == METRIC_THRESHOLD_GOOD, "missing enum value" ); |
| 86 | return colors[thresh]; |
| 87 | } |
| 88 | |
| 89 | static const char *metric_threshold_classify__str(enum metric_threshold_classify thresh) |
| 90 | { |
| 91 | const char * const strs[] = { |
| 92 | "unknown" , |
| 93 | "bad" , |
| 94 | "nearly bad" , |
| 95 | "less good" , |
| 96 | "good" , |
| 97 | }; |
| 98 | static_assert(ARRAY_SIZE(strs) - 1 == METRIC_THRESHOLD_GOOD, "missing enum value" ); |
| 99 | return strs[thresh]; |
| 100 | } |
| 101 | |
| 102 | static void print_running_std(struct perf_stat_config *config, u64 run, u64 ena) |
| 103 | { |
| 104 | if (run != ena) |
| 105 | fprintf(config->output, " (%.2f%%)" , 100.0 * run / ena); |
| 106 | } |
| 107 | |
| 108 | static void print_running_csv(struct perf_stat_config *config, u64 run, u64 ena) |
| 109 | { |
| 110 | double enabled_percent = 100; |
| 111 | |
| 112 | if (run != ena) |
| 113 | enabled_percent = 100 * run / ena; |
| 114 | fprintf(config->output, "%s%" PRIu64 "%s%.2f" , |
| 115 | config->csv_sep, run, config->csv_sep, enabled_percent); |
| 116 | } |
| 117 | struct outstate { |
| 118 | /* Std mode: insert a newline before the next metric */ |
| 119 | bool newline; |
| 120 | /* JSON mode: track need for comma for a previous field or not */ |
| 121 | bool first; |
| 122 | /* Num CSV separators remaining to pad out when not all fields are printed */ |
| 123 | int csv_col_pad; |
| 124 | |
| 125 | /* |
| 126 | * The following don't track state across fields, but are here as a shortcut to |
| 127 | * pass data to the print functions. The alternative would be to update the |
| 128 | * function signatures of the entire print stack to pass them through. |
| 129 | */ |
| 130 | /* Place to output to */ |
| 131 | FILE * const fh; |
| 132 | /* Lines are timestamped in --interval-print mode */ |
| 133 | char timestamp[64]; |
| 134 | /* Num items aggregated in current line. See struct perf_stat_aggr.nr */ |
| 135 | int aggr_nr; |
| 136 | /* Core/socket/die etc ID for the current line */ |
| 137 | struct aggr_cpu_id id; |
| 138 | /* Event for current line */ |
| 139 | struct evsel *evsel; |
| 140 | /* Cgroup for current line */ |
| 141 | struct cgroup *cgrp; |
| 142 | }; |
| 143 | |
| 144 | static const char *json_sep(struct outstate *os) |
| 145 | { |
| 146 | const char *sep = os->first ? "" : ", " ; |
| 147 | |
| 148 | os->first = false; |
| 149 | return sep; |
| 150 | } |
| 151 | |
/* fprintf() to os->fh, prefixed with whatever json_sep() says is needed. */
#define json_out(os, format, ...) \
	fprintf((os)->fh, "%s" format, json_sep(os), ##__VA_ARGS__)
| 153 | |
| 154 | static void print_running_json(struct outstate *os, u64 run, u64 ena) |
| 155 | { |
| 156 | double enabled_percent = 100; |
| 157 | |
| 158 | if (run != ena) |
| 159 | enabled_percent = 100 * run / ena; |
| 160 | json_out(os, "\"event-runtime\" : %" PRIu64 ", \"pcnt-running\" : %.2f" , |
| 161 | run, enabled_percent); |
| 162 | } |
| 163 | |
| 164 | static void print_running(struct perf_stat_config *config, struct outstate *os, |
| 165 | u64 run, u64 ena, bool before_metric) |
| 166 | { |
| 167 | if (config->json_output) { |
| 168 | if (before_metric) |
| 169 | print_running_json(os, run, ena); |
| 170 | } else if (config->csv_output) { |
| 171 | if (before_metric) |
| 172 | print_running_csv(config, run, ena); |
| 173 | } else { |
| 174 | if (!before_metric) |
| 175 | print_running_std(config, run, ena); |
| 176 | } |
| 177 | } |
| 178 | |
| 179 | static void print_noise_pct_std(struct perf_stat_config *config, |
| 180 | double pct) |
| 181 | { |
| 182 | if (pct) |
| 183 | fprintf(config->output, " ( +-%6.2f%% )" , pct); |
| 184 | } |
| 185 | |
| 186 | static void print_noise_pct_csv(struct perf_stat_config *config, |
| 187 | double pct) |
| 188 | { |
| 189 | fprintf(config->output, "%s%.2f%%" , config->csv_sep, pct); |
| 190 | } |
| 191 | |
/* JSON output: emit the noise percentage as the "variance" field. */
static void print_noise_pct_json(struct outstate *os,
				 double pct)
{
	json_out(os, "\"variance\" : %.2f", pct);
}
| 197 | |
| 198 | static void print_noise_pct(struct perf_stat_config *config, struct outstate *os, |
| 199 | double total, double avg, bool before_metric) |
| 200 | { |
| 201 | double pct = rel_stddev_stats(stddev: total, avg); |
| 202 | |
| 203 | if (config->json_output) { |
| 204 | if (before_metric) |
| 205 | print_noise_pct_json(os, pct); |
| 206 | } else if (config->csv_output) { |
| 207 | if (before_metric) |
| 208 | print_noise_pct_csv(config, pct); |
| 209 | } else { |
| 210 | if (!before_metric) |
| 211 | print_noise_pct_std(config, pct); |
| 212 | } |
| 213 | } |
| 214 | |
| 215 | static void print_noise(struct perf_stat_config *config, struct outstate *os, |
| 216 | struct evsel *evsel, double avg, bool before_metric) |
| 217 | { |
| 218 | struct perf_stat_evsel *ps; |
| 219 | |
| 220 | if (config->run_count == 1) |
| 221 | return; |
| 222 | |
| 223 | ps = evsel->stats; |
| 224 | print_noise_pct(config, os, total: stddev_stats(stats: &ps->res_stats), avg, before_metric); |
| 225 | } |
| 226 | |
| 227 | static void print_cgroup_std(struct perf_stat_config *config, const char *cgrp_name) |
| 228 | { |
| 229 | fprintf(config->output, " %-*s" , CGROUP_LEN, cgrp_name); |
| 230 | } |
| 231 | |
| 232 | static void print_cgroup_csv(struct perf_stat_config *config, const char *cgrp_name) |
| 233 | { |
| 234 | fprintf(config->output, "%s%s" , config->csv_sep, cgrp_name); |
| 235 | } |
| 236 | |
/* JSON output: emit the cgroup name as the "cgroup" field. */
static void print_cgroup_json(struct outstate *os, const char *cgrp_name)
{
	json_out(os, "\"cgroup\" : \"%s\"", cgrp_name);
}
| 241 | |
| 242 | static void print_cgroup(struct perf_stat_config *config, struct outstate *os, |
| 243 | struct cgroup *cgrp) |
| 244 | { |
| 245 | if (nr_cgroups || config->cgroup_list) { |
| 246 | const char *cgrp_name = cgrp ? cgrp->name : "" ; |
| 247 | |
| 248 | if (config->json_output) |
| 249 | print_cgroup_json(os, cgrp_name); |
| 250 | else if (config->csv_output) |
| 251 | print_cgroup_csv(config, cgrp_name); |
| 252 | else |
| 253 | print_cgroup_std(config, cgrp_name); |
| 254 | } |
| 255 | } |
| 256 | |
| 257 | static void print_aggr_id_std(struct perf_stat_config *config, |
| 258 | struct evsel *evsel, struct aggr_cpu_id id, int aggr_nr) |
| 259 | { |
| 260 | FILE *output = config->output; |
| 261 | int idx = config->aggr_mode; |
| 262 | char buf[128]; |
| 263 | |
| 264 | switch (config->aggr_mode) { |
| 265 | case AGGR_CORE: |
| 266 | snprintf(buf, size: sizeof(buf), fmt: "S%d-D%d-C%d" , id.socket, id.die, id.core); |
| 267 | break; |
| 268 | case AGGR_CACHE: |
| 269 | snprintf(buf, size: sizeof(buf), fmt: "S%d-D%d-L%d-ID%d" , |
| 270 | id.socket, id.die, id.cache_lvl, id.cache); |
| 271 | break; |
| 272 | case AGGR_CLUSTER: |
| 273 | snprintf(buf, size: sizeof(buf), fmt: "S%d-D%d-CLS%d" , id.socket, id.die, id.cluster); |
| 274 | break; |
| 275 | case AGGR_DIE: |
| 276 | snprintf(buf, size: sizeof(buf), fmt: "S%d-D%d" , id.socket, id.die); |
| 277 | break; |
| 278 | case AGGR_SOCKET: |
| 279 | snprintf(buf, size: sizeof(buf), fmt: "S%d" , id.socket); |
| 280 | break; |
| 281 | case AGGR_NODE: |
| 282 | snprintf(buf, size: sizeof(buf), fmt: "N%d" , id.node); |
| 283 | break; |
| 284 | case AGGR_NONE: |
| 285 | if (evsel->percore && !config->percore_show_thread) { |
| 286 | snprintf(buf, size: sizeof(buf), fmt: "S%d-D%d-C%d " , |
| 287 | id.socket, id.die, id.core); |
| 288 | fprintf(output, "%-*s " , |
| 289 | aggr_header_lens[AGGR_CORE], buf); |
| 290 | } else if (id.cpu.cpu > -1) { |
| 291 | fprintf(output, "CPU%-*d " , |
| 292 | aggr_header_lens[AGGR_NONE] - 3, id.cpu.cpu); |
| 293 | } |
| 294 | return; |
| 295 | case AGGR_THREAD: |
| 296 | fprintf(output, "%*s-%-*d " , |
| 297 | COMM_LEN, perf_thread_map__comm(evsel->core.threads, id.thread_idx), |
| 298 | PID_LEN, perf_thread_map__pid(evsel->core.threads, id.thread_idx)); |
| 299 | return; |
| 300 | case AGGR_GLOBAL: |
| 301 | case AGGR_UNSET: |
| 302 | case AGGR_MAX: |
| 303 | default: |
| 304 | return; |
| 305 | } |
| 306 | |
| 307 | fprintf(output, "%-*s %*d " , aggr_header_lens[idx], buf, /*strlen("ctrs")*/ 4, aggr_nr); |
| 308 | } |
| 309 | |
| 310 | static void print_aggr_id_csv(struct perf_stat_config *config, |
| 311 | struct evsel *evsel, struct aggr_cpu_id id, int aggr_nr) |
| 312 | { |
| 313 | FILE *output = config->output; |
| 314 | const char *sep = config->csv_sep; |
| 315 | |
| 316 | switch (config->aggr_mode) { |
| 317 | case AGGR_CORE: |
| 318 | fprintf(output, "S%d-D%d-C%d%s%d%s" , |
| 319 | id.socket, id.die, id.core, sep, aggr_nr, sep); |
| 320 | break; |
| 321 | case AGGR_CACHE: |
| 322 | fprintf(config->output, "S%d-D%d-L%d-ID%d%s%d%s" , |
| 323 | id.socket, id.die, id.cache_lvl, id.cache, sep, aggr_nr, sep); |
| 324 | break; |
| 325 | case AGGR_CLUSTER: |
| 326 | fprintf(config->output, "S%d-D%d-CLS%d%s%d%s" , |
| 327 | id.socket, id.die, id.cluster, sep, aggr_nr, sep); |
| 328 | break; |
| 329 | case AGGR_DIE: |
| 330 | fprintf(output, "S%d-D%d%s%d%s" , |
| 331 | id.socket, id.die, sep, aggr_nr, sep); |
| 332 | break; |
| 333 | case AGGR_SOCKET: |
| 334 | fprintf(output, "S%d%s%d%s" , |
| 335 | id.socket, sep, aggr_nr, sep); |
| 336 | break; |
| 337 | case AGGR_NODE: |
| 338 | fprintf(output, "N%d%s%d%s" , |
| 339 | id.node, sep, aggr_nr, sep); |
| 340 | break; |
| 341 | case AGGR_NONE: |
| 342 | if (evsel->percore && !config->percore_show_thread) { |
| 343 | fprintf(output, "S%d-D%d-C%d%s" , |
| 344 | id.socket, id.die, id.core, sep); |
| 345 | } else if (id.cpu.cpu > -1) { |
| 346 | fprintf(output, "CPU%d%s" , |
| 347 | id.cpu.cpu, sep); |
| 348 | } |
| 349 | break; |
| 350 | case AGGR_THREAD: |
| 351 | fprintf(output, "%s-%d%s" , |
| 352 | perf_thread_map__comm(evsel->core.threads, id.thread_idx), |
| 353 | perf_thread_map__pid(evsel->core.threads, id.thread_idx), |
| 354 | sep); |
| 355 | break; |
| 356 | case AGGR_GLOBAL: |
| 357 | case AGGR_UNSET: |
| 358 | case AGGR_MAX: |
| 359 | default: |
| 360 | break; |
| 361 | } |
| 362 | } |
| 363 | |
| 364 | static void print_aggr_id_json(struct perf_stat_config *config, struct outstate *os, |
| 365 | struct evsel *evsel, struct aggr_cpu_id id, int aggr_nr) |
| 366 | { |
| 367 | switch (config->aggr_mode) { |
| 368 | case AGGR_CORE: |
| 369 | json_out(os, "\"core\" : \"S%d-D%d-C%d\", \"counters\" : %d" , |
| 370 | id.socket, id.die, id.core, aggr_nr); |
| 371 | break; |
| 372 | case AGGR_CACHE: |
| 373 | json_out(os, "\"cache\" : \"S%d-D%d-L%d-ID%d\", \"counters\" : %d" , |
| 374 | id.socket, id.die, id.cache_lvl, id.cache, aggr_nr); |
| 375 | break; |
| 376 | case AGGR_CLUSTER: |
| 377 | json_out(os, "\"cluster\" : \"S%d-D%d-CLS%d\", \"counters\" : %d" , |
| 378 | id.socket, id.die, id.cluster, aggr_nr); |
| 379 | break; |
| 380 | case AGGR_DIE: |
| 381 | json_out(os, "\"die\" : \"S%d-D%d\", \"counters\" : %d" , |
| 382 | id.socket, id.die, aggr_nr); |
| 383 | break; |
| 384 | case AGGR_SOCKET: |
| 385 | json_out(os, "\"socket\" : \"S%d\", \"counters\" : %d" , |
| 386 | id.socket, aggr_nr); |
| 387 | break; |
| 388 | case AGGR_NODE: |
| 389 | json_out(os, "\"node\" : \"N%d\", \"counters\" : %d" , |
| 390 | id.node, aggr_nr); |
| 391 | break; |
| 392 | case AGGR_NONE: |
| 393 | if (evsel->percore && !config->percore_show_thread) { |
| 394 | json_out(os, "\"core\" : \"S%d-D%d-C%d\"" , |
| 395 | id.socket, id.die, id.core); |
| 396 | } else if (id.cpu.cpu > -1) { |
| 397 | json_out(os, "\"cpu\" : \"%d\"" , |
| 398 | id.cpu.cpu); |
| 399 | } |
| 400 | break; |
| 401 | case AGGR_THREAD: |
| 402 | json_out(os, "\"thread\" : \"%s-%d\"" , |
| 403 | perf_thread_map__comm(evsel->core.threads, id.thread_idx), |
| 404 | perf_thread_map__pid(evsel->core.threads, id.thread_idx)); |
| 405 | break; |
| 406 | case AGGR_GLOBAL: |
| 407 | case AGGR_UNSET: |
| 408 | case AGGR_MAX: |
| 409 | default: |
| 410 | break; |
| 411 | } |
| 412 | } |
| 413 | |
| 414 | static void aggr_printout(struct perf_stat_config *config, struct outstate *os, |
| 415 | struct evsel *evsel, struct aggr_cpu_id id, int aggr_nr) |
| 416 | { |
| 417 | if (config->json_output) |
| 418 | print_aggr_id_json(config, os, evsel, id, aggr_nr); |
| 419 | else if (config->csv_output) |
| 420 | print_aggr_id_csv(config, evsel, id, aggr_nr); |
| 421 | else |
| 422 | print_aggr_id_std(config, evsel, id, aggr_nr); |
| 423 | } |
| 424 | |
| 425 | static void new_line_std(struct perf_stat_config *config __maybe_unused, |
| 426 | void *ctx) |
| 427 | { |
| 428 | struct outstate *os = ctx; |
| 429 | |
| 430 | os->newline = true; |
| 431 | } |
| 432 | |
| 433 | static inline void __new_line_std_csv(struct perf_stat_config *config, |
| 434 | struct outstate *os) |
| 435 | { |
| 436 | fputc('\n', os->fh); |
| 437 | if (config->interval) |
| 438 | fputs(os->timestamp, os->fh); |
| 439 | aggr_printout(config, os, evsel: os->evsel, id: os->id, aggr_nr: os->aggr_nr); |
| 440 | } |
| 441 | |
| 442 | static inline void __new_line_std(struct perf_stat_config *config, struct outstate *os) |
| 443 | { |
| 444 | fprintf(os->fh, "%*s" , COUNTS_LEN + EVNAME_LEN + config->unit_width + 2, "" ); |
| 445 | } |
| 446 | |
| 447 | static void do_new_line_std(struct perf_stat_config *config, |
| 448 | struct outstate *os) |
| 449 | { |
| 450 | __new_line_std_csv(config, os); |
| 451 | if (config->aggr_mode == AGGR_NONE) |
| 452 | fprintf(os->fh, " " ); |
| 453 | __new_line_std(config, os); |
| 454 | } |
| 455 | |
| 456 | static void print_metric_std(struct perf_stat_config *config, |
| 457 | void *ctx, enum metric_threshold_classify thresh, |
| 458 | const char *fmt, const char *unit, double val) |
| 459 | { |
| 460 | struct outstate *os = ctx; |
| 461 | FILE *out = os->fh; |
| 462 | int n; |
| 463 | bool newline = os->newline; |
| 464 | const char *color = metric_threshold_classify__color(thresh); |
| 465 | |
| 466 | os->newline = false; |
| 467 | |
| 468 | if (unit == NULL || fmt == NULL) { |
| 469 | fprintf(out, "%-*s" , METRIC_LEN, "" ); |
| 470 | return; |
| 471 | } |
| 472 | |
| 473 | if (newline) |
| 474 | do_new_line_std(config, os); |
| 475 | |
| 476 | n = fprintf(out, " # " ); |
| 477 | if (color) |
| 478 | n += color_fprintf(out, color, fmt, val); |
| 479 | else |
| 480 | n += fprintf(out, fmt, val); |
| 481 | fprintf(out, " %-*s" , METRIC_LEN - n - 1, unit); |
| 482 | } |
| 483 | |
| 484 | static void new_line_csv(struct perf_stat_config *config, void *ctx) |
| 485 | { |
| 486 | struct outstate *os = ctx; |
| 487 | int i; |
| 488 | |
| 489 | __new_line_std_csv(config, os); |
| 490 | for (i = 0; i < os->csv_col_pad; i++) |
| 491 | fputs(config->csv_sep, os->fh); |
| 492 | } |
| 493 | |
| 494 | static void print_metric_csv(struct perf_stat_config *config __maybe_unused, |
| 495 | void *ctx, |
| 496 | enum metric_threshold_classify thresh __maybe_unused, |
| 497 | const char *fmt, const char *unit, double val) |
| 498 | { |
| 499 | struct outstate *os = ctx; |
| 500 | FILE *out = os->fh; |
| 501 | char buf[64], *vals, *ends; |
| 502 | |
| 503 | if (unit == NULL || fmt == NULL) { |
| 504 | fprintf(out, "%s%s" , config->csv_sep, config->csv_sep); |
| 505 | return; |
| 506 | } |
| 507 | snprintf(buf, size: sizeof(buf), fmt, val); |
| 508 | ends = vals = skip_spaces(buf); |
| 509 | while (isdigit(c: *ends) || *ends == '.') |
| 510 | ends++; |
| 511 | *ends = 0; |
| 512 | fprintf(out, "%s%s%s%s" , config->csv_sep, vals, config->csv_sep, skip_spaces(unit)); |
| 513 | } |
| 514 | |
| 515 | static void print_metric_json(struct perf_stat_config *config __maybe_unused, |
| 516 | void *ctx, |
| 517 | enum metric_threshold_classify thresh, |
| 518 | const char *fmt __maybe_unused, |
| 519 | const char *unit, double val) |
| 520 | { |
| 521 | struct outstate *os = ctx; |
| 522 | FILE *out = os->fh; |
| 523 | |
| 524 | if (unit) { |
| 525 | json_out(os, "\"metric-value\" : \"%f\", \"metric-unit\" : \"%s\"" , val, unit); |
| 526 | if (thresh != METRIC_THRESHOLD_UNKNOWN) { |
| 527 | json_out(os, "\"metric-threshold\" : \"%s\"" , |
| 528 | metric_threshold_classify__str(thresh)); |
| 529 | } |
| 530 | } |
| 531 | if (!config->metric_only) |
| 532 | fprintf(out, "}" ); |
| 533 | } |
| 534 | |
| 535 | static void new_line_json(struct perf_stat_config *config, void *ctx) |
| 536 | { |
| 537 | struct outstate *os = ctx; |
| 538 | |
| 539 | fputs("\n{" , os->fh); |
| 540 | os->first = true; |
| 541 | if (config->interval) |
| 542 | json_out(os, "%s" , os->timestamp); |
| 543 | |
| 544 | aggr_printout(config, os, evsel: os->evsel, id: os->id, aggr_nr: os->aggr_nr); |
| 545 | } |
| 546 | |
/*
 * JSON metricgroup header callback: emit the metricgroup name, close the
 * current object and open a new one for the metrics that follow. Does
 * nothing when no name is given.
 */
static void print_metricgroup_header_json(struct perf_stat_config *config,
					  void *ctx,
					  const char *metricgroup_name)
{
	if (!metricgroup_name)
		return;

	json_out((struct outstate *) ctx, "\"metricgroup\" : \"%s\"}", metricgroup_name);
	new_line_json(config, ctx);
}
| 557 | |
| 558 | static void (struct perf_stat_config *config, |
| 559 | void *ctx, |
| 560 | const char *metricgroup_name) |
| 561 | { |
| 562 | struct outstate *os = ctx; |
| 563 | int i; |
| 564 | |
| 565 | if (!metricgroup_name) { |
| 566 | /* Leave space for running and enabling */ |
| 567 | for (i = 0; i < os->csv_col_pad - 2; i++) |
| 568 | fputs(config->csv_sep, os->fh); |
| 569 | return; |
| 570 | } |
| 571 | |
| 572 | for (i = 0; i < os->csv_col_pad; i++) |
| 573 | fputs(config->csv_sep, os->fh); |
| 574 | fprintf(config->output, "%s" , metricgroup_name); |
| 575 | new_line_csv(config, ctx); |
| 576 | } |
| 577 | |
| 578 | static void (struct perf_stat_config *config, |
| 579 | void *ctx, |
| 580 | const char *metricgroup_name) |
| 581 | { |
| 582 | struct outstate *os = ctx; |
| 583 | int n; |
| 584 | |
| 585 | if (!metricgroup_name) { |
| 586 | __new_line_std(config, os); |
| 587 | return; |
| 588 | } |
| 589 | |
| 590 | n = fprintf(config->output, " %*s" , EVNAME_LEN, metricgroup_name); |
| 591 | |
| 592 | fprintf(config->output, "%*s" , MGROUP_LEN + config->unit_width + 2 - n, "" ); |
| 593 | } |
| 594 | |
| 595 | static void print_metric_only(struct perf_stat_config *config, |
| 596 | void *ctx, enum metric_threshold_classify thresh, |
| 597 | const char *fmt, const char *unit, double val) |
| 598 | { |
| 599 | struct outstate *os = ctx; |
| 600 | FILE *out = os->fh; |
| 601 | char str[1024]; |
| 602 | unsigned mlen = config->metric_only_len; |
| 603 | const char *color = metric_threshold_classify__color(thresh); |
| 604 | |
| 605 | if (!unit) |
| 606 | unit = "" ; |
| 607 | if (mlen < strlen(unit)) |
| 608 | mlen = strlen(unit) + 1; |
| 609 | |
| 610 | if (color) |
| 611 | mlen += strlen(color) + sizeof(PERF_COLOR_RESET) - 1; |
| 612 | |
| 613 | color_snprintf(bf: str, size: sizeof(str), color: color ?: "" , fmt: fmt ?: "" , val); |
| 614 | fprintf(out, "%*s " , mlen, str); |
| 615 | os->first = false; |
| 616 | } |
| 617 | |
| 618 | static void print_metric_only_csv(struct perf_stat_config *config __maybe_unused, |
| 619 | void *ctx, |
| 620 | enum metric_threshold_classify thresh __maybe_unused, |
| 621 | const char *fmt, |
| 622 | const char *unit __maybe_unused, double val) |
| 623 | { |
| 624 | struct outstate *os = ctx; |
| 625 | FILE *out = os->fh; |
| 626 | char buf[64], *vals, *ends; |
| 627 | |
| 628 | if (!unit) |
| 629 | return; |
| 630 | |
| 631 | snprintf(buf, size: sizeof(buf), fmt: fmt ?: "" , val); |
| 632 | ends = vals = skip_spaces(buf); |
| 633 | while (isdigit(c: *ends) || *ends == '.') |
| 634 | ends++; |
| 635 | *ends = 0; |
| 636 | fprintf(out, "%s%s" , vals, config->csv_sep); |
| 637 | os->first = false; |
| 638 | } |
| 639 | |
| 640 | static void print_metric_only_json(struct perf_stat_config *config __maybe_unused, |
| 641 | void *ctx, |
| 642 | enum metric_threshold_classify thresh __maybe_unused, |
| 643 | const char *fmt, |
| 644 | const char *unit, double val) |
| 645 | { |
| 646 | struct outstate *os = ctx; |
| 647 | char buf[64], *ends; |
| 648 | const char *vals; |
| 649 | |
| 650 | if (!unit || !unit[0]) |
| 651 | return; |
| 652 | snprintf(buf, size: sizeof(buf), fmt: fmt ?: "" , val); |
| 653 | vals = ends = skip_spaces(buf); |
| 654 | while (isdigit(c: *ends) || *ends == '.') |
| 655 | ends++; |
| 656 | *ends = 0; |
| 657 | if (!vals[0]) |
| 658 | vals = "none" ; |
| 659 | json_out(os, "\"%s\" : \"%s\"" , unit, vals); |
| 660 | } |
| 661 | |
| 662 | static void (struct perf_stat_config *config, |
| 663 | void *ctx, |
| 664 | enum metric_threshold_classify thresh __maybe_unused, |
| 665 | const char *fmt __maybe_unused, |
| 666 | const char *unit, double val __maybe_unused) |
| 667 | { |
| 668 | struct outstate *os = ctx; |
| 669 | |
| 670 | /* In case of iostat, print metric header for first root port only */ |
| 671 | if (config->iostat_run && |
| 672 | os->evsel->priv != os->evsel->evlist->selected->priv) |
| 673 | return; |
| 674 | |
| 675 | if (os->evsel->cgrp != os->cgrp) |
| 676 | return; |
| 677 | |
| 678 | if (!unit) |
| 679 | return; |
| 680 | |
| 681 | if (config->json_output) |
| 682 | return; |
| 683 | else if (config->csv_output) |
| 684 | fprintf(os->fh, "%s%s" , unit, config->csv_sep); |
| 685 | else |
| 686 | fprintf(os->fh, "%*s " , config->metric_only_len, unit); |
| 687 | } |
| 688 | |
| 689 | static void print_counter_value_std(struct perf_stat_config *config, |
| 690 | struct evsel *evsel, double avg, bool ok) |
| 691 | { |
| 692 | FILE *output = config->output; |
| 693 | double sc = evsel->scale; |
| 694 | const char *fmt; |
| 695 | const char *bad_count = evsel->supported ? CNTR_NOT_COUNTED : CNTR_NOT_SUPPORTED; |
| 696 | |
| 697 | if (config->big_num) |
| 698 | fmt = floor(sc) != sc ? "%'*.2f " : "%'*.0f " ; |
| 699 | else |
| 700 | fmt = floor(sc) != sc ? "%*.2f " : "%*.0f " ; |
| 701 | |
| 702 | if (ok) |
| 703 | fprintf(output, fmt, COUNTS_LEN, avg); |
| 704 | else |
| 705 | fprintf(output, "%*s " , COUNTS_LEN, bad_count); |
| 706 | |
| 707 | if (evsel->unit) |
| 708 | fprintf(output, "%-*s " , config->unit_width, evsel->unit); |
| 709 | |
| 710 | fprintf(output, "%-*s" , EVNAME_LEN, evsel__name(evsel)); |
| 711 | } |
| 712 | |
| 713 | static void print_counter_value_csv(struct perf_stat_config *config, |
| 714 | struct evsel *evsel, double avg, bool ok) |
| 715 | { |
| 716 | FILE *output = config->output; |
| 717 | double sc = evsel->scale; |
| 718 | const char *sep = config->csv_sep; |
| 719 | const char *fmt = floor(sc) != sc ? "%.2f%s" : "%.0f%s" ; |
| 720 | const char *bad_count = evsel->supported ? CNTR_NOT_COUNTED : CNTR_NOT_SUPPORTED; |
| 721 | |
| 722 | if (ok) |
| 723 | fprintf(output, fmt, avg, sep); |
| 724 | else |
| 725 | fprintf(output, "%s%s" , bad_count, sep); |
| 726 | |
| 727 | if (evsel->unit) |
| 728 | fprintf(output, "%s%s" , evsel->unit, sep); |
| 729 | |
| 730 | fprintf(output, "%s" , evsel__name(evsel)); |
| 731 | } |
| 732 | |
| 733 | static void print_counter_value_json(struct outstate *os, |
| 734 | struct evsel *evsel, double avg, bool ok) |
| 735 | { |
| 736 | const char *bad_count = evsel->supported ? CNTR_NOT_COUNTED : CNTR_NOT_SUPPORTED; |
| 737 | |
| 738 | if (ok) |
| 739 | json_out(os, "\"counter-value\" : \"%f\"" , avg); |
| 740 | else |
| 741 | json_out(os, "\"counter-value\" : \"%s\"" , bad_count); |
| 742 | |
| 743 | if (evsel->unit) |
| 744 | json_out(os, "\"unit\" : \"%s\"" , evsel->unit); |
| 745 | |
| 746 | json_out(os, "\"event\" : \"%s\"" , evsel__name(evsel)); |
| 747 | } |
| 748 | |
| 749 | static void print_counter_value(struct perf_stat_config *config, struct outstate *os, |
| 750 | struct evsel *evsel, double avg, bool ok) |
| 751 | { |
| 752 | if (config->json_output) |
| 753 | print_counter_value_json(os, evsel, avg, ok); |
| 754 | else if (config->csv_output) |
| 755 | print_counter_value_csv(config, evsel, avg, ok); |
| 756 | else |
| 757 | print_counter_value_std(config, evsel, avg, ok); |
| 758 | } |
| 759 | |
| 760 | static void abs_printout(struct perf_stat_config *config, |
| 761 | struct outstate *os, |
| 762 | struct aggr_cpu_id id, int aggr_nr, |
| 763 | struct evsel *evsel, double avg, bool ok) |
| 764 | { |
| 765 | aggr_printout(config, os, evsel, id, aggr_nr); |
| 766 | print_counter_value(config, os, evsel, avg, ok); |
| 767 | print_cgroup(config, os, cgrp: evsel->cgrp); |
| 768 | } |
| 769 | |
| 770 | static bool evlist__has_hybrid_pmus(struct evlist *evlist) |
| 771 | { |
| 772 | struct evsel *evsel; |
| 773 | struct perf_pmu *last_core_pmu = NULL; |
| 774 | |
| 775 | if (perf_pmus__num_core_pmus() == 1) |
| 776 | return false; |
| 777 | |
| 778 | evlist__for_each_entry(evlist, evsel) { |
| 779 | if (evsel->core.is_pmu_core) { |
| 780 | struct perf_pmu *pmu = evsel__find_pmu(evsel); |
| 781 | |
| 782 | if (pmu == last_core_pmu) |
| 783 | continue; |
| 784 | |
| 785 | if (last_core_pmu == NULL) { |
| 786 | last_core_pmu = pmu; |
| 787 | continue; |
| 788 | } |
| 789 | /* A distinct core PMU. */ |
| 790 | return true; |
| 791 | } |
| 792 | } |
| 793 | |
| 794 | return false; |
| 795 | } |
| 796 | |
| 797 | static void printout(struct perf_stat_config *config, struct outstate *os, |
| 798 | double uval, u64 run, u64 ena, double noise, int aggr_idx) |
| 799 | { |
| 800 | struct perf_stat_output_ctx out; |
| 801 | print_metric_t pm; |
| 802 | new_line_t nl; |
| 803 | print_metricgroup_header_t pmh; |
| 804 | bool ok = true; |
| 805 | struct evsel *counter = os->evsel; |
| 806 | |
| 807 | if (config->csv_output) { |
| 808 | pm = config->metric_only ? print_metric_only_csv : print_metric_csv; |
| 809 | nl = config->metric_only ? NULL : new_line_csv; |
| 810 | pmh = print_metricgroup_header_csv; |
| 811 | os->csv_col_pad = 4 + (counter->cgrp ? 1 : 0); |
| 812 | } else if (config->json_output) { |
| 813 | pm = config->metric_only ? print_metric_only_json : print_metric_json; |
| 814 | nl = config->metric_only ? NULL : new_line_json; |
| 815 | pmh = print_metricgroup_header_json; |
| 816 | } else { |
| 817 | pm = config->metric_only ? print_metric_only : print_metric_std; |
| 818 | nl = config->metric_only ? NULL : new_line_std; |
| 819 | pmh = print_metricgroup_header_std; |
| 820 | } |
| 821 | |
| 822 | if (run == 0 || ena == 0 || counter->counts->scaled == -1) { |
| 823 | if (config->metric_only) { |
| 824 | pm(config, os, METRIC_THRESHOLD_UNKNOWN, /*format=*/NULL, |
| 825 | /*unit=*/NULL, /*val=*/0); |
| 826 | return; |
| 827 | } |
| 828 | |
| 829 | ok = false; |
| 830 | |
| 831 | if (counter->supported) { |
| 832 | if (!evlist__has_hybrid_pmus(evlist: counter->evlist)) { |
| 833 | config->print_free_counters_hint = 1; |
| 834 | } |
| 835 | } |
| 836 | } |
| 837 | |
| 838 | out.print_metric = pm; |
| 839 | out.new_line = nl; |
| 840 | out.print_metricgroup_header = pmh; |
| 841 | out.ctx = os; |
| 842 | out.force_header = false; |
| 843 | |
| 844 | if (!config->metric_only && (!counter->default_metricgroup || counter->default_show_events)) { |
| 845 | abs_printout(config, os, id: os->id, aggr_nr: os->aggr_nr, evsel: counter, avg: uval, ok); |
| 846 | |
| 847 | print_noise(config, os, evsel: counter, avg: noise, /*before_metric=*/true); |
| 848 | print_running(config, os, run, ena, /*before_metric=*/true); |
| 849 | } |
| 850 | |
| 851 | if (ok) { |
| 852 | if (!config->metric_only && counter->default_metricgroup && !counter->default_show_events) { |
| 853 | void *from = NULL; |
| 854 | |
| 855 | aggr_printout(config, os, evsel: os->evsel, id: os->id, aggr_nr: os->aggr_nr); |
| 856 | /* Print out all the metricgroup with the same metric event. */ |
| 857 | do { |
| 858 | int num = 0; |
| 859 | |
| 860 | /* Print out the new line for the next new metricgroup. */ |
| 861 | if (from) { |
| 862 | if (config->json_output) |
| 863 | new_line_json(config, ctx: (void *)os); |
| 864 | else |
| 865 | __new_line_std_csv(config, os); |
| 866 | } |
| 867 | |
| 868 | print_noise(config, os, evsel: counter, avg: noise, /*before_metric=*/true); |
| 869 | print_running(config, os, run, ena, /*before_metric=*/true); |
| 870 | from = perf_stat__print_shadow_stats_metricgroup(config, evsel: counter, aggr_idx, |
| 871 | num: &num, from, out: &out); |
| 872 | } while (from != NULL); |
| 873 | } else { |
| 874 | perf_stat__print_shadow_stats(config, evsel: counter, aggr_idx, out: &out); |
| 875 | } |
| 876 | } else { |
| 877 | pm(config, os, METRIC_THRESHOLD_UNKNOWN, /*format=*/NULL, /*unit=*/NULL, /*val=*/0); |
| 878 | } |
| 879 | |
| 880 | if (!config->metric_only) { |
| 881 | print_noise(config, os, evsel: counter, avg: noise, /*before_metric=*/false); |
| 882 | print_running(config, os, run, ena, /*before_metric=*/false); |
| 883 | } |
| 884 | } |
| 885 | |
| 886 | /** |
| 887 | * should_skip_zero_count() - Check if the event should print 0 values. |
| 888 | * @config: The perf stat configuration (including aggregation mode). |
| 889 | * @counter: The evsel with its associated cpumap. |
| 890 | * @id: The aggregation id that is being queried. |
| 891 | * |
| 892 | * Due to mismatch between the event cpumap or thread-map and the |
| 893 | * aggregation mode, sometimes it'd iterate the counter with the map |
| 894 | * which does not contain any values. |
| 895 | * |
| 896 | * For example, uncore events have dedicated CPUs to manage them, |
| 897 | * result for other CPUs should be zero and skipped. |
| 898 | * |
| 899 | * Return: %true if the value should NOT be printed, %false if the value |
| 900 | * needs to be printed like "<not counted>" or "<not supported>". |
| 901 | */ |
| 902 | static bool should_skip_zero_counter(struct perf_stat_config *config, |
| 903 | struct evsel *counter, |
| 904 | const struct aggr_cpu_id *id) |
| 905 | { |
| 906 | struct perf_cpu cpu; |
| 907 | int idx; |
| 908 | |
| 909 | /* |
| 910 | * Skip unsupported default events when not verbose. (default events |
| 911 | * are all marked 'skippable'). |
| 912 | */ |
| 913 | if (verbose == 0 && counter->skippable && !counter->supported) |
| 914 | return true; |
| 915 | |
| 916 | /* Metric only counts won't be displayed but the metric wants to be computed. */ |
| 917 | if (config->metric_only) |
| 918 | return false; |
| 919 | /* |
| 920 | * Skip value 0 when enabling --per-thread globally, |
| 921 | * otherwise it will have too many 0 output. |
| 922 | */ |
| 923 | if (config->aggr_mode == AGGR_THREAD && config->system_wide) |
| 924 | return true; |
| 925 | |
| 926 | /* |
| 927 | * In per-thread mode the aggr_map and aggr_get_id functions may be |
| 928 | * NULL, assume all 0 values should be output in that case. |
| 929 | */ |
| 930 | if (!config->aggr_map || !config->aggr_get_id) |
| 931 | return false; |
| 932 | |
| 933 | /* |
| 934 | * Tool events may be gathered on all logical CPUs, for example |
| 935 | * system_time, but for many the first index is the only one used, for |
| 936 | * example num_cores. Don't skip for the first index. |
| 937 | */ |
| 938 | if (evsel__is_tool(evsel: counter)) { |
| 939 | struct aggr_cpu_id own_id = |
| 940 | config->aggr_get_id(config, (struct perf_cpu){ .cpu = 0 }); |
| 941 | |
| 942 | return !aggr_cpu_id__equal(a: id, b: &own_id); |
| 943 | } |
| 944 | /* |
| 945 | * Skip value 0 when the counter's cpumask doesn't match the given aggr |
| 946 | * id. |
| 947 | */ |
| 948 | |
| 949 | perf_cpu_map__for_each_cpu(cpu, idx, counter->core.cpus) { |
| 950 | struct aggr_cpu_id own_id = config->aggr_get_id(config, cpu); |
| 951 | |
| 952 | if (aggr_cpu_id__equal(a: id, b: &own_id)) |
| 953 | return false; |
| 954 | } |
| 955 | return true; |
| 956 | } |
| 957 | |
| 958 | static void print_counter_aggrdata(struct perf_stat_config *config, |
| 959 | struct evsel *counter, int aggr_idx, |
| 960 | struct outstate *os) |
| 961 | { |
| 962 | FILE *output = config->output; |
| 963 | u64 ena, run, val; |
| 964 | double uval; |
| 965 | struct perf_stat_evsel *ps = counter->stats; |
| 966 | struct perf_stat_aggr *aggr = &ps->aggr[aggr_idx]; |
| 967 | struct aggr_cpu_id id = config->aggr_map->map[aggr_idx]; |
| 968 | double avg = aggr->counts.val; |
| 969 | bool metric_only = config->metric_only; |
| 970 | |
| 971 | os->id = id; |
| 972 | os->aggr_nr = aggr->nr; |
| 973 | os->evsel = counter; |
| 974 | |
| 975 | /* Skip already merged uncore/hybrid events */ |
| 976 | if (config->aggr_mode != AGGR_NONE) { |
| 977 | if (evsel__is_hybrid(evsel: counter)) { |
| 978 | if (config->hybrid_merge && counter->first_wildcard_match != NULL) |
| 979 | return; |
| 980 | } else { |
| 981 | if (counter->first_wildcard_match != NULL) |
| 982 | return; |
| 983 | } |
| 984 | } |
| 985 | |
| 986 | val = aggr->counts.val; |
| 987 | ena = aggr->counts.ena; |
| 988 | run = aggr->counts.run; |
| 989 | |
| 990 | if (perf_stat__skip_metric_event(evsel: counter, ena, run)) |
| 991 | return; |
| 992 | |
| 993 | if (val == 0 && should_skip_zero_counter(config, counter, id: &id)) |
| 994 | return; |
| 995 | |
| 996 | if (!metric_only) { |
| 997 | if (config->json_output) { |
| 998 | os->first = true; |
| 999 | fputc('{', output); |
| 1000 | } |
| 1001 | if (config->interval) { |
| 1002 | if (config->json_output) |
| 1003 | json_out(os, "%s" , os->timestamp); |
| 1004 | else |
| 1005 | fprintf(output, "%s" , os->timestamp); |
| 1006 | } else if (config->summary && config->csv_output && |
| 1007 | !config->no_csv_summary) |
| 1008 | fprintf(output, "%s%s" , "summary" , config->csv_sep); |
| 1009 | } |
| 1010 | |
| 1011 | uval = val * counter->scale; |
| 1012 | |
| 1013 | printout(config, os, uval, run, ena, noise: avg, aggr_idx); |
| 1014 | |
| 1015 | if (!metric_only) |
| 1016 | fputc('\n', output); |
| 1017 | } |
| 1018 | |
| 1019 | static void print_metric_begin(struct perf_stat_config *config, |
| 1020 | struct evlist *evlist, |
| 1021 | struct outstate *os, int aggr_idx) |
| 1022 | { |
| 1023 | struct perf_stat_aggr *aggr; |
| 1024 | struct aggr_cpu_id id; |
| 1025 | struct evsel *evsel; |
| 1026 | |
| 1027 | os->first = true; |
| 1028 | if (!config->metric_only) |
| 1029 | return; |
| 1030 | |
| 1031 | if (config->json_output) |
| 1032 | fputc('{', config->output); |
| 1033 | |
| 1034 | if (config->interval) { |
| 1035 | if (config->json_output) |
| 1036 | json_out(os, "%s" , os->timestamp); |
| 1037 | else |
| 1038 | fprintf(config->output, "%s" , os->timestamp); |
| 1039 | } |
| 1040 | evsel = evlist__first(evlist); |
| 1041 | id = config->aggr_map->map[aggr_idx]; |
| 1042 | aggr = &evsel->stats->aggr[aggr_idx]; |
| 1043 | aggr_printout(config, os, evsel, id, aggr_nr: aggr->nr); |
| 1044 | |
| 1045 | print_cgroup(config, os, cgrp: os->cgrp ? : evsel->cgrp); |
| 1046 | } |
| 1047 | |
| 1048 | static void print_metric_end(struct perf_stat_config *config, struct outstate *os) |
| 1049 | { |
| 1050 | FILE *output = config->output; |
| 1051 | |
| 1052 | if (!config->metric_only) |
| 1053 | return; |
| 1054 | |
| 1055 | if (config->json_output) { |
| 1056 | if (os->first) |
| 1057 | fputs("\"metric-value\" : \"none\"" , output); |
| 1058 | fputc('}', output); |
| 1059 | } |
| 1060 | fputc('\n', output); |
| 1061 | } |
| 1062 | |
| 1063 | static void print_aggr(struct perf_stat_config *config, |
| 1064 | struct evlist *evlist, |
| 1065 | struct outstate *os) |
| 1066 | { |
| 1067 | struct evsel *counter; |
| 1068 | int aggr_idx; |
| 1069 | |
| 1070 | if (!config->aggr_map || !config->aggr_get_id) |
| 1071 | return; |
| 1072 | |
| 1073 | /* |
| 1074 | * With metric_only everything is on a single line. |
| 1075 | * Without each counter has its own line. |
| 1076 | */ |
| 1077 | cpu_aggr_map__for_each_idx(aggr_idx, config->aggr_map) { |
| 1078 | print_metric_begin(config, evlist, os, aggr_idx); |
| 1079 | |
| 1080 | evlist__for_each_entry(evlist, counter) { |
| 1081 | print_counter_aggrdata(config, counter, aggr_idx, os); |
| 1082 | } |
| 1083 | print_metric_end(config, os); |
| 1084 | } |
| 1085 | } |
| 1086 | |
| 1087 | static void print_aggr_cgroup(struct perf_stat_config *config, |
| 1088 | struct evlist *evlist, |
| 1089 | struct outstate *os) |
| 1090 | { |
| 1091 | struct evsel *counter, *evsel; |
| 1092 | int aggr_idx; |
| 1093 | |
| 1094 | if (!config->aggr_map || !config->aggr_get_id) |
| 1095 | return; |
| 1096 | |
| 1097 | evlist__for_each_entry(evlist, evsel) { |
| 1098 | if (os->cgrp == evsel->cgrp) |
| 1099 | continue; |
| 1100 | |
| 1101 | os->cgrp = evsel->cgrp; |
| 1102 | |
| 1103 | cpu_aggr_map__for_each_idx(aggr_idx, config->aggr_map) { |
| 1104 | print_metric_begin(config, evlist, os, aggr_idx); |
| 1105 | |
| 1106 | evlist__for_each_entry(evlist, counter) { |
| 1107 | if (counter->cgrp != os->cgrp) |
| 1108 | continue; |
| 1109 | |
| 1110 | print_counter_aggrdata(config, counter, aggr_idx, os); |
| 1111 | } |
| 1112 | print_metric_end(config, os); |
| 1113 | } |
| 1114 | } |
| 1115 | } |
| 1116 | |
| 1117 | static void print_counter(struct perf_stat_config *config, |
| 1118 | struct evsel *counter, struct outstate *os) |
| 1119 | { |
| 1120 | int aggr_idx; |
| 1121 | |
| 1122 | /* AGGR_THREAD doesn't have config->aggr_get_id */ |
| 1123 | if (!config->aggr_map) |
| 1124 | return; |
| 1125 | |
| 1126 | cpu_aggr_map__for_each_idx(aggr_idx, config->aggr_map) { |
| 1127 | print_counter_aggrdata(config, counter, aggr_idx, os); |
| 1128 | } |
| 1129 | } |
| 1130 | |
| 1131 | static void print_no_aggr_metric(struct perf_stat_config *config, |
| 1132 | struct evlist *evlist, |
| 1133 | struct outstate *os) |
| 1134 | { |
| 1135 | int all_idx; |
| 1136 | struct perf_cpu cpu; |
| 1137 | |
| 1138 | perf_cpu_map__for_each_cpu(cpu, all_idx, evlist->core.user_requested_cpus) { |
| 1139 | struct evsel *counter; |
| 1140 | bool first = true; |
| 1141 | |
| 1142 | evlist__for_each_entry(evlist, counter) { |
| 1143 | u64 ena, run, val; |
| 1144 | double uval; |
| 1145 | struct perf_stat_evsel *ps = counter->stats; |
| 1146 | int aggr_idx = 0; |
| 1147 | |
| 1148 | if (!perf_cpu_map__has(evsel__cpus(evsel: counter), cpu)) |
| 1149 | continue; |
| 1150 | |
| 1151 | cpu_aggr_map__for_each_idx(aggr_idx, config->aggr_map) { |
| 1152 | if (config->aggr_map->map[aggr_idx].cpu.cpu == cpu.cpu) |
| 1153 | break; |
| 1154 | } |
| 1155 | |
| 1156 | os->evsel = counter; |
| 1157 | os->id = aggr_cpu_id__cpu(cpu: cpu, /*data=*/NULL); |
| 1158 | if (first) { |
| 1159 | print_metric_begin(config, evlist, os, aggr_idx); |
| 1160 | first = false; |
| 1161 | } |
| 1162 | val = ps->aggr[aggr_idx].counts.val; |
| 1163 | ena = ps->aggr[aggr_idx].counts.ena; |
| 1164 | run = ps->aggr[aggr_idx].counts.run; |
| 1165 | |
| 1166 | uval = val * counter->scale; |
| 1167 | printout(config, os, uval, run, ena, noise: 1.0, aggr_idx); |
| 1168 | } |
| 1169 | if (!first) |
| 1170 | print_metric_end(config, os); |
| 1171 | } |
| 1172 | } |
| 1173 | |
| 1174 | static void (struct perf_stat_config *config, |
| 1175 | bool no_indent) |
| 1176 | { |
| 1177 | fputc(' ', config->output); |
| 1178 | |
| 1179 | if (!no_indent) { |
| 1180 | int len = aggr_header_lens[config->aggr_mode]; |
| 1181 | |
| 1182 | if (nr_cgroups || config->cgroup_list) |
| 1183 | len += CGROUP_LEN + 1; |
| 1184 | |
| 1185 | fprintf(config->output, "%*s" , len, "" ); |
| 1186 | } |
| 1187 | } |
| 1188 | |
| 1189 | static void (struct perf_stat_config *config, |
| 1190 | bool no_indent __maybe_unused) |
| 1191 | { |
| 1192 | const char *p; |
| 1193 | |
| 1194 | if (config->interval) |
| 1195 | fprintf(config->output, "time%s" , config->csv_sep); |
| 1196 | if (config->iostat_run) |
| 1197 | return; |
| 1198 | |
| 1199 | p = aggr_header_csv[config->aggr_mode]; |
| 1200 | while (*p) { |
| 1201 | if (*p == ',') |
| 1202 | fputs(config->csv_sep, config->output); |
| 1203 | else |
| 1204 | fputc(*p, config->output); |
| 1205 | p++; |
| 1206 | } |
| 1207 | } |
| 1208 | |
| 1209 | static void (struct perf_stat_config *config __maybe_unused, |
| 1210 | bool no_indent __maybe_unused) |
| 1211 | { |
| 1212 | } |
| 1213 | |
| 1214 | static void (struct perf_stat_config *config, |
| 1215 | struct evlist *evlist, bool no_indent) |
| 1216 | { |
| 1217 | struct evsel *counter; |
| 1218 | struct outstate os = { |
| 1219 | .fh = config->output |
| 1220 | }; |
| 1221 | struct perf_stat_output_ctx out = { |
| 1222 | .ctx = &os, |
| 1223 | .print_metric = print_metric_header, |
| 1224 | .new_line = NULL, |
| 1225 | .force_header = true, |
| 1226 | }; |
| 1227 | |
| 1228 | if (config->json_output) |
| 1229 | print_metric_headers_json(config, no_indent); |
| 1230 | else if (config->csv_output) |
| 1231 | print_metric_headers_csv(config, no_indent); |
| 1232 | else |
| 1233 | print_metric_headers_std(config, no_indent); |
| 1234 | |
| 1235 | if (config->iostat_run) |
| 1236 | iostat_print_header_prefix(config); |
| 1237 | |
| 1238 | if (config->cgroup_list) |
| 1239 | os.cgrp = evlist__first(evlist)->cgrp; |
| 1240 | |
| 1241 | /* Print metrics headers only */ |
| 1242 | evlist__for_each_entry(evlist, counter) { |
| 1243 | if (!config->iostat_run && |
| 1244 | config->aggr_mode != AGGR_NONE && counter->metric_leader != counter) |
| 1245 | continue; |
| 1246 | |
| 1247 | os.evsel = counter; |
| 1248 | |
| 1249 | perf_stat__print_shadow_stats(config, evsel: counter, /*aggr_idx=*/0, out: &out); |
| 1250 | } |
| 1251 | |
| 1252 | if (!config->json_output) |
| 1253 | fputc('\n', config->output); |
| 1254 | } |
| 1255 | |
| 1256 | static void prepare_timestamp(struct perf_stat_config *config, |
| 1257 | struct outstate *os, struct timespec *ts) |
| 1258 | { |
| 1259 | if (config->iostat_run) |
| 1260 | return; |
| 1261 | |
| 1262 | if (config->json_output) |
| 1263 | scnprintf(buf: os->timestamp, size: sizeof(os->timestamp), fmt: "\"interval\" : %lu.%09lu" , |
| 1264 | (unsigned long) ts->tv_sec, ts->tv_nsec); |
| 1265 | else if (config->csv_output) |
| 1266 | scnprintf(buf: os->timestamp, size: sizeof(os->timestamp), fmt: "%lu.%09lu%s" , |
| 1267 | (unsigned long) ts->tv_sec, ts->tv_nsec, config->csv_sep); |
| 1268 | else |
| 1269 | scnprintf(buf: os->timestamp, size: sizeof(os->timestamp), fmt: "%6lu.%09lu " , |
| 1270 | (unsigned long) ts->tv_sec, ts->tv_nsec); |
| 1271 | } |
| 1272 | |
| 1273 | static void (struct perf_stat_config *config, |
| 1274 | struct target *_target __maybe_unused, |
| 1275 | struct evlist *evlist, |
| 1276 | int argc __maybe_unused, |
| 1277 | const char **argv __maybe_unused) |
| 1278 | { |
| 1279 | FILE *output = config->output; |
| 1280 | |
| 1281 | switch (config->aggr_mode) { |
| 1282 | case AGGR_NODE: |
| 1283 | case AGGR_SOCKET: |
| 1284 | case AGGR_DIE: |
| 1285 | case AGGR_CLUSTER: |
| 1286 | case AGGR_CACHE: |
| 1287 | case AGGR_CORE: |
| 1288 | fprintf(output, "#%*s %-*s ctrs" , |
| 1289 | INTERVAL_LEN - 1, "time" , |
| 1290 | aggr_header_lens[config->aggr_mode], |
| 1291 | aggr_header_std[config->aggr_mode]); |
| 1292 | break; |
| 1293 | case AGGR_NONE: |
| 1294 | fprintf(output, "#%*s %-*s" , |
| 1295 | INTERVAL_LEN - 1, "time" , |
| 1296 | aggr_header_lens[config->aggr_mode], |
| 1297 | aggr_header_std[config->aggr_mode]); |
| 1298 | break; |
| 1299 | case AGGR_THREAD: |
| 1300 | fprintf(output, "#%*s %*s-%-*s" , |
| 1301 | INTERVAL_LEN - 1, "time" , |
| 1302 | COMM_LEN, "comm" , PID_LEN, "pid" ); |
| 1303 | break; |
| 1304 | case AGGR_GLOBAL: |
| 1305 | default: |
| 1306 | if (!config->iostat_run) |
| 1307 | fprintf(output, "#%*s" , |
| 1308 | INTERVAL_LEN - 1, "time" ); |
| 1309 | case AGGR_UNSET: |
| 1310 | case AGGR_MAX: |
| 1311 | break; |
| 1312 | } |
| 1313 | |
| 1314 | if (config->metric_only) |
| 1315 | print_metric_headers(config, evlist, no_indent: true); |
| 1316 | else |
| 1317 | fprintf(output, " %*s %*s events\n" , |
| 1318 | COUNTS_LEN, "counts" , config->unit_width, "unit" ); |
| 1319 | } |
| 1320 | |
| 1321 | static void (struct perf_stat_config *config, |
| 1322 | struct target *_target, struct evlist *evlist, |
| 1323 | int argc, const char **argv) |
| 1324 | { |
| 1325 | FILE *output = config->output; |
| 1326 | int i; |
| 1327 | |
| 1328 | fprintf(output, "\n" ); |
| 1329 | fprintf(output, " Performance counter stats for " ); |
| 1330 | if (_target->bpf_str) |
| 1331 | fprintf(output, "\'BPF program(s) %s" , _target->bpf_str); |
| 1332 | else if (_target->system_wide) |
| 1333 | fprintf(output, "\'system wide" ); |
| 1334 | else if (_target->cpu_list) |
| 1335 | fprintf(output, "\'CPU(s) %s" , _target->cpu_list); |
| 1336 | else if (!target__has_task(_target)) { |
| 1337 | fprintf(output, "\'%s" , argv ? argv[0] : "pipe" ); |
| 1338 | for (i = 1; argv && (i < argc); i++) |
| 1339 | fprintf(output, " %s" , argv[i]); |
| 1340 | } else if (_target->pid) |
| 1341 | fprintf(output, "process id \'%s" , _target->pid); |
| 1342 | else |
| 1343 | fprintf(output, "thread id \'%s" , _target->tid); |
| 1344 | |
| 1345 | fprintf(output, "\'" ); |
| 1346 | if (config->run_count > 1) |
| 1347 | fprintf(output, " (%d runs)" , config->run_count); |
| 1348 | fprintf(output, ":\n\n" ); |
| 1349 | |
| 1350 | if (config->metric_only) |
| 1351 | print_metric_headers(config, evlist, no_indent: false); |
| 1352 | } |
| 1353 | |
| 1354 | static void (struct perf_stat_config *config, |
| 1355 | struct target *_target __maybe_unused, |
| 1356 | struct evlist *evlist, |
| 1357 | int argc __maybe_unused, |
| 1358 | const char **argv __maybe_unused) |
| 1359 | { |
| 1360 | if (config->metric_only) |
| 1361 | print_metric_headers(config, evlist, no_indent: true); |
| 1362 | } |
| 1363 | static void (struct perf_stat_config *config, |
| 1364 | struct target *_target __maybe_unused, |
| 1365 | struct evlist *evlist, |
| 1366 | int argc __maybe_unused, |
| 1367 | const char **argv __maybe_unused) |
| 1368 | { |
| 1369 | if (config->metric_only) |
| 1370 | print_metric_headers(config, evlist, no_indent: true); |
| 1371 | } |
| 1372 | |
| 1373 | static void (struct perf_stat_config *config, |
| 1374 | struct target *_target, |
| 1375 | struct evlist *evlist, |
| 1376 | int argc, const char **argv) |
| 1377 | { |
| 1378 | static int num_print_iv; |
| 1379 | |
| 1380 | fflush(stdout); |
| 1381 | |
| 1382 | if (config->interval_clear) |
| 1383 | puts(CONSOLE_CLEAR); |
| 1384 | |
| 1385 | if (num_print_iv == 0 || config->interval_clear) { |
| 1386 | if (config->json_output) |
| 1387 | print_header_json(config, _target, evlist, argc, argv); |
| 1388 | else if (config->csv_output) |
| 1389 | print_header_csv(config, _target, evlist, argc, argv); |
| 1390 | else if (config->interval) |
| 1391 | print_header_interval_std(config, _target, evlist, argc, argv); |
| 1392 | else |
| 1393 | print_header_std(config, _target, evlist, argc, argv); |
| 1394 | } |
| 1395 | |
| 1396 | if (num_print_iv++ == 25) |
| 1397 | num_print_iv = 0; |
| 1398 | } |
| 1399 | |
| 1400 | static int get_precision(double num) |
| 1401 | { |
| 1402 | if (num > 1) |
| 1403 | return 0; |
| 1404 | |
| 1405 | return lround(ceil(-log10(num))); |
| 1406 | } |
| 1407 | |
| 1408 | static void print_table(struct perf_stat_config *config, |
| 1409 | FILE *output, int precision, double avg) |
| 1410 | { |
| 1411 | char tmp[64]; |
| 1412 | int idx, indent = 0; |
| 1413 | |
| 1414 | scnprintf(buf: tmp, size: 64, fmt: " %17.*f" , precision, avg); |
| 1415 | while (tmp[indent] == ' ') |
| 1416 | indent++; |
| 1417 | |
| 1418 | fprintf(output, "%*s# Table of individual measurements:\n" , indent, "" ); |
| 1419 | |
| 1420 | for (idx = 0; idx < config->run_count; idx++) { |
| 1421 | double run = (double) config->walltime_run[idx] / NSEC_PER_SEC; |
| 1422 | int h, n = 1 + abs((int) (100.0 * (run - avg)/run) / 5); |
| 1423 | |
| 1424 | fprintf(output, " %17.*f (%+.*f) " , |
| 1425 | precision, run, precision, run - avg); |
| 1426 | |
| 1427 | for (h = 0; h < n; h++) |
| 1428 | fprintf(output, "#" ); |
| 1429 | |
| 1430 | fprintf(output, "\n" ); |
| 1431 | } |
| 1432 | |
| 1433 | fprintf(output, "\n%*s# Final result:\n" , indent, "" ); |
| 1434 | } |
| 1435 | |
| 1436 | static double timeval2double(struct timeval *t) |
| 1437 | { |
| 1438 | return t->tv_sec + (double) t->tv_usec/USEC_PER_SEC; |
| 1439 | } |
| 1440 | |
| 1441 | static void (struct perf_stat_config *config) |
| 1442 | { |
| 1443 | double avg = avg_stats(stats: config->walltime_nsecs_stats) / NSEC_PER_SEC; |
| 1444 | FILE *output = config->output; |
| 1445 | |
| 1446 | if (config->interval || config->csv_output || config->json_output) |
| 1447 | return; |
| 1448 | |
| 1449 | if (!config->null_run) |
| 1450 | fprintf(output, "\n" ); |
| 1451 | |
| 1452 | if (config->run_count == 1) { |
| 1453 | fprintf(output, " %17.9f seconds time elapsed" , avg); |
| 1454 | |
| 1455 | if (config->ru_display) { |
| 1456 | double ru_utime = timeval2double(t: &config->ru_data.ru_utime); |
| 1457 | double ru_stime = timeval2double(t: &config->ru_data.ru_stime); |
| 1458 | |
| 1459 | fprintf(output, "\n\n" ); |
| 1460 | fprintf(output, " %17.9f seconds user\n" , ru_utime); |
| 1461 | fprintf(output, " %17.9f seconds sys\n" , ru_stime); |
| 1462 | } |
| 1463 | } else { |
| 1464 | double sd = stddev_stats(stats: config->walltime_nsecs_stats) / NSEC_PER_SEC; |
| 1465 | /* |
| 1466 | * Display at most 2 more significant |
| 1467 | * digits than the stddev inaccuracy. |
| 1468 | */ |
| 1469 | int precision = get_precision(num: sd) + 2; |
| 1470 | |
| 1471 | if (config->walltime_run_table) |
| 1472 | print_table(config, output, precision, avg); |
| 1473 | |
| 1474 | fprintf(output, " %17.*f +- %.*f seconds time elapsed" , |
| 1475 | precision, avg, precision, sd); |
| 1476 | |
| 1477 | print_noise_pct(config, NULL, total: sd, avg, /*before_metric=*/false); |
| 1478 | } |
| 1479 | fprintf(output, "\n\n" ); |
| 1480 | |
| 1481 | if (config->print_free_counters_hint && sysctl__nmi_watchdog_enabled()) |
| 1482 | fprintf(output, |
| 1483 | "Some events weren't counted. Try disabling the NMI watchdog:\n" |
| 1484 | " echo 0 > /proc/sys/kernel/nmi_watchdog\n" |
| 1485 | " perf stat ...\n" |
| 1486 | " echo 1 > /proc/sys/kernel/nmi_watchdog\n" ); |
| 1487 | } |
| 1488 | |
| 1489 | static void print_percore(struct perf_stat_config *config, |
| 1490 | struct evsel *counter, struct outstate *os) |
| 1491 | { |
| 1492 | bool metric_only = config->metric_only; |
| 1493 | FILE *output = config->output; |
| 1494 | struct cpu_aggr_map *core_map; |
| 1495 | int aggr_idx, core_map_len = 0; |
| 1496 | |
| 1497 | if (!config->aggr_map || !config->aggr_get_id) |
| 1498 | return; |
| 1499 | |
| 1500 | if (config->percore_show_thread) |
| 1501 | return print_counter(config, counter, os); |
| 1502 | |
| 1503 | /* |
| 1504 | * core_map will hold the aggr_cpu_id for the cores that have been |
| 1505 | * printed so that each core is printed just once. |
| 1506 | */ |
| 1507 | core_map = cpu_aggr_map__empty_new(nr: config->aggr_map->nr); |
| 1508 | if (core_map == NULL) { |
| 1509 | fprintf(output, "Cannot allocate per-core aggr map for display\n" ); |
| 1510 | return; |
| 1511 | } |
| 1512 | |
| 1513 | cpu_aggr_map__for_each_idx(aggr_idx, config->aggr_map) { |
| 1514 | struct perf_cpu curr_cpu = config->aggr_map->map[aggr_idx].cpu; |
| 1515 | struct aggr_cpu_id core_id = aggr_cpu_id__core(cpu: curr_cpu, NULL); |
| 1516 | bool found = false; |
| 1517 | |
| 1518 | for (int i = 0; i < core_map_len; i++) { |
| 1519 | if (aggr_cpu_id__equal(a: &core_map->map[i], b: &core_id)) { |
| 1520 | found = true; |
| 1521 | break; |
| 1522 | } |
| 1523 | } |
| 1524 | if (found) |
| 1525 | continue; |
| 1526 | |
| 1527 | print_counter_aggrdata(config, counter, aggr_idx, os); |
| 1528 | |
| 1529 | core_map->map[core_map_len++] = core_id; |
| 1530 | } |
| 1531 | free(core_map); |
| 1532 | |
| 1533 | if (metric_only) |
| 1534 | fputc('\n', output); |
| 1535 | } |
| 1536 | |
| 1537 | static void print_cgroup_counter(struct perf_stat_config *config, struct evlist *evlist, |
| 1538 | struct outstate *os) |
| 1539 | { |
| 1540 | struct evsel *counter; |
| 1541 | |
| 1542 | evlist__for_each_entry(evlist, counter) { |
| 1543 | if (os->cgrp != counter->cgrp) { |
| 1544 | if (os->cgrp != NULL) |
| 1545 | print_metric_end(config, os); |
| 1546 | |
| 1547 | os->cgrp = counter->cgrp; |
| 1548 | print_metric_begin(config, evlist, os, /*aggr_idx=*/0); |
| 1549 | } |
| 1550 | |
| 1551 | print_counter(config, counter, os); |
| 1552 | } |
| 1553 | if (os->cgrp) |
| 1554 | print_metric_end(config, os); |
| 1555 | } |
| 1556 | |
| 1557 | void evlist__print_counters(struct evlist *evlist, struct perf_stat_config *config, |
| 1558 | struct target *_target, struct timespec *ts, |
| 1559 | int argc, const char **argv) |
| 1560 | { |
| 1561 | bool metric_only = config->metric_only; |
| 1562 | struct evsel *counter; |
| 1563 | struct outstate os = { |
| 1564 | .fh = config->output, |
| 1565 | .first = true, |
| 1566 | }; |
| 1567 | |
| 1568 | evlist__uniquify_evsel_names(evlist, config); |
| 1569 | |
| 1570 | if (config->iostat_run) |
| 1571 | evlist->selected = evlist__first(evlist); |
| 1572 | |
| 1573 | if (config->interval) |
| 1574 | prepare_timestamp(config, os: &os, ts); |
| 1575 | |
| 1576 | print_header(config, _target, evlist, argc, argv); |
| 1577 | |
| 1578 | switch (config->aggr_mode) { |
| 1579 | case AGGR_CORE: |
| 1580 | case AGGR_CACHE: |
| 1581 | case AGGR_CLUSTER: |
| 1582 | case AGGR_DIE: |
| 1583 | case AGGR_SOCKET: |
| 1584 | case AGGR_NODE: |
| 1585 | if (config->cgroup_list) |
| 1586 | print_aggr_cgroup(config, evlist, os: &os); |
| 1587 | else |
| 1588 | print_aggr(config, evlist, os: &os); |
| 1589 | break; |
| 1590 | case AGGR_THREAD: |
| 1591 | case AGGR_GLOBAL: |
| 1592 | if (config->iostat_run) { |
| 1593 | iostat_print_counters(evlist, config, ts, prefix: os.timestamp, |
| 1594 | print_cnt_cb: (iostat_print_counter_t)print_counter, arg: &os); |
| 1595 | } else if (config->cgroup_list) { |
| 1596 | print_cgroup_counter(config, evlist, os: &os); |
| 1597 | } else { |
| 1598 | print_metric_begin(config, evlist, os: &os, /*aggr_idx=*/0); |
| 1599 | evlist__for_each_entry(evlist, counter) { |
| 1600 | print_counter(config, counter, os: &os); |
| 1601 | } |
| 1602 | print_metric_end(config, os: &os); |
| 1603 | } |
| 1604 | break; |
| 1605 | case AGGR_NONE: |
| 1606 | if (metric_only) |
| 1607 | print_no_aggr_metric(config, evlist, os: &os); |
| 1608 | else { |
| 1609 | evlist__for_each_entry(evlist, counter) { |
| 1610 | if (counter->percore) |
| 1611 | print_percore(config, counter, os: &os); |
| 1612 | else |
| 1613 | print_counter(config, counter, os: &os); |
| 1614 | } |
| 1615 | } |
| 1616 | break; |
| 1617 | case AGGR_MAX: |
| 1618 | case AGGR_UNSET: |
| 1619 | default: |
| 1620 | break; |
| 1621 | } |
| 1622 | |
| 1623 | print_footer(config); |
| 1624 | |
| 1625 | fflush(config->output); |
| 1626 | } |
| 1627 | |