2 * Copyright (c) 2003-2007, Joseph Koshy
3 * Copyright (c) 2007 The FreeBSD Foundation
6 * Portions of this software were developed by A. Joseph Koshy under
7 * sponsorship from the FreeBSD Foundation and Google, Inc.
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
18 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
22 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
34 #include <sys/types.h>
35 #include <sys/event.h>
36 #include <sys/param.h>
37 #include <sys/queue.h>
38 #include <sys/socket.h>
40 #include <sys/sysctl.h>
42 #include <sys/ttycom.h>
69 * A given invocation of pmcstat(8) can manage multiple PMCs of both
70 * the system-wide and per-process variety. Each of these could be in
71 * 'counting mode' or in 'sampling mode'.
73 * For 'counting mode' PMCs, pmcstat(8) will periodically issue a
74 * pmc_read() at the configured time interval and print out the value
75 * of the requested PMCs.
77 * For 'sampling mode' PMCs it can log to a file for offline analysis,
78 * or can analyse sampling data "on the fly", either by converting
79 * samples to printed textual form or by creating gprof(1) compatible
80 * profiles, one per program executed. When creating gprof(1)
81 * profiles it can optionally merge entries from multiple processes
82 * for a given executable into a single profile file.
84 * pmcstat(8) can also execute a command line and attach PMCs to the
85 * resulting child process. The protocol used is as follows:
87 * - parent creates a socketpair for two way communication and
93 * - Wait for child's token.
95 * - Awaits signal to start.
96 * - Attaches PMCs to the child's pid
97 * and starts them. Sets up
98 * monitoring for the child.
99 * - Signals child to start.
100 * - Receives signal, attempts exec().
102 * After this point normal processing can happen.
/*
 * Initialised to 0.  Nothing in the visible listing reads or writes it;
 * presumably an "interrupted" flag -- confirm against the full file.
 */
107 int pmcstat_interrupt = 0;
/*
 * Line-count threshold tested by pmcstat_print_pmcs(); main() overwrites it
 * with the terminal's row count minus one when output goes to a tty.
 */
108 int pmcstat_displayheight = DEFAULT_DISPLAY_HEIGHT;
/*
 * Descriptors filled in by socketpair() in pmcstat_create_process() and used
 * to exchange start-up tokens between pmcstat and the forked child.
 */
109 int pmcstat_sockpair[NSOCKPAIRFD];
/* Process list returned by kvm_getprocs() in pmcstat_find_targets(). */
112 struct kinfo_proc *pmcstat_plist;
/*
 * Attach process-mode PMCs to target processes: for each event in
 * a->pa_events, pmc_attach() is called for each target in a->pa_targets.
 *
 * A pmc_attach() failure with errno other than ESRCH is fatal (EX_OSERR);
 * ESRCH is not treated as fatal here.  The final errx() exits with
 * EX_DATAERR, reporting that no process was attached to.
 *
 * NOTE(review): this listing elides several lines (the statement under the
 * PMC_IS_SYSTEM_MODE() test, the success branch of pmc_attach(), the last
 * err() argument and the condition guarding the final errx()).  Presumably
 * system-mode events are skipped and successful attaches are counted --
 * confirm against the full file.
 */
115 pmcstat_attach_pmcs(struct pmcstat_args *a)
117 struct pmcstat_ev *ev;
118 struct pmcstat_target *pt;
121 /* Attach all process PMCs to target processes. */
123 STAILQ_FOREACH(ev, &a->pa_events, ev_next) {
124 if (PMC_IS_SYSTEM_MODE(ev->ev_mode))
126 SLIST_FOREACH(pt, &a->pa_targets, pt_next)
127 if (pmc_attach(ev->ev_pmcid, pt->pt_pid) == 0)
/* A vanished target (ESRCH) is tolerated; any other attach error is fatal. */
129 else if (errno != ESRCH)
130 err(EX_OSERR, "ERROR: cannot attach pmc "
131 "\"%s\" to process %d", ev->ev_name,
136 errx(EX_DATAERR, "ERROR: No processes were attached to.");
/*
 * Tear down the measurement state held in 'a'.
 *
 * Walks a->pa_events with the _SAFE iterator (entries are unlinked while
 * iterating), releasing every PMC whose id is not PMC_ID_INVALID; a failed
 * pmc_release() is fatal (EX_OSERR).  Afterwards, if a pipe or output log
 * file is in use, the log file is de-configured with
 * pmc_configure_logfile(-1), any open log parser is closed and its pointer
 * cleared, and pmcstat_shutdown_logging() is called.
 *
 * NOTE(review): lines between the visible statements are elided from this
 * listing, so whether the STAILQ_REMOVE() is inside the "valid pmcid" branch
 * and whether the event's memory is freed cannot be confirmed from here.
 */
141 pmcstat_cleanup(struct pmcstat_args *a)
143 struct pmcstat_ev *ev, *tmp;
145 /* release allocated PMCs. */
146 STAILQ_FOREACH_SAFE(ev, &a->pa_events, ev_next, tmp)
147 if (ev->ev_pmcid != PMC_ID_INVALID) {
148 if (pmc_release(ev->ev_pmcid) < 0)
149 err(EX_OSERR, "ERROR: cannot release pmc "
150 "0x%x \"%s\"", ev->ev_pmcid, ev->ev_name);
153 STAILQ_REMOVE(&a->pa_events, ev, pmcstat_ev, ev_next);
157 /* de-configure the log file if present. */
158 if (a->pa_flags & (FLAG_HAS_PIPE | FLAG_HAS_OUTPUT_LOGFILE))
/* The return value is deliberately ignored. */
159 (void) pmc_configure_logfile(-1);
161 if (a->pa_logparser) {
162 pmclog_close(a->pa_logparser);
/* Clear the pointer so the closed parser cannot be reused. */
163 a->pa_logparser = NULL;
166 if (a->pa_flags & (FLAG_HAS_PIPE | FLAG_HAS_OUTPUT_LOGFILE))
167 pmcstat_shutdown_logging(a);
/*
 * Append to a->pa_events one copy of event descriptor 'ev' for each bit set
 * in 'cpumask' (the parameter itself is declared on a line elided from this
 * listing).
 *
 * Each clone is zero-filled, then receives ev's count, cumulative flag,
 * flags, mode, pmcid and saved value, plus strdup()'d copies of ev_name and
 * ev_spec, and its own ev_cpu.  Running out of memory for the descriptor is
 * fatal (EX_SOFTWARE).
 *
 * NOTE(review): ffs() returns a 1-based bit position, yet 'cpu' is used as a
 * 0-based index in "1 << cpu" and ev_cpu; an elided line (178) presumably
 * decrements it -- confirm against the full file.
 * NOTE(review): the two strdup() results are not checked for NULL.
 */
171 pmcstat_clone_event_descriptor(struct pmcstat_args *a, struct pmcstat_ev *ev,
175 struct pmcstat_ev *ev_clone;
/* Consume the mask one set bit at a time, lowest bit first. */
177 while ((cpu = ffs(cpumask)) > 0) {
180 if ((ev_clone = malloc(sizeof(*ev_clone))) == NULL)
181 errx(EX_SOFTWARE, "ERROR: Out of memory");
182 (void) memset(ev_clone, 0, sizeof(*ev_clone));
184 ev_clone->ev_count = ev->ev_count;
185 ev_clone->ev_cpu = cpu;
186 ev_clone->ev_cumulative = ev->ev_cumulative;
187 ev_clone->ev_flags = ev->ev_flags;
188 ev_clone->ev_mode = ev->ev_mode;
189 ev_clone->ev_name = strdup(ev->ev_name);
190 ev_clone->ev_pmcid = ev->ev_pmcid;
191 ev_clone->ev_saved = ev->ev_saved;
192 ev_clone->ev_spec = strdup(ev->ev_spec);
194 STAILQ_INSERT_TAIL(&a->pa_events, ev_clone, ev_next);
/* Clear the bit just handled so the loop terminates. */
196 cpumask &= ~(1 << cpu);
/*
 * Fork the child that will run the command line in a->pa_argv and set up
 * the start-up handshake over pmcstat_sockpair.
 *
 * Child: closes the parent's end, writes a "+" token, waits to read one
 * token back, closes its end and calls execvp().  If execvp() returns, it
 * sends SIGCHLD to the parent and exits through err().
 *
 * Parent: closes the child's end, registers an EVFILT_PROC/NOTE_EXIT kevent
 * for the child's pid on pmcstat_kq, inserts a target entry at the head of
 * a->pa_targets, then waits to read the child's token.  The parent's end is
 * left open; pmcstat_start_process() writes the "go" token to it later.
 *
 * All system-call failures here are fatal.
 *
 * NOTE(review): several lines (case labels, local declarations, the
 * assignment of the new target's pid) are elided from this listing.
 * NOTE(review): both read() calls only treat a negative return as failure;
 * a return of 0 (peer closed the socket) is accepted as success.
 * NOTE(review): kill() runs between the failed execvp() and err(), so errno
 * may no longer describe the exec failure when the message is printed.
 */
201 pmcstat_create_process(struct pmcstat_args *a)
206 struct pmcstat_target *pt;
208 if (socketpair(AF_UNIX, SOCK_STREAM, 0, pmcstat_sockpair) < 0)
209 err(EX_OSERR, "ERROR: cannot create socket pair");
211 switch (pid = fork()) {
213 err(EX_OSERR, "ERROR: cannot fork");
217 (void) close(pmcstat_sockpair[PARENTSOCKET]);
219 /* Write a token to tell our parent we've started executing. */
220 if (write(pmcstat_sockpair[CHILDSOCKET], "+", 1) != 1)
221 err(EX_OSERR, "ERROR (child): cannot write token");
223 /* Wait for our parent to signal us to start. */
224 if (read(pmcstat_sockpair[CHILDSOCKET], &token, 1) < 0)
225 err(EX_OSERR, "ERROR (child): cannot read token");
226 (void) close(pmcstat_sockpair[CHILDSOCKET]);
228 /* exec() the program requested */
229 execvp(*a->pa_argv, a->pa_argv);
230 /* and if that fails, notify the parent */
231 kill(getppid(), SIGCHLD);
232 err(EX_OSERR, "ERROR: execvp \"%s\" failed", *a->pa_argv);
235 default: /* parent */
236 (void) close(pmcstat_sockpair[CHILDSOCKET]);
240 /* Ask to be notified via a kevent when the target process exits. */
241 EV_SET(&kev, pid, EVFILT_PROC, EV_ADD|EV_ONESHOT, NOTE_EXIT, 0,
243 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
244 err(EX_OSERR, "ERROR: cannot monitor child process %d", pid);
246 if ((pt = malloc(sizeof(*pt))) == NULL)
247 errx(EX_SOFTWARE, "ERROR: Out of memory.");
/* Head insertion: pmcstat_kill_process() relies on the child being first. */
250 SLIST_INSERT_HEAD(&a->pa_targets, pt, pt_next);
252 /* Wait for the child to signal that it's ready to go. */
253 if (read(pmcstat_sockpair[PARENTSOCKET], &token, 1) < 0)
254 err(EX_OSERR, "ERROR (parent): cannot read token");
/*
 * Add the processes named by 'spec' to a->pa_targets.
 *
 * If strtol() consumes at least one character of 'spec' and yields a
 * non-negative value, a target entry is allocated and inserted for that
 * process id (the assignment of the pid and the early return are on lines
 * elided from this listing).  Otherwise 'spec' is compiled as an extended
 * regular expression and matched against ki_comm of every entry in the kvm
 * process list; the pid of each matching process is inserted.
 *
 * The kvm handle and process list are set up only while pmcstat_kvm is
 * NULL, so later calls reuse them.  Allocation, kvm and regex failures are
 * fatal.
 *
 * NOTE(review): the declarations of 'reg' and 'regmatch', some call
 * arguments and the out-of-memory jumps are elided from this listing.
 */
260 pmcstat_find_targets(struct pmcstat_args *a, const char *spec)
262 int n, nproc, pid, rv;
263 struct pmcstat_target *pt;
264 char errbuf[_POSIX2_LINE_MAX], *end;
265 static struct kinfo_proc *kp;
269 /* First check if we've been given a process id. */
270 pid = strtol(spec, &end, 0);
271 if (end != spec && pid >= 0) {
272 if ((pt = malloc(sizeof(*pt))) == NULL)
275 SLIST_INSERT_HEAD(&a->pa_targets, pt, pt_next);
279 /* Otherwise treat arg as a regular expression naming processes. */
280 if (pmcstat_kvm == NULL) {
281 if ((pmcstat_kvm = kvm_openfiles(NULL, "/dev/null", NULL, 0,
283 err(EX_OSERR, "ERROR: Cannot open kernel \"%s\"",
285 if ((pmcstat_plist = kvm_getprocs(pmcstat_kvm, KERN_PROC_PROC,
287 err(EX_OSERR, "ERROR: Cannot get process list: %s",
288 kvm_geterr(pmcstat_kvm));
/*
 * The address-of expressions "&reg" and "&regmatch" below had been corrupted
 * by HTML-entity decoding in this listing; they are restored here.
 */
291 if ((rv = regcomp(&reg, spec, REG_EXTENDED|REG_NOSUB)) != 0) {
292 regerror(rv, &reg, errbuf, sizeof(errbuf));
/*
 * regcomp() reports failure through its return value, not errno, so use
 * errx(): err() would append an unrelated strerror() text to the message.
 */
293 errx(EX_DATAERR, "ERROR: Failed to compile regex \"%s\": %s",
297 for (n = 0, kp = pmcstat_plist; n < nproc; n++, kp++) {
298 if ((rv = regexec(&reg, kp->ki_comm, 1, &regmatch, 0)) == 0) {
299 if ((pt = malloc(sizeof(*pt))) == NULL)
301 pt->pt_pid = kp->ki_pid;
302 SLIST_INSERT_HEAD(&a->pa_targets, pt, pt_next);
/* REG_NOMATCH just means "not this process"; anything else is an error. */
303 } else if (rv != REG_NOMATCH) {
304 regerror(rv, &reg, errbuf, sizeof(errbuf));
305 errx(EX_SOFTWARE, "ERROR: Regex evalation failed: %s",
315 errx(EX_SOFTWARE, "Out of memory.");
/*
 * Parse the CPU list in 'cpuspec' into a bit mask.
 *
 * Each number is read with strtol() (base auto-detected), its bit is OR'ed
 * into 'cpumask', and parsing resumes after any run of commas, spaces or
 * tabs.  A negative number, or a position where no digits can be parsed, is
 * a fatal usage error (EX_USAGE).
 *
 * NOTE(review): the declarations, the enclosing loop and the return
 * statement are elided from this listing.
 * NOTE(review): no upper bound on 'cpu' is visible, so a large CPU number
 * would make "1 << cpu" shift by at least the width of int, which is
 * undefined behaviour -- confirm whether an elided line guards against this.
 */
320 pmcstat_get_cpumask(const char *cpuspec)
331 cpu = strtol(s, &end, 0);
/* end == s means strtol() consumed nothing, i.e. no number was present. */
332 if (cpu < 0 || end == s)
333 errx(EX_USAGE, "ERROR: Illegal CPU specification "
335 cpumask |= (1 << cpu);
/* Skip the separators that follow the number just parsed. */
336 s = end + strspn(end, ", \t");
/*
 * Send SIGINT to the first process on a->pa_targets.
 *
 * Asserts that a command line was given (FLAG_HAS_COMMANDLINE).  The child
 * created by pmcstat_create_process() is inserted at the head of the target
 * list, which is why the first entry is the one signalled.  A failing kill()
 * is fatal (EX_OSERR).
 *
 * NOTE(review): the lines between fetching 'pt' and the kill() call are
 * elided from this listing; presumably they assert that 'pt' is not NULL.
 */
343 pmcstat_kill_process(struct pmcstat_args *a)
345 struct pmcstat_target *pt;
347 assert(a->pa_flags & FLAG_HAS_COMMANDLINE);
350 * If a command line was specified, it would be the very first
351 * in the list, before any other processes specified by -t.
353 pt = SLIST_FIRST(&a->pa_targets);
356 if (kill(pt->pt_pid, SIGINT) != 0)
357 err(EX_OSERR, "ERROR: cannot signal child process");
/*
 * Start every PMC on the event list of 'a'.
 *
 * Each event must already have an allocated PMC (asserted).  When
 * pmc_start() fails a warning naming the PMC is printed; the rest of that
 * failure path is elided from this listing.
 */
361 pmcstat_start_pmcs(struct pmcstat_args *a)
363 struct pmcstat_ev *ev;
/*
 * Walk the caller's event list.  This used to iterate the global 'args',
 * silently ignoring the parameter; main() passes &args, so behaviour there
 * is unchanged.
 */
365 STAILQ_FOREACH(ev, &a->pa_events, ev_next) {
367 assert(ev->ev_pmcid != PMC_ID_INVALID);
369 if (pmc_start(ev->ev_pmcid) < 0) {
370 warn("ERROR: Cannot start pmc 0x%x \"%s\"",
371 ev->ev_pmcid, ev->ev_name);
/*
 * Print the column-header line for the PMCs in a->pa_events to
 * a->pa_printfile and flush the stream.
 *
 * The line starts with PRINT_HEADER_PREFIX.  Each column is first padded by
 * ev_fieldskip blanks (when non-zero) and then labelled either
 * "s/<2-digit cpu>/<name>" or "p/<name>", using the width left over from
 * ev_fieldwidth.
 *
 * NOTE(review): the statement under the PMC_IS_SAMPLING_MODE() test and the
 * test choosing between the two label formats are elided from this listing.
 * Presumably sampling-mode events are skipped and 'c' ('s' for system mode,
 * 'p' otherwise) selects the format -- confirm against the full file.
 */
380 pmcstat_print_headers(struct pmcstat_args *a)
382 struct pmcstat_ev *ev;
385 (void) fprintf(a->pa_printfile, PRINT_HEADER_PREFIX);
387 STAILQ_FOREACH(ev, &a->pa_events, ev_next) {
388 if (PMC_IS_SAMPLING_MODE(ev->ev_mode))
391 c = PMC_IS_SYSTEM_MODE(ev->ev_mode) ? 's' : 'p';
393 if (ev->ev_fieldskip != 0)
394 (void) fprintf(a->pa_printfile, "%*s",
395 ev->ev_fieldskip, "");
/* Width left for the name once the skip and the 2-character prefix are taken. */
396 w = ev->ev_fieldwidth - ev->ev_fieldskip - 2;
/* The system-mode label spends 3 more columns on the "NN/" CPU number. */
399 (void) fprintf(a->pa_printfile, "s/%02d/%-*s ",
400 ev->ev_cpu, w-3, ev->ev_name);
402 (void) fprintf(a->pa_printfile, "p/%*s ", w,
406 (void) fflush(a->pa_printfile);
/*
 * Print one line of PMC counter values to a->pa_printfile and flush it.
 *
 * For each event, the current value is fetched with pmc_read() (a failure
 * is fatal, EX_OSERR) and printed in a field of ev_fieldwidth + extra_width
 * columns.  Cumulative events print the raw value; the others print the
 * difference from ev_saved, which is then updated to the value just read.
 *
 * NOTE(review): the declarations of 'value' and 'extra_width', the statement
 * under the PMC_IS_SAMPLING_MODE() test (presumably a skip) and any later
 * change to 'extra_width' are elided from this listing.
 */
410 pmcstat_print_counters(struct pmcstat_args *a)
413 struct pmcstat_ev *ev;
/* Initial extra width equals the length of the header prefix string. */
416 extra_width = sizeof(PRINT_HEADER_PREFIX) - 1;
418 STAILQ_FOREACH(ev, &a->pa_events, ev_next) {
420 /* skip sampling mode counters */
421 if (PMC_IS_SAMPLING_MODE(ev->ev_mode))
424 if (pmc_read(ev->ev_pmcid, &value) < 0)
425 err(EX_OSERR, "ERROR: Cannot read pmc "
426 "\"%s\"", ev->ev_name);
/*
 * "%ju" requires a uintmax_t argument.  The cast must cover the whole
 * conditional expression; written without the parentheses it bound only to
 * ev->ev_cumulative (the condition) and left the printed value unconverted.
 */
428 (void) fprintf(a->pa_printfile, "%*ju ",
429 ev->ev_fieldwidth + extra_width,
430 (uintmax_t) (ev->ev_cumulative ? value :
431 (value - ev->ev_saved)));
/* Remember this reading so the next line shows the delta. */
433 if (ev->ev_cumulative == 0)
434 ev->ev_saved = value;
438 (void) fflush(a->pa_printfile);
/*
 * Print one row of counter output via pmcstat_print_counters(), with
 * header handling driven by a line count kept across calls.
 *
 * 'linecount' is static, so it persists between invocations; once it
 * exceeds pmcstat_displayheight a blank line is written.
 *
 * NOTE(review): the lines that reset 'linecount' and that decide when
 * pmcstat_print_headers() runs are elided from this listing, so the exact
 * condition for printing headers cannot be confirmed from here.
 */
446 pmcstat_print_pmcs(struct pmcstat_args *a)
448 static int linecount = 0;
450 /* check if we need to print a header line */
451 if (++linecount > pmcstat_displayheight) {
452 (void) fprintf(a->pa_printfile, "\n");
456 pmcstat_print_headers(a);
457 (void) fprintf(a->pa_printfile, "\n");
459 pmcstat_print_counters(a);
465 * Do process profiling
467 * If a pid was specified, attach each allocated PMC to the target
468 * process. Otherwise, fork a child and attach the PMCs to the child,
469 * and have the child exec() the target program.
/*
 * Release the child forked by pmcstat_create_process(): write the one-byte
 * "!" token to the parent's end of pmcstat_sockpair (the child is waiting
 * to read it before calling execvp()), then close that descriptor.  A failed
 * or short write is fatal (EX_OSERR).
 */
473 pmcstat_start_process(void)
475 /* Signal the child to proceed. */
476 if (write(pmcstat_sockpair[PARENTSOCKET], "!", 1) != 1)
477 err(EX_OSERR, "ERROR (parent): write of token failed");
479 (void) close(pmcstat_sockpair[PARENTSOCKET]);
/*
 * Usage text for pmcstat: a synopsis followed by one line per command-line
 * option.
 *
 * NOTE(review): the call that emits this text, and whatever follows the
 * final string (which has no trailing "\n"), are elided from this listing;
 * presumably the function prints the text and exits with a usage status.
 * NOTE(review): the "-t" line mentions only a pid, while
 * pmcstat_find_targets() also accepts a regular expression naming
 * processes; the help text may deserve an update.
 */
483 pmcstat_show_usage(void)
486 "[options] [commandline]\n"
487 "\t Measure process and/or system performance using hardware\n"
488 "\t performance monitoring counters.\n"
489 "\t Options include:\n"
490 "\t -C\t\t (toggle) show cumulative counts\n"
491 "\t -D path\t create profiles in directory \"path\"\n"
492 "\t -E\t\t (toggle) show counts at process exit\n"
493 "\t -G file\t write a system-wide callgraph to \"file\"\n"
494 "\t -M file\t print executable/gmon file map to \"file\"\n"
495 "\t -N\t\t (toggle) capture callchains\n"
496 "\t -O file\t send log output to \"file\"\n"
497 "\t -P spec\t allocate a process-private sampling PMC\n"
498 "\t -R file\t read events from \"file\"\n"
499 "\t -S spec\t allocate a system-wide sampling PMC\n"
500 "\t -W\t\t (toggle) show counts per context switch\n"
501 "\t -c cpu-list\t set cpus for subsequent system-wide PMCs\n"
502 "\t -d\t\t (toggle) track descendants\n"
503 "\t -g\t\t produce gprof(1) compatible profiles\n"
504 "\t -k dir\t\t set the path to the kernel\n"
505 "\t -n rate\t set sampling rate\n"
506 "\t -o file\t send print output to \"file\"\n"
507 "\t -p spec\t allocate a process-private counting PMC\n"
508 "\t -q\t\t suppress verbosity\n"
509 "\t -r fsroot\t specify FS root directory\n"
510 "\t -s spec\t allocate a system-wide counting PMC\n"
511 "\t -t pid\t\t attach to running process with pid \"pid\"\n"
512 "\t -v\t\t increase verbosity\n"
513 "\t -w secs\t set printing time interval\n"
514 "\t -z depth\t limit callchain display depth"
523 main(int argc, char **argv)
526 int option, npmc, ncpu, haltedcpus;
527 int c, check_driver_stats, current_cpu, current_sampling_count;
528 int do_callchain, do_descendants, do_logproccsw, do_logprocexit;
533 int use_cumulative_counts;
536 const char *errmsg, *graphfilename;
537 enum pmcstat_state runstate;
538 struct pmc_driverstats ds_start, ds_end;
539 struct pmcstat_ev *ev;
544 char buffer[PATH_MAX];
546 check_driver_stats = 0;
548 current_sampling_count = DEFAULT_SAMPLE_COUNT;
553 use_cumulative_counts = 0;
555 args.pa_required = 0;
557 args.pa_verbosity = 1;
560 args.pa_kernel = strdup("/boot/kernel");
561 args.pa_samplesdir = ".";
562 args.pa_printfile = stderr;
563 args.pa_graphdepth = DEFAULT_CALLGRAPH_DEPTH;
564 args.pa_graphfile = NULL;
565 args.pa_interval = DEFAULT_WAIT_INTERVAL;
566 args.pa_mapfilename = NULL;
567 args.pa_inputpath = NULL;
568 args.pa_outputpath = NULL;
569 STAILQ_INIT(&args.pa_events);
570 SLIST_INIT(&args.pa_targets);
571 bzero(&ds_start, sizeof(ds_start));
572 bzero(&ds_end, sizeof(ds_end));
576 * The initial CPU mask specifies all non-halted CPUS in the
580 if (sysctlbyname("hw.ncpu", &ncpu, &dummy, NULL, 0) < 0)
581 err(EX_OSERR, "ERROR: Cannot determine the number of CPUs");
582 cpumask = (1 << ncpu) - 1;
584 if (sysctlbyname("machdep.hlt_cpus", &haltedcpus, &dummy,
586 err(EX_OSERR, "ERROR: Cannot determine which CPUs are "
588 cpumask &= ~haltedcpus;
591 while ((option = getopt(argc, argv,
592 "CD:EG:M:NO:P:R:S:Wc:dgk:n:o:p:qr:s:t:vw:z:")) != -1)
594 case 'C': /* cumulative values */
595 use_cumulative_counts = !use_cumulative_counts;
596 args.pa_required |= FLAG_HAS_COUNTING_PMCS;
601 if (optarg[0] == '*' && optarg[1] == '\0')
602 cpumask = (1 << ncpu) - 1;
604 cpumask = pmcstat_get_cpumask(optarg);
606 args.pa_required |= FLAG_HAS_SYSTEM_PMCS;
610 if (stat(optarg, &sb) < 0)
611 err(EX_OSERR, "ERROR: Cannot stat \"%s\"",
613 if (!S_ISDIR(sb.st_mode))
614 errx(EX_USAGE, "ERROR: \"%s\" is not a "
615 "directory.", optarg);
616 args.pa_samplesdir = optarg;
617 args.pa_flags |= FLAG_HAS_SAMPLESDIR;
618 args.pa_required |= FLAG_DO_GPROF;
621 case 'd': /* toggle descendents */
622 do_descendants = !do_descendants;
623 args.pa_required |= FLAG_HAS_PROCESS_PMCS;
626 case 'G': /* produce a system-wide callgraph */
627 args.pa_flags |= FLAG_DO_CALLGRAPHS;
628 graphfilename = optarg;
631 case 'g': /* produce gprof compatible profiles */
632 args.pa_flags |= FLAG_DO_GPROF;
635 case 'k': /* pathname to the kernel */
636 free(args.pa_kernel);
637 args.pa_kernel = strdup(optarg);
638 args.pa_required |= FLAG_DO_ANALYSIS;
639 args.pa_flags |= FLAG_HAS_KERNELPATH;
642 case 'E': /* log process exit */
643 do_logprocexit = !do_logprocexit;
644 args.pa_required |= (FLAG_HAS_PROCESS_PMCS |
645 FLAG_HAS_COUNTING_PMCS | FLAG_HAS_OUTPUT_LOGFILE);
648 case 'M': /* mapfile */
649 args.pa_mapfilename = optarg;
653 do_callchain = !do_callchain;
654 args.pa_required |= FLAG_HAS_SAMPLING_PMCS;
657 case 'p': /* process virtual counting PMC */
658 case 's': /* system-wide counting PMC */
659 case 'P': /* process virtual sampling PMC */
660 case 'S': /* system-wide sampling PMC */
661 if ((ev = malloc(sizeof(*ev))) == NULL)
662 errx(EX_SOFTWARE, "ERROR: Out of memory.");
665 case 'p': ev->ev_mode = PMC_MODE_TC; break;
666 case 's': ev->ev_mode = PMC_MODE_SC; break;
667 case 'P': ev->ev_mode = PMC_MODE_TS; break;
668 case 'S': ev->ev_mode = PMC_MODE_SS; break;
671 if (option == 'P' || option == 'p') {
672 args.pa_flags |= FLAG_HAS_PROCESS_PMCS;
673 args.pa_required |= (FLAG_HAS_COMMANDLINE |
677 if (option == 'P' || option == 'S') {
678 args.pa_flags |= FLAG_HAS_SAMPLING_PMCS;
679 args.pa_required |= (FLAG_HAS_PIPE |
680 FLAG_HAS_OUTPUT_LOGFILE);
683 if (option == 'p' || option == 's')
684 args.pa_flags |= FLAG_HAS_COUNTING_PMCS;
686 if (option == 's' || option == 'S')
687 args.pa_flags |= FLAG_HAS_SYSTEM_PMCS;
689 ev->ev_spec = strdup(optarg);
691 if (option == 'S' || option == 'P')
692 ev->ev_count = current_sampling_count;
696 if (option == 'S' || option == 's')
697 ev->ev_cpu = ffs(cpumask) - 1;
699 ev->ev_cpu = PMC_CPU_ANY;
703 ev->ev_flags |= PMC_F_CALLCHAIN;
705 ev->ev_flags |= PMC_F_DESCENDANTS;
707 ev->ev_flags |= PMC_F_LOG_PROCEXIT;
709 ev->ev_flags |= PMC_F_LOG_PROCCSW;
711 ev->ev_cumulative = use_cumulative_counts;
714 ev->ev_pmcid = PMC_ID_INVALID;
716 /* extract event name */
717 c = strcspn(optarg, ", \t");
718 ev->ev_name = malloc(c + 1);
719 (void) strncpy(ev->ev_name, optarg, c);
720 *(ev->ev_name + c) = '\0';
722 STAILQ_INSERT_TAIL(&args.pa_events, ev, ev_next);
724 if (option == 's' || option == 'S')
725 pmcstat_clone_event_descriptor(&args, ev,
726 cpumask & ~(1 << ev->ev_cpu));
730 case 'n': /* sampling count */
731 current_sampling_count = strtol(optarg, &end, 0);
732 if (*end != '\0' || current_sampling_count <= 0)
734 "ERROR: Illegal count value \"%s\".",
736 args.pa_required |= FLAG_HAS_SAMPLING_PMCS;
739 case 'o': /* outputfile */
740 if (args.pa_printfile != NULL)
741 (void) fclose(args.pa_printfile);
742 if ((args.pa_printfile = fopen(optarg, "w")) == NULL)
743 errx(EX_OSERR, "ERROR: cannot open \"%s\" for "
745 args.pa_flags |= FLAG_DO_PRINT;
748 case 'O': /* sampling output */
749 if (args.pa_outputpath)
750 errx(EX_USAGE, "ERROR: option -O may only be "
752 args.pa_outputpath = optarg;
753 args.pa_flags |= FLAG_HAS_OUTPUT_LOGFILE;
756 case 'q': /* quiet mode */
757 args.pa_verbosity = 0;
760 case 'r': /* root FS path */
761 args.pa_fsroot = optarg;
764 case 'R': /* read an existing log file */
765 if (args.pa_inputpath != NULL)
766 errx(EX_USAGE, "ERROR: option -R may only be "
768 args.pa_inputpath = optarg;
769 if (args.pa_printfile == stderr)
770 args.pa_printfile = stdout;
771 args.pa_flags |= FLAG_READ_LOGFILE;
774 case 't': /* target pid or process name */
775 pmcstat_find_targets(&args, optarg);
777 args.pa_flags |= FLAG_HAS_TARGET;
778 args.pa_required |= FLAG_HAS_PROCESS_PMCS;
781 case 'v': /* verbose */
785 case 'w': /* wait interval */
786 interval = strtod(optarg, &end);
787 if (*end != '\0' || interval <= 0)
788 errx(EX_USAGE, "ERROR: Illegal wait interval "
789 "value \"%s\".", optarg);
790 args.pa_flags |= FLAG_HAS_WAIT_INTERVAL;
791 args.pa_required |= FLAG_HAS_COUNTING_PMCS;
792 args.pa_interval = interval;
795 case 'W': /* toggle LOG_CSW */
796 do_logproccsw = !do_logproccsw;
797 args.pa_required |= (FLAG_HAS_PROCESS_PMCS |
798 FLAG_HAS_COUNTING_PMCS | FLAG_HAS_OUTPUT_LOGFILE);
802 graphdepth = strtod(optarg, &end);
803 if (*end != '\0' || graphdepth <= 0)
804 errx(EX_USAGE, "ERROR: Illegal callchain "
805 "depth \"%s\".", optarg);
806 args.pa_graphdepth = graphdepth;
807 args.pa_required |= FLAG_DO_CALLGRAPHS;
812 pmcstat_show_usage();
817 args.pa_argc = (argc -= optind);
818 args.pa_argv = (argv += optind);
820 args.pa_cpumask = cpumask; /* For selecting CPUs using -R. */
822 if (argc) /* command line present */
823 args.pa_flags |= FLAG_HAS_COMMANDLINE;
825 if (args.pa_flags & (FLAG_DO_GPROF | FLAG_DO_CALLGRAPHS))
826 args.pa_flags |= FLAG_DO_ANALYSIS;
829 * Check invocation syntax.
832 /* disallow -O and -R together */
833 if (args.pa_outputpath && args.pa_inputpath)
834 errx(EX_USAGE, "ERROR: options -O and -R are mutually "
837 if (args.pa_flags & FLAG_READ_LOGFILE) {
839 if (args.pa_flags & FLAG_HAS_COMMANDLINE)
840 errmsg = "a command line specification";
841 else if (args.pa_flags & FLAG_HAS_TARGET)
842 errmsg = "option -t";
843 else if (!STAILQ_EMPTY(&args.pa_events))
844 errmsg = "a PMC event specification";
846 errx(EX_USAGE, "ERROR: option -R may not be used with "
848 } else if (STAILQ_EMPTY(&args.pa_events))
849 /* All other uses require a PMC spec. */
850 pmcstat_show_usage();
852 /* check for -t pid without a process PMC spec */
853 if ((args.pa_required & FLAG_HAS_TARGET) &&
854 (args.pa_flags & FLAG_HAS_PROCESS_PMCS) == 0)
855 errx(EX_USAGE, "ERROR: option -t requires a process mode PMC "
858 /* check for process-mode options without a command or -t pid */
859 if ((args.pa_required & FLAG_HAS_PROCESS_PMCS) &&
860 (args.pa_flags & (FLAG_HAS_COMMANDLINE | FLAG_HAS_TARGET)) == 0)
861 errx(EX_USAGE, "ERROR: options -d, -E, -p, -P, and -W require "
862 "a command line or target process.");
864 /* check for -p | -P without a target process of some sort */
865 if ((args.pa_required & (FLAG_HAS_COMMANDLINE | FLAG_HAS_TARGET)) &&
866 (args.pa_flags & (FLAG_HAS_COMMANDLINE | FLAG_HAS_TARGET)) == 0)
867 errx(EX_USAGE, "ERROR: options -P and -p require a "
868 "target process or a command line.");
870 /* check for process-mode options without a process-mode PMC */
871 if ((args.pa_required & FLAG_HAS_PROCESS_PMCS) &&
872 (args.pa_flags & FLAG_HAS_PROCESS_PMCS) == 0)
873 errx(EX_USAGE, "ERROR: options -d, -E, and -W require a "
874 "process mode PMC to be specified.");
876 /* check for -c cpu with no system mode PMCs or logfile. */
877 if ((args.pa_required & FLAG_HAS_SYSTEM_PMCS) &&
878 (args.pa_flags & FLAG_HAS_SYSTEM_PMCS) == 0 &&
879 (args.pa_flags & FLAG_READ_LOGFILE) == 0)
880 errx(EX_USAGE, "ERROR: option -c requires at least one "
881 "system mode PMC to be specified.");
883 /* check for counting mode options without a counting PMC */
884 if ((args.pa_required & FLAG_HAS_COUNTING_PMCS) &&
885 (args.pa_flags & FLAG_HAS_COUNTING_PMCS) == 0)
886 errx(EX_USAGE, "ERROR: options -C, -W, -o and -w require at "
887 "least one counting mode PMC to be specified.");
889 /* check for sampling mode options without a sampling PMC spec */
890 if ((args.pa_required & FLAG_HAS_SAMPLING_PMCS) &&
891 (args.pa_flags & FLAG_HAS_SAMPLING_PMCS) == 0)
892 errx(EX_USAGE, "ERROR: options -N, -n and -O require at "
893 "least one sampling mode PMC to be specified.");
895 /* check if -g/-G are being used correctly */
896 if ((args.pa_flags & FLAG_DO_ANALYSIS) &&
897 !(args.pa_flags & (FLAG_HAS_SAMPLING_PMCS|FLAG_READ_LOGFILE)))
898 errx(EX_USAGE, "ERROR: options -g/-G require sampling PMCs "
899 "or -R to be specified.");
901 /* check if -O was spuriously specified */
902 if ((args.pa_flags & FLAG_HAS_OUTPUT_LOGFILE) &&
903 (args.pa_required & FLAG_HAS_OUTPUT_LOGFILE) == 0)
905 "ERROR: option -O is used only with options "
906 "-E, -P, -S and -W.");
908 /* -k kernel path require -g/-G or -R */
909 if ((args.pa_flags & FLAG_HAS_KERNELPATH) &&
910 (args.pa_flags & FLAG_DO_ANALYSIS) == 0 &&
911 (args.pa_flags & FLAG_READ_LOGFILE) == 0)
912 errx(EX_USAGE, "ERROR: option -k is only used with -g/-R.");
914 /* -D only applies to gprof output mode (-g) */
915 if ((args.pa_flags & FLAG_HAS_SAMPLESDIR) &&
916 (args.pa_flags & FLAG_DO_GPROF) == 0)
917 errx(EX_USAGE, "ERROR: option -D is only used with -g.");
919 /* -M mapfile requires -g or -R */
920 if (args.pa_mapfilename != NULL &&
921 (args.pa_flags & FLAG_DO_GPROF) == 0 &&
922 (args.pa_flags & FLAG_READ_LOGFILE) == 0)
923 errx(EX_USAGE, "ERROR: option -M is only used with -g/-R.");
926 * Disallow textual output of sampling PMCs if counting PMCs
927 * have also been asked for, mostly because the combined output
928 * is difficult to make sense of.
930 if ((args.pa_flags & FLAG_HAS_COUNTING_PMCS) &&
931 (args.pa_flags & FLAG_HAS_SAMPLING_PMCS) &&
932 ((args.pa_flags & FLAG_HAS_OUTPUT_LOGFILE) == 0))
933 errx(EX_USAGE, "ERROR: option -O is required if counting and "
934 "sampling PMCs are specified together.");
937 * Check if "-k kerneldir" was specified, and whether
938 * 'kerneldir' actually refers to a file. If so, use
939 * `dirname path` to determine the kernel directory.
941 if (args.pa_flags & FLAG_HAS_KERNELPATH) {
942 (void) snprintf(buffer, sizeof(buffer), "%s%s", args.pa_fsroot,
944 if (stat(buffer, &sb) < 0)
945 err(EX_OSERR, "ERROR: Cannot locate kernel \"%s\"",
947 if (!S_ISREG(sb.st_mode) && !S_ISDIR(sb.st_mode))
948 errx(EX_USAGE, "ERROR: \"%s\": Unsupported file type.",
950 if (!S_ISDIR(sb.st_mode)) {
951 tmp = args.pa_kernel;
952 args.pa_kernel = strdup(dirname(args.pa_kernel));
954 (void) snprintf(buffer, sizeof(buffer), "%s%s",
955 args.pa_fsroot, args.pa_kernel);
956 if (stat(buffer, &sb) < 0)
957 err(EX_OSERR, "ERROR: Cannot stat \"%s\"",
959 if (!S_ISDIR(sb.st_mode))
960 errx(EX_USAGE, "ERROR: \"%s\" is not a "
961 "directory.", buffer);
966 * If a callgraph is to be created, select the output file.
968 if (args.pa_flags & FLAG_DO_CALLGRAPHS) {
969 if (strcmp(graphfilename, "-") == 0)
970 args.pa_graphfile = args.pa_printfile;
972 args.pa_graphfile = fopen(graphfilename, "w");
973 if (args.pa_graphfile == NULL)
974 err(EX_OSERR, "ERROR: cannot open \"%s\" "
975 "for writing", graphfilename);
979 /* if we've been asked to process a log file, do that and exit */
980 if (args.pa_flags & FLAG_READ_LOGFILE) {
982 * Print the log in textual form if we haven't been
983 * asked to generate profiling information.
985 if ((args.pa_flags & FLAG_DO_ANALYSIS) == 0)
986 args.pa_flags |= FLAG_DO_PRINT;
988 pmcstat_initialize_logging(&args);
989 args.pa_logfd = pmcstat_open_log(args.pa_inputpath,
990 PMCSTAT_OPEN_FOR_READ);
991 if ((args.pa_logparser = pmclog_open(args.pa_logfd)) == NULL)
992 err(EX_OSERR, "ERROR: Cannot create parser");
993 pmcstat_process_log(&args);
994 pmcstat_shutdown_logging(&args);
998 /* otherwise, we've been asked to collect data */
1001 "ERROR: Initialization of the pmc(3) library failed");
1003 if ((npmc = pmc_npmc(0)) < 0) /* assume all CPUs are identical */
1004 err(EX_OSERR, "ERROR: Cannot determine the number of PMCs "
1007 /* Allocate a kqueue */
1008 if ((pmcstat_kq = kqueue()) < 0)
1009 err(EX_OSERR, "ERROR: Cannot allocate kqueue");
1012 * Configure the specified log file or setup a default log
1013 * consumer via a pipe.
1015 if (args.pa_required & FLAG_HAS_OUTPUT_LOGFILE) {
1016 if (args.pa_outputpath)
1017 args.pa_logfd = pmcstat_open_log(args.pa_outputpath,
1018 PMCSTAT_OPEN_FOR_WRITE);
1021 * process the log on the fly by reading it in
1024 if (pipe(pipefd) < 0)
1025 err(EX_OSERR, "ERROR: pipe(2) failed");
1027 if (fcntl(pipefd[READPIPEFD], F_SETFL, O_NONBLOCK) < 0)
1028 err(EX_OSERR, "ERROR: fcntl(2) failed");
1030 EV_SET(&kev, pipefd[READPIPEFD], EVFILT_READ, EV_ADD,
1033 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1034 err(EX_OSERR, "ERROR: Cannot register kevent");
1036 args.pa_logfd = pipefd[WRITEPIPEFD];
1038 args.pa_flags |= (FLAG_HAS_PIPE | FLAG_DO_PRINT);
1039 args.pa_logparser = pmclog_open(pipefd[READPIPEFD]);
1042 if (pmc_configure_logfile(args.pa_logfd) < 0)
1043 err(EX_OSERR, "ERROR: Cannot configure log file");
1046 /* remember to check for driver errors if we are sampling or logging */
1047 check_driver_stats = (args.pa_flags & FLAG_HAS_SAMPLING_PMCS) ||
1048 (args.pa_flags & FLAG_HAS_OUTPUT_LOGFILE);
1054 STAILQ_FOREACH(ev, &args.pa_events, ev_next) {
1055 if (pmc_allocate(ev->ev_spec, ev->ev_mode,
1056 ev->ev_flags, ev->ev_cpu, &ev->ev_pmcid) < 0)
1057 err(EX_OSERR, "ERROR: Cannot allocate %s-mode pmc with "
1058 "specification \"%s\"",
1059 PMC_IS_SYSTEM_MODE(ev->ev_mode) ? "system" : "process",
1062 if (PMC_IS_SAMPLING_MODE(ev->ev_mode) &&
1063 pmc_set(ev->ev_pmcid, ev->ev_count) < 0)
1064 err(EX_OSERR, "ERROR: Cannot set sampling count "
1065 "for PMC \"%s\"", ev->ev_name);
1068 /* compute printout widths */
1069 STAILQ_FOREACH(ev, &args.pa_events, ev_next) {
1074 (void) pmc_width(ev->ev_pmcid, &counter_width);
1075 header_width = strlen(ev->ev_name) + 2; /* prefix '%c/' */
1076 display_width = (int) floor(counter_width / 3.32193) + 1;
1078 if (PMC_IS_SYSTEM_MODE(ev->ev_mode))
1079 header_width += 3; /* 2 digit CPU number + '/' */
1081 if (header_width > display_width) {
1082 ev->ev_fieldskip = 0;
1083 ev->ev_fieldwidth = header_width;
1085 ev->ev_fieldskip = display_width -
1087 ev->ev_fieldwidth = display_width;
1092 * If our output is being set to a terminal, register a handler
1093 * for window size changes.
1096 if (isatty(fileno(args.pa_printfile))) {
1098 if (ioctl(fileno(args.pa_printfile), TIOCGWINSZ, &ws) < 0)
1099 err(EX_OSERR, "ERROR: Cannot determine window size");
1101 pmcstat_displayheight = ws.ws_row - 1;
1103 EV_SET(&kev, SIGWINCH, EVFILT_SIGNAL, EV_ADD, 0, 0, NULL);
1105 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1106 err(EX_OSERR, "ERROR: Cannot register kevent for "
1110 EV_SET(&kev, SIGINT, EVFILT_SIGNAL, EV_ADD, 0, 0, NULL);
1111 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1112 err(EX_OSERR, "ERROR: Cannot register kevent for SIGINT");
1114 EV_SET(&kev, SIGIO, EVFILT_SIGNAL, EV_ADD, 0, 0, NULL);
1115 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1116 err(EX_OSERR, "ERROR: Cannot register kevent for SIGIO");
1119 * An exec() failure of a forked child is signalled by the
1120 * child sending the parent a SIGCHLD. We don't register an
1121 * actual signal handler for SIGCHLD, but instead use our
1122 * kqueue to pick up the signal.
1124 EV_SET(&kev, SIGCHLD, EVFILT_SIGNAL, EV_ADD, 0, 0, NULL);
1125 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1126 err(EX_OSERR, "ERROR: Cannot register kevent for SIGCHLD");
1128 /* setup a timer if we have counting mode PMCs needing to be printed */
1129 if ((args.pa_flags & FLAG_HAS_COUNTING_PMCS) &&
1130 (args.pa_required & FLAG_HAS_OUTPUT_LOGFILE) == 0) {
1131 EV_SET(&kev, 0, EVFILT_TIMER, EV_ADD, 0,
1132 args.pa_interval * 1000, NULL);
1134 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1135 err(EX_OSERR, "ERROR: Cannot register kevent for "
1139 /* attach PMCs to the target process, starting it if specified */
1140 if (args.pa_flags & FLAG_HAS_COMMANDLINE)
1141 pmcstat_create_process(&args);
1143 if (check_driver_stats && pmc_get_driver_stats(&ds_start) < 0)
1144 err(EX_OSERR, "ERROR: Cannot retrieve driver statistics");
1146 /* Attach process pmcs to the target process. */
1147 if (args.pa_flags & FLAG_HAS_TARGET) {
1148 if (SLIST_EMPTY(&args.pa_targets))
1149 errx(EX_DATAERR, "ERROR: No matching target "
1152 pmcstat_attach_pmcs(&args);
1155 kvm_close(pmcstat_kvm);
1160 /* start the pmcs */
1161 pmcstat_start_pmcs(&args);
1163 /* start the (commandline) process if needed */
1164 if (args.pa_flags & FLAG_HAS_COMMANDLINE)
1165 pmcstat_start_process();
1167 /* initialize logging if printing the configured log */
1168 if ((args.pa_flags & FLAG_DO_PRINT) &&
1169 (args.pa_flags & (FLAG_HAS_PIPE | FLAG_HAS_OUTPUT_LOGFILE)))
1170 pmcstat_initialize_logging(&args);
1172 /* Handle SIGINT using the kqueue loop */
1173 sa.sa_handler = SIG_IGN;
1175 (void) sigemptyset(&sa.sa_mask);
1177 if (sigaction(SIGINT, &sa, NULL) < 0)
1178 err(EX_OSERR, "ERROR: Cannot install signal handler");
1181 * loop till either the target process (if any) exits, or we
1182 * are killed by a SIGINT.
1184 runstate = PMCSTAT_RUNNING;
1187 if ((c = kevent(pmcstat_kq, NULL, 0, &kev, 1, NULL)) <= 0) {
1189 err(EX_OSERR, "ERROR: kevent failed");
1194 if (kev.flags & EV_ERROR)
1195 errc(EX_OSERR, kev.data, "ERROR: kevent failed");
1197 switch (kev.filter) {
1198 case EVFILT_PROC: /* target has exited */
1199 if (args.pa_flags & (FLAG_HAS_OUTPUT_LOGFILE |
1201 runstate = pmcstat_close_log(&args);
1203 runstate = PMCSTAT_FINISHED;
1207 case EVFILT_READ: /* log file data is present */
1208 runstate = pmcstat_process_log(&args);
1212 if (kev.ident == SIGCHLD) {
1214 * The child process sends us a
1215 * SIGCHLD if its exec() failed. We
1216 * wait for it to exit and then exit
1220 runstate = PMCSTAT_FINISHED;
1221 } else if (kev.ident == SIGIO) {
1223 * We get a SIGIO if a PMC loses all
1224 * of its targets, or if logfile
1225 * writes encounter an error.
1227 if (args.pa_flags & (FLAG_HAS_OUTPUT_LOGFILE |
1229 runstate = pmcstat_close_log(&args);
1231 (FLAG_DO_PRINT|FLAG_DO_ANALYSIS))
1232 pmcstat_process_log(&args);
1234 do_print = 1; /* print PMCs at exit */
1235 runstate = PMCSTAT_FINISHED;
1236 } else if (kev.ident == SIGINT) {
1237 /* Kill the child process if we started it */
1238 if (args.pa_flags & FLAG_HAS_COMMANDLINE)
1239 pmcstat_kill_process(&args);
1240 runstate = PMCSTAT_FINISHED;
1241 } else if (kev.ident == SIGWINCH) {
1242 if (ioctl(fileno(args.pa_printfile),
1243 TIOCGWINSZ, &ws) < 0)
1244 err(EX_OSERR, "ERROR: Cannot determine "
1246 pmcstat_displayheight = ws.ws_row - 1;
1252 case EVFILT_TIMER: /* print out counting PMCs */
1259 (args.pa_required & FLAG_HAS_OUTPUT_LOGFILE) == 0) {
1260 pmcstat_print_pmcs(&args);
1261 if (runstate == PMCSTAT_FINISHED && /* final newline */
1262 (args.pa_flags & FLAG_DO_PRINT) == 0)
1263 (void) fprintf(args.pa_printfile, "\n");
1267 } while (runstate != PMCSTAT_FINISHED);
1269 /* flush any pending log entries */
1270 if (args.pa_flags & (FLAG_HAS_OUTPUT_LOGFILE | FLAG_HAS_PIPE))
1271 pmc_flush_logfile();
1273 pmcstat_cleanup(&args);
1275 free(args.pa_kernel);
1277 /* check if the driver lost any samples or events */
1278 if (check_driver_stats) {
1279 if (pmc_get_driver_stats(&ds_end) < 0)
1280 err(EX_OSERR, "ERROR: Cannot retrieve driver "
1282 if (ds_start.pm_intr_bufferfull != ds_end.pm_intr_bufferfull &&
1283 args.pa_verbosity > 0)
1284 warnx("WARNING: some samples were dropped. Please "
1285 "consider tuning the \"kern.hwpmc.nsamples\" "
1287 if (ds_start.pm_buffer_requests_failed !=
1288 ds_end.pm_buffer_requests_failed &&
1289 args.pa_verbosity > 0)
1290 warnx("WARNING: some events were discarded. Please "
1291 "consider tuning the \"kern.hwpmc.nbuffers\" "