2 * Copyright (c) 2003-2008, Joseph Koshy
3 * Copyright (c) 2007 The FreeBSD Foundation
6 * Portions of this software were developed by A. Joseph Koshy under
7 * sponsorship from the FreeBSD Foundation and Google, Inc.
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution.
18 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
22 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
34 #include <sys/types.h>
35 #include <sys/event.h>
36 #include <sys/param.h>
37 #include <sys/queue.h>
38 #include <sys/socket.h>
40 #include <sys/sysctl.h>
42 #include <sys/ttycom.h>
69 * A given invocation of pmcstat(8) can manage multiple PMCs of both
70 * the system-wide and per-process variety. Each of these could be in
71 * 'counting mode' or in 'sampling mode'.
73 * For 'counting mode' PMCs, pmcstat(8) will periodically issue a
74 * pmc_read() at the configured time interval and print out the value
75 * of the requested PMCs.
77 * For 'sampling mode' PMCs it can log to a file for offline analysis,
78 * or can analyse sampling data "on the fly", either by converting
79 * samples to printed textual form or by creating gprof(1) compatible
80 * profiles, one per program executed. When creating gprof(1)
81 * profiles it can optionally merge entries from multiple processes
82 * for a given executable into a single profile file.
84 * pmcstat(8) can also execute a command line and attach PMCs to the
85 * resulting child process. The protocol used is as follows:
87 * - parent creates a socketpair for two way communication and
93 * - Wait for child's token.
95 * - Awaits signal to start.
96 * - Attaches PMCs to the child's pid
97 * and starts them. Sets up
98 * monitoring for the child.
99 * - Signals child to start.
100 * - Receives signal, attempts exec().
102 * After this point normal processing can happen.
/* NOTE(review): no reader or writer of pmcstat_interrupt is visible in this view. */
107 int pmcstat_interrupt = 0;
/*
 * Line-count threshold that pmcstat_print_pmcs() compares against before
 * printing a new header; main() resets it from the terminal's row count.
 */
108 int pmcstat_displayheight = DEFAULT_DISPLAY_HEIGHT;
/* Socket pair used for the start-up handshake between parent and forked child. */
109 int pmcstat_sockpair[NSOCKPAIRFD];
/* Process list returned by kvm_getprocs() in pmcstat_find_targets(). */
112 struct kinfo_proc *pmcstat_plist;
/*
 * Attach process-mode PMCs to the target processes.
 *
 * Walks every event in a->pa_events and, for each target in
 * a->pa_targets, calls pmc_attach().  An attach failure with an errno
 * other than ESRCH is fatal (EX_OSERR).
 *
 * NOTE(review): some lines of this function are not visible in this
 * view (the action taken for system-mode events, the action on a
 * successful attach, and the condition guarding the final errx()) --
 * confirm against the complete source.
 */
115 pmcstat_attach_pmcs(struct pmcstat_args *a)
117 struct pmcstat_ev *ev;
118 struct pmcstat_target *pt;
121 /* Attach all process PMCs to target processes. */
123 STAILQ_FOREACH(ev, &a->pa_events, ev_next) {
124 if (PMC_IS_SYSTEM_MODE(ev->ev_mode))
126 SLIST_FOREACH(pt, &a->pa_targets, pt_next)
127 if (pmc_attach(ev->ev_pmcid, pt->pt_pid) == 0)
/* ESRCH is tolerated here; any other attach error aborts the program. */
129 else if (errno != ESRCH)
130 err(EX_OSERR, "ERROR: cannot attach pmc "
131 "\"%s\" to process %d", ev->ev_name,
136 errx(EX_DATAERR, "ERROR: No processes were attached to.");
/*
 * Release the resources held by a pmcstat run.
 *
 * Releases every allocated PMC and unlinks its event from a->pa_events,
 * de-configures the kernel log file, closes the log parser if one is
 * open, and shuts down logging when a pipe or an output log file was in
 * use.  A pmc_release() failure is fatal (EX_OSERR).
 *
 * NOTE(review): lines between the pmc_release() call and STAILQ_REMOVE()
 * are not visible in this view, so whether the event's memory is freed
 * cannot be confirmed from here.
 */
141 pmcstat_cleanup(struct pmcstat_args *a)
143 struct pmcstat_ev *ev, *tmp;
145 /* release allocated PMCs. */
/* The _SAFE iterator is needed because entries are removed during the walk. */
146 STAILQ_FOREACH_SAFE(ev, &a->pa_events, ev_next, tmp)
/* main() initialises ev_pmcid to PMC_ID_INVALID until pmc_allocate() succeeds. */
147 if (ev->ev_pmcid != PMC_ID_INVALID) {
148 if (pmc_release(ev->ev_pmcid) < 0)
149 err(EX_OSERR, "ERROR: cannot release pmc "
150 "0x%x \"%s\"", ev->ev_pmcid, ev->ev_name);
153 STAILQ_REMOVE(&a->pa_events, ev, pmcstat_ev, ev_next);
157 /* de-configure the log file if present. */
158 if (a->pa_flags & (FLAG_HAS_PIPE | FLAG_HAS_OUTPUT_LOGFILE))
159 (void) pmc_configure_logfile(-1);
/* Clear the pointer after closing so the parser is not closed twice. */
161 if (a->pa_logparser) {
162 pmclog_close(a->pa_logparser);
163 a->pa_logparser = NULL;
166 if (a->pa_flags & (FLAG_HAS_PIPE | FLAG_HAS_OUTPUT_LOGFILE))
167 pmcstat_shutdown_logging(a);
/*
 * Clone event descriptor 'ev' once for each CPU bit set in the CPU mask
 * and append every clone to the tail of a->pa_events.
 *
 * Each clone copies the scalar fields of 'ev', takes the CPU selected by
 * the current mask bit, and gets its own strdup()'d ev_name and ev_spec.
 * Failure to allocate the descriptor is fatal (EX_SOFTWARE).
 *
 * NOTE(review): the end of the parameter list and the lines between the
 * ffs() call and the malloc() are not visible in this view.  ffs()
 * returns a 1-based bit index, so confirm that 'cpu' is adjusted before
 * it is stored in ev_cpu and used as a shift count below.
 * NOTE(review): the strdup() results appear not to be checked for NULL.
 */
171 pmcstat_clone_event_descriptor(struct pmcstat_args *a, struct pmcstat_ev *ev,
175 struct pmcstat_ev *ev_clone;
/* Consume the mask one set bit at a time until it is empty. */
177 while ((cpu = ffs(cpumask)) > 0) {
180 if ((ev_clone = malloc(sizeof(*ev_clone))) == NULL)
181 errx(EX_SOFTWARE, "ERROR: Out of memory");
182 (void) memset(ev_clone, 0, sizeof(*ev_clone));
184 ev_clone->ev_count = ev->ev_count;
185 ev_clone->ev_cpu = cpu;
186 ev_clone->ev_cumulative = ev->ev_cumulative;
187 ev_clone->ev_flags = ev->ev_flags;
188 ev_clone->ev_mode = ev->ev_mode;
189 ev_clone->ev_name = strdup(ev->ev_name);
190 ev_clone->ev_pmcid = ev->ev_pmcid;
191 ev_clone->ev_saved = ev->ev_saved;
192 ev_clone->ev_spec = strdup(ev->ev_spec);
194 STAILQ_INSERT_TAIL(&a->pa_events, ev_clone, ev_next);
/* Clear the bit just handled so the loop terminates. */
196 cpumask &= ~(1 << cpu);
/*
 * Fork the child that will run the command line in a->pa_argv and
 * record it as a target process.
 *
 * Child: closes the parent's end of the socket pair, writes a "+" token
 * to the parent, reads a token back, and then calls execvp().  If
 * execvp() returns, the child sends SIGCHLD to its parent and exits via
 * err().
 *
 * Parent: closes the child's end, registers a one-shot NOTE_EXIT kevent
 * for the child on pmcstat_kq, inserts a new pmcstat_target at the head
 * of a->pa_targets, and reads the child's token.
 *
 * Failures of socketpair(), fork(), kevent(), malloc() and the token
 * exchange are fatal.
 *
 * NOTE(review): both read() calls treat only a negative return as an
 * error; a return of 0 (peer closed the socket) is not distinguished
 * from success.
 * NOTE(review): the case labels and the initialisation of the new
 * target entry are not visible in this view.
 */
201 pmcstat_create_process(struct pmcstat_args *a)
206 struct pmcstat_target *pt;
208 if (socketpair(AF_UNIX, SOCK_STREAM, 0, pmcstat_sockpair) < 0)
209 err(EX_OSERR, "ERROR: cannot create socket pair");
211 switch (pid = fork()) {
213 err(EX_OSERR, "ERROR: cannot fork");
217 (void) close(pmcstat_sockpair[PARENTSOCKET]);
219 /* Write a token to tell our parent we've started executing. */
220 if (write(pmcstat_sockpair[CHILDSOCKET], "+", 1) != 1)
221 err(EX_OSERR, "ERROR (child): cannot write token");
223 /* Wait for our parent to signal us to start. */
224 if (read(pmcstat_sockpair[CHILDSOCKET], &token, 1) < 0)
225 err(EX_OSERR, "ERROR (child): cannot read token");
226 (void) close(pmcstat_sockpair[CHILDSOCKET]);
228 /* exec() the program requested */
229 execvp(*a->pa_argv, a->pa_argv);
230 /* and if that fails, notify the parent */
231 kill(getppid(), SIGCHLD);
232 err(EX_OSERR, "ERROR: execvp \"%s\" failed", *a->pa_argv);
235 default: /* parent */
236 (void) close(pmcstat_sockpair[CHILDSOCKET]);
240 /* Ask to be notified via a kevent when the target process exits. */
241 EV_SET(&kev, pid, EVFILT_PROC, EV_ADD|EV_ONESHOT, NOTE_EXIT, 0,
243 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
244 err(EX_OSERR, "ERROR: cannot monitor child process %d", pid);
246 if ((pt = malloc(sizeof(*pt))) == NULL)
247 errx(EX_SOFTWARE, "ERROR: Out of memory.");
/* Head insertion: pmcstat_kill_process() takes the first list entry as the child. */
250 SLIST_INSERT_HEAD(&a->pa_targets, pt, pt_next);
252 /* Wait for the child to signal that it's ready to go. */
253 if (read(pmcstat_sockpair[PARENTSOCKET], &token, 1) < 0)
254 err(EX_OSERR, "ERROR (parent): cannot read token");
/*
 * Add the processes described by 'spec' to a->pa_targets.
 *
 * 'spec' is first parsed with strtol(); if it starts with a non-negative
 * number it is taken as a process id and a single target is inserted.
 * Otherwise 'spec' is compiled as an extended regular expression and
 * matched against the ki_comm field of every entry in the process list
 * obtained through kvm_getprocs(); each match becomes a target.
 *
 * The kvm handle is opened only when pmcstat_kvm is still NULL.
 *
 * NOTE(review): the '®' characters below look like a mis-encoded
 * '&reg' (address of a regex_t) and '&regmatch' -- confirm against the
 * upstream source before compiling.
 * NOTE(review): the pid test does not reject trailing characters after
 * the number, and the long returned by strtol() is stored in an int.
 * NOTE(review): the regcomp() failure path calls err(), which also
 * prints strerror(errno); errx() may have been intended -- confirm.
 * NOTE(review): several lines (malloc failure handling, the pid
 * assignment for the numeric case, and the context of the final errx())
 * are not visible in this view.
 */
260 pmcstat_find_targets(struct pmcstat_args *a, const char *spec)
262 int n, nproc, pid, rv;
263 struct pmcstat_target *pt;
264 char errbuf[_POSIX2_LINE_MAX], *end;
265 static struct kinfo_proc *kp;
269 /* First check if we've been given a process id. */
270 pid = strtol(spec, &end, 0);
271 if (end != spec && pid >= 0) {
272 if ((pt = malloc(sizeof(*pt))) == NULL)
275 SLIST_INSERT_HEAD(&a->pa_targets, pt, pt_next);
279 /* Otherwise treat arg as a regular expression naming processes. */
280 if (pmcstat_kvm == NULL) {
281 if ((pmcstat_kvm = kvm_openfiles(NULL, "/dev/null", NULL, 0,
283 err(EX_OSERR, "ERROR: Cannot open kernel \"%s\"",
285 if ((pmcstat_plist = kvm_getprocs(pmcstat_kvm, KERN_PROC_PROC,
287 err(EX_OSERR, "ERROR: Cannot get process list: %s",
288 kvm_geterr(pmcstat_kvm));
291 if ((rv = regcomp(®, spec, REG_EXTENDED|REG_NOSUB)) != 0) {
292 regerror(rv, ®, errbuf, sizeof(errbuf));
293 err(EX_DATAERR, "ERROR: Failed to compile regex \"%s\": %s",
/* Test every process name in the list against the compiled expression. */
297 for (n = 0, kp = pmcstat_plist; n < nproc; n++, kp++) {
298 if ((rv = regexec(®, kp->ki_comm, 1, ®match, 0)) == 0) {
299 if ((pt = malloc(sizeof(*pt))) == NULL)
301 pt->pt_pid = kp->ki_pid;
302 SLIST_INSERT_HEAD(&a->pa_targets, pt, pt_next);
/* REG_NOMATCH is the normal "no match" result; anything else is a real error. */
303 } else if (rv != REG_NOMATCH) {
304 regerror(rv, ®, errbuf, sizeof(errbuf));
305 errx(EX_SOFTWARE, "ERROR: Regex evalation failed: %s",
315 errx(EX_SOFTWARE, "Out of memory.");
/*
 * Convert the textual CPU list 'cpuspec' into a bit mask.
 *
 * Each CPU number is parsed with strtol() (base auto-detected) and its
 * bit is OR-ed into the mask.  A negative number, or text that does not
 * parse as a number, is a usage error (EX_USAGE).  Numbers may be
 * separated by commas, spaces or tabs.
 *
 * NOTE(review): no upper bound on 'cpu' is visible before '1 << cpu'; a
 * value at or above the bit width of int makes the shift undefined.
 * Confirm whether a range check exists in the lines not visible here.
 * NOTE(review): the loop construct, local declarations and the return
 * statement are not visible in this view.
 */
320 pmcstat_get_cpumask(const char *cpuspec)
331 cpu = strtol(s, &end, 0);
332 if (cpu < 0 || end == s)
333 errx(EX_USAGE, "ERROR: Illegal CPU specification "
335 cpumask |= (1 << cpu);
/* Skip the separators that follow the number just parsed. */
336 s = end + strspn(end, ", \t");
/*
 * Send SIGINT to the process that was started from the command line.
 *
 * Asserts that FLAG_HAS_COMMANDLINE is set in a->pa_flags, takes the
 * first entry of a->pa_targets as the child, and signals it.  A kill()
 * failure is fatal (EX_OSERR).
 *
 * NOTE(review): lines between SLIST_FIRST() and kill() are not visible
 * in this view, so any NULL check on 'pt' cannot be confirmed from here.
 */
343 pmcstat_kill_process(struct pmcstat_args *a)
345 struct pmcstat_target *pt;
347 assert(a->pa_flags & FLAG_HAS_COMMANDLINE);
350 * If a command line was specified, it would be the very first
351 * in the list, before any other processes specified by -t.
353 pt = SLIST_FIRST(&a->pa_targets);
356 if (kill(pt->pt_pid, SIGINT) != 0)
357 err(EX_OSERR, "ERROR: cannot signal child process");
/*
 * Start every PMC in the event list with pmc_start().
 *
 * Each event is asserted to hold a valid PMC id.  A pmc_start() failure
 * is reported with warn().
 *
 * NOTE(review): the loop iterates the global 'args.pa_events' rather
 * than the parameter 'a' -- the two agree only when the caller passes
 * &args (as main() does); confirm whether 'a->pa_events' was intended.
 * NOTE(review): the statements following the warn() call are not
 * visible in this view.
 */
361 pmcstat_start_pmcs(struct pmcstat_args *a)
363 struct pmcstat_ev *ev;
365 STAILQ_FOREACH(ev, &args.pa_events, ev_next) {
367 assert(ev->ev_pmcid != PMC_ID_INVALID);
369 if (pmc_start(ev->ev_pmcid) < 0) {
370 warn("ERROR: Cannot start pmc 0x%x \"%s\"",
371 ev->ev_pmcid, ev->ev_name);
/*
 * Print the column-header line for the PMCs to a->pa_printfile.
 *
 * Writes PRINT_HEADER_PREFIX, then one header field per event.  Each
 * field is preceded by ev_fieldskip blanks when that value is non-zero.
 * Two layouts are used: "s/<cpu>/<name>" and "p/<name>", with the name
 * width derived from ev_fieldwidth and ev_fieldskip.  The stream is
 * flushed at the end.
 *
 * NOTE(review): the action taken for sampling-mode events and the test
 * that chooses between the two layouts (presumably on 'c') are not
 * visible in this view.
 */
380 pmcstat_print_headers(struct pmcstat_args *a)
382 struct pmcstat_ev *ev;
385 (void) fprintf(a->pa_printfile, PRINT_HEADER_PREFIX);
387 STAILQ_FOREACH(ev, &a->pa_events, ev_next) {
388 if (PMC_IS_SAMPLING_MODE(ev->ev_mode))
/* 's' marks a system-mode event, 'p' a process-mode one. */
391 c = PMC_IS_SYSTEM_MODE(ev->ev_mode) ? 's' : 'p';
393 if (ev->ev_fieldskip != 0)
394 (void) fprintf(a->pa_printfile, "%*s",
395 ev->ev_fieldskip, "");
/* The 2 subtracted here matches the two-character "s/" or "p/" prefix. */
396 w = ev->ev_fieldwidth - ev->ev_fieldskip - 2;
/* The extra 3 columns taken off 'w' match the "%02d/" CPU field. */
399 (void) fprintf(a->pa_printfile, "s/%02d/%-*s ",
400 ev->ev_cpu, w-3, ev->ev_name);
402 (void) fprintf(a->pa_printfile, "p/%*s ", w,
406 (void) fflush(a->pa_printfile);
/*
 * Read and print the current value of each counting-mode PMC.
 *
 * For every event that is not in sampling mode, the counter is read with
 * pmc_read() and printed to a->pa_printfile.  When ev_cumulative is set
 * the raw value is printed; otherwise the difference from the previously
 * saved value is printed and the new value is saved in ev_saved.  A
 * pmc_read() failure is fatal (EX_OSERR).  The stream is flushed at the
 * end.
 *
 * NOTE(review): the (uintmax_t) cast binds to 'ev->ev_cumulative', not
 * to the whole conditional expression, so the value passed for "%ju" has
 * the type of 'value' rather than uintmax_t -- confirm the intent.
 * NOTE(review): lines that adjust 'extra_width' after the first column
 * are not visible in this view.
 */
410 pmcstat_print_counters(struct pmcstat_args *a)
413 struct pmcstat_ev *ev;
/* Width of the header prefix without its terminating NUL. */
416 extra_width = sizeof(PRINT_HEADER_PREFIX) - 1;
418 STAILQ_FOREACH(ev, &a->pa_events, ev_next) {
420 /* skip sampling mode counters */
421 if (PMC_IS_SAMPLING_MODE(ev->ev_mode))
424 if (pmc_read(ev->ev_pmcid, &value) < 0)
425 err(EX_OSERR, "ERROR: Cannot read pmc "
426 "\"%s\"", ev->ev_name);
428 (void) fprintf(a->pa_printfile, "%*ju ",
429 ev->ev_fieldwidth + extra_width,
430 (uintmax_t) ev->ev_cumulative ? value :
431 (value - ev->ev_saved));
/* Remember this reading so the next non-cumulative print shows a delta. */
433 if (ev->ev_cumulative == 0)
434 ev->ev_saved = value;
438 (void) fflush(a->pa_printfile);
/*
 * Print one line of counter values, emitting a header line when needed.
 *
 * A function-local static line counter is incremented on every call and
 * compared against pmcstat_displayheight to decide when the headers must
 * be printed again; the counters are then printed with
 * pmcstat_print_counters().
 *
 * NOTE(review): the lines that reset 'linecount' and that guard the
 * call to pmcstat_print_headers() are not visible in this view.
 */
446 pmcstat_print_pmcs(struct pmcstat_args *a)
/* Persists across calls: counts lines printed since the last header. */
448 static int linecount = 0;
450 /* check if we need to print a header line */
451 if (++linecount > pmcstat_displayheight) {
452 (void) fprintf(a->pa_printfile, "\n");
456 pmcstat_print_headers(a);
457 (void) fprintf(a->pa_printfile, "\n");
459 pmcstat_print_counters(a);
465 * Do process profiling
467 * If a pid was specified, attach each allocated PMC to the target
468 * process. Otherwise, fork a child and attach the PMCs to the child,
469 * and have the child exec() the target program.
/*
 * Release the forked child so that it can exec() the target program.
 *
 * Writes a one-byte "!" token on the parent's end of pmcstat_sockpair
 * (the child in pmcstat_create_process() is waiting to read it) and then
 * closes that end.  A failed or short write is fatal (EX_OSERR).
 */
473 pmcstat_start_process(void)
475 /* Signal the child to proceed. */
476 if (write(pmcstat_sockpair[PARENTSOCKET], "!", 1) != 1)
477 err(EX_OSERR, "ERROR (parent): write of token failed");
479 (void) close(pmcstat_sockpair[PARENTSOCKET]);
/*
 * Usage text for pmcstat(8).
 *
 * The option letters listed here are the same set that main() passes to
 * getopt(): C D E G M N O P R S W c d g k n o p q r s t v w z.  Keep the
 * two in step when adding or removing an option.
 *
 * NOTE(review): the call that emits this text, and the tail of the
 * string after the "-z" line, are not visible in this view.
 */
483 pmcstat_show_usage(void)
486 "[options] [commandline]\n"
487 "\t Measure process and/or system performance using hardware\n"
488 "\t performance monitoring counters.\n"
489 "\t Options include:\n"
490 "\t -C\t\t (toggle) show cumulative counts\n"
491 "\t -D path\t create profiles in directory \"path\"\n"
492 "\t -E\t\t (toggle) show counts at process exit\n"
493 "\t -G file\t write a system-wide callgraph to \"file\"\n"
494 "\t -M file\t print executable/gmon file map to \"file\"\n"
495 "\t -N\t\t (toggle) capture callchains\n"
496 "\t -O file\t send log output to \"file\"\n"
497 "\t -P spec\t allocate a process-private sampling PMC\n"
498 "\t -R file\t read events from \"file\"\n"
499 "\t -S spec\t allocate a system-wide sampling PMC\n"
500 "\t -W\t\t (toggle) show counts per context switch\n"
501 "\t -c cpu-list\t set cpus for subsequent system-wide PMCs\n"
502 "\t -d\t\t (toggle) track descendants\n"
503 "\t -g\t\t produce gprof(1) compatible profiles\n"
504 "\t -k dir\t\t set the path to the kernel\n"
505 "\t -n rate\t set sampling rate\n"
506 "\t -o file\t send print output to \"file\"\n"
507 "\t -p spec\t allocate a process-private counting PMC\n"
508 "\t -q\t\t suppress verbosity\n"
509 "\t -r fsroot\t specify FS root directory\n"
510 "\t -s spec\t allocate a system-wide counting PMC\n"
511 "\t -t process-spec attach to running processes matching "
513 "\t -v\t\t increase verbosity\n"
514 "\t -w secs\t set printing time interval\n"
515 "\t -z depth\t limit callchain display depth"
524 main(int argc, char **argv)
527 int option, npmc, ncpu, haltedcpus;
528 int c, check_driver_stats, current_cpu, current_sampling_count;
529 int do_callchain, do_descendants, do_logproccsw, do_logprocexit;
534 int use_cumulative_counts;
537 const char *errmsg, *graphfilename;
538 enum pmcstat_state runstate;
539 struct pmc_driverstats ds_start, ds_end;
540 struct pmcstat_ev *ev;
545 char buffer[PATH_MAX];
547 check_driver_stats = 0;
549 current_sampling_count = DEFAULT_SAMPLE_COUNT;
554 use_cumulative_counts = 0;
556 args.pa_required = 0;
558 args.pa_verbosity = 1;
561 args.pa_kernel = strdup("/boot/kernel");
562 args.pa_samplesdir = ".";
563 args.pa_printfile = stderr;
564 args.pa_graphdepth = DEFAULT_CALLGRAPH_DEPTH;
565 args.pa_graphfile = NULL;
566 args.pa_interval = DEFAULT_WAIT_INTERVAL;
567 args.pa_mapfilename = NULL;
568 args.pa_inputpath = NULL;
569 args.pa_outputpath = NULL;
570 STAILQ_INIT(&args.pa_events);
571 SLIST_INIT(&args.pa_targets);
572 bzero(&ds_start, sizeof(ds_start));
573 bzero(&ds_end, sizeof(ds_end));
577 * The initial CPU mask specifies all non-halted CPUS in the
581 if (sysctlbyname("hw.ncpu", &ncpu, &dummy, NULL, 0) < 0)
582 err(EX_OSERR, "ERROR: Cannot determine the number of CPUs");
583 cpumask = (1 << ncpu) - 1;
585 if (sysctlbyname("machdep.hlt_cpus", &haltedcpus, &dummy,
587 err(EX_OSERR, "ERROR: Cannot determine which CPUs are "
589 cpumask &= ~haltedcpus;
592 while ((option = getopt(argc, argv,
593 "CD:EG:M:NO:P:R:S:Wc:dgk:n:o:p:qr:s:t:vw:z:")) != -1)
595 case 'C': /* cumulative values */
596 use_cumulative_counts = !use_cumulative_counts;
597 args.pa_required |= FLAG_HAS_COUNTING_PMCS;
602 if (optarg[0] == '*' && optarg[1] == '\0')
603 cpumask = (1 << ncpu) - 1;
605 cpumask = pmcstat_get_cpumask(optarg);
607 args.pa_required |= FLAG_HAS_SYSTEM_PMCS;
611 if (stat(optarg, &sb) < 0)
612 err(EX_OSERR, "ERROR: Cannot stat \"%s\"",
614 if (!S_ISDIR(sb.st_mode))
615 errx(EX_USAGE, "ERROR: \"%s\" is not a "
616 "directory.", optarg);
617 args.pa_samplesdir = optarg;
618 args.pa_flags |= FLAG_HAS_SAMPLESDIR;
619 args.pa_required |= FLAG_DO_GPROF;
622 case 'd': /* toggle descendents */
623 do_descendants = !do_descendants;
624 args.pa_required |= FLAG_HAS_PROCESS_PMCS;
627 case 'G': /* produce a system-wide callgraph */
628 args.pa_flags |= FLAG_DO_CALLGRAPHS;
629 graphfilename = optarg;
632 case 'g': /* produce gprof compatible profiles */
633 args.pa_flags |= FLAG_DO_GPROF;
636 case 'k': /* pathname to the kernel */
637 free(args.pa_kernel);
638 args.pa_kernel = strdup(optarg);
639 args.pa_required |= FLAG_DO_ANALYSIS;
640 args.pa_flags |= FLAG_HAS_KERNELPATH;
643 case 'E': /* log process exit */
644 do_logprocexit = !do_logprocexit;
645 args.pa_required |= (FLAG_HAS_PROCESS_PMCS |
646 FLAG_HAS_COUNTING_PMCS | FLAG_HAS_OUTPUT_LOGFILE);
649 case 'M': /* mapfile */
650 args.pa_mapfilename = optarg;
654 do_callchain = !do_callchain;
655 args.pa_required |= FLAG_HAS_SAMPLING_PMCS;
658 case 'p': /* process virtual counting PMC */
659 case 's': /* system-wide counting PMC */
660 case 'P': /* process virtual sampling PMC */
661 case 'S': /* system-wide sampling PMC */
662 if ((ev = malloc(sizeof(*ev))) == NULL)
663 errx(EX_SOFTWARE, "ERROR: Out of memory.");
666 case 'p': ev->ev_mode = PMC_MODE_TC; break;
667 case 's': ev->ev_mode = PMC_MODE_SC; break;
668 case 'P': ev->ev_mode = PMC_MODE_TS; break;
669 case 'S': ev->ev_mode = PMC_MODE_SS; break;
672 if (option == 'P' || option == 'p') {
673 args.pa_flags |= FLAG_HAS_PROCESS_PMCS;
674 args.pa_required |= (FLAG_HAS_COMMANDLINE |
678 if (option == 'P' || option == 'S') {
679 args.pa_flags |= FLAG_HAS_SAMPLING_PMCS;
680 args.pa_required |= (FLAG_HAS_PIPE |
681 FLAG_HAS_OUTPUT_LOGFILE);
684 if (option == 'p' || option == 's')
685 args.pa_flags |= FLAG_HAS_COUNTING_PMCS;
687 if (option == 's' || option == 'S')
688 args.pa_flags |= FLAG_HAS_SYSTEM_PMCS;
690 ev->ev_spec = strdup(optarg);
692 if (option == 'S' || option == 'P')
693 ev->ev_count = current_sampling_count;
697 if (option == 'S' || option == 's')
698 ev->ev_cpu = ffs(cpumask) - 1;
700 ev->ev_cpu = PMC_CPU_ANY;
704 ev->ev_flags |= PMC_F_CALLCHAIN;
706 ev->ev_flags |= PMC_F_DESCENDANTS;
708 ev->ev_flags |= PMC_F_LOG_PROCEXIT;
710 ev->ev_flags |= PMC_F_LOG_PROCCSW;
712 ev->ev_cumulative = use_cumulative_counts;
715 ev->ev_pmcid = PMC_ID_INVALID;
717 /* extract event name */
718 c = strcspn(optarg, ", \t");
719 ev->ev_name = malloc(c + 1);
720 (void) strncpy(ev->ev_name, optarg, c);
721 *(ev->ev_name + c) = '\0';
723 STAILQ_INSERT_TAIL(&args.pa_events, ev, ev_next);
725 if (option == 's' || option == 'S')
726 pmcstat_clone_event_descriptor(&args, ev,
727 cpumask & ~(1 << ev->ev_cpu));
731 case 'n': /* sampling count */
732 current_sampling_count = strtol(optarg, &end, 0);
733 if (*end != '\0' || current_sampling_count <= 0)
735 "ERROR: Illegal count value \"%s\".",
737 args.pa_required |= FLAG_HAS_SAMPLING_PMCS;
740 case 'o': /* outputfile */
741 if (args.pa_printfile != NULL)
742 (void) fclose(args.pa_printfile);
743 if ((args.pa_printfile = fopen(optarg, "w")) == NULL)
744 errx(EX_OSERR, "ERROR: cannot open \"%s\" for "
746 args.pa_flags |= FLAG_DO_PRINT;
749 case 'O': /* sampling output */
750 if (args.pa_outputpath)
751 errx(EX_USAGE, "ERROR: option -O may only be "
753 args.pa_outputpath = optarg;
754 args.pa_flags |= FLAG_HAS_OUTPUT_LOGFILE;
757 case 'q': /* quiet mode */
758 args.pa_verbosity = 0;
761 case 'r': /* root FS path */
762 args.pa_fsroot = optarg;
765 case 'R': /* read an existing log file */
766 if (args.pa_inputpath != NULL)
767 errx(EX_USAGE, "ERROR: option -R may only be "
769 args.pa_inputpath = optarg;
770 if (args.pa_printfile == stderr)
771 args.pa_printfile = stdout;
772 args.pa_flags |= FLAG_READ_LOGFILE;
775 case 't': /* target pid or process name */
776 pmcstat_find_targets(&args, optarg);
778 args.pa_flags |= FLAG_HAS_TARGET;
779 args.pa_required |= FLAG_HAS_PROCESS_PMCS;
782 case 'v': /* verbose */
786 case 'w': /* wait interval */
787 interval = strtod(optarg, &end);
788 if (*end != '\0' || interval <= 0)
789 errx(EX_USAGE, "ERROR: Illegal wait interval "
790 "value \"%s\".", optarg);
791 args.pa_flags |= FLAG_HAS_WAIT_INTERVAL;
792 args.pa_required |= FLAG_HAS_COUNTING_PMCS;
793 args.pa_interval = interval;
796 case 'W': /* toggle LOG_CSW */
797 do_logproccsw = !do_logproccsw;
798 args.pa_required |= (FLAG_HAS_PROCESS_PMCS |
799 FLAG_HAS_COUNTING_PMCS | FLAG_HAS_OUTPUT_LOGFILE);
803 graphdepth = strtod(optarg, &end);
804 if (*end != '\0' || graphdepth <= 0)
805 errx(EX_USAGE, "ERROR: Illegal callchain "
806 "depth \"%s\".", optarg);
807 args.pa_graphdepth = graphdepth;
808 args.pa_required |= FLAG_DO_CALLGRAPHS;
813 pmcstat_show_usage();
818 args.pa_argc = (argc -= optind);
819 args.pa_argv = (argv += optind);
821 args.pa_cpumask = cpumask; /* For selecting CPUs using -R. */
823 if (argc) /* command line present */
824 args.pa_flags |= FLAG_HAS_COMMANDLINE;
826 if (args.pa_flags & (FLAG_DO_GPROF | FLAG_DO_CALLGRAPHS))
827 args.pa_flags |= FLAG_DO_ANALYSIS;
830 * Check invocation syntax.
833 /* disallow -O and -R together */
834 if (args.pa_outputpath && args.pa_inputpath)
835 errx(EX_USAGE, "ERROR: options -O and -R are mutually "
838 if (args.pa_flags & FLAG_READ_LOGFILE) {
840 if (args.pa_flags & FLAG_HAS_COMMANDLINE)
841 errmsg = "a command line specification";
842 else if (args.pa_flags & FLAG_HAS_TARGET)
843 errmsg = "option -t";
844 else if (!STAILQ_EMPTY(&args.pa_events))
845 errmsg = "a PMC event specification";
847 errx(EX_USAGE, "ERROR: option -R may not be used with "
849 } else if (STAILQ_EMPTY(&args.pa_events))
850 /* All other uses require a PMC spec. */
851 pmcstat_show_usage();
853 /* check for -t pid without a process PMC spec */
854 if ((args.pa_required & FLAG_HAS_TARGET) &&
855 (args.pa_flags & FLAG_HAS_PROCESS_PMCS) == 0)
856 errx(EX_USAGE, "ERROR: option -t requires a process mode PMC "
859 /* check for process-mode options without a command or -t pid */
860 if ((args.pa_required & FLAG_HAS_PROCESS_PMCS) &&
861 (args.pa_flags & (FLAG_HAS_COMMANDLINE | FLAG_HAS_TARGET)) == 0)
862 errx(EX_USAGE, "ERROR: options -d, -E, -p, -P, and -W require "
863 "a command line or target process.");
865 /* check for -p | -P without a target process of some sort */
866 if ((args.pa_required & (FLAG_HAS_COMMANDLINE | FLAG_HAS_TARGET)) &&
867 (args.pa_flags & (FLAG_HAS_COMMANDLINE | FLAG_HAS_TARGET)) == 0)
868 errx(EX_USAGE, "ERROR: options -P and -p require a "
869 "target process or a command line.");
871 /* check for process-mode options without a process-mode PMC */
872 if ((args.pa_required & FLAG_HAS_PROCESS_PMCS) &&
873 (args.pa_flags & FLAG_HAS_PROCESS_PMCS) == 0)
874 errx(EX_USAGE, "ERROR: options -d, -E, and -W require a "
875 "process mode PMC to be specified.");
877 /* check for -c cpu with no system mode PMCs or logfile. */
878 if ((args.pa_required & FLAG_HAS_SYSTEM_PMCS) &&
879 (args.pa_flags & FLAG_HAS_SYSTEM_PMCS) == 0 &&
880 (args.pa_flags & FLAG_READ_LOGFILE) == 0)
881 errx(EX_USAGE, "ERROR: option -c requires at least one "
882 "system mode PMC to be specified.");
884 /* check for counting mode options without a counting PMC */
885 if ((args.pa_required & FLAG_HAS_COUNTING_PMCS) &&
886 (args.pa_flags & FLAG_HAS_COUNTING_PMCS) == 0)
887 errx(EX_USAGE, "ERROR: options -C, -W, -o and -w require at "
888 "least one counting mode PMC to be specified.");
890 /* check for sampling mode options without a sampling PMC spec */
891 if ((args.pa_required & FLAG_HAS_SAMPLING_PMCS) &&
892 (args.pa_flags & FLAG_HAS_SAMPLING_PMCS) == 0)
893 errx(EX_USAGE, "ERROR: options -N, -n and -O require at "
894 "least one sampling mode PMC to be specified.");
896 /* check if -g/-G are being used correctly */
897 if ((args.pa_flags & FLAG_DO_ANALYSIS) &&
898 !(args.pa_flags & (FLAG_HAS_SAMPLING_PMCS|FLAG_READ_LOGFILE)))
899 errx(EX_USAGE, "ERROR: options -g/-G require sampling PMCs "
900 "or -R to be specified.");
902 /* check if -O was spuriously specified */
903 if ((args.pa_flags & FLAG_HAS_OUTPUT_LOGFILE) &&
904 (args.pa_required & FLAG_HAS_OUTPUT_LOGFILE) == 0)
906 "ERROR: option -O is used only with options "
907 "-E, -P, -S and -W.");
909 /* -k kernel path requires -g/-G or -R */
910 if ((args.pa_flags & FLAG_HAS_KERNELPATH) &&
911 (args.pa_flags & FLAG_DO_ANALYSIS) == 0 &&
912 (args.pa_flags & FLAG_READ_LOGFILE) == 0)
913 errx(EX_USAGE, "ERROR: option -k is only used with -g/-R.");
915 /* -D only applies to gprof output mode (-g) */
916 if ((args.pa_flags & FLAG_HAS_SAMPLESDIR) &&
917 (args.pa_flags & FLAG_DO_GPROF) == 0)
918 errx(EX_USAGE, "ERROR: option -D is only used with -g.");
920 /* -M mapfile requires -g or -R */
921 if (args.pa_mapfilename != NULL &&
922 (args.pa_flags & FLAG_DO_GPROF) == 0 &&
923 (args.pa_flags & FLAG_READ_LOGFILE) == 0)
924 errx(EX_USAGE, "ERROR: option -M is only used with -g/-R.");
927 * Disallow textual output of sampling PMCs if counting PMCs
928 * have also been asked for, mostly because the combined output
929 * is difficult to make sense of.
931 if ((args.pa_flags & FLAG_HAS_COUNTING_PMCS) &&
932 (args.pa_flags & FLAG_HAS_SAMPLING_PMCS) &&
933 ((args.pa_flags & FLAG_HAS_OUTPUT_LOGFILE) == 0))
934 errx(EX_USAGE, "ERROR: option -O is required if counting and "
935 "sampling PMCs are specified together.");
938 * Check if "-k kerneldir" was specified, and whether
939 * 'kerneldir' actually refers to a file. If so, use
940 * `dirname path` to determine the kernel directory.
942 if (args.pa_flags & FLAG_HAS_KERNELPATH) {
943 (void) snprintf(buffer, sizeof(buffer), "%s%s", args.pa_fsroot,
945 if (stat(buffer, &sb) < 0)
946 err(EX_OSERR, "ERROR: Cannot locate kernel \"%s\"",
948 if (!S_ISREG(sb.st_mode) && !S_ISDIR(sb.st_mode))
949 errx(EX_USAGE, "ERROR: \"%s\": Unsupported file type.",
951 if (!S_ISDIR(sb.st_mode)) {
952 tmp = args.pa_kernel;
953 args.pa_kernel = strdup(dirname(args.pa_kernel));
955 (void) snprintf(buffer, sizeof(buffer), "%s%s",
956 args.pa_fsroot, args.pa_kernel);
957 if (stat(buffer, &sb) < 0)
958 err(EX_OSERR, "ERROR: Cannot stat \"%s\"",
960 if (!S_ISDIR(sb.st_mode))
961 errx(EX_USAGE, "ERROR: \"%s\" is not a "
962 "directory.", buffer);
967 * If a callgraph is to be created, select the output file.
969 if (args.pa_flags & FLAG_DO_CALLGRAPHS) {
970 if (strcmp(graphfilename, "-") == 0)
971 args.pa_graphfile = args.pa_printfile;
973 args.pa_graphfile = fopen(graphfilename, "w");
974 if (args.pa_graphfile == NULL)
975 err(EX_OSERR, "ERROR: cannot open \"%s\" "
976 "for writing", graphfilename);
980 /* if we've been asked to process a log file, do that and exit */
981 if (args.pa_flags & FLAG_READ_LOGFILE) {
983 * Print the log in textual form if we haven't been
984 * asked to generate profiling information.
986 if ((args.pa_flags & FLAG_DO_ANALYSIS) == 0)
987 args.pa_flags |= FLAG_DO_PRINT;
989 pmcstat_initialize_logging(&args);
990 args.pa_logfd = pmcstat_open_log(args.pa_inputpath,
991 PMCSTAT_OPEN_FOR_READ);
992 if ((args.pa_logparser = pmclog_open(args.pa_logfd)) == NULL)
993 err(EX_OSERR, "ERROR: Cannot create parser");
994 pmcstat_process_log(&args);
995 pmcstat_shutdown_logging(&args);
999 /* otherwise, we've been asked to collect data */
1002 "ERROR: Initialization of the pmc(3) library failed");
1004 if ((npmc = pmc_npmc(0)) < 0) /* assume all CPUs are identical */
1005 err(EX_OSERR, "ERROR: Cannot determine the number of PMCs "
1008 /* Allocate a kqueue */
1009 if ((pmcstat_kq = kqueue()) < 0)
1010 err(EX_OSERR, "ERROR: Cannot allocate kqueue");
1013 * Configure the specified log file or setup a default log
1014 * consumer via a pipe.
1016 if (args.pa_required & FLAG_HAS_OUTPUT_LOGFILE) {
1017 if (args.pa_outputpath)
1018 args.pa_logfd = pmcstat_open_log(args.pa_outputpath,
1019 PMCSTAT_OPEN_FOR_WRITE);
1022 * process the log on the fly by reading it in
1025 if (pipe(pipefd) < 0)
1026 err(EX_OSERR, "ERROR: pipe(2) failed");
1028 if (fcntl(pipefd[READPIPEFD], F_SETFL, O_NONBLOCK) < 0)
1029 err(EX_OSERR, "ERROR: fcntl(2) failed");
1031 EV_SET(&kev, pipefd[READPIPEFD], EVFILT_READ, EV_ADD,
1034 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1035 err(EX_OSERR, "ERROR: Cannot register kevent");
1037 args.pa_logfd = pipefd[WRITEPIPEFD];
1039 args.pa_flags |= (FLAG_HAS_PIPE | FLAG_DO_PRINT);
1040 args.pa_logparser = pmclog_open(pipefd[READPIPEFD]);
1043 if (pmc_configure_logfile(args.pa_logfd) < 0)
1044 err(EX_OSERR, "ERROR: Cannot configure log file");
1047 /* remember to check for driver errors if we are sampling or logging */
1048 check_driver_stats = (args.pa_flags & FLAG_HAS_SAMPLING_PMCS) ||
1049 (args.pa_flags & FLAG_HAS_OUTPUT_LOGFILE);
1055 STAILQ_FOREACH(ev, &args.pa_events, ev_next) {
1056 if (pmc_allocate(ev->ev_spec, ev->ev_mode,
1057 ev->ev_flags, ev->ev_cpu, &ev->ev_pmcid) < 0)
1058 err(EX_OSERR, "ERROR: Cannot allocate %s-mode pmc with "
1059 "specification \"%s\"",
1060 PMC_IS_SYSTEM_MODE(ev->ev_mode) ? "system" : "process",
1063 if (PMC_IS_SAMPLING_MODE(ev->ev_mode) &&
1064 pmc_set(ev->ev_pmcid, ev->ev_count) < 0)
1065 err(EX_OSERR, "ERROR: Cannot set sampling count "
1066 "for PMC \"%s\"", ev->ev_name);
1069 /* compute printout widths */
1070 STAILQ_FOREACH(ev, &args.pa_events, ev_next) {
1075 (void) pmc_width(ev->ev_pmcid, &counter_width);
1076 header_width = strlen(ev->ev_name) + 2; /* prefix '%c/' */
1077 display_width = (int) floor(counter_width / 3.32193) + 1;
1079 if (PMC_IS_SYSTEM_MODE(ev->ev_mode))
1080 header_width += 3; /* 2 digit CPU number + '/' */
1082 if (header_width > display_width) {
1083 ev->ev_fieldskip = 0;
1084 ev->ev_fieldwidth = header_width;
1086 ev->ev_fieldskip = display_width -
1088 ev->ev_fieldwidth = display_width;
1093 * If our output is being sent to a terminal, register a handler
1094 * for window size changes.
1097 if (isatty(fileno(args.pa_printfile))) {
1099 if (ioctl(fileno(args.pa_printfile), TIOCGWINSZ, &ws) < 0)
1100 err(EX_OSERR, "ERROR: Cannot determine window size");
1102 pmcstat_displayheight = ws.ws_row - 1;
1104 EV_SET(&kev, SIGWINCH, EVFILT_SIGNAL, EV_ADD, 0, 0, NULL);
1106 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1107 err(EX_OSERR, "ERROR: Cannot register kevent for "
1111 EV_SET(&kev, SIGINT, EVFILT_SIGNAL, EV_ADD, 0, 0, NULL);
1112 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1113 err(EX_OSERR, "ERROR: Cannot register kevent for SIGINT");
1115 EV_SET(&kev, SIGIO, EVFILT_SIGNAL, EV_ADD, 0, 0, NULL);
1116 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1117 err(EX_OSERR, "ERROR: Cannot register kevent for SIGIO");
1120 * An exec() failure of a forked child is signalled by the
1121 * child sending the parent a SIGCHLD. We don't register an
1122 * actual signal handler for SIGCHLD, but instead use our
1123 * kqueue to pick up the signal.
1125 EV_SET(&kev, SIGCHLD, EVFILT_SIGNAL, EV_ADD, 0, 0, NULL);
1126 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1127 err(EX_OSERR, "ERROR: Cannot register kevent for SIGCHLD");
1129 /* setup a timer if we have counting mode PMCs needing to be printed */
1130 if ((args.pa_flags & FLAG_HAS_COUNTING_PMCS) &&
1131 (args.pa_required & FLAG_HAS_OUTPUT_LOGFILE) == 0) {
1132 EV_SET(&kev, 0, EVFILT_TIMER, EV_ADD, 0,
1133 args.pa_interval * 1000, NULL);
1135 if (kevent(pmcstat_kq, &kev, 1, NULL, 0, NULL) < 0)
1136 err(EX_OSERR, "ERROR: Cannot register kevent for "
1140 /* attach PMCs to the target process, starting it if specified */
1141 if (args.pa_flags & FLAG_HAS_COMMANDLINE)
1142 pmcstat_create_process(&args);
1144 if (check_driver_stats && pmc_get_driver_stats(&ds_start) < 0)
1145 err(EX_OSERR, "ERROR: Cannot retrieve driver statistics");
1147 /* Attach process pmcs to the target process. */
1148 if (args.pa_flags & (FLAG_HAS_TARGET | FLAG_HAS_COMMANDLINE)) {
1149 if (SLIST_EMPTY(&args.pa_targets))
1150 errx(EX_DATAERR, "ERROR: No matching target "
1153 pmcstat_attach_pmcs(&args);
1156 kvm_close(pmcstat_kvm);
1161 /* start the pmcs */
1162 pmcstat_start_pmcs(&args);
1164 /* start the (commandline) process if needed */
1165 if (args.pa_flags & FLAG_HAS_COMMANDLINE)
1166 pmcstat_start_process();
1168 /* initialize logging if printing the configured log */
1169 if ((args.pa_flags & FLAG_DO_PRINT) &&
1170 (args.pa_flags & (FLAG_HAS_PIPE | FLAG_HAS_OUTPUT_LOGFILE)))
1171 pmcstat_initialize_logging(&args);
1173 /* Handle SIGINT using the kqueue loop */
1174 sa.sa_handler = SIG_IGN;
1176 (void) sigemptyset(&sa.sa_mask);
1178 if (sigaction(SIGINT, &sa, NULL) < 0)
1179 err(EX_OSERR, "ERROR: Cannot install signal handler");
1182 * loop till either the target process (if any) exits, or we
1183 * are killed by a SIGINT.
1185 runstate = PMCSTAT_RUNNING;
1188 if ((c = kevent(pmcstat_kq, NULL, 0, &kev, 1, NULL)) <= 0) {
1190 err(EX_OSERR, "ERROR: kevent failed");
1195 if (kev.flags & EV_ERROR)
1196 errc(EX_OSERR, kev.data, "ERROR: kevent failed");
1198 switch (kev.filter) {
1199 case EVFILT_PROC: /* target has exited */
1200 if (args.pa_flags & (FLAG_HAS_OUTPUT_LOGFILE |
1202 runstate = pmcstat_close_log(&args);
1204 runstate = PMCSTAT_FINISHED;
1208 case EVFILT_READ: /* log file data is present */
1209 runstate = pmcstat_process_log(&args);
1213 if (kev.ident == SIGCHLD) {
1215 * The child process sends us a
1216 * SIGCHLD if its exec() failed. We
1217 * wait for it to exit and then exit
1221 runstate = PMCSTAT_FINISHED;
1222 } else if (kev.ident == SIGIO) {
1224 * We get a SIGIO if a PMC loses all
1225 * of its targets, or if logfile
1226 * writes encounter an error.
1228 if (args.pa_flags & (FLAG_HAS_OUTPUT_LOGFILE |
1230 runstate = pmcstat_close_log(&args);
1232 (FLAG_DO_PRINT|FLAG_DO_ANALYSIS))
1233 pmcstat_process_log(&args);
1235 do_print = 1; /* print PMCs at exit */
1236 runstate = PMCSTAT_FINISHED;
1237 } else if (kev.ident == SIGINT) {
1238 /* Kill the child process if we started it */
1239 if (args.pa_flags & FLAG_HAS_COMMANDLINE)
1240 pmcstat_kill_process(&args);
1241 runstate = PMCSTAT_FINISHED;
1242 } else if (kev.ident == SIGWINCH) {
1243 if (ioctl(fileno(args.pa_printfile),
1244 TIOCGWINSZ, &ws) < 0)
1245 err(EX_OSERR, "ERROR: Cannot determine "
1247 pmcstat_displayheight = ws.ws_row - 1;
1253 case EVFILT_TIMER: /* print out counting PMCs */
1260 (args.pa_required & FLAG_HAS_OUTPUT_LOGFILE) == 0) {
1261 pmcstat_print_pmcs(&args);
1262 if (runstate == PMCSTAT_FINISHED && /* final newline */
1263 (args.pa_flags & FLAG_DO_PRINT) == 0)
1264 (void) fprintf(args.pa_printfile, "\n");
1268 } while (runstate != PMCSTAT_FINISHED);
1270 /* flush any pending log entries */
1271 if (args.pa_flags & (FLAG_HAS_OUTPUT_LOGFILE | FLAG_HAS_PIPE))
1272 pmc_flush_logfile();
1274 pmcstat_cleanup(&args);
1276 free(args.pa_kernel);
1278 /* check if the driver lost any samples or events */
1279 if (check_driver_stats) {
1280 if (pmc_get_driver_stats(&ds_end) < 0)
1281 err(EX_OSERR, "ERROR: Cannot retrieve driver "
1283 if (ds_start.pm_intr_bufferfull != ds_end.pm_intr_bufferfull &&
1284 args.pa_verbosity > 0)
1285 warnx("WARNING: some samples were dropped. Please "
1286 "consider tuning the \"kern.hwpmc.nsamples\" "
1288 if (ds_start.pm_buffer_requests_failed !=
1289 ds_end.pm_buffer_requests_failed &&
1290 args.pa_verbosity > 0)
1291 warnx("WARNING: some events were discarded. Please "
1292 "consider tuning the \"kern.hwpmc.nbuffers\" "