]> CyberLeo.Net >> Repos - FreeBSD/FreeBSD.git/blob - lib/libpmc/pmclog.c
add -n option to suppress clearing the build tree and add -DNO_CLEAN
[FreeBSD/FreeBSD.git] / lib / libpmc / pmclog.c
1 /*-
2  * Copyright (c) 2005-2007 Joseph Koshy
3  * Copyright (c) 2007 The FreeBSD Foundation
4  * All rights reserved.
5  *
6  * Portions of this software were developed by A. Joseph Koshy under
7  * sponsorship from the FreeBSD Foundation and Google, Inc.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  *
18  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
22  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28  * SUCH DAMAGE.
29  */
30
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
33
34 #include <sys/param.h>
35 #include <sys/pmc.h>
36 #include <sys/pmclog.h>
37
38 #include <assert.h>
39 #include <errno.h>
40 #include <pmc.h>
41 #include <pmclog.h>
42 #include <stddef.h>
43 #include <stdlib.h>
44 #include <string.h>
45 #include <strings.h>
46 #include <unistd.h>
47
48 #include <machine/pmc_mdep.h>
49
50 #define PMCLOG_BUFFER_SIZE                      4096
51
52 /*
53  * API NOTES
54  *
55  * The pmclog(3) API is oriented towards parsing an event stream in
56  * "realtime", i.e., from an data source that may or may not preserve
57  * record boundaries -- for example when the data source is elsewhere
58  * on a network.  The API allows data to be fed into the parser zero
59  * or more bytes at a time.
60  *
61  * The state for a log file parser is maintained in a 'struct
62  * pmclog_parse_state'.  Parser invocations are done by calling
63  * 'pmclog_read()'; this function will inform the caller when a
64  * complete event is parsed.
65  *
66  * The parser first assembles a complete log file event in an internal
67  * work area (see "ps_saved" below).  Once a complete log file event
68  * is read, the parser then parses it and converts it to an event
69  * descriptor usable by the client.  We could possibly avoid this two
70  * step process by directly parsing the input log to set fields in the
71  * event record.  However the parser's state machine would get
72  * insanely complicated, and this code is unlikely to be used in
73  * performance critical paths.
74  */
75
76 enum pmclog_parser_state {
77         PL_STATE_NEW_RECORD,            /* in-between records */
78         PL_STATE_EXPECTING_HEADER,      /* header being read */
79         PL_STATE_PARTIAL_RECORD,        /* header present but not the record */
80         PL_STATE_ERROR                  /* parsing error encountered */
81 };
82
83 struct pmclog_parse_state {
84         enum pmclog_parser_state ps_state;
85         enum pmc_cputype        ps_arch;        /* log file architecture */
86         uint32_t                ps_version;     /* hwpmc version */
87         int                     ps_initialized; /* whether initialized */
88         int                     ps_count;       /* count of records processed */
89         off_t                   ps_offset;      /* stream byte offset */
90         union pmclog_entry      ps_saved;       /* saved partial log entry */
91         int                     ps_svcount;     /* #bytes saved */
92         int                     ps_fd;          /* active fd or -1 */
93         char                    *ps_buffer;     /* scratch buffer if fd != -1 */
94         char                    *ps_data;       /* current parse pointer */
95         size_t                  ps_len;         /* length of buffered data */
96 };
97
98 #define PMCLOG_HEADER_FROM_SAVED_STATE(PS)                              \
99         (* ((uint32_t *) &(PS)->ps_saved))
100
101 #define PMCLOG_INITIALIZE_READER(LE,A)  LE = (uint32_t *) &(A)
102 #define PMCLOG_READ32(LE,V)             do {                            \
103                 (V)  = *(LE)++;                                         \
104         } while (0)
105 #define PMCLOG_READ64(LE,V)             do {                            \
106                 uint64_t _v;                                            \
107                 _v  = (uint64_t) *(LE)++;                               \
108                 _v |= ((uint64_t) *(LE)++) << 32;                       \
109                 (V) = _v;                                               \
110         } while (0)
111
112 #define PMCLOG_READSTRING(LE,DST,LEN)   strlcpy((DST), (char *) (LE), (LEN))
113
114 /*
115  * Assemble a log record from '*len' octets starting from address '*data'.
116  * Update 'data' and 'len' to reflect the number of bytes consumed.
117  *
118  * '*data' is potentially an unaligned address and '*len' octets may
119  * not be enough to complete a event record.
120  */
121
122 static enum pmclog_parser_state
123 pmclog_get_record(struct pmclog_parse_state *ps, char **data, ssize_t *len)
124 {
125         int avail, copylen, recordsize, used;
126         uint32_t h;
127         const int HEADERSIZE = sizeof(uint32_t);
128         char *src, *dst;
129
130         if ((avail = *len) <= 0)
131                 return (ps->ps_state = PL_STATE_ERROR);
132
133         src = *data;
134         h = used = 0;
135
136         if (ps->ps_state == PL_STATE_NEW_RECORD)
137                 ps->ps_svcount = 0;
138
139         dst = (char *) &ps->ps_saved + ps->ps_svcount;
140
141         switch (ps->ps_state) {
142         case PL_STATE_NEW_RECORD:
143
144                 /*
145                  * Transitions:
146                  *
147                  * Case A: avail < headersize
148                  *      -> 'expecting header'
149                  *
150                  * Case B: avail >= headersize
151                  *    B.1: avail < recordsize
152                  *         -> 'partial record'
153                  *    B.2: avail >= recordsize
154                  *         -> 'new record'
155                  */
156
157                 copylen = avail < HEADERSIZE ? avail : HEADERSIZE;
158                 bcopy(src, dst, copylen);
159                 ps->ps_svcount = used = copylen;
160
161                 if (copylen < HEADERSIZE) {
162                         ps->ps_state = PL_STATE_EXPECTING_HEADER;
163                         goto done;
164                 }
165
166                 src += copylen;
167                 dst += copylen;
168
169                 h = PMCLOG_HEADER_FROM_SAVED_STATE(ps);
170                 recordsize = PMCLOG_HEADER_TO_LENGTH(h);
171
172                 if (recordsize <= 0)
173                         goto error;
174
175                 if (recordsize <= avail) { /* full record available */
176                         bcopy(src, dst, recordsize - copylen);
177                         ps->ps_svcount = used = recordsize;
178                         goto done;
179                 }
180
181                 /* header + a partial record is available */
182                 bcopy(src, dst, avail - copylen);
183                 ps->ps_svcount = used = avail;
184                 ps->ps_state = PL_STATE_PARTIAL_RECORD;
185
186                 break;
187
188         case PL_STATE_EXPECTING_HEADER:
189
190                 /*
191                  * Transitions:
192                  *
193                  * Case C: avail+saved < headersize
194                  *      -> 'expecting header'
195                  *
196                  * Case D: avail+saved >= headersize
197                  *    D.1: avail+saved < recordsize
198                  *      -> 'partial record'
199                  *    D.2: avail+saved >= recordsize
200                  *      -> 'new record'
201                  *    (see PARTIAL_RECORD handling below)
202                  */
203
204                 if (avail + ps->ps_svcount < HEADERSIZE) {
205                         bcopy(src, dst, avail);
206                         ps->ps_svcount += avail;
207                         used = avail;
208                         break;
209                 }
210
211                 used = copylen = HEADERSIZE - ps->ps_svcount;
212                 bcopy(src, dst, copylen);
213                 src += copylen;
214                 dst += copylen;
215                 avail -= copylen;
216                 ps->ps_svcount += copylen;
217
218                 /*FALLTHROUGH*/
219
220         case PL_STATE_PARTIAL_RECORD:
221
222                 /*
223                  * Transitions:
224                  *
225                  * Case E: avail+saved < recordsize
226                  *      -> 'partial record'
227                  *
228                  * Case F: avail+saved >= recordsize
229                  *      -> 'new record'
230                  */
231
232                 h = PMCLOG_HEADER_FROM_SAVED_STATE(ps);
233                 recordsize = PMCLOG_HEADER_TO_LENGTH(h);
234
235                 if (recordsize <= 0)
236                         goto error;
237
238                 if (avail + ps->ps_svcount < recordsize) {
239                         copylen = avail;
240                         ps->ps_state = PL_STATE_PARTIAL_RECORD;
241                 } else {
242                         copylen = recordsize - ps->ps_svcount;
243                         ps->ps_state = PL_STATE_NEW_RECORD;
244                 }
245
246                 bcopy(src, dst, copylen);
247                 ps->ps_svcount += copylen;
248                 used += copylen;
249                 break;
250
251         default:
252                 goto error;
253         }
254
255  done:
256         *data += used;
257         *len  -= used;
258         return ps->ps_state;
259
260  error:
261         ps->ps_state = PL_STATE_ERROR;
262         return ps->ps_state;
263 }
264
265 /*
266  * Get an event from the stream pointed to by '*data'.  '*len'
267  * indicates the number of bytes available to parse.  Arguments
268  * '*data' and '*len' are updated to indicate the number of bytes
269  * consumed.
270  */
271
272 static int
273 pmclog_get_event(void *cookie, char **data, ssize_t *len,
274     struct pmclog_ev *ev)
275 {
276         int evlen, pathlen;
277         uint32_t h, *le, npc;
278         enum pmclog_parser_state e;
279         struct pmclog_parse_state *ps;
280
281         ps = (struct pmclog_parse_state *) cookie;
282
283         assert(ps->ps_state != PL_STATE_ERROR);
284
285         if ((e = pmclog_get_record(ps,data,len)) == PL_STATE_ERROR) {
286                 ev->pl_state = PMCLOG_ERROR;
287                 return -1;
288         }
289
290         if (e != PL_STATE_NEW_RECORD) {
291                 ev->pl_state = PMCLOG_REQUIRE_DATA;
292                 return -1;
293         }
294
295         PMCLOG_INITIALIZE_READER(le, ps->ps_saved);
296
297         PMCLOG_READ32(le,h);
298
299         if (!PMCLOG_HEADER_CHECK_MAGIC(h)) {
300                 ps->ps_state = PL_STATE_ERROR;
301                 ev->pl_state = PMCLOG_ERROR;
302                 return -1;
303         }
304
305         /* copy out the time stamp */
306         PMCLOG_READ32(le,ev->pl_ts.tv_sec);
307         PMCLOG_READ32(le,ev->pl_ts.tv_nsec);
308
309         evlen = PMCLOG_HEADER_TO_LENGTH(h);
310
311 #define PMCLOG_GET_PATHLEN(P,E,TYPE) do {                               \
312                 (P) = (E) - offsetof(struct TYPE, pl_pathname);         \
313                 if ((P) > PATH_MAX || (P) < 0)                          \
314                         goto error;                                     \
315         } while (0)
316
317 #define PMCLOG_GET_CALLCHAIN_SIZE(SZ,E) do {                            \
318                 (SZ) = ((E) - offsetof(struct pmclog_callchain, pl_pc)) \
319                         / sizeof(uintfptr_t);                           \
320         } while (0);
321
322         switch (ev->pl_type = PMCLOG_HEADER_TO_TYPE(h)) {
323         case PMCLOG_TYPE_CALLCHAIN:
324                 PMCLOG_READ32(le,ev->pl_u.pl_cc.pl_pid);
325                 PMCLOG_READ32(le,ev->pl_u.pl_cc.pl_pmcid);
326                 PMCLOG_READ32(le,ev->pl_u.pl_cc.pl_cpuflags);
327                 PMCLOG_GET_CALLCHAIN_SIZE(ev->pl_u.pl_cc.pl_npc,evlen);
328                 for (npc = 0; npc < ev->pl_u.pl_cc.pl_npc; npc++)
329                         PMCLOG_READADDR(le,ev->pl_u.pl_cc.pl_pc[npc]);
330                 for (;npc < PMC_CALLCHAIN_DEPTH_MAX; npc++)
331                         ev->pl_u.pl_cc.pl_pc[npc] = (uintfptr_t) 0;
332                 break;
333         case PMCLOG_TYPE_CLOSELOG:
334         case PMCLOG_TYPE_DROPNOTIFY:
335                 /* nothing to do */
336                 break;
337         case PMCLOG_TYPE_INITIALIZE:
338                 PMCLOG_READ32(le,ev->pl_u.pl_i.pl_version);
339                 PMCLOG_READ32(le,ev->pl_u.pl_i.pl_arch);
340                 ps->ps_version = ev->pl_u.pl_i.pl_version;
341                 ps->ps_arch = ev->pl_u.pl_i.pl_arch;
342                 ps->ps_initialized = 1;
343                 break;
344         case PMCLOG_TYPE_MAP_IN:
345                 PMCLOG_GET_PATHLEN(pathlen,evlen,pmclog_map_in);
346                 PMCLOG_READ32(le,ev->pl_u.pl_mi.pl_pid);
347                 PMCLOG_READADDR(le,ev->pl_u.pl_mi.pl_start);
348                 PMCLOG_READSTRING(le, ev->pl_u.pl_mi.pl_pathname, pathlen);
349                 break;
350         case PMCLOG_TYPE_MAP_OUT:
351                 PMCLOG_READ32(le,ev->pl_u.pl_mo.pl_pid);
352                 PMCLOG_READADDR(le,ev->pl_u.pl_mo.pl_start);
353                 PMCLOG_READADDR(le,ev->pl_u.pl_mo.pl_end);
354                 break;
355         case PMCLOG_TYPE_PCSAMPLE:
356                 PMCLOG_READ32(le,ev->pl_u.pl_s.pl_pid);
357                 PMCLOG_READADDR(le,ev->pl_u.pl_s.pl_pc);
358                 PMCLOG_READ32(le,ev->pl_u.pl_s.pl_pmcid);
359                 PMCLOG_READ32(le,ev->pl_u.pl_s.pl_usermode);
360                 break;
361         case PMCLOG_TYPE_PMCALLOCATE:
362                 PMCLOG_READ32(le,ev->pl_u.pl_a.pl_pmcid);
363                 PMCLOG_READ32(le,ev->pl_u.pl_a.pl_event);
364                 PMCLOG_READ32(le,ev->pl_u.pl_a.pl_flags);
365                 if ((ev->pl_u.pl_a.pl_evname =
366                     pmc_name_of_event(ev->pl_u.pl_a.pl_event)) == NULL)
367                         goto error;
368                 break;
369         case PMCLOG_TYPE_PMCATTACH:
370                 PMCLOG_GET_PATHLEN(pathlen,evlen,pmclog_pmcattach);
371                 PMCLOG_READ32(le,ev->pl_u.pl_t.pl_pmcid);
372                 PMCLOG_READ32(le,ev->pl_u.pl_t.pl_pid);
373                 PMCLOG_READSTRING(le,ev->pl_u.pl_t.pl_pathname,pathlen);
374                 break;
375         case PMCLOG_TYPE_PMCDETACH:
376                 PMCLOG_READ32(le,ev->pl_u.pl_d.pl_pmcid);
377                 PMCLOG_READ32(le,ev->pl_u.pl_d.pl_pid);
378                 break;
379         case PMCLOG_TYPE_PROCCSW:
380                 PMCLOG_READ32(le,ev->pl_u.pl_c.pl_pmcid);
381                 PMCLOG_READ64(le,ev->pl_u.pl_c.pl_value);
382                 PMCLOG_READ32(le,ev->pl_u.pl_c.pl_pid);
383                 break;
384         case PMCLOG_TYPE_PROCEXEC:
385                 PMCLOG_GET_PATHLEN(pathlen,evlen,pmclog_procexec);
386                 PMCLOG_READ32(le,ev->pl_u.pl_x.pl_pid);
387                 PMCLOG_READADDR(le,ev->pl_u.pl_x.pl_entryaddr);
388                 PMCLOG_READ32(le,ev->pl_u.pl_x.pl_pmcid);
389                 PMCLOG_READSTRING(le,ev->pl_u.pl_x.pl_pathname,pathlen);
390                 break;
391         case PMCLOG_TYPE_PROCEXIT:
392                 PMCLOG_READ32(le,ev->pl_u.pl_e.pl_pmcid);
393                 PMCLOG_READ64(le,ev->pl_u.pl_e.pl_value);
394                 PMCLOG_READ32(le,ev->pl_u.pl_e.pl_pid);
395                 break;
396         case PMCLOG_TYPE_PROCFORK:
397                 PMCLOG_READ32(le,ev->pl_u.pl_f.pl_oldpid);
398                 PMCLOG_READ32(le,ev->pl_u.pl_f.pl_newpid);
399                 break;
400         case PMCLOG_TYPE_SYSEXIT:
401                 PMCLOG_READ32(le,ev->pl_u.pl_se.pl_pid);
402                 break;
403         case PMCLOG_TYPE_USERDATA:
404                 PMCLOG_READ32(le,ev->pl_u.pl_u.pl_userdata);
405                 break;
406         default:        /* unknown record type */
407                 ps->ps_state = PL_STATE_ERROR;
408                 ev->pl_state = PMCLOG_ERROR;
409                 return (-1);
410         }
411
412         ev->pl_offset = (ps->ps_offset += evlen);
413         ev->pl_count  = (ps->ps_count += 1);
414         ev->pl_state = PMCLOG_OK;
415         return 0;
416
417  error:
418         ev->pl_state = PMCLOG_ERROR;
419         ps->ps_state = PL_STATE_ERROR;
420         return -1;
421 }
422
423 /*
424  * Extract and return the next event from the byte stream.
425  *
426  * Returns 0 and sets the event's state to PMCLOG_OK in case an event
427  * was successfully parsed.  Otherwise this function returns -1 and
428  * sets the event's state to one of PMCLOG_REQUIRE_DATA (if more data
429  * is needed) or PMCLOG_EOF (if an EOF was seen) or PMCLOG_ERROR if
430  * a parse error was encountered.
431  */
432
433 int
434 pmclog_read(void *cookie, struct pmclog_ev *ev)
435 {
436         int retval;
437         ssize_t nread;
438         struct pmclog_parse_state *ps;
439
440         ps = (struct pmclog_parse_state *) cookie;
441
442         if (ps->ps_state == PL_STATE_ERROR) {
443                 ev->pl_state = PMCLOG_ERROR;
444                 return -1;
445         }
446
447         /*
448          * If there isn't enough data left for a new event try and get
449          * more data.
450          */
451         if (ps->ps_len == 0) {
452                 ev->pl_state = PMCLOG_REQUIRE_DATA;
453
454                 /*
455                  * If we have a valid file descriptor to read from, attempt
456                  * to read from that.  This read may return with an error,
457                  * (which may be EAGAIN or other recoverable error), or
458                  * can return EOF.
459                  */
460                 if (ps->ps_fd != PMCLOG_FD_NONE) {
461                 refill:
462                         nread = read(ps->ps_fd, ps->ps_buffer,
463                             PMCLOG_BUFFER_SIZE);
464
465                         if (nread <= 0) {
466                                 if (nread == 0)
467                                         ev->pl_state = PMCLOG_EOF;
468                                 else if (errno != EAGAIN) /* not restartable */
469                                         ev->pl_state = PMCLOG_ERROR;
470                                 return -1;
471                         }
472
473                         ps->ps_len = nread;
474                         ps->ps_data = ps->ps_buffer;
475                 } else
476                         return -1;
477         }
478
479         assert(ps->ps_len > 0);
480
481
482          /* Retrieve one event from the byte stream. */
483         retval = pmclog_get_event(ps, &ps->ps_data, &ps->ps_len, ev);
484
485         /*
486          * If we need more data and we have a configured fd, try read
487          * from it.
488          */
489         if (retval < 0 && ev->pl_state == PMCLOG_REQUIRE_DATA &&
490             ps->ps_fd != -1) {
491                 assert(ps->ps_len == 0);
492                 goto refill;
493         }
494
495         return retval;
496 }
497
498 /*
499  * Feed data to a memory based parser.
500  *
501  * The memory area pointed to by 'data' needs to be valid till the
502  * next error return from pmclog_next_event().
503  */
504
505 int
506 pmclog_feed(void *cookie, char *data, int len)
507 {
508         struct pmclog_parse_state *ps;
509
510         ps = (struct pmclog_parse_state *) cookie;
511
512         if (len < 0 ||          /* invalid length */
513             ps->ps_buffer ||    /* called for a file parser */
514             ps->ps_len != 0)    /* unnecessary call */
515                 return -1;
516
517         ps->ps_data = data;
518         ps->ps_len  = len;
519
520         return 0;
521 }
522
523 /*
524  * Allocate and initialize parser state.
525  */
526
527 void *
528 pmclog_open(int fd)
529 {
530         struct pmclog_parse_state *ps;
531
532         if ((ps = (struct pmclog_parse_state *) malloc(sizeof(*ps))) == NULL)
533                 return NULL;
534
535         ps->ps_state = PL_STATE_NEW_RECORD;
536         ps->ps_arch = -1;
537         ps->ps_initialized = 0;
538         ps->ps_count = 0;
539         ps->ps_offset = (off_t) 0;
540         bzero(&ps->ps_saved, sizeof(ps->ps_saved));
541         ps->ps_svcount = 0;
542         ps->ps_fd    = fd;
543         ps->ps_data  = NULL;
544         ps->ps_buffer = NULL;
545         ps->ps_len   = 0;
546
547         /* allocate space for a work area */
548         if (ps->ps_fd != PMCLOG_FD_NONE) {
549                 if ((ps->ps_buffer = malloc(PMCLOG_BUFFER_SIZE)) == NULL)
550                         return NULL;
551         }
552
553         return ps;
554 }
555
556
557 /*
558  * Free up parser state.
559  */
560
561 void
562 pmclog_close(void *cookie)
563 {
564         struct pmclog_parse_state *ps;
565
566         ps = (struct pmclog_parse_state *) cookie;
567
568         if (ps->ps_buffer)
569                 free(ps->ps_buffer);
570
571         free(ps);
572 }