2 * Copyright (c) 2007 Pawel Jakub Dawidek <pjd@FreeBSD.org>
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
15 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 * Links to Illumos.org for more information on kstat function:
27 * [1] https://illumos.org/man/1M/kstat
28 * [2] https://illumos.org/man/9f/kstat_create
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
34 #include <sys/types.h>
35 #include <sys/param.h>
36 #include <sys/kernel.h>
37 #include <sys/systm.h>
38 #include <sys/malloc.h>
39 #include <sys/sysctl.h>
40 #include <sys/kstat.h>
/* Malloc type tag used for the kstat_t allocated in __kstat_create. */
43 static MALLOC_DEFINE(M_KSTAT, "kstat_data", "Kernel statistics");
/* Top-level kstat sysctl node; __kstat_create adds its nodes under _kstat. */
45 SYSCTL_ROOT_NODE(OID_AUTO, kstat, CTLFLAG_RW, 0, "Kernel statistics");
/*
 * Install the raw-output callbacks of a kstat.
 *
 * The three function pointers are stored in ksp->ks_raw_ops, where
 * kstat_sysctl_raw later picks them up:
 *   headers - called with the scratch buffer and its size before any record
 *   data    - called with the scratch buffer, its size and one record
 *   addr    - called with (ksp, n) to obtain a record; NULL ends the walk
 */
48 __kstat_set_raw_ops(kstat_t *ksp,
49 int (*headers)(char *buf, size_t size),
50 int (*data)(char *buf, size_t size, void *data),
51 void *(*addr)(kstat_t *ksp, loff_t index))
53 ksp->ks_raw_ops.headers = headers;
54 ksp->ks_raw_ops.data = data;
55 ksp->ks_raw_ops.addr = addr;
/*
 * Variant of __kstat_set_raw_ops whose header callback takes a
 * struct seq_file instead of a (buf, size) pair.
 *
 * The header callback is stored in ks_raw_ops.seq_headers (not in
 * ks_raw_ops.headers); data and addr are stored in the same slots as in
 * __kstat_set_raw_ops. kstat_sysctl_raw calls seq_headers with a seq_file
 * whose sf_buf / sf_size describe the scratch buffer.
 */
59 __kstat_set_seq_raw_ops(kstat_t *ksp,
60 int (*headers)(struct seq_file *f),
61 int (*data)(char *buf, size_t size, void *data),
62 void *(*addr)(kstat_t *ksp, loff_t index))
64 ksp->ks_raw_ops.seq_headers = headers;
65 ksp->ks_raw_ops.data = data;
66 ksp->ks_raw_ops.addr = addr;
/*
 * Default ks_update callback; __kstat_create installs it in every new kstat.
 * Requests with rw == KSTAT_WRITE are singled out.
 * NOTE(review): the statements taken on each branch are not visible in this
 * excerpt; presumably writes are refused and reads succeed - confirm.
 */
70 kstat_default_update(kstat_t *ksp, int rw)
74 if (rw == KSTAT_WRITE)
/*
 * Grow the raw scratch buffer of a kstat.
 *
 * The current ks_raw_buf is freed and a new buffer of twice the size,
 * capped at KSTAT_RAW_MAX, is allocated with M_WAITOK. The old contents
 * are not copied, so callers must regenerate their output.
 * kstat_sysctl_raw treats a zero return as resized, try again.
 */
81 kstat_resize_raw(kstat_t *ksp)
/*
 * Buffer is already at the cap.
 * NOTE(review): the statement taken here is not visible; presumably an
 * error is returned so that the caller stops retrying - confirm.
 */
83 if (ksp->ks_raw_bufsize == KSTAT_RAW_MAX)
86 free(ksp->ks_raw_buf, M_TEMP);
87 ksp->ks_raw_bufsize = MIN(ksp->ks_raw_bufsize * 2, KSTAT_RAW_MAX);
88 ksp->ks_raw_buf = malloc(ksp->ks_raw_bufsize, M_TEMP, M_WAITOK);
/*
 * Address callback used by kstat_sysctl_raw when ks_raw_ops.addr is unset.
 * The visible return hands back ksp->ks_data itself.
 * NOTE(review): any condition on n guarding this return is not visible in
 * this excerpt; presumably only the first index yields data - confirm.
 */
94 kstat_raw_default_addr(kstat_t *ksp, loff_t n)
97 return (ksp->ks_data);
/*
 * Sysctl handler for the numeric entries of a named kstat; it is the
 * handler registered by kstat_install_named for the INT32, UINT32, INT64,
 * UINT64, LONG and ULONG data types.
 *
 * Calls ks_update(KSTAT_READ) to refresh the statistics, copies the entry
 * value into a local and reports that copy through sysctl_handle_64().
 *
 * NOTE(review): the value is always read through value.ui64 and reported
 * as 64 bits, including for entries registered with a 32-bit or long
 * CTLTYPE - confirm this is intended.
 */
102 kstat_sysctl(SYSCTL_HANDLER_ARGS)
105 kstat_named_t *ksent;
/* Start at the first named entry of the kstat data area. */
108 ksent = ksp->ks_data;
109 /* Select the correct element */
111 /* Update the aggsums before reading */
112 (void) ksp->ks_update(ksp, KSTAT_READ);
113 val = ksent->value.ui64;
/* Hand sysctl the local snapshot rather than the live counter. */
115 return (sysctl_handle_64(oidp, &val, 0, req));
/*
 * Sysctl handler for KSTAT_DATA_STRING entries of a named kstat
 * (registered by kstat_install_named).
 *
 * Calls ks_update(KSTAT_READ), then fetches the string pointer and buffer
 * length of the entry with KSTAT_NAMED_STR_PTR / KSTAT_NAMED_STR_BUFLEN and
 * passes both to sysctl_handle_string().
 */
119 kstat_sysctl_string(SYSCTL_HANDLER_ARGS)
/* Start at the first named entry of the kstat data area. */
122 kstat_named_t *ksent = ksp->ks_data;
126 /* Select the correct element */
128 /* Update the aggsums before reading */
129 (void) ksp->ks_update(ksp, KSTAT_READ);
130 val = KSTAT_NAMED_STR_PTR(ksent);
131 len = KSTAT_NAMED_STR_BUFLEN(ksent);
134 return (sysctl_handle_string(oidp, val, len, req));
/*
 * Sysctl handler for I/O kstats (registered by kstat_install).
 *
 * Renders the kstat_io_t behind ks_data as one text line of twelve
 * left-aligned columns and sends it to the requester with SYSCTL_OUT().
 * Column order: nread, nwritten, reads, writes, wtime, wlentime,
 * wlastupdate, rtime, rlentime, rlastupdate, wcnt, rcnt.
 *
 * NOTE(review): the release of the sbuf and the final return are not
 * visible in this excerpt - confirm the sbuf is deleted on every path.
 */
138 kstat_sysctl_io(SYSCTL_HANDLER_ARGS)
142 kstat_io_t *kip = ksp->ks_data;
/* Auto-extending string buffer that collects the formatted line. */
145 sb = sbuf_new_auto();
148 /* Update the aggsums before reading */
149 (void) ksp->ks_update(ksp, KSTAT_READ);
151 /* though wlentime & friends are signed, they will never be negative */
153 "%-8llu %-8llu %-8u %-8u %-8llu %-8llu "
154 "%-8llu %-8llu %-8llu %-8llu %-8u %-8u\n",
155 kip->nread, kip->nwritten,
156 kip->reads, kip->writes,
157 kip->wtime, kip->wlentime, kip->wlastupdate,
158 kip->rtime, kip->rlentime, kip->rlastupdate,
159 kip->wcnt, kip->rcnt);
/* Finalise the sbuf so that sbuf_data() / sbuf_len() may be used. */
160 rc = sbuf_finish(sb);
162 rc = SYSCTL_OUT(req, sbuf_data(sb), sbuf_len(sb));
/*
 * Sysctl handler for raw kstats (registered by kstat_install).
 *
 * Output is collected in an sbuf and sent with SYSCTL_OUT():
 *  - if a headers or seq_headers callback is set, it formats a header into
 *    the per-kstat scratch buffer, which is then appended to the sbuf;
 *  - every record returned by the address callback is formatted by the
 *    data callback and appended; without a data callback the ks_data area
 *    is appended as a hex dump instead.
 *
 * The scratch buffer lives in ksp (ks_raw_buf / ks_raw_bufsize). It is
 * allocated, possibly grown by kstat_resize_raw, and freed again while
 * ks_lock is held.
 */
168 kstat_sysctl_raw(SYSCTL_HANDLER_ARGS)
173 void *(*addr_op)(kstat_t *ksp, loff_t index);
174 int n, has_header, rc = 0;
176 sb = sbuf_new_auto();
/* Use the registered address callback, else the built-in default. */
180 if (ksp->ks_raw_ops.addr)
181 addr_op = ksp->ks_raw_ops.addr;
183 addr_op = kstat_raw_default_addr;
/* Held until the scratch buffer has been freed again below. */
185 mutex_enter(ksp->ks_lock);
187 /* Update the aggsums before reading */
188 (void) ksp->ks_update(ksp, KSTAT_READ);
/* The scratch buffer starts at one page; callbacks may ask for more. */
190 ksp->ks_raw_bufsize = PAGE_SIZE;
191 ksp->ks_raw_buf = malloc(PAGE_SIZE, M_TEMP, M_WAITOK);
194 has_header = (ksp->ks_raw_ops.headers ||
195 ksp->ks_raw_ops.seq_headers);
/* The plain headers callback is tried first, then the seq_file variant. */
198 if (ksp->ks_raw_ops.headers) {
199 rc = ksp->ks_raw_ops.headers(
200 ksp->ks_raw_buf, ksp->ks_raw_bufsize);
201 } else if (ksp->ks_raw_ops.seq_headers) {
/* Describe the scratch buffer to the callback through a seq_file. */
204 f.sf_buf = ksp->ks_raw_buf;
205 f.sf_size = ksp->ks_raw_bufsize;
206 rc = ksp->ks_raw_ops.seq_headers(&f);
/*
 * ENOMEM from the callback means the scratch buffer was too small:
 * grow it and, if that worked (zero return), format the header again.
 */
209 if (rc == ENOMEM && !kstat_resize_raw(ksp))
210 goto restart_headers;
/* The header text is appended after a leading newline. */
212 sbuf_printf(sb, "\n%s", ksp->ks_raw_buf);
/* Walk the records until the address callback returns NULL. */
215 while ((data = addr_op(ksp, n)) != NULL) {
217 if (ksp->ks_raw_ops.data) {
218 rc = ksp->ks_raw_ops.data(ksp->ks_raw_buf,
219 ksp->ks_raw_bufsize, data);
/* Same grow-on-ENOMEM handling as for the header above. */
220 if (rc == ENOMEM && !kstat_resize_raw(ksp))
223 sbuf_printf(sb, "%s", ksp->ks_raw_buf);
/* No data callback: a single record is expected; dump ks_data as hex. */
226 ASSERT(ksp->ks_ndata == 1);
227 sbuf_hexdump(sb, ksp->ks_data,
228 ksp->ks_data_size, NULL, 0);
232 free(ksp->ks_raw_buf, M_TEMP);
233 mutex_exit(ksp->ks_lock);
/* Finalise the sbuf so that sbuf_data() / sbuf_len() may be used. */
235 rc = sbuf_finish(sb);
237 rc = SYSCTL_OUT(req, sbuf_data(sb), sbuf_len(sb));
/*
 * Allocate and initialise a kstat and create its sysctl parent nodes.
 *
 * Visible steps, in order:
 *  - a zeroed kstat_t is allocated with M_WAITOK; creation and snapshot
 *    times are taken from gethrtime(); name and class are copied, bounded
 *    by KSTAT_STRLEN; ks_update defaults to kstat_default_update;
 *  - ks_lock initially points at the embedded ks_private_lock;
 *  - ks_ndata and ks_data_size are derived from ks_type and ks_ndata
 *    (element count times the element size of the type; for one type the
 *    size is ks_ndata itself), with a panic for an unknown type;
 *  - after a test of KSTAT_FLAG_VIRTUAL the data area is obtained with
 *    kmem_zalloc(KM_SLEEP) (presumably only for non-virtual kstats -
 *    the branch structure is not visible, confirm);
 *  - module is copied into a local buffer and searched for a slash, which
 *    separates an optional pool name;
 *  - sysctl nodes kstat.<module>[.<pool>].<class> are created, plus a
 *    <name> node for KSTAT_TYPE_NAMED, and the deepest node is stored in
 *    ks_sysctl_root.
 *
 * NOTE(review): ksp comes from malloc(..., M_KSTAT, ...) but the failure
 * path after kmem_zalloc() releases it with kmem_free() - confirm that
 * this allocator pairing is valid.
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably the new kstat is returned, or NULL after a failed node
 * creation - confirm.
 */
243 __kstat_create(const char *module, int instance, const char *name,
244 const char *class, uchar_t ks_type, uint_t ks_ndata, uchar_t flags)
246 char buf[KSTAT_STRLEN];
247 struct sysctl_oid *root;
/* Callers are expected to pass instance 0. */
251 KASSERT(instance == 0, ("instance=%d", instance));
/* INTR and IO kstats are expected to carry exactly one data element. */
252 if ((ks_type == KSTAT_TYPE_INTR) || (ks_type == KSTAT_TYPE_IO))
253 ASSERT(ks_ndata == 1);
259 * Allocate the main structure. We don't need to keep a copy of
260 * module in here, because it is only used for sysctl node creation
261 * done in this function.
263 ksp = malloc(sizeof (*ksp), M_KSTAT, M_WAITOK|M_ZERO);
265 ksp->ks_crtime = gethrtime();
266 ksp->ks_snaptime = ksp->ks_crtime;
267 ksp->ks_instance = instance;
268 (void) strlcpy(ksp->ks_name, name, KSTAT_STRLEN);
269 (void) strlcpy(ksp->ks_class, class, KSTAT_STRLEN);
270 ksp->ks_type = ks_type;
271 ksp->ks_flags = flags;
272 ksp->ks_update = kstat_default_update;
274 mutex_init(&ksp->ks_private_lock, NULL, MUTEX_DEFAULT, NULL);
275 ksp->ks_lock = &ksp->ks_private_lock;
277 switch (ksp->ks_type) {
280 ksp->ks_data_size = ks_ndata;
282 case KSTAT_TYPE_NAMED:
283 ksp->ks_ndata = ks_ndata;
284 ksp->ks_data_size = ks_ndata * sizeof (kstat_named_t);
286 case KSTAT_TYPE_INTR:
287 ksp->ks_ndata = ks_ndata;
288 ksp->ks_data_size = ks_ndata * sizeof (kstat_intr_t);
291 ksp->ks_ndata = ks_ndata;
292 ksp->ks_data_size = ks_ndata * sizeof (kstat_io_t);
294 case KSTAT_TYPE_TIMER:
295 ksp->ks_ndata = ks_ndata;
296 ksp->ks_data_size = ks_ndata * sizeof (kstat_timer_t);
299 panic("Undefined kstat type %d\n", ksp->ks_type);
302 if (ksp->ks_flags & KSTAT_FLAG_VIRTUAL) {
305 ksp->ks_data = kmem_zalloc(ksp->ks_data_size, KM_SLEEP);
306 if (ksp->ks_data == NULL) {
307 kmem_free(ksp, sizeof (*ksp));
313 * Some kstats use a module name like "zfs/poolname" to distinguish a
314 * set of kstats belonging to a specific pool. Split on '/' to add an
315 * extra node for the pool name if needed.
317 (void) strlcpy(buf, module, KSTAT_STRLEN);
319 pool = strchr(module, '/');
324 * Create sysctl tree for those statistics:
326 * kstat.<module>[.<pool>].<class>.<name>
/* All nodes are tracked in the per-kstat sysctl context. */
328 sysctl_ctx_init(&ksp->ks_sysctl_ctx);
/* First level: the module node directly below the kstat root. */
329 root = SYSCTL_ADD_NODE(&ksp->ks_sysctl_ctx,
330 SYSCTL_STATIC_CHILDREN(_kstat), OID_AUTO, module, CTLFLAG_RW, 0,
/* Failure path: report it and release the nodes created so far. */
333 printf("%s: Cannot create kstat.%s tree!\n", __func__, module);
334 sysctl_ctx_free(&ksp->ks_sysctl_ctx);
/* Pool level, below the module node. */
339 root = SYSCTL_ADD_NODE(&ksp->ks_sysctl_ctx,
340 SYSCTL_CHILDREN(root), OID_AUTO, pool, CTLFLAG_RW, 0, "");
342 printf("%s: Cannot create kstat.%s.%s tree!\n",
343 __func__, module, pool);
344 sysctl_ctx_free(&ksp->ks_sysctl_ctx);
/* Class level, below the node created last. */
349 root = SYSCTL_ADD_NODE(&ksp->ks_sysctl_ctx, SYSCTL_CHILDREN(root),
350 OID_AUTO, class, CTLFLAG_RW, 0, "");
/* The message comes in two forms, with and without the pool component. */
353 printf("%s: Cannot create kstat.%s.%s.%s tree!\n",
354 __func__, module, pool, class);
356 printf("%s: Cannot create kstat.%s.%s tree!\n",
357 __func__, module, class);
358 sysctl_ctx_free(&ksp->ks_sysctl_ctx);
/* Named kstats get one more node, <name>, to hold their entries. */
362 if (ksp->ks_type == KSTAT_TYPE_NAMED) {
363 root = SYSCTL_ADD_NODE(&ksp->ks_sysctl_ctx,
364 SYSCTL_CHILDREN(root),
365 OID_AUTO, name, CTLFLAG_RW, 0, "");
368 printf("%s: Cannot create kstat.%s.%s.%s.%s "
369 "tree!\n", __func__, module, pool, class,
372 printf("%s: Cannot create kstat.%s.%s.%s "
373 "tree!\n", __func__, module, class, name);
374 sysctl_ctx_free(&ksp->ks_sysctl_ctx);
/* Remember the deepest node; the install functions attach below it. */
380 ksp->ks_sysctl_root = root;
/*
 * Publish every entry of a named kstat as a read-only sysctl OID below
 * ks_sysctl_root.
 *
 * Entries are visited in index order. Numeric types are served by
 * kstat_sysctl and strings by kstat_sysctl_string; each OID is registered
 * with ksp and the entry index i, and with the entry name as description.
 * An entry whose data_type is 0 does not update typelast / namelast, so
 * the values of the preceding typed entry stay in effect for it.
 * An unknown type panics.
 */
386 kstat_install_named(kstat_t *ksp)
388 kstat_named_t *ksent;
392 ksent = ksp->ks_data;
/* Only virtual kstats may reach this point without a data area. */
394 VERIFY((ksp->ks_flags & KSTAT_FLAG_VIRTUAL) || ksent != NULL);
399 for (int i = 0; i < ksp->ks_ndata; i++, ksent++) {
/* Remember type and name of the most recent typed entry. */
400 if (ksent->data_type != 0) {
401 typelast = ksent->data_type;
402 namelast = ksent->name;
405 case KSTAT_DATA_CHAR:
406 /* Not Implemented */
408 case KSTAT_DATA_INT32:
409 SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
410 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
412 CTLTYPE_S32 | CTLFLAG_RD | CTLFLAG_MPSAFE,
413 ksp, i, kstat_sysctl, "I", namelast);
415 case KSTAT_DATA_UINT32:
416 SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
417 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
419 CTLTYPE_U32 | CTLFLAG_RD | CTLFLAG_MPSAFE,
420 ksp, i, kstat_sysctl, "IU", namelast);
422 case KSTAT_DATA_INT64:
423 SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
424 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
426 CTLTYPE_S64 | CTLFLAG_RD | CTLFLAG_MPSAFE,
427 ksp, i, kstat_sysctl, "Q", namelast);
429 case KSTAT_DATA_UINT64:
430 SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
431 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
433 CTLTYPE_U64 | CTLFLAG_RD | CTLFLAG_MPSAFE,
434 ksp, i, kstat_sysctl, "QU", namelast);
436 case KSTAT_DATA_LONG:
437 SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
438 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
440 CTLTYPE_LONG | CTLFLAG_RD | CTLFLAG_MPSAFE,
441 ksp, i, kstat_sysctl, "L", namelast);
443 case KSTAT_DATA_ULONG:
444 SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
445 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
447 CTLTYPE_ULONG | CTLFLAG_RD | CTLFLAG_MPSAFE,
448 ksp, i, kstat_sysctl, "LU", namelast);
/* Strings are the only type served by kstat_sysctl_string. */
450 case KSTAT_DATA_STRING:
451 SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
452 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
454 CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_MPSAFE,
455 ksp, i, kstat_sysctl_string, "A", namelast);
458 panic("unsupported type: %d", typelast);
/*
 * Make a kstat created by __kstat_create visible through sysctl.
 *
 * Named kstats are delegated to kstat_install_named. For the other
 * visible registrations a single read-only OID named after ks_name is
 * added below ks_sysctl_root:
 *  - kstat_sysctl_raw as a string OID when a raw data callback is set,
 *    otherwise as an opaque OID;
 *  - kstat_sysctl_io as a string OID.
 * The new OID must not be NULL and then replaces ks_sysctl_root.
 * The panic reports a kstat type that is not supported here.
 */
464 kstat_install(kstat_t *ksp)
466 struct sysctl_oid *root;
/* An element count of UINT32_MAX is only accepted for raw kstats. */
468 if (ksp->ks_ndata == UINT32_MAX)
469 VERIFY(ksp->ks_type == KSTAT_TYPE_RAW);
471 switch (ksp->ks_type) {
472 case KSTAT_TYPE_NAMED:
473 return (kstat_install_named(ksp));
/* With a data callback the raw output is text, hence a string OID. */
475 if (ksp->ks_raw_ops.data) {
476 root = SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
477 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
478 OID_AUTO, ksp->ks_name,
479 CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_MPSAFE,
480 ksp, 0, kstat_sysctl_raw, "A", ksp->ks_name);
/* Same handler, registered as an opaque OID. */
482 root = SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
483 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
484 OID_AUTO, ksp->ks_name,
485 CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_MPSAFE,
486 ksp, 0, kstat_sysctl_raw, "", ksp->ks_name);
/* I/O statistics are rendered as one text line by kstat_sysctl_io. */
490 root = SYSCTL_ADD_PROC(&ksp->ks_sysctl_ctx,
491 SYSCTL_CHILDREN(ksp->ks_sysctl_root),
492 OID_AUTO, ksp->ks_name,
493 CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_MPSAFE,
494 ksp, 0, kstat_sysctl_io, "A", ksp->ks_name);
/* No sysctl registration is visible for these two types. */
496 case KSTAT_TYPE_TIMER:
497 case KSTAT_TYPE_INTR:
499 panic("unsupported kstat type %d\n", ksp->ks_type);
501 VERIFY(root != NULL);
/* From here on ks_sysctl_root refers to the OID of this kstat. */
502 ksp->ks_sysctl_root = root;
/*
 * Tear down a kstat: release every sysctl node tracked in its sysctl
 * context and destroy the embedded private lock.
 * NOTE(review): release of ks_data and of the kstat_t itself is not
 * visible in this excerpt - confirm it happens in the omitted lines.
 */
506 kstat_delete(kstat_t *ksp)
509 sysctl_ctx_free(&ksp->ks_sysctl_ctx);
511 mutex_destroy(&ksp->ks_private_lock);
/*
 * Wait-queue accounting for a request entering the wait queue.
 *
 * The time since the previous wait-queue update (new - wlastupdate) is
 * added to wtime, and that time multiplied by wcnt is added to wlentime.
 * NOTE(review): how new and wcnt are obtained, the update of the queue
 * counter and any condition around the two accumulations are not visible
 * in this excerpt - confirm against the full function.
 */
516 kstat_waitq_enter(kstat_io_t *kiop)
522 delta = new - kiop->wlastupdate;
523 kiop->wlastupdate = new;
526 kiop->wlentime += delta * wcnt;
527 kiop->wtime += delta;
/*
 * Wait-queue accounting for a request leaving the wait queue.
 *
 * The time since the previous wait-queue update (new - wlastupdate) is
 * added to wtime, and that time multiplied by wcnt is added to wlentime.
 * NOTE(review): how new and wcnt are obtained and how the queue counter
 * is updated are not visible in this excerpt - confirm against the full
 * function.
 */
532 kstat_waitq_exit(kstat_io_t *kiop)
538 delta = new - kiop->wlastupdate;
539 kiop->wlastupdate = new;
/* Leaving an empty queue would be a caller bug. */
541 ASSERT((int)wcnt > 0);
542 kiop->wlentime += delta * wcnt;
543 kiop->wtime += delta;
/*
 * Run-queue accounting for a request entering the run queue.
 *
 * The time since the previous run-queue update (new - rlastupdate) is
 * added to rtime, and that time multiplied by rcnt is added to rlentime.
 * NOTE(review): how new and rcnt are obtained, the update of the queue
 * counter and any condition around the two accumulations are not visible
 * in this excerpt - confirm against the full function.
 */
547 kstat_runq_enter(kstat_io_t *kiop)
553 delta = new - kiop->rlastupdate;
554 kiop->rlastupdate = new;
557 kiop->rlentime += delta * rcnt;
558 kiop->rtime += delta;
/*
 * Run-queue accounting for a request leaving the run queue.
 *
 * The time since the previous run-queue update (new - rlastupdate) is
 * added to rtime, and that time multiplied by rcnt is added to rlentime.
 * NOTE(review): how new and rcnt are obtained and how the queue counter
 * is updated are not visible in this excerpt - confirm against the full
 * function.
 */
563 kstat_runq_exit(kstat_io_t *kiop)
569 delta = new - kiop->rlastupdate;
570 kiop->rlastupdate = new;
/* Leaving an empty queue would be a caller bug. */
572 ASSERT((int)rcnt > 0);
573 kiop->rlentime += delta * rcnt;
574 kiop->rtime += delta;