2 * collectd - src/processes.c
3 * Copyright (C) 2005 Lyonel Vincent
4 * Copyright (C) 2006-2017 Florian octo Forster
5 * Copyright (C) 2008 Oleg King
6 * Copyright (C) 2009 Sebastian Harl
7 * Copyright (C) 2009 Andrés J. Díaz
8 * Copyright (C) 2009 Manuel Sanmartin
9 * Copyright (C) 2010 Clément Stenac
10 * Copyright (C) 2012 Cosmin Ioiart
12 * This program is free software; you can redistribute it and/or modify it
13 * under the terms of the GNU General Public License as published by the
14 * Free Software Foundation; either version 2 of the License, or (at your
15 * option) any later version.
17 * This program is distributed in the hope that it will be useful, but
18 * WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20 * General Public License for more details.
22 * You should have received a copy of the GNU General Public License along
23 * with this program; if not, write to the Free Software Foundation, Inc.,
24 * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
27 * Lyonel Vincent <lyonel at ezix.org>
28 * Florian octo Forster <octo at collectd.org>
29 * Oleg King <king2 at kaluga.ru>
30 * Sebastian Harl <sh at tokkee.org>
31 * Andrés J. Díaz <ajdiaz at connectical.com>
33 * Clément Stenac <clement.stenac at diwi.org>
34 * Cosmin Ioiart <cioiart at gmail.com>
35 * Pavel Rochnyack <pavel2000 at ngs.ru>
36 * Wilfried Goesgens <dothebart at citadel.org>
45 #include "utils_complain.h"
46 #include "utils_taskstats.h"
49 /* Include header files for the mach system, if they exist.. */
51 #if HAVE_MACH_MACH_INIT_H
52 #include <mach/mach_init.h>
54 #if HAVE_MACH_HOST_PRIV_H
55 #include <mach/host_priv.h>
57 #if HAVE_MACH_MACH_ERROR_H
58 #include <mach/mach_error.h>
60 #if HAVE_MACH_MACH_HOST_H
61 #include <mach/mach_host.h>
63 #if HAVE_MACH_MACH_PORT_H
64 #include <mach/mach_port.h>
66 #if HAVE_MACH_MACH_TYPES_H
67 #include <mach/mach_types.h>
69 #if HAVE_MACH_MESSAGE_H
70 #include <mach/message.h>
72 #if HAVE_MACH_PROCESSOR_SET_H
73 #include <mach/processor_set.h>
76 #include <mach/task.h>
78 #if HAVE_MACH_THREAD_ACT_H
79 #include <mach/thread_act.h>
81 #if HAVE_MACH_VM_REGION_H
82 #include <mach/vm_region.h>
84 #if HAVE_MACH_VM_MAP_H
85 #include <mach/vm_map.h>
87 #if HAVE_MACH_VM_PROT_H
88 #include <mach/vm_prot.h>
91 #include <sys/sysctl.h>
93 /* #endif HAVE_THREAD_INFO */
96 #if HAVE_LINUX_CONFIG_H
97 #include <linux/config.h>
100 #define CONFIG_HZ 100
102 /* #endif KERNEL_LINUX */
104 #elif HAVE_LIBKVM_GETPROCS && \
105 (HAVE_STRUCT_KINFO_PROC_FREEBSD || HAVE_STRUCT_KINFO_PROC_OPENBSD)
107 #include <sys/param.h>
108 #include <sys/proc.h>
109 #include <sys/sysctl.h>
110 #include <sys/user.h>
111 /* #endif HAVE_LIBKVM_GETPROCS && (HAVE_STRUCT_KINFO_PROC_FREEBSD ||
112 * HAVE_STRUCT_KINFO_PROC_OPENBSD) */
114 #elif HAVE_PROCINFO_H
115 #include <procinfo.h>
116 #include <sys/types.h>
118 #define MAXPROCENTRY 32
119 #define MAXTHRDENTRY 16
120 #define MAXARGLN 1024
121 /* #endif HAVE_PROCINFO_H */
124 /* Hack: Avoid #error when building a 32-bit binary with
125 * _FILE_OFFSET_BITS=64. There is a reason for this #error, as one
126 * of the structures in <sys/procfs.h> uses an off_t, but that
127 * isn't relevant to our usage of procfs. */
128 #if !defined(_LP64) && _FILE_OFFSET_BITS == 64
130 #undef _FILE_OFFSET_BITS
136 #define _FILE_OFFSET_BITS 64
141 #include <sys/user.h>
147 /* #endif KERNEL_SOLARIS */
150 #error "No applicable input method."
161 #ifdef HAVE_SYS_CAPABILITY_H
162 #include <sys/capability.h>
165 #ifndef CMDLINE_BUFFER_SIZE
166 #if defined(ARG_MAX) && (ARG_MAX < 4096)
167 #define CMDLINE_BUFFER_SIZE ARG_MAX
169 #define CMDLINE_BUFFER_SIZE 4096
173 #define PROCSTAT_NAME_LEN 256
/* One process as sampled during a single read pass.
 * NOTE(review): this listing omits several members and the closing line of
 * the struct; only the visible members are described here. */
174 typedef struct process_entry_s {
/* Process name; ps_read_process() fills it from the text between the
 * parentheses in /proc/<pid>/stat. */
176 char name[PROCSTAT_NAME_LEN];
/* Counts and sizes; ps_list_add() adds each of them to the same-named
 * member of the matching procstat_t. */
178 unsigned long num_proc;
179 unsigned long num_lwp;
180 unsigned long num_fd;
181 unsigned long num_maps;
182 unsigned long vmem_size;
183 unsigned long vmem_rss;
184 unsigned long vmem_data;
185 unsigned long vmem_code;
186 unsigned long stack_size;
/* Dispatched by ps_submit_proc_list() as the two values of "ps_pagefaults". */
188 derive_t vmem_minflt_counter;
189 derive_t vmem_majflt_counter;
/* Dispatched as "ps_cputime"; ps_read_process() converts jiffies to
 * microseconds before storing them. */
191 derive_t cpu_user_counter;
192 derive_t cpu_system_counter;
/* Context switch totals; -1 means "no data" (see ps_read_process()). */
203 derive_t cswitch_vol;
204 derive_t cswitch_invol;
207 #if HAVE_LIBTASKSTATS
/* Per-process state kept in the `instances' list of a procstat_t.
 * ps_list_add() looks an entry up by id and passes the members below to
 * ps_update_counter() / ps_update_delay() as the "previous" values.
 * NOTE(review): this listing omits several members (e.g. the id and the io_*
 * counters used in ps_list_add()) and the closing line of the struct. */
217 typedef struct procstat_entry_s {
221 derive_t vmem_minflt_counter;
222 derive_t vmem_majflt_counter;
224 derive_t cpu_user_counter;
225 derive_t cpu_system_counter;
235 derive_t cswitch_vol;
236 derive_t cswitch_invol;
238 #if HAVE_LIBTASKSTATS
/* State handed to value_to_rate() by ps_update_delay_one(). */
239 value_to_rate_state_t delay_cpu;
240 value_to_rate_state_t delay_blkio;
241 value_to_rate_state_t delay_swapin;
242 value_to_rate_state_t delay_freepages;
/* Next entry in the singly linked `instances' list. */
245 struct procstat_entry_s *next;
/* One configured `Process' / `ProcessMatch' group: the aggregated values that
 * ps_submit_proc_list() dispatches, plus per-group reporting switches.
 * NOTE(review): this listing omits several members (e.g. the compiled regex
 * `re', the io_* counters, delay_cpu/delay_blkio, report_fd_num,
 * report_delay) and the closing line of the struct. */
248 typedef struct procstat {
/* Group name; used as the plugin instance when dispatching. */
249 char name[PROCSTAT_NAME_LEN];
/* Sums over all matching processes, accumulated by ps_list_add(). */
254 unsigned long num_proc;
255 unsigned long num_lwp;
256 unsigned long num_fd;
257 unsigned long num_maps;
258 unsigned long vmem_size;
259 unsigned long vmem_rss;
260 unsigned long vmem_data;
261 unsigned long vmem_code;
262 unsigned long stack_size;
264 derive_t vmem_minflt_counter;
265 derive_t vmem_majflt_counter;
267 derive_t cpu_user_counter;
268 derive_t cpu_system_counter;
/* -1 means "no data"; ps_submit_proc_list() skips dispatching in that case. */
278 derive_t cswitch_vol;
279 derive_t cswitch_invol;
281 /* Linux Delay Accounting. Unit is ns/s. */
284 gauge_t delay_swapin;
285 gauge_t delay_freepages;
/* Per-group copies of the global options; ps_list_register() initialises them
 * from the globals and ps_tune_instance() may override them. */
288 bool report_maps_num;
289 bool report_ctx_switch;
/* Next configured group, and the list of per-process entries of this group. */
292 struct procstat *next;
293 struct procstat_entry_s *instances;
/* File-scope state.
 * NOTE(review): the preprocessor conditionals that select between the
 * platform-specific declarations below are only partly visible in this
 * listing. */
/* Head of the list of configured process groups. */
296 static procstat_t *list_head_g = NULL;
298 static bool want_init = true;
/* Global defaults set by ps_config(); copied into each procstat_t by
 * ps_list_register(). */
299 static bool report_ctx_switch;
300 static bool report_fd_num;
301 static bool report_maps_num;
302 static bool report_delay;
/* Mach ports and processor-set list; initialised in ps_init(). */
305 static mach_port_t port_host_self;
306 static mach_port_t port_task_self;
308 static processor_set_name_array_t pset_list;
309 static mach_msg_type_number_t pset_list_len;
310 /* #endif HAVE_THREAD_INFO */
/* Page size from sysconf(_SC_PAGESIZE); set in ps_init() and used by
 * ps_read_process() to scale vmem_rss. */
313 static long pagesize_g;
314 static void ps_fill_details(const procstat_t *ps, process_entry_t *entry);
315 /* #endif KERNEL_LINUX */
317 #elif HAVE_LIBKVM_GETPROCS && \
318 (HAVE_STRUCT_KINFO_PROC_FREEBSD || HAVE_STRUCT_KINFO_PROC_OPENBSD)
320 /* #endif HAVE_LIBKVM_GETPROCS && (HAVE_STRUCT_KINFO_PROC_FREEBSD ||
321 * HAVE_STRUCT_KINFO_PROC_OPENBSD) */
323 #elif HAVE_PROCINFO_H
324 static struct procentry64 procentry[MAXPROCENTRY];
325 static struct thrdentry64 thrdentry[MAXTHRDENTRY];
/* Prototypes declared locally when _AIXVERSION_610 is not defined. */
328 #ifndef _AIXVERSION_610
329 int getprocs64(void *procsinfo, int sizproc, void *fdsinfo, int sizfd,
330 pid_t *index, int count);
331 int getthrds64(pid_t, void *, int, tid64_t *, int);
333 int getargs(void *processBuffer, int bufferLen, char *argsBuffer, int argsLen);
334 #endif /* HAVE_PROCINFO_H */
336 #if HAVE_LIBTASKSTATS
/* Created lazily in ps_init(); ps_delay() checks it for NULL before use. */
337 static ts_t *taskstats_handle = NULL;
340 /* Register a process name from the config in list_head_g.
341 * list_head_g is a linked list of 'procstat_t' structs holding the
342 * names of the processes we want to watch. */
/* Allocates a zeroed procstat_t, copies `name' into it (bounded by
 * sizeof(new->name)), marks the context-switch counters as "no data" (-1) and
 * seeds the report_* switches from the global defaults.
 *
 * name:   group name; also compared against existing entries to warn about
 *         duplicates.
 * regexp: optional; when non-NULL it is compiled with
 *         REG_EXTENDED | REG_NOSUB, or an error is logged if regex support
 *         was disabled at compile time.
 *
 * Callers (ps_config()) check the result against NULL.
 * NOTE(review): this listing omits the local declarations, all return
 * statements, the error-path cleanup and the list-append code, so the exact
 * failure behaviour cannot be confirmed from here. */
343 static procstat_t *ps_list_register(const char *name, const char *regexp) {
348 new = calloc(1, sizeof(*new));
350 ERROR("processes plugin: ps_list_register: calloc failed.");
353 sstrncpy(new->name, name, sizeof(new->name));
/* -1 means "no data yet". */
361 new->cswitch_vol = -1;
362 new->cswitch_invol = -1;
/* Start from the global defaults; ps_tune_instance() may override them. */
364 new->report_fd_num = report_fd_num;
365 new->report_maps_num = report_maps_num;
366 new->report_ctx_switch = report_ctx_switch;
367 new->report_delay = report_delay;
370 if (regexp != NULL) {
371 DEBUG("ProcessMatch: adding \"%s\" as criteria to process %s.", regexp,
373 new->re = malloc(sizeof(*new->re));
374 if (new->re == NULL) {
375 ERROR("processes plugin: ps_list_register: malloc failed.");
380 status = regcomp(new->re, regexp, REG_EXTENDED | REG_NOSUB);
382 DEBUG("ProcessMatch: compiling the regular expression \"%s\" failed.",
390 if (regexp != NULL) {
391 ERROR("processes plugin: ps_list_register: "
392 "Regular expression \"%s\" found in config "
393 "file, but support for regular expressions "
394 "has been disabled at compile time.",
401 for (ptr = list_head_g; ptr != NULL; ptr = ptr->next) {
402 if (strcmp(ptr->name, name) == 0) {
403 WARNING("processes plugin: You have configured more "
404 "than one `Process' or "
405 "`ProcessMatch' with the same name. "
406 "All but the first setting will be "
415 if (ptr->next == NULL)
425 } /* void ps_list_register */
427 /* try to match name against entry, returns 1 if success */
/* Decides whether a process belongs to group `ps'.
 * When ps->re is set, a string is matched with regexec(); otherwise `name' is
 * compared to ps->name with strcmp(). ps_list_add() treats a return value of
 * 0 as "no match".
 * NOTE(review): this listing omits the third parameter line, the selection of
 * `str' (presumably cmdline with a fallback to name - confirm) and all return
 * statements. */
428 static int ps_list_match(const char *name, const char *cmdline,
431 if (ps->re != NULL) {
436 if ((str == NULL) || (str[0] == 0))
441 status = regexec(ps->re, str,
449 if (strcmp(ps->name, name) == 0)
453 } /* int ps_list_match */
/* Adds the increase of a per-process counter to its group counter.
 *
 * group_counter: running total of the group; -1 is tested as a "no data"
 *                marker before the delta is added.
 * curr_counter:  value remembered from the previous pass; overwritten with
 *                new_counter.
 * new_counter:   value read in this pass.
 *
 * If new_counter is smaller than the remembered value, the delta is computed
 * as if the counter had wrapped at ULONG_MAX.
 * NOTE(review): derive_t values are combined in `unsigned long' arithmetic
 * here; where unsigned long is narrower than derive_t the wrap handling looks
 * questionable - confirm.
 * NOTE(review): this listing omits the condition guarding the first store
 * below, the `else', the reset of *group_counter and the closing brace. */
455 static void ps_update_counter(derive_t *group_counter, derive_t *curr_counter,
456 derive_t new_counter) {
457 unsigned long curr_value;
460 *curr_counter = new_counter;
464 if (new_counter < *curr_counter)
465 curr_value = new_counter + (ULONG_MAX - *curr_counter);
467 curr_value = new_counter - *curr_counter;
469 if (*group_counter == -1)
472 *curr_counter = new_counter;
473 *group_counter += curr_value;
476 #if HAVE_LIBTASKSTATS
/* Converts one cumulative delay counter into a rate with value_to_rate() and
 * adds it to *out_rate_sum.
 *
 * out_rate_sum: group-wide sum; a NaN value is replaced by the rate instead
 *               of being added to.
 * state:        per-process value_to_rate() state.
 * cnt:          cumulative counter value, passed as a DS_TYPE_COUNTER value.
 *
 * A non-zero status or a NaN rate takes a separate branch whose body is not
 * visible (presumably an early return - confirm).
 * NOTE(review): this listing omits the last parameter line (the timestamp
 * `t'), the declaration of `rate' and several braces. */
477 static void ps_update_delay_one(gauge_t *out_rate_sum,
478 value_to_rate_state_t *state, uint64_t cnt,
481 int status = value_to_rate(&rate, (value_t){.counter = (counter_t)cnt},
482 DS_TYPE_COUNTER, t, state);
483 if ((status != 0) || isnan(rate)) {
487 if (isnan(*out_rate_sum)) {
488 *out_rate_sum = rate;
490 *out_rate_sum += rate;
/* Feeds the four delay accounting counters of `curr' (cpu, blkio, swapin,
 * freepages) through ps_update_delay_one(), using the matching rate state in
 * `prev' and accumulating into `out'. All four calls share one timestamp
 * taken with cdtime().
 * NOTE(review): one argument line of the first call and the closing brace are
 * missing from this listing. */
494 static void ps_update_delay(procstat_t *out, procstat_entry_t *prev,
495 process_entry_t *curr) {
496 cdtime_t now = cdtime();
498 ps_update_delay_one(&out->delay_cpu, &prev->delay_cpu, curr->delay.cpu_ns,
500 ps_update_delay_one(&out->delay_blkio, &prev->delay_blkio,
501 curr->delay.blkio_ns, now);
502 ps_update_delay_one(&out->delay_swapin, &prev->delay_swapin,
503 curr->delay.swapin_ns, now);
504 ps_update_delay_one(&out->delay_freepages, &prev->delay_freepages,
505 curr->delay.freepages_ns, now);
509 /* add process entry to 'instances' of process 'name' (or refresh it) */
/* For every configured group that matches the process (ps_list_match()),
 * fills in optional details (ps_fill_details()), finds or creates the
 * per-process entry with the same id, adds the gauge-like members of `entry'
 * to the group totals and updates the group counters via
 * ps_update_counter(). Each I/O and context-switch counter pair is only
 * updated when neither value of the pair is -1.
 *
 * name, cmdline: forwarded to ps_list_match().
 * entry:         the freshly read sample.
 *
 * NOTE(review): this listing omits the early-exit checks, the `continue'
 * after a failed match, the initialisation/linking of a new entry and the
 * closing braces. */
510 static void ps_list_add(const char *name, const char *cmdline,
511 process_entry_t *entry) {
512 procstat_entry_t *pse;
517 for (procstat_t *ps = list_head_g; ps != NULL; ps = ps->next) {
518 if ((ps_list_match(name, cmdline, ps)) == 0)
522 ps_fill_details(ps, entry);
/* Stop at the entry with this id, or at the last entry of the list. */
525 for (pse = ps->instances; pse != NULL; pse = pse->next)
526 if ((pse->id == entry->id) || (pse->next == NULL))
529 if ((pse == NULL) || (pse->id != entry->id)) {
530 procstat_entry_t *new;
532 new = calloc(1, sizeof(*new));
547 ps->num_proc += entry->num_proc;
548 ps->num_lwp += entry->num_lwp;
549 ps->num_fd += entry->num_fd;
550 ps->num_maps += entry->num_maps;
551 ps->vmem_size += entry->vmem_size;
552 ps->vmem_rss += entry->vmem_rss;
553 ps->vmem_data += entry->vmem_data;
554 ps->vmem_code += entry->vmem_code;
555 ps->stack_size += entry->stack_size;
557 if ((entry->io_rchar != -1) && (entry->io_wchar != -1)) {
558 ps_update_counter(&ps->io_rchar, &pse->io_rchar, entry->io_rchar);
559 ps_update_counter(&ps->io_wchar, &pse->io_wchar, entry->io_wchar);
562 if ((entry->io_syscr != -1) && (entry->io_syscw != -1)) {
563 ps_update_counter(&ps->io_syscr, &pse->io_syscr, entry->io_syscr);
564 ps_update_counter(&ps->io_syscw, &pse->io_syscw, entry->io_syscw);
567 if ((entry->io_diskr != -1) && (entry->io_diskw != -1)) {
568 ps_update_counter(&ps->io_diskr, &pse->io_diskr, entry->io_diskr);
569 ps_update_counter(&ps->io_diskw, &pse->io_diskw, entry->io_diskw);
572 if ((entry->cswitch_vol != -1) && (entry->cswitch_invol != -1)) {
573 ps_update_counter(&ps->cswitch_vol, &pse->cswitch_vol,
575 ps_update_counter(&ps->cswitch_invol, &pse->cswitch_invol,
576 entry->cswitch_invol);
579 ps_update_counter(&ps->vmem_minflt_counter, &pse->vmem_minflt_counter,
580 entry->vmem_minflt_counter);
581 ps_update_counter(&ps->vmem_majflt_counter, &pse->vmem_majflt_counter,
582 entry->vmem_majflt_counter);
584 ps_update_counter(&ps->cpu_user_counter, &pse->cpu_user_counter,
585 entry->cpu_user_counter);
586 ps_update_counter(&ps->cpu_system_counter, &pse->cpu_system_counter,
587 entry->cpu_system_counter);
589 #if HAVE_LIBTASKSTATS
590 ps_update_delay(ps, pse, entry);
595 /* remove old entries from instances of processes in list_head_g */
/* Prepares every configured group for the next read pass: the delay_* sums
 * are set to NAN, and the per-process entries are walked so that entries
 * considered too old are unlinked from ps->instances.
 * NOTE(review): this listing omits the resetting of the other group totals,
 * the age test and ageing of entries, the freeing of removed entries and
 * several braces; the exact ageing rule cannot be confirmed from here. */
596 static void ps_list_reset(void) {
597 procstat_entry_t *pse;
598 procstat_entry_t *pse_prev;
600 for (procstat_t *ps = list_head_g; ps != NULL; ps = ps->next) {
612 ps->delay_blkio = NAN;
613 ps->delay_swapin = NAN;
614 ps->delay_freepages = NAN;
618 while (pse != NULL) {
620 DEBUG("Removing this procstat entry cause it's too old: "
621 "id = %lu; name = %s;",
624 if (pse_prev == NULL) {
625 ps->instances = pse->next;
629 pse_prev->next = pse->next;
631 pse = pse_prev->next;
638 } /* while (pse != NULL) */
639 } /* for (ps = list_head_g; ps != NULL; ps = ps->next) */
/* Applies the per-group options nested inside a `Process' / `ProcessMatch'
 * block to `ps'. Recognised keys (case-insensitive): CollectContextSwitch,
 * CollectFileDescriptor, CollectMemoryMaps and CollectDelayAccounting; the
 * last one only takes effect when built with HAVE_LIBTASKSTATS, otherwise a
 * warning is logged. Any other key is reported with ERROR().
 *
 * ci: the config block whose children are examined.
 * ps: the group whose report_* switches are updated.
 *
 * NOTE(review): the `#else' / `#endif' and some braces are missing from this
 * listing. */
642 static void ps_tune_instance(oconfig_item_t *ci, procstat_t *ps) {
643 for (int i = 0; i < ci->children_num; i++) {
644 oconfig_item_t *c = ci->children + i;
646 if (strcasecmp(c->key, "CollectContextSwitch") == 0)
647 cf_util_get_boolean(c, &ps->report_ctx_switch);
648 else if (strcasecmp(c->key, "CollectFileDescriptor") == 0)
649 cf_util_get_boolean(c, &ps->report_fd_num);
650 else if (strcasecmp(c->key, "CollectMemoryMaps") == 0)
651 cf_util_get_boolean(c, &ps->report_maps_num);
652 else if (strcasecmp(c->key, "CollectDelayAccounting") == 0) {
653 #if HAVE_LIBTASKSTATS
654 cf_util_get_boolean(c, &ps->report_delay);
656 WARNING("processes plugin: The plugin has been compiled without support "
657 "for the \"CollectDelayAccounting\" option.");
660 ERROR("processes plugin: Option \"%s\" not allowed here.", c->key);
662 } /* for (ci->children) */
663 } /* void ps_tune_instance */
665 /* Register all 'Process' / 'ProcessMatch' names from the config in list_head_g. */
/* Handles the plugin's configuration block.
 *
 * - `Process <name>': requires exactly one string argument; the name is
 *   registered without a regex. Where a platform limit is defined
 *   (max_procname_len), a longer name triggers a warning.
 * - `ProcessMatch <name> <regex>': requires exactly two string arguments.
 * - Nested options of either block are applied with ps_tune_instance() when
 *   registration returned a non-NULL group.
 * - CollectContextSwitch, CollectFileDescriptor, CollectMemoryMaps and
 *   CollectDelayAccounting at this level set the global defaults; the last
 *   one only when built with HAVE_LIBTASKSTATS.
 * - Any other key is reported with ERROR().
 *
 * NOTE(review): global defaults are copied by ps_list_register() at
 * registration time, so their position relative to `Process' blocks in the
 * config presumably matters - confirm.
 * NOTE(review): this listing omits the `#if' before the first constant, the
 * `continue' statements after argument errors, the declaration of `ps', the
 * return statement and several braces. */
666 static int ps_config(oconfig_item_t *ci) {
668 const size_t max_procname_len = 15;
669 #elif KERNEL_SOLARIS || KERNEL_FREEBSD
670 const size_t max_procname_len = MAXCOMLEN - 1;
675 for (int i = 0; i < ci->children_num; ++i) {
676 oconfig_item_t *c = ci->children + i;
678 if (strcasecmp(c->key, "Process") == 0) {
679 if ((c->values_num != 1) || (OCONFIG_TYPE_STRING != c->values[0].type)) {
680 ERROR("processes plugin: `Process' expects exactly "
681 "one string argument (got %i).",
686 #if KERNEL_LINUX || KERNEL_SOLARIS || KERNEL_FREEBSD
687 if (strlen(c->values[0].value.string) > max_procname_len) {
688 WARNING("processes plugin: this platform has a %" PRIsz
690 "to process names. The `Process \"%s\"' option will "
691 "not work as expected.",
692 max_procname_len, c->values[0].value.string);
696 ps = ps_list_register(c->values[0].value.string, NULL);
698 if (c->children_num != 0 && ps != NULL)
699 ps_tune_instance(c, ps);
700 } else if (strcasecmp(c->key, "ProcessMatch") == 0) {
701 if ((c->values_num != 2) || (OCONFIG_TYPE_STRING != c->values[0].type) ||
702 (OCONFIG_TYPE_STRING != c->values[1].type)) {
703 ERROR("processes plugin: `ProcessMatch' needs exactly "
704 "two string arguments (got %i).",
709 ps = ps_list_register(c->values[0].value.string,
710 c->values[1].value.string);
712 if (c->children_num != 0 && ps != NULL)
713 ps_tune_instance(c, ps);
714 } else if (strcasecmp(c->key, "CollectContextSwitch") == 0) {
715 cf_util_get_boolean(c, &report_ctx_switch);
716 } else if (strcasecmp(c->key, "CollectFileDescriptor") == 0) {
717 cf_util_get_boolean(c, &report_fd_num);
718 } else if (strcasecmp(c->key, "CollectMemoryMaps") == 0) {
719 cf_util_get_boolean(c, &report_maps_num);
720 } else if (strcasecmp(c->key, "CollectDelayAccounting") == 0) {
721 #if HAVE_LIBTASKSTATS
722 cf_util_get_boolean(c, &report_delay);
724 WARNING("processes plugin: The plugin has been compiled without support "
725 "for the \"CollectDelayAccounting\" option.");
728 ERROR("processes plugin: The `%s' configuration option is not "
729 "understood and will be ignored.",
/* Platform-specific initialisation.
 *
 * - Mach: obtains the host and task ports, releases a previously obtained
 *   processor-set list with vm_deallocate() and fetches a new one with
 *   host_processor_sets(), logging an error on failure.
 * - Linux: stores sysconf(_SC_PAGESIZE) in pagesize_g and, with
 *   HAVE_LIBTASKSTATS, creates the taskstats handle once; a failure to
 *   create it is only logged as a warning.
 * - kvm and procinfo variants: store getpagesize() in `pagesize'.
 *
 * NOTE(review): the preprocessor conditionals that open the first two
 * branches, the return statements and several braces are missing from this
 * listing. */
738 static int ps_init(void) {
740 kern_return_t status;
742 port_host_self = mach_host_self();
743 port_task_self = mach_task_self();
745 if (pset_list != NULL) {
746 vm_deallocate(port_task_self, (vm_address_t)pset_list,
747 pset_list_len * sizeof(processor_set_t));
752 if ((status = host_processor_sets(port_host_self, &pset_list,
753 &pset_list_len)) != KERN_SUCCESS) {
754 ERROR("host_processor_sets failed: %s\n", mach_error_string(status));
759 /* #endif HAVE_THREAD_INFO */
762 pagesize_g = sysconf(_SC_PAGESIZE);
763 DEBUG("pagesize_g = %li; CONFIG_HZ = %i;", pagesize_g, CONFIG_HZ);
765 #if HAVE_LIBTASKSTATS
766 if (taskstats_handle == NULL) {
767 taskstats_handle = ts_create();
768 if (taskstats_handle == NULL) {
769 WARNING("processes plugin: Creating taskstats handle failed.");
773 /* #endif KERNEL_LINUX */
775 #elif HAVE_LIBKVM_GETPROCS && \
776 (HAVE_STRUCT_KINFO_PROC_FREEBSD || HAVE_STRUCT_KINFO_PROC_OPENBSD)
777 pagesize = getpagesize();
778 /* #endif HAVE_LIBKVM_GETPROCS && (HAVE_STRUCT_KINFO_PROC_FREEBSD ||
779 * HAVE_STRUCT_KINFO_PROC_OPENBSD) */
781 #elif HAVE_PROCINFO_H
782 pagesize = getpagesize();
783 #endif /* HAVE_PROCINFO_H */
788 /* submit global state (e.g.: qty of zombies, running, etc..) */
/* Dispatches one gauge of type "ps_state" for the "processes" plugin with an
 * empty plugin instance.
 *
 * state: used as the type instance.
 * value: the gauge value.
 *
 * NOTE(review): the line setting vl.values_len and the closing brace are
 * missing from this listing. */
789 static void ps_submit_state(const char *state, double value) {
790 value_list_t vl = VALUE_LIST_INIT;
/* The compound literal lives until the end of this function, which covers the
 * dispatch call below. */
792 vl.values = &(value_t){.gauge = value};
794 sstrncpy(vl.plugin, "processes", sizeof(vl.plugin));
795 sstrncpy(vl.plugin_instance, "", sizeof(vl.plugin_instance));
796 sstrncpy(vl.type, "ps_state", sizeof(vl.type));
797 sstrncpy(vl.type_instance, state, sizeof(vl.type_instance));
799 plugin_dispatch_values(&vl);
802 /* submit info about specific process (e.g.: memory taken, cpu usage, etc..) */
/* Dispatches all metrics of one configured process group, using ps->name as
 * the plugin instance.
 *
 * Always dispatched: ps_vm, ps_rss, ps_data, ps_code, ps_stacksize,
 * ps_cputime (user, system), ps_count (processes, threads) and
 * ps_pagefaults (minor, major).
 * Dispatched only when data is available:
 * - io_octets, io_ops, disk_octets: both counters of the pair are not -1;
 * - file_handles: num_fd > 0; file_handles/"mapped": num_maps > 0;
 * - contextswitch "voluntary" / "involuntary": both counters are not -1;
 * - delay_rate per delay kind: the accumulated rate is not NaN.
 *
 * Fix: the delay rates are accumulated in nanoseconds per second and are
 * documented as being reported in seconds per second, so they must be
 * divided by delay_factor (1e9); the previous code multiplied instead.
 *
 * NOTE(review): this listing omits the declaration of the value array, the
 * vl.values / vl.values_len assignments, the struct header of
 * delay_metrics[], the opening of the DEBUG() call and several braces. Those
 * lines are left as they are. */
803 static void ps_submit_proc_list(procstat_t *ps) {
804 value_list_t vl = VALUE_LIST_INIT;
808 sstrncpy(vl.plugin, "processes", sizeof(vl.plugin));
809 sstrncpy(vl.plugin_instance, ps->name, sizeof(vl.plugin_instance));
811 sstrncpy(vl.type, "ps_vm", sizeof(vl.type));
812 vl.values[0].gauge = ps->vmem_size;
814 plugin_dispatch_values(&vl);
816 sstrncpy(vl.type, "ps_rss", sizeof(vl.type));
817 vl.values[0].gauge = ps->vmem_rss;
819 plugin_dispatch_values(&vl);
821 sstrncpy(vl.type, "ps_data", sizeof(vl.type));
822 vl.values[0].gauge = ps->vmem_data;
824 plugin_dispatch_values(&vl);
826 sstrncpy(vl.type, "ps_code", sizeof(vl.type));
827 vl.values[0].gauge = ps->vmem_code;
829 plugin_dispatch_values(&vl);
831 sstrncpy(vl.type, "ps_stacksize", sizeof(vl.type));
832 vl.values[0].gauge = ps->stack_size;
834 plugin_dispatch_values(&vl);
836 sstrncpy(vl.type, "ps_cputime", sizeof(vl.type));
837 vl.values[0].derive = ps->cpu_user_counter;
838 vl.values[1].derive = ps->cpu_system_counter;
840 plugin_dispatch_values(&vl);
842 sstrncpy(vl.type, "ps_count", sizeof(vl.type));
843 vl.values[0].gauge = ps->num_proc;
844 vl.values[1].gauge = ps->num_lwp;
846 plugin_dispatch_values(&vl);
848 sstrncpy(vl.type, "ps_pagefaults", sizeof(vl.type));
849 vl.values[0].derive = ps->vmem_minflt_counter;
850 vl.values[1].derive = ps->vmem_majflt_counter;
852 plugin_dispatch_values(&vl);
/* The I/O pairs are only reported when both counters hold data. */
854 if ((ps->io_rchar != -1) && (ps->io_wchar != -1)) {
855 sstrncpy(vl.type, "io_octets", sizeof(vl.type));
856 vl.values[0].derive = ps->io_rchar;
857 vl.values[1].derive = ps->io_wchar;
859 plugin_dispatch_values(&vl);
862 if ((ps->io_syscr != -1) && (ps->io_syscw != -1)) {
863 sstrncpy(vl.type, "io_ops", sizeof(vl.type));
864 vl.values[0].derive = ps->io_syscr;
865 vl.values[1].derive = ps->io_syscw;
867 plugin_dispatch_values(&vl);
870 if ((ps->io_diskr != -1) && (ps->io_diskw != -1)) {
871 sstrncpy(vl.type, "disk_octets", sizeof(vl.type));
872 vl.values[0].derive = ps->io_diskr;
873 vl.values[1].derive = ps->io_diskw;
875 plugin_dispatch_values(&vl);
878 if (ps->num_fd > 0) {
879 sstrncpy(vl.type, "file_handles", sizeof(vl.type));
880 vl.values[0].gauge = ps->num_fd;
882 plugin_dispatch_values(&vl);
/* Memory map counts reuse the "file_handles" type with the type instance
 * "mapped". */
885 if (ps->num_maps > 0) {
886 sstrncpy(vl.type, "file_handles", sizeof(vl.type));
887 sstrncpy(vl.type_instance, "mapped", sizeof(vl.type_instance));
888 vl.values[0].gauge = ps->num_maps;
890 plugin_dispatch_values(&vl);
893 if ((ps->cswitch_vol != -1) && (ps->cswitch_invol != -1)) {
894 sstrncpy(vl.type, "contextswitch", sizeof(vl.type));
895 sstrncpy(vl.type_instance, "voluntary", sizeof(vl.type_instance));
896 vl.values[0].derive = ps->cswitch_vol;
898 plugin_dispatch_values(&vl);
900 sstrncpy(vl.type, "contextswitch", sizeof(vl.type));
901 sstrncpy(vl.type_instance, "involuntary", sizeof(vl.type_instance));
902 vl.values[0].derive = ps->cswitch_invol;
904 plugin_dispatch_values(&vl);
907 /* The ps->delay_* metrics are in nanoseconds per second. Convert to seconds
 * per second. */
909 gauge_t const delay_factor = 1000000000.0;
914 } delay_metrics[] = {
915 {"delay-cpu", ps->delay_cpu},
916 {"delay-blkio", ps->delay_blkio},
917 {"delay-swapin", ps->delay_swapin},
918 {"delay-freepages", ps->delay_freepages},
920 for (size_t i = 0; i < STATIC_ARRAY_SIZE(delay_metrics); i++) {
921 if (isnan(delay_metrics[i].rate_ns)) {
924 sstrncpy(vl.type, "delay_rate", sizeof(vl.type));
925 sstrncpy(vl.type_instance, delay_metrics[i].type_instance,
926 sizeof(vl.type_instance));
/* ns/s -> s/s: divide by the number of nanoseconds in a second. */
927 vl.values[0].gauge = delay_metrics[i].rate_ns / delay_factor;
929 plugin_dispatch_values(&vl);
933 "name = %s; num_proc = %lu; num_lwp = %lu; num_fd = %lu; num_maps = %lu; "
934 "vmem_size = %lu; vmem_rss = %lu; vmem_data = %lu; "
936 "vmem_minflt_counter = %" PRIi64 "; vmem_majflt_counter = %" PRIi64 "; "
937 "cpu_user_counter = %" PRIi64 "; cpu_system_counter = %" PRIi64 "; "
938 "io_rchar = %" PRIi64 "; io_wchar = %" PRIi64 "; "
939 "io_syscr = %" PRIi64 "; io_syscw = %" PRIi64 "; "
940 "io_diskr = %" PRIi64 "; io_diskw = %" PRIi64 "; "
941 "cswitch_vol = %" PRIi64 "; cswitch_invol = %" PRIi64 "; "
942 "delay_cpu = %g; delay_blkio = %g; "
943 "delay_swapin = %g; delay_freepages = %g;",
944 ps->name, ps->num_proc, ps->num_lwp, ps->num_fd, ps->num_maps,
945 ps->vmem_size, ps->vmem_rss, ps->vmem_data, ps->vmem_code,
946 ps->vmem_minflt_counter, ps->vmem_majflt_counter, ps->cpu_user_counter,
947 ps->cpu_system_counter, ps->io_rchar, ps->io_wchar, ps->io_syscr,
948 ps->io_syscw, ps->io_diskr, ps->io_diskw, ps->cswitch_vol,
949 ps->cswitch_invol, ps->delay_cpu, ps->delay_blkio, ps->delay_swapin,
950 ps->delay_freepages);
952 } /* void ps_submit_proc_list */
954 #if KERNEL_LINUX || KERNEL_SOLARIS
/* Dispatches one derive value of type "fork_rate" for the "processes" plugin
 * with empty plugin and type instances.
 *
 * value: the derive value to dispatch.
 *
 * NOTE(review): the line setting vl.values_len and the closing brace are
 * missing from this listing. */
955 static void ps_submit_fork_rate(derive_t value) {
956 value_list_t vl = VALUE_LIST_INIT;
958 vl.values = &(value_t){.derive = value};
960 sstrncpy(vl.plugin, "processes", sizeof(vl.plugin));
961 sstrncpy(vl.plugin_instance, "", sizeof(vl.plugin_instance));
962 sstrncpy(vl.type, "fork_rate", sizeof(vl.type));
963 sstrncpy(vl.type_instance, "", sizeof(vl.type_instance));
965 plugin_dispatch_values(&vl);
967 #endif /* KERNEL_LINUX || KERNEL_SOLARIS*/
969 /* ------- additional functions for KERNEL_LINUX/HAVE_THREAD_INFO ------- */
/* Sums the context switch counters of all tasks of a process.
 * Walks /proc/<id>/task, skips directory entries whose name does not start
 * with a digit, opens each task's `status' file and adds up the values of
 * the "voluntary_ctxt_switches" and "nonvoluntary_ctxt_switches" lines. The
 * totals are stored in ps->cswitch_vol and ps->cswitch_invol.
 *
 * ps: entry whose id selects the process and which receives the totals.
 *
 * Tasks whose status file cannot be opened are only reported with DEBUG().
 * NOTE(review): the local declarations, the statements following each error
 * check, the field-count check, the voluntary accumulation, closedir() and
 * the return statements are missing from this listing. */
971 static int ps_read_tasks_status(process_entry_t *ps) {
977 derive_t cswitch_vol = 0;
978 derive_t cswitch_invol = 0;
983 snprintf(dirname, sizeof(dirname), "/proc/%li/task", ps->id);
985 if ((dh = opendir(dirname)) == NULL) {
986 DEBUG("Failed to open directory `%s'", dirname);
990 while ((ent = readdir(dh)) != NULL) {
993 if (!isdigit((int)ent->d_name[0]))
998 if (snprintf(filename, sizeof(filename), "/proc/%li/task/%s/status", ps->id,
999 tpid) >= sizeof(filename)) {
1000 DEBUG("Filename too long: `%s'", filename);
1004 if ((fh = fopen(filename, "r")) == NULL) {
1005 DEBUG("Failed to open file `%s'", filename);
1009 while (fgets(buffer, sizeof(buffer), fh) != NULL) {
1013 if (strncmp(buffer, "voluntary_ctxt_switches", 23) != 0 &&
1014 strncmp(buffer, "nonvoluntary_ctxt_switches", 26) != 0)
1017 numfields = strsplit(buffer, fields, STATIC_ARRAY_SIZE(fields));
1024 tmp = (derive_t)strtoll(fields[1], &endptr, /* base = */ 10);
1025 if ((errno == 0) && (endptr != fields[1])) {
1026 if (strncmp(buffer, "voluntary_ctxt_switches", 23) == 0) {
1028 } else if (strncmp(buffer, "nonvoluntary_ctxt_switches", 26) == 0) {
1029 cswitch_invol += tmp;
1032 } /* while (fgets) */
1035 WARNING("processes: fclose: %s", STRERRNO);
1040 ps->cswitch_vol = cswitch_vol;
1041 ps->cswitch_invol = cswitch_invol;
1044 } /* int *ps_read_tasks_status */
1046 /* Read data from /proc/pid/status */
/* Parses the "Vm*" and "Threads" lines of the status file. The VmData value
 * is stored in ps->vmem_data and the sum of VmExe and VmLib in
 * ps->vmem_code, both multiplied by 1024; the thread count is stored in
 * ps->num_lwp.
 *
 * pid: process id used to build the path.
 * ps:  entry that receives the values.
 *
 * ps_read_process() treats a non-zero return value as "no vmem data".
 * NOTE(review): the local declarations, the assignments inside the branches
 * that pick a field, the condition around the num_lwp store and the return
 * statements are missing from this listing. */
1047 static int ps_read_status(long pid, process_entry_t *ps) {
1051 unsigned long lib = 0;
1052 unsigned long exe = 0;
1053 unsigned long data = 0;
1054 unsigned long threads = 0;
1058 snprintf(filename, sizeof(filename), "/proc/%li/status", pid);
1059 if ((fh = fopen(filename, "r")) == NULL)
1062 while (fgets(buffer, sizeof(buffer), fh) != NULL) {
1066 if (strncmp(buffer, "Vm", 2) != 0 && strncmp(buffer, "Threads", 7) != 0)
1069 numfields = strsplit(buffer, fields, STATIC_ARRAY_SIZE(fields));
1076 tmp = strtoul(fields[1], &endptr, /* base = */ 10);
1077 if ((errno == 0) && (endptr != fields[1])) {
1078 if (strncmp(buffer, "VmData", 6) == 0) {
1080 } else if (strncmp(buffer, "VmLib", 5) == 0) {
1082 } else if (strncmp(buffer, "VmExe", 5) == 0) {
1084 } else if (strncmp(buffer, "Threads", 7) == 0) {
1088 } /* while (fgets) */
1091 WARNING("processes: fclose: %s", STRERRNO);
/* Scale by 1024 (presumably kB to bytes - confirm against proc(5)). */
1094 ps->vmem_data = data * 1024;
1095 ps->vmem_code = (exe + lib) * 1024;
1097 ps->num_lwp = threads;
1100 } /* int *ps_read_status */
/* Reads the I/O counters of a process from /proc/<id>/io.
 * Lines are matched case-insensitively by key: rchar, wchar, syscr, syscw,
 * read_bytes and write_bytes map to ps->io_rchar, io_wchar, io_syscr,
 * io_syscw, io_diskr and io_diskw. The second field of a matching line is
 * parsed with strtoll() and stored; lines that fail to parse are not stored.
 *
 * ps: entry whose id selects the process and which receives the values.
 *
 * NOTE(review): the local declarations, the handling of unmatched keys, the
 * field-count check, the `continue' statements and the return statements are
 * missing from this listing. */
1102 static int ps_read_io(process_entry_t *ps) {
1110 snprintf(filename, sizeof(filename), "/proc/%li/io", ps->id);
1111 if ((fh = fopen(filename, "r")) == NULL) {
1112 DEBUG("ps_read_io: Failed to open file `%s'", filename);
1116 while (fgets(buffer, sizeof(buffer), fh) != NULL) {
1117 derive_t *val = NULL;
1121 if (strncasecmp(buffer, "rchar:", 6) == 0)
1122 val = &(ps->io_rchar);
1123 else if (strncasecmp(buffer, "wchar:", 6) == 0)
1124 val = &(ps->io_wchar);
1125 else if (strncasecmp(buffer, "syscr:", 6) == 0)
1126 val = &(ps->io_syscr);
1127 else if (strncasecmp(buffer, "syscw:", 6) == 0)
1128 val = &(ps->io_syscw);
1129 else if (strncasecmp(buffer, "read_bytes:", 11) == 0)
1130 val = &(ps->io_diskr);
1131 else if (strncasecmp(buffer, "write_bytes:", 12) == 0)
1132 val = &(ps->io_diskw);
1136 numfields = strsplit(buffer, fields, STATIC_ARRAY_SIZE(fields));
1143 tmp = strtoll(fields[1], &endptr, /* base = */ 10);
1144 if ((errno != 0) || (endptr == fields[1]))
1147 *val = (derive_t)tmp;
1148 } /* while (fgets) */
1151 WARNING("processes: fclose: %s", STRERRNO);
1154 } /* int ps_read_io (...) */
/* Counts the memory mappings of a process by reading /proc/<pid>/maps.
 * Only buffer reads that contain a newline are considered, so a line longer
 * than the buffer is not counted once per chunk.
 *
 * pid: process id used to build the path.
 *
 * ps_fill_details() only stores the result when it is greater than zero.
 * NOTE(review): the local declarations, the counter increment and the return
 * statements are missing from this listing. */
1156 static int ps_count_maps(pid_t pid) {
1162 snprintf(filename, sizeof(filename), "/proc/%d/maps", pid);
1163 if ((fh = fopen(filename, "r")) == NULL) {
1164 DEBUG("ps_count_maps: Failed to open file `%s'", filename);
1168 while (fgets(buffer, sizeof(buffer), fh) != NULL) {
1169 if (strchr(buffer, '\n')) {
1172 } /* while (fgets) */
1175 WARNING("processes: fclose: %s", STRERRNO);
1178 } /* int ps_count_maps (...) */
/* Counts the open file descriptors of a process by listing /proc/<pid>/fd
 * and looking only at entries whose name starts with a digit.
 *
 * pid: process id used to build the path.
 *
 * After a successful listing the result is at least 1, even when no entry
 * was counted.
 * NOTE(review): the local declarations, the counting statement, closedir()
 * and the error-path return are missing from this listing. */
1180 static int ps_count_fd(int pid) {
1186 snprintf(dirname, sizeof(dirname), "/proc/%i/fd", pid);
1188 if ((dh = opendir(dirname)) == NULL) {
1189 DEBUG("Failed to open directory `%s'", dirname);
1192 while ((ent = readdir(dh)) != NULL) {
1193 if (!isdigit((int)ent->d_name[0]))
1200 return (count >= 1) ? count : 1;
1201 } /* int ps_count_fd (pid) */
1203 #if HAVE_LIBTASKSTATS
/* Fetches the delay accounting data of a process into ps->delay with
 * ts_delay_by_tgid().
 *
 * ps: entry whose id selects the process.
 *
 * An EPERM result is reported with a message that depends on whether the
 * CAP_NET_ADMIN capability is present and whether collectd runs as root; at
 * least one of these messages is rate-limited through a static c_complain_t.
 * Any other non-zero status is logged with ERROR().
 * ps_fill_details() treats a return value of 0 as success.
 * NOTE(review): the return statements, the logging calls that open several of
 * the message strings below and the `#else' / `#endif' are missing from this
 * listing. */
1204 static int ps_delay(process_entry_t *ps) {
1205 if (taskstats_handle == NULL) {
1209 int status = ts_delay_by_tgid(taskstats_handle, (uint32_t)ps->id, &ps->delay);
1210 if (status == EPERM) {
1211 static c_complain_t c;
1212 #if defined(HAVE_SYS_CAPABILITY_H) && defined(CAP_NET_ADMIN)
1213 if (check_capability(CAP_NET_ADMIN) != 0) {
1214 if (getuid() == 0) {
1217 "processes plugin: Reading Delay Accounting metric failed: %s. "
1218 "collectd is running as root, but missing the CAP_NET_ADMIN "
1219 "capability. The most common cause for this is that the init "
1220 "system is dropping capabilities.",
1225 "processes plugin: Reading Delay Accounting metric failed: %s. "
1226 "collectd is not running as root and missing the CAP_NET_ADMIN "
1227 "capability. Either run collectd as root or grant it the "
1228 "CAP_NET_ADMIN capability using \"setcap cap_net_admin=ep " PREFIX
1229 "/sbin/collectd\".",
1233 ERROR("processes plugin: ts_delay_by_tgid failed: %s. The CAP_NET_ADMIN "
1234 "capability is available (I checked), so this error is utterly "
1239 c_complain(LOG_ERR, &c,
1240 "processes plugin: Reading Delay Accounting metric failed: %s. "
1241 "Reading Delay Accounting metrics requires root privileges.",
1245 } else if (status != 0) {
1246 ERROR("processes plugin: ts_delay_by_tgid failed: %s", STRERROR(status));
/* Lazily fills the optional parts of `entry' that group `ps' asks for. Each
 * part is guarded by a has_* flag on the entry, so it is read at most once
 * per sample even when several groups match the same process:
 * - I/O counters when entry->has_io is 0;
 * - context switches when ps->report_ctx_switch is set;
 * - map count when ps->report_maps_num is set (stored only if > 0);
 * - fd count when ps->report_fd_num is set (stored only if > 0);
 * - delay accounting when ps->report_delay is set and built with
 *   HAVE_LIBTASKSTATS; has_delay is only set when ps_delay() returns 0.
 *
 * NOTE(review): the body of the has_io branch, the declarations of num_maps
 * and num_fd, the has_fd store and several braces are missing from this
 * listing. */
1254 static void ps_fill_details(const procstat_t *ps, process_entry_t *entry) {
1255 if (entry->has_io == 0) {
1260 if (ps->report_ctx_switch) {
1261 if (entry->has_cswitch == 0) {
1262 ps_read_tasks_status(entry);
1263 entry->has_cswitch = 1;
1267 if (ps->report_maps_num) {
1269 if (entry->has_maps == 0 && (num_maps = ps_count_maps(entry->id)) > 0) {
1270 entry->num_maps = num_maps;
1272 entry->has_maps = 1;
1275 if (ps->report_fd_num) {
1277 if (entry->has_fd == 0 && (num_fd = ps_count_fd(entry->id)) > 0) {
1278 entry->num_fd = num_fd;
1283 #if HAVE_LIBTASKSTATS
1284 if (ps->report_delay && !entry->has_delay) {
1285 if (ps_delay(entry) == 0) {
1286 entry->has_delay = 1;
1290 } /* void ps_fill_details (...) */
1292 /* ps_read_process reads process counters on Linux. */
/* Reads /proc/<pid>/stat and fills `ps'.
 *
 * pid:   process id used to build the path.
 * ps:    entry to fill: name, thread count, page-fault and CPU counters,
 *        memory sizes and stack size; the context-switch counters are set to
 *        -1 ("no data") for ps_fill_details() to fill in later.
 * state: receives the first character of the first field after the name.
 *
 * Steps: locate the name between the first '(' and the last ')', copy it
 * (truncated to fit ps->name), split the remainder into fields and require
 * at least 22 of them. Zombies (state 'Z') take a separate path; for other
 * processes the thread count comes from field 17 and ps_read_status() is
 * called as well. CPU times are converted from jiffies to microseconds using
 * CONFIG_HZ and the RSS is multiplied by pagesize_g.
 *
 * NOTE(review): the local declarations, the increments of the two scan
 * loops, the error returns, the zombie branch bodies, the condition around
 * the stack-size computation, the defaults for the io_* members and the
 * final return are missing from this listing. */
1293 static int ps_read_process(long pid, process_entry_t *ps, char *state) {
1303 size_t name_start_pos;
1304 size_t name_end_pos;
1307 derive_t cpu_user_counter;
1308 derive_t cpu_system_counter;
1309 long long unsigned vmem_size;
1310 long long unsigned vmem_rss;
1311 long long unsigned stack_size;
1315 snprintf(filename, sizeof(filename), "/proc/%li/stat", pid);
/* One byte of the buffer is kept free for the terminating NUL written below. */
1317 status = read_file_contents(filename, buffer, sizeof(buffer) - 1);
1320 buffer_len = (size_t)status;
1321 buffer[buffer_len] = 0;
1323 /* The name of the process is enclosed in parens. Since the name can
1324 * contain parens itself, spaces, numbers and pretty much everything
1325 * else, use these to determine the process name. We don't use
1326 * strchr(3) and strrchr(3) to avoid pointer arithmetic which would
1327 * otherwise be required to determine name_len. */
1329 while (name_start_pos < buffer_len && buffer[name_start_pos] != '(')
1332 name_end_pos = buffer_len;
1333 while (name_end_pos > 0 && buffer[name_end_pos] != ')')
1336 /* Either '(' or ')' is not found or they are in the wrong order.
1337 * Anyway, something weird that shouldn't happen ever. */
1338 if (name_start_pos >= name_end_pos) {
1339 ERROR("processes plugin: name_start_pos = %" PRIsz
1340 " >= name_end_pos = %" PRIsz,
1341 name_start_pos, name_end_pos);
1345 name_len = (name_end_pos - name_start_pos) - 1;
1346 if (name_len >= sizeof(ps->name))
1347 name_len = sizeof(ps->name) - 1;
1349 sstrncpy(ps->name, &buffer[name_start_pos + 1], name_len + 1);
1351 if ((buffer_len - name_end_pos) < 2)
/* Skip the closing paren and the character after it. */
1353 buffer_ptr = &buffer[name_end_pos + 2];
1355 fields_len = strsplit(buffer_ptr, fields, STATIC_ARRAY_SIZE(fields));
1356 if (fields_len < 22) {
1357 DEBUG("processes plugin: ps_read_process (pid = %li):"
1358 " `%s' has only %i fields..",
1359 pid, filename, fields_len);
1363 *state = fields[0][0];
1365 if (*state == 'Z') {
1369 ps->num_lwp = strtoul(fields[17], /* endptr = */ NULL, /* base = */ 10);
1370 if ((ps_read_status(pid, ps)) != 0) {
1374 DEBUG("ps_read_process: did not get vmem data for pid %li", pid);
1376 if (ps->num_lwp == 0)
1381 /* Leave the rest at zero if this is only a zombie */
1382 if (ps->num_proc == 0) {
1383 DEBUG("processes plugin: This is only a zombie: pid = %li; "
1389 cpu_user_counter = atoll(fields[11]);
1390 cpu_system_counter = atoll(fields[12]);
1391 vmem_size = atoll(fields[20]);
1392 vmem_rss = atoll(fields[21]);
1393 ps->vmem_minflt_counter = atol(fields[7]);
1394 ps->vmem_majflt_counter = atol(fields[9]);
1397 unsigned long long stack_start = atoll(fields[25]);
1398 unsigned long long stack_ptr = atoll(fields[26]);
/* Absolute difference between the two fields, whichever is larger. */
1400 stack_size = (stack_start > stack_ptr) ? stack_start - stack_ptr
1401 : stack_ptr - stack_start;
1404 /* Convert jiffies to useconds */
1405 cpu_user_counter = cpu_user_counter * 1000000 / CONFIG_HZ;
1406 cpu_system_counter = cpu_system_counter * 1000000 / CONFIG_HZ;
1407 vmem_rss = vmem_rss * pagesize_g;
1409 ps->cpu_user_counter = cpu_user_counter;
1410 ps->cpu_system_counter = cpu_system_counter;
1411 ps->vmem_size = (unsigned long)vmem_size;
1412 ps->vmem_rss = (unsigned long)vmem_rss;
1413 ps->stack_size = (unsigned long)stack_size;
1415 /* no data by default. May be filled by ps_fill_details () */
1423 ps->cswitch_vol = -1;
1424 ps->cswitch_invol = -1;
1428 } /* int ps_read_process (...) */
/*
 * Linux variant: fills `buf' (capacity `buf_len') with a printable command
 * line for `pid', read from /proc/<pid>/cmdline. When no command line is
 * available (e.g. kernel thread, zombie) the process name is written as
 * "[name]" instead. A pid < 1, a NULL `buf' or a buf_len < 2 is rejected
 * before any file access.
 * NOTE(review): the return statements are not part of this excerpt. The
 * callers hand the result straight to ps_list_add() as the command line;
 * confirm which value is returned on failure.
 */
1430 static char *ps_get_cmdline(long pid, char *name, char *buf, size_t buf_len) {
1434 char file[PATH_MAX];
1439 if ((pid < 1) || (NULL == buf) || (buf_len < 2))
1442 snprintf(file, sizeof(file), "/proc/%li/cmdline", pid);
1445 fd = open(file, O_RDONLY);
1447 /* ENOENT means the process exited while we were handling it.
1448 * Don't complain about this, it only fills the logs. */
1449 if (errno != ENOENT)
1450 WARNING("processes plugin: Failed to open `%s': %s.", file, STRERRNO);
1462 status = read(fd, (void *)buf_ptr, len);
/* An interrupted or would-block read is tested for separately from real
 * read errors, which are logged below. */
1466 if ((EAGAIN == errno) || (EINTR == errno))
1469 WARNING("processes plugin: Failed to read from `%s': %s.", file,
1490 /* cmdline not available; e.g. kernel thread, zombie */
1494 snprintf(buf, buf_len, "[%s]", name);
1498 assert(n <= buf_len);
1505 /* remove trailing whitespace */
/* The <ctype.h> classifiers are only defined for EOF and values
 * representable as unsigned char. Command lines may contain bytes >= 0x80,
 * which are negative where plain char is signed, so convert first. */
1506 while ((n > 0) && (isspace((unsigned char)buf[n]) || ('\0' == buf[n]))) {
1511 /* arguments are separated by '\0' in /proc/<pid>/cmdline */
1518 } /* char *ps_get_cmdline (...) */
/*
 * Linux variant: scans /proc/stat line by line for the two-field line whose
 * first field is "processes", parses the second field as a DERIVE value and
 * reports it through ps_submit_fork_rate().
 * NOTE(review): the return statements, the fclose() and the use of
 * `value_valid' are not part of this excerpt; confirm that the submit only
 * happens after a successful parse.
 */
1520 static int read_fork_rate(void) {
1524 bool value_valid = 0;
1526 proc_stat = fopen("/proc/stat", "r");
1527 if (proc_stat == NULL) {
1528 ERROR("processes plugin: fopen (/proc/stat) failed: %s", STRERRNO);
1532 while (fgets(buffer, sizeof(buffer), proc_stat) != NULL) {
/* Only lines of the exact form "<key> <value>" are candidates. */
1537 fields_num = strsplit(buffer, fields, STATIC_ARRAY_SIZE(fields));
1538 if (fields_num != 2)
1541 if (strcmp("processes", fields[0]) != 0)
1544 status = parse_value(fields[1], &value, DS_TYPE_DERIVE);
1555 ps_submit_fork_rate(value.derive);
1558 #endif /*KERNEL_LINUX */
/*
 * Solaris variant: reads /proc/<pid>/psinfo into `info' and copies its
 * pr_psargs field into `buffer' (at most `buffer_size' bytes, always
 * terminated by sstrncpy). `name' is unused on this platform.
 * A failed or short read is logged as an error.
 * NOTE(review): the return statements are not part of this excerpt.
 */
1561 static char *ps_get_cmdline(long pid,
1562 char *name __attribute__((unused)), /* {{{ */
1563 char *buffer, size_t buffer_size) {
1564 char path[PATH_MAX];
1568 snprintf(path, sizeof(path), "/proc/%li/psinfo", pid);
1570 status = read_file_contents(path, (void *)&info, sizeof(info));
1571 if ((status < 0) || (((size_t)status) != sizeof(info))) {
/* The read is validated against sizeof(info), so that is the "expected"
 * size to report. It is not the caller's output buffer size. */
1572 ERROR("processes plugin: Unexpected return value "
1573 "while reading \"%s\": "
1574 "Returned %zd but expected %" PRIsz ".",
1575 path, status, sizeof(info));
/* Force termination in case the kernel filled the whole field. */
1579 info.pr_psargs[sizeof(info.pr_psargs) - 1] = 0;
1580 sstrncpy(buffer, info.pr_psargs, buffer_size);
1583 } /* }}} char *ps_get_cmdline */
1586 * Reads process information on the Solaris OS. The information comes mainly
1588 * /proc/PID/status, /proc/PID/psinfo and /proc/PID/usage
1589 * The values for input and output chars are calculated "by hand"
1590 * Added a few "solaris" specific process states as well
/*
 * Solaris variant: fills `ps' from /proc/<pid>/status (pstatus_t),
 * /proc/<pid>/psinfo (psinfo_t) and /proc/<pid>/usage (prusage_t). The
 * pr_flags tests at the end classify the process state.
 * NOTE(review): the calloc() results and the read_file_contents() return
 * values are used unchecked below; an allocation failure would hand a NULL
 * buffer to read_file_contents() and then be dereferenced.
 * NOTE(review): the return statements, the releases of the three buffers and
 * the statements guarded by the pr_flags tests are not part of this excerpt.
 */
1592 static int ps_read_process(long pid, process_entry_t *ps, char *state) {
1594 char f_psinfo[64], f_usage[64];
1597 pstatus_t *myStatus;
1601 snprintf(filename, sizeof(filename), "/proc/%li/status", pid);
1602 snprintf(f_psinfo, sizeof(f_psinfo), "/proc/%li/psinfo", pid);
1603 snprintf(f_usage, sizeof(f_usage), "/proc/%li/usage", pid);
1605 buffer = calloc(1, sizeof(pstatus_t));
1606 read_file_contents(filename, buffer, sizeof(pstatus_t));
1607 myStatus = (pstatus_t *)buffer;
1609 buffer = calloc(1, sizeof(psinfo_t));
1610 read_file_contents(f_psinfo, buffer, sizeof(psinfo_t));
1611 myInfo = (psinfo_t *)buffer;
1613 buffer = calloc(1, sizeof(prusage_t));
1614 read_file_contents(f_usage, buffer, sizeof(prusage_t));
1615 myUsage = (prusage_t *)buffer;
1617 sstrncpy(ps->name, myInfo->pr_fname, sizeof(myInfo->pr_fname));
1618 ps->num_lwp = myStatus->pr_nlwp;
1619 if (myInfo->pr_wstat != 0) {
1630 ps->num_lwp = myInfo->pr_nlwp;
1634 * Convert system time and user time from nanoseconds to microseconds
1635 * for compatibility with the linux module
/* pr_stime / pr_utime are seconds + nanoseconds pairs. The whole-second part
 * has to be included: tv_nsec alone only ever covers the sub-second
 * remainder, so the counter would wrap every second of CPU time. The
 * multiplication is done in long long so it cannot overflow a 32-bit
 * time_t. */
1637 ps->cpu_system_counter = (1000000LL * myStatus->pr_stime.tv_sec) + (myStatus->pr_stime.tv_nsec / 1000);
1638 ps->cpu_user_counter = (1000000LL * myStatus->pr_utime.tv_sec) + (myStatus->pr_utime.tv_nsec / 1000);
1641 * Convert rssize from KB to bytes to be consistent w/ the linux module
1643 ps->vmem_rss = myInfo->pr_rssize * 1024;
1644 ps->vmem_size = myInfo->pr_size * 1024;
1645 ps->vmem_minflt_counter = myUsage->pr_minf;
1646 ps->vmem_majflt_counter = myUsage->pr_majf;
1649 * TODO: Data and code segment calculations for Solaris
1654 ps->stack_size = myStatus->pr_stksize;
1657 * TODO: File descriptor count for Solaris
1661 /* Number of memory mappings */
1665 * Calculating input/output chars
1666 * Formula used is total chars / total blocks => chars/block
1667 * then convert input/output blocks to chars
1669 ulong_t tot_chars = myUsage->pr_ioch;
1670 ulong_t tot_blocks = myUsage->pr_inblk + myUsage->pr_oublk;
/* Falls back to one char per block when no blocks were transferred, which
 * also avoids a division by zero. */
1671 ulong_t chars_per_block = 1;
1672 if (tot_blocks != 0)
1673 chars_per_block = tot_chars / tot_blocks;
1674 ps->io_rchar = myUsage->pr_inblk * chars_per_block;
1675 ps->io_wchar = myUsage->pr_oublk * chars_per_block;
/* Both syscall counters are set from the same pr_sysc value. */
1676 ps->io_syscr = myUsage->pr_sysc;
1677 ps->io_syscw = myUsage->pr_sysc;
1682 * TODO: context switch counters for Solaris
1684 ps->cswitch_vol = -1;
1685 ps->cswitch_invol = -1;
1688 * TODO: Find way of setting BLOCKED and PAGING status
1692 if (myStatus->pr_flags & PR_ASLEEP)
1694 else if (myStatus->pr_flags & PR_STOPPED)
1696 else if (myStatus->pr_flags & PR_DETACH)
1698 else if (myStatus->pr_flags & PR_DAEMON)
1700 else if (myStatus->pr_flags & PR_ISSYS)
1702 else if (myStatus->pr_flags & PR_ORPHAN)
1713 * Reads the number of threads created since the last reboot. On Solaris these
1714 * are retrieved from kstat (module cpu, name sys, class misc, stat nthreads).
1715 * The result is the sum for all the threads created on each cpu
/*
 * Solaris variant: walks the kstat chain of the externally defined handle
 * `kc', refreshes every entry with module "cpu", name "sys" and class "misc",
 * reads its "nthreads" value and finally reports `result' through
 * ps_submit_fork_rate().
 * NOTE(review): the accumulation of `tmp' into `result', any check of `kc'
 * against NULL and the return statements are not part of this excerpt. The
 * kstat_read() return value is not checked in the visible code.
 */
1717 static int read_fork_rate(void) {
1718 extern kstat_ctl_t *kc;
1719 derive_t result = 0;
1724 for (kstat_t *ksp_chain = kc->kc_chain; ksp_chain != NULL;
1725 ksp_chain = ksp_chain->ks_next) {
1726 if ((strcmp(ksp_chain->ks_module, "cpu") == 0) &&
1727 (strcmp(ksp_chain->ks_name, "sys") == 0) &&
1728 (strcmp(ksp_chain->ks_class, "misc") == 0)) {
1731 kstat_read(kc, ksp_chain, NULL);
1733 tmp = get_kstat_value(ksp_chain, "nthreads");
1739 ps_submit_fork_rate(result);
1742 #endif /* KERNEL_SOLARIS */
1744 #if HAVE_THREAD_INFO
/*
 * Resolves the Mach task `t' to its pid (stored in `*pid') via
 * pid_for_task(), queries the matching kinfo_proc through sysctl() with a
 * KERN_PROC_PID mib, and copies kp.kp_proc.p_comm into `name'.
 * At most min(name_max_len, MAXCOMLEN + 1) - 1 characters are copied and the
 * result is always NUL-terminated.
 * The caller in ps_read() treats a return value of 0 as success.
 * NOTE(review): the return statements and the remaining mib[] assignments
 * are not part of this excerpt. `name_max_len' is assumed to be >= 1;
 * a value of 0 would make `name_max_len - 1' wrap around.
 */
1745 static int mach_get_task_name(task_t t, int *pid, char *name,
1746 size_t name_max_len) {
1749 struct kinfo_proc kp;
1754 mib[2] = KERN_PROC_PID;
1756 if (pid_for_task(t, pid) != KERN_SUCCESS)
1760 kp_size = sizeof(kp);
1761 if (sysctl(mib, 4, &kp, &kp_size, NULL, 0) != 0)
/* p_comm cannot hold more than MAXCOMLEN characters plus the terminator, so
 * never copy more than that regardless of the caller's buffer size. */
1764 if (name_max_len > (MAXCOMLEN + 1))
1765 name_max_len = MAXCOMLEN + 1;
1767 strncpy(name, kp.kp_proc.p_comm, name_max_len - 1);
1768 name[name_max_len - 1] = '\0';
1770 DEBUG("pid = %i; name = %s;", *pid, name);
1772 /* We don't do the special handling for `p_comm == "LaunchCFMApp"' as
1773 * `top' does it, because it is a lot of work and only used when
1774 * debugging. -octo */
1778 #endif /* HAVE_THREAD_INFO */
1779 /* end of additional functions for KERNEL_LINUX/HAVE_THREAD_INFO */
1781 /* do actual readings from kernel */
/*
 * Read callback of the plugin (registered in module_register()).
 * There is one implementation per platform, selected by the preprocessor:
 * Mach (HAVE_THREAD_INFO), Linux /proc, FreeBSD libkvm, OpenBSD libkvm,
 * procinfo.h (getprocs64) and Solaris /proc.
 * Every branch follows the same outline: walk the system's process list,
 * fill one process_entry_t per process and pass it to ps_list_add(), report
 * the per-state totals through ps_submit_state(), and finally call
 * ps_submit_proc_list() for every entry reachable from list_head_g.
 * NOTE(review): the return statements, the state-counter updates and the
 * function's closing lines are not part of this excerpt.
 */
1782 static int ps_read(void) {
1783 #if HAVE_THREAD_INFO
1784 kern_return_t status;
1786 processor_set_t port_pset_priv;
1788 task_array_t task_list;
1789 mach_msg_type_number_t task_list_len;
1792 char task_name[MAXCOMLEN + 1];
1794 thread_act_array_t thread_list;
1795 mach_msg_type_number_t thread_list_len;
1796 thread_basic_info_data_t thread_data;
1797 mach_msg_type_number_t thread_data_len;
1806 process_entry_t pse;
1811 * The Mach-concept is a little different from the traditional UNIX
1812 * concept: All the work is done in threads. Threads are contained in
1813 * `tasks'. Therefore, `task status' doesn't make much sense, since
1814 * it's actually a `thread status'.
1815 * Tasks are assigned to sets of processors, so that's where you go to
1818 for (mach_msg_type_number_t pset = 0; pset < pset_list_len; pset++) {
1819 if ((status = host_processor_set_priv(port_host_self, pset_list[pset],
1820 &port_pset_priv)) != KERN_SUCCESS) {
1821 ERROR("host_processor_set_priv failed: %s\n", mach_error_string(status));
1825 if ((status = processor_set_tasks(port_pset_priv, &task_list,
1826 &task_list_len)) != KERN_SUCCESS) {
1827 ERROR("processor_set_tasks failed: %s\n", mach_error_string(status));
1828 mach_port_deallocate(port_task_self, port_pset_priv);
1832 for (mach_msg_type_number_t task = 0; task < task_list_len; task++) {
/* task_name holds MAXCOMLEN + 1 bytes although PROCSTAT_NAME_LEN is passed
 * as its size; mach_get_task_name() clamps the length to MAXCOMLEN + 1
 * before copying. */
1834 if (mach_get_task_name(task_list[task], &task_pid, task_name,
1835 PROCSTAT_NAME_LEN) == 0) {
1836 /* search for at least one match */
1837 for (ps = list_head_g; ps != NULL; ps = ps->next)
1838 /* FIXME: cmdline should be here instead of NULL */
1839 if (ps_list_match(task_name, NULL, ps) == 1)
1843 /* Collect more detailed statistics for this process */
1845 task_basic_info_data_t task_basic_info;
1846 mach_msg_type_number_t task_basic_info_len;
1847 task_events_info_data_t task_events_info;
1848 mach_msg_type_number_t task_events_info_len;
1849 task_absolutetime_info_data_t task_absolutetime_info;
1850 mach_msg_type_number_t task_absolutetime_info_len;
1852 memset(&pse, '\0', sizeof(pse));
/* NOTE(review): the three task_info() failure paths below log and `continue'
 * without the mach_port_deallocate() of task_list[task] that the
 * task_threads() failure path performs; confirm whether the task port is
 * leaked on these paths. */
1855 task_basic_info_len = TASK_BASIC_INFO_COUNT;
1856 status = task_info(task_list[task], TASK_BASIC_INFO,
1857 (task_info_t)&task_basic_info, &task_basic_info_len);
1858 if (status != KERN_SUCCESS) {
1859 ERROR("task_info failed: %s", mach_error_string(status));
1860 continue; /* with next thread_list */
1863 task_events_info_len = TASK_EVENTS_INFO_COUNT;
1865 task_info(task_list[task], TASK_EVENTS_INFO,
1866 (task_info_t)&task_events_info, &task_events_info_len);
1867 if (status != KERN_SUCCESS) {
1868 ERROR("task_info failed: %s", mach_error_string(status));
1869 continue; /* with next thread_list */
1872 task_absolutetime_info_len = TASK_ABSOLUTETIME_INFO_COUNT;
1873 status = task_info(task_list[task], TASK_ABSOLUTETIME_INFO,
1874 (task_info_t)&task_absolutetime_info,
1875 &task_absolutetime_info_len);
1876 if (status != KERN_SUCCESS) {
1877 ERROR("task_info failed: %s", mach_error_string(status));
1878 continue; /* with next thread_list */
1882 pse.vmem_size = task_basic_info.virtual_size;
1883 pse.vmem_rss = task_basic_info.resident_size;
1884 /* Does not seem to be easily exposed */
1895 /* File descriptor count not implemented */
1898 /* Number of memory mappings */
1901 pse.vmem_minflt_counter = task_events_info.cow_faults;
1902 pse.vmem_majflt_counter = task_events_info.faults;
1904 pse.cpu_user_counter = task_absolutetime_info.total_user;
1905 pse.cpu_system_counter = task_absolutetime_info.total_system;
1907 /* context switch counters not implemented */
1908 pse.cswitch_vol = -1;
1909 pse.cswitch_invol = -1;
1912 status = task_threads(task_list[task], &thread_list, &thread_list_len);
1913 if (status != KERN_SUCCESS) {
1914 /* Apple's `top' treats this case a zombie. It
1915 * makes sense to some extent: A `zombie'
1916 * thread is nonsense, since the task/process
1919 DEBUG("task_threads failed: %s", mach_error_string(status));
1920 if (task_list[task] != port_task_self)
1921 mach_port_deallocate(port_task_self, task_list[task]);
1922 continue; /* with next task_list */
1925 for (mach_msg_type_number_t thread = 0; thread < thread_list_len;
1927 thread_data_len = THREAD_BASIC_INFO_COUNT;
1928 status = thread_info(thread_list[thread], THREAD_BASIC_INFO,
1929 (thread_info_t)&thread_data, &thread_data_len);
1930 if (status != KERN_SUCCESS) {
1931 ERROR("thread_info failed: %s", mach_error_string(status));
1932 if (task_list[task] != port_task_self)
1933 mach_port_deallocate(port_task_self, thread_list[thread]);
1934 continue; /* with next thread_list */
1940 switch (thread_data.run_state) {
1941 case TH_STATE_RUNNING:
1944 case TH_STATE_STOPPED:
1945 /* What exactly is `halted'? */
1946 case TH_STATE_HALTED:
1949 case TH_STATE_WAITING:
1952 case TH_STATE_UNINTERRUPTIBLE:
1955 /* There is no `zombie' case here,
1956 * since there are no zombie-threads.
1957 * There's only zombie tasks, which are
1960 WARNING("Unknown thread status: %i", thread_data.run_state);
1962 } /* switch (thread_data.run_state) */
1964 if (task_list[task] != port_task_self) {
1965 status = mach_port_deallocate(port_task_self, thread_list[thread]);
1966 if (status != KERN_SUCCESS)
1967 ERROR("mach_port_deallocate failed: %s", mach_error_string(status));
1969 } /* for (thread_list) */
1971 if ((status = vm_deallocate(port_task_self, (vm_address_t)thread_list,
1972 thread_list_len * sizeof(thread_act_t))) !=
1974 ERROR("vm_deallocate failed: %s", mach_error_string(status));
1977 thread_list_len = 0;
1979 /* Only deallocate the task port, if it isn't our own.
1980 * Don't know what would happen in that case, but this
1981 * is what Apple's top does.. ;) */
1982 if (task_list[task] != port_task_self) {
1983 status = mach_port_deallocate(port_task_self, task_list[task]);
1984 if (status != KERN_SUCCESS)
1985 ERROR("mach_port_deallocate failed: %s", mach_error_string(status));
1989 /* FIXME: cmdline should be here instead of NULL */
1990 ps_list_add(task_name, NULL, &pse);
1991 } /* for (task_list) */
1993 if ((status = vm_deallocate(port_task_self, (vm_address_t)task_list,
1994 task_list_len * sizeof(task_t))) !=
1996 ERROR("vm_deallocate failed: %s", mach_error_string(status));
2001 if ((status = mach_port_deallocate(port_task_self, port_pset_priv)) !=
2003 ERROR("mach_port_deallocate failed: %s", mach_error_string(status));
2005 } /* for (pset_list) */
2007 ps_submit_state("running", running);
2008 ps_submit_state("sleeping", sleeping);
2009 ps_submit_state("zombies", zombies);
2010 ps_submit_state("stopped", stopped);
2011 ps_submit_state("blocked", blocked);
2013 for (ps = list_head_g; ps != NULL; ps = ps->next)
2014 ps_submit_proc_list(ps);
2015 /* #endif HAVE_THREAD_INFO */
/* Linux branch: one numeric directory entry under /proc per process; the
 * per-process work is done by ps_read_process() and ps_get_cmdline(). */
2029 char cmdline[CMDLINE_BUFFER_SIZE];
2032 process_entry_t pse;
2035 running = sleeping = zombies = stopped = paging = blocked = 0;
2038 if ((proc = opendir("/proc")) == NULL) {
2039 ERROR("Cannot open `/proc': %s", STRERRNO);
2043 while ((ent = readdir(proc)) != NULL) {
2044 if (!isdigit(ent->d_name[0]))
2047 if ((pid = atol(ent->d_name)) < 1)
2050 memset(&pse, 0, sizeof(pse));
2053 status = ps_read_process(pid, &pse, &state);
2055 DEBUG("ps_read_process failed: %i", status);
2080 ps_list_add(pse.name,
2081 ps_get_cmdline(pid, pse.name, cmdline, sizeof(cmdline)), &pse);
2086 ps_submit_state("running", running);
2087 ps_submit_state("sleeping", sleeping);
2088 ps_submit_state("zombies", zombies);
2089 ps_submit_state("stopped", stopped);
2090 ps_submit_state("paging", paging);
2091 ps_submit_state("blocked", blocked);
2093 for (procstat_t *ps_ptr = list_head_g; ps_ptr != NULL; ps_ptr = ps_ptr->next)
2094 ps_submit_proc_list(ps_ptr);
2097 /* #endif KERNEL_LINUX */
2099 #elif HAVE_LIBKVM_GETPROCS && HAVE_STRUCT_KINFO_PROC_FREEBSD
/* FreeBSD branch: the process table comes from kvm_getprocs(); memory sizes
 * given in pages are scaled by `pagesize'. */
2109 char errbuf[_POSIX2_LINE_MAX];
2110 struct kinfo_proc *procs; /* array of processes */
2111 struct kinfo_proc *proc_ptr = NULL;
2112 int count; /* returns number of processes */
2114 process_entry_t pse;
2118 /* Open the kvm interface, get a descriptor */
2119 kd = kvm_openfiles(NULL, "/dev/null", NULL, 0, errbuf);
2121 ERROR("processes plugin: Cannot open kvm interface: %s", errbuf);
2125 /* Get the list of processes. */
2126 procs = kvm_getprocs(kd, KERN_PROC_ALL, 0, &count);
2127 if (procs == NULL) {
2128 ERROR("processes plugin: Cannot get kvm processes list: %s",
2134 /* Iterate through the processes in kinfo_proc */
2135 for (int i = 0; i < count; i++) {
2136 /* Create only one process list entry per _process_, i.e.
2137 * filter out threads (duplicate PID entries). */
2138 if ((proc_ptr == NULL) || (proc_ptr->ki_pid != procs[i].ki_pid)) {
2139 char cmdline[CMDLINE_BUFFER_SIZE] = "";
2140 bool have_cmdline = 0;
2142 proc_ptr = &(procs[i]);
2143 /* Don't probe system processes and processes without arguments */
2144 if (((procs[i].ki_flag & P_SYSTEM) == 0) && (procs[i].ki_args != NULL)) {
2149 /* retrieve the arguments */
2150 argv = kvm_getargv(kd, proc_ptr, /* nchr = */ 0);
2152 if ((argv != NULL) && (argv[0] != NULL)) {
2153 while (argv[argc] != NULL)
2156 status = strjoin(cmdline, sizeof(cmdline), argv, argc, " ");
2158 WARNING("processes plugin: Command line did not fit into buffer.");
2162 } /* if (process has argument list) */
2164 memset(&pse, 0, sizeof(pse));
2165 pse.id = procs[i].ki_pid;
2168 pse.num_lwp = procs[i].ki_numthreads;
2170 pse.vmem_size = procs[i].ki_size;
2171 pse.vmem_rss = procs[i].ki_rssize * pagesize;
2172 pse.vmem_data = procs[i].ki_dsize * pagesize;
2173 pse.vmem_code = procs[i].ki_tsize * pagesize;
2174 pse.stack_size = procs[i].ki_ssize * pagesize;
2175 pse.vmem_minflt_counter = procs[i].ki_rusage.ru_minflt;
2176 pse.vmem_majflt_counter = procs[i].ki_rusage.ru_majflt;
2178 pse.cpu_user_counter = 0;
2179 pse.cpu_system_counter = 0;
2181 * The u-area might be swapped out, and we can't get
2182 * at it because we have a crashdump and no swap.
2183 * If it's here fill in these fields, otherwise, just
2186 if (procs[i].ki_flag & P_INMEM) {
2187 pse.cpu_user_counter = procs[i].ki_rusage.ru_utime.tv_usec +
2188 (1000000lu * procs[i].ki_rusage.ru_utime.tv_sec);
2189 pse.cpu_system_counter =
2190 procs[i].ki_rusage.ru_stime.tv_usec +
2191 (1000000lu * procs[i].ki_rusage.ru_stime.tv_sec);
2202 /* file descriptor count not implemented */
2205 /* Number of memory mappings */
2208 /* context switch counters not implemented */
2209 pse.cswitch_vol = -1;
2210 pse.cswitch_invol = -1;
2212 ps_list_add(procs[i].ki_comm, have_cmdline ? cmdline : NULL, &pse);
2214 switch (procs[i].ki_stat) {
2237 } /* if ((proc_ptr == NULL) || (proc_ptr->ki_pid != procs[i].ki_pid)) */
2242 ps_submit_state("running", running);
2243 ps_submit_state("sleeping", sleeping);
2244 ps_submit_state("zombies", zombies);
2245 ps_submit_state("stopped", stopped);
2246 ps_submit_state("blocked", blocked);
2247 ps_submit_state("idle", idle);
2248 ps_submit_state("wait", wait);
2250 for (procstat_t *ps_ptr = list_head_g; ps_ptr != NULL; ps_ptr = ps_ptr->next)
2251 ps_submit_proc_list(ps_ptr);
2252 /* #endif HAVE_LIBKVM_GETPROCS && HAVE_STRUCT_KINFO_PROC_FREEBSD */
2254 #elif HAVE_LIBKVM_GETPROCS && HAVE_STRUCT_KINFO_PROC_OPENBSD
/* OpenBSD branch: same outline as the FreeBSD branch with the OpenBSD
 * kinfo_proc field names; vmem_size is the sum of the stack, code and data
 * sizes. */
2265 struct kinfo_proc *procs; /* array of processes */
2266 struct kinfo_proc *proc_ptr = NULL;
2267 int count; /* returns number of processes */
2269 process_entry_t pse;
2273 /* Open the kvm interface, get a descriptor */
2274 kd = kvm_openfiles(NULL, NULL, NULL, KVM_NO_FILES, errbuf);
2276 ERROR("processes plugin: Cannot open kvm interface: %s", errbuf);
2280 /* Get the list of processes. */
2281 procs = kvm_getprocs(kd, KERN_PROC_ALL, 0, sizeof(struct kinfo_proc), &count);
2282 if (procs == NULL) {
2283 ERROR("processes plugin: Cannot get kvm processes list: %s",
2289 /* Iterate through the processes in kinfo_proc */
2290 for (int i = 0; i < count; i++) {
2291 /* Create only one process list entry per _process_, i.e.
2292 * filter out threads (duplicate PID entries). */
2293 if ((proc_ptr == NULL) || (proc_ptr->p_pid != procs[i].p_pid)) {
2294 char cmdline[CMDLINE_BUFFER_SIZE] = "";
2295 bool have_cmdline = 0;
2297 proc_ptr = &(procs[i]);
2298 /* Don't probe zombie processes */
2299 if (!P_ZOMBIE(proc_ptr)) {
2304 /* retrieve the arguments */
2305 argv = kvm_getargv(kd, proc_ptr, /* nchr = */ 0);
2307 if ((argv != NULL) && (argv[0] != NULL)) {
2308 while (argv[argc] != NULL)
2311 status = strjoin(cmdline, sizeof(cmdline), argv, argc, " ");
2313 WARNING("processes plugin: Command line did not fit into buffer.");
2317 } /* if (process has argument list) */
2319 memset(&pse, 0, sizeof(pse));
2320 pse.id = procs[i].p_pid;
2323 pse.num_lwp = 1; /* XXX: accumulate p_tid values for a single p_pid ? */
2325 pse.vmem_rss = procs[i].p_vm_rssize * pagesize;
2326 pse.vmem_data = procs[i].p_vm_dsize * pagesize;
2327 pse.vmem_code = procs[i].p_vm_tsize * pagesize;
2328 pse.stack_size = procs[i].p_vm_ssize * pagesize;
2329 pse.vmem_size = pse.stack_size + pse.vmem_code + pse.vmem_data;
2330 pse.vmem_minflt_counter = procs[i].p_uru_minflt;
2331 pse.vmem_majflt_counter = procs[i].p_uru_majflt;
2333 pse.cpu_user_counter =
2334 procs[i].p_uutime_usec + (1000000lu * procs[i].p_uutime_sec);
2335 pse.cpu_system_counter =
2336 procs[i].p_ustime_usec + (1000000lu * procs[i].p_ustime_sec);
2346 /* file descriptor count not implemented */
2349 /* Number of memory mappings */
2352 /* context switch counters not implemented */
2353 pse.cswitch_vol = -1;
2354 pse.cswitch_invol = -1;
2356 ps_list_add(procs[i].p_comm, have_cmdline ? cmdline : NULL, &pse);
2358 switch (procs[i].p_stat) {
2381 } /* if ((proc_ptr == NULL) || (proc_ptr->p_pid != procs[i].p_pid)) */
2386 ps_submit_state("running", running);
2387 ps_submit_state("sleeping", sleeping);
2388 ps_submit_state("zombies", zombies);
2389 ps_submit_state("stopped", stopped);
2390 ps_submit_state("onproc", onproc);
2391 ps_submit_state("idle", idle);
2392 ps_submit_state("dead", dead);
2394 for (procstat_t *ps_ptr = list_head_g; ps_ptr != NULL; ps_ptr = ps_ptr->next)
2395 ps_submit_proc_list(ps_ptr);
2396 /* #endif HAVE_LIBKVM_GETPROCS && HAVE_STRUCT_KINFO_PROC_OPENBSD */
2398 #elif HAVE_PROCINFO_H
/* procinfo.h branch: processes are fetched in batches of up to MAXPROCENTRY
 * with getprocs64(), and the threads of each process in batches of up to
 * MAXTHRDENTRY with getthrds64(). */
2410 process_entry_t pse;
2413 while ((nprocs = getprocs64(procentry, sizeof(struct procentry64),
2414 /* fdsinfo = */ NULL, sizeof(struct fdsinfo64),
2415 &pindex, MAXPROCENTRY)) > 0) {
2416 for (int i = 0; i < nprocs; i++) {
2419 char arglist[MAXARGLN + 1];
2423 if (procentry[i].pi_state == SNONE)
2425 /* if (procentry[i].pi_state == SZOMB) FIXME */
2427 cmdline = procentry[i].pi_comm;
2428 cargs = procentry[i].pi_comm;
2429 if (procentry[i].pi_flags & SKPROC) {
2430 if (procentry[i].pi_pid == 0)
2431 cmdline = "swapper";
2434 if (getargs(&procentry[i], sizeof(struct procentry64), arglist,
2439 while (++n < MAXARGLN) {
2440 if (arglist[n] == '\0') {
2441 if (arglist[n + 1] == '\0')
2450 memset(&pse, 0, sizeof(pse));
2452 pse.id = procentry[i].pi_pid;
2453 pse.num_lwp = procentry[i].pi_thcount;
2457 while ((nthreads = getthrds64(procentry[i].pi_pid, thrdentry,
2458 sizeof(struct thrdentry64), &thindex,
2459 MAXTHRDENTRY)) > 0) {
2462 for (j = 0; j < nthreads; j++) {
2463 switch (thrdentry[j].ti_state) {
2464 /* case TSNONE: break; */
2467 break; /* FIXME is really blocked */
2485 if (nthreads < MAXTHRDENTRY)
2489 /* tv_usec is nanosec ??? */
2490 pse.cpu_user_counter = procentry[i].pi_ru.ru_utime.tv_sec * 1000000 +
2491 procentry[i].pi_ru.ru_utime.tv_usec / 1000;
2493 /* tv_usec is nanosec ??? */
2494 pse.cpu_system_counter = procentry[i].pi_ru.ru_stime.tv_sec * 1000000 +
2495 procentry[i].pi_ru.ru_stime.tv_usec / 1000;
2497 pse.vmem_minflt_counter = procentry[i].pi_minflt;
2498 pse.vmem_majflt_counter = procentry[i].pi_majflt;
2500 pse.vmem_size = procentry[i].pi_tsize + procentry[i].pi_dvm * pagesize;
2501 pse.vmem_rss = (procentry[i].pi_drss + procentry[i].pi_trss) * pagesize;
2502 /* Not supported/implemented */
2517 pse.cswitch_vol = -1;
2518 pse.cswitch_invol = -1;
2520 ps_list_add(cmdline, cargs, &pse);
2521 } /* for (i = 0 .. nprocs) */
2523 if (nprocs < MAXPROCENTRY)
2525 } /* while (getprocs64() > 0) */
2526 ps_submit_state("running", running);
2527 ps_submit_state("sleeping", sleeping);
2528 ps_submit_state("zombies", zombies);
2529 ps_submit_state("stopped", stopped);
2530 ps_submit_state("paging", paging);
2531 ps_submit_state("blocked", blocked);
2533 for (procstat_t *ps = list_head_g; ps != NULL; ps = ps->next)
2534 ps_submit_proc_list(ps);
2535 /* #endif HAVE_PROCINFO_H */
2537 #elif KERNEL_SOLARIS
/* Solaris branch: one directory entry under /proc per process; entries whose
 * name does not parse completely as a number are tested for via `endptr'. */
2539 * The Solaris section adds a few more process states and removes some
2540 * process states compared to linux. Most notably there is no "PAGING"
2541 * and "BLOCKED" state for a process. The rest is similar to the linux
2559 char cmdline[PRARGSZ];
2563 proc = opendir("/proc");
2567 while ((ent = readdir(proc)) != NULL) {
2569 process_entry_t pse;
2572 if (!isdigit((int)ent->d_name[0]))
2575 pid = strtol(ent->d_name, &endptr, 10);
2576 if (*endptr != 0) /* value didn't completely parse as a number */
2579 memset(&pse, 0, sizeof(pse));
2582 status = ps_read_process(pid, &pse, &state);
2584 DEBUG("ps_read_process failed: %i", status);
2615 ps_list_add(pse.name,
2616 ps_get_cmdline(pid, pse.name, cmdline, sizeof(cmdline)), &pse);
2617 } /* while(readdir) */
2620 ps_submit_state("running", running);
2621 ps_submit_state("sleeping", sleeping);
2622 ps_submit_state("zombies", zombies);
2623 ps_submit_state("stopped", stopped);
2624 ps_submit_state("detached", detached);
2625 ps_submit_state("daemon", daemon);
2626 ps_submit_state("system", system);
2627 ps_submit_state("orphan", orphan);
2629 for (procstat_t *ps_ptr = list_head_g; ps_ptr != NULL; ps_ptr = ps_ptr->next)
2630 ps_submit_proc_list(ps_ptr);
2633 #endif /* KERNEL_SOLARIS */
/*
 * Plugin entry point: registers the "processes" plugin's complex-config
 * callback (ps_config), init callback (ps_init) and read callback (ps_read).
 */
2640 void module_register(void) {
2641 plugin_register_complex_config("processes", ps_config);
2642 plugin_register_init("processes", ps_init);
2643 plugin_register_read("processes", ps_read);
2644 } /* void module_register */