2 * collectd - src/processes.c
3 * Copyright (C) 2005 Lyonel Vincent
4 * Copyright (C) 2006-2007 Florian Forster (Mach code)
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU General Public License as published by the
8 * Free Software Foundation; either version 2 of the License, or (at your
9 * option) any later version.
11 * This program is distributed in the hope that it will be useful, but
12 * WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * General Public License for more details.
16 * You should have received a copy of the GNU General Public License along
17 * with this program; if not, write to the Free Software Foundation, Inc.,
18 * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
21 * Lyonel Vincent <lyonel at ezix.org>
22 * Florian octo Forster <octo at verplant.org>
28 #include "configfile.h"
30 /* Include header files for the mach system, if they exist.. */
32 # if HAVE_MACH_MACH_INIT_H
33 # include <mach/mach_init.h>
35 # if HAVE_MACH_HOST_PRIV_H
36 # include <mach/host_priv.h>
38 # if HAVE_MACH_MACH_ERROR_H
39 # include <mach/mach_error.h>
41 # if HAVE_MACH_MACH_HOST_H
42 # include <mach/mach_host.h>
44 # if HAVE_MACH_MACH_PORT_H
45 # include <mach/mach_port.h>
47 # if HAVE_MACH_MACH_TYPES_H
48 # include <mach/mach_types.h>
50 # if HAVE_MACH_MESSAGE_H
51 # include <mach/message.h>
53 # if HAVE_MACH_PROCESSOR_SET_H
54 # include <mach/processor_set.h>
57 # include <mach/task.h>
59 # if HAVE_MACH_THREAD_ACT_H
60 # include <mach/thread_act.h>
62 # if HAVE_MACH_VM_REGION_H
63 # include <mach/vm_region.h>
65 # if HAVE_MACH_VM_MAP_H
66 # include <mach/vm_map.h>
68 # if HAVE_MACH_VM_PROT_H
69 # include <mach/vm_prot.h>
71 # if HAVE_SYS_SYSCTL_H
72 # include <sys/sysctl.h>
74 /* #endif HAVE_THREAD_INFO */
77 # if HAVE_LINUX_CONFIG_H
78 # include <linux/config.h>
81 # define CONFIG_HZ 100
83 /* #endif KERNEL_LINUX */
86 # error "No applicable input method."
/* Table of configuration keys understood by this plugin and the number of
 * entries in it. Both are handed to plugin_register_config() in
 * module_register(); ps_config() handles the key "Process". */
91 static const char *config_keys[] =
96 static int config_keys_num = 1;
/* One element of a procstat's `instances' list. ps_list_add() matches
 * elements by an `id' member and refreshes the members below on every call. */
98 typedef struct procstat_entry_s
/* Values copied verbatim from the most recent update (see ps_list_add()). */
103 unsigned long num_proc;
104 unsigned long num_lwp;
105 unsigned long vmem_rss;
/* Page faults: the plain members hold the increment computed by the last
 * ps_list_add() call, the *_counter members the running value. */
107 unsigned long vmem_minflt;
108 unsigned long vmem_majflt;
109 unsigned long vmem_minflt_counter;
110 unsigned long vmem_majflt_counter;
/* CPU time, using the same increment / running-value split as above. */
112 unsigned long cpu_user;
113 unsigned long cpu_system;
114 unsigned long cpu_user_counter;
115 unsigned long cpu_system_counter;
/* Next element of the singly linked instance list. */
117 struct procstat_entry_s *next;
/* Size in bytes of the `name' buffer of a procstat. */
120 #define PROCSTAT_NAME_LEN 256
/* Aggregated statistics for one process name. Elements are chained from
 * list_head_g; ps_list_add() adds per-instance values into the totals below
 * and ps_submit_proc_list() dispatches them. */
121 typedef struct procstat
/* Name compared with strcmp() in ps_list_register() and ps_list_search(). */
123 char name[PROCSTAT_NAME_LEN];
/* Totals dispatched as gauges ("ps_count" and "ps_rss"). */
125 unsigned long num_proc;
126 unsigned long num_lwp;
127 unsigned long vmem_rss;
/* Totals dispatched as counters ("ps_pagefaults"). */
129 unsigned long vmem_minflt_counter;
130 unsigned long vmem_majflt_counter;
/* Totals dispatched as counters ("ps_cputime"). */
132 unsigned long cpu_user_counter;
133 unsigned long cpu_system_counter;
/* Next procstat in the global list, and the head of this procstat's list of
 * per-instance entries. */
135 struct procstat *next;
136 struct procstat_entry_s *instances;
/* Head of the singly linked list of procstat elements; walked by
 * ps_list_register(), ps_list_search(), ps_list_reset() and ps_read(). */
139 static procstat_t *list_head_g = NULL;
/* Mach ports of the host and of this task; assigned in ps_init() from
 * mach_host_self() and mach_task_self(). */
142 static mach_port_t port_host_self;
143 static mach_port_t port_task_self;
/* Processor set list and its length. ps_init() passes &pset_list_len to
 * host_processor_sets() and releases an earlier pset_list with
 * vm_deallocate(); ps_read() loops over pset_list_len sets. */
145 static processor_set_name_array_t pset_list;
146 static mach_msg_type_number_t pset_list_len;
147 /* #endif HAVE_THREAD_INFO */
/* Result of sysconf(_SC_PAGESIZE), stored by ps_init(); ps_read_process()
 * multiplies the RSS field of /proc/<pid>/stat by it. */
150 static long pagesize_g;
151 #endif /* KERNEL_LINUX */
/* Creates a procstat for the process name `name'.
 *
 * A procstat_t is allocated with malloc(), zeroed, and `name' is copied into
 * its name buffer. The global list is then walked, comparing each existing
 * name with `name' and checking for the last element.
 *
 * NOTE(review): what happens on a name match or at the tail is not visible
 * in this view; presumably duplicates are ignored and the new element is
 * appended -- confirm. If the duplicate path returns without free(new), the
 * allocation leaks.
 * NOTE(review): strncpy() is given the full buffer size, so new->name is left
 * without a terminating NUL when strlen(name) >= PROCSTAT_NAME_LEN; the
 * strcmp() calls on that buffer would then read past its end. */
153 static void ps_list_register (const char *name)
158 if ((new = (procstat_t *) malloc (sizeof (procstat_t))) == NULL)
160 memset (new, 0, sizeof (procstat_t));
161 strncpy (new->name, name, PROCSTAT_NAME_LEN);
163 for (ptr = list_head_g; ptr != NULL; ptr = ptr->next)
165 if (strcmp (ptr->name, name) == 0)
167 if (ptr->next == NULL)
/* Looks for a procstat whose name equals `name'.
 *
 * Walks the list starting at list_head_g and compares each element's name
 * with strcmp(). The return statements are not visible in this view;
 * callers (ps_list_add(), ps_read()) treat a NULL result as "not found". */
177 static procstat_t *ps_list_search (const char *name)
181 for (ptr = list_head_g; ptr != NULL; ptr = ptr->next)
182 if (strcmp (ptr->name, name) == 0)
/* Merges the measurements in `entry' into the procstat named `name'.
 *
 * name:  process name, looked up with ps_list_search().
 * entry: fresh values for one instance; entry->id selects the stored
 *        instance entry to update.
 *
 * The stored entry receives the new gauge values and updated counters, and
 * the procstat totals are increased by the entry's gauge values and by the
 * counter increments computed here. */
188 static void ps_list_add (const char *name, procstat_entry_t *entry)
191 procstat_entry_t *pse;
/* Handling of an unregistered name is not visible in this view. */
196 if ((ps = ps_list_search (name)) == NULL)
/* Find the entry with a matching id, or stop at the last list element. */
199 for (pse = ps->instances; pse != NULL; pse = pse->next)
200 if ((pse->id == entry->id) || (pse->next == NULL))
/* No entry with this id exists yet: allocate and zero a new one. */
203 if ((pse == NULL) || (pse->id != entry->id))
205 procstat_entry_t *new;
207 new = (procstat_entry_t *) malloc (sizeof (procstat_entry_t));
210 memset (new, 0, sizeof (procstat_entry_t));
/* Gauge-like values replace the stored ones and are added to the totals. */
222 pse->num_proc = entry->num_proc;
223 pse->num_lwp = entry->num_lwp;
224 pse->vmem_rss = entry->vmem_rss;
226 ps->num_proc += pse->num_proc;
227 ps->num_lwp += pse->num_lwp;
228 ps->vmem_rss += pse->vmem_rss;
/* Page faults. When both counters in `entry' are zero, entry->vmem_minflt
 * and entry->vmem_majflt are taken as increments and added to the stored
 * counters. */
230 if ((entry->vmem_minflt_counter == 0)
231 && (entry->vmem_majflt_counter == 0))
233 pse->vmem_minflt_counter += entry->vmem_minflt;
234 pse->vmem_minflt = entry->vmem_minflt;
236 pse->vmem_majflt_counter += entry->vmem_majflt;
237 pse->vmem_majflt = entry->vmem_majflt;
/* Otherwise the counters in `entry' are absolute values and the increment is
 * the difference to the stored counter. A new value smaller than the stored
 * one is treated as a wrap-around.
 * NOTE(review): new + (ULONG_MAX - old) is one less than the modular
 * difference new - old; confirm whether the off-by-one is intended. */
241 if (entry->vmem_minflt_counter < pse->vmem_minflt_counter)
243 pse->vmem_minflt = entry->vmem_minflt_counter
244 + (ULONG_MAX - pse->vmem_minflt_counter);
248 pse->vmem_minflt = entry->vmem_minflt_counter - pse->vmem_minflt_counter;
250 pse->vmem_minflt_counter = entry->vmem_minflt_counter;
252 if (entry->vmem_majflt_counter < pse->vmem_majflt_counter)
254 pse->vmem_majflt = entry->vmem_majflt_counter
255 + (ULONG_MAX - pse->vmem_majflt_counter);
259 pse->vmem_majflt = entry->vmem_majflt_counter - pse->vmem_majflt_counter;
261 pse->vmem_majflt_counter = entry->vmem_majflt_counter;
/* The totals grow by the increments, not by the absolute counter values. */
264 ps->vmem_minflt_counter += pse->vmem_minflt;
265 ps->vmem_majflt_counter += pse->vmem_majflt;
/* CPU time: same two modes as for the page faults above. */
267 if ((entry->cpu_user_counter == 0)
268 && (entry->cpu_system_counter == 0))
270 pse->cpu_user_counter += entry->cpu_user;
271 pse->cpu_user = entry->cpu_user;
273 pse->cpu_system_counter += entry->cpu_system;
274 pse->cpu_system = entry->cpu_system;
278 if (entry->cpu_user_counter < pse->cpu_user_counter)
280 pse->cpu_user = entry->cpu_user_counter
281 + (ULONG_MAX - pse->cpu_user_counter);
285 pse->cpu_user = entry->cpu_user_counter - pse->cpu_user_counter;
287 pse->cpu_user_counter = entry->cpu_user_counter;
289 if (entry->cpu_system_counter < pse->cpu_system_counter)
291 pse->cpu_system = entry->cpu_system_counter
292 + (ULONG_MAX - pse->cpu_system_counter);
296 pse->cpu_system = entry->cpu_system_counter - pse->cpu_system_counter;
298 pse->cpu_system_counter = entry->cpu_system_counter;
301 ps->cpu_user_counter += pse->cpu_user;
302 ps->cpu_system_counter += pse->cpu_system;
/* Walks every procstat in the global list and, for each, its list of
 * instance entries, unlinking entries that the debug message describes as
 * too old.
 *
 * An entry at the head is unlinked by pointing ps->instances at its
 * successor; any other entry by pointing pse_prev->next at its successor.
 * NOTE(review): the age test, the release of the removed entry and any
 * resetting of the per-procstat totals are not visible in this view. */
305 static void ps_list_reset (void)
308 procstat_entry_t *pse;
309 procstat_entry_t *pse_prev;
311 for (ps = list_head_g; ps != NULL; ps = ps->next)
323 DEBUG ("Removing this procstat entry cause it's too old: "
324 "id = %lu; name = %s;",
/* pse_prev == NULL means the entry being removed is the list head. */
327 if (pse_prev == NULL)
329 ps->instances = pse->next;
335 pse_prev->next = pse->next;
337 pse = pse_prev->next;
346 } /* while (pse != NULL) */
347 } /* for (ps = list_head_g; ps != NULL; ps = ps->next) */
/* Configuration callback registered in module_register().
 *
 * key:   option name; compared case-insensitively with "Process".
 * value: option value; for "Process" it is passed to ps_list_register() as
 *        the process name to track.
 *
 * The return values are not visible in this view. */
350 static int ps_config (const char *key, const char *value)
352 if (strcasecmp (key, "Process") == 0)
354 ps_list_register (value);
/* Initialisation callback registered in module_register().
 *
 * Mach variant: stores the host and task ports, releases a processor set
 * list left over from an earlier call and requests a new one with
 * host_processor_sets(), logging an error if that call fails.
 * Linux variant: stores the page size reported by sysconf() and logs it
 * together with CONFIG_HZ.
 *
 * The return values are not visible in this view. */
364 static int ps_init (void)
367 kern_return_t status;
369 port_host_self = mach_host_self ();
370 port_task_self = mach_task_self ();
/* A non-NULL pset_list is released before a new list is requested. */
372 if (pset_list != NULL)
374 vm_deallocate (port_task_self,
375 (vm_address_t) pset_list,
376 pset_list_len * sizeof (processor_set_t));
381 if ((status = host_processor_sets (port_host_self,
383 &pset_list_len)) != KERN_SUCCESS)
385 ERROR ("host_processor_sets failed: %s\n",
386 mach_error_string (status));
391 /* #endif HAVE_THREAD_INFO */
/* NOTE(review): a failing sysconf() (negative result) is not checked here. */
394 pagesize_g = sysconf(_SC_PAGESIZE);
395 DEBUG ("pagesize_g = %li; CONFIG_HZ = %i;",
396 pagesize_g, CONFIG_HZ);
397 #endif /* KERNEL_LINUX */
/* Dispatches one gauge of type "ps_state".
 *
 * state: copied into the value list's type_instance.
 * value: stored as the gauge value.
 *
 * The value list is stamped with the current time, the global hostname and
 * the plugin name "processes"; plugin_instance is left empty.
 * NOTE(review): strcpy() of hostname_g is unbounded, and strncpy() with
 * sizeof (vl.type_instance) does not terminate the buffer when `state' fills
 * it completely. */
402 static void ps_submit_state (const char *state, double value)
405 value_list_t vl = VALUE_LIST_INIT;
407 values[0].gauge = value;
411 vl.time = time (NULL);
412 strcpy (vl.host, hostname_g);
413 strcpy (vl.plugin, "processes");
414 strcpy (vl.plugin_instance, "");
415 strncpy (vl.type_instance, state, sizeof (vl.type_instance));
417 plugin_dispatch_values ("ps_state", &vl);
/* Dispatches the totals collected for one procstat.
 *
 * ps: procstat whose name becomes the plugin_instance and whose totals are
 *     sent.
 *
 * The same value list is reused for four dispatches: "ps_rss", "ps_cputime",
 * "ps_count" and "ps_pagefaults". Setting up vl.values and its length is not
 * visible in this view.
 * NOTE(review): strcpy() of hostname_g is unbounded, and strncpy() with
 * sizeof (vl.plugin_instance) does not terminate the buffer when ps->name
 * fills it completely. */
420 static void ps_submit_proc_list (procstat_t *ps)
423 value_list_t vl = VALUE_LIST_INIT;
427 vl.time = time (NULL);
428 strcpy (vl.host, hostname_g);
429 strcpy (vl.plugin, "processes");
430 strncpy (vl.plugin_instance, ps->name, sizeof (vl.plugin_instance));
/* Resident set size, as a gauge. */
432 vl.values[0].gauge = ps->vmem_rss;
434 plugin_dispatch_values ("ps_rss", &vl);
/* User and system CPU time, as counters. */
436 vl.values[0].counter = ps->cpu_user_counter;
437 vl.values[1].counter = ps->cpu_system_counter;
439 plugin_dispatch_values ("ps_cputime", &vl);
/* Number of processes and of light-weight processes, as gauges. */
441 vl.values[0].gauge = ps->num_proc;
442 vl.values[1].gauge = ps->num_lwp;
444 plugin_dispatch_values ("ps_count", &vl);
/* Minor and major page faults, as counters. */
446 vl.values[0].counter = ps->vmem_minflt_counter;
447 vl.values[1].counter = ps->vmem_majflt_counter;
449 plugin_dispatch_values ("ps_pagefaults", &vl);
451 DEBUG ("name = %s; num_proc = %lu; num_lwp = %lu; vmem_rss = %lu; "
452 "vmem_minflt_counter = %lu; vmem_majflt_counter = %lu; "
453 "cpu_user_counter = %lu; cpu_system_counter = %lu;",
454 ps->name, ps->num_proc, ps->num_lwp, ps->vmem_rss,
455 ps->vmem_minflt_counter, ps->vmem_majflt_counter,
456 ps->cpu_user_counter, ps->cpu_system_counter);
457 } /* void ps_submit_proc_list */
/* Collects the numeric entries of the directory "/proc/<pid>/task".
 *
 * pid: process whose task directory is read.
 *
 * The ids are stored in an int array that is grown with realloc() by
 * doubling; the asserts before the end of the function require the element
 * at index list_len to be zero, and ps_read_process() iterates the result
 * until it reaches a zero element. ps_read_process() treats a NULL result as
 * "no task directory". Ownership of the array is not visible in this view;
 * presumably the caller frees it -- confirm. */
460 static int *ps_read_tasks (int pid)
463 int list_size = 1; /* size of allocated space, in elements */
464 int list_len = 0; /* number of currently used elements */
470 snprintf (dirname, 64, "/proc/%i/task", pid);
473 if ((dh = opendir (dirname)) == NULL)
475 DEBUG ("Failed to open directory `%s'", dirname);
479 while ((ent = readdir (dh)) != NULL)
/* NOTE(review): isdigit() is called with a plain char; a cast to
 * unsigned char avoids undefined behavior for negative values. */
481 if (!isdigit (ent->d_name[0]))
/* Grow while fewer than two slots are free, which keeps room for the
 * trailing zero element. */
484 if ((list_len + 1) >= list_size)
487 int new_size = 2 * list_size;
488 /* Comes in sizes: 2, 4, 8, 16, ... */
490 new_ptr = (int *) realloc (list, (size_t) (sizeof (int) * new_size));
495 ERROR ("processes plugin: "
496 "Failed to allocate more memory.");
501 list_size = new_size;
/* Zero everything from the first unused element to the end of the array. */
503 memset (list + list_len, 0, sizeof (int) * (list_size - list_len));
506 list[list_len] = atoi (ent->d_name);
507 if (list[list_len] != 0)
516 assert (list_len < list_size);
517 assert (list[list_len] == 0);
520 } /* int *ps_read_tasks */
/* Reads "/proc/<pid>/stat" and fills `ps' and `state' from it.
 *
 * pid:   process to inspect.
 * ps:    output; zeroed first, then given the name, the page fault counters,
 *        the CPU time counters and the resident set size.
 * state: output; receives the first character of the third field.
 *
 * Fields used (zero-based index after strsplit()): 1 name in brackets,
 * 2 state, 3 parent pid, 9 and 11 page fault counters, 13 and 14 CPU time,
 * 23 resident set size.
 * The return values are not visible in this view; ps_read() logs the status
 * when the call failed. */
522 int ps_read_process (int pid, procstat_t *ps, char *state)
537 long long unsigned cpu_user_counter;
538 long long unsigned cpu_system_counter;
539 long long unsigned vmem_rss;
541 memset (ps, 0, sizeof (procstat_t));
543 snprintf (filename, 64, "/proc/%i/stat", pid);
546 if ((fh = fopen (filename, "r")) == NULL)
549 if (fgets (buffer, 1024, fh) == NULL)
/* NOTE(review): strsplit() is defined elsewhere; if it splits on white space,
 * a process name containing spaces shifts all later fields -- verify. */
557 fields_len = strsplit (buffer, fields, 64);
560 DEBUG ("processes plugin: ps_read_process (pid = %i):"
561 " `%s' has only %i fields..",
562 (int) pid, filename, fields_len);
566 /* copy the name, strip brackets in the process */
/* NOTE(review): a second field shorter than two characters makes
 * strlen () - 2 wrap or go negative before the bracket check below indexes
 * with it -- confirm the type of name_len. */
567 name_len = strlen (fields[1]) - 2;
568 if ((fields[1][0] != '(') || (fields[1][name_len + 1] != ')'))
570 DEBUG ("No brackets found in process name: `%s'", fields[1]);
/* Skip the opening bracket and overwrite the closing one with NUL. */
573 fields[1] = fields[1] + 1;
574 fields[1][name_len] = '\0';
/* NOTE(review): strncpy() with the full buffer size leaves ps->name
 * unterminated for names of PROCSTAT_NAME_LEN or more characters. */
575 strncpy (ps->name, fields[1], PROCSTAT_NAME_LEN);
577 ppid = atoi (fields[3]);
579 *state = fields[2][0];
586 else if ((tasks = ps_read_tasks (pid)) == NULL)
588 /* Kernel 2.4 or so */
/* The task list ends at the first zero element. */
596 for (i = 0; tasks[i] != 0; i++)
603 /* Leave the rest at zero if this is only a zombie */
604 if (ps->num_proc == 0)
606 DEBUG ("processes plugin: This is only a zombi: pid = %i; "
607 "name = %s;", pid, ps->name);
611 cpu_user_counter = atoll (fields[13]);
612 cpu_system_counter = atoll (fields[14]);
613 vmem_rss = atoll (fields[23]);
614 ps->vmem_minflt_counter = atol (fields[9]);
615 ps->vmem_majflt_counter = atol (fields[11]);
617 /* Convert jiffies to useconds */
618 cpu_user_counter = cpu_user_counter * 1000000 / CONFIG_HZ;
619 cpu_system_counter = cpu_system_counter * 1000000 / CONFIG_HZ;
/* The resident set size field is multiplied by the page size. */
620 vmem_rss = vmem_rss * pagesize_g;
/* The scaling above is done in unsigned long long; the results are then
 * converted to unsigned long. */
622 ps->cpu_user_counter = (unsigned long) cpu_user_counter;
623 ps->cpu_system_counter = (unsigned long) cpu_system_counter;
624 ps->vmem_rss = (unsigned long) vmem_rss;
628 } /* int ps_read_process (...) */
629 #endif /* KERNEL_LINUX */
/* Determines the pid and the command name of a Mach task.
 *
 * t:            task to look up.
 * pid:          output; filled by pid_for_task().
 * name:         output buffer for the command name.
 * name_max_len: size of `name'; values above MAXCOMLEN + 1 are reduced to
 *               that limit before copying.
 *
 * The kinfo_proc of the pid is requested with sysctl() using a four element
 * mib whose third element is KERN_PROC_PID; its p_comm member is copied into
 * `name', which is always NUL terminated.
 * The return statements are not visible in this view; ps_read() treats a
 * result of 0 as success. */
632 static int mach_get_task_name (task_t t, int *pid, char *name, size_t name_max_len)
636 struct kinfo_proc kp;
641 mib[2] = KERN_PROC_PID;
643 if (pid_for_task (t, pid) != KERN_SUCCESS)
647 kp_size = sizeof (kp);
648 if (sysctl (mib, 4, &kp, &kp_size, NULL, 0) != 0)
651 if (name_max_len > (MAXCOMLEN + 1))
652 name_max_len = MAXCOMLEN + 1;
/* Copy at most name_max_len - 1 characters and terminate explicitly. */
654 strncpy (name, kp.kp_proc.p_comm, name_max_len - 1);
655 name[name_max_len - 1] = '\0';
657 DEBUG ("pid = %i; name = %s;", *pid, name);
659 /* We don't do the special handling for `p_comm == "LaunchCFMApp"' as
660 * `top' does it, because it is a lot of work and only used when
661 * debugging. -octo */
665 #endif /* HAVE_THREAD_INFO */
/* Read callback registered in module_register().
 *
 * Mach variant: for every processor set, lists its tasks; for every task,
 * resolves the name, looks up a matching procstat, gathers task_info() data
 * into a procstat_entry_t and inspects the run state of each thread.
 * Linux variant: scans "/proc" for numeric directory names and calls
 * ps_read_process() for each pid, counting processes per state character.
 * Both variants end by dispatching the per-state totals with
 * ps_submit_state() and every procstat with ps_submit_proc_list().
 *
 * The return values are not visible in this view. */
667 static int ps_read (void)
670 kern_return_t status;
673 processor_set_t port_pset_priv;
676 task_array_t task_list;
677 mach_msg_type_number_t task_list_len;
/* NOTE(review): this buffer holds MAXCOMLEN + 1 bytes, but the call to
 * mach_get_task_name() below passes PROCSTAT_NAME_LEN as its size. The callee
 * reduces the length to MAXCOMLEN + 1, so no overflow results, but the
 * argument does not describe the buffer. */
680 char task_name[MAXCOMLEN + 1];
683 thread_act_array_t thread_list;
684 mach_msg_type_number_t thread_list_len;
685 thread_basic_info_data_t thread_data;
686 mach_msg_type_number_t thread_data_len;
695 procstat_entry_t pse;
700 * The Mach-concept is a little different from the traditional UNIX
701 * concept: All the work is done in threads. Threads are contained in
702 * `tasks'. Therefore, `task status' doesn't make much sense, since
703 * it's actually a `thread status'.
704 * Tasks are assigned to sets of processors, so that's where you go to
707 for (pset = 0; pset < pset_list_len; pset++)
709 if ((status = host_processor_set_priv (port_host_self,
711 &port_pset_priv)) != KERN_SUCCESS)
713 ERROR ("host_processor_set_priv failed: %s\n",
714 mach_error_string (status));
718 if ((status = processor_set_tasks (port_pset_priv,
720 &task_list_len)) != KERN_SUCCESS)
722 ERROR ("processor_set_tasks failed: %s\n",
723 mach_error_string (status));
724 mach_port_deallocate (port_task_self, port_pset_priv);
728 for (task = 0; task < task_list_len; task++)
/* Only tasks whose name could be resolved are looked up in the list. */
731 if (mach_get_task_name (task_list[task],
733 task_name, PROCSTAT_NAME_LEN) == 0)
734 ps = ps_list_search (task_name);
736 /* Collect more detailed statistics for this process */
739 task_basic_info_data_t task_basic_info;
740 mach_msg_type_number_t task_basic_info_len;
741 task_events_info_data_t task_events_info;
742 mach_msg_type_number_t task_events_info_len;
743 task_absolutetime_info_data_t task_absolutetime_info;
744 mach_msg_type_number_t task_absolutetime_info_len;
746 memset (&pse, '\0', sizeof (pse));
/* NOTE(review): the three task_info() failure paths below `continue' without
 * the mach_port_deallocate() of the task port that is done at the end of the
 * iteration; the task_threads() failure path does deallocate it. Confirm
 * whether the port is leaked here. */
749 task_basic_info_len = TASK_BASIC_INFO_COUNT;
750 status = task_info (task_list[task],
752 (task_info_t) &task_basic_info,
753 &task_basic_info_len);
754 if (status != KERN_SUCCESS)
756 ERROR ("task_info failed: %s",
757 mach_error_string (status));
758 continue; /* with next task_list */
761 task_events_info_len = TASK_EVENTS_INFO_COUNT;
762 status = task_info (task_list[task],
764 (task_info_t) &task_events_info,
765 &task_events_info_len);
766 if (status != KERN_SUCCESS)
768 ERROR ("task_info failed: %s",
769 mach_error_string (status));
770 continue; /* with next task_list */
773 task_absolutetime_info_len = TASK_ABSOLUTETIME_INFO_COUNT;
774 status = task_info (task_list[task],
775 TASK_ABSOLUTETIME_INFO,
776 (task_info_t) &task_absolutetime_info,
777 &task_absolutetime_info_len);
778 if (status != KERN_SUCCESS)
780 ERROR ("task_info failed: %s",
781 mach_error_string (status));
782 continue; /* with next task_list */
/* Fill the entry from the three task_info() results: resident size,
 * copy-on-write faults as the "minflt" counter, all faults as the "majflt"
 * counter, and the total user and system times. */
786 pse.vmem_rss = task_basic_info.resident_size;
788 pse.vmem_minflt_counter = task_events_info.cow_faults;
789 pse.vmem_majflt_counter = task_events_info.faults;
791 pse.cpu_user_counter = task_absolutetime_info.total_user;
792 pse.cpu_system_counter = task_absolutetime_info.total_system;
795 status = task_threads (task_list[task], &thread_list,
797 if (status != KERN_SUCCESS)
799 /* Apple's `top' treats this case a zombie. It
800 * makes sense to some extend: A `zombie'
801 * thread is nonsense, since the task/process
804 DEBUG ("task_threads failed: %s",
805 mach_error_string (status));
806 if (task_list[task] != port_task_self)
807 mach_port_deallocate (port_task_self,
809 continue; /* with next task_list */
812 for (thread = 0; thread < thread_list_len; thread++)
814 thread_data_len = THREAD_BASIC_INFO_COUNT;
815 status = thread_info (thread_list[thread],
817 (thread_info_t) &thread_data,
819 if (status != KERN_SUCCESS)
821 ERROR ("thread_info failed: %s",
822 mach_error_string (status));
823 if (task_list[task] != port_task_self)
824 mach_port_deallocate (port_task_self,
825 thread_list[thread]);
826 continue; /* with next thread_list */
/* NOTE(review): the WARNING in the switch below formats
 * thread_data.run_state with %s. run_state is the operand of the switch and
 * therefore an integer, so this conversion is undefined behavior; an integer
 * conversion such as %i is needed. */
832 switch (thread_data.run_state)
834 case TH_STATE_RUNNING:
837 case TH_STATE_STOPPED:
838 /* What exactly is `halted'? */
839 case TH_STATE_HALTED:
842 case TH_STATE_WAITING:
845 case TH_STATE_UNINTERRUPTIBLE:
848 /* There is no `zombie' case here,
849 * since there are no zombie-threads.
850 * There's only zombie tasks, which are
853 WARNING ("Unknown thread status: %s",
854 thread_data.run_state);
856 } /* switch (thread_data.run_state) */
858 if (task_list[task] != port_task_self)
860 status = mach_port_deallocate (port_task_self,
861 thread_list[thread]);
862 if (status != KERN_SUCCESS)
863 ERROR ("mach_port_deallocate failed: %s",
864 mach_error_string (status));
866 } /* for (thread_list) */
/* Release the thread array itself. */
868 if ((status = vm_deallocate (port_task_self,
869 (vm_address_t) thread_list,
870 thread_list_len * sizeof (thread_act_t)))
873 ERROR ("vm_deallocate failed: %s",
874 mach_error_string (status));
879 /* Only deallocate the task port, if it isn't our own.
880 * Don't know what would happen in that case, but this
881 * is what Apple's top does.. ;) */
882 if (task_list[task] != port_task_self)
884 status = mach_port_deallocate (port_task_self,
886 if (status != KERN_SUCCESS)
887 ERROR ("mach_port_deallocate failed: %s",
888 mach_error_string (status));
892 ps_list_add (task_name, &pse);
893 } /* for (task_list) */
/* Release the task array, then the privileged processor set port. */
895 if ((status = vm_deallocate (port_task_self,
896 (vm_address_t) task_list,
897 task_list_len * sizeof (task_t))) != KERN_SUCCESS)
899 ERROR ("vm_deallocate failed: %s",
900 mach_error_string (status));
905 if ((status = mach_port_deallocate (port_task_self, port_pset_priv))
908 ERROR ("mach_port_deallocate failed: %s",
909 mach_error_string (status));
911 } /* for (pset_list) */
913 ps_submit_state ("running", running);
914 ps_submit_state ("sleeping", sleeping);
915 ps_submit_state ("zombies", zombies);
916 ps_submit_state ("stopped", stopped);
917 ps_submit_state ("blocked", blocked);
919 for (ps = list_head_g; ps != NULL; ps = ps->next)
920 ps_submit_proc_list (ps);
921 /* #endif HAVE_THREAD_INFO */
/* Linux variant starts here. */
937 procstat_entry_t pse;
942 running = sleeping = zombies = stopped = paging = blocked = 0;
945 if ((proc = opendir ("/proc")) == NULL)
948 ERROR ("Cannot open `/proc': %s",
949 sstrerror (errno, errbuf, sizeof (errbuf)));
953 while ((ent = readdir (proc)) != NULL)
/* NOTE(review): isdigit() is called with a plain char; a cast to
 * unsigned char avoids undefined behavior for negative values. */
955 if (!isdigit (ent->d_name[0]))
958 if ((pid = atoi (ent->d_name)) < 1)
961 status = ps_read_process (pid, &ps, &state);
964 DEBUG ("ps_read_process failed: %i", status);
/* Copy what ps_read_process() reported into the entry that is handed to
 * ps_list_add(). */
971 pse.num_proc = ps.num_proc;
972 pse.num_lwp = ps.num_lwp;
973 pse.vmem_rss = ps.vmem_rss;
976 pse.vmem_minflt_counter = ps.vmem_minflt_counter;
978 pse.vmem_majflt_counter = ps.vmem_majflt_counter;
981 pse.cpu_user_counter = ps.cpu_user_counter;
983 pse.cpu_system_counter = ps.cpu_system_counter;
/* One process is counted per state character reported for the pid. */
987 case 'R': running++; break;
988 case 'S': sleeping++; break;
989 case 'D': blocked++; break;
990 case 'Z': zombies++; break;
991 case 'T': stopped++; break;
992 case 'W': paging++; break;
995 ps_list_add (ps.name, &pse);
1000 ps_submit_state ("running", running);
1001 ps_submit_state ("sleeping", sleeping);
1002 ps_submit_state ("zombies", zombies);
1003 ps_submit_state ("stopped", stopped);
1004 ps_submit_state ("paging", paging);
1005 ps_submit_state ("blocked", blocked);
1007 for (ps_ptr = list_head_g; ps_ptr != NULL; ps_ptr = ps_ptr->next)
1008 ps_submit_proc_list (ps_ptr);
1009 #endif /* KERNEL_LINUX */
/* Plugin entry point: registers the configuration, init and read callbacks
 * of this file under the plugin name "processes". The configuration
 * registration also passes the table of accepted keys and its length. */
1014 void module_register (void)
1016 plugin_register_config ("processes", ps_config,
1017 config_keys, config_keys_num);
1018 plugin_register_init ("processes", ps_init);
1019 plugin_register_read ("processes", ps_read);
1020 } /* void module_register */