arthur.barton.de Git - netdata.git/blob - src/plugin_proc.c
prevent multiple locks per web requests
[netdata.git] / src / plugin_proc.c
1 #ifdef HAVE_CONFIG_H
2 #include <config.h>
3 #endif
4 #include <pthread.h>
5 #include <sys/time.h>
6 #include <sys/resource.h>
7 #include <strings.h>
8 #include <unistd.h>
9
10 #include "global_statistics.h"
11 #include "common.h"
12 #include "appconfig.h"
13 #include "log.h"
14 #include "rrd.h"
15 #include "plugin_proc.h"
16 #include "main.h"
17 #include "registry.h"
18
19 void *proc_main(void *ptr)
20 {
21         static unsigned long long old_web_requests = 0, old_web_usec = 0;
22         (void)ptr;
23
24         info("PROC Plugin thread created with task id %d", gettid());
25
26         if(pthread_setcanceltype(PTHREAD_CANCEL_DEFERRED, NULL) != 0)
27                 error("Cannot set pthread cancel type to DEFERRED.");
28
29         if(pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, NULL) != 0)
30                 error("Cannot set pthread cancel state to ENABLE.");
31
32         struct rusage me, thread;
33
34         // disable (by default) various interface that are not needed
35         config_get_boolean("plugin:proc:/proc/net/dev:lo", "enabled", 0);
36         config_get_boolean("plugin:proc:/proc/net/dev:fireqos_monitor", "enabled", 0);
37
38         // when ZERO, attempt to do it
39         int vdo_proc_net_dev                    = !config_get_boolean("plugin:proc", "/proc/net/dev", 1);
40         int vdo_proc_diskstats                  = !config_get_boolean("plugin:proc", "/proc/diskstats", 1);
41         int vdo_proc_net_snmp                   = !config_get_boolean("plugin:proc", "/proc/net/snmp", 1);
42         int vdo_proc_net_snmp6                  = !config_get_boolean("plugin:proc", "/proc/net/snmp6", 1);
43         int vdo_proc_net_netstat                = !config_get_boolean("plugin:proc", "/proc/net/netstat", 1);
44         int vdo_proc_net_stat_conntrack = !config_get_boolean("plugin:proc", "/proc/net/stat/conntrack", 1);
45         int vdo_proc_net_ip_vs_stats    = !config_get_boolean("plugin:proc", "/proc/net/ip_vs/stats", 1);
46         int vdo_proc_net_stat_synproxy  = !config_get_boolean("plugin:proc", "/proc/net/stat/synproxy", 1);
47         int vdo_proc_stat                               = !config_get_boolean("plugin:proc", "/proc/stat", 1);
48         int vdo_proc_meminfo                    = !config_get_boolean("plugin:proc", "/proc/meminfo", 1);
49         int vdo_proc_vmstat                     = !config_get_boolean("plugin:proc", "/proc/vmstat", 1);
50         int vdo_proc_net_rpc_nfsd               = !config_get_boolean("plugin:proc", "/proc/net/rpc/nfsd", 1);
51         int vdo_proc_sys_kernel_random_entropy_avail    = !config_get_boolean("plugin:proc", "/proc/sys/kernel/random/entropy_avail", 1);
52         int vdo_proc_interrupts                 = !config_get_boolean("plugin:proc", "/proc/interrupts", 1);
53         int vdo_proc_softirqs                   = !config_get_boolean("plugin:proc", "/proc/softirqs", 1);
54         int vdo_proc_loadavg                    = !config_get_boolean("plugin:proc", "/proc/loadavg", 1);
55         int vdo_sys_kernel_mm_ksm               = !config_get_boolean("plugin:proc", "/sys/kernel/mm/ksm", 1);
56         int vdo_cpu_netdata                     = !config_get_boolean("plugin:proc", "netdata server resources", 1);
57
58         // keep track of the time each module was called
59         unsigned long long sutime_proc_net_dev = 0ULL;
60         unsigned long long sutime_proc_diskstats = 0ULL;
61         unsigned long long sutime_proc_net_snmp = 0ULL;
62         unsigned long long sutime_proc_net_snmp6 = 0ULL;
63         unsigned long long sutime_proc_net_netstat = 0ULL;
64         unsigned long long sutime_proc_net_stat_conntrack = 0ULL;
65         unsigned long long sutime_proc_net_ip_vs_stats = 0ULL;
66         unsigned long long sutime_proc_net_stat_synproxy = 0ULL;
67         unsigned long long sutime_proc_stat = 0ULL;
68         unsigned long long sutime_proc_meminfo = 0ULL;
69         unsigned long long sutime_proc_vmstat = 0ULL;
70         unsigned long long sutime_proc_net_rpc_nfsd = 0ULL;
71         unsigned long long sutime_proc_sys_kernel_random_entropy_avail = 0ULL;
72         unsigned long long sutime_proc_interrupts = 0ULL;
73         unsigned long long sutime_proc_softirqs = 0ULL;
74         unsigned long long sutime_proc_loadavg = 0ULL;
75         unsigned long long sutime_sys_kernel_mm_ksm = 0ULL;
76
77         // the next time we will run - aligned properly
78         unsigned long long sunext = (time(NULL) - (time(NULL) % rrd_update_every) + rrd_update_every) * 1000000ULL;
79         unsigned long long sunow;
80
81         RRDSET *stcpu = NULL, *stcpu_thread = NULL, *stclients = NULL, *streqs = NULL, *stbytes = NULL, *stduration = NULL;
82
83         for(;1;) {
84                 if(unlikely(netdata_exit)) break;
85
86                 // delay until it is our time to run
87                 while((sunow = timems()) < sunext)
88                         usleep((useconds_t)(sunext - sunow));
89
90                 // find the next time we need to run
91                 while(timems() > sunext)
92                         sunext += rrd_update_every * 1000000ULL;
93
94                 if(unlikely(netdata_exit)) break;
95
96                 // BEGIN -- the job to be done
97
98                 if(!vdo_sys_kernel_mm_ksm) {
99                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_sys_kernel_mm_ksm().");
100
101                         sunow = timems();
102                         vdo_sys_kernel_mm_ksm = do_sys_kernel_mm_ksm(rrd_update_every, (sutime_sys_kernel_mm_ksm > 0)?sunow - sutime_sys_kernel_mm_ksm:0ULL);
103                         sutime_sys_kernel_mm_ksm = sunow;
104                 }
105                 if(unlikely(netdata_exit)) break;
106
107                 if(!vdo_proc_loadavg) {
108                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_loadavg().");
109                         sunow = timems();
110                         vdo_proc_loadavg = do_proc_loadavg(rrd_update_every, (sutime_proc_loadavg > 0)?sunow - sutime_proc_loadavg:0ULL);
111                         sutime_proc_loadavg = sunow;
112                 }
113                 if(unlikely(netdata_exit)) break;
114
115                 if(!vdo_proc_interrupts) {
116                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_interrupts().");
117                         sunow = timems();
118                         vdo_proc_interrupts = do_proc_interrupts(rrd_update_every, (sutime_proc_interrupts > 0)?sunow - sutime_proc_interrupts:0ULL);
119                         sutime_proc_interrupts = sunow;
120                 }
121                 if(unlikely(netdata_exit)) break;
122
123                 if(!vdo_proc_softirqs) {
124                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_softirqs().");
125                         sunow = timems();
126                         vdo_proc_softirqs = do_proc_softirqs(rrd_update_every, (sutime_proc_softirqs > 0)?sunow - sutime_proc_softirqs:0ULL);
127                         sutime_proc_softirqs = sunow;
128                 }
129                 if(unlikely(netdata_exit)) break;
130
131                 if(!vdo_proc_sys_kernel_random_entropy_avail) {
132                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_sys_kernel_random_entropy_avail().");
133                         sunow = timems();
134                         vdo_proc_sys_kernel_random_entropy_avail = do_proc_sys_kernel_random_entropy_avail(rrd_update_every, (sutime_proc_sys_kernel_random_entropy_avail > 0)?sunow - sutime_proc_sys_kernel_random_entropy_avail:0ULL);
135                         sutime_proc_sys_kernel_random_entropy_avail = sunow;
136                 }
137                 if(unlikely(netdata_exit)) break;
138
139                 if(!vdo_proc_net_dev) {
140                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_net_dev().");
141                         sunow = timems();
142                         vdo_proc_net_dev = do_proc_net_dev(rrd_update_every, (sutime_proc_net_dev > 0)?sunow - sutime_proc_net_dev:0ULL);
143                         sutime_proc_net_dev = sunow;
144                 }
145                 if(unlikely(netdata_exit)) break;
146
147                 if(!vdo_proc_diskstats) {
148                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_diskstats().");
149                         sunow = timems();
150                         vdo_proc_diskstats = do_proc_diskstats(rrd_update_every, (sutime_proc_diskstats > 0)?sunow - sutime_proc_diskstats:0ULL);
151                         sutime_proc_diskstats = sunow;
152                 }
153                 if(unlikely(netdata_exit)) break;
154
155                 if(!vdo_proc_net_snmp) {
156                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_net_snmp().");
157                         sunow = timems();
158                         vdo_proc_net_snmp = do_proc_net_snmp(rrd_update_every, (sutime_proc_net_snmp > 0)?sunow - sutime_proc_net_snmp:0ULL);
159                         sutime_proc_net_snmp = sunow;
160                 }
161                 if(unlikely(netdata_exit)) break;
162
163                 if(!vdo_proc_net_snmp6) {
164                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_net_snmp6().");
165                         sunow = timems();
166                         vdo_proc_net_snmp6 = do_proc_net_snmp6(rrd_update_every, (sutime_proc_net_snmp6 > 0)?sunow - sutime_proc_net_snmp6:0ULL);
167                         sutime_proc_net_snmp6 = sunow;
168                 }
169                 if(unlikely(netdata_exit)) break;
170
171                 if(!vdo_proc_net_netstat) {
172                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_net_netstat().");
173                         sunow = timems();
174                         vdo_proc_net_netstat = do_proc_net_netstat(rrd_update_every, (sutime_proc_net_netstat > 0)?sunow - sutime_proc_net_netstat:0ULL);
175                         sutime_proc_net_netstat = sunow;
176                 }
177                 if(unlikely(netdata_exit)) break;
178
179                 if(!vdo_proc_net_stat_conntrack) {
180                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_net_stat_conntrack().");
181                         sunow = timems();
182                         vdo_proc_net_stat_conntrack     = do_proc_net_stat_conntrack(rrd_update_every, (sutime_proc_net_stat_conntrack > 0)?sunow - sutime_proc_net_stat_conntrack:0ULL);
183                         sutime_proc_net_stat_conntrack = sunow;
184                 }
185                 if(unlikely(netdata_exit)) break;
186
187                 if(!vdo_proc_net_ip_vs_stats) {
188                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling vdo_proc_net_ip_vs_stats().");
189                         sunow = timems();
190                         vdo_proc_net_ip_vs_stats = do_proc_net_ip_vs_stats(rrd_update_every, (sutime_proc_net_ip_vs_stats > 0)?sunow - sutime_proc_net_ip_vs_stats:0ULL);
191                         sutime_proc_net_ip_vs_stats = sunow;
192                 }
193                 if(unlikely(netdata_exit)) break;
194
195                 if(!vdo_proc_net_stat_synproxy) {
196                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling vdo_proc_net_stat_synproxy().");
197                         sunow = timems();
198                         vdo_proc_net_stat_synproxy = do_proc_net_stat_synproxy(rrd_update_every, (sutime_proc_net_stat_synproxy > 0)?sunow - sutime_proc_net_stat_synproxy:0ULL);
199                         sutime_proc_net_stat_synproxy = sunow;
200                 }
201                 if(unlikely(netdata_exit)) break;
202
203                 if(!vdo_proc_stat) {
204                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_stat().");
205                         sunow = timems();
206                         vdo_proc_stat = do_proc_stat(rrd_update_every, (sutime_proc_stat > 0)?sunow - sutime_proc_stat:0ULL);
207                         sutime_proc_stat = sunow;
208                 }
209                 if(unlikely(netdata_exit)) break;
210
211                 if(!vdo_proc_meminfo) {
212                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling vdo_proc_meminfo().");
213                         sunow = timems();
214                         vdo_proc_meminfo = do_proc_meminfo(rrd_update_every, (sutime_proc_meminfo > 0)?sunow - sutime_proc_meminfo:0ULL);
215                         sutime_proc_meminfo = sunow;
216                 }
217                 if(unlikely(netdata_exit)) break;
218
219                 if(!vdo_proc_vmstat) {
220                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling vdo_proc_vmstat().");
221                         sunow = timems();
222                         vdo_proc_vmstat = do_proc_vmstat(rrd_update_every, (sutime_proc_vmstat > 0)?sunow - sutime_proc_vmstat:0ULL);
223                         sutime_proc_vmstat = sunow;
224                 }
225                 if(unlikely(netdata_exit)) break;
226
227                 if(!vdo_proc_net_rpc_nfsd) {
228                         debug(D_PROCNETDEV_LOOP, "PROCNETDEV: calling do_proc_net_rpc_nfsd().");
229                         sunow = timems();
230                         vdo_proc_net_rpc_nfsd = do_proc_net_rpc_nfsd(rrd_update_every, (sutime_proc_net_rpc_nfsd > 0)?sunow - sutime_proc_net_rpc_nfsd:0ULL);
231                         sutime_proc_net_rpc_nfsd = sunow;
232                 }
233                 if(unlikely(netdata_exit)) break;
234
235                 // END -- the job is done
236
237                 // --------------------------------------------------------------------
238
239                 if(!vdo_cpu_netdata) {
240                         getrusage(RUSAGE_THREAD, &thread);
241                         getrusage(RUSAGE_SELF, &me);
242
243                         if(!stcpu_thread) stcpu_thread = rrdset_find("netdata.plugin_proc_cpu");
244                         if(!stcpu_thread) {
245                                 stcpu_thread = rrdset_create("netdata", "plugin_proc_cpu", NULL, "proc.internal", NULL, "NetData Proc Plugin CPU usage", "milliseconds/s", 132000, rrd_update_every, RRDSET_TYPE_STACKED);
246
247                                 rrddim_add(stcpu_thread, "user",  NULL,  1, 1000, RRDDIM_INCREMENTAL);
248                                 rrddim_add(stcpu_thread, "system", NULL, 1, 1000, RRDDIM_INCREMENTAL);
249                         }
250                         else rrdset_next(stcpu_thread);
251
252                         rrddim_set(stcpu_thread, "user"  , thread.ru_utime.tv_sec * 1000000ULL + thread.ru_utime.tv_usec);
253                         rrddim_set(stcpu_thread, "system", thread.ru_stime.tv_sec * 1000000ULL + thread.ru_stime.tv_usec);
254                         rrdset_done(stcpu_thread);
255
256                         // ----------------------------------------------------------------
257
258                         if(!stcpu) stcpu = rrdset_find("netdata.server_cpu");
259                         if(!stcpu) {
260                                 stcpu = rrdset_create("netdata", "server_cpu", NULL, "netdata", NULL, "NetData CPU usage", "milliseconds/s", 130000, rrd_update_every, RRDSET_TYPE_STACKED);
261
262                                 rrddim_add(stcpu, "user",  NULL,  1, 1000, RRDDIM_INCREMENTAL);
263                                 rrddim_add(stcpu, "system", NULL, 1, 1000, RRDDIM_INCREMENTAL);
264                         }
265                         else rrdset_next(stcpu);
266
267                         rrddim_set(stcpu, "user"  , me.ru_utime.tv_sec * 1000000ULL + me.ru_utime.tv_usec);
268                         rrddim_set(stcpu, "system", me.ru_stime.tv_sec * 1000000ULL + me.ru_stime.tv_usec);
269                         rrdset_done(stcpu);
270
271                         // ----------------------------------------------------------------
272
273                         if(!stclients) stclients = rrdset_find("netdata.clients");
274                         if(!stclients) {
275                                 stclients = rrdset_create("netdata", "clients", NULL, "netdata", NULL, "NetData Web Clients", "connected clients", 130100, rrd_update_every, RRDSET_TYPE_LINE);
276
277                                 rrddim_add(stclients, "clients",  NULL,  1, 1, RRDDIM_ABSOLUTE);
278                         }
279                         else rrdset_next(stclients);
280
281                         rrddim_set(stclients, "clients", global_statistics.connected_clients);
282                         rrdset_done(stclients);
283
284                         // ----------------------------------------------------------------
285
286                         if(!streqs) streqs = rrdset_find("netdata.requests");
287                         if(!streqs) {
288                                 streqs = rrdset_create("netdata", "requests", NULL, "netdata", NULL, "NetData Web Requests", "requests/s", 130200, rrd_update_every, RRDSET_TYPE_LINE);
289
290                                 rrddim_add(streqs, "requests",  NULL,  1, 1, RRDDIM_INCREMENTAL);
291                         }
292                         else rrdset_next(streqs);
293
294                         rrddim_set(streqs, "requests", global_statistics.web_requests);
295                         rrdset_done(streqs);
296
297                         // ----------------------------------------------------------------
298
299                         if(!stbytes) stbytes = rrdset_find("netdata.net");
300                         if(!stbytes) {
301                                 stbytes = rrdset_create("netdata", "net", NULL, "netdata", NULL, "NetData Network Traffic", "kilobits/s", 130300, rrd_update_every, RRDSET_TYPE_AREA);
302
303                                 rrddim_add(stbytes, "in",  NULL,  8, 1024, RRDDIM_INCREMENTAL);
304                                 rrddim_add(stbytes, "out",  NULL,  -8, 1024, RRDDIM_INCREMENTAL);
305                         }
306                         else rrdset_next(stbytes);
307
308                         rrddim_set(stbytes, "in", global_statistics.bytes_received);
309                         rrddim_set(stbytes, "out", global_statistics.bytes_sent);
310                         rrdset_done(stbytes);
311
312                         // ----------------------------------------------------------------
313
314                         if(!stduration) stduration = rrdset_find("netdata.response_time");
315                         if(!stduration) {
316                                 stduration = rrdset_create("netdata", "response_time", NULL, "netdata", NULL, "NetData Average API Response Time", "ms/request", 130400, rrd_update_every, RRDSET_TYPE_LINE);
317
318                                 rrddim_add(stduration, "response_time", "response time",  1, 1000, RRDDIM_ABSOLUTE);
319                         }
320                         else rrdset_next(stduration);
321
322                         unsigned long long gweb_usec     = global_statistics.web_usec;
323                         unsigned long long gweb_requests = global_statistics.web_requests;
324
325                         unsigned long long web_usec     = gweb_usec     - old_web_usec;
326                         unsigned long long web_requests = gweb_requests - old_web_requests;
327
328                         old_web_usec     = gweb_usec;
329                         old_web_requests = gweb_requests;
330
331                         if(!web_requests) web_requests = 1;
332
333                         rrddim_set(stduration, "response_time", web_usec / web_requests);
334                         rrdset_done(stduration);
335
336                         // ----------------------------------------------------------------
337
338                         registry_statistics();
339                 }
340         }
341
342         pthread_exit(NULL);
343         return NULL;
344 }