]> arthur.barton.de Git - netdata.git/blob - src/sys_fs_cgroup.c
16d057f4031b75977d0009da3a9bbf183926ca49
[netdata.git] / src / sys_fs_cgroup.c
1 #include "common.h"
2
3 // ----------------------------------------------------------------------------
4 // cgroup globals
5
#define CHART_PRIORITY_SYSTEMD_SERVICES 19000
#define CHART_PRIORITY_CONTAINERS       40000

// default page size; replaced with sysconf(_SC_PAGESIZE) by read_cgroup_plugin_configuration()
static long system_page_size = 4096;

// Per-metric switches. The values below are only the built-in defaults:
// read_cgroup_plugin_configuration() overrides each of them from the
// "plugin:cgroups" config section using config_get_boolean_ondemand().
static int cgroup_enable_cpuacct_stat = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_cpuacct_usage = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_memory = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_detailed_memory = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_memory_failcnt = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_swap = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_blkio_io = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_blkio_ops = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_blkio_throttle_io = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_blkio_throttle_ops = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_blkio_merged_ops = CONFIG_BOOLEAN_AUTO;
static int cgroup_enable_blkio_queued_ops = CONFIG_BOOLEAN_AUTO;

// plain yes/no options, read with config_get_boolean() from "plugin:cgroups"
static int cgroup_enable_systemd_services = CONFIG_BOOLEAN_YES;
static int cgroup_enable_systemd_services_detailed_memory = CONFIG_BOOLEAN_NO;
static int cgroup_used_memory_without_cache = CONFIG_BOOLEAN_YES;

static int cgroup_search_in_devices = 1;

// "enable new cgroups detected at run time": default enabled state given by
// cgroup_add() to cgroups that match enabled_cgroup_patterns
static int cgroup_enable_new_cgroups_detected_at_runtime = 1;
// used as a multiplier of cgroup_update_every to build the config default,
// then holds the configured value (never lower than cgroup_update_every)
static int cgroup_check_for_new_every = 10;
// "update every"; never lower than localhost->rrd_update_every
static int cgroup_update_every = 1;

// while a metric is still in AUTO mode and its last read returned only zeros,
// the readers skip this many iterations before reading its file again
static int cgroup_recheck_zero_blkio_every_iterations = 10;
static int cgroup_recheck_zero_mem_failcnt_every_iterations = 10;
static int cgroup_recheck_zero_mem_detailed_every_iterations = 10;

// base directory of each cgroup controller: the mount point found in mountinfo
// (or /sys/fs/cgroup/<controller> when not found), prefixed with
// netdata_configured_host_prefix and overridable from the config
static char *cgroup_cpuacct_base = NULL;
static char *cgroup_blkio_base = NULL;
static char *cgroup_memory_base = NULL;
static char *cgroup_devices_base = NULL;

static int cgroup_root_count = 0;   // incremented by cgroup_add() for every cgroup appended to cgroup_root
static int cgroup_root_max = 500;   // "max cgroups to allow": cgroup_add() refuses to add more than this
static int cgroup_max_depth = 0;    // "max cgroups depth to monitor"

// simple patterns compiled by read_cgroup_plugin_configuration()
static SIMPLE_PATTERN *enabled_cgroup_patterns = NULL;  // "enable by default cgroups matching"
static SIMPLE_PATTERN *enabled_cgroup_paths = NULL;     // "search for cgroups in subpaths matching"
static SIMPLE_PATTERN *enabled_cgroup_renames = NULL;   // "run script to rename cgroups matching"
static SIMPLE_PATTERN *systemd_services_cgroups = NULL; // "cgroups to match as systemd services" (only when systemd services are enabled)

// "script to get cgroup names"; defaults to <plugins dir>/cgroup-name.sh
static char *cgroups_rename_script = NULL;

// set to 1 by the readers when a cgroup file cannot be opened or read
// NOTE(review): the consumer of this flag is not in this part of the file - presumably it triggers a rescan; confirm
static int cgroups_check = 0;

// simple_hash() of the keywords "Read", "Write", "user" and "system",
// computed once in read_cgroup_plugin_configuration() and compared while parsing
static uint32_t Read_hash = 0;
static uint32_t Write_hash = 0;
static uint32_t user_hash = 0;
static uint32_t system_hash = 0;
60
61 void read_cgroup_plugin_configuration() {
62     system_page_size = sysconf(_SC_PAGESIZE);
63
64     Read_hash = simple_hash("Read");
65     Write_hash = simple_hash("Write");
66     user_hash = simple_hash("user");
67     system_hash = simple_hash("system");
68
69     cgroup_update_every = (int)config_get_number("plugin:cgroups", "update every", localhost->rrd_update_every);
70     if(cgroup_update_every < localhost->rrd_update_every)
71         cgroup_update_every = localhost->rrd_update_every;
72
73     cgroup_check_for_new_every = (int)config_get_number("plugin:cgroups", "check for new cgroups every", cgroup_check_for_new_every * cgroup_update_every);
74     if(cgroup_check_for_new_every < cgroup_update_every)
75         cgroup_check_for_new_every = cgroup_update_every;
76
77     cgroup_enable_cpuacct_stat = config_get_boolean_ondemand("plugin:cgroups", "enable cpuacct stat (total CPU)", cgroup_enable_cpuacct_stat);
78     cgroup_enable_cpuacct_usage = config_get_boolean_ondemand("plugin:cgroups", "enable cpuacct usage (per core CPU)", cgroup_enable_cpuacct_usage);
79
80     cgroup_enable_memory = config_get_boolean_ondemand("plugin:cgroups", "enable memory (used mem including cache)", cgroup_enable_memory);
81     cgroup_enable_detailed_memory = config_get_boolean_ondemand("plugin:cgroups", "enable detailed memory", cgroup_enable_detailed_memory);
82     cgroup_enable_memory_failcnt = config_get_boolean_ondemand("plugin:cgroups", "enable memory limits fail count", cgroup_enable_memory_failcnt);
83     cgroup_enable_swap = config_get_boolean_ondemand("plugin:cgroups", "enable swap memory", cgroup_enable_swap);
84
85     cgroup_enable_blkio_io = config_get_boolean_ondemand("plugin:cgroups", "enable blkio bandwidth", cgroup_enable_blkio_io);
86     cgroup_enable_blkio_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio operations", cgroup_enable_blkio_ops);
87     cgroup_enable_blkio_throttle_io = config_get_boolean_ondemand("plugin:cgroups", "enable blkio throttle bandwidth", cgroup_enable_blkio_throttle_io);
88     cgroup_enable_blkio_throttle_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio throttle operations", cgroup_enable_blkio_throttle_ops);
89     cgroup_enable_blkio_queued_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio queued operations", cgroup_enable_blkio_queued_ops);
90     cgroup_enable_blkio_merged_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio merged operations", cgroup_enable_blkio_merged_ops);
91
92     cgroup_recheck_zero_blkio_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero blkio every iterations", cgroup_recheck_zero_blkio_every_iterations);
93     cgroup_recheck_zero_mem_failcnt_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero memory failcnt every iterations", cgroup_recheck_zero_mem_failcnt_every_iterations);
94     cgroup_recheck_zero_mem_detailed_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero detailed memory every iterations", cgroup_recheck_zero_mem_detailed_every_iterations);
95
96     cgroup_enable_systemd_services = config_get_boolean("plugin:cgroups", "enable systemd services", cgroup_enable_systemd_services);
97     cgroup_enable_systemd_services_detailed_memory = config_get_boolean("plugin:cgroups", "enable systemd services detailed memory", cgroup_enable_systemd_services_detailed_memory);
98     cgroup_used_memory_without_cache = config_get_boolean("plugin:cgroups", "report used memory without cache", cgroup_used_memory_without_cache);
99
100     char filename[FILENAME_MAX + 1], *s;
101     struct mountinfo *mi, *root = mountinfo_read(0);
102
103     mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "cpuacct");
104     if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "cpuacct");
105     if(!mi) {
106         error("Cannot find cgroup cpuacct mountinfo. Assuming default: /sys/fs/cgroup/cpuacct");
107         s = "/sys/fs/cgroup/cpuacct";
108     }
109     else s = mi->mount_point;
110     snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
111     cgroup_cpuacct_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/cpuacct", filename);
112
113     mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "blkio");
114     if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "blkio");
115     if(!mi) {
116         error("Cannot find cgroup blkio mountinfo. Assuming default: /sys/fs/cgroup/blkio");
117         s = "/sys/fs/cgroup/blkio";
118     }
119     else s = mi->mount_point;
120     snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
121     cgroup_blkio_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/blkio", filename);
122
123     mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "memory");
124     if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "memory");
125     if(!mi) {
126         error("Cannot find cgroup memory mountinfo. Assuming default: /sys/fs/cgroup/memory");
127         s = "/sys/fs/cgroup/memory";
128     }
129     else s = mi->mount_point;
130     snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
131     cgroup_memory_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/memory", filename);
132
133     mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "devices");
134     if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "devices");
135     if(!mi) {
136         error("Cannot find cgroup devices mountinfo. Assuming default: /sys/fs/cgroup/devices");
137         s = "/sys/fs/cgroup/devices";
138     }
139     else s = mi->mount_point;
140     snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
141     cgroup_devices_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/devices", filename);
142
143     cgroup_root_max = (int)config_get_number("plugin:cgroups", "max cgroups to allow", cgroup_root_max);
144     cgroup_max_depth = (int)config_get_number("plugin:cgroups", "max cgroups depth to monitor", cgroup_max_depth);
145
146     cgroup_enable_new_cgroups_detected_at_runtime = config_get_boolean("plugin:cgroups", "enable new cgroups detected at run time", cgroup_enable_new_cgroups_detected_at_runtime);
147
148     enabled_cgroup_patterns = simple_pattern_create(
149             config_get("plugin:cgroups", "enable by default cgroups matching",
150                     " /system.slice/docker-*.scope "
151                     " !*.mount "
152                     " !*.partition "
153                     " !*.scope "
154                     " !*.service "
155                     " !*.slice "
156                     " !*.swap "
157                     " !*.user "
158                     " !/ "
159                     " !/docker "
160                     " !/libvirt "
161                     " !/lxc "
162                     " !/lxc/*/ns "         //  #1397
163                     " !/machine "
164                     " !/qemu "
165                     " !/system "
166                     " !/systemd "
167                     " !/user "
168                     " * "                  // enable anything else
169             ), SIMPLE_PATTERN_EXACT);
170
171     enabled_cgroup_paths = simple_pattern_create(
172             config_get("plugin:cgroups", "search for cgroups in subpaths matching",
173                     " !*-qemu "            //  #345
174                     " !/init.scope "
175                     " !/system "
176                     " !/systemd "
177                     " !/user "
178                     " !/user.slice "
179                     " * "
180             ), SIMPLE_PATTERN_EXACT);
181
182     snprintfz(filename, FILENAME_MAX, "%s/cgroup-name.sh", netdata_configured_plugins_dir);
183     cgroups_rename_script = config_get("plugin:cgroups", "script to get cgroup names", filename);
184
185     enabled_cgroup_renames = simple_pattern_create(
186             config_get("plugin:cgroups", "run script to rename cgroups matching",
187                     " *docker* "
188                     " *lxc* "
189                     " !/ "
190                     " !*.mount "
191                     " !*.partition "
192                     " !*.scope "
193                     " !*.service "
194                     " !*.slice "
195                     " !*.swap "
196                     " !*.user "
197                     " * "
198             ), SIMPLE_PATTERN_EXACT);
199
200     if(cgroup_enable_systemd_services) {
201         systemd_services_cgroups = simple_pattern_create(
202                 config_get("plugin:cgroups", "cgroups to match as systemd services",
203                         " !/system.slice/*/*.service "
204                         " /system.slice/*.service "
205                 ), SIMPLE_PATTERN_EXACT);
206     }
207
208     mountinfo_free(root);
209 }
210
211 // ----------------------------------------------------------------------------
212 // cgroup objects
213
// State and last values of one blkio file of a cgroup, as maintained by cgroup_read_blkio().
struct blkio {
    int updated;        // 1 when the last read attempt parsed the file, 0 when it could not be opened / read
    int enabled; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
    int delay_counter;  // iterations left to skip while in AUTO mode and the last read returned only zeros

    char *filename;     // file to read; NULL means there is nothing to read

    // sums of the values of all the "Read" / "Write" lines of the file
    unsigned long long Read;
    unsigned long long Write;
/*
    not collected:
    unsigned long long Sync;
    unsigned long long Async;
    unsigned long long Total;
*/
};
229
// https://www.kernel.org/doc/Documentation/cgroup-v1/memory.txt
// State and last values of the memory files of a cgroup, as maintained by cgroup_read_memory().
struct memory {
    ARL_BASE *arl_base;     // keyword parser of the detailed file; created on the first successful read
    ARL_ENTRY *arl_dirty;   // the "dirty" keyword, kept to check whether the file reports it
    ARL_ENTRY *arl_swap;    // the "swap" keyword, kept to check whether the file reports it

    // 1 when the last read attempt of the corresponding file succeeded
    int updated_detailed;
    int updated_usage_in_bytes;
    int updated_msw_usage_in_bytes;
    int updated_failcnt;

    int enabled_detailed;           // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
    int enabled_usage_in_bytes;     // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
    int enabled_msw_usage_in_bytes; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
    int enabled_failcnt;            // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO

    // iterations left to skip while in AUTO mode and the last read returned only zeros
    int delay_counter_detailed;
    int delay_counter_failcnt;

    // files to read; a NULL filename disables the corresponding read
    char *filename_detailed;
    char *filename_usage_in_bytes;
    char *filename_msw_usage_in_bytes;
    char *filename_failcnt;

    // set to 1 once the detailed file has been seen to include the keyword
    int detailed_has_dirty;
    int detailed_has_swap;

    // detailed metrics
    unsigned long long cache;
    unsigned long long rss;
    unsigned long long rss_huge;
    unsigned long long mapped_file;
    unsigned long long writeback;
    unsigned long long dirty;
    unsigned long long swap;
    unsigned long long pgpgin;
    unsigned long long pgpgout;
    unsigned long long pgfault;
    unsigned long long pgmajfault;
/*
    not collected:
    unsigned long long inactive_anon;
    unsigned long long active_anon;
    unsigned long long inactive_file;
    unsigned long long active_file;
    unsigned long long unevictable;
    unsigned long long hierarchical_memory_limit;
    unsigned long long total_cache;
    unsigned long long total_rss;
    unsigned long long total_rss_huge;
    unsigned long long total_mapped_file;
    unsigned long long total_writeback;
    unsigned long long total_dirty;
    unsigned long long total_swap;
    unsigned long long total_pgpgin;
    unsigned long long total_pgpgout;
    unsigned long long total_pgfault;
    unsigned long long total_pgmajfault;
    unsigned long long total_inactive_anon;
    unsigned long long total_active_anon;
    unsigned long long total_inactive_file;
    unsigned long long total_active_file;
    unsigned long long total_unevictable;
*/

    // single file metrics
    unsigned long long usage_in_bytes;
    unsigned long long msw_usage_in_bytes;
    unsigned long long failcnt;
};
299
// https://www.kernel.org/doc/Documentation/cgroup-v1/cpuacct.txt
// State and last values of the cpuacct stat file of a cgroup, as maintained by cgroup_read_cpuacct_stat().
struct cpuacct_stat {
    int updated; // 1 when the last read attempt parsed the file
    int enabled; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO

    char *filename; // file to read; NULL means there is nothing to read

    unsigned long long user;    // value of the "user" line
    unsigned long long system;  // value of the "system" line
};
310
// https://www.kernel.org/doc/Documentation/cgroup-v1/cpuacct.txt
// State and last values of the per-cpu usage file of a cgroup, as maintained by cgroup_read_cpuacct_usage().
struct cpuacct_usage {
    int updated; // 1 when the last read attempt parsed the file
    int enabled; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO

    char *filename; // file to read; NULL means there is nothing to read

    unsigned int cpus;              // number of entries in cpu_percpu
    unsigned long long *cpu_percpu; // one value per word of the first line of the file; reallocated when the count changes
};
321
// bits of cgroup.options
#define CGROUP_OPTIONS_DISABLED_DUPLICATE   0x00000001
#define CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE 0x00000002

// One monitored cgroup: its identity, the state of every file read for it and
// the charts / dimensions it feeds. All cgroups are kept in a singly linked
// list starting at cgroup_root; cgroup_add() appends new ones at the end.
struct cgroup {
    uint32_t options;    // CGROUP_OPTIONS_* bits

    char available;      // found in the filesystem
    char enabled;        // enabled in the config

    char *id;            // the cgroup id, as given to cgroup_add() ("/" when empty)
    uint32_t hash;       // simple_hash() of id

    char *chart_id;      // id processed by netdata_fix_chart_id(), or the name returned by the rename script
    uint32_t hash_chart; // simple_hash() of chart_id

    char *chart_title;   // id processed by netdata_fix_chart_name(), or the name returned by the rename script

    struct cpuacct_stat cpuacct_stat;
    struct cpuacct_usage cpuacct_usage;

    struct memory memory;

    struct blkio io_service_bytes;              // bytes
    struct blkio io_serviced;                   // operations

    struct blkio throttle_io_service_bytes;     // bytes
    struct blkio throttle_io_serviced;          // operations

    struct blkio io_merged;                     // operations
    struct blkio io_queued;                     // operations

    // per cgroup charts
    RRDSET *st_cpu;
    RRDSET *st_cpu_per_core;
    RRDSET *st_mem;
    RRDSET *st_writeback;
    RRDSET *st_mem_activity;
    RRDSET *st_pgfaults;
    RRDSET *st_mem_usage;
    RRDSET *st_mem_failcnt;
    RRDSET *st_io;
    RRDSET *st_serviced_ops;
    RRDSET *st_throttle_io;
    RRDSET *st_throttle_serviced_ops;
    RRDSET *st_queued_ops;
    RRDSET *st_merged_ops;

    // services
    RRDDIM *rd_cpu;
    RRDDIM *rd_mem_usage;
    RRDDIM *rd_mem_failcnt;
    RRDDIM *rd_swap_usage;

    RRDDIM *rd_mem_detailed_cache;
    RRDDIM *rd_mem_detailed_rss;
    RRDDIM *rd_mem_detailed_mapped;
    RRDDIM *rd_mem_detailed_writeback;
    RRDDIM *rd_mem_detailed_pgpgin;
    RRDDIM *rd_mem_detailed_pgpgout;
    RRDDIM *rd_mem_detailed_pgfault;
    RRDDIM *rd_mem_detailed_pgmajfault;

    RRDDIM *rd_io_service_bytes_read;
    RRDDIM *rd_io_serviced_read;
    RRDDIM *rd_throttle_io_read;
    RRDDIM *rd_throttle_io_serviced_read;
    RRDDIM *rd_io_queued_read;
    RRDDIM *rd_io_merged_read;

    RRDDIM *rd_io_service_bytes_write;
    RRDDIM *rd_io_serviced_write;
    RRDDIM *rd_throttle_io_write;
    RRDDIM *rd_throttle_io_serviced_write;
    RRDDIM *rd_io_queued_write;
    RRDDIM *rd_io_merged_write;

    struct cgroup *next; // next cgroup in the list, NULL on the last one

} *cgroup_root = NULL;
401
402 // ----------------------------------------------------------------------------
403 // read values from /sys
404
405 static inline void cgroup_read_cpuacct_stat(struct cpuacct_stat *cp) {
406     static procfile *ff = NULL;
407
408     if(likely(cp->filename)) {
409         ff = procfile_reopen(ff, cp->filename, NULL, PROCFILE_FLAG_DEFAULT);
410         if(unlikely(!ff)) {
411             cp->updated = 0;
412             cgroups_check = 1;
413             return;
414         }
415
416         ff = procfile_readall(ff);
417         if(unlikely(!ff)) {
418             cp->updated = 0;
419             cgroups_check = 1;
420             return;
421         }
422
423         unsigned long i, lines = procfile_lines(ff);
424
425         if(unlikely(lines < 1)) {
426             error("File '%s' should have 1+ lines.", cp->filename);
427             cp->updated = 0;
428             return;
429         }
430
431         for(i = 0; i < lines ; i++) {
432             char *s = procfile_lineword(ff, i, 0);
433             uint32_t hash = simple_hash(s);
434
435             if(unlikely(hash == user_hash && !strcmp(s, "user")))
436                 cp->user = str2ull(procfile_lineword(ff, i, 1));
437
438             else if(unlikely(hash == system_hash && !strcmp(s, "system")))
439                 cp->system = str2ull(procfile_lineword(ff, i, 1));
440         }
441
442         cp->updated = 1;
443
444         if(unlikely(cp->enabled == CONFIG_BOOLEAN_AUTO && (cp->user || cp->system)))
445             cp->enabled = CONFIG_BOOLEAN_YES;
446     }
447 }
448
449 static inline void cgroup_read_cpuacct_usage(struct cpuacct_usage *ca) {
450     static procfile *ff = NULL;
451
452     if(likely(ca->filename)) {
453         ff = procfile_reopen(ff, ca->filename, NULL, PROCFILE_FLAG_DEFAULT);
454         if(unlikely(!ff)) {
455             ca->updated = 0;
456             cgroups_check = 1;
457             return;
458         }
459
460         ff = procfile_readall(ff);
461         if(unlikely(!ff)) {
462             ca->updated = 0;
463             cgroups_check = 1;
464             return;
465         }
466
467         if(unlikely(procfile_lines(ff) < 1)) {
468             error("File '%s' should have 1+ lines but has %zu.", ca->filename, procfile_lines(ff));
469             ca->updated = 0;
470             return;
471         }
472
473         unsigned long i = procfile_linewords(ff, 0);
474         if(unlikely(i == 0)) {
475             ca->updated = 0;
476             return;
477         }
478
479         // we may have 1 more CPU reported
480         while(i > 0) {
481             char *s = procfile_lineword(ff, 0, i - 1);
482             if(!*s) i--;
483             else break;
484         }
485
486         if(unlikely(i != ca->cpus)) {
487             freez(ca->cpu_percpu);
488             ca->cpu_percpu = mallocz(sizeof(unsigned long long) * i);
489             ca->cpus = (unsigned int)i;
490         }
491
492         unsigned long long total = 0;
493         for(i = 0; i < ca->cpus ;i++) {
494             unsigned long long n = str2ull(procfile_lineword(ff, 0, i));
495             ca->cpu_percpu[i] = n;
496             total += n;
497         }
498
499         ca->updated = 1;
500
501         if(unlikely(ca->enabled == CONFIG_BOOLEAN_AUTO && total))
502             ca->enabled = CONFIG_BOOLEAN_YES;
503     }
504 }
505
506 static inline void cgroup_read_blkio(struct blkio *io) {
507     static procfile *ff = NULL;
508
509     if(unlikely(io->enabled == CONFIG_BOOLEAN_AUTO && io->delay_counter > 0)) {
510         io->delay_counter--;
511         return;
512     }
513
514     if(likely(io->filename)) {
515         ff = procfile_reopen(ff, io->filename, NULL, PROCFILE_FLAG_DEFAULT);
516         if(unlikely(!ff)) {
517             io->updated = 0;
518             cgroups_check = 1;
519             return;
520         }
521
522         ff = procfile_readall(ff);
523         if(unlikely(!ff)) {
524             io->updated = 0;
525             cgroups_check = 1;
526             return;
527         }
528
529         unsigned long i, lines = procfile_lines(ff);
530
531         if(unlikely(lines < 1)) {
532             error("File '%s' should have 1+ lines.", io->filename);
533             io->updated = 0;
534             return;
535         }
536
537         io->Read = 0;
538         io->Write = 0;
539 /*
540         io->Sync = 0;
541         io->Async = 0;
542         io->Total = 0;
543 */
544
545         for(i = 0; i < lines ; i++) {
546             char *s = procfile_lineword(ff, i, 1);
547             uint32_t hash = simple_hash(s);
548
549             if(unlikely(hash == Read_hash && !strcmp(s, "Read")))
550                 io->Read += str2ull(procfile_lineword(ff, i, 2));
551
552             else if(unlikely(hash == Write_hash && !strcmp(s, "Write")))
553                 io->Write += str2ull(procfile_lineword(ff, i, 2));
554
555 /*
556             else if(unlikely(hash == Sync_hash && !strcmp(s, "Sync")))
557                 io->Sync += str2ull(procfile_lineword(ff, i, 2));
558
559             else if(unlikely(hash == Async_hash && !strcmp(s, "Async")))
560                 io->Async += str2ull(procfile_lineword(ff, i, 2));
561
562             else if(unlikely(hash == Total_hash && !strcmp(s, "Total")))
563                 io->Total += str2ull(procfile_lineword(ff, i, 2));
564 */
565         }
566
567         io->updated = 1;
568
569         if(unlikely(io->enabled == CONFIG_BOOLEAN_AUTO)) {
570             if(unlikely(io->Read || io->Write))
571                 io->enabled = CONFIG_BOOLEAN_YES;
572             else
573                 io->delay_counter = cgroup_recheck_zero_blkio_every_iterations;
574         }
575     }
576 }
577
578 static inline void cgroup_read_memory(struct memory *mem) {
579     static procfile *ff = NULL;
580
581     // read detailed ram usage
582     if(likely(mem->filename_detailed)) {
583         if(unlikely(mem->enabled_detailed == CONFIG_BOOLEAN_AUTO && mem->delay_counter_detailed > 0)) {
584             mem->delay_counter_detailed--;
585             goto memory_next;
586         }
587
588         ff = procfile_reopen(ff, mem->filename_detailed, NULL, PROCFILE_FLAG_DEFAULT);
589         if(unlikely(!ff)) {
590             mem->updated_detailed = 0;
591             cgroups_check = 1;
592             goto memory_next;
593         }
594
595         ff = procfile_readall(ff);
596         if(unlikely(!ff)) {
597             mem->updated_detailed = 0;
598             cgroups_check = 1;
599             goto memory_next;
600         }
601
602         unsigned long i, lines = procfile_lines(ff);
603
604         if(unlikely(lines < 1)) {
605             error("File '%s' should have 1+ lines.", mem->filename_detailed);
606             mem->updated_detailed = 0;
607             goto memory_next;
608         }
609
610         if(unlikely(!mem->arl_base)) {
611             mem->arl_base = arl_create("cgroup/memory", NULL, 60);
612
613             arl_expect(mem->arl_base, "cache", &mem->cache);
614             arl_expect(mem->arl_base, "rss", &mem->rss);
615             arl_expect(mem->arl_base, "rss_huge", &mem->rss_huge);
616             arl_expect(mem->arl_base, "mapped_file", &mem->mapped_file);
617             arl_expect(mem->arl_base, "writeback", &mem->writeback);
618             mem->arl_dirty = arl_expect(mem->arl_base, "dirty", &mem->dirty);
619             mem->arl_swap  = arl_expect(mem->arl_base, "swap", &mem->swap);
620             arl_expect(mem->arl_base, "pgpgin", &mem->pgpgin);
621             arl_expect(mem->arl_base, "pgpgout", &mem->pgpgout);
622             arl_expect(mem->arl_base, "pgfault", &mem->pgfault);
623             arl_expect(mem->arl_base, "pgmajfault", &mem->pgmajfault);
624         }
625
626         arl_begin(mem->arl_base);
627
628         for(i = 0; i < lines ; i++) {
629             if(arl_check(mem->arl_base,
630                     procfile_lineword(ff, i, 0),
631                     procfile_lineword(ff, i, 1))) break;
632         }
633
634         if(unlikely(mem->arl_dirty->flags & ARL_ENTRY_FLAG_FOUND))
635             mem->detailed_has_dirty = 1;
636
637         if(unlikely(mem->arl_swap->flags & ARL_ENTRY_FLAG_FOUND))
638             mem->detailed_has_swap = 1;
639
640         // fprintf(stderr, "READ: '%s', cache: %llu, rss: %llu, rss_huge: %llu, mapped_file: %llu, writeback: %llu, dirty: %llu, swap: %llu, pgpgin: %llu, pgpgout: %llu, pgfault: %llu, pgmajfault: %llu, inactive_anon: %llu, active_anon: %llu, inactive_file: %llu, active_file: %llu, unevictable: %llu, hierarchical_memory_limit: %llu, total_cache: %llu, total_rss: %llu, total_rss_huge: %llu, total_mapped_file: %llu, total_writeback: %llu, total_dirty: %llu, total_swap: %llu, total_pgpgin: %llu, total_pgpgout: %llu, total_pgfault: %llu, total_pgmajfault: %llu, total_inactive_anon: %llu, total_active_anon: %llu, total_inactive_file: %llu, total_active_file: %llu, total_unevictable: %llu\n", mem->filename, mem->cache, mem->rss, mem->rss_huge, mem->mapped_file, mem->writeback, mem->dirty, mem->swap, mem->pgpgin, mem->pgpgout, mem->pgfault, mem->pgmajfault, mem->inactive_anon, mem->active_anon, mem->inactive_file, mem->active_file, mem->unevictable, mem->hierarchical_memory_limit, mem->total_cache, mem->total_rss, mem->total_rss_huge, mem->total_mapped_file, mem->total_writeback, mem->total_dirty, mem->total_swap, mem->total_pgpgin, mem->total_pgpgout, mem->total_pgfault, mem->total_pgmajfault, mem->total_inactive_anon, mem->total_active_anon, mem->total_inactive_file, mem->total_active_file, mem->total_unevictable);
641
642         mem->updated_detailed = 1;
643
644         if(unlikely(mem->enabled_detailed == CONFIG_BOOLEAN_AUTO)) {
645             if(mem->cache || mem->dirty || mem->rss || mem->rss_huge || mem->mapped_file || mem->writeback || mem->swap || mem->pgpgin || mem->pgpgout || mem->pgfault || mem->pgmajfault)
646                 mem->enabled_detailed = CONFIG_BOOLEAN_YES;
647             else
648                 mem->delay_counter_detailed = cgroup_recheck_zero_mem_detailed_every_iterations;
649         }
650     }
651
652 memory_next:
653
654     // read usage_in_bytes
655     if(likely(mem->filename_usage_in_bytes)) {
656         mem->updated_usage_in_bytes = !read_single_number_file(mem->filename_usage_in_bytes, &mem->usage_in_bytes);
657         if(unlikely(mem->updated_usage_in_bytes && mem->enabled_usage_in_bytes == CONFIG_BOOLEAN_AUTO && mem->usage_in_bytes))
658             mem->enabled_usage_in_bytes = CONFIG_BOOLEAN_YES;
659     }
660
661     // read msw_usage_in_bytes
662     if(likely(mem->filename_msw_usage_in_bytes)) {
663         mem->updated_msw_usage_in_bytes = !read_single_number_file(mem->filename_msw_usage_in_bytes, &mem->msw_usage_in_bytes);
664         if(unlikely(mem->updated_msw_usage_in_bytes && mem->enabled_msw_usage_in_bytes == CONFIG_BOOLEAN_AUTO && mem->msw_usage_in_bytes))
665             mem->enabled_msw_usage_in_bytes = CONFIG_BOOLEAN_YES;
666     }
667
668     // read failcnt
669     if(likely(mem->filename_failcnt)) {
670         if(unlikely(mem->enabled_failcnt == CONFIG_BOOLEAN_AUTO && mem->delay_counter_failcnt > 0)) {
671             mem->updated_failcnt = 0;
672             mem->delay_counter_failcnt--;
673         }
674         else {
675             mem->updated_failcnt = !read_single_number_file(mem->filename_failcnt, &mem->failcnt);
676             if(unlikely(mem->updated_failcnt && mem->enabled_failcnt == CONFIG_BOOLEAN_AUTO)) {
677                 if(unlikely(!mem->failcnt))
678                     mem->delay_counter_failcnt = cgroup_recheck_zero_mem_failcnt_every_iterations;
679                 else
680                     mem->enabled_failcnt = CONFIG_BOOLEAN_YES;
681             }
682         }
683     }
684 }
685
686 static inline void cgroup_read(struct cgroup *cg) {
687     debug(D_CGROUP, "reading metrics for cgroups '%s'", cg->id);
688
689     cgroup_read_cpuacct_stat(&cg->cpuacct_stat);
690     cgroup_read_cpuacct_usage(&cg->cpuacct_usage);
691     cgroup_read_memory(&cg->memory);
692     cgroup_read_blkio(&cg->io_service_bytes);
693     cgroup_read_blkio(&cg->io_serviced);
694     cgroup_read_blkio(&cg->throttle_io_service_bytes);
695     cgroup_read_blkio(&cg->throttle_io_serviced);
696     cgroup_read_blkio(&cg->io_merged);
697     cgroup_read_blkio(&cg->io_queued);
698 }
699
700 static inline void read_all_cgroups(struct cgroup *root) {
701     debug(D_CGROUP, "reading metrics for all cgroups");
702
703     struct cgroup *cg;
704
705     for(cg = root; cg ; cg = cg->next)
706         if(cg->enabled && cg->available)
707             cgroup_read(cg);
708 }
709
710 // ----------------------------------------------------------------------------
711 // add/remove/find cgroup objects
712
// size limit of the buffer cgroup_get_chart_name() uses for both the rename
// command it runs and the line it reads back from it
#define CGROUP_CHARTID_LINE_MAX 1024
714
// Build the chart title for a cgroup id: a NULL or empty id becomes "/", a
// single leading '/' is dropped from anything longer than "/" and the copy is
// passed through netdata_fix_chart_name(). The result is allocated with
// strdupz(); callers in this file release it with freez().
static inline char *cgroup_title_strdupz(const char *s) {
    const char *source = (s && *s) ? s : "/";

    // skip the leading slash, but keep a lone "/" as it is
    if(source[0] == '/' && source[1] != '\0')
        source++;

    char *title = strdupz(source);
    netdata_fix_chart_name(title);
    return title;
}
725
// Build the chart id for a cgroup id: a NULL or empty id becomes "/", a single
// leading '/' is dropped from anything longer than "/" and the copy is passed
// through netdata_fix_chart_id(). The result is allocated with strdupz();
// callers in this file release it with freez().
static inline char *cgroup_chart_id_strdupz(const char *s) {
    const char *source = (s && *s) ? s : "/";

    // skip the leading slash, but keep a lone "/" as it is
    if(source[0] == '/' && source[1] != '\0')
        source++;

    char *chart_id = strdupz(source);
    netdata_fix_chart_id(chart_id);
    return chart_id;
}
736
737 static inline void cgroup_get_chart_name(struct cgroup *cg) {
738     debug(D_CGROUP, "looking for the name of cgroup '%s' with chart id '%s' and title '%s'", cg->id, cg->chart_id, cg->chart_title);
739
740     pid_t cgroup_pid;
741     char buffer[CGROUP_CHARTID_LINE_MAX + 1];
742
743     snprintfz(buffer, CGROUP_CHARTID_LINE_MAX, "exec %s '%s'", cgroups_rename_script, cg->chart_id);
744
745     debug(D_CGROUP, "executing command '%s' for cgroup '%s'", buffer, cg->id);
746     FILE *fp = mypopen(buffer, &cgroup_pid);
747     if(fp) {
748         // debug(D_CGROUP, "reading from command '%s' for cgroup '%s'", buffer, cg->id);
749         char *s = fgets(buffer, CGROUP_CHARTID_LINE_MAX, fp);
750         // debug(D_CGROUP, "closing command for cgroup '%s'", cg->id);
751         mypclose(fp, cgroup_pid);
752         // debug(D_CGROUP, "closed command for cgroup '%s'", cg->id);
753
754         if(s && *s && *s != '\n') {
755             debug(D_CGROUP, "cgroup '%s' should be renamed to '%s'", cg->id, s);
756
757             trim(s);
758
759             freez(cg->chart_title);
760             cg->chart_title = cgroup_title_strdupz(s);
761
762             freez(cg->chart_id);
763             cg->chart_id = cgroup_chart_id_strdupz(s);
764             cg->hash_chart = simple_hash(cg->chart_id);
765         }
766     }
767     else
768         error("CGROUP: Cannot popen(\"%s\", \"r\").", buffer);
769 }
770
771 static inline struct cgroup *cgroup_add(const char *id) {
772     if(!id || !*id) id = "/";
773     debug(D_CGROUP, "adding to list, cgroup with id '%s'", id);
774
775     if(cgroup_root_count >= cgroup_root_max) {
776         info("Maximum number of cgroups reached (%d). Not adding cgroup '%s'", cgroup_root_count, id);
777         return NULL;
778     }
779
780     int def = simple_pattern_matches(enabled_cgroup_patterns, id)?cgroup_enable_new_cgroups_detected_at_runtime:0;
781     struct cgroup *cg = callocz(1, sizeof(struct cgroup));
782
783     cg->id = strdupz(id);
784     cg->hash = simple_hash(cg->id);
785
786     cg->chart_title = cgroup_title_strdupz(id);
787
788     cg->chart_id = cgroup_chart_id_strdupz(id);
789     cg->hash_chart = simple_hash(cg->chart_id);
790
791     if(!cgroup_root)
792         cgroup_root = cg;
793     else {
794         // append it
795         struct cgroup *e;
796         for(e = cgroup_root; e->next ;e = e->next) ;
797         e->next = cg;
798     }
799
800     cgroup_root_count++;
801
802     // fix the chart_id and title by calling the external script
803     if(simple_pattern_matches(enabled_cgroup_renames, cg->id)) {
804
805         cgroup_get_chart_name(cg);
806
807         debug(D_CGROUP, "cgroup '%s' renamed to '%s' (title: '%s')", cg->id, cg->chart_id, cg->chart_title);
808     }
809     else
810         debug(D_CGROUP, "cgroup '%s' will not be renamed - it matches the list of disabled cgroup renames (will be shown as '%s')", cg->id, cg->chart_id);
811
812     int user_configurable = 1;
813
814     // check if this cgroup should be a systemd service
815     if(cgroup_enable_systemd_services) {
816         if(simple_pattern_matches(systemd_services_cgroups, cg->id) ||
817                 simple_pattern_matches(systemd_services_cgroups, cg->chart_id)) {
818             debug(D_CGROUP, "cgroup '%s' with chart id '%s' (title: '%s') matches systemd services cgroups", cg->id, cg->chart_id, cg->chart_title);
819
820             char buffer[CGROUP_CHARTID_LINE_MAX + 1];
821             cg->options |= CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE;
822
823             strncpy(buffer, cg->id, CGROUP_CHARTID_LINE_MAX);
824             char *s = buffer;
825
826             //freez(cg->chart_id);
827             //cg->chart_id = cgroup_chart_id_strdupz(s);
828             //cg->hash_chart = simple_hash(cg->chart_id);
829
830             // skip to the last slash
831             size_t len = strlen(s);
832             while(len--) if(unlikely(s[len] == '/')) break;
833             if(len) s = &s[len + 1];
834
835             // remove extension
836             len = strlen(s);
837             while(len--) if(unlikely(s[len] == '.')) break;
838             if(len) s[len] = '\0';
839
840             freez(cg->chart_title);
841             cg->chart_title = cgroup_title_strdupz(s);
842
843             cg->enabled = 1;
844             user_configurable = 0;
845
846             debug(D_CGROUP, "cgroup '%s' renamed to '%s' (title: '%s')", cg->id, cg->chart_id, cg->chart_title);
847         }
848         else
849             debug(D_CGROUP, "cgroup '%s' with chart id '%s' (title: '%s') does not match systemd services groups", cg->id, cg->chart_id, cg->chart_title);
850     }
851
852     if(user_configurable) {
853         // allow the user to enable/disable this individualy
854         char option[FILENAME_MAX + 1];
855         snprintfz(option, FILENAME_MAX, "enable cgroup %s", cg->chart_title);
856         cg->enabled = (char) config_get_boolean("plugin:cgroups", option, def);
857     }
858
859     // detect duplicate cgroups
860     if(cg->enabled) {
861         struct cgroup *t;
862         for (t = cgroup_root; t; t = t->next) {
863             if (t != cg && t->enabled && t->hash_chart == cg->hash_chart && !strcmp(t->chart_id, cg->chart_id)) {
864                 if (!strncmp(t->chart_id, "/system.slice/", 14) && !strncmp(cg->chart_id, "/init.scope/system.slice/", 25)) {
865                     error("Control group with chart id '%s' already exists with id '%s' and is enabled. Swapping them by enabling cgroup with id '%s' and disabling cgroup with id '%s'.",
866                           cg->chart_id, t->id, cg->id, t->id);
867                     debug(D_CGROUP, "Control group with chart id '%s' already exists with id '%s' and is enabled. Swapping them by enabling cgroup with id '%s' and disabling cgroup with id '%s'.",
868                           cg->chart_id, t->id, cg->id, t->id);
869                     t->enabled = 0;
870                     t->options |= CGROUP_OPTIONS_DISABLED_DUPLICATE;
871                 }
872                 else {
873                     error("Control group with chart id '%s' already exists with id '%s' and is enabled and available. Disabling cgroup with id '%s'.",
874                           cg->chart_id, t->id, cg->id);
875                     debug(D_CGROUP, "Control group with chart id '%s' already exists with id '%s' and is enabled and available. Disabling cgroup with id '%s'.",
876                           cg->chart_id, t->id, cg->id);
877                     cg->enabled = 0;
878                     cg->options |= CGROUP_OPTIONS_DISABLED_DUPLICATE;
879                 }
880
881                 break;
882             }
883         }
884     }
885
886     debug(D_CGROUP, "ADDED CGROUP: '%s' with chart id '%s' and title '%s' as %s (default was %s)", cg->id, cg->chart_id, cg->chart_title, (cg->enabled)?"enabled":"disabled", (def)?"enabled":"disabled");
887
888     return cg;
889 }
890
891 static inline void cgroup_free(struct cgroup *cg) {
892     debug(D_CGROUP, "Removing cgroup '%s' with chart id '%s' (was %s and %s)", cg->id, cg->chart_id, (cg->enabled)?"enabled":"disabled", (cg->available)?"available":"not available");
893
894     if(cg->st_cpu)                   rrdset_flag_set(cg->st_cpu,                   RRDSET_FLAG_OBSOLETE);
895     if(cg->st_cpu_per_core)          rrdset_flag_set(cg->st_cpu_per_core,          RRDSET_FLAG_OBSOLETE);
896     if(cg->st_mem)                   rrdset_flag_set(cg->st_mem,                   RRDSET_FLAG_OBSOLETE);
897     if(cg->st_writeback)             rrdset_flag_set(cg->st_writeback,             RRDSET_FLAG_OBSOLETE);
898     if(cg->st_mem_activity)          rrdset_flag_set(cg->st_mem_activity,          RRDSET_FLAG_OBSOLETE);
899     if(cg->st_pgfaults)              rrdset_flag_set(cg->st_pgfaults,              RRDSET_FLAG_OBSOLETE);
900     if(cg->st_mem_usage)             rrdset_flag_set(cg->st_mem_usage,             RRDSET_FLAG_OBSOLETE);
901     if(cg->st_mem_failcnt)           rrdset_flag_set(cg->st_mem_failcnt,           RRDSET_FLAG_OBSOLETE);
902     if(cg->st_io)                    rrdset_flag_set(cg->st_io,                    RRDSET_FLAG_OBSOLETE);
903     if(cg->st_serviced_ops)          rrdset_flag_set(cg->st_serviced_ops,          RRDSET_FLAG_OBSOLETE);
904     if(cg->st_throttle_io)           rrdset_flag_set(cg->st_throttle_io,           RRDSET_FLAG_OBSOLETE);
905     if(cg->st_throttle_serviced_ops) rrdset_flag_set(cg->st_throttle_serviced_ops, RRDSET_FLAG_OBSOLETE);
906     if(cg->st_queued_ops)            rrdset_flag_set(cg->st_queued_ops,            RRDSET_FLAG_OBSOLETE);
907     if(cg->st_merged_ops)            rrdset_flag_set(cg->st_merged_ops,            RRDSET_FLAG_OBSOLETE);
908
909     freez(cg->cpuacct_usage.cpu_percpu);
910
911     freez(cg->cpuacct_stat.filename);
912     freez(cg->cpuacct_usage.filename);
913
914     arl_free(cg->memory.arl_base);
915     freez(cg->memory.filename_detailed);
916     freez(cg->memory.filename_failcnt);
917     freez(cg->memory.filename_usage_in_bytes);
918     freez(cg->memory.filename_msw_usage_in_bytes);
919
920     freez(cg->io_service_bytes.filename);
921     freez(cg->io_serviced.filename);
922
923     freez(cg->throttle_io_service_bytes.filename);
924     freez(cg->throttle_io_serviced.filename);
925
926     freez(cg->io_merged.filename);
927     freez(cg->io_queued.filename);
928
929     freez(cg->id);
930     freez(cg->chart_id);
931     freez(cg->chart_title);
932
933     freez(cg);
934
935     cgroup_root_count--;
936 }
937
938 // find if a given cgroup exists
939 static inline struct cgroup *cgroup_find(const char *id) {
940     debug(D_CGROUP, "searching for cgroup '%s'", id);
941
942     uint32_t hash = simple_hash(id);
943
944     struct cgroup *cg;
945     for(cg = cgroup_root; cg ; cg = cg->next) {
946         if(hash == cg->hash && strcmp(id, cg->id) == 0)
947             break;
948     }
949
950     debug(D_CGROUP, "cgroup '%s' %s in memory", id, (cg)?"found":"not found");
951     return cg;
952 }
953
954 // ----------------------------------------------------------------------------
955 // detect running cgroups
956
957 // callback for find_file_in_subdirs()
958 static inline void found_subdir_in_dir(const char *dir) {
959     debug(D_CGROUP, "examining cgroup dir '%s'", dir);
960
961     struct cgroup *cg = cgroup_find(dir);
962     if(!cg) {
963         if(*dir && cgroup_max_depth > 0) {
964             int depth = 0;
965             const char *s;
966
967             for(s = dir; *s ;s++)
968                 if(unlikely(*s == '/'))
969                     depth++;
970
971             if(depth > cgroup_max_depth) {
972                 info("cgroup '%s' is too deep (%d, while max is %d)", dir, depth, cgroup_max_depth);
973                 return;
974             }
975         }
976         // debug(D_CGROUP, "will add dir '%s' as cgroup", dir);
977         cg = cgroup_add(dir);
978     }
979
980     if(cg) cg->available = 1;
981 }
982
983 static inline int find_dir_in_subdirs(const char *base, const char *this, void (*callback)(const char *)) {
984     if(!this) this = base;
985     debug(D_CGROUP, "searching for directories in '%s' (base '%s')", this?this:"", base);
986
987     size_t dirlen = strlen(this), baselen = strlen(base);
988
989     int ret = -1;
990     int enabled = -1;
991
992     const char *relative_path = &this[baselen];
993     if(!*relative_path) relative_path = "/";
994
995     DIR *dir = opendir(this);
996     if(!dir) {
997         error("Cannot read cgroups directory '%s'", base);
998         return ret;
999     }
1000     ret = 1;
1001
1002     callback(relative_path);
1003
1004     struct dirent *de = NULL;
1005     while((de = readdir(dir))) {
1006         if(de->d_type == DT_DIR
1007             && (
1008                 (de->d_name[0] == '.' && de->d_name[1] == '\0')
1009                 || (de->d_name[0] == '.' && de->d_name[1] == '.' && de->d_name[2] == '\0')
1010                 ))
1011             continue;
1012
1013         if(de->d_type == DT_DIR) {
1014             if(enabled == -1) {
1015                 const char *r = relative_path;
1016                 if(*r == '\0') r = "/";
1017
1018                 // do not decent in directories we are not interested
1019                 int def = simple_pattern_matches(enabled_cgroup_paths, r);
1020
1021                 // we check for this option here
1022                 // so that the config will not have settings
1023                 // for leaf directories
1024                 char option[FILENAME_MAX + 1];
1025                 snprintfz(option, FILENAME_MAX, "search for cgroups under %s", r);
1026                 option[FILENAME_MAX] = '\0';
1027                 enabled = config_get_boolean("plugin:cgroups", option, def);
1028             }
1029
1030             if(enabled) {
1031                 char *s = mallocz(dirlen + strlen(de->d_name) + 2);
1032                 strcpy(s, this);
1033                 strcat(s, "/");
1034                 strcat(s, de->d_name);
1035                 int ret2 = find_dir_in_subdirs(base, s, callback);
1036                 if(ret2 > 0) ret += ret2;
1037                 freez(s);
1038             }
1039         }
1040     }
1041
1042     closedir(dir);
1043     return ret;
1044 }
1045
1046 static inline void mark_all_cgroups_as_not_available() {
1047     debug(D_CGROUP, "marking all cgroups as not available");
1048
1049     struct cgroup *cg;
1050
1051     // mark all as not available
1052     for(cg = cgroup_root; cg ; cg = cg->next) {
1053         cg->available = 0;
1054     }
1055 }
1056
1057 static inline void cleanup_all_cgroups() {
1058     struct cgroup *cg = cgroup_root, *last = NULL;
1059
1060     for(; cg ;) {
1061         if(!cg->available) {
1062             // enable the first duplicate cgroup
1063             {
1064                 struct cgroup *t;
1065                 for(t = cgroup_root; t ; t = t->next) {
1066                     if(t != cg && t->available && !t->enabled && t->options & CGROUP_OPTIONS_DISABLED_DUPLICATE && t->hash_chart == cg->hash_chart && !strcmp(t->chart_id, cg->chart_id)) {
1067                         debug(D_CGROUP, "Enabling duplicate of cgroup '%s' with id '%s', because the original with id '%s' stopped.", t->chart_id, t->id, cg->id);
1068                         t->enabled = 1;
1069                         t->options &= ~CGROUP_OPTIONS_DISABLED_DUPLICATE;
1070                         break;
1071                     }
1072                 }
1073             }
1074
1075             if(!last)
1076                 cgroup_root = cg->next;
1077             else
1078                 last->next = cg->next;
1079
1080             cgroup_free(cg);
1081
1082             if(!last)
1083                 cg = cgroup_root;
1084             else
1085                 cg = last->next;
1086         }
1087         else {
1088             last = cg;
1089             cg = cg->next;
1090         }
1091     }
1092 }
1093
1094 static inline void find_all_cgroups() {
1095     debug(D_CGROUP, "searching for cgroups");
1096
1097     mark_all_cgroups_as_not_available();
1098
1099     if(cgroup_enable_cpuacct_stat || cgroup_enable_cpuacct_usage) {
1100         if(find_dir_in_subdirs(cgroup_cpuacct_base, NULL, found_subdir_in_dir) == -1) {
1101             cgroup_enable_cpuacct_stat =
1102             cgroup_enable_cpuacct_usage = CONFIG_BOOLEAN_NO;
1103             error("disabled CGROUP cpu statistics.");
1104         }
1105     }
1106
1107     if(cgroup_enable_blkio_io || cgroup_enable_blkio_ops || cgroup_enable_blkio_throttle_io || cgroup_enable_blkio_throttle_ops || cgroup_enable_blkio_merged_ops || cgroup_enable_blkio_queued_ops) {
1108         if(find_dir_in_subdirs(cgroup_blkio_base, NULL, found_subdir_in_dir) == -1) {
1109             cgroup_enable_blkio_io =
1110             cgroup_enable_blkio_ops =
1111             cgroup_enable_blkio_throttle_io =
1112             cgroup_enable_blkio_throttle_ops =
1113             cgroup_enable_blkio_merged_ops =
1114             cgroup_enable_blkio_queued_ops = CONFIG_BOOLEAN_NO;
1115             error("disabled CGROUP blkio statistics.");
1116         }
1117     }
1118
1119     if(cgroup_enable_memory || cgroup_enable_detailed_memory || cgroup_enable_swap || cgroup_enable_memory_failcnt) {
1120         if(find_dir_in_subdirs(cgroup_memory_base, NULL, found_subdir_in_dir) == -1) {
1121             cgroup_enable_memory =
1122             cgroup_enable_detailed_memory =
1123             cgroup_enable_swap =
1124             cgroup_enable_memory_failcnt = CONFIG_BOOLEAN_NO;
1125             error("disabled CGROUP memory statistics.");
1126         }
1127     }
1128
1129     if(cgroup_search_in_devices) {
1130         if(find_dir_in_subdirs(cgroup_devices_base, NULL, found_subdir_in_dir) == -1) {
1131             cgroup_search_in_devices = 0;
1132             error("disabled CGROUP devices statistics.");
1133         }
1134     }
1135
1136     // remove any non-existing cgroups
1137     cleanup_all_cgroups();
1138
1139     struct cgroup *cg;
1140     struct stat buf;
1141     for(cg = cgroup_root; cg ; cg = cg->next) {
1142         // fprintf(stderr, " >>> CGROUP '%s' (%u - %s) with name '%s'\n", cg->id, cg->hash, cg->available?"available":"stopped", cg->name);
1143
1144         if(unlikely(!cg->available))
1145             continue;
1146
1147         debug(D_CGROUP, "checking paths for cgroup '%s'", cg->id);
1148
1149         // check for newly added cgroups
1150         // and update the filenames they read
1151         char filename[FILENAME_MAX + 1];
1152         if(unlikely(cgroup_enable_cpuacct_stat && !cg->cpuacct_stat.filename)) {
1153             snprintfz(filename, FILENAME_MAX, "%s%s/cpuacct.stat", cgroup_cpuacct_base, cg->id);
1154             if(likely(stat(filename, &buf) != -1)) {
1155                 cg->cpuacct_stat.filename = strdupz(filename);
1156                 cg->cpuacct_stat.enabled = cgroup_enable_cpuacct_stat;
1157                 debug(D_CGROUP, "cpuacct.stat filename for cgroup '%s': '%s'", cg->id, cg->cpuacct_stat.filename);
1158             }
1159             else
1160                 debug(D_CGROUP, "cpuacct.stat file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1161         }
1162
1163         if(unlikely(cgroup_enable_cpuacct_usage && !cg->cpuacct_usage.filename && !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE))) {
1164             snprintfz(filename, FILENAME_MAX, "%s%s/cpuacct.usage_percpu", cgroup_cpuacct_base, cg->id);
1165             if(likely(stat(filename, &buf) != -1)) {
1166                 cg->cpuacct_usage.filename = strdupz(filename);
1167                 cg->cpuacct_usage.enabled = cgroup_enable_cpuacct_usage;
1168                 debug(D_CGROUP, "cpuacct.usage_percpu filename for cgroup '%s': '%s'", cg->id, cg->cpuacct_usage.filename);
1169             }
1170             else
1171                 debug(D_CGROUP, "cpuacct.usage_percpu file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1172         }
1173
1174         if(unlikely((cgroup_enable_detailed_memory || cgroup_used_memory_without_cache) && !cg->memory.filename_detailed && (cgroup_used_memory_without_cache || cgroup_enable_systemd_services_detailed_memory || !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)))) {
1175             snprintfz(filename, FILENAME_MAX, "%s%s/memory.stat", cgroup_memory_base, cg->id);
1176             if(likely(stat(filename, &buf) != -1)) {
1177                 cg->memory.filename_detailed = strdupz(filename);
1178                 cg->memory.enabled_detailed = (cgroup_enable_detailed_memory == CONFIG_BOOLEAN_YES)?CONFIG_BOOLEAN_YES:CONFIG_BOOLEAN_AUTO;
1179                 debug(D_CGROUP, "memory.stat filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_detailed);
1180             }
1181             else
1182                 debug(D_CGROUP, "memory.stat file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1183         }
1184
1185         if(unlikely(cgroup_enable_memory && !cg->memory.filename_usage_in_bytes)) {
1186             snprintfz(filename, FILENAME_MAX, "%s%s/memory.usage_in_bytes", cgroup_memory_base, cg->id);
1187             if(likely(stat(filename, &buf) != -1)) {
1188                 cg->memory.filename_usage_in_bytes = strdupz(filename);
1189                 cg->memory.enabled_usage_in_bytes = cgroup_enable_memory;
1190                 debug(D_CGROUP, "memory.usage_in_bytes filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_usage_in_bytes);
1191             }
1192             else
1193                 debug(D_CGROUP, "memory.usage_in_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1194         }
1195
1196         if(unlikely(cgroup_enable_swap && !cg->memory.filename_msw_usage_in_bytes)) {
1197             snprintfz(filename, FILENAME_MAX, "%s%s/memory.msw_usage_in_bytes", cgroup_memory_base, cg->id);
1198             if(likely(stat(filename, &buf) != -1)) {
1199                 cg->memory.filename_msw_usage_in_bytes = strdupz(filename);
1200                 cg->memory.enabled_msw_usage_in_bytes = cgroup_enable_swap;
1201                 debug(D_CGROUP, "memory.msw_usage_in_bytes filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_msw_usage_in_bytes);
1202             }
1203             else
1204                 debug(D_CGROUP, "memory.msw_usage_in_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1205         }
1206
1207         if(unlikely(cgroup_enable_memory_failcnt && !cg->memory.filename_failcnt)) {
1208             snprintfz(filename, FILENAME_MAX, "%s%s/memory.failcnt", cgroup_memory_base, cg->id);
1209             if(likely(stat(filename, &buf) != -1)) {
1210                 cg->memory.filename_failcnt = strdupz(filename);
1211                 cg->memory.enabled_failcnt = cgroup_enable_memory_failcnt;
1212                 debug(D_CGROUP, "memory.failcnt filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_failcnt);
1213             }
1214             else
1215                 debug(D_CGROUP, "memory.failcnt file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1216         }
1217
1218         if(unlikely(cgroup_enable_blkio_io && !cg->io_service_bytes.filename)) {
1219             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_service_bytes", cgroup_blkio_base, cg->id);
1220             if(likely(stat(filename, &buf) != -1)) {
1221                 cg->io_service_bytes.filename = strdupz(filename);
1222                 cg->io_service_bytes.enabled = cgroup_enable_blkio_io;
1223                 debug(D_CGROUP, "io_service_bytes filename for cgroup '%s': '%s'", cg->id, cg->io_service_bytes.filename);
1224             }
1225             else
1226                 debug(D_CGROUP, "io_service_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1227         }
1228
1229         if(unlikely(cgroup_enable_blkio_ops && !cg->io_serviced.filename)) {
1230             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_serviced", cgroup_blkio_base, cg->id);
1231             if(likely(stat(filename, &buf) != -1)) {
1232                 cg->io_serviced.filename = strdupz(filename);
1233                 cg->io_serviced.enabled = cgroup_enable_blkio_ops;
1234                 debug(D_CGROUP, "io_serviced filename for cgroup '%s': '%s'", cg->id, cg->io_serviced.filename);
1235             }
1236             else
1237                 debug(D_CGROUP, "io_serviced file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1238         }
1239
1240         if(unlikely(cgroup_enable_blkio_throttle_io && !cg->throttle_io_service_bytes.filename)) {
1241             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.throttle.io_service_bytes", cgroup_blkio_base, cg->id);
1242             if(likely(stat(filename, &buf) != -1)) {
1243                 cg->throttle_io_service_bytes.filename = strdupz(filename);
1244                 cg->throttle_io_service_bytes.enabled = cgroup_enable_blkio_throttle_io;
1245                 debug(D_CGROUP, "throttle_io_service_bytes filename for cgroup '%s': '%s'", cg->id, cg->throttle_io_service_bytes.filename);
1246             }
1247             else
1248                 debug(D_CGROUP, "throttle_io_service_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1249         }
1250
1251         if(unlikely(cgroup_enable_blkio_throttle_ops && !cg->throttle_io_serviced.filename)) {
1252             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.throttle.io_serviced", cgroup_blkio_base, cg->id);
1253             if(likely(stat(filename, &buf) != -1)) {
1254                 cg->throttle_io_serviced.filename = strdupz(filename);
1255                 cg->throttle_io_serviced.enabled = cgroup_enable_blkio_throttle_ops;
1256                 debug(D_CGROUP, "throttle_io_serviced filename for cgroup '%s': '%s'", cg->id, cg->throttle_io_serviced.filename);
1257             }
1258             else
1259                 debug(D_CGROUP, "throttle_io_serviced file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1260         }
1261
1262         if(unlikely(cgroup_enable_blkio_merged_ops && !cg->io_merged.filename)) {
1263             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_merged", cgroup_blkio_base, cg->id);
1264             if(likely(stat(filename, &buf) != -1)) {
1265                 cg->io_merged.filename = strdupz(filename);
1266                 cg->io_merged.enabled = cgroup_enable_blkio_merged_ops;
1267                 debug(D_CGROUP, "io_merged filename for cgroup '%s': '%s'", cg->id, cg->io_merged.filename);
1268             }
1269             else
1270                 debug(D_CGROUP, "io_merged file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1271         }
1272
1273         if(unlikely(cgroup_enable_blkio_queued_ops && !cg->io_queued.filename)) {
1274             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_queued", cgroup_blkio_base, cg->id);
1275             if(likely(stat(filename, &buf) != -1)) {
1276                 cg->io_queued.filename = strdupz(filename);
1277                 cg->io_queued.enabled = cgroup_enable_blkio_queued_ops;
1278                 debug(D_CGROUP, "io_queued filename for cgroup '%s': '%s'", cg->id, cg->io_queued.filename);
1279             }
1280             else
1281                 debug(D_CGROUP, "io_queued file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1282         }
1283     }
1284
1285     debug(D_CGROUP, "done searching for cgroups");
1286     return;
1287 }
1288
1289 // ----------------------------------------------------------------------------
1290 // generate charts
1291
1292 #define CHART_TITLE_MAX 300
1293
1294 void update_systemd_services_charts(
1295           int update_every
1296         , int do_cpu
1297         , int do_mem_usage
1298         , int do_mem_detailed
1299         , int do_mem_failcnt
1300         , int do_swap_usage
1301         , int do_io
1302         , int do_io_ops
1303         , int do_throttle_io
1304         , int do_throttle_ops
1305         , int do_queued_ops
1306         , int do_merged_ops
1307 ) {
1308     static RRDSET
1309         *st_cpu = NULL,
1310         *st_mem_usage = NULL,
1311         *st_mem_failcnt = NULL,
1312         *st_swap_usage = NULL,
1313
1314         *st_mem_detailed_cache = NULL,
1315         *st_mem_detailed_rss = NULL,
1316         *st_mem_detailed_mapped = NULL,
1317         *st_mem_detailed_writeback = NULL,
1318         *st_mem_detailed_pgfault = NULL,
1319         *st_mem_detailed_pgmajfault = NULL,
1320         *st_mem_detailed_pgpgin = NULL,
1321         *st_mem_detailed_pgpgout = NULL,
1322
1323         *st_io_read = NULL,
1324         *st_io_serviced_read = NULL,
1325         *st_throttle_io_read = NULL,
1326         *st_throttle_ops_read = NULL,
1327         *st_queued_ops_read = NULL,
1328         *st_merged_ops_read = NULL,
1329
1330         *st_io_write = NULL,
1331         *st_io_serviced_write = NULL,
1332         *st_throttle_io_write = NULL,
1333         *st_throttle_ops_write = NULL,
1334         *st_queued_ops_write = NULL,
1335         *st_merged_ops_write = NULL;
1336
1337     // create the charts
1338
1339     if(likely(do_cpu)) {
1340         if(unlikely(!st_cpu)) {
1341             char title[CHART_TITLE_MAX + 1];
1342             snprintfz(title, CHART_TITLE_MAX, "Systemd Services CPU utilization (%d%% = %d core%s)", (processors * 100), processors, (processors > 1) ? "s" : "");
1343
1344             st_cpu = rrdset_create_localhost(
1345                     "services"
1346                     , "cpu"
1347                     , NULL
1348                     , "cpu"
1349                     , "services.cpu"
1350                     , title
1351                     , "%"
1352                     , CHART_PRIORITY_SYSTEMD_SERVICES
1353                     , update_every
1354                     , RRDSET_TYPE_STACKED
1355             );
1356
1357         }
1358         else
1359             rrdset_next(st_cpu);
1360     }
1361
1362     if(likely(do_mem_usage)) {
1363         if(unlikely(!st_mem_usage)) {
1364
1365             st_mem_usage = rrdset_create_localhost(
1366                     "services"
1367                     , "mem_usage"
1368                     , NULL
1369                     , "mem"
1370                     , "services.mem_usage"
1371                     , (cgroup_used_memory_without_cache) ? "Systemd Services Used Memory without Cache"
1372                                                          : "Systemd Services Used Memory"
1373                     , "MB"
1374                     , CHART_PRIORITY_SYSTEMD_SERVICES + 10
1375                     , update_every
1376                     , RRDSET_TYPE_STACKED
1377             );
1378
1379         }
1380         else
1381             rrdset_next(st_mem_usage);
1382     }
1383
1384     if(likely(do_mem_detailed)) {
1385         if(unlikely(!st_mem_detailed_rss)) {
1386
1387             st_mem_detailed_rss = rrdset_create_localhost(
1388                     "services"
1389                     , "mem_rss"
1390                     , NULL
1391                     , "mem"
1392                     , "services.mem_rss"
1393                     , "Systemd Services RSS Memory"
1394                     , "MB"
1395                     , CHART_PRIORITY_SYSTEMD_SERVICES + 20
1396                     , update_every
1397                     , RRDSET_TYPE_STACKED
1398             );
1399
1400         }
1401         else
1402             rrdset_next(st_mem_detailed_rss);
1403
1404         if(unlikely(!st_mem_detailed_mapped)) {
1405
1406             st_mem_detailed_mapped = rrdset_create_localhost(
1407                     "services"
1408                     , "mem_mapped"
1409                     , NULL
1410                     , "mem"
1411                     , "services.mem_mapped"
1412                     , "Systemd Services Mapped Memory"
1413                     , "MB"
1414                     , CHART_PRIORITY_SYSTEMD_SERVICES + 30
1415                     , update_every
1416                     , RRDSET_TYPE_STACKED
1417             );
1418
1419         }
1420         else
1421             rrdset_next(st_mem_detailed_mapped);
1422
1423         if(unlikely(!st_mem_detailed_cache)) {
1424
1425             st_mem_detailed_cache = rrdset_create_localhost(
1426                     "services"
1427                     , "mem_cache"
1428                     , NULL
1429                     , "mem"
1430                     , "services.mem_cache"
1431                     , "Systemd Services Cache Memory"
1432                     , "MB"
1433                     , CHART_PRIORITY_SYSTEMD_SERVICES + 40
1434                     , update_every
1435                     , RRDSET_TYPE_STACKED
1436             );
1437
1438         }
1439         else
1440             rrdset_next(st_mem_detailed_cache);
1441
1442         if(unlikely(!st_mem_detailed_writeback)) {
1443
1444             st_mem_detailed_writeback = rrdset_create_localhost(
1445                     "services"
1446                     , "mem_writeback"
1447                     , NULL
1448                     , "mem"
1449                     , "services.mem_writeback"
1450                     , "Systemd Services Writeback Memory"
1451                     , "MB"
1452                     , CHART_PRIORITY_SYSTEMD_SERVICES + 50
1453                     , update_every
1454                     , RRDSET_TYPE_STACKED
1455             );
1456
1457         }
1458         else
1459             rrdset_next(st_mem_detailed_writeback);
1460
1461         if(unlikely(!st_mem_detailed_pgfault)) {
1462
1463             st_mem_detailed_pgfault = rrdset_create_localhost(
1464                     "services"
1465                     , "mem_pgfault"
1466                     , NULL
1467                     , "mem"
1468                     , "services.mem_pgfault"
1469                     , "Systemd Services Memory Minor Page Faults"
1470                     , "MB/s"
1471                     , CHART_PRIORITY_SYSTEMD_SERVICES + 60
1472                     , update_every
1473                     , RRDSET_TYPE_STACKED
1474             );
1475         }
1476         else
1477             rrdset_next(st_mem_detailed_pgfault);
1478
1479         if(unlikely(!st_mem_detailed_pgmajfault)) {
1480
1481             st_mem_detailed_pgmajfault = rrdset_create_localhost(
1482                     "services"
1483                     , "mem_pgmajfault"
1484                     , NULL
1485                     , "mem"
1486                     , "services.mem_pgmajfault"
1487                     , "Systemd Services Memory Major Page Faults"
1488                     , "MB/s"
1489                     , CHART_PRIORITY_SYSTEMD_SERVICES + 70
1490                     , update_every
1491                     , RRDSET_TYPE_STACKED
1492             );
1493
1494         }
1495         else
1496             rrdset_next(st_mem_detailed_pgmajfault);
1497
1498         if(unlikely(!st_mem_detailed_pgpgin)) {
1499
1500             st_mem_detailed_pgpgin = rrdset_create_localhost(
1501                     "services"
1502                     , "mem_pgpgin"
1503                     , NULL
1504                     , "mem"
1505                     , "services.mem_pgpgin"
1506                     , "Systemd Services Memory Charging Activity"
1507                     , "MB/s"
1508                     , CHART_PRIORITY_SYSTEMD_SERVICES + 80
1509                     , update_every
1510                     , RRDSET_TYPE_STACKED
1511             );
1512
1513         }
1514         else
1515             rrdset_next(st_mem_detailed_pgpgin);
1516
1517         if(unlikely(!st_mem_detailed_pgpgout)) {
1518
1519             st_mem_detailed_pgpgout = rrdset_create_localhost(
1520                     "services"
1521                     , "mem_pgpgout"
1522                     , NULL
1523                     , "mem"
1524                     , "services.mem_pgpgout"
1525                     , "Systemd Services Memory Uncharging Activity"
1526                     , "MB/s"
1527                     , CHART_PRIORITY_SYSTEMD_SERVICES + 90
1528                     , update_every
1529                     , RRDSET_TYPE_STACKED
1530             );
1531
1532         }
1533         else
1534             rrdset_next(st_mem_detailed_pgpgout);
1535     }
1536
1537     if(likely(do_mem_failcnt)) {
1538         if(unlikely(!st_mem_failcnt)) {
1539
1540             st_mem_failcnt = rrdset_create_localhost(
1541                     "services"
1542                     , "mem_failcnt"
1543                     , NULL
1544                     , "mem"
1545                     , "services.mem_failcnt"
1546                     , "Systemd Services Memory Limit Failures"
1547                     , "MB"
1548                     , CHART_PRIORITY_SYSTEMD_SERVICES + 110
1549                     , update_every
1550                     , RRDSET_TYPE_STACKED
1551             );
1552
1553         }
1554         else
1555             rrdset_next(st_mem_failcnt);
1556     }
1557
1558     if(likely(do_swap_usage)) {
1559         if(unlikely(!st_swap_usage)) {
1560
1561             st_swap_usage = rrdset_create_localhost(
1562                     "services"
1563                     , "swap_usage"
1564                     , NULL
1565                     , "swap"
1566                     , "services.swap_usage"
1567                     , "Systemd Services Swap Memory Used"
1568                     , "MB"
1569                     , CHART_PRIORITY_SYSTEMD_SERVICES + 100
1570                     , update_every
1571                     , RRDSET_TYPE_STACKED
1572             );
1573
1574         }
1575         else
1576             rrdset_next(st_swap_usage);
1577     }
1578
1579     if(likely(do_io)) {
1580         if(unlikely(!st_io_read)) {
1581
1582             st_io_read = rrdset_create_localhost(
1583                     "services"
1584                     , "io_read"
1585                     , NULL
1586                     , "disk"
1587                     , "services.io_read"
1588                     , "Systemd Services Disk Read Bandwidth"
1589                     , "KB/s"
1590                     , CHART_PRIORITY_SYSTEMD_SERVICES + 120
1591                     , update_every
1592                     , RRDSET_TYPE_STACKED
1593             );
1594
1595         }
1596         else
1597             rrdset_next(st_io_read);
1598
1599         if(unlikely(!st_io_write)) {
1600
1601             st_io_write = rrdset_create_localhost(
1602                     "services"
1603                     , "io_write"
1604                     , NULL
1605                     , "disk"
1606                     , "services.io_write"
1607                     , "Systemd Services Disk Write Bandwidth"
1608                     , "KB/s"
1609                     , CHART_PRIORITY_SYSTEMD_SERVICES + 130
1610                     , update_every
1611                     , RRDSET_TYPE_STACKED
1612             );
1613
1614         }
1615         else
1616             rrdset_next(st_io_write);
1617     }
1618
1619     if(likely(do_io_ops)) {
1620         if(unlikely(!st_io_serviced_read)) {
1621
1622             st_io_serviced_read = rrdset_create_localhost(
1623                     "services"
1624                     , "io_ops_read"
1625                     , NULL
1626                     , "disk"
1627                     , "services.io_ops_read"
1628                     , "Systemd Services Disk Read Operations"
1629                     , "operations/s"
1630                     , CHART_PRIORITY_SYSTEMD_SERVICES + 140
1631                     , update_every
1632                     , RRDSET_TYPE_STACKED
1633             );
1634
1635         }
1636         else
1637             rrdset_next(st_io_serviced_read);
1638
1639         if(unlikely(!st_io_serviced_write)) {
1640
1641             st_io_serviced_write = rrdset_create_localhost(
1642                     "services"
1643                     , "io_ops_write"
1644                     , NULL
1645                     , "disk"
1646                     , "services.io_ops_write"
1647                     , "Systemd Services Disk Write Operations"
1648                     , "operations/s"
1649                     , CHART_PRIORITY_SYSTEMD_SERVICES + 150
1650                     , update_every
1651                     , RRDSET_TYPE_STACKED
1652             );
1653
1654         }
1655         else
1656             rrdset_next(st_io_serviced_write);
1657     }
1658
1659     if(likely(do_throttle_io)) {
1660         if(unlikely(!st_throttle_io_read)) {
1661
1662             st_throttle_io_read = rrdset_create_localhost(
1663                     "services"
1664                     , "throttle_io_read"
1665                     , NULL
1666                     , "disk"
1667                     , "services.throttle_io_read"
1668                     , "Systemd Services Throttle Disk Read Bandwidth"
1669                     , "KB/s"
1670                     , CHART_PRIORITY_SYSTEMD_SERVICES + 160
1671                     , update_every
1672                     , RRDSET_TYPE_STACKED
1673             );
1674
1675         }
1676         else
1677             rrdset_next(st_throttle_io_read);
1678
1679         if(unlikely(!st_throttle_io_write)) {
1680
1681             st_throttle_io_write = rrdset_create_localhost(
1682                     "services"
1683                     , "throttle_io_write"
1684                     , NULL
1685                     , "disk"
1686                     , "services.throttle_io_write"
1687                     , "Systemd Services Throttle Disk Write Bandwidth"
1688                     , "KB/s"
1689                     , CHART_PRIORITY_SYSTEMD_SERVICES + 170
1690                     , update_every
1691                     , RRDSET_TYPE_STACKED
1692             );
1693
1694         }
1695         else
1696             rrdset_next(st_throttle_io_write);
1697     }
1698
1699     if(likely(do_throttle_ops)) {
1700         if(unlikely(!st_throttle_ops_read)) {
1701
1702             st_throttle_ops_read = rrdset_create_localhost(
1703                     "services"
1704                     , "throttle_io_ops_read"
1705                     , NULL
1706                     , "disk"
1707                     , "services.throttle_io_ops_read"
1708                     , "Systemd Services Throttle Disk Read Operations"
1709                     , "operations/s"
1710                     , CHART_PRIORITY_SYSTEMD_SERVICES + 180
1711                     , update_every
1712                     , RRDSET_TYPE_STACKED
1713             );
1714
1715         }
1716         else
1717             rrdset_next(st_throttle_ops_read);
1718
1719         if(unlikely(!st_throttle_ops_write)) {
1720
1721             st_throttle_ops_write = rrdset_create_localhost(
1722                     "services"
1723                     , "throttle_io_ops_write"
1724                     , NULL
1725                     , "disk"
1726                     , "services.throttle_io_ops_write"
1727                     , "Systemd Services Throttle Disk Write Operations"
1728                     , "operations/s"
1729                     , CHART_PRIORITY_SYSTEMD_SERVICES + 190
1730                     , update_every
1731                     , RRDSET_TYPE_STACKED
1732             );
1733
1734         }
1735         else
1736             rrdset_next(st_throttle_ops_write);
1737     }
1738
1739     if(likely(do_queued_ops)) {
1740         if(unlikely(!st_queued_ops_read)) {
1741
1742             st_queued_ops_read = rrdset_create_localhost(
1743                     "services"
1744                     , "queued_io_ops_read"
1745                     , NULL
1746                     , "disk"
1747                     , "services.queued_io_ops_read"
1748                     , "Systemd Services Queued Disk Read Operations"
1749                     , "operations/s"
1750                     , CHART_PRIORITY_SYSTEMD_SERVICES + 200
1751                     , update_every
1752                     , RRDSET_TYPE_STACKED
1753             );
1754
1755         }
1756         else
1757             rrdset_next(st_queued_ops_read);
1758
1759         if(unlikely(!st_queued_ops_write)) {
1760
1761             st_queued_ops_write = rrdset_create_localhost(
1762                     "services"
1763                     , "queued_io_ops_write"
1764                     , NULL
1765                     , "disk"
1766                     , "services.queued_io_ops_write"
1767                     , "Systemd Services Queued Disk Write Operations"
1768                     , "operations/s"
1769                     , CHART_PRIORITY_SYSTEMD_SERVICES + 210
1770                     , update_every
1771                     , RRDSET_TYPE_STACKED
1772             );
1773
1774         }
1775         else
1776             rrdset_next(st_queued_ops_write);
1777     }
1778
1779     if(likely(do_merged_ops)) {
1780         if(unlikely(!st_merged_ops_read)) {
1781
1782             st_merged_ops_read = rrdset_create_localhost(
1783                     "services"
1784                     , "merged_io_ops_read"
1785                     , NULL
1786                     , "disk"
1787                     , "services.merged_io_ops_read"
1788                     , "Systemd Services Merged Disk Read Operations"
1789                     , "operations/s"
1790                     , CHART_PRIORITY_SYSTEMD_SERVICES + 220
1791                     , update_every
1792                     , RRDSET_TYPE_STACKED
1793             );
1794
1795         }
1796         else
1797             rrdset_next(st_merged_ops_read);
1798
1799         if(unlikely(!st_merged_ops_write)) {
1800
1801             st_merged_ops_write = rrdset_create_localhost(
1802                     "services"
1803                     , "merged_io_ops_write"
1804                     , NULL
1805                     , "disk"
1806                     , "services.merged_io_ops_write"
1807                     , "Systemd Services Merged Disk Write Operations"
1808                     , "operations/s"
1809                     , CHART_PRIORITY_SYSTEMD_SERVICES + 230
1810                     , update_every
1811                     , RRDSET_TYPE_STACKED
1812             );
1813
1814         }
1815         else
1816             rrdset_next(st_merged_ops_write);
1817     }
1818
1819     // update the values
1820     struct cgroup *cg;
1821     for(cg = cgroup_root; cg ; cg = cg->next) {
1822         if(unlikely(!cg->available || !cg->enabled || !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)))
1823             continue;
1824
1825         if(likely(do_cpu && cg->cpuacct_stat.updated)) {
1826             if(unlikely(!cg->rd_cpu))
1827                 cg->rd_cpu = rrddim_add(st_cpu, cg->chart_id, cg->chart_title, 100, hz, RRD_ALGORITHM_INCREMENTAL);
1828
1829             rrddim_set_by_pointer(st_cpu, cg->rd_cpu, cg->cpuacct_stat.user + cg->cpuacct_stat.system);
1830         }
1831
1832         if(likely(do_mem_usage && cg->memory.updated_usage_in_bytes)) {
1833             if(unlikely(!cg->rd_mem_usage))
1834                 cg->rd_mem_usage = rrddim_add(st_mem_usage, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1835
1836             rrddim_set_by_pointer(st_mem_usage, cg->rd_mem_usage, cg->memory.usage_in_bytes - ((cgroup_used_memory_without_cache)?cg->memory.cache:0));
1837         }
1838
1839         if(likely(do_mem_detailed && cg->memory.updated_detailed)) {
1840             if(unlikely(!cg->rd_mem_detailed_rss))
1841                 cg->rd_mem_detailed_rss = rrddim_add(st_mem_detailed_rss, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1842
1843             rrddim_set_by_pointer(st_mem_detailed_rss, cg->rd_mem_detailed_rss, cg->memory.rss + cg->memory.rss_huge);
1844
1845             if(unlikely(!cg->rd_mem_detailed_mapped))
1846                 cg->rd_mem_detailed_mapped = rrddim_add(st_mem_detailed_mapped, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1847
1848             rrddim_set_by_pointer(st_mem_detailed_mapped, cg->rd_mem_detailed_mapped, cg->memory.mapped_file);
1849
1850             if(unlikely(!cg->rd_mem_detailed_cache))
1851                 cg->rd_mem_detailed_cache = rrddim_add(st_mem_detailed_cache, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1852
1853             rrddim_set_by_pointer(st_mem_detailed_cache, cg->rd_mem_detailed_cache, cg->memory.cache);
1854
1855             if(unlikely(!cg->rd_mem_detailed_writeback))
1856                 cg->rd_mem_detailed_writeback = rrddim_add(st_mem_detailed_writeback, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1857
1858             rrddim_set_by_pointer(st_mem_detailed_writeback, cg->rd_mem_detailed_writeback, cg->memory.writeback);
1859
1860             if(unlikely(!cg->rd_mem_detailed_pgfault))
1861                 cg->rd_mem_detailed_pgfault = rrddim_add(st_mem_detailed_pgfault, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
1862
1863             rrddim_set_by_pointer(st_mem_detailed_pgfault, cg->rd_mem_detailed_pgfault, cg->memory.pgfault);
1864
1865             if(unlikely(!cg->rd_mem_detailed_pgmajfault))
1866                 cg->rd_mem_detailed_pgmajfault = rrddim_add(st_mem_detailed_pgmajfault, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
1867
1868             rrddim_set_by_pointer(st_mem_detailed_pgmajfault, cg->rd_mem_detailed_pgmajfault, cg->memory.pgmajfault);
1869
1870             if(unlikely(!cg->rd_mem_detailed_pgpgin))
1871                 cg->rd_mem_detailed_pgpgin = rrddim_add(st_mem_detailed_pgpgin, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
1872
1873             rrddim_set_by_pointer(st_mem_detailed_pgpgin, cg->rd_mem_detailed_pgpgin, cg->memory.pgpgin);
1874
1875             if(unlikely(!cg->rd_mem_detailed_pgpgout))
1876                 cg->rd_mem_detailed_pgpgout = rrddim_add(st_mem_detailed_pgpgout, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
1877
1878             rrddim_set_by_pointer(st_mem_detailed_pgpgout, cg->rd_mem_detailed_pgpgout, cg->memory.pgpgout);
1879         }
1880
1881         if(likely(do_mem_failcnt && cg->memory.updated_failcnt)) {
1882             if(unlikely(!cg->rd_mem_failcnt))
1883                 cg->rd_mem_failcnt = rrddim_add(st_mem_failcnt, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1884
1885             rrddim_set_by_pointer(st_mem_failcnt, cg->rd_mem_failcnt, cg->memory.failcnt);
1886         }
1887
1888         if(likely(do_swap_usage && cg->memory.updated_msw_usage_in_bytes)) {
1889             if(unlikely(!cg->rd_swap_usage))
1890                 cg->rd_swap_usage = rrddim_add(st_swap_usage, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1891
1892             rrddim_set_by_pointer(st_swap_usage, cg->rd_swap_usage, cg->memory.msw_usage_in_bytes);
1893         }
1894
1895         if(likely(do_io && cg->io_service_bytes.updated)) {
1896             if(unlikely(!cg->rd_io_service_bytes_read))
1897                 cg->rd_io_service_bytes_read = rrddim_add(st_io_read, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
1898
1899             rrddim_set_by_pointer(st_io_read, cg->rd_io_service_bytes_read, cg->io_service_bytes.Read);
1900
1901             if(unlikely(!cg->rd_io_service_bytes_write))
1902                 cg->rd_io_service_bytes_write = rrddim_add(st_io_write, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
1903
1904             rrddim_set_by_pointer(st_io_write, cg->rd_io_service_bytes_write, cg->io_service_bytes.Write);
1905         }
1906
1907         if(likely(do_io_ops && cg->io_serviced.updated)) {
1908             if(unlikely(!cg->rd_io_serviced_read))
1909                 cg->rd_io_serviced_read = rrddim_add(st_io_serviced_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1910
1911             rrddim_set_by_pointer(st_io_serviced_read, cg->rd_io_serviced_read, cg->io_serviced.Read);
1912
1913             if(unlikely(!cg->rd_io_serviced_write))
1914                 cg->rd_io_serviced_write = rrddim_add(st_io_serviced_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1915
1916             rrddim_set_by_pointer(st_io_serviced_write, cg->rd_io_serviced_write, cg->io_serviced.Write);
1917         }
1918
1919         if(likely(do_throttle_io && cg->throttle_io_service_bytes.updated)) {
1920             if(unlikely(!cg->rd_throttle_io_read))
1921                 cg->rd_throttle_io_read = rrddim_add(st_throttle_io_read, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
1922
1923             rrddim_set_by_pointer(st_throttle_io_read, cg->rd_throttle_io_read, cg->throttle_io_service_bytes.Read);
1924
1925             if(unlikely(!cg->rd_throttle_io_write))
1926                 cg->rd_throttle_io_write = rrddim_add(st_throttle_io_write, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
1927
1928             rrddim_set_by_pointer(st_throttle_io_write, cg->rd_throttle_io_write, cg->throttle_io_service_bytes.Write);
1929         }
1930
1931         if(likely(do_throttle_ops && cg->throttle_io_serviced.updated)) {
1932             if(unlikely(!cg->rd_throttle_io_serviced_read))
1933                 cg->rd_throttle_io_serviced_read = rrddim_add(st_throttle_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1934
1935             rrddim_set_by_pointer(st_throttle_ops_read, cg->rd_throttle_io_serviced_read, cg->throttle_io_serviced.Read);
1936
1937             if(unlikely(!cg->rd_throttle_io_serviced_write))
1938                 cg->rd_throttle_io_serviced_write = rrddim_add(st_throttle_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1939
1940             rrddim_set_by_pointer(st_throttle_ops_write, cg->rd_throttle_io_serviced_write, cg->throttle_io_serviced.Write);
1941         }
1942
1943         if(likely(do_queued_ops && cg->io_queued.updated)) {
1944             if(unlikely(!cg->rd_io_queued_read))
1945                 cg->rd_io_queued_read = rrddim_add(st_queued_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1946
1947             rrddim_set_by_pointer(st_queued_ops_read, cg->rd_io_queued_read, cg->io_queued.Read);
1948
1949             if(unlikely(!cg->rd_io_queued_write))
1950                 cg->rd_io_queued_write = rrddim_add(st_queued_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1951
1952             rrddim_set_by_pointer(st_queued_ops_write, cg->rd_io_queued_write, cg->io_queued.Write);
1953         }
1954
1955         if(likely(do_merged_ops && cg->io_merged.updated)) {
1956             if(unlikely(!cg->rd_io_merged_read))
1957                 cg->rd_io_merged_read = rrddim_add(st_merged_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1958
1959             rrddim_set_by_pointer(st_merged_ops_read, cg->rd_io_merged_read, cg->io_merged.Read);
1960
1961             if(unlikely(!cg->rd_io_merged_write))
1962                 cg->rd_io_merged_write = rrddim_add(st_merged_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1963
1964             rrddim_set_by_pointer(st_merged_ops_write, cg->rd_io_merged_write, cg->io_merged.Write);
1965         }
1966     }
1967
1968     // complete the iteration
1969     if(likely(do_cpu))
1970         rrdset_done(st_cpu);
1971
1972     if(likely(do_mem_usage))
1973         rrdset_done(st_mem_usage);
1974
1975     if(unlikely(do_mem_detailed)) {
1976         rrdset_done(st_mem_detailed_cache);
1977         rrdset_done(st_mem_detailed_rss);
1978         rrdset_done(st_mem_detailed_mapped);
1979         rrdset_done(st_mem_detailed_writeback);
1980         rrdset_done(st_mem_detailed_pgfault);
1981         rrdset_done(st_mem_detailed_pgmajfault);
1982         rrdset_done(st_mem_detailed_pgpgin);
1983         rrdset_done(st_mem_detailed_pgpgout);
1984     }
1985
1986     if(likely(do_mem_failcnt))
1987         rrdset_done(st_mem_failcnt);
1988
1989     if(likely(do_swap_usage))
1990         rrdset_done(st_swap_usage);
1991
1992     if(likely(do_io)) {
1993         rrdset_done(st_io_read);
1994         rrdset_done(st_io_write);
1995     }
1996
1997     if(likely(do_io_ops)) {
1998         rrdset_done(st_io_serviced_read);
1999         rrdset_done(st_io_serviced_write);
2000     }
2001
2002     if(likely(do_throttle_io)) {
2003         rrdset_done(st_throttle_io_read);
2004         rrdset_done(st_throttle_io_write);
2005     }
2006
2007     if(likely(do_throttle_ops)) {
2008         rrdset_done(st_throttle_ops_read);
2009         rrdset_done(st_throttle_ops_write);
2010     }
2011
2012     if(likely(do_queued_ops)) {
2013         rrdset_done(st_queued_ops_read);
2014         rrdset_done(st_queued_ops_write);
2015     }
2016
2017     if(likely(do_merged_ops)) {
2018         rrdset_done(st_merged_ops_read);
2019         rrdset_done(st_merged_ops_write);
2020     }
2021 }
2022
// Lazily build the chart "type" string for a cgroup.
//
//   buffer - caller-owned scratch buffer. When it already holds a non-empty
//            string it is returned untouched, so the formatting work is done
//            at most once for as long as the caller keeps the buffer filled.
//   id     - cgroup chart id. An empty id or a lone "/" produces
//            "cgroup_root"; any other id produces "cgroup_<id>".
//   len    - size limit, handed unchanged to snprintfz().
//
// Returns buffer, after it has been passed through netdata_fix_chart_id().
static inline char *cgroup_chart_type(char *buffer, const char *id, size_t len) {
    // already computed by an earlier call on the same buffer
    if(buffer[0]) return buffer;

    // Both branches go through snprintfz() so the result is bounded the same
    // way; strncpy() would leave the buffer unterminated when the literal
    // does not fit within len.
    if(id[0] == '\0' || (id[0] == '/' && id[1] == '\0'))
        snprintfz(buffer, len, "cgroup_root");
    else
        snprintfz(buffer, len, "cgroup_%s", id);

    netdata_fix_chart_id(buffer);
    return buffer;
}
2034
2035 void update_cgroup_charts(int update_every) {
2036     debug(D_CGROUP, "updating cgroups charts");
2037
2038     char type[RRD_ID_LENGTH_MAX + 1];
2039     char title[CHART_TITLE_MAX + 1];
2040
2041     int services_do_cpu = 0,
2042             services_do_mem_usage = 0,
2043             services_do_mem_detailed = 0,
2044             services_do_mem_failcnt = 0,
2045             services_do_swap_usage = 0,
2046             services_do_io = 0,
2047             services_do_io_ops = 0,
2048             services_do_throttle_io = 0,
2049             services_do_throttle_ops = 0,
2050             services_do_queued_ops = 0,
2051             services_do_merged_ops = 0;
2052
2053     struct cgroup *cg;
2054     for(cg = cgroup_root; cg ; cg = cg->next) {
2055         if(unlikely(!cg->available || !cg->enabled))
2056             continue;
2057
2058         if(likely(cgroup_enable_systemd_services && cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)) {
2059             if(cg->cpuacct_stat.updated && cg->cpuacct_stat.enabled == CONFIG_BOOLEAN_YES) services_do_cpu++;
2060
2061             if(cgroup_enable_systemd_services_detailed_memory && cg->memory.updated_detailed && cg->memory.enabled_detailed) services_do_mem_detailed++;
2062             if(cg->memory.updated_usage_in_bytes && cg->memory.enabled_usage_in_bytes == CONFIG_BOOLEAN_YES) services_do_mem_usage++;
2063             if(cg->memory.updated_failcnt && cg->memory.enabled_failcnt == CONFIG_BOOLEAN_YES) services_do_mem_failcnt++;
2064             if(cg->memory.updated_msw_usage_in_bytes && cg->memory.enabled_msw_usage_in_bytes == CONFIG_BOOLEAN_YES) services_do_swap_usage++;
2065
2066             if(cg->io_service_bytes.updated && cg->io_service_bytes.enabled == CONFIG_BOOLEAN_YES) services_do_io++;
2067             if(cg->io_serviced.updated && cg->io_serviced.enabled == CONFIG_BOOLEAN_YES) services_do_io_ops++;
2068             if(cg->throttle_io_service_bytes.updated && cg->throttle_io_service_bytes.enabled == CONFIG_BOOLEAN_YES) services_do_throttle_io++;
2069             if(cg->throttle_io_serviced.updated && cg->throttle_io_serviced.enabled == CONFIG_BOOLEAN_YES) services_do_throttle_ops++;
2070             if(cg->io_queued.updated && cg->io_queued.enabled == CONFIG_BOOLEAN_YES) services_do_queued_ops++;
2071             if(cg->io_merged.updated && cg->io_merged.enabled == CONFIG_BOOLEAN_YES) services_do_merged_ops++;
2072             continue;
2073         }
2074
2075         type[0] = '\0';
2076
2077         if(likely(cg->cpuacct_stat.updated && cg->cpuacct_stat.enabled == CONFIG_BOOLEAN_YES)) {
2078             if(unlikely(!cg->st_cpu)) {
2079                 snprintfz(title, CHART_TITLE_MAX, "CPU Usage (%d%% = %d core%s) for cgroup %s", (processors * 100), processors, (processors > 1) ? "s" : "", cg->chart_title);
2080
2081                 cg->st_cpu = rrdset_create_localhost(
2082                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2083                         , "cpu"
2084                         , NULL
2085                         , "cpu"
2086                         , "cgroup.cpu"
2087                         , title
2088                         , "%"
2089                         , CHART_PRIORITY_CONTAINERS
2090                         , update_every
2091                         , RRDSET_TYPE_STACKED
2092                 );
2093
2094                 rrddim_add(cg->st_cpu, "user", NULL, 100, hz, RRD_ALGORITHM_INCREMENTAL);
2095                 rrddim_add(cg->st_cpu, "system", NULL, 100, hz, RRD_ALGORITHM_INCREMENTAL);
2096             }
2097             else
2098                 rrdset_next(cg->st_cpu);
2099
2100             rrddim_set(cg->st_cpu, "user", cg->cpuacct_stat.user);
2101             rrddim_set(cg->st_cpu, "system", cg->cpuacct_stat.system);
2102             rrdset_done(cg->st_cpu);
2103         }
2104
2105         if(likely(cg->cpuacct_usage.updated && cg->cpuacct_usage.enabled == CONFIG_BOOLEAN_YES)) {
2106             char id[RRD_ID_LENGTH_MAX + 1];
2107             unsigned int i;
2108
2109             if(unlikely(!cg->st_cpu_per_core)) {
2110                 snprintfz(title, CHART_TITLE_MAX, "CPU Usage (%d%% = %d core%s) Per Core for cgroup %s", (processors * 100), processors, (processors > 1) ? "s" : "", cg->chart_title);
2111
2112                 cg->st_cpu_per_core = rrdset_create_localhost(
2113                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2114                         , "cpu_per_core"
2115                         , NULL
2116                         , "cpu"
2117                         , "cgroup.cpu_per_core"
2118                         , title
2119                         , "%"
2120                         , CHART_PRIORITY_CONTAINERS + 100
2121                         , update_every
2122                         , RRDSET_TYPE_STACKED
2123                 );
2124
2125                 for(i = 0; i < cg->cpuacct_usage.cpus; i++) {
2126                     snprintfz(id, RRD_ID_LENGTH_MAX, "cpu%u", i);
2127                     rrddim_add(cg->st_cpu_per_core, id, NULL, 100, 1000000000, RRD_ALGORITHM_INCREMENTAL);
2128                 }
2129             }
2130             else
2131                 rrdset_next(cg->st_cpu_per_core);
2132
2133             for(i = 0; i < cg->cpuacct_usage.cpus ;i++) {
2134                 snprintfz(id, RRD_ID_LENGTH_MAX, "cpu%u", i);
2135                 rrddim_set(cg->st_cpu_per_core, id, cg->cpuacct_usage.cpu_percpu[i]);
2136             }
2137             rrdset_done(cg->st_cpu_per_core);
2138         }
2139
2140         if(likely(cg->memory.updated_detailed && cg->memory.enabled_detailed == CONFIG_BOOLEAN_YES)) {
2141             if(unlikely(!cg->st_mem)) {
2142                 snprintfz(title, CHART_TITLE_MAX, "Memory Usage for cgroup %s", cg->chart_title);
2143
2144                 cg->st_mem = rrdset_create_localhost(
2145                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2146                         , "mem"
2147                         , NULL
2148                         , "mem"
2149                         , "cgroup.mem"
2150                         , title
2151                         , "MB"
2152                         , CHART_PRIORITY_CONTAINERS + 210
2153                         , update_every
2154                         , RRDSET_TYPE_STACKED
2155                 );
2156
2157                 rrddim_add(cg->st_mem, "cache", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2158                 rrddim_add(cg->st_mem, "rss", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2159
2160                 if(cg->memory.detailed_has_swap)
2161                     rrddim_add(cg->st_mem, "swap", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2162
2163                 rrddim_add(cg->st_mem, "rss_huge", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2164                 rrddim_add(cg->st_mem, "mapped_file", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2165             }
2166             else
2167                 rrdset_next(cg->st_mem);
2168
2169             rrddim_set(cg->st_mem, "cache", cg->memory.cache);
2170             rrddim_set(cg->st_mem, "rss", cg->memory.rss);
2171
2172             if(cg->memory.detailed_has_swap)
2173                 rrddim_set(cg->st_mem, "swap", cg->memory.swap);
2174
2175             rrddim_set(cg->st_mem, "rss_huge", cg->memory.rss_huge);
2176             rrddim_set(cg->st_mem, "mapped_file", cg->memory.mapped_file);
2177             rrdset_done(cg->st_mem);
2178
2179             if(unlikely(!cg->st_writeback)) {
2180                 snprintfz(title, CHART_TITLE_MAX, "Writeback Memory for cgroup %s", cg->chart_title);
2181
2182                 cg->st_writeback = rrdset_create_localhost(
2183                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2184                         , "writeback"
2185                         , NULL
2186                         , "mem"
2187                         , "cgroup.writeback"
2188                         , title
2189                         , "MB"
2190                         , CHART_PRIORITY_CONTAINERS + 300
2191                         , update_every
2192                         , RRDSET_TYPE_AREA
2193                 );
2194
2195                 if(cg->memory.detailed_has_dirty)
2196                     rrddim_add(cg->st_writeback, "dirty", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2197
2198                 rrddim_add(cg->st_writeback, "writeback", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2199             }
2200             else
2201                 rrdset_next(cg->st_writeback);
2202
2203             if(cg->memory.detailed_has_dirty)
2204                 rrddim_set(cg->st_writeback, "dirty", cg->memory.dirty);
2205
2206             rrddim_set(cg->st_writeback, "writeback", cg->memory.writeback);
2207             rrdset_done(cg->st_writeback);
2208
2209             if(unlikely(!cg->st_mem_activity)) {
2210                 snprintfz(title, CHART_TITLE_MAX, "Memory Activity for cgroup %s", cg->chart_title);
2211
2212                 cg->st_mem_activity = rrdset_create_localhost(
2213                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2214                         , "mem_activity"
2215                         , NULL
2216                         , "mem"
2217                         , "cgroup.mem_activity"
2218                         , title
2219                         , "MB/s"
2220                         , CHART_PRIORITY_CONTAINERS + 400
2221                         , update_every
2222                         , RRDSET_TYPE_LINE
2223                 );
2224
2225                 rrddim_add(cg->st_mem_activity, "pgpgin", "in", system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
2226                 rrddim_add(cg->st_mem_activity, "pgpgout", "out", -system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
2227             }
2228             else
2229                 rrdset_next(cg->st_mem_activity);
2230
2231             rrddim_set(cg->st_mem_activity, "pgpgin", cg->memory.pgpgin);
2232             rrddim_set(cg->st_mem_activity, "pgpgout", cg->memory.pgpgout);
2233             rrdset_done(cg->st_mem_activity);
2234
2235             if(unlikely(!cg->st_pgfaults)) {
2236                 snprintfz(title, CHART_TITLE_MAX, "Memory Page Faults for cgroup %s", cg->chart_title);
2237
2238                 cg->st_pgfaults = rrdset_create_localhost(
2239                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2240                         , "pgfaults"
2241                         , NULL
2242                         , "mem"
2243                         , "cgroup.pgfaults"
2244                         , title
2245                         , "MB/s"
2246                         , CHART_PRIORITY_CONTAINERS + 500
2247                         , update_every
2248                         , RRDSET_TYPE_LINE
2249                 );
2250
2251                 rrddim_add(cg->st_pgfaults, "pgfault", NULL, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
2252                 rrddim_add(cg->st_pgfaults, "pgmajfault", "swap", -system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
2253             }
2254             else
2255                 rrdset_next(cg->st_pgfaults);
2256
2257             rrddim_set(cg->st_pgfaults, "pgfault", cg->memory.pgfault);
2258             rrddim_set(cg->st_pgfaults, "pgmajfault", cg->memory.pgmajfault);
2259             rrdset_done(cg->st_pgfaults);
2260         }
2261
2262         if(likely(cg->memory.updated_usage_in_bytes && cg->memory.enabled_usage_in_bytes == CONFIG_BOOLEAN_YES)) {
2263             if(unlikely(!cg->st_mem_usage)) {
2264                 snprintfz(title, CHART_TITLE_MAX, "Used Memory %sfor cgroup %s", (cgroup_used_memory_without_cache && cg->memory.updated_detailed)?"without Cache ":"", cg->chart_title);
2265
2266                 cg->st_mem_usage = rrdset_create_localhost(
2267                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2268                         , "mem_usage"
2269                         , NULL
2270                         , "mem"
2271                         , "cgroup.mem_usage"
2272                         , title
2273                         , "MB"
2274                         , CHART_PRIORITY_CONTAINERS + 200
2275                         , update_every
2276                         , RRDSET_TYPE_STACKED
2277                 );
2278
2279                 rrddim_add(cg->st_mem_usage, "ram", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2280                 rrddim_add(cg->st_mem_usage, "swap", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2281             }
2282             else
2283                 rrdset_next(cg->st_mem_usage);
2284
2285             rrddim_set(cg->st_mem_usage, "ram", cg->memory.usage_in_bytes - ((cgroup_used_memory_without_cache)?cg->memory.cache:0));
2286             rrddim_set(cg->st_mem_usage, "swap", (cg->memory.msw_usage_in_bytes > cg->memory.usage_in_bytes)?cg->memory.msw_usage_in_bytes - cg->memory.usage_in_bytes:0);
2287             rrdset_done(cg->st_mem_usage);
2288         }
2289
2290         if(likely(cg->memory.updated_failcnt && cg->memory.enabled_failcnt == CONFIG_BOOLEAN_YES)) {
2291             if(unlikely(!cg->st_mem_failcnt)) {
2292                 snprintfz(title, CHART_TITLE_MAX, "Memory Limit Failures for cgroup %s", cg->chart_title);
2293
2294                 cg->st_mem_failcnt = rrdset_create_localhost(
2295                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2296                         , "mem_failcnt"
2297                         , NULL
2298                         , "mem"
2299                         , "cgroup.mem_failcnt"
2300                         , title
2301                         , "count"
2302                         , CHART_PRIORITY_CONTAINERS + 250
2303                         , update_every
2304                         , RRDSET_TYPE_LINE
2305                 );
2306
2307                 rrddim_add(cg->st_mem_failcnt, "failures", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
2308             }
2309             else
2310                 rrdset_next(cg->st_mem_failcnt);
2311
2312             rrddim_set(cg->st_mem_failcnt, "failures", cg->memory.failcnt);
2313             rrdset_done(cg->st_mem_failcnt);
2314         }
2315
2316         if(likely(cg->io_service_bytes.updated && cg->io_service_bytes.enabled == CONFIG_BOOLEAN_YES)) {
2317             if(unlikely(!cg->st_io)) {
2318                 snprintfz(title, CHART_TITLE_MAX, "I/O Bandwidth (all disks) for cgroup %s", cg->chart_title);
2319
2320                 cg->st_io = rrdset_create_localhost(
2321                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2322                         , "io"
2323                         , NULL
2324                         , "disk"
2325                         , "cgroup.io"
2326                         , title
2327                         , "KB/s"
2328                         , CHART_PRIORITY_CONTAINERS + 1200
2329                         , update_every
2330                         , RRDSET_TYPE_AREA
2331                 );
2332
2333                 rrddim_add(cg->st_io, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
2334                 rrddim_add(cg->st_io, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
2335             }
2336             else
2337                 rrdset_next(cg->st_io);
2338
2339             rrddim_set(cg->st_io, "read", cg->io_service_bytes.Read);
2340             rrddim_set(cg->st_io, "write", cg->io_service_bytes.Write);
2341             rrdset_done(cg->st_io);
2342         }
2343
2344         if(likely(cg->io_serviced.updated && cg->io_serviced.enabled == CONFIG_BOOLEAN_YES)) {
2345             if(unlikely(!cg->st_serviced_ops)) {
2346                 snprintfz(title, CHART_TITLE_MAX, "Serviced I/O Operations (all disks) for cgroup %s", cg->chart_title);
2347
2348                 cg->st_serviced_ops = rrdset_create_localhost(
2349                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2350                         , "serviced_ops"
2351                         , NULL
2352                         , "disk"
2353                         , "cgroup.serviced_ops"
2354                         , title
2355                         , "operations/s"
2356                         , CHART_PRIORITY_CONTAINERS + 1200
2357                         , update_every
2358                         , RRDSET_TYPE_LINE
2359                 );
2360
2361                 rrddim_add(cg->st_serviced_ops, "read", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
2362                 rrddim_add(cg->st_serviced_ops, "write", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
2363             }
2364             else
2365                 rrdset_next(cg->st_serviced_ops);
2366
2367             rrddim_set(cg->st_serviced_ops, "read", cg->io_serviced.Read);
2368             rrddim_set(cg->st_serviced_ops, "write", cg->io_serviced.Write);
2369             rrdset_done(cg->st_serviced_ops);
2370         }
2371
2372         if(likely(cg->throttle_io_service_bytes.updated && cg->throttle_io_service_bytes.enabled == CONFIG_BOOLEAN_YES)) {
2373             if(unlikely(!cg->st_throttle_io)) {
2374                 snprintfz(title, CHART_TITLE_MAX, "Throttle I/O Bandwidth (all disks) for cgroup %s", cg->chart_title);
2375
2376                 cg->st_throttle_io = rrdset_create_localhost(
2377                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2378                         , "throttle_io"
2379                         , NULL
2380                         , "disk"
2381                         , "cgroup.throttle_io"
2382                         , title
2383                         , "KB/s"
2384                         , CHART_PRIORITY_CONTAINERS + 1200
2385                         , update_every
2386                         , RRDSET_TYPE_AREA
2387                 );
2388
2389                 rrddim_add(cg->st_throttle_io, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
2390                 rrddim_add(cg->st_throttle_io, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
2391             }
2392             else
2393                 rrdset_next(cg->st_throttle_io);
2394
2395             rrddim_set(cg->st_throttle_io, "read", cg->throttle_io_service_bytes.Read);
2396             rrddim_set(cg->st_throttle_io, "write", cg->throttle_io_service_bytes.Write);
2397             rrdset_done(cg->st_throttle_io);
2398         }
2399
2400         if(likely(cg->throttle_io_serviced.updated && cg->throttle_io_serviced.enabled == CONFIG_BOOLEAN_YES)) {
2401             if(unlikely(!cg->st_throttle_serviced_ops)) {
2402                 snprintfz(title, CHART_TITLE_MAX, "Throttle Serviced I/O Operations (all disks) for cgroup %s", cg->chart_title);
2403
2404                 cg->st_throttle_serviced_ops = rrdset_create_localhost(
2405                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2406                         , "throttle_serviced_ops"
2407                         , NULL
2408                         , "disk"
2409                         , "cgroup.throttle_serviced_ops"
2410                         , title
2411                         , "operations/s"
2412                         , CHART_PRIORITY_CONTAINERS + 1200
2413                         , update_every
2414                         , RRDSET_TYPE_LINE
2415                 );
2416
2417                 rrddim_add(cg->st_throttle_serviced_ops, "read", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
2418                 rrddim_add(cg->st_throttle_serviced_ops, "write", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
2419             }
2420             else
2421                 rrdset_next(cg->st_throttle_serviced_ops);
2422
2423             rrddim_set(cg->st_throttle_serviced_ops, "read", cg->throttle_io_serviced.Read);
2424             rrddim_set(cg->st_throttle_serviced_ops, "write", cg->throttle_io_serviced.Write);
2425             rrdset_done(cg->st_throttle_serviced_ops);
2426         }
2427
2428         if(likely(cg->io_queued.updated && cg->io_queued.enabled == CONFIG_BOOLEAN_YES)) {
2429             if(unlikely(!cg->st_queued_ops)) {
2430                 snprintfz(title, CHART_TITLE_MAX, "Queued I/O Operations (all disks) for cgroup %s", cg->chart_title);
2431
2432                 cg->st_queued_ops = rrdset_create_localhost(
2433                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2434                         , "queued_ops"
2435                         , NULL
2436                         , "disk"
2437                         , "cgroup.queued_ops"
2438                         , title
2439                         , "operations"
2440                         , CHART_PRIORITY_CONTAINERS + 2000
2441                         , update_every
2442                         , RRDSET_TYPE_LINE
2443                 );
2444
2445                 rrddim_add(cg->st_queued_ops, "read", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
2446                 rrddim_add(cg->st_queued_ops, "write", NULL, -1, 1, RRD_ALGORITHM_ABSOLUTE);
2447             }
2448             else
2449                 rrdset_next(cg->st_queued_ops);
2450
2451             rrddim_set(cg->st_queued_ops, "read", cg->io_queued.Read);
2452             rrddim_set(cg->st_queued_ops, "write", cg->io_queued.Write);
2453             rrdset_done(cg->st_queued_ops);
2454         }
2455
2456         if(likely(cg->io_merged.updated && cg->io_merged.enabled == CONFIG_BOOLEAN_YES)) {
2457             if(unlikely(!cg->st_merged_ops)) {
2458                 snprintfz(title, CHART_TITLE_MAX, "Merged I/O Operations (all disks) for cgroup %s", cg->chart_title);
2459
2460                 cg->st_merged_ops = rrdset_create_localhost(
2461                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2462                         , "merged_ops"
2463                         , NULL
2464                         , "disk"
2465                         , "cgroup.merged_ops"
2466                         , title
2467                         , "operations/s"
2468                         , CHART_PRIORITY_CONTAINERS + 2100
2469                         , update_every
2470                         , RRDSET_TYPE_LINE
2471                 );
2472
2473                 rrddim_add(cg->st_merged_ops, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
2474                 rrddim_add(cg->st_merged_ops, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
2475             }
2476             else
2477                 rrdset_next(cg->st_merged_ops);
2478
2479             rrddim_set(cg->st_merged_ops, "read", cg->io_merged.Read);
2480             rrddim_set(cg->st_merged_ops, "write", cg->io_merged.Write);
2481             rrdset_done(cg->st_merged_ops);
2482         }
2483     }
2484
2485     if(likely(cgroup_enable_systemd_services))
2486         update_systemd_services_charts(update_every, services_do_cpu, services_do_mem_usage, services_do_mem_detailed
2487                                        , services_do_mem_failcnt, services_do_swap_usage, services_do_io
2488                                        , services_do_io_ops, services_do_throttle_io, services_do_throttle_ops
2489                                        , services_do_queued_ops, services_do_merged_ops
2490         );
2491
2492     debug(D_CGROUP, "done updating cgroups charts");
2493 }
2494
2495 // ----------------------------------------------------------------------------
2496 // cgroups main
2497
2498 void *cgroups_main(void *ptr) {
2499     struct netdata_static_thread *static_thread = (struct netdata_static_thread *)ptr;
2500
2501     info("CGROUP Plugin thread created with task id %d", gettid());
2502
2503     if(pthread_setcanceltype(PTHREAD_CANCEL_DEFERRED, NULL) != 0)
2504         error("Cannot set pthread cancel type to DEFERRED.");
2505
2506     if(pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, NULL) != 0)
2507         error("Cannot set pthread cancel state to ENABLE.");
2508
2509     struct rusage thread;
2510
2511     // when ZERO, attempt to do it
2512     int vdo_cpu_netdata = config_get_boolean("plugin:cgroups", "cgroups plugin resource charts", 1);
2513
2514     read_cgroup_plugin_configuration();
2515
2516     RRDSET *stcpu_thread = NULL;
2517
2518     heartbeat_t hb;
2519     heartbeat_init(&hb);
2520     usec_t step = cgroup_update_every * USEC_PER_SEC;
2521     usec_t find_every = cgroup_check_for_new_every * USEC_PER_SEC, find_dt = 0;
2522     for(;;) {
2523         usec_t hb_dt = heartbeat_next(&hb, step);
2524         if(unlikely(netdata_exit)) break;
2525
2526         // BEGIN -- the job to be done
2527
2528         find_dt += hb_dt;
2529         if(unlikely(find_dt >= find_every || cgroups_check)) {
2530             find_all_cgroups();
2531             find_dt = 0;
2532             cgroups_check = 0;
2533         }
2534
2535         read_all_cgroups(cgroup_root);
2536         update_cgroup_charts(cgroup_update_every);
2537
2538         // END -- the job is done
2539
2540         // --------------------------------------------------------------------
2541
2542         if(vdo_cpu_netdata) {
2543             getrusage(RUSAGE_THREAD, &thread);
2544
2545             if(unlikely(!stcpu_thread)) {
2546
2547                 stcpu_thread = rrdset_create_localhost(
2548                         "netdata"
2549                         , "plugin_cgroups_cpu"
2550                         , NULL
2551                         , "cgroups"
2552                         , NULL
2553                         , "NetData CGroups Plugin CPU usage"
2554                         , "milliseconds/s"
2555                         , 132000
2556                         , cgroup_update_every
2557                         , RRDSET_TYPE_STACKED
2558                 );
2559
2560                 rrddim_add(stcpu_thread, "user",  NULL,  1, 1000, RRD_ALGORITHM_INCREMENTAL);
2561                 rrddim_add(stcpu_thread, "system", NULL, 1, 1000, RRD_ALGORITHM_INCREMENTAL);
2562             }
2563             else
2564                 rrdset_next(stcpu_thread);
2565
2566             rrddim_set(stcpu_thread, "user"  , thread.ru_utime.tv_sec * 1000000ULL + thread.ru_utime.tv_usec);
2567             rrddim_set(stcpu_thread, "system", thread.ru_stime.tv_sec * 1000000ULL + thread.ru_stime.tv_usec);
2568             rrdset_done(stcpu_thread);
2569         }
2570     }
2571
2572     info("CGROUP thread exiting");
2573
2574     static_thread->enabled = 0;
2575     pthread_exit(NULL);
2576     return NULL;
2577 }