]> arthur.barton.de Git - netdata.git/blob - src/sys_fs_cgroup.c
9c2f749e629bdfc188aa929929d5e6f4c81f53b1
[netdata.git] / src / sys_fs_cgroup.c
1 #include "common.h"
2
3 // ----------------------------------------------------------------------------
4 // cgroup globals
5
6 #define CHART_PRIORITY_SYSTEMD_SERVICES 19000
7 #define CHART_PRIORITY_CONTAINERS       40000
8
9 static long system_page_size = 4096; // system will be queried via sysconf() in configuration()
10
11 static int cgroup_enable_cpuacct_stat = CONFIG_BOOLEAN_AUTO;
12 static int cgroup_enable_cpuacct_usage = CONFIG_BOOLEAN_AUTO;
13 static int cgroup_enable_memory = CONFIG_BOOLEAN_AUTO;
14 static int cgroup_enable_detailed_memory = CONFIG_BOOLEAN_AUTO;
15 static int cgroup_enable_memory_failcnt = CONFIG_BOOLEAN_AUTO;
16 static int cgroup_enable_swap = CONFIG_BOOLEAN_AUTO;
17 static int cgroup_enable_blkio_io = CONFIG_BOOLEAN_AUTO;
18 static int cgroup_enable_blkio_ops = CONFIG_BOOLEAN_AUTO;
19 static int cgroup_enable_blkio_throttle_io = CONFIG_BOOLEAN_AUTO;
20 static int cgroup_enable_blkio_throttle_ops = CONFIG_BOOLEAN_AUTO;
21 static int cgroup_enable_blkio_merged_ops = CONFIG_BOOLEAN_AUTO;
22 static int cgroup_enable_blkio_queued_ops = CONFIG_BOOLEAN_AUTO;
23
24 static int cgroup_enable_systemd_services = CONFIG_BOOLEAN_YES;
25 static int cgroup_enable_systemd_services_detailed_memory = CONFIG_BOOLEAN_NO;
26 static int cgroup_used_memory_without_cache = CONFIG_BOOLEAN_YES;
27
28 static int cgroup_search_in_devices = 1;
29
30 static int cgroup_enable_new_cgroups_detected_at_runtime = 1;
31 static int cgroup_check_for_new_every = 10;
32 static int cgroup_update_every = 1;
33
34 static int cgroup_recheck_zero_blkio_every_iterations = 10;
35 static int cgroup_recheck_zero_mem_failcnt_every_iterations = 10;
36 static int cgroup_recheck_zero_mem_detailed_every_iterations = 10;
37
38 static char *cgroup_cpuacct_base = NULL;
39 static char *cgroup_blkio_base = NULL;
40 static char *cgroup_memory_base = NULL;
41 static char *cgroup_devices_base = NULL;
42
43 static int cgroup_root_count = 0;
44 static int cgroup_root_max = 500;
45 static int cgroup_max_depth = 0;
46
47 static SIMPLE_PATTERN *enabled_cgroup_patterns = NULL;
48 static SIMPLE_PATTERN *enabled_cgroup_paths = NULL;
49 static SIMPLE_PATTERN *enabled_cgroup_renames = NULL;
50 static SIMPLE_PATTERN *systemd_services_cgroups = NULL;
51
52 static char *cgroups_rename_script = NULL;
53
54 static int cgroups_check = 0;
55
56 static uint32_t Read_hash = 0;
57 static uint32_t Write_hash = 0;
58 static uint32_t user_hash = 0;
59 static uint32_t system_hash = 0;
60
61 void read_cgroup_plugin_configuration() {
62     system_page_size = sysconf(_SC_PAGESIZE);
63
64     Read_hash = simple_hash("Read");
65     Write_hash = simple_hash("Write");
66     user_hash = simple_hash("user");
67     system_hash = simple_hash("system");
68
69     cgroup_update_every = (int)config_get_number("plugin:cgroups", "update every", localhost->rrd_update_every);
70     if(cgroup_update_every < localhost->rrd_update_every)
71         cgroup_update_every = localhost->rrd_update_every;
72
73     cgroup_check_for_new_every = (int)config_get_number("plugin:cgroups", "check for new cgroups every", cgroup_check_for_new_every * cgroup_update_every);
74     if(cgroup_check_for_new_every < cgroup_update_every)
75         cgroup_check_for_new_every = cgroup_update_every;
76
77     cgroup_enable_cpuacct_stat = config_get_boolean_ondemand("plugin:cgroups", "enable cpuacct stat (total CPU)", cgroup_enable_cpuacct_stat);
78     cgroup_enable_cpuacct_usage = config_get_boolean_ondemand("plugin:cgroups", "enable cpuacct usage (per core CPU)", cgroup_enable_cpuacct_usage);
79
80     cgroup_enable_memory = config_get_boolean_ondemand("plugin:cgroups", "enable memory (used mem including cache)", cgroup_enable_memory);
81     cgroup_enable_detailed_memory = config_get_boolean_ondemand("plugin:cgroups", "enable detailed memory", cgroup_enable_detailed_memory);
82     cgroup_enable_memory_failcnt = config_get_boolean_ondemand("plugin:cgroups", "enable memory limits fail count", cgroup_enable_memory_failcnt);
83     cgroup_enable_swap = config_get_boolean_ondemand("plugin:cgroups", "enable swap memory", cgroup_enable_swap);
84
85     cgroup_enable_blkio_io = config_get_boolean_ondemand("plugin:cgroups", "enable blkio bandwidth", cgroup_enable_blkio_io);
86     cgroup_enable_blkio_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio operations", cgroup_enable_blkio_ops);
87     cgroup_enable_blkio_throttle_io = config_get_boolean_ondemand("plugin:cgroups", "enable blkio throttle bandwidth", cgroup_enable_blkio_throttle_io);
88     cgroup_enable_blkio_throttle_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio throttle operations", cgroup_enable_blkio_throttle_ops);
89     cgroup_enable_blkio_queued_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio queued operations", cgroup_enable_blkio_queued_ops);
90     cgroup_enable_blkio_merged_ops = config_get_boolean_ondemand("plugin:cgroups", "enable blkio merged operations", cgroup_enable_blkio_merged_ops);
91
92     cgroup_recheck_zero_blkio_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero blkio every iterations", cgroup_recheck_zero_blkio_every_iterations);
93     cgroup_recheck_zero_mem_failcnt_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero memory failcnt every iterations", cgroup_recheck_zero_mem_failcnt_every_iterations);
94     cgroup_recheck_zero_mem_detailed_every_iterations = (int)config_get_number("plugin:cgroups", "recheck zero detailed memory every iterations", cgroup_recheck_zero_mem_detailed_every_iterations);
95
96     cgroup_enable_systemd_services = config_get_boolean("plugin:cgroups", "enable systemd services", cgroup_enable_systemd_services);
97     cgroup_enable_systemd_services_detailed_memory = config_get_boolean("plugin:cgroups", "enable systemd services detailed memory", cgroup_enable_systemd_services_detailed_memory);
98     cgroup_used_memory_without_cache = config_get_boolean("plugin:cgroups", "report used memory without cache", cgroup_used_memory_without_cache);
99
100     char filename[FILENAME_MAX + 1], *s;
101     struct mountinfo *mi, *root = mountinfo_read(0);
102
103     mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "cpuacct");
104     if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "cpuacct");
105     if(!mi) {
106         error("Cannot find cgroup cpuacct mountinfo. Assuming default: /sys/fs/cgroup/cpuacct");
107         s = "/sys/fs/cgroup/cpuacct";
108     }
109     else s = mi->mount_point;
110     snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
111     cgroup_cpuacct_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/cpuacct", filename);
112
113     mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "blkio");
114     if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "blkio");
115     if(!mi) {
116         error("Cannot find cgroup blkio mountinfo. Assuming default: /sys/fs/cgroup/blkio");
117         s = "/sys/fs/cgroup/blkio";
118     }
119     else s = mi->mount_point;
120     snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
121     cgroup_blkio_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/blkio", filename);
122
123     mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "memory");
124     if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "memory");
125     if(!mi) {
126         error("Cannot find cgroup memory mountinfo. Assuming default: /sys/fs/cgroup/memory");
127         s = "/sys/fs/cgroup/memory";
128     }
129     else s = mi->mount_point;
130     snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
131     cgroup_memory_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/memory", filename);
132
133     mi = mountinfo_find_by_filesystem_super_option(root, "cgroup", "devices");
134     if(!mi) mi = mountinfo_find_by_filesystem_mount_source(root, "cgroup", "devices");
135     if(!mi) {
136         error("Cannot find cgroup devices mountinfo. Assuming default: /sys/fs/cgroup/devices");
137         s = "/sys/fs/cgroup/devices";
138     }
139     else s = mi->mount_point;
140     snprintfz(filename, FILENAME_MAX, "%s%s", netdata_configured_host_prefix, s);
141     cgroup_devices_base = config_get("plugin:cgroups", "path to /sys/fs/cgroup/devices", filename);
142
143     cgroup_root_max = (int)config_get_number("plugin:cgroups", "max cgroups to allow", cgroup_root_max);
144     cgroup_max_depth = (int)config_get_number("plugin:cgroups", "max cgroups depth to monitor", cgroup_max_depth);
145
146     cgroup_enable_new_cgroups_detected_at_runtime = config_get_boolean("plugin:cgroups", "enable new cgroups detected at run time", cgroup_enable_new_cgroups_detected_at_runtime);
147
148     enabled_cgroup_patterns = simple_pattern_create(
149             config_get("plugin:cgroups", "enable by default cgroups matching",
150             // ----------------------------------------------------------------
151
152                     " !*/init.scope "                      // ignore init.scope
153                     " *.scope "                            // we need all *.scope for sure
154
155             // ----------------------------------------------------------------
156
157                     " !*/vcpu* "                           // libvirtd adds these sub-cgroups
158                     " !*/emulator "                        // libvirtd adds these sub-cgroups
159                     " !*.mount "
160                     " !*.partition "
161                     " !*.service "
162                     " !*.slice "
163                     " !*.swap "
164                     " !*.user "
165                     " !/ "
166                     " !/docker "
167                     " !/libvirt "
168                     " !/lxc "
169                     " !/lxc/*/ns "                         //  #1397
170                     " !/machine "
171                     " !/qemu "
172                     " !/system "
173                     " !/systemd "
174                     " !/user "
175                     " * "                                  // enable anything else
176             ), SIMPLE_PATTERN_EXACT);
177
178     enabled_cgroup_paths = simple_pattern_create(
179             config_get("plugin:cgroups", "search for cgroups in subpaths matching",
180                     " !*/init.scope "                      // ignore init.scope
181                     " !*-qemu "                            //  #345
182                     " !/init.scope "
183                     " !/system "
184                     " !/systemd "
185                     " !/user "
186                     " !/user.slice "
187                     " !*.scope "
188                     " * "
189             ), SIMPLE_PATTERN_EXACT);
190
191     snprintfz(filename, FILENAME_MAX, "%s/cgroup-name.sh", netdata_configured_plugins_dir);
192     cgroups_rename_script = config_get("plugin:cgroups", "script to get cgroup names", filename);
193
194     enabled_cgroup_renames = simple_pattern_create(
195             config_get("plugin:cgroups", "run script to rename cgroups matching",
196                     " *.scope "
197                     " *docker* "
198                     " *lxc* "
199                     " *qemu* "
200                     " !/ "
201                     " !*.mount "
202                     " !*.partition "
203                     " !*.service "
204                     " !*.slice "
205                     " !*.swap "
206                     " !*.user "
207                     " * "
208             ), SIMPLE_PATTERN_EXACT);
209
210     if(cgroup_enable_systemd_services) {
211         systemd_services_cgroups = simple_pattern_create(
212                 config_get("plugin:cgroups", "cgroups to match as systemd services",
213                         " !/system.slice/*/*.service "
214                         " /system.slice/*.service "
215                 ), SIMPLE_PATTERN_EXACT);
216     }
217
218     mountinfo_free(root);
219 }
220
221 // ----------------------------------------------------------------------------
222 // cgroup objects
223
// The values collected from one blkio file of a cgroup.
// Filled by cgroup_read_blkio().
struct blkio {
    int updated;        // 1 after a successful read, 0 when the file could not be opened/read or had no lines
    int enabled;        // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
    int delay_counter;  // while on AUTO: reads to skip after the file reported only zeros

    char *filename;     // the file to read - nothing is read while this is NULL

    unsigned long long Read;    // sum of the values of all "Read" lines
    unsigned long long Write;   // sum of the values of all "Write" lines

    // the "Sync", "Async" and "Total" lines are not collected
};
239
240 // https://www.kernel.org/doc/Documentation/cgroup-v1/memory.txt
241 struct memory {
242     ARL_BASE *arl_base;
243     ARL_ENTRY *arl_dirty;
244     ARL_ENTRY *arl_swap;
245
246     int updated_detailed;
247     int updated_usage_in_bytes;
248     int updated_msw_usage_in_bytes;
249     int updated_failcnt;
250
251     int enabled_detailed;           // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
252     int enabled_usage_in_bytes;     // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
253     int enabled_msw_usage_in_bytes; // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
254     int enabled_failcnt;            // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO
255
256     int delay_counter_detailed;
257     int delay_counter_failcnt;
258
259     char *filename_detailed;
260     char *filename_usage_in_bytes;
261     char *filename_msw_usage_in_bytes;
262     char *filename_failcnt;
263
264     int detailed_has_dirty;
265     int detailed_has_swap;
266
267     // detailed metrics
268     unsigned long long cache;
269     unsigned long long rss;
270     unsigned long long rss_huge;
271     unsigned long long mapped_file;
272     unsigned long long writeback;
273     unsigned long long dirty;
274     unsigned long long swap;
275     unsigned long long pgpgin;
276     unsigned long long pgpgout;
277     unsigned long long pgfault;
278     unsigned long long pgmajfault;
279 /*
280     unsigned long long inactive_anon;
281     unsigned long long active_anon;
282     unsigned long long inactive_file;
283     unsigned long long active_file;
284     unsigned long long unevictable;
285     unsigned long long hierarchical_memory_limit;
286     unsigned long long total_cache;
287     unsigned long long total_rss;
288     unsigned long long total_rss_huge;
289     unsigned long long total_mapped_file;
290     unsigned long long total_writeback;
291     unsigned long long total_dirty;
292     unsigned long long total_swap;
293     unsigned long long total_pgpgin;
294     unsigned long long total_pgpgout;
295     unsigned long long total_pgfault;
296     unsigned long long total_pgmajfault;
297     unsigned long long total_inactive_anon;
298     unsigned long long total_active_anon;
299     unsigned long long total_inactive_file;
300     unsigned long long total_active_file;
301     unsigned long long total_unevictable;
302 */
303
304     // single file metrics
305     unsigned long long usage_in_bytes;
306     unsigned long long msw_usage_in_bytes;
307     unsigned long long failcnt;
308 };
309
310 // https://www.kernel.org/doc/Documentation/cgroup-v1/cpuacct.txt
// The total CPU time of a cgroup, split in user and system.
// Filled by cgroup_read_cpuacct_stat().
struct cpuacct_stat {
    int updated;    // 1 after a successful read, 0 otherwise
    int enabled;    // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO

    char *filename; // the file to read - nothing is read while this is NULL

    unsigned long long user;    // value of the "user" line
    unsigned long long system;  // value of the "system" line
};
320
321 // https://www.kernel.org/doc/Documentation/cgroup-v1/cpuacct.txt
// The per CPU usage of a cgroup.
// Filled by cgroup_read_cpuacct_usage().
struct cpuacct_usage {
    int updated;    // 1 after a successful read, 0 otherwise
    int enabled;    // CONFIG_BOOLEAN_YES or CONFIG_BOOLEAN_AUTO

    char *filename; // the file to read - nothing is read while this is NULL

    unsigned int cpus;              // number of entries in cpu_percpu
    unsigned long long *cpu_percpu; // one value per CPU, reallocated when the number of CPUs changes
};
331
332 #define CGROUP_OPTIONS_DISABLED_DUPLICATE   0x00000001
333 #define CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE 0x00000002
334
335 struct cgroup {
336     uint32_t options;
337
338     char available;      // found in the filesystem
339     char enabled;        // enabled in the config
340
341     char *id;
342     uint32_t hash;
343
344     char *chart_id;
345     uint32_t hash_chart;
346
347     char *chart_title;
348
349     struct cpuacct_stat cpuacct_stat;
350     struct cpuacct_usage cpuacct_usage;
351
352     struct memory memory;
353
354     struct blkio io_service_bytes;              // bytes
355     struct blkio io_serviced;                   // operations
356
357     struct blkio throttle_io_service_bytes;     // bytes
358     struct blkio throttle_io_serviced;          // operations
359
360     struct blkio io_merged;                     // operations
361     struct blkio io_queued;                     // operations
362
363     // per cgroup charts
364     RRDSET *st_cpu;
365     RRDSET *st_cpu_per_core;
366     RRDSET *st_mem;
367     RRDSET *st_writeback;
368     RRDSET *st_mem_activity;
369     RRDSET *st_pgfaults;
370     RRDSET *st_mem_usage;
371     RRDSET *st_mem_failcnt;
372     RRDSET *st_io;
373     RRDSET *st_serviced_ops;
374     RRDSET *st_throttle_io;
375     RRDSET *st_throttle_serviced_ops;
376     RRDSET *st_queued_ops;
377     RRDSET *st_merged_ops;
378
379     // services
380     RRDDIM *rd_cpu;
381     RRDDIM *rd_mem_usage;
382     RRDDIM *rd_mem_failcnt;
383     RRDDIM *rd_swap_usage;
384
385     RRDDIM *rd_mem_detailed_cache;
386     RRDDIM *rd_mem_detailed_rss;
387     RRDDIM *rd_mem_detailed_mapped;
388     RRDDIM *rd_mem_detailed_writeback;
389     RRDDIM *rd_mem_detailed_pgpgin;
390     RRDDIM *rd_mem_detailed_pgpgout;
391     RRDDIM *rd_mem_detailed_pgfault;
392     RRDDIM *rd_mem_detailed_pgmajfault;
393
394     RRDDIM *rd_io_service_bytes_read;
395     RRDDIM *rd_io_serviced_read;
396     RRDDIM *rd_throttle_io_read;
397     RRDDIM *rd_throttle_io_serviced_read;
398     RRDDIM *rd_io_queued_read;
399     RRDDIM *rd_io_merged_read;
400
401     RRDDIM *rd_io_service_bytes_write;
402     RRDDIM *rd_io_serviced_write;
403     RRDDIM *rd_throttle_io_write;
404     RRDDIM *rd_throttle_io_serviced_write;
405     RRDDIM *rd_io_queued_write;
406     RRDDIM *rd_io_merged_write;
407
408     struct cgroup *next;
409
410 } *cgroup_root = NULL;
411
412 // ----------------------------------------------------------------------------
413 // read values from /sys
414
415 static inline void cgroup_read_cpuacct_stat(struct cpuacct_stat *cp) {
416     static procfile *ff = NULL;
417
418     if(likely(cp->filename)) {
419         ff = procfile_reopen(ff, cp->filename, NULL, PROCFILE_FLAG_DEFAULT);
420         if(unlikely(!ff)) {
421             cp->updated = 0;
422             cgroups_check = 1;
423             return;
424         }
425
426         ff = procfile_readall(ff);
427         if(unlikely(!ff)) {
428             cp->updated = 0;
429             cgroups_check = 1;
430             return;
431         }
432
433         unsigned long i, lines = procfile_lines(ff);
434
435         if(unlikely(lines < 1)) {
436             error("File '%s' should have 1+ lines.", cp->filename);
437             cp->updated = 0;
438             return;
439         }
440
441         for(i = 0; i < lines ; i++) {
442             char *s = procfile_lineword(ff, i, 0);
443             uint32_t hash = simple_hash(s);
444
445             if(unlikely(hash == user_hash && !strcmp(s, "user")))
446                 cp->user = str2ull(procfile_lineword(ff, i, 1));
447
448             else if(unlikely(hash == system_hash && !strcmp(s, "system")))
449                 cp->system = str2ull(procfile_lineword(ff, i, 1));
450         }
451
452         cp->updated = 1;
453
454         if(unlikely(cp->enabled == CONFIG_BOOLEAN_AUTO && (cp->user || cp->system)))
455             cp->enabled = CONFIG_BOOLEAN_YES;
456     }
457 }
458
459 static inline void cgroup_read_cpuacct_usage(struct cpuacct_usage *ca) {
460     static procfile *ff = NULL;
461
462     if(likely(ca->filename)) {
463         ff = procfile_reopen(ff, ca->filename, NULL, PROCFILE_FLAG_DEFAULT);
464         if(unlikely(!ff)) {
465             ca->updated = 0;
466             cgroups_check = 1;
467             return;
468         }
469
470         ff = procfile_readall(ff);
471         if(unlikely(!ff)) {
472             ca->updated = 0;
473             cgroups_check = 1;
474             return;
475         }
476
477         if(unlikely(procfile_lines(ff) < 1)) {
478             error("File '%s' should have 1+ lines but has %zu.", ca->filename, procfile_lines(ff));
479             ca->updated = 0;
480             return;
481         }
482
483         unsigned long i = procfile_linewords(ff, 0);
484         if(unlikely(i == 0)) {
485             ca->updated = 0;
486             return;
487         }
488
489         // we may have 1 more CPU reported
490         while(i > 0) {
491             char *s = procfile_lineword(ff, 0, i - 1);
492             if(!*s) i--;
493             else break;
494         }
495
496         if(unlikely(i != ca->cpus)) {
497             freez(ca->cpu_percpu);
498             ca->cpu_percpu = mallocz(sizeof(unsigned long long) * i);
499             ca->cpus = (unsigned int)i;
500         }
501
502         unsigned long long total = 0;
503         for(i = 0; i < ca->cpus ;i++) {
504             unsigned long long n = str2ull(procfile_lineword(ff, 0, i));
505             ca->cpu_percpu[i] = n;
506             total += n;
507         }
508
509         ca->updated = 1;
510
511         if(unlikely(ca->enabled == CONFIG_BOOLEAN_AUTO && total))
512             ca->enabled = CONFIG_BOOLEAN_YES;
513     }
514 }
515
516 static inline void cgroup_read_blkio(struct blkio *io) {
517     static procfile *ff = NULL;
518
519     if(unlikely(io->enabled == CONFIG_BOOLEAN_AUTO && io->delay_counter > 0)) {
520         io->delay_counter--;
521         return;
522     }
523
524     if(likely(io->filename)) {
525         ff = procfile_reopen(ff, io->filename, NULL, PROCFILE_FLAG_DEFAULT);
526         if(unlikely(!ff)) {
527             io->updated = 0;
528             cgroups_check = 1;
529             return;
530         }
531
532         ff = procfile_readall(ff);
533         if(unlikely(!ff)) {
534             io->updated = 0;
535             cgroups_check = 1;
536             return;
537         }
538
539         unsigned long i, lines = procfile_lines(ff);
540
541         if(unlikely(lines < 1)) {
542             error("File '%s' should have 1+ lines.", io->filename);
543             io->updated = 0;
544             return;
545         }
546
547         io->Read = 0;
548         io->Write = 0;
549 /*
550         io->Sync = 0;
551         io->Async = 0;
552         io->Total = 0;
553 */
554
555         for(i = 0; i < lines ; i++) {
556             char *s = procfile_lineword(ff, i, 1);
557             uint32_t hash = simple_hash(s);
558
559             if(unlikely(hash == Read_hash && !strcmp(s, "Read")))
560                 io->Read += str2ull(procfile_lineword(ff, i, 2));
561
562             else if(unlikely(hash == Write_hash && !strcmp(s, "Write")))
563                 io->Write += str2ull(procfile_lineword(ff, i, 2));
564
565 /*
566             else if(unlikely(hash == Sync_hash && !strcmp(s, "Sync")))
567                 io->Sync += str2ull(procfile_lineword(ff, i, 2));
568
569             else if(unlikely(hash == Async_hash && !strcmp(s, "Async")))
570                 io->Async += str2ull(procfile_lineword(ff, i, 2));
571
572             else if(unlikely(hash == Total_hash && !strcmp(s, "Total")))
573                 io->Total += str2ull(procfile_lineword(ff, i, 2));
574 */
575         }
576
577         io->updated = 1;
578
579         if(unlikely(io->enabled == CONFIG_BOOLEAN_AUTO)) {
580             if(unlikely(io->Read || io->Write))
581                 io->enabled = CONFIG_BOOLEAN_YES;
582             else
583                 io->delay_counter = cgroup_recheck_zero_blkio_every_iterations;
584         }
585     }
586 }
587
588 static inline void cgroup_read_memory(struct memory *mem) {
589     static procfile *ff = NULL;
590
591     // read detailed ram usage
592     if(likely(mem->filename_detailed)) {
593         if(unlikely(mem->enabled_detailed == CONFIG_BOOLEAN_AUTO && mem->delay_counter_detailed > 0)) {
594             mem->delay_counter_detailed--;
595             goto memory_next;
596         }
597
598         ff = procfile_reopen(ff, mem->filename_detailed, NULL, PROCFILE_FLAG_DEFAULT);
599         if(unlikely(!ff)) {
600             mem->updated_detailed = 0;
601             cgroups_check = 1;
602             goto memory_next;
603         }
604
605         ff = procfile_readall(ff);
606         if(unlikely(!ff)) {
607             mem->updated_detailed = 0;
608             cgroups_check = 1;
609             goto memory_next;
610         }
611
612         unsigned long i, lines = procfile_lines(ff);
613
614         if(unlikely(lines < 1)) {
615             error("File '%s' should have 1+ lines.", mem->filename_detailed);
616             mem->updated_detailed = 0;
617             goto memory_next;
618         }
619
620         if(unlikely(!mem->arl_base)) {
621             mem->arl_base = arl_create("cgroup/memory", NULL, 60);
622
623             arl_expect(mem->arl_base, "cache", &mem->cache);
624             arl_expect(mem->arl_base, "rss", &mem->rss);
625             arl_expect(mem->arl_base, "rss_huge", &mem->rss_huge);
626             arl_expect(mem->arl_base, "mapped_file", &mem->mapped_file);
627             arl_expect(mem->arl_base, "writeback", &mem->writeback);
628             mem->arl_dirty = arl_expect(mem->arl_base, "dirty", &mem->dirty);
629             mem->arl_swap  = arl_expect(mem->arl_base, "swap", &mem->swap);
630             arl_expect(mem->arl_base, "pgpgin", &mem->pgpgin);
631             arl_expect(mem->arl_base, "pgpgout", &mem->pgpgout);
632             arl_expect(mem->arl_base, "pgfault", &mem->pgfault);
633             arl_expect(mem->arl_base, "pgmajfault", &mem->pgmajfault);
634         }
635
636         arl_begin(mem->arl_base);
637
638         for(i = 0; i < lines ; i++) {
639             if(arl_check(mem->arl_base,
640                     procfile_lineword(ff, i, 0),
641                     procfile_lineword(ff, i, 1))) break;
642         }
643
644         if(unlikely(mem->arl_dirty->flags & ARL_ENTRY_FLAG_FOUND))
645             mem->detailed_has_dirty = 1;
646
647         if(unlikely(mem->arl_swap->flags & ARL_ENTRY_FLAG_FOUND))
648             mem->detailed_has_swap = 1;
649
650         // fprintf(stderr, "READ: '%s', cache: %llu, rss: %llu, rss_huge: %llu, mapped_file: %llu, writeback: %llu, dirty: %llu, swap: %llu, pgpgin: %llu, pgpgout: %llu, pgfault: %llu, pgmajfault: %llu, inactive_anon: %llu, active_anon: %llu, inactive_file: %llu, active_file: %llu, unevictable: %llu, hierarchical_memory_limit: %llu, total_cache: %llu, total_rss: %llu, total_rss_huge: %llu, total_mapped_file: %llu, total_writeback: %llu, total_dirty: %llu, total_swap: %llu, total_pgpgin: %llu, total_pgpgout: %llu, total_pgfault: %llu, total_pgmajfault: %llu, total_inactive_anon: %llu, total_active_anon: %llu, total_inactive_file: %llu, total_active_file: %llu, total_unevictable: %llu\n", mem->filename, mem->cache, mem->rss, mem->rss_huge, mem->mapped_file, mem->writeback, mem->dirty, mem->swap, mem->pgpgin, mem->pgpgout, mem->pgfault, mem->pgmajfault, mem->inactive_anon, mem->active_anon, mem->inactive_file, mem->active_file, mem->unevictable, mem->hierarchical_memory_limit, mem->total_cache, mem->total_rss, mem->total_rss_huge, mem->total_mapped_file, mem->total_writeback, mem->total_dirty, mem->total_swap, mem->total_pgpgin, mem->total_pgpgout, mem->total_pgfault, mem->total_pgmajfault, mem->total_inactive_anon, mem->total_active_anon, mem->total_inactive_file, mem->total_active_file, mem->total_unevictable);
651
652         mem->updated_detailed = 1;
653
654         if(unlikely(mem->enabled_detailed == CONFIG_BOOLEAN_AUTO)) {
655             if(mem->cache || mem->dirty || mem->rss || mem->rss_huge || mem->mapped_file || mem->writeback || mem->swap || mem->pgpgin || mem->pgpgout || mem->pgfault || mem->pgmajfault)
656                 mem->enabled_detailed = CONFIG_BOOLEAN_YES;
657             else
658                 mem->delay_counter_detailed = cgroup_recheck_zero_mem_detailed_every_iterations;
659         }
660     }
661
662 memory_next:
663
664     // read usage_in_bytes
665     if(likely(mem->filename_usage_in_bytes)) {
666         mem->updated_usage_in_bytes = !read_single_number_file(mem->filename_usage_in_bytes, &mem->usage_in_bytes);
667         if(unlikely(mem->updated_usage_in_bytes && mem->enabled_usage_in_bytes == CONFIG_BOOLEAN_AUTO && mem->usage_in_bytes))
668             mem->enabled_usage_in_bytes = CONFIG_BOOLEAN_YES;
669     }
670
671     // read msw_usage_in_bytes
672     if(likely(mem->filename_msw_usage_in_bytes)) {
673         mem->updated_msw_usage_in_bytes = !read_single_number_file(mem->filename_msw_usage_in_bytes, &mem->msw_usage_in_bytes);
674         if(unlikely(mem->updated_msw_usage_in_bytes && mem->enabled_msw_usage_in_bytes == CONFIG_BOOLEAN_AUTO && mem->msw_usage_in_bytes))
675             mem->enabled_msw_usage_in_bytes = CONFIG_BOOLEAN_YES;
676     }
677
678     // read failcnt
679     if(likely(mem->filename_failcnt)) {
680         if(unlikely(mem->enabled_failcnt == CONFIG_BOOLEAN_AUTO && mem->delay_counter_failcnt > 0)) {
681             mem->updated_failcnt = 0;
682             mem->delay_counter_failcnt--;
683         }
684         else {
685             mem->updated_failcnt = !read_single_number_file(mem->filename_failcnt, &mem->failcnt);
686             if(unlikely(mem->updated_failcnt && mem->enabled_failcnt == CONFIG_BOOLEAN_AUTO)) {
687                 if(unlikely(!mem->failcnt))
688                     mem->delay_counter_failcnt = cgroup_recheck_zero_mem_failcnt_every_iterations;
689                 else
690                     mem->enabled_failcnt = CONFIG_BOOLEAN_YES;
691             }
692         }
693     }
694 }
695
696 static inline void cgroup_read(struct cgroup *cg) {
697     debug(D_CGROUP, "reading metrics for cgroups '%s'", cg->id);
698
699     cgroup_read_cpuacct_stat(&cg->cpuacct_stat);
700     cgroup_read_cpuacct_usage(&cg->cpuacct_usage);
701     cgroup_read_memory(&cg->memory);
702     cgroup_read_blkio(&cg->io_service_bytes);
703     cgroup_read_blkio(&cg->io_serviced);
704     cgroup_read_blkio(&cg->throttle_io_service_bytes);
705     cgroup_read_blkio(&cg->throttle_io_serviced);
706     cgroup_read_blkio(&cg->io_merged);
707     cgroup_read_blkio(&cg->io_queued);
708 }
709
710 static inline void read_all_cgroups(struct cgroup *root) {
711     debug(D_CGROUP, "reading metrics for all cgroups");
712
713     struct cgroup *cg;
714
715     for(cg = root; cg ; cg = cg->next)
716         if(cg->enabled && cg->available)
717             cgroup_read(cg);
718 }
719
720 // ----------------------------------------------------------------------------
721 // add/remove/find cgroup objects
722
723 #define CGROUP_CHARTID_LINE_MAX 1024
724
// Return a newly allocated chart title for the cgroup name s.
// A NULL or empty name is treated as "/", a single leading slash is dropped
// from any other name, and the copy is passed through netdata_fix_chart_name().
static inline char *cgroup_title_strdupz(const char *s) {
    const char *name = (s && *s) ? s : "/";

    // skip the leading slash, unless the slash is all there is
    if(name[0] == '/' && name[1] != '\0')
        name++;

    char *title = strdupz(name);
    netdata_fix_chart_name(title);
    return title;
}
735
// Return a newly allocated chart id for the cgroup name s.
// A NULL or empty name is treated as "/", a single leading slash is dropped
// from any other name, and the copy is passed through netdata_fix_chart_id().
static inline char *cgroup_chart_id_strdupz(const char *s) {
    const char *name = (s && *s) ? s : "/";

    // skip the leading slash, unless the slash is all there is
    if(name[0] == '/' && name[1] != '\0')
        name++;

    char *chart_id = strdupz(name);
    netdata_fix_chart_id(chart_id);
    return chart_id;
}
746
747 static inline void cgroup_get_chart_name(struct cgroup *cg) {
748     debug(D_CGROUP, "looking for the name of cgroup '%s' with chart id '%s' and title '%s'", cg->id, cg->chart_id, cg->chart_title);
749
750     pid_t cgroup_pid;
751     char buffer[CGROUP_CHARTID_LINE_MAX + 1];
752
753     snprintfz(buffer, CGROUP_CHARTID_LINE_MAX, "exec %s '%s'", cgroups_rename_script, cg->chart_id);
754
755     debug(D_CGROUP, "executing command '%s' for cgroup '%s'", buffer, cg->id);
756     FILE *fp = mypopen(buffer, &cgroup_pid);
757     if(fp) {
758         // debug(D_CGROUP, "reading from command '%s' for cgroup '%s'", buffer, cg->id);
759         char *s = fgets(buffer, CGROUP_CHARTID_LINE_MAX, fp);
760         // debug(D_CGROUP, "closing command for cgroup '%s'", cg->id);
761         mypclose(fp, cgroup_pid);
762         // debug(D_CGROUP, "closed command for cgroup '%s'", cg->id);
763
764         if(s && *s && *s != '\n') {
765             debug(D_CGROUP, "cgroup '%s' should be renamed to '%s'", cg->id, s);
766
767             trim(s);
768
769             freez(cg->chart_title);
770             cg->chart_title = cgroup_title_strdupz(s);
771
772             freez(cg->chart_id);
773             cg->chart_id = cgroup_chart_id_strdupz(s);
774             cg->hash_chart = simple_hash(cg->chart_id);
775         }
776     }
777     else
778         error("CGROUP: Cannot popen(\"%s\", \"r\").", buffer);
779 }
780
781 static inline struct cgroup *cgroup_add(const char *id) {
782     if(!id || !*id) id = "/";
783     debug(D_CGROUP, "adding to list, cgroup with id '%s'", id);
784
785     if(cgroup_root_count >= cgroup_root_max) {
786         info("Maximum number of cgroups reached (%d). Not adding cgroup '%s'", cgroup_root_count, id);
787         return NULL;
788     }
789
790     int def = simple_pattern_matches(enabled_cgroup_patterns, id)?cgroup_enable_new_cgroups_detected_at_runtime:0;
791     struct cgroup *cg = callocz(1, sizeof(struct cgroup));
792
793     cg->id = strdupz(id);
794     cg->hash = simple_hash(cg->id);
795
796     cg->chart_title = cgroup_title_strdupz(id);
797
798     cg->chart_id = cgroup_chart_id_strdupz(id);
799     cg->hash_chart = simple_hash(cg->chart_id);
800
801     if(!cgroup_root)
802         cgroup_root = cg;
803     else {
804         // append it
805         struct cgroup *e;
806         for(e = cgroup_root; e->next ;e = e->next) ;
807         e->next = cg;
808     }
809
810     cgroup_root_count++;
811
812     // fix the chart_id and title by calling the external script
813     if(simple_pattern_matches(enabled_cgroup_renames, cg->id)) {
814
815         cgroup_get_chart_name(cg);
816
817         debug(D_CGROUP, "cgroup '%s' renamed to '%s' (title: '%s')", cg->id, cg->chart_id, cg->chart_title);
818     }
819     else
820         debug(D_CGROUP, "cgroup '%s' will not be renamed - it matches the list of disabled cgroup renames (will be shown as '%s')", cg->id, cg->chart_id);
821
822     int user_configurable = 1;
823
824     // check if this cgroup should be a systemd service
825     if(cgroup_enable_systemd_services) {
826         if(simple_pattern_matches(systemd_services_cgroups, cg->id) ||
827                 simple_pattern_matches(systemd_services_cgroups, cg->chart_id)) {
828             debug(D_CGROUP, "cgroup '%s' with chart id '%s' (title: '%s') matches systemd services cgroups", cg->id, cg->chart_id, cg->chart_title);
829
830             char buffer[CGROUP_CHARTID_LINE_MAX + 1];
831             cg->options |= CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE;
832
833             strncpy(buffer, cg->id, CGROUP_CHARTID_LINE_MAX);
834             char *s = buffer;
835
836             //freez(cg->chart_id);
837             //cg->chart_id = cgroup_chart_id_strdupz(s);
838             //cg->hash_chart = simple_hash(cg->chart_id);
839
840             // skip to the last slash
841             size_t len = strlen(s);
842             while(len--) if(unlikely(s[len] == '/')) break;
843             if(len) s = &s[len + 1];
844
845             // remove extension
846             len = strlen(s);
847             while(len--) if(unlikely(s[len] == '.')) break;
848             if(len) s[len] = '\0';
849
850             freez(cg->chart_title);
851             cg->chart_title = cgroup_title_strdupz(s);
852
853             cg->enabled = 1;
854             user_configurable = 0;
855
856             debug(D_CGROUP, "cgroup '%s' renamed to '%s' (title: '%s')", cg->id, cg->chart_id, cg->chart_title);
857         }
858         else
859             debug(D_CGROUP, "cgroup '%s' with chart id '%s' (title: '%s') does not match systemd services groups", cg->id, cg->chart_id, cg->chart_title);
860     }
861
862     if(user_configurable) {
863         // allow the user to enable/disable this individualy
864         char option[FILENAME_MAX + 1];
865         snprintfz(option, FILENAME_MAX, "enable cgroup %s", cg->chart_title);
866         cg->enabled = (char) config_get_boolean("plugin:cgroups", option, def);
867     }
868
869     // detect duplicate cgroups
870     if(cg->enabled) {
871         struct cgroup *t;
872         for (t = cgroup_root; t; t = t->next) {
873             if (t != cg && t->enabled && t->hash_chart == cg->hash_chart && !strcmp(t->chart_id, cg->chart_id)) {
874                 if (!strncmp(t->chart_id, "/system.slice/", 14) && !strncmp(cg->chart_id, "/init.scope/system.slice/", 25)) {
875                     error("Control group with chart id '%s' already exists with id '%s' and is enabled. Swapping them by enabling cgroup with id '%s' and disabling cgroup with id '%s'.",
876                           cg->chart_id, t->id, cg->id, t->id);
877                     debug(D_CGROUP, "Control group with chart id '%s' already exists with id '%s' and is enabled. Swapping them by enabling cgroup with id '%s' and disabling cgroup with id '%s'.",
878                           cg->chart_id, t->id, cg->id, t->id);
879                     t->enabled = 0;
880                     t->options |= CGROUP_OPTIONS_DISABLED_DUPLICATE;
881                 }
882                 else {
883                     error("Control group with chart id '%s' already exists with id '%s' and is enabled and available. Disabling cgroup with id '%s'.",
884                           cg->chart_id, t->id, cg->id);
885                     debug(D_CGROUP, "Control group with chart id '%s' already exists with id '%s' and is enabled and available. Disabling cgroup with id '%s'.",
886                           cg->chart_id, t->id, cg->id);
887                     cg->enabled = 0;
888                     cg->options |= CGROUP_OPTIONS_DISABLED_DUPLICATE;
889                 }
890
891                 break;
892             }
893         }
894     }
895
896     debug(D_CGROUP, "ADDED CGROUP: '%s' with chart id '%s' and title '%s' as %s (default was %s)", cg->id, cg->chart_id, cg->chart_title, (cg->enabled)?"enabled":"disabled", (def)?"enabled":"disabled");
897
898     return cg;
899 }
900
901 static inline void cgroup_free(struct cgroup *cg) {
902     debug(D_CGROUP, "Removing cgroup '%s' with chart id '%s' (was %s and %s)", cg->id, cg->chart_id, (cg->enabled)?"enabled":"disabled", (cg->available)?"available":"not available");
903
904     if(cg->st_cpu)                   rrdset_flag_set(cg->st_cpu,                   RRDSET_FLAG_OBSOLETE);
905     if(cg->st_cpu_per_core)          rrdset_flag_set(cg->st_cpu_per_core,          RRDSET_FLAG_OBSOLETE);
906     if(cg->st_mem)                   rrdset_flag_set(cg->st_mem,                   RRDSET_FLAG_OBSOLETE);
907     if(cg->st_writeback)             rrdset_flag_set(cg->st_writeback,             RRDSET_FLAG_OBSOLETE);
908     if(cg->st_mem_activity)          rrdset_flag_set(cg->st_mem_activity,          RRDSET_FLAG_OBSOLETE);
909     if(cg->st_pgfaults)              rrdset_flag_set(cg->st_pgfaults,              RRDSET_FLAG_OBSOLETE);
910     if(cg->st_mem_usage)             rrdset_flag_set(cg->st_mem_usage,             RRDSET_FLAG_OBSOLETE);
911     if(cg->st_mem_failcnt)           rrdset_flag_set(cg->st_mem_failcnt,           RRDSET_FLAG_OBSOLETE);
912     if(cg->st_io)                    rrdset_flag_set(cg->st_io,                    RRDSET_FLAG_OBSOLETE);
913     if(cg->st_serviced_ops)          rrdset_flag_set(cg->st_serviced_ops,          RRDSET_FLAG_OBSOLETE);
914     if(cg->st_throttle_io)           rrdset_flag_set(cg->st_throttle_io,           RRDSET_FLAG_OBSOLETE);
915     if(cg->st_throttle_serviced_ops) rrdset_flag_set(cg->st_throttle_serviced_ops, RRDSET_FLAG_OBSOLETE);
916     if(cg->st_queued_ops)            rrdset_flag_set(cg->st_queued_ops,            RRDSET_FLAG_OBSOLETE);
917     if(cg->st_merged_ops)            rrdset_flag_set(cg->st_merged_ops,            RRDSET_FLAG_OBSOLETE);
918
919     freez(cg->cpuacct_usage.cpu_percpu);
920
921     freez(cg->cpuacct_stat.filename);
922     freez(cg->cpuacct_usage.filename);
923
924     arl_free(cg->memory.arl_base);
925     freez(cg->memory.filename_detailed);
926     freez(cg->memory.filename_failcnt);
927     freez(cg->memory.filename_usage_in_bytes);
928     freez(cg->memory.filename_msw_usage_in_bytes);
929
930     freez(cg->io_service_bytes.filename);
931     freez(cg->io_serviced.filename);
932
933     freez(cg->throttle_io_service_bytes.filename);
934     freez(cg->throttle_io_serviced.filename);
935
936     freez(cg->io_merged.filename);
937     freez(cg->io_queued.filename);
938
939     freez(cg->id);
940     freez(cg->chart_id);
941     freez(cg->chart_title);
942
943     freez(cg);
944
945     cgroup_root_count--;
946 }
947
948 // find if a given cgroup exists
949 static inline struct cgroup *cgroup_find(const char *id) {
950     debug(D_CGROUP, "searching for cgroup '%s'", id);
951
952     uint32_t hash = simple_hash(id);
953
954     struct cgroup *cg;
955     for(cg = cgroup_root; cg ; cg = cg->next) {
956         if(hash == cg->hash && strcmp(id, cg->id) == 0)
957             break;
958     }
959
960     debug(D_CGROUP, "cgroup '%s' %s in memory", id, (cg)?"found":"not found");
961     return cg;
962 }
963
964 // ----------------------------------------------------------------------------
965 // detect running cgroups
966
967 // callback for find_file_in_subdirs()
968 static inline void found_subdir_in_dir(const char *dir) {
969     debug(D_CGROUP, "examining cgroup dir '%s'", dir);
970
971     struct cgroup *cg = cgroup_find(dir);
972     if(!cg) {
973         if(*dir && cgroup_max_depth > 0) {
974             int depth = 0;
975             const char *s;
976
977             for(s = dir; *s ;s++)
978                 if(unlikely(*s == '/'))
979                     depth++;
980
981             if(depth > cgroup_max_depth) {
982                 info("cgroup '%s' is too deep (%d, while max is %d)", dir, depth, cgroup_max_depth);
983                 return;
984             }
985         }
986         // debug(D_CGROUP, "will add dir '%s' as cgroup", dir);
987         cg = cgroup_add(dir);
988     }
989
990     if(cg) cg->available = 1;
991 }
992
993 static inline int find_dir_in_subdirs(const char *base, const char *this, void (*callback)(const char *)) {
994     if(!this) this = base;
995     debug(D_CGROUP, "searching for directories in '%s' (base '%s')", this?this:"", base);
996
997     size_t dirlen = strlen(this), baselen = strlen(base);
998
999     int ret = -1;
1000     int enabled = -1;
1001
1002     const char *relative_path = &this[baselen];
1003     if(!*relative_path) relative_path = "/";
1004
1005     DIR *dir = opendir(this);
1006     if(!dir) {
1007         error("Cannot read cgroups directory '%s'", base);
1008         return ret;
1009     }
1010     ret = 1;
1011
1012     callback(relative_path);
1013
1014     struct dirent *de = NULL;
1015     while((de = readdir(dir))) {
1016         if(de->d_type == DT_DIR
1017             && (
1018                 (de->d_name[0] == '.' && de->d_name[1] == '\0')
1019                 || (de->d_name[0] == '.' && de->d_name[1] == '.' && de->d_name[2] == '\0')
1020                 ))
1021             continue;
1022
1023         if(de->d_type == DT_DIR) {
1024             if(enabled == -1) {
1025                 const char *r = relative_path;
1026                 if(*r == '\0') r = "/";
1027
1028                 // do not decent in directories we are not interested
1029                 int def = simple_pattern_matches(enabled_cgroup_paths, r);
1030
1031                 // we check for this option here
1032                 // so that the config will not have settings
1033                 // for leaf directories
1034                 char option[FILENAME_MAX + 1];
1035                 snprintfz(option, FILENAME_MAX, "search for cgroups under %s", r);
1036                 option[FILENAME_MAX] = '\0';
1037                 enabled = config_get_boolean("plugin:cgroups", option, def);
1038             }
1039
1040             if(enabled) {
1041                 char *s = mallocz(dirlen + strlen(de->d_name) + 2);
1042                 strcpy(s, this);
1043                 strcat(s, "/");
1044                 strcat(s, de->d_name);
1045                 int ret2 = find_dir_in_subdirs(base, s, callback);
1046                 if(ret2 > 0) ret += ret2;
1047                 freez(s);
1048             }
1049         }
1050     }
1051
1052     closedir(dir);
1053     return ret;
1054 }
1055
1056 static inline void mark_all_cgroups_as_not_available() {
1057     debug(D_CGROUP, "marking all cgroups as not available");
1058
1059     struct cgroup *cg;
1060
1061     // mark all as not available
1062     for(cg = cgroup_root; cg ; cg = cg->next) {
1063         cg->available = 0;
1064     }
1065 }
1066
1067 static inline void cleanup_all_cgroups() {
1068     struct cgroup *cg = cgroup_root, *last = NULL;
1069
1070     for(; cg ;) {
1071         if(!cg->available) {
1072             // enable the first duplicate cgroup
1073             {
1074                 struct cgroup *t;
1075                 for(t = cgroup_root; t ; t = t->next) {
1076                     if(t != cg && t->available && !t->enabled && t->options & CGROUP_OPTIONS_DISABLED_DUPLICATE && t->hash_chart == cg->hash_chart && !strcmp(t->chart_id, cg->chart_id)) {
1077                         debug(D_CGROUP, "Enabling duplicate of cgroup '%s' with id '%s', because the original with id '%s' stopped.", t->chart_id, t->id, cg->id);
1078                         t->enabled = 1;
1079                         t->options &= ~CGROUP_OPTIONS_DISABLED_DUPLICATE;
1080                         break;
1081                     }
1082                 }
1083             }
1084
1085             if(!last)
1086                 cgroup_root = cg->next;
1087             else
1088                 last->next = cg->next;
1089
1090             cgroup_free(cg);
1091
1092             if(!last)
1093                 cg = cgroup_root;
1094             else
1095                 cg = last->next;
1096         }
1097         else {
1098             last = cg;
1099             cg = cg->next;
1100         }
1101     }
1102 }
1103
1104 static inline void find_all_cgroups() {
1105     debug(D_CGROUP, "searching for cgroups");
1106
1107     mark_all_cgroups_as_not_available();
1108
1109     if(cgroup_enable_cpuacct_stat || cgroup_enable_cpuacct_usage) {
1110         if(find_dir_in_subdirs(cgroup_cpuacct_base, NULL, found_subdir_in_dir) == -1) {
1111             cgroup_enable_cpuacct_stat =
1112             cgroup_enable_cpuacct_usage = CONFIG_BOOLEAN_NO;
1113             error("disabled CGROUP cpu statistics.");
1114         }
1115     }
1116
1117     if(cgroup_enable_blkio_io || cgroup_enable_blkio_ops || cgroup_enable_blkio_throttle_io || cgroup_enable_blkio_throttle_ops || cgroup_enable_blkio_merged_ops || cgroup_enable_blkio_queued_ops) {
1118         if(find_dir_in_subdirs(cgroup_blkio_base, NULL, found_subdir_in_dir) == -1) {
1119             cgroup_enable_blkio_io =
1120             cgroup_enable_blkio_ops =
1121             cgroup_enable_blkio_throttle_io =
1122             cgroup_enable_blkio_throttle_ops =
1123             cgroup_enable_blkio_merged_ops =
1124             cgroup_enable_blkio_queued_ops = CONFIG_BOOLEAN_NO;
1125             error("disabled CGROUP blkio statistics.");
1126         }
1127     }
1128
1129     if(cgroup_enable_memory || cgroup_enable_detailed_memory || cgroup_enable_swap || cgroup_enable_memory_failcnt) {
1130         if(find_dir_in_subdirs(cgroup_memory_base, NULL, found_subdir_in_dir) == -1) {
1131             cgroup_enable_memory =
1132             cgroup_enable_detailed_memory =
1133             cgroup_enable_swap =
1134             cgroup_enable_memory_failcnt = CONFIG_BOOLEAN_NO;
1135             error("disabled CGROUP memory statistics.");
1136         }
1137     }
1138
1139     if(cgroup_search_in_devices) {
1140         if(find_dir_in_subdirs(cgroup_devices_base, NULL, found_subdir_in_dir) == -1) {
1141             cgroup_search_in_devices = 0;
1142             error("disabled CGROUP devices statistics.");
1143         }
1144     }
1145
1146     // remove any non-existing cgroups
1147     cleanup_all_cgroups();
1148
1149     struct cgroup *cg;
1150     struct stat buf;
1151     for(cg = cgroup_root; cg ; cg = cg->next) {
1152         // fprintf(stderr, " >>> CGROUP '%s' (%u - %s) with name '%s'\n", cg->id, cg->hash, cg->available?"available":"stopped", cg->name);
1153
1154         if(unlikely(!cg->available))
1155             continue;
1156
1157         debug(D_CGROUP, "checking paths for cgroup '%s'", cg->id);
1158
1159         // check for newly added cgroups
1160         // and update the filenames they read
1161         char filename[FILENAME_MAX + 1];
1162         if(unlikely(cgroup_enable_cpuacct_stat && !cg->cpuacct_stat.filename)) {
1163             snprintfz(filename, FILENAME_MAX, "%s%s/cpuacct.stat", cgroup_cpuacct_base, cg->id);
1164             if(likely(stat(filename, &buf) != -1)) {
1165                 cg->cpuacct_stat.filename = strdupz(filename);
1166                 cg->cpuacct_stat.enabled = cgroup_enable_cpuacct_stat;
1167                 debug(D_CGROUP, "cpuacct.stat filename for cgroup '%s': '%s'", cg->id, cg->cpuacct_stat.filename);
1168             }
1169             else
1170                 debug(D_CGROUP, "cpuacct.stat file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1171         }
1172
1173         if(unlikely(cgroup_enable_cpuacct_usage && !cg->cpuacct_usage.filename && !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE))) {
1174             snprintfz(filename, FILENAME_MAX, "%s%s/cpuacct.usage_percpu", cgroup_cpuacct_base, cg->id);
1175             if(likely(stat(filename, &buf) != -1)) {
1176                 cg->cpuacct_usage.filename = strdupz(filename);
1177                 cg->cpuacct_usage.enabled = cgroup_enable_cpuacct_usage;
1178                 debug(D_CGROUP, "cpuacct.usage_percpu filename for cgroup '%s': '%s'", cg->id, cg->cpuacct_usage.filename);
1179             }
1180             else
1181                 debug(D_CGROUP, "cpuacct.usage_percpu file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1182         }
1183
1184         if(unlikely((cgroup_enable_detailed_memory || cgroup_used_memory_without_cache) && !cg->memory.filename_detailed && (cgroup_used_memory_without_cache || cgroup_enable_systemd_services_detailed_memory || !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)))) {
1185             snprintfz(filename, FILENAME_MAX, "%s%s/memory.stat", cgroup_memory_base, cg->id);
1186             if(likely(stat(filename, &buf) != -1)) {
1187                 cg->memory.filename_detailed = strdupz(filename);
1188                 cg->memory.enabled_detailed = (cgroup_enable_detailed_memory == CONFIG_BOOLEAN_YES)?CONFIG_BOOLEAN_YES:CONFIG_BOOLEAN_AUTO;
1189                 debug(D_CGROUP, "memory.stat filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_detailed);
1190             }
1191             else
1192                 debug(D_CGROUP, "memory.stat file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1193         }
1194
1195         if(unlikely(cgroup_enable_memory && !cg->memory.filename_usage_in_bytes)) {
1196             snprintfz(filename, FILENAME_MAX, "%s%s/memory.usage_in_bytes", cgroup_memory_base, cg->id);
1197             if(likely(stat(filename, &buf) != -1)) {
1198                 cg->memory.filename_usage_in_bytes = strdupz(filename);
1199                 cg->memory.enabled_usage_in_bytes = cgroup_enable_memory;
1200                 debug(D_CGROUP, "memory.usage_in_bytes filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_usage_in_bytes);
1201             }
1202             else
1203                 debug(D_CGROUP, "memory.usage_in_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1204         }
1205
1206         if(unlikely(cgroup_enable_swap && !cg->memory.filename_msw_usage_in_bytes)) {
1207             snprintfz(filename, FILENAME_MAX, "%s%s/memory.msw_usage_in_bytes", cgroup_memory_base, cg->id);
1208             if(likely(stat(filename, &buf) != -1)) {
1209                 cg->memory.filename_msw_usage_in_bytes = strdupz(filename);
1210                 cg->memory.enabled_msw_usage_in_bytes = cgroup_enable_swap;
1211                 debug(D_CGROUP, "memory.msw_usage_in_bytes filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_msw_usage_in_bytes);
1212             }
1213             else
1214                 debug(D_CGROUP, "memory.msw_usage_in_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1215         }
1216
1217         if(unlikely(cgroup_enable_memory_failcnt && !cg->memory.filename_failcnt)) {
1218             snprintfz(filename, FILENAME_MAX, "%s%s/memory.failcnt", cgroup_memory_base, cg->id);
1219             if(likely(stat(filename, &buf) != -1)) {
1220                 cg->memory.filename_failcnt = strdupz(filename);
1221                 cg->memory.enabled_failcnt = cgroup_enable_memory_failcnt;
1222                 debug(D_CGROUP, "memory.failcnt filename for cgroup '%s': '%s'", cg->id, cg->memory.filename_failcnt);
1223             }
1224             else
1225                 debug(D_CGROUP, "memory.failcnt file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1226         }
1227
1228         if(unlikely(cgroup_enable_blkio_io && !cg->io_service_bytes.filename)) {
1229             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_service_bytes", cgroup_blkio_base, cg->id);
1230             if(likely(stat(filename, &buf) != -1)) {
1231                 cg->io_service_bytes.filename = strdupz(filename);
1232                 cg->io_service_bytes.enabled = cgroup_enable_blkio_io;
1233                 debug(D_CGROUP, "io_service_bytes filename for cgroup '%s': '%s'", cg->id, cg->io_service_bytes.filename);
1234             }
1235             else
1236                 debug(D_CGROUP, "io_service_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1237         }
1238
1239         if(unlikely(cgroup_enable_blkio_ops && !cg->io_serviced.filename)) {
1240             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_serviced", cgroup_blkio_base, cg->id);
1241             if(likely(stat(filename, &buf) != -1)) {
1242                 cg->io_serviced.filename = strdupz(filename);
1243                 cg->io_serviced.enabled = cgroup_enable_blkio_ops;
1244                 debug(D_CGROUP, "io_serviced filename for cgroup '%s': '%s'", cg->id, cg->io_serviced.filename);
1245             }
1246             else
1247                 debug(D_CGROUP, "io_serviced file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1248         }
1249
1250         if(unlikely(cgroup_enable_blkio_throttle_io && !cg->throttle_io_service_bytes.filename)) {
1251             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.throttle.io_service_bytes", cgroup_blkio_base, cg->id);
1252             if(likely(stat(filename, &buf) != -1)) {
1253                 cg->throttle_io_service_bytes.filename = strdupz(filename);
1254                 cg->throttle_io_service_bytes.enabled = cgroup_enable_blkio_throttle_io;
1255                 debug(D_CGROUP, "throttle_io_service_bytes filename for cgroup '%s': '%s'", cg->id, cg->throttle_io_service_bytes.filename);
1256             }
1257             else
1258                 debug(D_CGROUP, "throttle_io_service_bytes file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1259         }
1260
1261         if(unlikely(cgroup_enable_blkio_throttle_ops && !cg->throttle_io_serviced.filename)) {
1262             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.throttle.io_serviced", cgroup_blkio_base, cg->id);
1263             if(likely(stat(filename, &buf) != -1)) {
1264                 cg->throttle_io_serviced.filename = strdupz(filename);
1265                 cg->throttle_io_serviced.enabled = cgroup_enable_blkio_throttle_ops;
1266                 debug(D_CGROUP, "throttle_io_serviced filename for cgroup '%s': '%s'", cg->id, cg->throttle_io_serviced.filename);
1267             }
1268             else
1269                 debug(D_CGROUP, "throttle_io_serviced file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1270         }
1271
1272         if(unlikely(cgroup_enable_blkio_merged_ops && !cg->io_merged.filename)) {
1273             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_merged", cgroup_blkio_base, cg->id);
1274             if(likely(stat(filename, &buf) != -1)) {
1275                 cg->io_merged.filename = strdupz(filename);
1276                 cg->io_merged.enabled = cgroup_enable_blkio_merged_ops;
1277                 debug(D_CGROUP, "io_merged filename for cgroup '%s': '%s'", cg->id, cg->io_merged.filename);
1278             }
1279             else
1280                 debug(D_CGROUP, "io_merged file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1281         }
1282
1283         if(unlikely(cgroup_enable_blkio_queued_ops && !cg->io_queued.filename)) {
1284             snprintfz(filename, FILENAME_MAX, "%s%s/blkio.io_queued", cgroup_blkio_base, cg->id);
1285             if(likely(stat(filename, &buf) != -1)) {
1286                 cg->io_queued.filename = strdupz(filename);
1287                 cg->io_queued.enabled = cgroup_enable_blkio_queued_ops;
1288                 debug(D_CGROUP, "io_queued filename for cgroup '%s': '%s'", cg->id, cg->io_queued.filename);
1289             }
1290             else
1291                 debug(D_CGROUP, "io_queued file for cgroup '%s': '%s' does not exist.", cg->id, filename);
1292         }
1293     }
1294
1295     debug(D_CGROUP, "done searching for cgroups");
1296     return;
1297 }
1298
1299 // ----------------------------------------------------------------------------
1300 // generate charts
1301
1302 #define CHART_TITLE_MAX 300
1303
1304 void update_systemd_services_charts(
1305           int update_every
1306         , int do_cpu
1307         , int do_mem_usage
1308         , int do_mem_detailed
1309         , int do_mem_failcnt
1310         , int do_swap_usage
1311         , int do_io
1312         , int do_io_ops
1313         , int do_throttle_io
1314         , int do_throttle_ops
1315         , int do_queued_ops
1316         , int do_merged_ops
1317 ) {
1318     static RRDSET
1319         *st_cpu = NULL,
1320         *st_mem_usage = NULL,
1321         *st_mem_failcnt = NULL,
1322         *st_swap_usage = NULL,
1323
1324         *st_mem_detailed_cache = NULL,
1325         *st_mem_detailed_rss = NULL,
1326         *st_mem_detailed_mapped = NULL,
1327         *st_mem_detailed_writeback = NULL,
1328         *st_mem_detailed_pgfault = NULL,
1329         *st_mem_detailed_pgmajfault = NULL,
1330         *st_mem_detailed_pgpgin = NULL,
1331         *st_mem_detailed_pgpgout = NULL,
1332
1333         *st_io_read = NULL,
1334         *st_io_serviced_read = NULL,
1335         *st_throttle_io_read = NULL,
1336         *st_throttle_ops_read = NULL,
1337         *st_queued_ops_read = NULL,
1338         *st_merged_ops_read = NULL,
1339
1340         *st_io_write = NULL,
1341         *st_io_serviced_write = NULL,
1342         *st_throttle_io_write = NULL,
1343         *st_throttle_ops_write = NULL,
1344         *st_queued_ops_write = NULL,
1345         *st_merged_ops_write = NULL;
1346
1347     // create the charts
1348
1349     if(likely(do_cpu)) {
1350         if(unlikely(!st_cpu)) {
1351             char title[CHART_TITLE_MAX + 1];
1352             snprintfz(title, CHART_TITLE_MAX, "Systemd Services CPU utilization (%d%% = %d core%s)", (processors * 100), processors, (processors > 1) ? "s" : "");
1353
1354             st_cpu = rrdset_create_localhost(
1355                     "services"
1356                     , "cpu"
1357                     , NULL
1358                     , "cpu"
1359                     , "services.cpu"
1360                     , title
1361                     , "%"
1362                     , CHART_PRIORITY_SYSTEMD_SERVICES
1363                     , update_every
1364                     , RRDSET_TYPE_STACKED
1365             );
1366
1367         }
1368         else
1369             rrdset_next(st_cpu);
1370     }
1371
1372     if(likely(do_mem_usage)) {
1373         if(unlikely(!st_mem_usage)) {
1374
1375             st_mem_usage = rrdset_create_localhost(
1376                     "services"
1377                     , "mem_usage"
1378                     , NULL
1379                     , "mem"
1380                     , "services.mem_usage"
1381                     , (cgroup_used_memory_without_cache) ? "Systemd Services Used Memory without Cache"
1382                                                          : "Systemd Services Used Memory"
1383                     , "MB"
1384                     , CHART_PRIORITY_SYSTEMD_SERVICES + 10
1385                     , update_every
1386                     , RRDSET_TYPE_STACKED
1387             );
1388
1389         }
1390         else
1391             rrdset_next(st_mem_usage);
1392     }
1393
1394     if(likely(do_mem_detailed)) {
1395         if(unlikely(!st_mem_detailed_rss)) {
1396
1397             st_mem_detailed_rss = rrdset_create_localhost(
1398                     "services"
1399                     , "mem_rss"
1400                     , NULL
1401                     , "mem"
1402                     , "services.mem_rss"
1403                     , "Systemd Services RSS Memory"
1404                     , "MB"
1405                     , CHART_PRIORITY_SYSTEMD_SERVICES + 20
1406                     , update_every
1407                     , RRDSET_TYPE_STACKED
1408             );
1409
1410         }
1411         else
1412             rrdset_next(st_mem_detailed_rss);
1413
1414         if(unlikely(!st_mem_detailed_mapped)) {
1415
1416             st_mem_detailed_mapped = rrdset_create_localhost(
1417                     "services"
1418                     , "mem_mapped"
1419                     , NULL
1420                     , "mem"
1421                     , "services.mem_mapped"
1422                     , "Systemd Services Mapped Memory"
1423                     , "MB"
1424                     , CHART_PRIORITY_SYSTEMD_SERVICES + 30
1425                     , update_every
1426                     , RRDSET_TYPE_STACKED
1427             );
1428
1429         }
1430         else
1431             rrdset_next(st_mem_detailed_mapped);
1432
1433         if(unlikely(!st_mem_detailed_cache)) {
1434
1435             st_mem_detailed_cache = rrdset_create_localhost(
1436                     "services"
1437                     , "mem_cache"
1438                     , NULL
1439                     , "mem"
1440                     , "services.mem_cache"
1441                     , "Systemd Services Cache Memory"
1442                     , "MB"
1443                     , CHART_PRIORITY_SYSTEMD_SERVICES + 40
1444                     , update_every
1445                     , RRDSET_TYPE_STACKED
1446             );
1447
1448         }
1449         else
1450             rrdset_next(st_mem_detailed_cache);
1451
1452         if(unlikely(!st_mem_detailed_writeback)) {
1453
1454             st_mem_detailed_writeback = rrdset_create_localhost(
1455                     "services"
1456                     , "mem_writeback"
1457                     , NULL
1458                     , "mem"
1459                     , "services.mem_writeback"
1460                     , "Systemd Services Writeback Memory"
1461                     , "MB"
1462                     , CHART_PRIORITY_SYSTEMD_SERVICES + 50
1463                     , update_every
1464                     , RRDSET_TYPE_STACKED
1465             );
1466
1467         }
1468         else
1469             rrdset_next(st_mem_detailed_writeback);
1470
1471         if(unlikely(!st_mem_detailed_pgfault)) {
1472
1473             st_mem_detailed_pgfault = rrdset_create_localhost(
1474                     "services"
1475                     , "mem_pgfault"
1476                     , NULL
1477                     , "mem"
1478                     , "services.mem_pgfault"
1479                     , "Systemd Services Memory Minor Page Faults"
1480                     , "MB/s"
1481                     , CHART_PRIORITY_SYSTEMD_SERVICES + 60
1482                     , update_every
1483                     , RRDSET_TYPE_STACKED
1484             );
1485         }
1486         else
1487             rrdset_next(st_mem_detailed_pgfault);
1488
1489         if(unlikely(!st_mem_detailed_pgmajfault)) {
1490
1491             st_mem_detailed_pgmajfault = rrdset_create_localhost(
1492                     "services"
1493                     , "mem_pgmajfault"
1494                     , NULL
1495                     , "mem"
1496                     , "services.mem_pgmajfault"
1497                     , "Systemd Services Memory Major Page Faults"
1498                     , "MB/s"
1499                     , CHART_PRIORITY_SYSTEMD_SERVICES + 70
1500                     , update_every
1501                     , RRDSET_TYPE_STACKED
1502             );
1503
1504         }
1505         else
1506             rrdset_next(st_mem_detailed_pgmajfault);
1507
1508         if(unlikely(!st_mem_detailed_pgpgin)) {
1509
1510             st_mem_detailed_pgpgin = rrdset_create_localhost(
1511                     "services"
1512                     , "mem_pgpgin"
1513                     , NULL
1514                     , "mem"
1515                     , "services.mem_pgpgin"
1516                     , "Systemd Services Memory Charging Activity"
1517                     , "MB/s"
1518                     , CHART_PRIORITY_SYSTEMD_SERVICES + 80
1519                     , update_every
1520                     , RRDSET_TYPE_STACKED
1521             );
1522
1523         }
1524         else
1525             rrdset_next(st_mem_detailed_pgpgin);
1526
1527         if(unlikely(!st_mem_detailed_pgpgout)) {
1528
1529             st_mem_detailed_pgpgout = rrdset_create_localhost(
1530                     "services"
1531                     , "mem_pgpgout"
1532                     , NULL
1533                     , "mem"
1534                     , "services.mem_pgpgout"
1535                     , "Systemd Services Memory Uncharging Activity"
1536                     , "MB/s"
1537                     , CHART_PRIORITY_SYSTEMD_SERVICES + 90
1538                     , update_every
1539                     , RRDSET_TYPE_STACKED
1540             );
1541
1542         }
1543         else
1544             rrdset_next(st_mem_detailed_pgpgout);
1545     }
1546
1547     if(likely(do_mem_failcnt)) {
1548         if(unlikely(!st_mem_failcnt)) {
1549
1550             st_mem_failcnt = rrdset_create_localhost(
1551                     "services"
1552                     , "mem_failcnt"
1553                     , NULL
1554                     , "mem"
1555                     , "services.mem_failcnt"
1556                     , "Systemd Services Memory Limit Failures"
1557                     , "MB"
1558                     , CHART_PRIORITY_SYSTEMD_SERVICES + 110
1559                     , update_every
1560                     , RRDSET_TYPE_STACKED
1561             );
1562
1563         }
1564         else
1565             rrdset_next(st_mem_failcnt);
1566     }
1567
1568     if(likely(do_swap_usage)) {
1569         if(unlikely(!st_swap_usage)) {
1570
1571             st_swap_usage = rrdset_create_localhost(
1572                     "services"
1573                     , "swap_usage"
1574                     , NULL
1575                     , "swap"
1576                     , "services.swap_usage"
1577                     , "Systemd Services Swap Memory Used"
1578                     , "MB"
1579                     , CHART_PRIORITY_SYSTEMD_SERVICES + 100
1580                     , update_every
1581                     , RRDSET_TYPE_STACKED
1582             );
1583
1584         }
1585         else
1586             rrdset_next(st_swap_usage);
1587     }
1588
1589     if(likely(do_io)) {
1590         if(unlikely(!st_io_read)) {
1591
1592             st_io_read = rrdset_create_localhost(
1593                     "services"
1594                     , "io_read"
1595                     , NULL
1596                     , "disk"
1597                     , "services.io_read"
1598                     , "Systemd Services Disk Read Bandwidth"
1599                     , "KB/s"
1600                     , CHART_PRIORITY_SYSTEMD_SERVICES + 120
1601                     , update_every
1602                     , RRDSET_TYPE_STACKED
1603             );
1604
1605         }
1606         else
1607             rrdset_next(st_io_read);
1608
1609         if(unlikely(!st_io_write)) {
1610
1611             st_io_write = rrdset_create_localhost(
1612                     "services"
1613                     , "io_write"
1614                     , NULL
1615                     , "disk"
1616                     , "services.io_write"
1617                     , "Systemd Services Disk Write Bandwidth"
1618                     , "KB/s"
1619                     , CHART_PRIORITY_SYSTEMD_SERVICES + 130
1620                     , update_every
1621                     , RRDSET_TYPE_STACKED
1622             );
1623
1624         }
1625         else
1626             rrdset_next(st_io_write);
1627     }
1628
1629     if(likely(do_io_ops)) {
1630         if(unlikely(!st_io_serviced_read)) {
1631
1632             st_io_serviced_read = rrdset_create_localhost(
1633                     "services"
1634                     , "io_ops_read"
1635                     , NULL
1636                     , "disk"
1637                     , "services.io_ops_read"
1638                     , "Systemd Services Disk Read Operations"
1639                     , "operations/s"
1640                     , CHART_PRIORITY_SYSTEMD_SERVICES + 140
1641                     , update_every
1642                     , RRDSET_TYPE_STACKED
1643             );
1644
1645         }
1646         else
1647             rrdset_next(st_io_serviced_read);
1648
1649         if(unlikely(!st_io_serviced_write)) {
1650
1651             st_io_serviced_write = rrdset_create_localhost(
1652                     "services"
1653                     , "io_ops_write"
1654                     , NULL
1655                     , "disk"
1656                     , "services.io_ops_write"
1657                     , "Systemd Services Disk Write Operations"
1658                     , "operations/s"
1659                     , CHART_PRIORITY_SYSTEMD_SERVICES + 150
1660                     , update_every
1661                     , RRDSET_TYPE_STACKED
1662             );
1663
1664         }
1665         else
1666             rrdset_next(st_io_serviced_write);
1667     }
1668
1669     if(likely(do_throttle_io)) {
1670         if(unlikely(!st_throttle_io_read)) {
1671
1672             st_throttle_io_read = rrdset_create_localhost(
1673                     "services"
1674                     , "throttle_io_read"
1675                     , NULL
1676                     , "disk"
1677                     , "services.throttle_io_read"
1678                     , "Systemd Services Throttle Disk Read Bandwidth"
1679                     , "KB/s"
1680                     , CHART_PRIORITY_SYSTEMD_SERVICES + 160
1681                     , update_every
1682                     , RRDSET_TYPE_STACKED
1683             );
1684
1685         }
1686         else
1687             rrdset_next(st_throttle_io_read);
1688
1689         if(unlikely(!st_throttle_io_write)) {
1690
1691             st_throttle_io_write = rrdset_create_localhost(
1692                     "services"
1693                     , "throttle_io_write"
1694                     , NULL
1695                     , "disk"
1696                     , "services.throttle_io_write"
1697                     , "Systemd Services Throttle Disk Write Bandwidth"
1698                     , "KB/s"
1699                     , CHART_PRIORITY_SYSTEMD_SERVICES + 170
1700                     , update_every
1701                     , RRDSET_TYPE_STACKED
1702             );
1703
1704         }
1705         else
1706             rrdset_next(st_throttle_io_write);
1707     }
1708
1709     if(likely(do_throttle_ops)) {
1710         if(unlikely(!st_throttle_ops_read)) {
1711
1712             st_throttle_ops_read = rrdset_create_localhost(
1713                     "services"
1714                     , "throttle_io_ops_read"
1715                     , NULL
1716                     , "disk"
1717                     , "services.throttle_io_ops_read"
1718                     , "Systemd Services Throttle Disk Read Operations"
1719                     , "operations/s"
1720                     , CHART_PRIORITY_SYSTEMD_SERVICES + 180
1721                     , update_every
1722                     , RRDSET_TYPE_STACKED
1723             );
1724
1725         }
1726         else
1727             rrdset_next(st_throttle_ops_read);
1728
1729         if(unlikely(!st_throttle_ops_write)) {
1730
1731             st_throttle_ops_write = rrdset_create_localhost(
1732                     "services"
1733                     , "throttle_io_ops_write"
1734                     , NULL
1735                     , "disk"
1736                     , "services.throttle_io_ops_write"
1737                     , "Systemd Services Throttle Disk Write Operations"
1738                     , "operations/s"
1739                     , CHART_PRIORITY_SYSTEMD_SERVICES + 190
1740                     , update_every
1741                     , RRDSET_TYPE_STACKED
1742             );
1743
1744         }
1745         else
1746             rrdset_next(st_throttle_ops_write);
1747     }
1748
1749     if(likely(do_queued_ops)) {
1750         if(unlikely(!st_queued_ops_read)) {
1751
1752             st_queued_ops_read = rrdset_create_localhost(
1753                     "services"
1754                     , "queued_io_ops_read"
1755                     , NULL
1756                     , "disk"
1757                     , "services.queued_io_ops_read"
1758                     , "Systemd Services Queued Disk Read Operations"
1759                     , "operations/s"
1760                     , CHART_PRIORITY_SYSTEMD_SERVICES + 200
1761                     , update_every
1762                     , RRDSET_TYPE_STACKED
1763             );
1764
1765         }
1766         else
1767             rrdset_next(st_queued_ops_read);
1768
1769         if(unlikely(!st_queued_ops_write)) {
1770
1771             st_queued_ops_write = rrdset_create_localhost(
1772                     "services"
1773                     , "queued_io_ops_write"
1774                     , NULL
1775                     , "disk"
1776                     , "services.queued_io_ops_write"
1777                     , "Systemd Services Queued Disk Write Operations"
1778                     , "operations/s"
1779                     , CHART_PRIORITY_SYSTEMD_SERVICES + 210
1780                     , update_every
1781                     , RRDSET_TYPE_STACKED
1782             );
1783
1784         }
1785         else
1786             rrdset_next(st_queued_ops_write);
1787     }
1788
1789     if(likely(do_merged_ops)) {
1790         if(unlikely(!st_merged_ops_read)) {
1791
1792             st_merged_ops_read = rrdset_create_localhost(
1793                     "services"
1794                     , "merged_io_ops_read"
1795                     , NULL
1796                     , "disk"
1797                     , "services.merged_io_ops_read"
1798                     , "Systemd Services Merged Disk Read Operations"
1799                     , "operations/s"
1800                     , CHART_PRIORITY_SYSTEMD_SERVICES + 220
1801                     , update_every
1802                     , RRDSET_TYPE_STACKED
1803             );
1804
1805         }
1806         else
1807             rrdset_next(st_merged_ops_read);
1808
1809         if(unlikely(!st_merged_ops_write)) {
1810
1811             st_merged_ops_write = rrdset_create_localhost(
1812                     "services"
1813                     , "merged_io_ops_write"
1814                     , NULL
1815                     , "disk"
1816                     , "services.merged_io_ops_write"
1817                     , "Systemd Services Merged Disk Write Operations"
1818                     , "operations/s"
1819                     , CHART_PRIORITY_SYSTEMD_SERVICES + 230
1820                     , update_every
1821                     , RRDSET_TYPE_STACKED
1822             );
1823
1824         }
1825         else
1826             rrdset_next(st_merged_ops_write);
1827     }
1828
1829     // update the values
1830     struct cgroup *cg;
1831     for(cg = cgroup_root; cg ; cg = cg->next) {
1832         if(unlikely(!cg->available || !cg->enabled || !(cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)))
1833             continue;
1834
1835         if(likely(do_cpu && cg->cpuacct_stat.updated)) {
1836             if(unlikely(!cg->rd_cpu))
1837                 cg->rd_cpu = rrddim_add(st_cpu, cg->chart_id, cg->chart_title, 100, hz, RRD_ALGORITHM_INCREMENTAL);
1838
1839             rrddim_set_by_pointer(st_cpu, cg->rd_cpu, cg->cpuacct_stat.user + cg->cpuacct_stat.system);
1840         }
1841
1842         if(likely(do_mem_usage && cg->memory.updated_usage_in_bytes)) {
1843             if(unlikely(!cg->rd_mem_usage))
1844                 cg->rd_mem_usage = rrddim_add(st_mem_usage, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1845
1846             rrddim_set_by_pointer(st_mem_usage, cg->rd_mem_usage, cg->memory.usage_in_bytes - ((cgroup_used_memory_without_cache)?cg->memory.cache:0));
1847         }
1848
1849         if(likely(do_mem_detailed && cg->memory.updated_detailed)) {
1850             if(unlikely(!cg->rd_mem_detailed_rss))
1851                 cg->rd_mem_detailed_rss = rrddim_add(st_mem_detailed_rss, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1852
1853             rrddim_set_by_pointer(st_mem_detailed_rss, cg->rd_mem_detailed_rss, cg->memory.rss + cg->memory.rss_huge);
1854
1855             if(unlikely(!cg->rd_mem_detailed_mapped))
1856                 cg->rd_mem_detailed_mapped = rrddim_add(st_mem_detailed_mapped, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1857
1858             rrddim_set_by_pointer(st_mem_detailed_mapped, cg->rd_mem_detailed_mapped, cg->memory.mapped_file);
1859
1860             if(unlikely(!cg->rd_mem_detailed_cache))
1861                 cg->rd_mem_detailed_cache = rrddim_add(st_mem_detailed_cache, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1862
1863             rrddim_set_by_pointer(st_mem_detailed_cache, cg->rd_mem_detailed_cache, cg->memory.cache);
1864
1865             if(unlikely(!cg->rd_mem_detailed_writeback))
1866                 cg->rd_mem_detailed_writeback = rrddim_add(st_mem_detailed_writeback, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1867
1868             rrddim_set_by_pointer(st_mem_detailed_writeback, cg->rd_mem_detailed_writeback, cg->memory.writeback);
1869
1870             if(unlikely(!cg->rd_mem_detailed_pgfault))
1871                 cg->rd_mem_detailed_pgfault = rrddim_add(st_mem_detailed_pgfault, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
1872
1873             rrddim_set_by_pointer(st_mem_detailed_pgfault, cg->rd_mem_detailed_pgfault, cg->memory.pgfault);
1874
1875             if(unlikely(!cg->rd_mem_detailed_pgmajfault))
1876                 cg->rd_mem_detailed_pgmajfault = rrddim_add(st_mem_detailed_pgmajfault, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
1877
1878             rrddim_set_by_pointer(st_mem_detailed_pgmajfault, cg->rd_mem_detailed_pgmajfault, cg->memory.pgmajfault);
1879
1880             if(unlikely(!cg->rd_mem_detailed_pgpgin))
1881                 cg->rd_mem_detailed_pgpgin = rrddim_add(st_mem_detailed_pgpgin, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
1882
1883             rrddim_set_by_pointer(st_mem_detailed_pgpgin, cg->rd_mem_detailed_pgpgin, cg->memory.pgpgin);
1884
1885             if(unlikely(!cg->rd_mem_detailed_pgpgout))
1886                 cg->rd_mem_detailed_pgpgout = rrddim_add(st_mem_detailed_pgpgout, cg->chart_id, cg->chart_title, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
1887
1888             rrddim_set_by_pointer(st_mem_detailed_pgpgout, cg->rd_mem_detailed_pgpgout, cg->memory.pgpgout);
1889         }
1890
1891         if(likely(do_mem_failcnt && cg->memory.updated_failcnt)) {
1892             if(unlikely(!cg->rd_mem_failcnt))
1893                 cg->rd_mem_failcnt = rrddim_add(st_mem_failcnt, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1894
1895             rrddim_set_by_pointer(st_mem_failcnt, cg->rd_mem_failcnt, cg->memory.failcnt);
1896         }
1897
1898         if(likely(do_swap_usage && cg->memory.updated_msw_usage_in_bytes)) {
1899             if(unlikely(!cg->rd_swap_usage))
1900                 cg->rd_swap_usage = rrddim_add(st_swap_usage, cg->chart_id, cg->chart_title, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
1901
1902             rrddim_set_by_pointer(st_swap_usage, cg->rd_swap_usage, cg->memory.msw_usage_in_bytes);
1903         }
1904
1905         if(likely(do_io && cg->io_service_bytes.updated)) {
1906             if(unlikely(!cg->rd_io_service_bytes_read))
1907                 cg->rd_io_service_bytes_read = rrddim_add(st_io_read, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
1908
1909             rrddim_set_by_pointer(st_io_read, cg->rd_io_service_bytes_read, cg->io_service_bytes.Read);
1910
1911             if(unlikely(!cg->rd_io_service_bytes_write))
1912                 cg->rd_io_service_bytes_write = rrddim_add(st_io_write, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
1913
1914             rrddim_set_by_pointer(st_io_write, cg->rd_io_service_bytes_write, cg->io_service_bytes.Write);
1915         }
1916
1917         if(likely(do_io_ops && cg->io_serviced.updated)) {
1918             if(unlikely(!cg->rd_io_serviced_read))
1919                 cg->rd_io_serviced_read = rrddim_add(st_io_serviced_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1920
1921             rrddim_set_by_pointer(st_io_serviced_read, cg->rd_io_serviced_read, cg->io_serviced.Read);
1922
1923             if(unlikely(!cg->rd_io_serviced_write))
1924                 cg->rd_io_serviced_write = rrddim_add(st_io_serviced_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1925
1926             rrddim_set_by_pointer(st_io_serviced_write, cg->rd_io_serviced_write, cg->io_serviced.Write);
1927         }
1928
1929         if(likely(do_throttle_io && cg->throttle_io_service_bytes.updated)) {
1930             if(unlikely(!cg->rd_throttle_io_read))
1931                 cg->rd_throttle_io_read = rrddim_add(st_throttle_io_read, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
1932
1933             rrddim_set_by_pointer(st_throttle_io_read, cg->rd_throttle_io_read, cg->throttle_io_service_bytes.Read);
1934
1935             if(unlikely(!cg->rd_throttle_io_write))
1936                 cg->rd_throttle_io_write = rrddim_add(st_throttle_io_write, cg->chart_id, cg->chart_title, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
1937
1938             rrddim_set_by_pointer(st_throttle_io_write, cg->rd_throttle_io_write, cg->throttle_io_service_bytes.Write);
1939         }
1940
1941         if(likely(do_throttle_ops && cg->throttle_io_serviced.updated)) {
1942             if(unlikely(!cg->rd_throttle_io_serviced_read))
1943                 cg->rd_throttle_io_serviced_read = rrddim_add(st_throttle_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1944
1945             rrddim_set_by_pointer(st_throttle_ops_read, cg->rd_throttle_io_serviced_read, cg->throttle_io_serviced.Read);
1946
1947             if(unlikely(!cg->rd_throttle_io_serviced_write))
1948                 cg->rd_throttle_io_serviced_write = rrddim_add(st_throttle_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1949
1950             rrddim_set_by_pointer(st_throttle_ops_write, cg->rd_throttle_io_serviced_write, cg->throttle_io_serviced.Write);
1951         }
1952
1953         if(likely(do_queued_ops && cg->io_queued.updated)) {
1954             if(unlikely(!cg->rd_io_queued_read))
1955                 cg->rd_io_queued_read = rrddim_add(st_queued_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1956
1957             rrddim_set_by_pointer(st_queued_ops_read, cg->rd_io_queued_read, cg->io_queued.Read);
1958
1959             if(unlikely(!cg->rd_io_queued_write))
1960                 cg->rd_io_queued_write = rrddim_add(st_queued_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1961
1962             rrddim_set_by_pointer(st_queued_ops_write, cg->rd_io_queued_write, cg->io_queued.Write);
1963         }
1964
1965         if(likely(do_merged_ops && cg->io_merged.updated)) {
1966             if(unlikely(!cg->rd_io_merged_read))
1967                 cg->rd_io_merged_read = rrddim_add(st_merged_ops_read, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1968
1969             rrddim_set_by_pointer(st_merged_ops_read, cg->rd_io_merged_read, cg->io_merged.Read);
1970
1971             if(unlikely(!cg->rd_io_merged_write))
1972                 cg->rd_io_merged_write = rrddim_add(st_merged_ops_write, cg->chart_id, cg->chart_title, 1, 1, RRD_ALGORITHM_INCREMENTAL);
1973
1974             rrddim_set_by_pointer(st_merged_ops_write, cg->rd_io_merged_write, cg->io_merged.Write);
1975         }
1976     }
1977
1978     // complete the iteration
1979     if(likely(do_cpu))
1980         rrdset_done(st_cpu);
1981
1982     if(likely(do_mem_usage))
1983         rrdset_done(st_mem_usage);
1984
1985     if(unlikely(do_mem_detailed)) {
1986         rrdset_done(st_mem_detailed_cache);
1987         rrdset_done(st_mem_detailed_rss);
1988         rrdset_done(st_mem_detailed_mapped);
1989         rrdset_done(st_mem_detailed_writeback);
1990         rrdset_done(st_mem_detailed_pgfault);
1991         rrdset_done(st_mem_detailed_pgmajfault);
1992         rrdset_done(st_mem_detailed_pgpgin);
1993         rrdset_done(st_mem_detailed_pgpgout);
1994     }
1995
1996     if(likely(do_mem_failcnt))
1997         rrdset_done(st_mem_failcnt);
1998
1999     if(likely(do_swap_usage))
2000         rrdset_done(st_swap_usage);
2001
2002     if(likely(do_io)) {
2003         rrdset_done(st_io_read);
2004         rrdset_done(st_io_write);
2005     }
2006
2007     if(likely(do_io_ops)) {
2008         rrdset_done(st_io_serviced_read);
2009         rrdset_done(st_io_serviced_write);
2010     }
2011
2012     if(likely(do_throttle_io)) {
2013         rrdset_done(st_throttle_io_read);
2014         rrdset_done(st_throttle_io_write);
2015     }
2016
2017     if(likely(do_throttle_ops)) {
2018         rrdset_done(st_throttle_ops_read);
2019         rrdset_done(st_throttle_ops_write);
2020     }
2021
2022     if(likely(do_queued_ops)) {
2023         rrdset_done(st_queued_ops_read);
2024         rrdset_done(st_queued_ops_write);
2025     }
2026
2027     if(likely(do_merged_ops)) {
2028         rrdset_done(st_merged_ops_read);
2029         rrdset_done(st_merged_ops_write);
2030     }
2031 }
2032
// Build (once) the chart "type" string used as the chart id prefix of a cgroup.
//
// buffer: caller-owned scratch buffer. If it already holds a non-empty string
//         it is treated as previously computed and returned untouched, so the
//         caller resets buffer[0] to '\0' before handling a new cgroup.
// id:     the cgroup chart id. An empty id or "/" maps to "cgroup_root",
//         anything else maps to "cgroup_<id>".
// len:    size limit handed to snprintfz(). Callers in this file pass
//         RRD_ID_LENGTH_MAX for a buffer of RRD_ID_LENGTH_MAX + 1 bytes.
//
// Returns buffer, after it has been passed through netdata_fix_chart_id().
static inline char *cgroup_chart_type(char *buffer, const char *id, size_t len) {
    if(buffer[0]) return buffer;

    if(id[0] == '\0' || (id[0] == '/' && id[1] == '\0'))
        // snprintfz() rather than strncpy(): strncpy() leaves the destination
        // without a terminator when the source does not fit in len bytes
        snprintfz(buffer, len, "cgroup_root");
    else
        snprintfz(buffer, len, "cgroup_%s", id);

    netdata_fix_chart_id(buffer);
    return buffer;
}
2044
2045 void update_cgroup_charts(int update_every) {
2046     debug(D_CGROUP, "updating cgroups charts");
2047
2048     char type[RRD_ID_LENGTH_MAX + 1];
2049     char title[CHART_TITLE_MAX + 1];
2050
2051     int services_do_cpu = 0,
2052             services_do_mem_usage = 0,
2053             services_do_mem_detailed = 0,
2054             services_do_mem_failcnt = 0,
2055             services_do_swap_usage = 0,
2056             services_do_io = 0,
2057             services_do_io_ops = 0,
2058             services_do_throttle_io = 0,
2059             services_do_throttle_ops = 0,
2060             services_do_queued_ops = 0,
2061             services_do_merged_ops = 0;
2062
2063     struct cgroup *cg;
2064     for(cg = cgroup_root; cg ; cg = cg->next) {
2065         if(unlikely(!cg->available || !cg->enabled))
2066             continue;
2067
2068         if(likely(cgroup_enable_systemd_services && cg->options & CGROUP_OPTIONS_SYSTEM_SLICE_SERVICE)) {
2069             if(cg->cpuacct_stat.updated && cg->cpuacct_stat.enabled == CONFIG_BOOLEAN_YES) services_do_cpu++;
2070
2071             if(cgroup_enable_systemd_services_detailed_memory && cg->memory.updated_detailed && cg->memory.enabled_detailed) services_do_mem_detailed++;
2072             if(cg->memory.updated_usage_in_bytes && cg->memory.enabled_usage_in_bytes == CONFIG_BOOLEAN_YES) services_do_mem_usage++;
2073             if(cg->memory.updated_failcnt && cg->memory.enabled_failcnt == CONFIG_BOOLEAN_YES) services_do_mem_failcnt++;
2074             if(cg->memory.updated_msw_usage_in_bytes && cg->memory.enabled_msw_usage_in_bytes == CONFIG_BOOLEAN_YES) services_do_swap_usage++;
2075
2076             if(cg->io_service_bytes.updated && cg->io_service_bytes.enabled == CONFIG_BOOLEAN_YES) services_do_io++;
2077             if(cg->io_serviced.updated && cg->io_serviced.enabled == CONFIG_BOOLEAN_YES) services_do_io_ops++;
2078             if(cg->throttle_io_service_bytes.updated && cg->throttle_io_service_bytes.enabled == CONFIG_BOOLEAN_YES) services_do_throttle_io++;
2079             if(cg->throttle_io_serviced.updated && cg->throttle_io_serviced.enabled == CONFIG_BOOLEAN_YES) services_do_throttle_ops++;
2080             if(cg->io_queued.updated && cg->io_queued.enabled == CONFIG_BOOLEAN_YES) services_do_queued_ops++;
2081             if(cg->io_merged.updated && cg->io_merged.enabled == CONFIG_BOOLEAN_YES) services_do_merged_ops++;
2082             continue;
2083         }
2084
2085         type[0] = '\0';
2086
2087         if(likely(cg->cpuacct_stat.updated && cg->cpuacct_stat.enabled == CONFIG_BOOLEAN_YES)) {
2088             if(unlikely(!cg->st_cpu)) {
2089                 snprintfz(title, CHART_TITLE_MAX, "CPU Usage (%d%% = %d core%s) for cgroup %s", (processors * 100), processors, (processors > 1) ? "s" : "", cg->chart_title);
2090
2091                 cg->st_cpu = rrdset_create_localhost(
2092                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2093                         , "cpu"
2094                         , NULL
2095                         , "cpu"
2096                         , "cgroup.cpu"
2097                         , title
2098                         , "%"
2099                         , CHART_PRIORITY_CONTAINERS
2100                         , update_every
2101                         , RRDSET_TYPE_STACKED
2102                 );
2103
2104                 rrddim_add(cg->st_cpu, "user", NULL, 100, hz, RRD_ALGORITHM_INCREMENTAL);
2105                 rrddim_add(cg->st_cpu, "system", NULL, 100, hz, RRD_ALGORITHM_INCREMENTAL);
2106             }
2107             else
2108                 rrdset_next(cg->st_cpu);
2109
2110             rrddim_set(cg->st_cpu, "user", cg->cpuacct_stat.user);
2111             rrddim_set(cg->st_cpu, "system", cg->cpuacct_stat.system);
2112             rrdset_done(cg->st_cpu);
2113         }
2114
2115         if(likely(cg->cpuacct_usage.updated && cg->cpuacct_usage.enabled == CONFIG_BOOLEAN_YES)) {
2116             char id[RRD_ID_LENGTH_MAX + 1];
2117             unsigned int i;
2118
2119             if(unlikely(!cg->st_cpu_per_core)) {
2120                 snprintfz(title, CHART_TITLE_MAX, "CPU Usage (%d%% = %d core%s) Per Core for cgroup %s", (processors * 100), processors, (processors > 1) ? "s" : "", cg->chart_title);
2121
2122                 cg->st_cpu_per_core = rrdset_create_localhost(
2123                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2124                         , "cpu_per_core"
2125                         , NULL
2126                         , "cpu"
2127                         , "cgroup.cpu_per_core"
2128                         , title
2129                         , "%"
2130                         , CHART_PRIORITY_CONTAINERS + 100
2131                         , update_every
2132                         , RRDSET_TYPE_STACKED
2133                 );
2134
2135                 for(i = 0; i < cg->cpuacct_usage.cpus; i++) {
2136                     snprintfz(id, RRD_ID_LENGTH_MAX, "cpu%u", i);
2137                     rrddim_add(cg->st_cpu_per_core, id, NULL, 100, 1000000000, RRD_ALGORITHM_INCREMENTAL);
2138                 }
2139             }
2140             else
2141                 rrdset_next(cg->st_cpu_per_core);
2142
2143             for(i = 0; i < cg->cpuacct_usage.cpus ;i++) {
2144                 snprintfz(id, RRD_ID_LENGTH_MAX, "cpu%u", i);
2145                 rrddim_set(cg->st_cpu_per_core, id, cg->cpuacct_usage.cpu_percpu[i]);
2146             }
2147             rrdset_done(cg->st_cpu_per_core);
2148         }
2149
2150         if(likely(cg->memory.updated_detailed && cg->memory.enabled_detailed == CONFIG_BOOLEAN_YES)) {
2151             if(unlikely(!cg->st_mem)) {
2152                 snprintfz(title, CHART_TITLE_MAX, "Memory Usage for cgroup %s", cg->chart_title);
2153
2154                 cg->st_mem = rrdset_create_localhost(
2155                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2156                         , "mem"
2157                         , NULL
2158                         , "mem"
2159                         , "cgroup.mem"
2160                         , title
2161                         , "MB"
2162                         , CHART_PRIORITY_CONTAINERS + 210
2163                         , update_every
2164                         , RRDSET_TYPE_STACKED
2165                 );
2166
2167                 rrddim_add(cg->st_mem, "cache", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2168                 rrddim_add(cg->st_mem, "rss", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2169
2170                 if(cg->memory.detailed_has_swap)
2171                     rrddim_add(cg->st_mem, "swap", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2172
2173                 rrddim_add(cg->st_mem, "rss_huge", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2174                 rrddim_add(cg->st_mem, "mapped_file", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2175             }
2176             else
2177                 rrdset_next(cg->st_mem);
2178
2179             rrddim_set(cg->st_mem, "cache", cg->memory.cache);
2180             rrddim_set(cg->st_mem, "rss", cg->memory.rss);
2181
2182             if(cg->memory.detailed_has_swap)
2183                 rrddim_set(cg->st_mem, "swap", cg->memory.swap);
2184
2185             rrddim_set(cg->st_mem, "rss_huge", cg->memory.rss_huge);
2186             rrddim_set(cg->st_mem, "mapped_file", cg->memory.mapped_file);
2187             rrdset_done(cg->st_mem);
2188
2189             if(unlikely(!cg->st_writeback)) {
2190                 snprintfz(title, CHART_TITLE_MAX, "Writeback Memory for cgroup %s", cg->chart_title);
2191
2192                 cg->st_writeback = rrdset_create_localhost(
2193                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2194                         , "writeback"
2195                         , NULL
2196                         , "mem"
2197                         , "cgroup.writeback"
2198                         , title
2199                         , "MB"
2200                         , CHART_PRIORITY_CONTAINERS + 300
2201                         , update_every
2202                         , RRDSET_TYPE_AREA
2203                 );
2204
2205                 if(cg->memory.detailed_has_dirty)
2206                     rrddim_add(cg->st_writeback, "dirty", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2207
2208                 rrddim_add(cg->st_writeback, "writeback", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2209             }
2210             else
2211                 rrdset_next(cg->st_writeback);
2212
2213             if(cg->memory.detailed_has_dirty)
2214                 rrddim_set(cg->st_writeback, "dirty", cg->memory.dirty);
2215
2216             rrddim_set(cg->st_writeback, "writeback", cg->memory.writeback);
2217             rrdset_done(cg->st_writeback);
2218
2219             if(unlikely(!cg->st_mem_activity)) {
2220                 snprintfz(title, CHART_TITLE_MAX, "Memory Activity for cgroup %s", cg->chart_title);
2221
2222                 cg->st_mem_activity = rrdset_create_localhost(
2223                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2224                         , "mem_activity"
2225                         , NULL
2226                         , "mem"
2227                         , "cgroup.mem_activity"
2228                         , title
2229                         , "MB/s"
2230                         , CHART_PRIORITY_CONTAINERS + 400
2231                         , update_every
2232                         , RRDSET_TYPE_LINE
2233                 );
2234
2235                 rrddim_add(cg->st_mem_activity, "pgpgin", "in", system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
2236                 rrddim_add(cg->st_mem_activity, "pgpgout", "out", -system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
2237             }
2238             else
2239                 rrdset_next(cg->st_mem_activity);
2240
2241             rrddim_set(cg->st_mem_activity, "pgpgin", cg->memory.pgpgin);
2242             rrddim_set(cg->st_mem_activity, "pgpgout", cg->memory.pgpgout);
2243             rrdset_done(cg->st_mem_activity);
2244
2245             if(unlikely(!cg->st_pgfaults)) {
2246                 snprintfz(title, CHART_TITLE_MAX, "Memory Page Faults for cgroup %s", cg->chart_title);
2247
2248                 cg->st_pgfaults = rrdset_create_localhost(
2249                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2250                         , "pgfaults"
2251                         , NULL
2252                         , "mem"
2253                         , "cgroup.pgfaults"
2254                         , title
2255                         , "MB/s"
2256                         , CHART_PRIORITY_CONTAINERS + 500
2257                         , update_every
2258                         , RRDSET_TYPE_LINE
2259                 );
2260
2261                 rrddim_add(cg->st_pgfaults, "pgfault", NULL, system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
2262                 rrddim_add(cg->st_pgfaults, "pgmajfault", "swap", -system_page_size, 1024 * 1024, RRD_ALGORITHM_INCREMENTAL);
2263             }
2264             else
2265                 rrdset_next(cg->st_pgfaults);
2266
2267             rrddim_set(cg->st_pgfaults, "pgfault", cg->memory.pgfault);
2268             rrddim_set(cg->st_pgfaults, "pgmajfault", cg->memory.pgmajfault);
2269             rrdset_done(cg->st_pgfaults);
2270         }
2271
2272         if(likely(cg->memory.updated_usage_in_bytes && cg->memory.enabled_usage_in_bytes == CONFIG_BOOLEAN_YES)) {
2273             if(unlikely(!cg->st_mem_usage)) {
2274                 snprintfz(title, CHART_TITLE_MAX, "Used Memory %sfor cgroup %s", (cgroup_used_memory_without_cache && cg->memory.updated_detailed)?"without Cache ":"", cg->chart_title);
2275
2276                 cg->st_mem_usage = rrdset_create_localhost(
2277                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2278                         , "mem_usage"
2279                         , NULL
2280                         , "mem"
2281                         , "cgroup.mem_usage"
2282                         , title
2283                         , "MB"
2284                         , CHART_PRIORITY_CONTAINERS + 200
2285                         , update_every
2286                         , RRDSET_TYPE_STACKED
2287                 );
2288
2289                 rrddim_add(cg->st_mem_usage, "ram", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2290                 rrddim_add(cg->st_mem_usage, "swap", NULL, 1, 1024 * 1024, RRD_ALGORITHM_ABSOLUTE);
2291             }
2292             else
2293                 rrdset_next(cg->st_mem_usage);
2294
2295             rrddim_set(cg->st_mem_usage, "ram", cg->memory.usage_in_bytes - ((cgroup_used_memory_without_cache)?cg->memory.cache:0));
2296             rrddim_set(cg->st_mem_usage, "swap", (cg->memory.msw_usage_in_bytes > cg->memory.usage_in_bytes)?cg->memory.msw_usage_in_bytes - cg->memory.usage_in_bytes:0);
2297             rrdset_done(cg->st_mem_usage);
2298         }
2299
2300         if(likely(cg->memory.updated_failcnt && cg->memory.enabled_failcnt == CONFIG_BOOLEAN_YES)) {
2301             if(unlikely(!cg->st_mem_failcnt)) {
2302                 snprintfz(title, CHART_TITLE_MAX, "Memory Limit Failures for cgroup %s", cg->chart_title);
2303
2304                 cg->st_mem_failcnt = rrdset_create_localhost(
2305                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2306                         , "mem_failcnt"
2307                         , NULL
2308                         , "mem"
2309                         , "cgroup.mem_failcnt"
2310                         , title
2311                         , "count"
2312                         , CHART_PRIORITY_CONTAINERS + 250
2313                         , update_every
2314                         , RRDSET_TYPE_LINE
2315                 );
2316
2317                 rrddim_add(cg->st_mem_failcnt, "failures", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
2318             }
2319             else
2320                 rrdset_next(cg->st_mem_failcnt);
2321
2322             rrddim_set(cg->st_mem_failcnt, "failures", cg->memory.failcnt);
2323             rrdset_done(cg->st_mem_failcnt);
2324         }
2325
2326         if(likely(cg->io_service_bytes.updated && cg->io_service_bytes.enabled == CONFIG_BOOLEAN_YES)) {
2327             if(unlikely(!cg->st_io)) {
2328                 snprintfz(title, CHART_TITLE_MAX, "I/O Bandwidth (all disks) for cgroup %s", cg->chart_title);
2329
2330                 cg->st_io = rrdset_create_localhost(
2331                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2332                         , "io"
2333                         , NULL
2334                         , "disk"
2335                         , "cgroup.io"
2336                         , title
2337                         , "KB/s"
2338                         , CHART_PRIORITY_CONTAINERS + 1200
2339                         , update_every
2340                         , RRDSET_TYPE_AREA
2341                 );
2342
2343                 rrddim_add(cg->st_io, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
2344                 rrddim_add(cg->st_io, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
2345             }
2346             else
2347                 rrdset_next(cg->st_io);
2348
2349             rrddim_set(cg->st_io, "read", cg->io_service_bytes.Read);
2350             rrddim_set(cg->st_io, "write", cg->io_service_bytes.Write);
2351             rrdset_done(cg->st_io);
2352         }
2353
2354         if(likely(cg->io_serviced.updated && cg->io_serviced.enabled == CONFIG_BOOLEAN_YES)) {
2355             if(unlikely(!cg->st_serviced_ops)) {
2356                 snprintfz(title, CHART_TITLE_MAX, "Serviced I/O Operations (all disks) for cgroup %s", cg->chart_title);
2357
2358                 cg->st_serviced_ops = rrdset_create_localhost(
2359                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2360                         , "serviced_ops"
2361                         , NULL
2362                         , "disk"
2363                         , "cgroup.serviced_ops"
2364                         , title
2365                         , "operations/s"
2366                         , CHART_PRIORITY_CONTAINERS + 1200
2367                         , update_every
2368                         , RRDSET_TYPE_LINE
2369                 );
2370
2371                 rrddim_add(cg->st_serviced_ops, "read", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
2372                 rrddim_add(cg->st_serviced_ops, "write", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
2373             }
2374             else
2375                 rrdset_next(cg->st_serviced_ops);
2376
2377             rrddim_set(cg->st_serviced_ops, "read", cg->io_serviced.Read);
2378             rrddim_set(cg->st_serviced_ops, "write", cg->io_serviced.Write);
2379             rrdset_done(cg->st_serviced_ops);
2380         }
2381
2382         if(likely(cg->throttle_io_service_bytes.updated && cg->throttle_io_service_bytes.enabled == CONFIG_BOOLEAN_YES)) {
2383             if(unlikely(!cg->st_throttle_io)) {
2384                 snprintfz(title, CHART_TITLE_MAX, "Throttle I/O Bandwidth (all disks) for cgroup %s", cg->chart_title);
2385
2386                 cg->st_throttle_io = rrdset_create_localhost(
2387                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2388                         , "throttle_io"
2389                         , NULL
2390                         , "disk"
2391                         , "cgroup.throttle_io"
2392                         , title
2393                         , "KB/s"
2394                         , CHART_PRIORITY_CONTAINERS + 1200
2395                         , update_every
2396                         , RRDSET_TYPE_AREA
2397                 );
2398
2399                 rrddim_add(cg->st_throttle_io, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
2400                 rrddim_add(cg->st_throttle_io, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
2401             }
2402             else
2403                 rrdset_next(cg->st_throttle_io);
2404
2405             rrddim_set(cg->st_throttle_io, "read", cg->throttle_io_service_bytes.Read);
2406             rrddim_set(cg->st_throttle_io, "write", cg->throttle_io_service_bytes.Write);
2407             rrdset_done(cg->st_throttle_io);
2408         }
2409
2410         if(likely(cg->throttle_io_serviced.updated && cg->throttle_io_serviced.enabled == CONFIG_BOOLEAN_YES)) {
2411             if(unlikely(!cg->st_throttle_serviced_ops)) {
2412                 snprintfz(title, CHART_TITLE_MAX, "Throttle Serviced I/O Operations (all disks) for cgroup %s", cg->chart_title);
2413
2414                 cg->st_throttle_serviced_ops = rrdset_create_localhost(
2415                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2416                         , "throttle_serviced_ops"
2417                         , NULL
2418                         , "disk"
2419                         , "cgroup.throttle_serviced_ops"
2420                         , title
2421                         , "operations/s"
2422                         , CHART_PRIORITY_CONTAINERS + 1200
2423                         , update_every
2424                         , RRDSET_TYPE_LINE
2425                 );
2426
2427                 rrddim_add(cg->st_throttle_serviced_ops, "read", NULL, 1, 1, RRD_ALGORITHM_INCREMENTAL);
2428                 rrddim_add(cg->st_throttle_serviced_ops, "write", NULL, -1, 1, RRD_ALGORITHM_INCREMENTAL);
2429             }
2430             else
2431                 rrdset_next(cg->st_throttle_serviced_ops);
2432
2433             rrddim_set(cg->st_throttle_serviced_ops, "read", cg->throttle_io_serviced.Read);
2434             rrddim_set(cg->st_throttle_serviced_ops, "write", cg->throttle_io_serviced.Write);
2435             rrdset_done(cg->st_throttle_serviced_ops);
2436         }
2437
2438         if(likely(cg->io_queued.updated && cg->io_queued.enabled == CONFIG_BOOLEAN_YES)) {
2439             if(unlikely(!cg->st_queued_ops)) {
2440                 snprintfz(title, CHART_TITLE_MAX, "Queued I/O Operations (all disks) for cgroup %s", cg->chart_title);
2441
2442                 cg->st_queued_ops = rrdset_create_localhost(
2443                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2444                         , "queued_ops"
2445                         , NULL
2446                         , "disk"
2447                         , "cgroup.queued_ops"
2448                         , title
2449                         , "operations"
2450                         , CHART_PRIORITY_CONTAINERS + 2000
2451                         , update_every
2452                         , RRDSET_TYPE_LINE
2453                 );
2454
2455                 rrddim_add(cg->st_queued_ops, "read", NULL, 1, 1, RRD_ALGORITHM_ABSOLUTE);
2456                 rrddim_add(cg->st_queued_ops, "write", NULL, -1, 1, RRD_ALGORITHM_ABSOLUTE);
2457             }
2458             else
2459                 rrdset_next(cg->st_queued_ops);
2460
2461             rrddim_set(cg->st_queued_ops, "read", cg->io_queued.Read);
2462             rrddim_set(cg->st_queued_ops, "write", cg->io_queued.Write);
2463             rrdset_done(cg->st_queued_ops);
2464         }
2465
2466         if(likely(cg->io_merged.updated && cg->io_merged.enabled == CONFIG_BOOLEAN_YES)) {
2467             if(unlikely(!cg->st_merged_ops)) {
2468                 snprintfz(title, CHART_TITLE_MAX, "Merged I/O Operations (all disks) for cgroup %s", cg->chart_title);
2469
2470                 cg->st_merged_ops = rrdset_create_localhost(
2471                         cgroup_chart_type(type, cg->chart_id, RRD_ID_LENGTH_MAX)
2472                         , "merged_ops"
2473                         , NULL
2474                         , "disk"
2475                         , "cgroup.merged_ops"
2476                         , title
2477                         , "operations/s"
2478                         , CHART_PRIORITY_CONTAINERS + 2100
2479                         , update_every
2480                         , RRDSET_TYPE_LINE
2481                 );
2482
2483                 rrddim_add(cg->st_merged_ops, "read", NULL, 1, 1024, RRD_ALGORITHM_INCREMENTAL);
2484                 rrddim_add(cg->st_merged_ops, "write", NULL, -1, 1024, RRD_ALGORITHM_INCREMENTAL);
2485             }
2486             else
2487                 rrdset_next(cg->st_merged_ops);
2488
2489             rrddim_set(cg->st_merged_ops, "read", cg->io_merged.Read);
2490             rrddim_set(cg->st_merged_ops, "write", cg->io_merged.Write);
2491             rrdset_done(cg->st_merged_ops);
2492         }
2493     }
2494
2495     if(likely(cgroup_enable_systemd_services))
2496         update_systemd_services_charts(update_every, services_do_cpu, services_do_mem_usage, services_do_mem_detailed
2497                                        , services_do_mem_failcnt, services_do_swap_usage, services_do_io
2498                                        , services_do_io_ops, services_do_throttle_io, services_do_throttle_ops
2499                                        , services_do_queued_ops, services_do_merged_ops
2500         );
2501
2502     debug(D_CGROUP, "done updating cgroups charts");
2503 }
2504
2505 // ----------------------------------------------------------------------------
2506 // cgroups main
2507
2508 void *cgroups_main(void *ptr) {
2509     struct netdata_static_thread *static_thread = (struct netdata_static_thread *)ptr;
2510
2511     info("CGROUP Plugin thread created with task id %d", gettid());
2512
2513     if(pthread_setcanceltype(PTHREAD_CANCEL_DEFERRED, NULL) != 0)
2514         error("Cannot set pthread cancel type to DEFERRED.");
2515
2516     if(pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, NULL) != 0)
2517         error("Cannot set pthread cancel state to ENABLE.");
2518
2519     struct rusage thread;
2520
2521     // when ZERO, attempt to do it
2522     int vdo_cpu_netdata = config_get_boolean("plugin:cgroups", "cgroups plugin resource charts", 1);
2523
2524     read_cgroup_plugin_configuration();
2525
2526     RRDSET *stcpu_thread = NULL;
2527
2528     heartbeat_t hb;
2529     heartbeat_init(&hb);
2530     usec_t step = cgroup_update_every * USEC_PER_SEC;
2531     usec_t find_every = cgroup_check_for_new_every * USEC_PER_SEC, find_dt = 0;
2532     for(;;) {
2533         usec_t hb_dt = heartbeat_next(&hb, step);
2534         if(unlikely(netdata_exit)) break;
2535
2536         // BEGIN -- the job to be done
2537
2538         find_dt += hb_dt;
2539         if(unlikely(find_dt >= find_every || cgroups_check)) {
2540             find_all_cgroups();
2541             find_dt = 0;
2542             cgroups_check = 0;
2543         }
2544
2545         read_all_cgroups(cgroup_root);
2546         update_cgroup_charts(cgroup_update_every);
2547
2548         // END -- the job is done
2549
2550         // --------------------------------------------------------------------
2551
2552         if(vdo_cpu_netdata) {
2553             getrusage(RUSAGE_THREAD, &thread);
2554
2555             if(unlikely(!stcpu_thread)) {
2556
2557                 stcpu_thread = rrdset_create_localhost(
2558                         "netdata"
2559                         , "plugin_cgroups_cpu"
2560                         , NULL
2561                         , "cgroups"
2562                         , NULL
2563                         , "NetData CGroups Plugin CPU usage"
2564                         , "milliseconds/s"
2565                         , 132000
2566                         , cgroup_update_every
2567                         , RRDSET_TYPE_STACKED
2568                 );
2569
2570                 rrddim_add(stcpu_thread, "user",  NULL,  1, 1000, RRD_ALGORITHM_INCREMENTAL);
2571                 rrddim_add(stcpu_thread, "system", NULL, 1, 1000, RRD_ALGORITHM_INCREMENTAL);
2572             }
2573             else
2574                 rrdset_next(stcpu_thread);
2575
2576             rrddim_set(stcpu_thread, "user"  , thread.ru_utime.tv_sec * 1000000ULL + thread.ru_utime.tv_usec);
2577             rrddim_set(stcpu_thread, "system", thread.ru_stime.tv_sec * 1000000ULL + thread.ru_stime.tv_usec);
2578             rrdset_done(stcpu_thread);
2579         }
2580     }
2581
2582     info("CGROUP thread exiting");
2583
2584     static_thread->enabled = 0;
2585     pthread_exit(NULL);
2586     return NULL;
2587 }