]> arthur.barton.de Git - netdata.git/blob - src/proc_diskstats.c
fixed minor issues throughout the code (mainly types); dashboard has now a watermark...
[netdata.git] / src / proc_diskstats.c
1 #ifdef HAVE_CONFIG_H
2 #include <config.h>
3 #endif
4 #include <stdio.h>
5 #include <stdlib.h>
6 #include <string.h>
7
8 #include "common.h"
9 #include "log.h"
10 #include "appconfig.h"
11 #include "procfile.h"
12 #include "rrd.h"
13 #include "plugin_proc.h"
14
15 #define RRD_TYPE_DISK "disk"
16
17 int do_proc_diskstats(int update_every, unsigned long long dt) {
18         static procfile *ff = NULL;
19         static char path_to_get_hw_sector_size[FILENAME_MAX + 1] = "";
20         static int enable_new_disks = -1;
21         static int do_io = -1, do_ops = -1, do_mops = -1, do_iotime = -1, do_qops = -1, do_util = -1, do_backlog = -1;
22
23         if(enable_new_disks == -1)      enable_new_disks = config_get_boolean_ondemand("plugin:proc:/proc/diskstats", "enable new disks detected at runtime", CONFIG_ONDEMAND_ONDEMAND);
24
25         if(do_io == -1)         do_io           = config_get_boolean_ondemand("plugin:proc:/proc/diskstats", "bandwidth for all disks", CONFIG_ONDEMAND_ONDEMAND);
26         if(do_ops == -1)        do_ops          = config_get_boolean_ondemand("plugin:proc:/proc/diskstats", "operations for all disks", CONFIG_ONDEMAND_ONDEMAND);
27         if(do_mops == -1)       do_mops         = config_get_boolean_ondemand("plugin:proc:/proc/diskstats", "merged operations for all disks", CONFIG_ONDEMAND_ONDEMAND);
28         if(do_iotime == -1)     do_iotime       = config_get_boolean_ondemand("plugin:proc:/proc/diskstats", "i/o time for all disks", CONFIG_ONDEMAND_ONDEMAND);
29         if(do_qops == -1)       do_qops         = config_get_boolean_ondemand("plugin:proc:/proc/diskstats", "queued operations for all disks", CONFIG_ONDEMAND_ONDEMAND);
30         if(do_util == -1)       do_util         = config_get_boolean_ondemand("plugin:proc:/proc/diskstats", "utilization percentage for all disks", CONFIG_ONDEMAND_ONDEMAND);
31         if(do_backlog == -1)do_backlog  = config_get_boolean_ondemand("plugin:proc:/proc/diskstats", "backlog for all disks", CONFIG_ONDEMAND_ONDEMAND);
32
33         if(!ff) {
34                 char filename[FILENAME_MAX + 1];
35                 snprintf(filename, FILENAME_MAX, "%s%s", global_host_prefix, "/proc/diskstats");
36                 ff = procfile_open(config_get("plugin:proc:/proc/diskstats", "filename to monitor", filename), " \t", PROCFILE_FLAG_DEFAULT);
37         }
38         if(!ff) return 1;
39
40         if(!path_to_get_hw_sector_size[0]) {
41                 char filename[FILENAME_MAX + 1];
42                 snprintf(filename, FILENAME_MAX, "%s%s", global_host_prefix, "/sys/block/%s/queue/hw_sector_size");
43                 snprintf(path_to_get_hw_sector_size, FILENAME_MAX, "%s%s", global_host_prefix, config_get("plugin:proc:/proc/diskstats", "path to get h/w sector size", filename));
44         }
45
46         ff = procfile_readall(ff);
47         if(!ff) return 0; // we return 0, so that we will retry to open it next time
48
49         uint32_t lines = procfile_lines(ff), l;
50         uint32_t words;
51
52         for(l = 0; l < lines ;l++) {
53                 char *disk;
54                 unsigned long long      major = 0, minor = 0,
55                                                         reads = 0,  mreads = 0,  readsectors = 0,  readms = 0,
56                                                         writes = 0, mwrites = 0, writesectors = 0, writems = 0,
57                                                         queued_ios = 0, busy_ms = 0, backlog_ms = 0;
58
59                 unsigned long long      last_reads = 0,  last_readsectors = 0,  last_readms = 0,
60                                                         last_writes = 0, last_writesectors = 0, last_writems = 0,
61                                                         last_busy_ms = 0;
62
63                 words = procfile_linewords(ff, l);
64                 if(words < 14) continue;
65
66                 major                   = strtoull(procfile_lineword(ff, l, 0), NULL, 10);
67                 minor                   = strtoull(procfile_lineword(ff, l, 1), NULL, 10);
68                 disk                    = procfile_lineword(ff, l, 2);
69
70                 // # of reads completed # of writes completed
71                 // This is the total number of reads or writes completed successfully.
72                 reads                   = strtoull(procfile_lineword(ff, l, 3), NULL, 10);      // rd_ios
73                 writes                  = strtoull(procfile_lineword(ff, l, 7), NULL, 10);      // wr_ios
74
75                 // # of reads merged # of writes merged
76                 // Reads and writes which are adjacent to each other may be merged for
77             // efficiency.  Thus two 4K reads may become one 8K read before it is
78             // ultimately handed to the disk, and so it will be counted (and queued)
79                 mreads                  = strtoull(procfile_lineword(ff, l, 4), NULL, 10);      // rd_merges_or_rd_sec
80                 mwrites                 = strtoull(procfile_lineword(ff, l, 8), NULL, 10);      // wr_merges
81
82                 // # of sectors read # of sectors written
83                 // This is the total number of sectors read or written successfully.
84                 readsectors     = strtoull(procfile_lineword(ff, l, 5), NULL, 10);      // rd_sec_or_wr_ios
85                 writesectors    = strtoull(procfile_lineword(ff, l, 9), NULL, 10);      // wr_sec
86
87                 // # of milliseconds spent reading # of milliseconds spent writing
88                 // This is the total number of milliseconds spent by all reads or writes (as
89                 // measured from __make_request() to end_that_request_last()).
90                 readms                  = strtoull(procfile_lineword(ff, l, 6), NULL, 10);      // rd_ticks_or_wr_sec
91                 writems                 = strtoull(procfile_lineword(ff, l, 10), NULL, 10);     // wr_ticks
92
93                 // # of I/Os currently in progress
94                 // The only field that should go to zero. Incremented as requests are
95                 // given to appropriate struct request_queue and decremented as they finish.
96                 queued_ios              = strtoull(procfile_lineword(ff, l, 11), NULL, 10);     // ios_pgr
97
98                 // # of milliseconds spent doing I/Os
99                 // This field increases so long as field queued_ios is nonzero.
100                 busy_ms                 = strtoull(procfile_lineword(ff, l, 12), NULL, 10);     // tot_ticks
101
102                 // weighted # of milliseconds spent doing I/Os
103                 // This field is incremented at each I/O start, I/O completion, I/O
104                 // merge, or read of these stats by the number of I/Os in progress
105                 // (field queued_ios) times the number of milliseconds spent doing I/O since the
106                 // last update of this field.  This can provide an easy measure of both
107                 // I/O completion time and the backlog that may be accumulating.
108                 backlog_ms              = strtoull(procfile_lineword(ff, l, 13), NULL, 10);     // rq_ticks
109
110
111                 int def_enabled = 0;
112
113                 // remove slashes from disk names
114                 char *s;
115                 for(s = disk; *s ;s++) if(*s == '/') *s = '_';
116
117                 switch(major) {
118                         case 9: // MDs
119                         case 43: // network block
120                         case 144: // nfs
121                         case 145: // nfs
122                         case 146: // nfs
123                         case 199: // veritas
124                         case 201: // veritas
125                         case 251: // dm
126                                 def_enabled = enable_new_disks;
127                                 break;
128
129                         case 48: // RAID
130                         case 49: // RAID
131                         case 50: // RAID
132                         case 51: // RAID
133                         case 52: // RAID
134                         case 53: // RAID
135                         case 54: // RAID
136                         case 55: // RAID
137                         case 112: // RAID
138                         case 136: // RAID
139                         case 137: // RAID
140                         case 138: // RAID
141                         case 139: // RAID
142                         case 140: // RAID
143                         case 141: // RAID
144                         case 142: // RAID
145                         case 143: // RAID
146                         case 179: // MMC
147                         case 180: // USB
148                                 if(minor % 8) def_enabled = 0; // partitions
149                                 else def_enabled = enable_new_disks;
150                                 break;
151
152                         case 8: // scsi disks
153                         case 65: // scsi disks
154                         case 66: // scsi disks
155                         case 67: // scsi disks
156                         case 68: // scsi disks
157                         case 69: // scsi disks
158                         case 70: // scsi disks
159                         case 71: // scsi disks
160                         case 72: // scsi disks
161                         case 73: // scsi disks
162                         case 74: // scsi disks
163                         case 75: // scsi disks
164                         case 76: // scsi disks
165                         case 77: // scsi disks
166                         case 78: // scsi disks
167                         case 79: // scsi disks
168                         case 80: // i2o
169                         case 81: // i2o
170                         case 82: // i2o
171                         case 83: // i2o
172                         case 84: // i2o
173                         case 85: // i2o
174                         case 86: // i2o
175                         case 87: // i2o
176                         case 101: // hyperdisk
177                         case 102: // compressed
178                         case 104: // scsi
179                         case 105: // scsi
180                         case 106: // scsi
181                         case 107: // scsi
182                         case 108: // scsi
183                         case 109: // scsi
184                         case 110: // scsi
185                         case 111: // scsi
186                         case 114: // bios raid
187                         case 116: // ram board
188                         case 128: // scsi
189                         case 129: // scsi
190                         case 130: // scsi
191                         case 131: // scsi
192                         case 132: // scsi
193                         case 133: // scsi
194                         case 134: // scsi
195                         case 135: // scsi
196                         case 153: // raid
197                         case 202: // xen
198                         case 256: // flash
199                         case 257: // flash
200                                 if(minor % 16) def_enabled = 0; // partitions
201                                 else def_enabled = enable_new_disks;
202                                 break;
203
204                         case 160: // raid
205                         case 161: // raid
206                                 if(minor % 32) def_enabled = 0; // partitions
207                                 else def_enabled = enable_new_disks;
208                                 break;
209
210                         case 3: // ide
211                         case 13: // 8bit ide
212                         case 22: // ide
213                         case 33: // ide
214                         case 34: // ide
215                         case 56: // ide
216                         case 57: // ide
217                         case 88: // ide
218                         case 89: // ide
219                         case 90: // ide
220                         case 91: // ide
221                                 if(minor % 64) def_enabled = 0; // partitions
222                                 else def_enabled = enable_new_disks;
223                                 break;
224
225                         case 252: // zram
226                                 def_enabled = 0;
227                                 break;
228
229                         default:
230                                 def_enabled = 0;
231                                 break;
232                 }
233
234                 int ddo_io = do_io, ddo_ops = do_ops, ddo_mops = do_mops, ddo_iotime = do_iotime, ddo_qops = do_qops, ddo_util = do_util, ddo_backlog = do_backlog;
235
236                 // check which charts are enabled for this disk
237                 {
238                         char var_name[4096 + 1];
239                         snprintf(var_name, 4096, "plugin:proc:/proc/diskstats:%s", disk);
240                         def_enabled = config_get_boolean_ondemand(var_name, "enabled", def_enabled);
241                         if(def_enabled == CONFIG_ONDEMAND_NO) continue;
242                         if(def_enabled == CONFIG_ONDEMAND_ONDEMAND && !reads && !writes) continue;
243
244
245                         ddo_io          = config_get_boolean_ondemand(var_name, "bandwidth", ddo_io);
246                         ddo_ops         = config_get_boolean_ondemand(var_name, "operations", ddo_ops);
247                         ddo_mops        = config_get_boolean_ondemand(var_name, "merged operations", ddo_mops);
248                         ddo_iotime      = config_get_boolean_ondemand(var_name, "i/o time", ddo_iotime);
249                         ddo_qops        = config_get_boolean_ondemand(var_name, "queued operations", ddo_qops);
250                         ddo_util        = config_get_boolean_ondemand(var_name, "utilization percentage", ddo_util);
251                         ddo_backlog = config_get_boolean_ondemand(var_name, "backlog", ddo_backlog);
252
253                         // by default, do not add charts that do not have values
254                         if(ddo_io == CONFIG_ONDEMAND_ONDEMAND && !reads && !writes) ddo_io = 0;
255                         if(ddo_mops == CONFIG_ONDEMAND_ONDEMAND && mreads == 0 && mwrites == 0) ddo_mops = 0;
256                         if(ddo_iotime == CONFIG_ONDEMAND_ONDEMAND && readms == 0 && writems == 0) ddo_iotime = 0;
257                         if(ddo_util == CONFIG_ONDEMAND_ONDEMAND && busy_ms == 0) ddo_util = 0;
258                         if(ddo_backlog == CONFIG_ONDEMAND_ONDEMAND && backlog_ms == 0) ddo_backlog = 0;
259                         if(ddo_qops == CONFIG_ONDEMAND_ONDEMAND && backlog_ms == 0) ddo_qops = 0;
260
261                         // for absolute values, we need to switch the setting to 'yes'
262                         // to allow it refresh from now on
263                         if(ddo_qops == CONFIG_ONDEMAND_ONDEMAND) config_set(var_name, "queued operations", "yes");
264                 }
265
266                 RRDSET *st;
267
268                 // --------------------------------------------------------------------
269
270                 int sector_size = 512;
271                 if(ddo_io) {
272                         st = rrdset_find_bytype(RRD_TYPE_DISK, disk);
273                         if(!st) {
274                                 char tf[FILENAME_MAX + 1], *t;
275                                 char ssfilename[FILENAME_MAX + 1];
276
277                                 strncpy(tf, disk, FILENAME_MAX);
278                                 tf[FILENAME_MAX] = '\0';
279
280                                 // replace all / with !
281                                 while((t = strchr(tf, '/'))) *t = '!';
282
283                                 snprintf(ssfilename, FILENAME_MAX, path_to_get_hw_sector_size, tf);
284                                 FILE *fpss = fopen(ssfilename, "r");
285                                 if(fpss) {
286                                         char ssbuffer[1025];
287                                         char *tmp = fgets(ssbuffer, 1024, fpss);
288
289                                         if(tmp) {
290                                                 sector_size = atoi(tmp);
291                                                 if(sector_size <= 0) {
292                                                         error("Invalid sector size %d for device %s in %s. Assuming 512.", sector_size, disk, ssfilename);
293                                                         sector_size = 512;
294                                                 }
295                                         }
296                                         else error("Cannot read data for sector size for device %s from %s. Assuming 512.", disk, ssfilename);
297
298                                         fclose(fpss);
299                                 }
300                                 else error("Cannot read sector size for device %s from %s. Assuming 512.", disk, ssfilename);
301
302                                 st = rrdset_create(RRD_TYPE_DISK, disk, NULL, disk, "Disk I/O Bandwidth", "kilobytes/s", 2000, update_every, RRDSET_TYPE_AREA);
303
304                                 rrddim_add(st, "reads", NULL, sector_size, 1024, RRDDIM_INCREMENTAL);
305                                 rrddim_add(st, "writes", NULL, sector_size * -1, 1024, RRDDIM_INCREMENTAL);
306                         }
307                         else rrdset_next_usec(st, dt);
308
309                         last_readsectors  = rrddim_set(st, "reads", readsectors);
310                         last_writesectors = rrddim_set(st, "writes", writesectors);
311                         rrdset_done(st);
312                 }
313
314                 // --------------------------------------------------------------------
315
316                 if(ddo_ops) {
317                         st = rrdset_find_bytype("disk_ops", disk);
318                         if(!st) {
319                                 st = rrdset_create("disk_ops", disk, NULL, disk, "Disk Completed I/O Operations", "operations/s", 2001, update_every, RRDSET_TYPE_LINE);
320                                 st->isdetail = 1;
321
322                                 rrddim_add(st, "reads", NULL, 1, 1, RRDDIM_INCREMENTAL);
323                                 rrddim_add(st, "writes", NULL, -1, 1, RRDDIM_INCREMENTAL);
324                         }
325                         else rrdset_next_usec(st, dt);
326
327                         last_reads  = rrddim_set(st, "reads", reads);
328                         last_writes = rrddim_set(st, "writes", writes);
329                         rrdset_done(st);
330                 }
331
332                 // --------------------------------------------------------------------
333
334                 if(ddo_qops) {
335                         st = rrdset_find_bytype("disk_qops", disk);
336                         if(!st) {
337                                 st = rrdset_create("disk_qops", disk, NULL, disk, "Disk Queued I/O Operations", "operations", 2002, update_every, RRDSET_TYPE_LINE);
338                                 st->isdetail = 1;
339
340                                 rrddim_add(st, "operations", NULL, 1, 1, RRDDIM_ABSOLUTE);
341                         }
342                         else rrdset_next_usec(st, dt);
343
344                         rrddim_set(st, "operations", queued_ios);
345                         rrdset_done(st);
346                 }
347
348                 // --------------------------------------------------------------------
349
350                 if(ddo_backlog) {
351                         st = rrdset_find_bytype("disk_backlog", disk);
352                         if(!st) {
353                                 st = rrdset_create("disk_backlog", disk, NULL, disk, "Disk Backlog", "backlog (ms)", 2003, update_every, RRDSET_TYPE_AREA);
354                                 st->isdetail = 1;
355
356                                 rrddim_add(st, "backlog", NULL, 1, 10, RRDDIM_INCREMENTAL);
357                         }
358                         else rrdset_next_usec(st, dt);
359
360                         rrddim_set(st, "backlog", backlog_ms);
361                         rrdset_done(st);
362                 }
363
364                 // --------------------------------------------------------------------
365
366                 if(ddo_util) {
367                         st = rrdset_find_bytype("disk_util", disk);
368                         if(!st) {
369                                 st = rrdset_create("disk_util", disk, NULL, disk, "Disk Utilization Time", "% of time working", 2004, update_every, RRDSET_TYPE_AREA);
370                                 st->isdetail = 1;
371
372                                 rrddim_add(st, "utilization", NULL, 1, 10, RRDDIM_INCREMENTAL);
373                         }
374                         else rrdset_next_usec(st, dt);
375
376                         last_busy_ms = rrddim_set(st, "utilization", busy_ms);
377                         rrdset_done(st);
378                 }
379
380                 // --------------------------------------------------------------------
381
382                 if(ddo_mops) {
383                         st = rrdset_find_bytype("disk_mops", disk);
384                         if(!st) {
385                                 st = rrdset_create("disk_mops", disk, NULL, disk, "Disk Merged Operations", "merged operations/s", 2021, update_every, RRDSET_TYPE_LINE);
386                                 st->isdetail = 1;
387
388                                 rrddim_add(st, "reads", NULL, 1, 1, RRDDIM_INCREMENTAL);
389                                 rrddim_add(st, "writes", NULL, -1, 1, RRDDIM_INCREMENTAL);
390                         }
391                         else rrdset_next_usec(st, dt);
392
393                         rrddim_set(st, "reads", mreads);
394                         rrddim_set(st, "writes", mwrites);
395                         rrdset_done(st);
396                 }
397
398                 // --------------------------------------------------------------------
399
400                 if(ddo_iotime) {
401                         st = rrdset_find_bytype("disk_iotime", disk);
402                         if(!st) {
403                                 st = rrdset_create("disk_iotime", disk, NULL, disk, "Disk Total I/O Time", "milliseconds/s", 2022, update_every, RRDSET_TYPE_LINE);
404                                 st->isdetail = 1;
405
406                                 rrddim_add(st, "reads", NULL, 1, 1, RRDDIM_INCREMENTAL);
407                                 rrddim_add(st, "writes", NULL, -1, 1, RRDDIM_INCREMENTAL);
408                         }
409                         else rrdset_next_usec(st, dt);
410
411                         last_readms  = rrddim_set(st, "reads", readms);
412                         last_writems = rrddim_set(st, "writes", writems);
413                         rrdset_done(st);
414                 }
415
416                 // --------------------------------------------------------------------
417                 // calculate differential charts
418                 // only if this is not the first time we run
419
420                 if(dt) {
421                         if(ddo_iotime && ddo_ops) {
422                                 st = rrdset_find_bytype("disk_await", disk);
423                                 if(!st) {
424                                         st = rrdset_create("disk_await", disk, NULL, disk, "Average Completed I/O Operation Time", "ms per operation", 2005, update_every, RRDSET_TYPE_LINE);
425                                         st->isdetail = 1;
426
427                                         rrddim_add(st, "reads", NULL, 1, 1, RRDDIM_ABSOLUTE);
428                                         rrddim_add(st, "writes", NULL, -1, 1, RRDDIM_ABSOLUTE);
429                                 }
430                                 else rrdset_next_usec(st, dt);
431
432                                 rrddim_set(st, "reads", (reads - last_reads) ? (readms - last_readms) / (reads - last_reads) : 0);
433                                 rrddim_set(st, "writes", (writes - last_writes) ? (writems - last_writems) / (writes - last_writes) : 0);
434                                 rrdset_done(st);
435                         }
436
437                         if(ddo_io && ddo_ops) {
438                                 st = rrdset_find_bytype("disk_avgsz", disk);
439                                 if(!st) {
440                                         st = rrdset_create("disk_avgsz", disk, NULL, disk, "Average Completed I/O Operation Bandwidth", "kilobytes per operation", 2006, update_every, RRDSET_TYPE_AREA);
441                                         st->isdetail = 1;
442
443                                         rrddim_add(st, "reads", NULL, sector_size, 1024, RRDDIM_ABSOLUTE);
444                                         rrddim_add(st, "writes", NULL, -sector_size, 1024, RRDDIM_ABSOLUTE);
445                                 }
446                                 else rrdset_next_usec(st, dt);
447
448                                 rrddim_set(st, "reads", (reads - last_reads) ? (readsectors - last_readsectors) / (reads - last_reads) : 0);
449                                 rrddim_set(st, "writes", (writes - last_writes) ? (writesectors - last_writesectors) / (writes - last_writes) : 0);
450                                 rrdset_done(st);
451                         }
452
453                         if(ddo_util && ddo_ops) {
454                                 st = rrdset_find_bytype("disk_svctm", disk);
455                                 if(!st) {
456                                         st = rrdset_create("disk_svctm", disk, NULL, disk, "Average Service Time", "ms per operation", 2007, update_every, RRDSET_TYPE_LINE);
457                                         st->isdetail = 1;
458
459                                         rrddim_add(st, "svctm", NULL, 1, 1, RRDDIM_ABSOLUTE);
460                                 }
461                                 else rrdset_next_usec(st, dt);
462
463                                 rrddim_set(st, "svctm", ((reads - last_reads) + (writes - last_writes)) ? (busy_ms - last_busy_ms) / ((reads - last_reads) + (writes - last_writes)) : 0);
464                                 rrdset_done(st);
465                         }
466                 }
467         }
468
469         return 0;
470 }