]> arthur.barton.de Git - netdata.git/blob - src/proc_diskstats.c
e7a84162c7426e2f528fc2713ff79c4bdcb08bb5
[netdata.git] / src / proc_diskstats.c
1 #include <inttypes.h>
2 #include <stdio.h>
3 #include <stdlib.h>
4 #include <string.h>
5
6 #include "common.h"
7 #include "log.h"
8 #include "config.h"
9 #include "procfile.h"
10 #include "rrd.h"
11 #include "plugin_proc.h"
12
// chart type (family prefix) used for the per-disk bandwidth charts
#define RRD_TYPE_DISK                           "disk"
// length of RRD_TYPE_DISK without the terminating NUL; computed at compile
// time, so it is a constant expression and needs no strlen() call per use
#define RRD_TYPE_DISK_LEN                       (sizeof(RRD_TYPE_DISK) - 1)

// upper bound for the length of a single /proc/diskstats line
#define MAX_PROC_DISKSTATS_LINE 4096
17
18 int do_proc_diskstats(int update_every, unsigned long long dt) {
19         static procfile *ff = NULL;
20         static char path_to_get_hw_sector_size[FILENAME_MAX + 1] = "";
21         static int enable_new_disks = -1;
22         static int do_io = -1, do_ops = -1, do_mops = -1, do_iotime = -1, do_qops = -1, do_util = -1, do_backlog = -1;
23
24         if(enable_new_disks == -1)      enable_new_disks = config_get_boolean("plugin:proc:/proc/diskstats", "enable new disks detected at runtime", 1);
25
26         if(do_io == -1)         do_io           = config_get_boolean("plugin:proc:/proc/diskstats", "bandwidth for all disks", 1);
27         if(do_ops == -1)        do_ops          = config_get_boolean("plugin:proc:/proc/diskstats", "operations for all disks", 1);
28         if(do_mops == -1)       do_mops         = config_get_boolean("plugin:proc:/proc/diskstats", "merged operations for all disks", 1);
29         if(do_iotime == -1)     do_iotime       = config_get_boolean("plugin:proc:/proc/diskstats", "i/o time for all disks", 1);
30         if(do_qops == -1)       do_qops         = config_get_boolean("plugin:proc:/proc/diskstats", "queued operations for all disks", 1);
31         if(do_util == -1)       do_util         = config_get_boolean("plugin:proc:/proc/diskstats", "utilization percentage for all disks", 1);
32         if(do_backlog == -1)do_backlog  = config_get_boolean("plugin:proc:/proc/diskstats", "backlog for all disks", 1);
33
34         if(!ff) {
35                 char filename[FILENAME_MAX + 1];
36                 snprintf(filename, FILENAME_MAX, "%s%s", global_host_prefix, "/proc/diskstats");
37                 ff = procfile_open(config_get("plugin:proc:/proc/diskstats", "filename to monitor", filename), " \t", PROCFILE_FLAG_DEFAULT);
38         }
39         if(!ff) return 1;
40
41         if(!path_to_get_hw_sector_size[0]) {
42                 char filename[FILENAME_MAX + 1];
43                 snprintf(filename, FILENAME_MAX, "%s%s", global_host_prefix, "/sys/block/%s/queue/hw_sector_size");
44                 snprintf(path_to_get_hw_sector_size, FILENAME_MAX, "%s%s", global_host_prefix, config_get("plugin:proc:/proc/diskstats", "path to get h/w sector size", filename));
45         }
46
47         ff = procfile_readall(ff);
48         if(!ff) return 0; // we return 0, so that we will retry to open it next time
49
50         uint32_t lines = procfile_lines(ff), l;
51         uint32_t words;
52
53         for(l = 0; l < lines ;l++) {
54                 char *disk;
55                 unsigned long long      major = 0, minor = 0,
56                                                         reads = 0,  mreads = 0,  readsectors = 0,  readms = 0,
57                                                         writes = 0, mwrites = 0, writesectors = 0, writems = 0,
58                                                         queued_ios = 0, busy_ms = 0, backlog_ms = 0;
59
60                 unsigned long long      last_reads = 0,  last_readsectors = 0,  last_readms = 0,
61                                                         last_writes = 0, last_writesectors = 0, last_writems = 0,
62                                                         last_busy_ms = 0;
63
64                 words = procfile_linewords(ff, l);
65                 if(words < 14) continue;
66
67                 major                   = strtoull(procfile_lineword(ff, l, 0), NULL, 10);
68                 minor                   = strtoull(procfile_lineword(ff, l, 1), NULL, 10);
69                 disk                    = procfile_lineword(ff, l, 2);
70
71                 // # of reads completed # of writes completed
72                 // This is the total number of reads or writes completed successfully.
73                 reads                   = strtoull(procfile_lineword(ff, l, 3), NULL, 10);      // rd_ios
74                 writes                  = strtoull(procfile_lineword(ff, l, 7), NULL, 10);      // wr_ios
75
76                 // # of reads merged # of writes merged
77                 // Reads and writes which are adjacent to each other may be merged for
78             // efficiency.  Thus two 4K reads may become one 8K read before it is
79             // ultimately handed to the disk, and so it will be counted (and queued)
80                 mreads                  = strtoull(procfile_lineword(ff, l, 4), NULL, 10);      // rd_merges_or_rd_sec
81                 mwrites                 = strtoull(procfile_lineword(ff, l, 8), NULL, 10);      // wr_merges
82
83                 // # of sectors read # of sectors written
84                 // This is the total number of sectors read or written successfully.
85                 readsectors     = strtoull(procfile_lineword(ff, l, 5), NULL, 10);      // rd_sec_or_wr_ios
86                 writesectors    = strtoull(procfile_lineword(ff, l, 9), NULL, 10);      // wr_sec
87
88                 // # of milliseconds spent reading # of milliseconds spent writing
89                 // This is the total number of milliseconds spent by all reads or writes (as
90                 // measured from __make_request() to end_that_request_last()).
91                 readms                  = strtoull(procfile_lineword(ff, l, 6), NULL, 10);      // rd_ticks_or_wr_sec
92                 writems                 = strtoull(procfile_lineword(ff, l, 10), NULL, 10);     // wr_ticks
93
94                 // # of I/Os currently in progress
95                 // The only field that should go to zero. Incremented as requests are
96                 // given to appropriate struct request_queue and decremented as they finish.
97                 queued_ios              = strtoull(procfile_lineword(ff, l, 11), NULL, 10);     // ios_pgr
98
99                 // # of milliseconds spent doing I/Os
100                 // This field increases so long as field queued_ios is nonzero.
101                 busy_ms                 = strtoull(procfile_lineword(ff, l, 12), NULL, 10);     // tot_ticks
102
103                 // weighted # of milliseconds spent doing I/Os
104                 // This field is incremented at each I/O start, I/O completion, I/O
105                 // merge, or read of these stats by the number of I/Os in progress
106                 // (field queued_ios) times the number of milliseconds spent doing I/O since the
107                 // last update of this field.  This can provide an easy measure of both
108                 // I/O completion time and the backlog that may be accumulating.
109                 backlog_ms              = strtoull(procfile_lineword(ff, l, 13), NULL, 10);     // rq_ticks
110
111                 int def_enabled = 0;
112
113                 // remove slashes from disk names
114                 char *s;
115                 for(s = disk; *s ;s++) if(*s == '/') *s = '_';
116
117                 switch(major) {
118                         case 9: // MDs
119                         case 43: // network block
120                         case 144: // nfs
121                         case 145: // nfs
122                         case 146: // nfs
123                         case 199: // veritas
124                         case 201: // veritas
125                         case 251: // dm
126                                 def_enabled = enable_new_disks;
127                                 break;
128
129                         case 48: // RAID
130                         case 49: // RAID
131                         case 50: // RAID
132                         case 51: // RAID
133                         case 52: // RAID
134                         case 53: // RAID
135                         case 54: // RAID
136                         case 55: // RAID
137                         case 112: // RAID
138                         case 136: // RAID
139                         case 137: // RAID
140                         case 138: // RAID
141                         case 139: // RAID
142                         case 140: // RAID
143                         case 141: // RAID
144                         case 142: // RAID
145                         case 143: // RAID
146                         case 179: // MMC
147                         case 180: // USB
148                                 if(minor % 8) def_enabled = 0; // partitions
149                                 else def_enabled = enable_new_disks;
150                                 break;
151
152                         case 8: // scsi disks
153                         case 65: // scsi disks
154                         case 66: // scsi disks
155                         case 67: // scsi disks
156                         case 68: // scsi disks
157                         case 69: // scsi disks
158                         case 70: // scsi disks
159                         case 71: // scsi disks
160                         case 72: // scsi disks
161                         case 73: // scsi disks
162                         case 74: // scsi disks
163                         case 75: // scsi disks
164                         case 76: // scsi disks
165                         case 77: // scsi disks
166                         case 78: // scsi disks
167                         case 79: // scsi disks
168                         case 80: // i2o
169                         case 81: // i2o
170                         case 82: // i2o
171                         case 83: // i2o
172                         case 84: // i2o
173                         case 85: // i2o
174                         case 86: // i2o
175                         case 87: // i2o
176                         case 101: // hyperdisk
177                         case 102: // compressed
178                         case 104: // scsi
179                         case 105: // scsi
180                         case 106: // scsi
181                         case 107: // scsi
182                         case 108: // scsi
183                         case 109: // scsi
184                         case 110: // scsi
185                         case 111: // scsi
186                         case 114: // bios raid
187                         case 116: // ram board
188                         case 128: // scsi
189                         case 129: // scsi
190                         case 130: // scsi
191                         case 131: // scsi
192                         case 132: // scsi
193                         case 133: // scsi
194                         case 134: // scsi
195                         case 135: // scsi
196                         case 153: // raid
197                         case 202: // xen
198                         case 256: // flash
199                         case 257: // flash
200                                 if(minor % 16) def_enabled = 0; // partitions
201                                 else def_enabled = enable_new_disks;
202                                 break;
203
204                         case 160: // raid
205                         case 161: // raid
206                                 if(minor % 32) def_enabled = 0; // partitions
207                                 else def_enabled = enable_new_disks;
208                                 break;
209
210                         case 3: // ide
211                         case 13: // 8bit ide
212                         case 22: // ide
213                         case 33: // ide
214                         case 34: // ide
215                         case 56: // ide
216                         case 57: // ide
217                         case 88: // ide
218                         case 89: // ide
219                         case 90: // ide
220                         case 91: // ide
221                                 if(minor % 64) def_enabled = 0; // partitions
222                                 else def_enabled = enable_new_disks;
223                                 break;
224
225                         default:
226                                 def_enabled = 0;
227                                 break;
228                 }
229
230                 // check if it is enabled
231                 {
232                         char var_name[4096 + 1];
233                         snprintf(var_name, 4096, "disk %s", disk);
234                         if(!config_get_boolean("plugin:proc:/proc/diskstats", var_name, def_enabled)) continue;
235                 }
236
237                 RRDSET *st;
238
239                 // --------------------------------------------------------------------
240
241                 int sector_size = 512;
242                 if(do_io) {
243                         st = rrdset_find_bytype(RRD_TYPE_DISK, disk);
244                         if(!st) {
245                                 char tf[FILENAME_MAX + 1], *t;
246                                 char ssfilename[FILENAME_MAX + 1];
247
248                                 strncpy(tf, disk, FILENAME_MAX);
249                                 tf[FILENAME_MAX] = '\0';
250
251                                 // replace all / with !
252                                 while((t = strchr(tf, '/'))) *t = '!';
253
254                                 snprintf(ssfilename, FILENAME_MAX, path_to_get_hw_sector_size, tf);
255                                 FILE *fpss = fopen(ssfilename, "r");
256                                 if(fpss) {
257                                         char ssbuffer[1025];
258                                         char *tmp = fgets(ssbuffer, 1024, fpss);
259
260                                         if(tmp) {
261                                                 sector_size = atoi(tmp);
262                                                 if(sector_size <= 0) {
263                                                         error("Invalid sector size %d for device %s in %s. Assuming 512.", sector_size, disk, ssfilename);
264                                                         sector_size = 512;
265                                                 }
266                                         }
267                                         else error("Cannot read data for sector size for device %s from %s. Assuming 512.", disk, ssfilename);
268
269                                         fclose(fpss);
270                                 }
271                                 else error("Cannot read sector size for device %s from %s. Assuming 512.", disk, ssfilename);
272
273                                 st = rrdset_create(RRD_TYPE_DISK, disk, NULL, disk, "Disk I/O Bandwidth", "kilobytes/s", 2000, update_every, RRDSET_TYPE_AREA);
274
275                                 rrddim_add(st, "reads", NULL, sector_size, 1024 * update_every, RRDDIM_INCREMENTAL);
276                                 rrddim_add(st, "writes", NULL, sector_size * -1, 1024 * update_every, RRDDIM_INCREMENTAL);
277                         }
278                         else rrdset_next_usec(st, dt);
279
280                         last_readsectors  = rrddim_set(st, "reads", readsectors);
281                         last_writesectors = rrddim_set(st, "writes", writesectors);
282                         rrdset_done(st);
283                 }
284
285                 // --------------------------------------------------------------------
286
287                 if(do_ops) {
288                         st = rrdset_find_bytype("disk_ops", disk);
289                         if(!st) {
290                                 st = rrdset_create("disk_ops", disk, NULL, disk, "Disk Completed I/O Operations", "operations/s", 2001, update_every, RRDSET_TYPE_LINE);
291                                 st->isdetail = 1;
292
293                                 rrddim_add(st, "reads", NULL, 1, 1 * update_every, RRDDIM_INCREMENTAL);
294                                 rrddim_add(st, "writes", NULL, -1, 1 * update_every, RRDDIM_INCREMENTAL);
295                         }
296                         else rrdset_next_usec(st, dt);
297
298                         last_reads  = rrddim_set(st, "reads", reads);
299                         last_writes = rrddim_set(st, "writes", writes);
300                         rrdset_done(st);
301                 }
302
303                 // --------------------------------------------------------------------
304
305                 if(do_qops) {
306                         st = rrdset_find_bytype("disk_qops", disk);
307                         if(!st) {
308                                 st = rrdset_create("disk_qops", disk, NULL, disk, "Disk Queued I/O Operations", "operations", 2002, update_every, RRDSET_TYPE_LINE);
309                                 st->isdetail = 1;
310
311                                 rrddim_add(st, "operations", NULL, 1, 1, RRDDIM_ABSOLUTE);
312                         }
313                         else rrdset_next_usec(st, dt);
314
315                         rrddim_set(st, "operations", queued_ios);
316                         rrdset_done(st);
317                 }
318
319                 // --------------------------------------------------------------------
320
321                 if(do_backlog) {
322                         st = rrdset_find_bytype("disk_backlog", disk);
323                         if(!st) {
324                                 st = rrdset_create("disk_backlog", disk, NULL, disk, "Disk Backlog", "backlog (ms)", 2003, update_every, RRDSET_TYPE_AREA);
325                                 st->isdetail = 1;
326
327                                 rrddim_add(st, "backlog", NULL, 1, 10 * update_every, RRDDIM_INCREMENTAL);
328                         }
329                         else rrdset_next_usec(st, dt);
330
331                         rrddim_set(st, "backlog", backlog_ms);
332                         rrdset_done(st);
333                 }
334
335                 // --------------------------------------------------------------------
336
337                 if(do_util) {
338                         st = rrdset_find_bytype("disk_util", disk);
339                         if(!st) {
340                                 st = rrdset_create("disk_util", disk, NULL, disk, "Disk Utilization Time", "% of time working", 2004, update_every, RRDSET_TYPE_AREA);
341                                 st->isdetail = 1;
342
343                                 rrddim_add(st, "utilization", NULL, 1, 10 * update_every, RRDDIM_INCREMENTAL);
344                         }
345                         else rrdset_next_usec(st, dt);
346
347                         last_busy_ms = rrddim_set(st, "utilization", busy_ms);
348                         rrdset_done(st);
349                 }
350
351                 // --------------------------------------------------------------------
352
353                 if(do_mops) {
354                         st = rrdset_find_bytype("disk_mops", disk);
355                         if(!st) {
356                                 st = rrdset_create("disk_mops", disk, NULL, disk, "Disk Merged Operations", "merged operations/s", 2021, update_every, RRDSET_TYPE_LINE);
357                                 st->isdetail = 1;
358
359                                 rrddim_add(st, "reads", NULL, 1, 1 * update_every, RRDDIM_INCREMENTAL);
360                                 rrddim_add(st, "writes", NULL, -1, 1 * update_every, RRDDIM_INCREMENTAL);
361                         }
362                         else rrdset_next_usec(st, dt);
363
364                         rrddim_set(st, "reads", mreads);
365                         rrddim_set(st, "writes", mwrites);
366                         rrdset_done(st);
367                 }
368
369                 // --------------------------------------------------------------------
370
371                 if(do_iotime) {
372                         st = rrdset_find_bytype("disk_iotime", disk);
373                         if(!st) {
374                                 st = rrdset_create("disk_iotime", disk, NULL, disk, "Disk Total I/O Time", "milliseconds/s", 2022, update_every, RRDSET_TYPE_LINE);
375                                 st->isdetail = 1;
376
377                                 rrddim_add(st, "reads", NULL, 1, 1 * update_every, RRDDIM_INCREMENTAL);
378                                 rrddim_add(st, "writes", NULL, -1, 1 * update_every, RRDDIM_INCREMENTAL);
379                         }
380                         else rrdset_next_usec(st, dt);
381
382                         last_readms  = rrddim_set(st, "reads", readms);
383                         last_writems = rrddim_set(st, "writes", writems);
384                         rrdset_done(st);
385                 }
386
387                 // --------------------------------------------------------------------
388                 // calculate differential charts
389                 // only if this is not the first time we run
390
391                 if(dt) {
392                         if(do_iotime && do_ops) {
393                                 st = rrdset_find_bytype("disk_await", disk);
394                                 if(!st) {
395                                         st = rrdset_create("disk_await", disk, NULL, disk, "Average Completed I/O Operation Time", "ms per operation", 2005, update_every, RRDSET_TYPE_LINE);
396                                         st->isdetail = 1;
397
398                                         rrddim_add(st, "reads", NULL, 1, 1, RRDDIM_ABSOLUTE);
399                                         rrddim_add(st, "writes", NULL, -1, 1, RRDDIM_ABSOLUTE);
400                                 }
401                                 else rrdset_next_usec(st, dt);
402
403                                 rrddim_set(st, "reads", (reads - last_reads) ? (readms - last_readms) / (reads - last_reads) : 0);
404                                 rrddim_set(st, "writes", (writes - last_writes) ? (writems - last_writems) / (writes - last_writes) : 0);
405                                 rrdset_done(st);
406                         }
407
408                         if(do_io && do_ops) {
409                                 st = rrdset_find_bytype("disk_avgsz", disk);
410                                 if(!st) {
411                                         st = rrdset_create("disk_avgsz", disk, NULL, disk, "Average Completed I/O Operation Bandwidth", "kilobytes per operation", 2006, update_every, RRDSET_TYPE_AREA);
412                                         st->isdetail = 1;
413
414                                         rrddim_add(st, "reads", NULL, sector_size, 1024, RRDDIM_ABSOLUTE);
415                                         rrddim_add(st, "writes", NULL, -sector_size, 1024, RRDDIM_ABSOLUTE);
416                                 }
417                                 else rrdset_next_usec(st, dt);
418
419                                 rrddim_set(st, "reads", (reads - last_reads) ? (readsectors - last_readsectors) / (reads - last_reads) : 0);
420                                 rrddim_set(st, "writes", (writes - last_writes) ? (writesectors - last_writesectors) / (writes - last_writes) : 0);
421                                 rrdset_done(st);
422                         }
423
424                         if(do_util && do_ops) {
425                                 st = rrdset_find_bytype("disk_svctm", disk);
426                                 if(!st) {
427                                         st = rrdset_create("disk_svctm", disk, NULL, disk, "Average Service Time", "ms per operation", 2007, update_every, RRDSET_TYPE_LINE);
428                                         st->isdetail = 1;
429
430                                         rrddim_add(st, "svctm", NULL, 1, 1, RRDDIM_ABSOLUTE);
431                                 }
432                                 else rrdset_next_usec(st, dt);
433
434                                 rrddim_set(st, "svctm", ((reads - last_reads) + (writes - last_writes)) ? (busy_ms - last_busy_ms) / ((reads - last_reads) + (writes - last_writes)) : 0);
435                                 rrdset_done(st);
436                         }
437                 }
438         }
439         
440         return 0;
441 }