11 #include "plugin_proc.h"
/* Chart type under which the per-disk bandwidth charts are looked up and created. */
#define RRD_TYPE_DISK "disk"

/*
 * Length of RRD_TYPE_DISK, not counting the terminating NUL.
 * Derived with sizeof on the string literal so that it is an integer constant
 * expression (usable as an array bound or in a static initializer) instead of
 * a strlen() call evaluated at every expansion. The value and type (size_t)
 * are the same as before.
 */
#define RRD_TYPE_DISK_LEN (sizeof(RRD_TYPE_DISK) - 1)

/*
 * NOTE(review): presumably the maximum accepted length of one diskstats line;
 * it is not referenced in the visible part of this file - confirm before removing.
 */
#define MAX_PROC_DISKSTATS_LINE 4096
18 int do_proc_diskstats(int update_every, unsigned long long dt) {
19 static procfile *ff = NULL;
20 static char path_to_get_hw_sector_size[FILENAME_MAX + 1] = "";
21 static int enable_new_disks = -1;
22 static int do_io = -1, do_ops = -1, do_mops = -1, do_iotime = -1, do_qops = -1, do_util = -1, do_backlog = -1;
24 if(enable_new_disks == -1) enable_new_disks = config_get_boolean("plugin:proc:/proc/diskstats", "enable new disks detected at runtime", 1);
26 if(do_io == -1) do_io = config_get_boolean("plugin:proc:/proc/diskstats", "bandwidth for all disks", 1);
27 if(do_ops == -1) do_ops = config_get_boolean("plugin:proc:/proc/diskstats", "operations for all disks", 1);
28 if(do_mops == -1) do_mops = config_get_boolean("plugin:proc:/proc/diskstats", "merged operations for all disks", 1);
29 if(do_iotime == -1) do_iotime = config_get_boolean("plugin:proc:/proc/diskstats", "i/o time for all disks", 1);
30 if(do_qops == -1) do_qops = config_get_boolean("plugin:proc:/proc/diskstats", "queued operations for all disks", 1);
31 if(do_util == -1) do_util = config_get_boolean("plugin:proc:/proc/diskstats", "utilization percentage for all disks", 1);
32 if(do_backlog == -1)do_backlog = config_get_boolean("plugin:proc:/proc/diskstats", "backlog for all disks", 1);
35 char filename[FILENAME_MAX + 1];
36 snprintf(filename, FILENAME_MAX, "%s%s", global_host_prefix, "/proc/diskstats");
37 ff = procfile_open(config_get("plugin:proc:/proc/diskstats", "filename to monitor", filename), " \t", PROCFILE_FLAG_DEFAULT);
41 if(!path_to_get_hw_sector_size[0]) {
42 char filename[FILENAME_MAX + 1];
43 snprintf(filename, FILENAME_MAX, "%s%s", global_host_prefix, "/sys/block/%s/queue/hw_sector_size");
44 snprintf(path_to_get_hw_sector_size, FILENAME_MAX, "%s%s", global_host_prefix, config_get("plugin:proc:/proc/diskstats", "path to get h/w sector size", filename));
47 ff = procfile_readall(ff);
48 if(!ff) return 0; // we return 0, so that we will retry to open it next time
50 uint32_t lines = procfile_lines(ff), l;
53 for(l = 0; l < lines ;l++) {
55 unsigned long long major = 0, minor = 0,
56 reads = 0, mreads = 0, readsectors = 0, readms = 0,
57 writes = 0, mwrites = 0, writesectors = 0, writems = 0,
58 queued_ios = 0, busy_ms = 0, backlog_ms = 0;
60 unsigned long long last_reads = 0, last_readsectors = 0, last_readms = 0,
61 last_writes = 0, last_writesectors = 0, last_writems = 0,
64 words = procfile_linewords(ff, l);
65 if(words < 14) continue;
67 major = strtoull(procfile_lineword(ff, l, 0), NULL, 10);
68 minor = strtoull(procfile_lineword(ff, l, 1), NULL, 10);
69 disk = procfile_lineword(ff, l, 2);
71 // # of reads completed # of writes completed
72 // This is the total number of reads or writes completed successfully.
73 reads = strtoull(procfile_lineword(ff, l, 3), NULL, 10); // rd_ios
74 writes = strtoull(procfile_lineword(ff, l, 7), NULL, 10); // wr_ios
76 // # of reads merged # of writes merged
77 // Reads and writes which are adjacent to each other may be merged for
78 // efficiency. Thus two 4K reads may become one 8K read before it is
79 // ultimately handed to the disk, and so it will be counted (and queued) as only one I/O.
80 mreads = strtoull(procfile_lineword(ff, l, 4), NULL, 10); // rd_merges_or_rd_sec
81 mwrites = strtoull(procfile_lineword(ff, l, 8), NULL, 10); // wr_merges
83 // # of sectors read # of sectors written
84 // This is the total number of sectors read or written successfully.
85 readsectors = strtoull(procfile_lineword(ff, l, 5), NULL, 10); // rd_sec_or_wr_ios
86 writesectors = strtoull(procfile_lineword(ff, l, 9), NULL, 10); // wr_sec
88 // # of milliseconds spent reading # of milliseconds spent writing
89 // This is the total number of milliseconds spent by all reads or writes (as
90 // measured from __make_request() to end_that_request_last()).
91 readms = strtoull(procfile_lineword(ff, l, 6), NULL, 10); // rd_ticks_or_wr_sec
92 writems = strtoull(procfile_lineword(ff, l, 10), NULL, 10); // wr_ticks
94 // # of I/Os currently in progress
95 // The only field that should go to zero. Incremented as requests are
96 // given to appropriate struct request_queue and decremented as they finish.
97 queued_ios = strtoull(procfile_lineword(ff, l, 11), NULL, 10); // ios_pgr
99 // # of milliseconds spent doing I/Os
100 // This field increases so long as field queued_ios is nonzero.
101 busy_ms = strtoull(procfile_lineword(ff, l, 12), NULL, 10); // tot_ticks
103 // weighted # of milliseconds spent doing I/Os
104 // This field is incremented at each I/O start, I/O completion, I/O
105 // merge, or read of these stats by the number of I/Os in progress
106 // (field queued_ios) times the number of milliseconds spent doing I/O since the
107 // last update of this field. This can provide an easy measure of both
108 // I/O completion time and the backlog that may be accumulating.
109 backlog_ms = strtoull(procfile_lineword(ff, l, 13), NULL, 10); // rq_ticks
113 // remove slashes from disk names
115 for(s = disk; *s ;s++) if(*s == '/') *s = '_';
119 case 43: // network block
126 def_enabled = enable_new_disks;
148 if(minor % 8) def_enabled = 0; // partitions
149 else def_enabled = enable_new_disks;
152 case 8: // scsi disks
153 case 65: // scsi disks
154 case 66: // scsi disks
155 case 67: // scsi disks
156 case 68: // scsi disks
157 case 69: // scsi disks
158 case 70: // scsi disks
159 case 71: // scsi disks
160 case 72: // scsi disks
161 case 73: // scsi disks
162 case 74: // scsi disks
163 case 75: // scsi disks
164 case 76: // scsi disks
165 case 77: // scsi disks
166 case 78: // scsi disks
167 case 79: // scsi disks
176 case 101: // hyperdisk
177 case 102: // compressed
186 case 114: // bios raid
187 case 116: // ram board
200 if(minor % 16) def_enabled = 0; // partitions
201 else def_enabled = enable_new_disks;
206 if(minor % 32) def_enabled = 0; // partitions
207 else def_enabled = enable_new_disks;
221 if(minor % 64) def_enabled = 0; // partitions
222 else def_enabled = enable_new_disks;
230 // check if it is enabled
232 char var_name[4096 + 1];
233 snprintf(var_name, 4096, "disk %s", disk);
234 if(!config_get_boolean("plugin:proc:/proc/diskstats", var_name, def_enabled)) continue;
239 // --------------------------------------------------------------------
241 int sector_size = 512;
243 st = rrdset_find_bytype(RRD_TYPE_DISK, disk);
245 char tf[FILENAME_MAX + 1], *t;
246 char ssfilename[FILENAME_MAX + 1];
248 strncpy(tf, disk, FILENAME_MAX);
249 tf[FILENAME_MAX] = '\0';
251 // replace all / with !
252 while((t = strchr(tf, '/'))) *t = '!';
254 snprintf(ssfilename, FILENAME_MAX, path_to_get_hw_sector_size, tf);
255 FILE *fpss = fopen(ssfilename, "r");
258 char *tmp = fgets(ssbuffer, 1024, fpss);
261 sector_size = atoi(tmp);
262 if(sector_size <= 0) {
263 error("Invalid sector size %d for device %s in %s. Assuming 512.", sector_size, disk, ssfilename);
267 else error("Cannot read data for sector size for device %s from %s. Assuming 512.", disk, ssfilename);
271 else error("Cannot read sector size for device %s from %s. Assuming 512.", disk, ssfilename);
273 st = rrdset_create(RRD_TYPE_DISK, disk, NULL, disk, "Disk I/O Bandwidth", "kilobytes/s", 2000, update_every, RRDSET_TYPE_AREA);
275 rrddim_add(st, "reads", NULL, sector_size, 1024 * update_every, RRDDIM_INCREMENTAL);
276 rrddim_add(st, "writes", NULL, sector_size * -1, 1024 * update_every, RRDDIM_INCREMENTAL);
278 else rrdset_next_usec(st, dt);
280 last_readsectors = rrddim_set(st, "reads", readsectors);
281 last_writesectors = rrddim_set(st, "writes", writesectors);
285 // --------------------------------------------------------------------
288 st = rrdset_find_bytype("disk_ops", disk);
290 st = rrdset_create("disk_ops", disk, NULL, disk, "Disk Completed I/O Operations", "operations/s", 2001, update_every, RRDSET_TYPE_LINE);
293 rrddim_add(st, "reads", NULL, 1, 1 * update_every, RRDDIM_INCREMENTAL);
294 rrddim_add(st, "writes", NULL, -1, 1 * update_every, RRDDIM_INCREMENTAL);
296 else rrdset_next_usec(st, dt);
298 last_reads = rrddim_set(st, "reads", reads);
299 last_writes = rrddim_set(st, "writes", writes);
303 // --------------------------------------------------------------------
306 st = rrdset_find_bytype("disk_qops", disk);
308 st = rrdset_create("disk_qops", disk, NULL, disk, "Disk Queued I/O Operations", "operations", 2002, update_every, RRDSET_TYPE_LINE);
311 rrddim_add(st, "operations", NULL, 1, 1, RRDDIM_ABSOLUTE);
313 else rrdset_next_usec(st, dt);
315 rrddim_set(st, "operations", queued_ios);
319 // --------------------------------------------------------------------
322 st = rrdset_find_bytype("disk_backlog", disk);
324 st = rrdset_create("disk_backlog", disk, NULL, disk, "Disk Backlog", "backlog (ms)", 2003, update_every, RRDSET_TYPE_AREA);
327 rrddim_add(st, "backlog", NULL, 1, 10 * update_every, RRDDIM_INCREMENTAL);
329 else rrdset_next_usec(st, dt);
331 rrddim_set(st, "backlog", backlog_ms);
335 // --------------------------------------------------------------------
338 st = rrdset_find_bytype("disk_util", disk);
340 st = rrdset_create("disk_util", disk, NULL, disk, "Disk Utilization Time", "% of time working", 2004, update_every, RRDSET_TYPE_AREA);
343 rrddim_add(st, "utilization", NULL, 1, 10 * update_every, RRDDIM_INCREMENTAL);
345 else rrdset_next_usec(st, dt);
347 last_busy_ms = rrddim_set(st, "utilization", busy_ms);
351 // --------------------------------------------------------------------
354 st = rrdset_find_bytype("disk_mops", disk);
356 st = rrdset_create("disk_mops", disk, NULL, disk, "Disk Merged Operations", "merged operations/s", 2021, update_every, RRDSET_TYPE_LINE);
359 rrddim_add(st, "reads", NULL, 1, 1 * update_every, RRDDIM_INCREMENTAL);
360 rrddim_add(st, "writes", NULL, -1, 1 * update_every, RRDDIM_INCREMENTAL);
362 else rrdset_next_usec(st, dt);
364 rrddim_set(st, "reads", mreads);
365 rrddim_set(st, "writes", mwrites);
369 // --------------------------------------------------------------------
372 st = rrdset_find_bytype("disk_iotime", disk);
374 st = rrdset_create("disk_iotime", disk, NULL, disk, "Disk Total I/O Time", "milliseconds/s", 2022, update_every, RRDSET_TYPE_LINE);
377 rrddim_add(st, "reads", NULL, 1, 1 * update_every, RRDDIM_INCREMENTAL);
378 rrddim_add(st, "writes", NULL, -1, 1 * update_every, RRDDIM_INCREMENTAL);
380 else rrdset_next_usec(st, dt);
382 last_readms = rrddim_set(st, "reads", readms);
383 last_writems = rrddim_set(st, "writes", writems);
387 // --------------------------------------------------------------------
388 // calculate differential charts
389 // only if this is not the first time we run
392 if(do_iotime && do_ops) {
393 st = rrdset_find_bytype("disk_await", disk);
395 st = rrdset_create("disk_await", disk, NULL, disk, "Average Completed I/O Operation Time", "ms per operation", 2005, update_every, RRDSET_TYPE_LINE);
398 rrddim_add(st, "reads", NULL, 1, 1, RRDDIM_ABSOLUTE);
399 rrddim_add(st, "writes", NULL, -1, 1, RRDDIM_ABSOLUTE);
401 else rrdset_next_usec(st, dt);
403 rrddim_set(st, "reads", (reads - last_reads) ? (readms - last_readms) / (reads - last_reads) : 0);
404 rrddim_set(st, "writes", (writes - last_writes) ? (writems - last_writems) / (writes - last_writes) : 0);
408 if(do_io && do_ops) {
409 st = rrdset_find_bytype("disk_avgsz", disk);
411 st = rrdset_create("disk_avgsz", disk, NULL, disk, "Average Completed I/O Operation Bandwidth", "kilobytes per operation", 2006, update_every, RRDSET_TYPE_AREA);
414 rrddim_add(st, "reads", NULL, sector_size, 1024, RRDDIM_ABSOLUTE);
415 rrddim_add(st, "writes", NULL, -sector_size, 1024, RRDDIM_ABSOLUTE);
417 else rrdset_next_usec(st, dt);
419 rrddim_set(st, "reads", (reads - last_reads) ? (readsectors - last_readsectors) / (reads - last_reads) : 0);
420 rrddim_set(st, "writes", (writes - last_writes) ? (writesectors - last_writesectors) / (writes - last_writes) : 0);
424 if(do_util && do_ops) {
425 st = rrdset_find_bytype("disk_svctm", disk);
427 st = rrdset_create("disk_svctm", disk, NULL, disk, "Average Service Time", "ms per operation", 2007, update_every, RRDSET_TYPE_LINE);
430 rrddim_add(st, "svctm", NULL, 1, 1, RRDDIM_ABSOLUTE);
432 else rrdset_next_usec(st, dt);
434 rrddim_set(st, "svctm", ((reads - last_reads) + (writes - last_writes)) ? (busy_ms - last_busy_ms) / ((reads - last_reads) + (writes - last_writes)) : 0);