1 #ifndef NETDATA_HEALTH_H
2 #define NETDATA_HEALTH_H
4 extern int health_enabled; // declaration only; NOTE(review): presumably non-zero when health monitoring is enabled - confirm at the definition
6 extern int rrdvar_compare(void *a, void *b); // comparator over two opaque pointers; NOTE(review): presumably orders entries of the variables indexes - confirm
// Type tags for variable values.
// NOTE(review): presumably the values accepted by the `type` argument of
// rrdsetvar_create() / rrddimvar_create() - confirm against the callers.
8 #define RRDVAR_TYPE_CALCULATED 1
9 #define RRDVAR_TYPE_TIME_T 2
10 #define RRDVAR_TYPE_COLLECTED 3
11 #define RRDVAR_TYPE_TOTAL 4
12 #define RRDVAR_TYPE_INT 5
14 // The variables, as stored in the variables indexes.
15 // There are 3 such indexes:
16 // 1. at each chart (RRDSET.variables_root_index)
17 // 2. at each context (RRDFAMILY.variables_root_index) - NOTE(review): the label says "context" but the type named is RRDFAMILY; confirm which is meant
18 // 3. at each host (RRDHOST.variables_root_index)
19 typedef struct rrdvar {
31 // Variables linked to charts.
32 // We link variables to point to the values that are already
33 // calculated / processed by the normal data collection process.
34 // This means there is no speed penalty for using them.
36 typedef struct rrdsetvar {
37 char *fullid; // "<chart type>.<chart id>.<variable>"
38 char *fullname; // "<chart type>.<chart name>.<variable>"
39 char *variable; // the bare variable name
52 struct rrdset *rrdset; // the chart this variable is linked to
54 struct rrdsetvar *next; // link to another rrdsetvar; NOTE(review): presumably the next entry of the owning chart's list - confirm
58 // Variables linked to individual dimensions.
59 // We link variables to point to the values that are already
60 // calculated / processed by the normal data collection process.
61 // This means there is no speed penalty for using them.
63 typedef struct rrddimvar {
67 char *id; // dimension id
68 char *name; // dimension name
69 char *fullidid; // "<chart type>.<chart id>.<dimension id>"
70 char *fullidname; // "<chart type>.<chart id>.<dimension name>"
71 char *fullnameid; // "<chart type>.<chart name>.<dimension id>"
72 char *fullnamename; // "<chart type>.<chart name>.<dimension name>"
85 RRDVAR *host_fullidid; // RRDVAR for the fullidid name; NOTE(review): the host_ prefix suggests the host-level index - confirm
86 RRDVAR *host_fullidname; // same, for the fullidname name
87 RRDVAR *host_fullnameid; // same, for the fullnameid name
88 RRDVAR *host_fullnamename; // same, for the fullnamename name
90 struct rrddim *rrddim; // the dimension this variable is linked to
92 struct rrddimvar *next; // link to another rrddimvar; NOTE(review): presumably the next entry of the owning dimension's list - confirm
95 // Calculated variables (defined in the health configuration).
96 // These aggregate time-series data at fixed intervals
97 // (defined in their update_every member below).
98 // These increase the overhead of netdata.
100 // These calculations are allocated and linked (->next).
102 // They are also linked to RRDSET (of course only when the
103 // chart is found, via ->rrdset_next and ->rrdset_prev).
104 // This doubly-linked list is maintained sorted at all times,
105 // having as RRDSET.calculations the RRDCALC to be processed
// Alarm status codes.
// NOTE(review): presumably the values held by the `status` member of
// struct rrdcalc - confirm.
// NOTE(review): the negative values are not parenthesized; writing them as
// (-2) and (-1) is the safer form for macro constants.
108 #define RRDCALC_STATUS_REMOVED -2
109 #define RRDCALC_STATUS_UNDEFINED -1
110 #define RRDCALC_STATUS_UNINITIALIZED 0
111 #define RRDCALC_STATUS_CLEAR 1
112 #define RRDCALC_STATUS_RAISED 2
113 #define RRDCALC_STATUS_WARNING 3
114 #define RRDCALC_STATUS_CRITICAL 4
// Bit flags for the rrdcalc_flags member of struct rrdcalc
// (each value is a distinct single bit, so they can be OR-ed together).
116 #define RRDCALC_FLAG_DB_ERROR 0x00000001
117 #define RRDCALC_FLAG_DB_NAN 0x00000002
118 #define RRDCALC_FLAG_DB_STALE 0x00000004
119 #define RRDCALC_FLAG_CALC_ERROR 0x00000008
120 #define RRDCALC_FLAG_WARN_ERROR 0x00000010
121 #define RRDCALC_FLAG_CRIT_ERROR 0x00000020
123 typedef struct rrdcalc {
124 uint32_t id; // the unique id of this alarm
125 uint32_t next_event_id; // the next event id that will be used for this alarm
127 char *name; // the name of this alarm
130 char *exec; // the command to execute when this alarm switches state
131 char *recipient; // the recipient of the alarm (the first parameter to exec)
133 char *chart; // the id of the chart this alarm should be linked to
136 char *source; // the source of this alarm
137 char *units; // the units of the alarm
138 char *info; // a short description of the alarm
140 int update_every; // update frequency for the alarm
142 // the red and green thresholds of this alarm (to be set to the chart)
143 calculated_number green;
144 calculated_number red;
146 // ------------------------------------------------------------------------
147 // database lookup settings
149 char *dimensions; // the chart dimensions
150 int group; // grouping method: average, max, etc.
151 int before; // ending point in time-series
152 int after; // starting point in time-series; RRDCALC_HAS_DB_LOOKUP() tests this member
153 uint32_t options; // calculation options
155 // ------------------------------------------------------------------------
156 // expressions related to the alarm
158 EVAL_EXPRESSION *calculation; // expression to calculate the value of the alarm
159 EVAL_EXPRESSION *warning; // expression to check the warning condition
160 EVAL_EXPRESSION *critical; // expression to check the critical condition
162 // ------------------------------------------------------------------------
163 // notification delay settings
165 int delay_up_duration; // duration to delay notifications when the alarm raises
166 int delay_down_duration; // duration to delay notifications when the alarm lowers
167 int delay_max_duration; // the absolute max delay to apply to this alarm
168 float delay_multiplier; // multiplier for all delays when the alarm switches status
169 // while now < delay_up_to_timestamp
171 // ------------------------------------------------------------------------
172 // runtime information
174 int status; // the current status of the alarm
176 calculated_number value; // the current value of the alarm
177 calculated_number old_value; // the previous value of the alarm
179 uint32_t rrdcalc_flags; // check RRDCALC_FLAG_*
181 time_t last_updated; // the last update timestamp of the alarm
182 time_t next_update; // the next update timestamp of the alarm
183 time_t last_status_change; // the timestamp of the last time this alarm changed status
185 time_t db_after; // the first timestamp evaluated by the db lookup
186 time_t db_before; // the last timestamp evaluated by the db lookup
188 time_t delay_up_to_timestamp; // the timestamp up to which we should delay notifications
189 int delay_up_current; // the current up notification delay duration
190 int delay_down_current; // the current down notification delay duration
191 int delay_last; // the last delay we used
193 // ------------------------------------------------------------------------
194 // variables this alarm exposes to the rest of the alarms
201 // ------------------------------------------------------------------------
202 // the chart this alarm is linked to
204 struct rrdset *rrdset;
206 // linking of this alarm on its chart (previous / next alarm of the same chart)
207 struct rrdcalc *rrdset_next;
208 struct rrdcalc *rrdset_prev;
210 struct rrdcalc *next; // link to another rrdcalc, independent of the per-chart links above
// Evaluates to rc->after, i.e. non-zero (true) when the `after` database
// lookup setting of the alarm is non-zero. `rc` is a pointer to struct rrdcalc.
213 #define RRDCALC_HAS_DB_LOOKUP(rc) ((rc)->after)
216 // Alarm templates: these are applied to charts found dynamically,
217 // based on their context.
218 typedef struct rrdcalctemplate {
226 uint32_t hash_context; // NOTE(review): presumably a hash of the context string used for matching - confirm
228 char *source; // the source of this alarm
229 char *units; // the units of the alarm
230 char *info; // a short description of the alarm
232 int update_every; // update frequency for the alarm
234 // the red and green thresholds of this alarm (to be set to the chart)
235 calculated_number green;
236 calculated_number red;
238 // ------------------------------------------------------------------------
239 // database lookup settings
241 char *dimensions; // the chart dimensions
242 int group; // grouping method: average, max, etc.
243 int before; // ending point in time-series
244 int after; // starting point in time-series; RRDCALCTEMPLATE_HAS_CALCULATION() tests this member
245 uint32_t options; // calculation options
247 // ------------------------------------------------------------------------
248 // notification delay settings
250 int delay_up_duration; // duration to delay notifications when the alarm raises
251 int delay_down_duration; // duration to delay notifications when the alarm lowers
252 int delay_max_duration; // the absolute max delay to apply to this alarm
253 float delay_multiplier; // multiplier for all delays when the alarm switches status
255 // ------------------------------------------------------------------------
256 // expressions related to the alarm (same three members as in struct rrdcalc)
258 EVAL_EXPRESSION *calculation;
259 EVAL_EXPRESSION *warning;
260 EVAL_EXPRESSION *critical;
262 struct rrdcalctemplate *next; // link to another template
// Evaluates to rt->after, i.e. non-zero (true) when the `after` database
// lookup setting of the template is non-zero.
// NOTE(review): despite the name, this tests `after` (a db lookup setting),
// not the `calculation` expression - it is the same test as
// RRDCALC_HAS_DB_LOOKUP(). Confirm the intent before relying on the name.
265 #define RRDCALCTEMPLATE_HAS_CALCULATION(rt) ((rt)->after)
// Bit flags named HEALTH_ENTRY_FLAG_*; each value is a distinct single bit.
// NOTE(review): presumably stored in a flags member of struct alarm_entry - confirm.
// SAVED uses a high bit (0x10000000), apart from the low four bits used by the others.
267 #define HEALTH_ENTRY_FLAG_PROCESSED 0x00000001
268 #define HEALTH_ENTRY_FLAG_UPDATED 0x00000002
269 #define HEALTH_ENTRY_FLAG_EXEC_RUN 0x00000004
270 #define HEALTH_ENTRY_FLAG_EXEC_FAILED 0x00000008
271 #define HEALTH_ENTRY_FLAG_SAVED 0x10000000
// One entry of the alarm log.
// NOTE(review): member descriptions below are inferred from names only - confirm.
273 typedef struct alarm_entry {
276 uint32_t alarm_event_id; // presumably the per-alarm event id (see next_event_id in struct rrdcalc)
280 time_t non_clear_duration;
292 time_t exec_run_timestamp; // presumably when the notification command was run
299 calculated_number old_value; // value before the transition
300 calculated_number new_value; // value after the transition
307 time_t delay_up_to_timestamp; // presumably the timestamp up to which the notification is delayed
309 uint32_t updated_by_id;
312 struct alarm_entry *next; // link to another entry of the log
// The alarm log container.
315 typedef struct alarm_log {
316 uint32_t next_log_id; // NOTE(review): presumably the id to assign to the next log entry - confirm
317 uint32_t next_alarm_id; // NOTE(review): presumably the id to assign to the next alarm - confirm
321 pthread_rwlock_t alarm_log_rwlock; // read/write lock; NOTE(review): presumably guards access to this log - confirm
// Chart variable API (RRDSETVAR), operating on a chart `st`.
326 extern void rrdsetvar_rename_all(RRDSET *st);
// `type` is an int type tag (NOTE(review): presumably one of RRDVAR_TYPE_* - confirm); `value` is an opaque pointer to the value.
327 extern RRDSETVAR *rrdsetvar_create(RRDSET *st, const char *variable, int type, void *value, uint32_t options);
328 extern void rrdsetvar_free(RRDSETVAR *rs);
// Dimension variable API (RRDDIMVAR), operating on a dimension `rd`.
330 extern void rrddimvar_rename_all(RRDDIM *rd);
// `type` is an int type tag (NOTE(review): presumably one of RRDVAR_TYPE_* - confirm); `prefix` / `suffix` are strings
// (NOTE(review): presumably placed around the dimension id/name to build the variable names - confirm).
331 extern RRDDIMVAR *rrddimvar_create(RRDDIM *rd, int type, const char *prefix, const char *suffix, void *value, uint32_t options);
332 extern void rrddimvar_free(RRDDIMVAR *rs);
// Linking of alarms (RRDCALC) and alarm templates to a chart `st`.
334 extern void rrdsetcalc_link_matching(RRDSET *st);
335 extern void rrdsetcalc_unlink(RRDCALC *rc);
336 extern void rrdcalctemplate_link_matching(RRDSET *st);
// Takes a chart and an alarm name and returns an RRDCALC pointer;
// NOTE(review): the not-found result (presumably NULL) is not visible here - confirm.
337 extern RRDCALC *rrdcalc_find(RRDSET *st, const char *name);
// Health subsystem entry points.
339 extern void health_init(void);
// Signature matches a pthread start routine (void *(*)(void *)); NOTE(review): presumably run as the health thread - confirm.
340 extern void *health_main(void *ptr);
342 extern void health_reload(void);
// Takes a variable name with its hash and an alarm `rc`, and an output pointer `result`;
// NOTE(review): the meaning of the int return value is not visible here - confirm at the definition.
344 extern int health_variable_lookup(const char *variable, uint32_t hash, RRDCALC *rc, calculated_number *result);
// JSON output helpers that take a host and an output BUFFER `wb`.
345 extern void health_alarms2json(RRDHOST *host, BUFFER *wb, int all);
346 extern void health_alarm_log2json(RRDHOST *host, BUFFER *wb, uint32_t after);
348 #endif //NETDATA_HEALTH_H