]> arthur.barton.de Git - netdata.git/blob - src/rrdpush.c
prevent cancelling the sending thread with locks in place
[netdata.git] / src / rrdpush.c
1 #include "common.h"
2
3 /*
4  * rrdpush
5  *
6  * 3 threads are involved for all stream operations
7  *
8  * 1. a random data collection thread, calling rrdset_done_push()
9  *    this is called for each chart.
10  *
11  *    the output of this work is kept in a BUFFER in RRDHOST
12  *    the sender thread is signalled via a pipe (also in RRDHOST)
13  *
14  * 2. a sender thread running at the sending netdata
15  *    this is spawned automatically on the first chart to be pushed
16  *
17  *    It tries to push the metrics to the remote netdata, as fast
18  *    as possible (i.e. immediately after they are collected).
19  *
20  * 3. a receiver thread, running at the receiving netdata
21  *    this is spawned automatically when the sender connects to
22  *    the receiver.
23  *
24  */
25
// the reply the receiving netdata sends to tell the sender
// that it may start pushing metrics
#define START_STREAMING_PROMPT "Hit me baby, push them over..."

// global streaming defaults
// rrdpush_init() loads them from the stream configuration
int   default_rrdpush_enabled     = 0;
char *default_rrdpush_destination = NULL;
char *default_rrdpush_api_key     = NULL;
31
32 int rrdpush_init() {
33     default_rrdpush_enabled     = appconfig_get_boolean(&stream_config, CONFIG_SECTION_STREAM, "enabled", default_rrdpush_enabled);
34     default_rrdpush_destination = appconfig_get(&stream_config, CONFIG_SECTION_STREAM, "destination", "");
35     default_rrdpush_api_key     = appconfig_get(&stream_config, CONFIG_SECTION_STREAM, "api key", "");
36     rrdhost_free_orphan_time    = appconfig_get_number(&stream_config, CONFIG_SECTION_STREAM, "free orphan hosts after seconds", rrdhost_free_orphan_time);
37
38     if(default_rrdpush_enabled && (!default_rrdpush_destination || !*default_rrdpush_destination || !default_rrdpush_api_key || !*default_rrdpush_api_key)) {
39         error("STREAM [send]: cannot enable sending thread - information is missing.");
40         default_rrdpush_enabled = 0;
41     }
42
43     return default_rrdpush_enabled;
44 }
45
// size of the buffer that receives the name of the
// destination the sender thread connected to
#define CONNECTED_TO_SIZE 100

// data collection happens from multiple threads;
// each of them calls rrdset_done(), which in turn
// calls rrdset_done_push(), which writes to this pipe
// to notify the sender thread that more data
// are ready to be sent
#define PIPE_READ 0
#define PIPE_WRITE 1

// to have the remote netdata re-sync each chart
// to its current clock, the BEGIN line is sent
// without microseconds for this many of the
// first iterations of the chart
static unsigned int remote_clock_resync_iterations = 60;

// lock / unlock the rrdpush mutex of a host
#define rrdpush_lock(host) pthread_mutex_lock(&((host)->rrdpush_mutex))
#define rrdpush_unlock(host) pthread_mutex_unlock(&((host)->rrdpush_mutex))
64
65 // checks if the current chart definition has been sent
66 static inline int need_to_send_chart_definition(RRDSET *st) {
67     RRDDIM *rd;
68     rrddim_foreach_read(rd, st)
69         if(!rd->exposed)
70             return 1;
71
72     return 0;
73 }
74
75 // sends the current chart definition
76 static inline void send_chart_definition(RRDSET *st) {
77     buffer_sprintf(st->rrdhost->rrdpush_buffer, "CHART '%s' '%s' '%s' '%s' '%s' '%s' '%s' %ld %d\n"
78                 , st->id
79                 , st->name
80                 , st->title
81                 , st->units
82                 , st->family
83                 , st->context
84                 , rrdset_type_name(st->chart_type)
85                 , st->priority
86                 , st->update_every
87     );
88
89     RRDDIM *rd;
90     rrddim_foreach_read(rd, st) {
91         buffer_sprintf(st->rrdhost->rrdpush_buffer, "DIMENSION '%s' '%s' '%s' " COLLECTED_NUMBER_FORMAT " " COLLECTED_NUMBER_FORMAT " '%s %s'\n"
92                        , rd->id
93                        , rd->name
94                        , rrd_algorithm_name(rd->algorithm)
95                        , rd->multiplier
96                        , rd->divisor
97                        , rrddim_flag_check(rd, RRDDIM_FLAG_HIDDEN)?"hidden":""
98                        , rrddim_flag_check(rd, RRDDIM_FLAG_DONT_DETECT_RESETS_OR_OVERFLOWS)?"noreset":""
99         );
100         rd->exposed = 1;
101     }
102 }
103
104 // sends the current chart dimensions
105 static inline void send_chart_metrics(RRDSET *st) {
106     buffer_sprintf(st->rrdhost->rrdpush_buffer, "BEGIN %s %llu\n", st->id, (st->counter_done > remote_clock_resync_iterations)?st->usec_since_last_update:0);
107
108     RRDDIM *rd;
109     rrddim_foreach_read(rd, st) {
110         if(rd->updated && rd->exposed)
111             buffer_sprintf(st->rrdhost->rrdpush_buffer, "SET %s = " COLLECTED_NUMBER_FORMAT "\n"
112                        , rd->id
113                        , rd->collected_value
114         );
115     }
116
117     buffer_strcat(st->rrdhost->rrdpush_buffer, "END\n");
118 }
119
120 void rrdpush_sender_thread_spawn(RRDHOST *host);
121
122 void rrdset_done_push(RRDSET *st) {
123     RRDHOST *host = st->rrdhost;
124
125     if(unlikely(!rrdset_flag_check(st, RRDSET_FLAG_ENABLED)))
126         return;
127
128     rrdpush_lock(host);
129
130     if(unlikely(host->rrdpush_enabled && !host->rrdpush_spawn))
131         rrdpush_sender_thread_spawn(host);
132
133     if(unlikely(!host->rrdpush_buffer || !host->rrdpush_connected)) {
134         if(unlikely(!host->rrdpush_error_shown))
135             error("STREAM %s [send]: not ready - discarding collected metrics.", host->hostname);
136
137         host->rrdpush_error_shown = 1;
138
139         rrdpush_unlock(host);
140         return;
141     }
142     else if(unlikely(host->rrdpush_error_shown)) {
143         info("STREAM %s [send]: ready - sending metrics...", host->hostname);
144         host->rrdpush_error_shown = 0;
145     }
146
147     if(need_to_send_chart_definition(st))
148         send_chart_definition(st);
149
150     send_chart_metrics(st);
151
152     // signal the sender there are more data
153     if(write(host->rrdpush_pipe[PIPE_WRITE], " ", 1) == -1)
154         error("STREAM %s [send]: cannot write to internal pipe", host->hostname);
155
156     rrdpush_unlock(host);
157 }
158
159 // ----------------------------------------------------------------------------
160 // rrdpush sender thread
161
162 // resets all the chart, so that their definitions
163 // will be resent to the central netdata
164 static void rrdpush_sender_thread_reset_all_charts(RRDHOST *host) {
165     rrdhost_rdlock(host);
166
167     RRDSET *st;
168     rrdset_foreach_read(st, host) {
169
170         // make it re-align the current time
171         // on the remote host
172         st->counter_done = 0;
173
174         rrdset_rdlock(st);
175
176         RRDDIM *rd;
177         rrddim_foreach_read(rd, st)
178             rd->exposed = 0;
179
180         rrdset_unlock(st);
181     }
182
183     rrdhost_unlock(host);
184 }
185
186 static inline void rrdpush_sender_thread_data_flush(RRDHOST *host) {
187     rrdpush_lock(host);
188
189     if(buffer_strlen(host->rrdpush_buffer))
190         error("STREAM %s [send]: discarding %zu bytes of metrics already in the buffer.", host->hostname, buffer_strlen(host->rrdpush_buffer));
191
192     buffer_flush(host->rrdpush_buffer);
193
194     rrdpush_sender_thread_reset_all_charts(host);
195
196     rrdpush_unlock(host);
197 }
198
199 static void rrdpush_sender_thread_cleanup_locked_all(RRDHOST *host) {
200     host->rrdpush_connected = 0;
201
202     if(host->rrdpush_socket != -1) {
203         close(host->rrdpush_socket);
204         host->rrdpush_socket = -1;
205     }
206
207     // close the pipe
208     if(host->rrdpush_pipe[PIPE_READ] != -1) {
209         close(host->rrdpush_pipe[PIPE_READ]);
210         host->rrdpush_pipe[PIPE_READ] = -1;
211     }
212
213     if(host->rrdpush_pipe[PIPE_WRITE] != -1) {
214         close(host->rrdpush_pipe[PIPE_WRITE]);
215         host->rrdpush_pipe[PIPE_WRITE] = -1;
216     }
217
218     buffer_free(host->rrdpush_buffer);
219     host->rrdpush_buffer = NULL;
220
221     host->rrdpush_spawn = 0;
222 }
223
224 void rrdpush_sender_thread_stop(RRDHOST *host) {
225     rrdpush_lock(host);
226     rrdhost_wrlock(host);
227
228     if(host->rrdpush_spawn) {
229         info("STREAM %s [send]: stopping sending thread...", host->hostname);
230         pthread_cancel(host->rrdpush_thread);
231         rrdpush_sender_thread_cleanup_locked_all(host);
232     }
233
234     rrdhost_unlock(host);
235     rrdpush_unlock(host);
236 }
237
238 void *rrdpush_sender_thread(void *ptr) {
239     RRDHOST *host = (RRDHOST *)ptr;
240
241     info("STREAM %s [send]: thread created (task id %d)", host->hostname, gettid());
242
243     if(pthread_setcanceltype(PTHREAD_CANCEL_DEFERRED, NULL) != 0)
244         error("STREAM %s [send]: cannot set pthread cancel type to DEFERRED.", host->hostname);
245
246     if(pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, NULL) != 0)
247         error("STREAM %s [send]: cannot set pthread cancel state to ENABLE.", host->hostname);
248
249     int timeout = (int)appconfig_get_number(&stream_config, CONFIG_SECTION_STREAM, "timeout seconds", 60);
250     int default_port = (int)appconfig_get_number(&stream_config, CONFIG_SECTION_STREAM, "default port", 19999);
251     size_t max_size = (size_t)appconfig_get_number(&stream_config, CONFIG_SECTION_STREAM, "buffer size bytes", 1024 * 1024);
252     unsigned int reconnect_delay = (unsigned int)appconfig_get_number(&stream_config, CONFIG_SECTION_STREAM, "reconnect delay seconds", 5);
253     remote_clock_resync_iterations = (unsigned int)appconfig_get_number(&stream_config, CONFIG_SECTION_STREAM, "initial clock resync iterations", remote_clock_resync_iterations);
254     char connected_to[CONNECTED_TO_SIZE + 1] = "";
255
256     if(!host->rrdpush_enabled || !host->rrdpush_destination || !*host->rrdpush_destination || !host->rrdpush_api_key || !*host->rrdpush_api_key)
257         goto cleanup;
258
259     // initialize rrdpush globals
260     host->rrdpush_buffer = buffer_create(1);
261     host->rrdpush_connected = 0;
262     if(pipe(host->rrdpush_pipe) == -1) fatal("STREAM %s [send]: cannot create required pipe.", host->hostname);
263
264     // initialize local variables
265     size_t begin = 0;
266     size_t reconnects_counter = 0;
267     size_t sent_bytes = 0;
268     size_t sent_connection = 0;
269
270     struct timeval tv = {
271             .tv_sec = timeout,
272             .tv_usec = 0
273     };
274
275     struct pollfd fds[2], *ifd, *ofd;
276     nfds_t fdmax;
277
278     ifd = &fds[0];
279     ofd = &fds[1];
280
281     for(; host->rrdpush_enabled && !netdata_exit ;) {
282
283         if(unlikely(host->rrdpush_socket == -1)) {
284             // stop appending data into rrdpush_buffer
285             // they will be lost, so there is no point to do it
286             host->rrdpush_connected = 0;
287
288             info("STREAM %s [send to %s]: connecting...", host->hostname, host->rrdpush_destination);
289             host->rrdpush_socket = connect_to_one_of(host->rrdpush_destination, default_port, &tv, &reconnects_counter, connected_to, CONNECTED_TO_SIZE);
290
291             if(unlikely(host->rrdpush_socket == -1)) {
292                 error("STREAM %s [send to %s]: failed to connect", host->hostname, host->rrdpush_destination);
293                 sleep(reconnect_delay);
294                 continue;
295             }
296
297             info("STREAM %s [send to %s]: initializing communication...", host->hostname, connected_to);
298
299             char http[1000 + 1];
300             snprintfz(http, 1000,
301                     "STREAM key=%s&hostname=%s&machine_guid=%s&os=%s&update_every=%d HTTP/1.1\r\n"
302                     "User-Agent: netdata-push-service/%s\r\n"
303                     "Accept: */*\r\n\r\n"
304                       , host->rrdpush_api_key
305                       , host->hostname
306                       , host->machine_guid
307                       , host->os
308                       , default_rrd_update_every
309                       , program_version
310             );
311
312             if(send_timeout(host->rrdpush_socket, http, strlen(http), 0, timeout) == -1) {
313                 close(host->rrdpush_socket);
314                 host->rrdpush_socket = -1;
315                 error("STREAM %s [send to %s]: failed to send http header to netdata", host->hostname, connected_to);
316                 sleep(reconnect_delay);
317                 continue;
318             }
319
320             info("STREAM %s [send to %s]: waiting response from remote netdata...", host->hostname, connected_to);
321
322             if(recv_timeout(host->rrdpush_socket, http, 1000, 0, timeout) == -1) {
323                 close(host->rrdpush_socket);
324                 host->rrdpush_socket = -1;
325                 error("STREAM %s [send to %s]: failed to initialize communication", host->hostname, connected_to);
326                 sleep(reconnect_delay);
327                 continue;
328             }
329
330             if(strncmp(http, START_STREAMING_PROMPT, strlen(START_STREAMING_PROMPT))) {
331                 close(host->rrdpush_socket);
332                 host->rrdpush_socket = -1;
333                 error("STREAM %s [send to %s]: server is not replying properly.", host->hostname, connected_to);
334                 sleep(reconnect_delay);
335                 continue;
336             }
337
338             info("STREAM %s [send to %s]: established communication - sending metrics...", host->hostname, connected_to);
339
340             if(fcntl(host->rrdpush_socket, F_SETFL, O_NONBLOCK) < 0)
341                 error("STREAM %s [send to %s]: cannot set non-blocking mode for socket.", host->hostname, connected_to);
342
343             rrdpush_sender_thread_data_flush(host);
344             sent_connection = 0;
345
346             // allow appending data into rrdpush_buffer
347             host->rrdpush_connected = 1;
348         }
349
350         ifd->fd = host->rrdpush_pipe[PIPE_READ];
351         ifd->events = POLLIN;
352         ifd->revents = 0;
353
354         ofd->fd = host->rrdpush_socket;
355         ofd->revents = 0;
356         if(begin < buffer_strlen(host->rrdpush_buffer)) {
357             ofd->events = POLLOUT;
358             fdmax = 2;
359         }
360         else {
361             ofd->events = 0;
362             fdmax = 1;
363         }
364
365         if(netdata_exit) break;
366         int retval = poll(fds, fdmax, timeout * 1000);
367         if(netdata_exit) break;
368
369         if(unlikely(retval == -1)) {
370             if(errno == EAGAIN || errno == EINTR)
371                 continue;
372
373             error("STREAM %s [send to %s]: failed to poll().", host->hostname, connected_to);
374             close(host->rrdpush_socket);
375             host->rrdpush_socket = -1;
376             break;
377         }
378         else if(unlikely(!retval)) {
379             // timeout
380             continue;
381         }
382
383         if(ifd->revents & POLLIN) {
384             char buffer[1000 + 1];
385             if(read(host->rrdpush_pipe[PIPE_READ], buffer, 1000) == -1)
386                 error("STREAM %s [send to %s]: cannot read from internal pipe.", host->hostname, connected_to);
387         }
388
389         if(ofd->revents & POLLOUT && begin < buffer_strlen(host->rrdpush_buffer)) {
390
391             // BEGIN RRDPUSH LOCKED SESSION
392
393             // during this session, data collectors
394             // will not be able to append data to our buffer
395             // but the socket is in non-blocking mode
396             // so, we will not block at send()
397
398             if(pthread_setcancelstate(PTHREAD_CANCEL_DISABLE, NULL) != 0)
399                 error("STREAM %s [send]: cannot set pthread cancel state to DISABLE.", host->hostname);
400
401             rrdpush_lock(host);
402
403             ssize_t ret = send(host->rrdpush_socket, &host->rrdpush_buffer->buffer[begin], buffer_strlen(host->rrdpush_buffer) - begin, MSG_DONTWAIT);
404             if(ret == -1) {
405                 if(errno != EAGAIN && errno != EINTR) {
406                     error("STREAM %s [send to %s]: failed to send metrics - closing connection - we have sent %zu bytes on this connection.", host->hostname, connected_to, sent_connection);
407                     close(host->rrdpush_socket);
408                     host->rrdpush_socket = -1;
409                 }
410             }
411             else {
412                 sent_connection += ret;
413                 sent_bytes += ret;
414                 begin += ret;
415                 if(begin == buffer_strlen(host->rrdpush_buffer)) {
416                     // we send it all
417
418                     buffer_flush(host->rrdpush_buffer);
419                     begin = 0;
420                 }
421             }
422
423             rrdpush_unlock(host);
424
425             if(pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, NULL) != 0)
426                 error("STREAM %s [send]: cannot set pthread cancel state to ENABLE.", host->hostname);
427
428             // END RRDPUSH LOCKED SESSION
429         }
430
431         // protection from overflow
432         if(host->rrdpush_buffer->len > max_size) {
433             errno = 0;
434             error("STREAM %s [send to %s]: too many data pending - buffer is %zu bytes long, %zu unsent - we have sent %zu bytes in total, %zu on this connection. Closing connection to flush the data.", host->hostname, connected_to, host->rrdpush_buffer->len, host->rrdpush_buffer->len - begin, sent_bytes, sent_connection);
435             if(host->rrdpush_socket != -1) {
436                 close(host->rrdpush_socket);
437                 host->rrdpush_socket = -1;
438             }
439         }
440     }
441
442 cleanup:
443     debug(D_WEB_CLIENT, "STREAM %s [send]: sending thread exits.", host->hostname);
444
445     if(pthread_setcancelstate(PTHREAD_CANCEL_DISABLE, NULL) != 0)
446         error("STREAM %s [send]: cannot set pthread cancel state to DISABLE.", host->hostname);
447
448     rrdpush_lock(host);
449     rrdhost_wrlock(host);
450     rrdpush_sender_thread_cleanup_locked_all(host);
451     rrdhost_unlock(host);
452     rrdpush_unlock(host);
453
454     if(pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, NULL) != 0)
455         error("STREAM %s [send]: cannot set pthread cancel state to ENABLE.", host->hostname);
456     
457     pthread_exit(NULL);
458     return NULL;
459 }
460
461
462 // ----------------------------------------------------------------------------
463 // rrdpush receiver thread
464
465 int rrdpush_receive(int fd, const char *key, const char *hostname, const char *machine_guid, const char *os, int update_every, char *client_ip, char *client_port) {
466     RRDHOST *host;
467     int history = default_rrd_history_entries;
468     RRD_MEMORY_MODE mode = default_rrd_memory_mode;
469     int health_enabled = default_health_enabled;
470     int rrdpush_enabled = default_rrdpush_enabled;
471     char *rrdpush_destination = default_rrdpush_destination;
472     char *rrdpush_api_key = default_rrdpush_api_key;
473     time_t alarms_delay = 60;
474
475     update_every = (int)appconfig_get_number(&stream_config, machine_guid, "update every", update_every);
476     if(update_every < 0) update_every = 1;
477
478     history = (int)appconfig_get_number(&stream_config, key, "default history", history);
479     history = (int)appconfig_get_number(&stream_config, machine_guid, "history", history);
480     if(history < 5) history = 5;
481
482     mode = rrd_memory_mode_id(appconfig_get(&stream_config, key, "default memory mode", rrd_memory_mode_name(mode)));
483     mode = rrd_memory_mode_id(appconfig_get(&stream_config, machine_guid, "memory mode", rrd_memory_mode_name(mode)));
484
485     health_enabled = appconfig_get_boolean_ondemand(&stream_config, key, "health enabled by default", health_enabled);
486     health_enabled = appconfig_get_boolean_ondemand(&stream_config, machine_guid, "health enabled", health_enabled);
487
488     alarms_delay = appconfig_get_number(&stream_config, key, "default postpone alarms on connect seconds", alarms_delay);
489     alarms_delay = appconfig_get_number(&stream_config, machine_guid, "postpone alarms on connect seconds", alarms_delay);
490
491     rrdpush_enabled = appconfig_get_boolean(&stream_config, key, "default proxy enabled", rrdpush_enabled);
492     rrdpush_enabled = appconfig_get_boolean(&stream_config, machine_guid, "proxy enabled", rrdpush_enabled);
493
494     rrdpush_destination = appconfig_get(&stream_config, key, "default proxy destination", rrdpush_destination);
495     rrdpush_destination = appconfig_get(&stream_config, machine_guid, "proxy destination", rrdpush_destination);
496
497     rrdpush_api_key = appconfig_get(&stream_config, key, "default proxy api key", rrdpush_api_key);
498     rrdpush_api_key = appconfig_get(&stream_config, machine_guid, "proxy api key", rrdpush_api_key);
499
500     if(!strcmp(machine_guid, "localhost"))
501         host = localhost;
502     else
503         host = rrdhost_find_or_create(
504                 hostname
505                 , machine_guid
506                 , os
507                 , update_every
508                 , history
509                 , mode
510                 , (health_enabled != CONFIG_BOOLEAN_NO)
511                 , (rrdpush_enabled && rrdpush_destination && *rrdpush_destination && rrdpush_api_key && *rrdpush_api_key)
512                 , rrdpush_destination
513                 , rrdpush_api_key
514         );
515
516     if(!host) {
517         close(fd);
518         error("STREAM %s [receive from [%s]:%s]: failed to find/create host structure.", hostname, client_ip, client_port);
519         return 1;
520     }
521
522 #ifdef NETDATA_INTERNAL_CHECKS
523     info("STREAM %s [receive from [%s]:%s]: client willing to stream metrics for host '%s' with machine_guid '%s': update every = %d, history = %d, memory mode = %s, health %s"
524          , hostname
525          , client_ip
526          , client_port
527          , host->hostname
528          , host->machine_guid
529          , host->rrd_update_every
530          , host->rrd_history_entries
531          , rrd_memory_mode_name(host->rrd_memory_mode)
532          , (health_enabled == CONFIG_BOOLEAN_NO)?"disabled":((health_enabled == CONFIG_BOOLEAN_YES)?"enabled":"auto")
533     );
534 #endif // NETDATA_INTERNAL_CHECKS
535
536     struct plugind cd = {
537             .enabled = 1,
538             .update_every = default_rrd_update_every,
539             .pid = 0,
540             .serial_failures = 0,
541             .successful_collections = 0,
542             .obsolete = 0,
543             .started_t = now_realtime_sec(),
544             .next = NULL,
545     };
546
547     // put the client IP and port into the buffers used by plugins.d
548     snprintfz(cd.id,           CONFIG_MAX_NAME,  "%s:%s", client_ip, client_port);
549     snprintfz(cd.filename,     FILENAME_MAX,     "%s:%s", client_ip, client_port);
550     snprintfz(cd.fullfilename, FILENAME_MAX,     "%s:%s", client_ip, client_port);
551     snprintfz(cd.cmd,          PLUGINSD_CMD_MAX, "%s:%s", client_ip, client_port);
552
553     info("STREAM %s [receive from [%s]:%s]: initializing communication...", host->hostname, client_ip, client_port);
554     if(send_timeout(fd, START_STREAMING_PROMPT, strlen(START_STREAMING_PROMPT), 0, 60) != strlen(START_STREAMING_PROMPT)) {
555         error("STREAM %s [receive from [%s]:%s]: cannot send ready command.", host->hostname, client_ip, client_port);
556         close(fd);
557         return 0;
558     }
559
560     // remove the non-blocking flag from the socket
561     if(fcntl(fd, F_SETFL, fcntl(fd, F_GETFL, 0) & ~O_NONBLOCK) == -1)
562         error("STREAM %s [receive from [%s]:%s]: cannot remove the non-blocking flag from socket %d", host->hostname, client_ip, client_port, fd);
563
564     // convert the socket to a FILE *
565     FILE *fp = fdopen(fd, "r");
566     if(!fp) {
567         error("STREAM %s [receive from [%s]:%s]: failed to get a FILE for FD %d.", host->hostname, client_ip, client_port, fd);
568         close(fd);
569         return 0;
570     }
571
572     rrdhost_wrlock(host);
573     host->connected_senders++;
574     if(health_enabled != CONFIG_BOOLEAN_NO)
575         host->health_delay_up_to = now_realtime_sec() + alarms_delay;
576     rrdhost_unlock(host);
577
578     // call the plugins.d processor to receive the metrics
579     info("STREAM %s [receive from [%s]:%s]: receiving metrics...", host->hostname, client_ip, client_port);
580     size_t count = pluginsd_process(host, &cd, fp, 1);
581     error("STREAM %s [receive from [%s]:%s]: disconnected (completed updates %zu).", host->hostname, client_ip, client_port, count);
582
583     rrdhost_wrlock(host);
584     host->connected_senders--;
585     if(!host->connected_senders) {
586         if(health_enabled == CONFIG_BOOLEAN_AUTO)
587             host->health_enabled = 0;
588
589         host->senders_disconnected_time = now_realtime_sec();
590     }
591     rrdhost_unlock(host);
592
593     rrdpush_sender_thread_stop(host);
594
595     // cleanup
596     fclose(fp);
597
598     return (int)count;
599 }
600
// the arguments handed to a receiver thread
// rrdpush_receiver_thread() frees the strings and the structure itself
struct rrdpush_thread {
    int fd;                 // the socket of the streaming client
    char *key;              // the API key of the request
    char *hostname;         // the hostname of the sending netdata
    char *machine_guid;     // the machine GUID of the sending netdata
    char *os;               // the operating system of the sending netdata
    char *client_ip;        // the IP of the streaming client
    char *client_port;      // the port of the streaming client
    int update_every;       // the update frequency given in the request
};
611
612 void *rrdpush_receiver_thread(void *ptr) {
613     struct rrdpush_thread *rpt = (struct rrdpush_thread *)ptr;
614
615     if (pthread_setcanceltype(PTHREAD_CANCEL_DEFERRED, NULL) != 0)
616         error("STREAM %s [receive]: cannot set pthread cancel type to DEFERRED.", rpt->hostname);
617
618     if (pthread_setcancelstate(PTHREAD_CANCEL_ENABLE, NULL) != 0)
619         error("STREAM %s [receive]: cannot set pthread cancel state to ENABLE.", rpt->hostname);
620
621
622     info("STREAM %s [%s]:%s: receive thread created (task id %d)", rpt->hostname, rpt->client_ip, rpt->client_port, gettid());
623     rrdpush_receive(rpt->fd, rpt->key, rpt->hostname, rpt->machine_guid, rpt->os, rpt->update_every, rpt->client_ip, rpt->client_port);
624     info("STREAM %s [receive from [%s]:%s]: receive thread ended (task id %d)", rpt->hostname, rpt->client_ip, rpt->client_port, gettid());
625
626     freez(rpt->key);
627     freez(rpt->hostname);
628     freez(rpt->machine_guid);
629     freez(rpt->os);
630     freez(rpt->client_ip);
631     freez(rpt->client_port);
632     freez(rpt);
633
634     pthread_exit(NULL);
635     return NULL;
636 }
637
638 void rrdpush_sender_thread_spawn(RRDHOST *host) {
639     rrdhost_wrlock(host);
640
641     if(!host->rrdpush_spawn) {
642         if(pthread_create(&host->rrdpush_thread, NULL, rrdpush_sender_thread, (void *) host))
643             error("STREAM %s [send]: failed to create new thread for client.", host->hostname);
644
645         else if(pthread_detach(host->rrdpush_thread))
646             error("STREAM %s [send]: cannot request detach newly created thread.", host->hostname);
647
648         host->rrdpush_spawn = 1;
649     }
650
651     rrdhost_unlock(host);
652 }
653
654 int rrdpush_receiver_thread_spawn(RRDHOST *host, struct web_client *w, char *url) {
655     (void)host;
656
657     info("STREAM [receive from [%s]:%s]: new client connection.", w->client_ip, w->client_port);
658
659     char *key = NULL, *hostname = NULL, *machine_guid = NULL, *os = "unknown";
660     int update_every = default_rrd_update_every;
661     char buf[GUID_LEN + 1];
662
663     while(url) {
664         char *value = mystrsep(&url, "?&");
665         if(!value || !*value) continue;
666
667         char *name = mystrsep(&value, "=");
668         if(!name || !*name) continue;
669         if(!value || !*value) continue;
670
671         if(!strcmp(name, "key"))
672             key = value;
673         else if(!strcmp(name, "hostname"))
674             hostname = value;
675         else if(!strcmp(name, "machine_guid"))
676             machine_guid = value;
677         else if(!strcmp(name, "update_every"))
678             update_every = (int)strtoul(value, NULL, 0);
679         else if(!strcmp(name, "os"))
680             os = value;
681     }
682
683     if(!key || !*key) {
684         error("STREAM [receive from [%s]:%s]: request without an API key. Forbidding access.", w->client_ip, w->client_port);
685         buffer_flush(w->response.data);
686         buffer_sprintf(w->response.data, "You need an API key for this request.");
687         return 401;
688     }
689
690     if(!hostname || !*hostname) {
691         error("STREAM [receive from [%s]:%s]: request without a hostname. Forbidding access.", w->client_ip, w->client_port);
692         buffer_flush(w->response.data);
693         buffer_sprintf(w->response.data, "You need to send a hostname too.");
694         return 400;
695     }
696
697     if(!machine_guid || !*machine_guid) {
698         error("STREAM [receive from [%s]:%s]: request without a machine GUID. Forbidding access.", w->client_ip, w->client_port);
699         buffer_flush(w->response.data);
700         buffer_sprintf(w->response.data, "You need to send a machine GUID too.");
701         return 400;
702     }
703
704     if(regenerate_guid(key, buf) == -1) {
705         error("STREAM [receive from [%s]:%s]: API key '%s' is not valid GUID. Forbidding access.", w->client_ip, w->client_port, key);
706         buffer_flush(w->response.data);
707         buffer_sprintf(w->response.data, "Your API key is invalid.");
708         return 401;
709     }
710
711     if(regenerate_guid(machine_guid, buf) == -1) {
712         error("STREAM [receive from [%s]:%s]: machine GUID '%s' is not GUID. Forbidding access.", w->client_ip, w->client_port, key);
713         buffer_flush(w->response.data);
714         buffer_sprintf(w->response.data, "Your machine GUID is invalid.");
715         return 404;
716     }
717
718     if(!appconfig_get_boolean(&stream_config, key, "enabled", 0)) {
719         error("STREAM [receive from [%s]:%s]: API key '%s' is not allowed. Forbidding access.", w->client_ip, w->client_port, machine_guid);
720         buffer_flush(w->response.data);
721         buffer_sprintf(w->response.data, "Your API key is not permitted access.");
722         return 401;
723     }
724
725     if(!appconfig_get_boolean(&stream_config, machine_guid, "enabled", 1)) {
726         error("STREAM [receive from [%s]:%s]: machine GUID '%s' is not allowed. Forbidding access.", w->client_ip, w->client_port, machine_guid);
727         buffer_flush(w->response.data);
728         buffer_sprintf(w->response.data, "Your machine guide is not permitted access.");
729         return 404;
730     }
731
732     struct rrdpush_thread *rpt = mallocz(sizeof(struct rrdpush_thread));
733     rpt->fd           = w->ifd;
734     rpt->key          = strdupz(key);
735     rpt->hostname     = strdupz(hostname);
736     rpt->machine_guid = strdupz(machine_guid);
737     rpt->os           = strdupz(os);
738     rpt->client_ip    = strdupz(w->client_ip);
739     rpt->client_port  = strdupz(w->client_port);
740     rpt->update_every = update_every;
741     pthread_t thread;
742
743     debug(D_SYSTEM, "STREAM [receive from [%s]:%s]: starting receiving thread.", w->client_ip, w->client_port);
744
745     if(pthread_create(&thread, NULL, rrdpush_receiver_thread, (void *)rpt))
746         error("STREAM [receive from [%s]:%s]: failed to create new thread for client.", w->client_ip, w->client_port);
747
748     else if(pthread_detach(thread))
749         error("STREAM [receive from [%s]:%s]: cannot request detach newly created thread.", w->client_ip, w->client_port);
750
751     // prevent the caller from closing the streaming socket
752     if(w->ifd == w->ofd)
753         w->ifd = w->ofd = -1;
754     else
755         w->ifd = -1;
756
757     buffer_flush(w->response.data);
758     return 200;
759 }