c208b2d19f381146df11e3322f86a4c34302862a
[cubemap] / main.cpp
1 #include <assert.h>
2 #include <errno.h>
3 #include <getopt.h>
4 #include <limits.h>
5 #include <signal.h>
6 #include <stddef.h>
7 #include <stdio.h>
8 #include <stdlib.h>
9 #include <string.h>
10 #include <sys/time.h>
11 #include <sys/wait.h>
12 #include <systemd/sd-daemon.h>
13 #include <unistd.h>
14 #include <algorithm>
15 #include <map>
16 #include <set>
17 #include <string>
18 #include <utility>
19 #include <vector>
20
21 #include "tlse.h"
22
23 #include "acceptor.h"
24 #include "accesslog.h"
25 #include "config.h"
26 #include "input.h"
27 #include "input_stats.h"
28 #include "log.h"
29 #include "sa_compare.h"
30 #include "serverpool.h"
31 #include "state.pb.h"
32 #include "stats.h"
33 #include "stream.h"
34 #include "util.h"
35 #include "version.h"
36
37 using namespace std;
38
39 AccessLogThread *access_log = NULL;
40 ServerPool *servers = NULL;
41 volatile bool hupped = false;
42 volatile bool stopped = false;
43
44 typedef pair<string, Input::Encoding> InputKey;
45
46 namespace {
47
48 struct OrderByConnectionTime {
49         bool operator() (const ClientProto &a, const ClientProto &b) const {
50                 if (a.connect_time_sec() != b.connect_time_sec())
51                         return a.connect_time_sec() < b.connect_time_sec();
52                 return a.connect_time_nsec() < b.connect_time_nsec();
53         }
54 };
55
56 // An arbitrary ordering.
57 struct AcceptorConfigCompare {
58         bool operator() (const AcceptorConfig &a, const AcceptorConfig &b) const {
59                 int cmp = a.certificate_chain.compare(b.certificate_chain);
60                 if (cmp != 0) {
61                         return cmp < 0;
62                 }
63
64                 cmp = a.private_key.compare(b.private_key);
65                 if (cmp != 0) {
66                         return cmp < 0;
67                 }
68
69                 return Sockaddr6Compare()(a.addr, b.addr);
70         }
71 };
72
73 }  // namespace
74
// An input together with the number of streams it has been attached to.
struct InputWithRefcount {
        // The input itself; main() deletes it if it ends up unused.
        Input *input;
        // Incremented by create_streams() for every destination added to the
        // input. Inputs still at zero after that are closed and deleted by main().
        int refcount;
};
79
80 void hup(int signum)
81 {
82         hupped = true;
83         if (signum == SIGINT) {
84                 stopped = true;
85         }
86 }
87
// Deliberately empty signal handler. main() installs it for SIGUSR1, which is
// used for internal signalling.
void do_nothing(int signum)
{
        (void)signum;  // Intentionally unused.
}
91
92 CubemapStateProto collect_state(const timespec &serialize_start,
93                                 const vector<Acceptor *> acceptors,
94                                 const multimap<InputKey, InputWithRefcount> inputs,
95                                 ServerPool *servers)
96 {
97         CubemapStateProto state = servers->serialize();  // Fills streams() and clients().
98         state.set_serialize_start_sec(serialize_start.tv_sec);
99         state.set_serialize_start_usec(serialize_start.tv_nsec / 1000);
100
101         for (Acceptor *acceptor : acceptors) {  
102                 state.add_acceptors()->MergeFrom(acceptor->serialize());
103         }
104
105         for (const auto &key_and_input_with_refcount : inputs) {
106                 state.add_inputs()->MergeFrom(key_and_input_with_refcount.second.input->serialize());
107         }
108
109         return state;
110 }
111
112 // Find all port statements in the configuration file, and create acceptors for them.
113 vector<Acceptor *> create_acceptors(
114         const Config &config,
115         map<AcceptorConfig, Acceptor *, AcceptorConfigCompare> *deserialized_acceptors)
116 {
117         vector<Acceptor *> acceptors;
118         for (const AcceptorConfig &acceptor_config : config.acceptors) {
119                 Acceptor *acceptor = NULL;
120                 const auto deserialized_acceptor_it = deserialized_acceptors->find(acceptor_config);
121                 if (deserialized_acceptor_it != deserialized_acceptors->end()) {
122                         acceptor = deserialized_acceptor_it->second;
123                         deserialized_acceptors->erase(deserialized_acceptor_it);
124                 } else {
125                         int server_sock = create_server_socket(acceptor_config.addr, TCP_SOCKET);
126                         acceptor = new Acceptor(server_sock, acceptor_config.addr,
127                                                 acceptor_config.certificate_chain,
128                                                 acceptor_config.private_key);
129                 }
130                 acceptor->run();
131                 acceptors.push_back(acceptor);
132         }
133
134         // Close all acceptors that are no longer in the configuration file.
135         for (auto &config_and_acceptor : *deserialized_acceptors) {
136                 config_and_acceptor.second->close_socket();
137                 delete config_and_acceptor.second;
138         }
139
140         return acceptors;
141 }
142
143 void create_config_input(const string &src, Input::Encoding encoding, multimap<InputKey, InputWithRefcount> *inputs)
144 {
145         if (src.empty()) {
146                 return;
147         }
148         InputKey key(src, encoding);
149         if (inputs->count(key) != 0) {
150                 return;
151         }
152
153         InputWithRefcount iwr;
154         iwr.input = create_input(src, encoding);
155         if (iwr.input == NULL) {
156                 log(ERROR, "did not understand URL '%s' or source encoding was invalid, clients will not get any data.",
157                         src.c_str());
158                 return;
159         }
160         iwr.refcount = 0;
161         inputs->insert(make_pair(key, iwr));
162 }
163
164 // Find all streams in the configuration file, and create inputs for them.
165 void create_config_inputs(const Config &config, multimap<InputKey, InputWithRefcount> *inputs)
166 {
167         for (const StreamConfig &stream_config : config.streams) {
168                 if (stream_config.src != "delete") {
169                         create_config_input(stream_config.src, Input::Encoding(stream_config.src_encoding), inputs);
170                 }
171         }
172         for (const UDPStreamConfig &udpstream_config : config.udpstreams) {
173                 create_config_input(udpstream_config.src, Input::INPUT_ENCODING_RAW, inputs);
174         }
175 }
176
177 void create_streams(const Config &config,
178                     const set<string> &deserialized_urls,
179                     multimap<InputKey, InputWithRefcount> *inputs)
180 {
181         // HTTP streams.
182         set<string> expecting_urls = deserialized_urls;
183         for (const StreamConfig &stream_config : config.streams) {
184                 int stream_index;
185
186                 expecting_urls.erase(stream_config.url);
187
188                 // Special-case deleted streams; they were never deserialized in the first place,
189                 // so just ignore them.
190                 if (stream_config.src == "delete") {
191                         continue;
192                 }
193
194                 if (deserialized_urls.count(stream_config.url) == 0) {
195                         stream_index = servers->add_stream(stream_config.url,
196                                                            stream_config.backlog_size,
197                                                            stream_config.prebuffering_bytes,
198                                                            Stream::Encoding(stream_config.encoding),
199                                                            Stream::Encoding(stream_config.src_encoding));
200                 } else {
201                         stream_index = servers->lookup_stream_by_url(stream_config.url);
202                         assert(stream_index != -1);
203                         servers->set_backlog_size(stream_index, stream_config.backlog_size);
204                         servers->set_prebuffering_bytes(stream_index, stream_config.prebuffering_bytes);
205                         servers->set_encoding(stream_index,
206                                               Stream::Encoding(stream_config.encoding));
207                         servers->set_src_encoding(stream_index,
208                                                   Stream::Encoding(stream_config.src_encoding));
209                 }
210
211                 servers->set_pacing_rate(stream_index, stream_config.pacing_rate);
212
213                 string src = stream_config.src;
214                 Input::Encoding src_encoding = Input::Encoding(stream_config.src_encoding);
215                 if (!src.empty()) {
216                         const auto input_it = inputs->find(make_pair(src, src_encoding));
217                         if (input_it != inputs->end()) {
218                                 input_it->second.input->add_destination(stream_index);
219                                 ++input_it->second.refcount;
220                         }
221                 }
222         }
223
224         // Warn about any streams servers we've lost.
225         for (const string &url : expecting_urls) {
226                 log(WARNING, "stream '%s' disappeared from the configuration file. "
227                              "It will not be deleted, but clients will not get any new inputs. "
228                              "If you really meant to delete it, set src=delete and reload.",
229                              url.c_str());
230         }
231
232         // UDP streams.
233         for (const UDPStreamConfig &udpstream_config : config.udpstreams) {
234                 int stream_index = servers->add_udpstream(
235                         udpstream_config.dst,
236                         udpstream_config.pacing_rate,
237                         udpstream_config.ttl,
238                         udpstream_config.multicast_iface_index);
239
240                 string src = udpstream_config.src;
241                 if (!src.empty()) {
242                         auto input_it = inputs->find(make_pair(src, Input::INPUT_ENCODING_RAW));
243                         assert(input_it != inputs->end());
244                         input_it->second.input->add_destination(stream_index);
245                         ++input_it->second.refcount;
246                 }
247         }
248
249         // HTTP gen204 endpoints.
250         for (const Gen204Config &ping_config : config.pings) {
251                 servers->add_gen204(ping_config.url, ping_config.allow_origin);
252         }
253 }
254         
255 void open_logs(const vector<LogConfig> &log_destinations)
256 {
257         for (const LogConfig &log_destination : log_destinations) {
258                 if (log_destination.type == LogConfig::LOG_TYPE_FILE) {
259                         add_log_destination_file(log_destination.filename);
260                 } else if (log_destination.type == LogConfig::LOG_TYPE_CONSOLE) {
261                         add_log_destination_console();
262                 } else if (log_destination.type == LogConfig::LOG_TYPE_SYSLOG) {
263                         add_log_destination_syslog();
264                 } else {
265                         assert(false);
266                 }
267         }
268         start_logging();
269 }
270         
271 bool dry_run_config(const string &argv0, const string &config_filename)
272 {
273         char *argv0_copy = strdup(argv0.c_str());
274         char *config_filename_copy = strdup(config_filename.c_str());
275
276         pid_t pid = fork();
277         switch (pid) {
278         case -1:
279                 log_perror("fork()");
280                 free(argv0_copy);
281                 free(config_filename_copy);
282                 return false;
283         case 0:
284                 // Child.
285                 execlp(argv0_copy, argv0_copy, "--test-config", config_filename_copy, NULL);
286                 log_perror(argv0_copy);
287                 _exit(1);
288         default:
289                 // Parent.
290                 break;
291         }
292                 
293         free(argv0_copy);
294         free(config_filename_copy);
295
296         int status;
297         pid_t err;
298         do {
299                 err = waitpid(pid, &status, 0);
300         } while (err == -1 && errno == EINTR);
301
302         if (err == -1) {
303                 log_perror("waitpid()");
304                 return false;
305         }       
306
307         return (WIFEXITED(status) && WEXITSTATUS(status) == 0);
308 }
309
310 void find_deleted_streams(const Config &config, set<string> *deleted_urls)
311 {
312         for (const StreamConfig &stream_config : config.streams) {
313                 if (stream_config.src == "delete") {
314                         log(INFO, "Deleting stream '%s'.", stream_config.url.c_str());
315                         deleted_urls->insert(stream_config.url);
316                 }
317         }
318 }
319
320 int main(int argc, char **argv)
321 {
322         signal(SIGHUP, hup);
323         signal(SIGINT, hup);
324         signal(SIGUSR1, do_nothing);  // Used in internal signalling.
325         signal(SIGPIPE, SIG_IGN);
326
327         tls_init();
328         
329         // Parse options.
330         int state_fd = -1;
331         bool test_config = false;
332         for ( ;; ) {
333                 static const option long_options[] = {
334                         { "state", required_argument, 0, 's' },
335                         { "test-config", no_argument, 0, 't' },
336                         { 0, 0, 0, 0 }
337                 };
338                 int option_index = 0;
339                 int c = getopt_long(argc, argv, "s:t", long_options, &option_index);
340      
341                 if (c == -1) {
342                         break;
343                 }
344                 switch (c) {
345                 case 's':
346                         state_fd = atoi(optarg);
347                         break;
348                 case 't':
349                         test_config = true;
350                         break;
351                 default:
352                         fprintf(stderr, "Unknown option '%s'\n", argv[option_index]);
353                         exit(1);
354                 }
355         }
356
357         string config_filename = "cubemap.config";
358         if (optind < argc) {
359                 config_filename = argv[optind++];
360         }
361
362         // Canonicalize argv[0] and config_filename.
363         char argv0_canon[PATH_MAX];
364         char config_filename_canon[PATH_MAX];
365
366         if (realpath("/proc/self/exe", argv0_canon) == NULL) {
367                 log_perror(argv[0]);
368                 exit(1);
369         }
370         if (realpath(config_filename.c_str(), config_filename_canon) == NULL) {
371                 log_perror(config_filename.c_str());
372                 exit(1);
373         }
374
375         // Now parse the configuration file.
376         Config config;
377         if (!parse_config(config_filename_canon, &config)) {
378                 exit(1);
379         }
380         if (test_config) {
381                 exit(0);
382         }
383         
384         // Ideally we'd like to daemonize only when we've started up all threads etc.,
385         // but daemon() forks, which is not good in multithreaded software, so we'll
386         // have to do it here.
387         if (config.daemonize) {
388                 if (daemon(0, 0) == -1) {
389                         log_perror("daemon");
390                         exit(1);
391                 }
392         }
393
394 start:
395         // Open logs as soon as possible.
396         open_logs(config.log_destinations);
397
398         log(INFO, "Cubemap " SERVER_VERSION " starting.");
399         if (config.access_log_file.empty()) {
400                 // Create a dummy logger.
401                 access_log = new AccessLogThread();
402         } else {
403                 access_log = new AccessLogThread(config.access_log_file);
404         }
405         access_log->run();
406
407         servers = new ServerPool(config.num_servers);
408
409         // Find all the streams that are to be deleted.
410         set<string> deleted_urls;
411         find_deleted_streams(config, &deleted_urls);
412
413         CubemapStateProto loaded_state;
414         timespec serialize_start;
415         set<string> deserialized_urls;
416         map<AcceptorConfig, Acceptor *, AcceptorConfigCompare> deserialized_acceptors;
417         multimap<InputKey, InputWithRefcount> inputs;  // multimap due to older versions without deduplication.
418         if (state_fd != -1) {
419                 log(INFO, "Deserializing state from previous process...");
420                 string serialized;
421                 if (!read_tempfile_and_close(state_fd, &serialized)) {
422                         exit(1);
423                 }
424                 if (!loaded_state.ParseFromString(serialized)) {
425                         log(ERROR, "Failed deserialization of state.");
426                         exit(1);
427                 }
428
429                 serialize_start.tv_sec = loaded_state.serialize_start_sec();
430                 serialize_start.tv_nsec = loaded_state.serialize_start_usec() * 1000ull;
431
432                 // Deserialize the streams.
433                 map<string, string> stream_headers_for_url;  // See below.
434                 for (const StreamProto &stream : loaded_state.streams()) {
435                         if (deleted_urls.count(stream.url()) != 0) {
436                                 // Delete the stream backlogs.
437                                 for (const int fd : stream.data_fds()) {
438                                         safe_close(fd);
439                                 }
440                         } else {
441                                 vector<int> data_fds;
442                                 for (const int fd : stream.data_fds()) {
443                                         data_fds.push_back(fd);
444                                 }
445
446                                 servers->add_stream_from_serialized(stream, data_fds);
447                                 deserialized_urls.insert(stream.url());
448
449                                 stream_headers_for_url.insert(make_pair(stream.url(), stream.stream_header()));
450                         }
451                 }
452
453                 // Deserialize the inputs. Note that we don't actually add them to any stream yet.
454                 for (const InputProto &serialized_input : loaded_state.inputs()) {
455                         InputWithRefcount iwr;
456                         iwr.input = create_input(serialized_input);
457                         iwr.refcount = 0;
458
459                         Input::Encoding src_encoding = serialized_input.is_metacube_encoded() ?
460                                 Input::INPUT_ENCODING_METACUBE :
461                                 Input::INPUT_ENCODING_RAW;
462                         InputKey key(serialized_input.url(), src_encoding);
463                         inputs.insert(make_pair(key, iwr));
464                 } 
465
466                 // Deserialize the acceptors.
467                 for (const AcceptorProto &serialized_acceptor : loaded_state.acceptors()) {
468                         AcceptorConfig config;
469                         config.addr = extract_address_from_acceptor_proto(serialized_acceptor);
470                         config.certificate_chain = serialized_acceptor.certificate_chain();
471                         config.private_key = serialized_acceptor.private_key();
472                         deserialized_acceptors.insert(make_pair(
473                                 config,
474                                 new Acceptor(serialized_acceptor)));
475                 }
476
477                 log(INFO, "Deserialization done.");
478         }
479
480         // Add any new inputs coming from the config.
481         create_config_inputs(config, &inputs);
482         
483         // Find all streams in the configuration file, create them, and connect to the inputs.
484         create_streams(config, deserialized_urls, &inputs);
485         vector<Acceptor *> acceptors = create_acceptors(config, &deserialized_acceptors);
486
487         // Make all the servers create TLS contexts for every TLS keypair we have.
488         for (Acceptor *acceptor : acceptors) {
489                 if (acceptor->is_tls()) {
490                         servers->create_tls_context_for_acceptor(acceptor);
491                 }
492         }
493         
494         // Put back the existing clients. It doesn't matter which server we
495         // allocate them to, so just do round-robin. However, we need to sort them
496         // by connection time first, since add_client_serialized() expects that.
497         sort(loaded_state.mutable_clients()->begin(),
498              loaded_state.mutable_clients()->end(),
499              OrderByConnectionTime());
500         for (int i = 0; i < loaded_state.clients_size(); ++i) {
501                 if (deleted_urls.count(loaded_state.clients(i).url()) != 0) {
502                         safe_close(loaded_state.clients(i).sock());
503                 } else {
504                         servers->add_client_from_serialized(loaded_state.clients(i));
505                 }
506         }
507         
508         servers->run();
509
510         // Now delete all inputs that are longer in use, and start the others.
511         for (auto input_it = inputs.begin(); input_it != inputs.end(); ) {
512                 if (input_it->second.refcount == 0) {
513                         if (input_it->first.second == Input::INPUT_ENCODING_RAW) {
514                                 log(WARNING, "Raw input '%s' no longer in use, closing.",
515                                     input_it->first.first.c_str());
516                         } else {
517                                 assert(input_it->first.second == Input::INPUT_ENCODING_METACUBE);
518                                 log(WARNING, "Metacube input '%s' no longer in use, closing.",
519                                     input_it->first.first.c_str());
520                         }
521                         input_it->second.input->close_socket();
522                         delete input_it->second.input;
523                         inputs.erase(input_it++);
524                 } else {
525                         input_it->second.input->run();
526                         ++input_it;
527                 }
528         }
529
530         // Start writing statistics.
531         unique_ptr<StatsThread> stats_thread;
532         if (!config.stats_file.empty()) {
533                 stats_thread.reset(new StatsThread(config.stats_file, config.stats_interval));
534                 stats_thread->run();
535         }
536
537         unique_ptr<InputStatsThread> input_stats_thread;
538         if (!config.input_stats_file.empty()) {
539                 vector<Input*> inputs_no_refcount;
540                 for (const auto &key_and_input_with_refcount : inputs) {
541                         inputs_no_refcount.push_back(key_and_input_with_refcount.second.input);
542                 }
543
544                 input_stats_thread.reset(new InputStatsThread(config.input_stats_file, config.input_stats_interval, inputs_no_refcount));
545                 input_stats_thread->run();
546         }
547
548         timespec server_start;
549         int err = clock_gettime(CLOCK_MONOTONIC, &server_start);
550         assert(err != -1);
551         if (state_fd != -1) {
552                 // Measure time from we started deserializing (below) to now, when basically everything
553                 // is up and running. This is, in other words, a conservative estimate of how long our
554                 // “glitch” period was, not counting of course reconnects if the configuration changed.
555                 double glitch_time = server_start.tv_sec - serialize_start.tv_sec +
556                         1e-9 * (server_start.tv_nsec - serialize_start.tv_nsec);
557                 log(INFO, "Re-exec happened in approx. %.0f ms.", glitch_time * 1000.0);
558         }
559
560         sd_notify(0, "READY=1");
561
562         while (!hupped) {
563                 usleep(100000);
564         }
565
566         if (stopped) {
567                 sd_notify(0, "STOPPING=1");
568         } else {
569                 sd_notify(0, "RELOADING=1");
570         }
571
572         // OK, we've been HUPed. Time to shut down everything, serialize, and re-exec.
573         err = clock_gettime(CLOCK_MONOTONIC, &serialize_start);
574         assert(err != -1);
575
576         if (input_stats_thread != NULL) {
577                 input_stats_thread->stop();
578                 input_stats_thread.reset();
579         }
580         if (stats_thread != NULL) {
581                 stats_thread->stop();
582                 stats_thread.reset();
583         }
584         for (Acceptor *acceptor : acceptors) {
585                 acceptor->stop();
586         }
587         for (const auto &key_and_input_with_refcount : inputs) {
588                 key_and_input_with_refcount.second.input->stop();
589         }
590         servers->stop();
591
592         CubemapStateProto state;
593         if (stopped) {
594                 log(INFO, "Shutting down.");
595         } else {
596                 log(INFO, "Serializing state and re-execing...");
597                 state = collect_state(
598                         serialize_start, acceptors, inputs, servers);
599                 string serialized;
600                 state.SerializeToString(&serialized);
601                 state_fd = make_tempfile(serialized);
602                 if (state_fd == -1) {
603                         exit(1);
604                 }
605         }
606         delete servers;
607
608         access_log->stop();
609         delete access_log;
610         shut_down_logging();
611
612         if (stopped) {
613                 exit(0);
614         }
615
616         // OK, so the signal was SIGHUP. Check that the new config is okay, then exec the new binary.
617         if (!dry_run_config(argv0_canon, config_filename_canon)) {
618                 open_logs(config.log_destinations);
619                 log(ERROR, "%s --test-config failed. Restarting old version instead of new.", argv[0]);
620                 hupped = false;
621                 shut_down_logging();
622                 goto start;
623         }
624          
625         char buf[16];
626         sprintf(buf, "%d", state_fd);
627
628         for ( ;; ) {
629                 execlp(argv0_canon, argv0_canon, config_filename_canon, "--state", buf, NULL);
630                 open_logs(config.log_destinations);
631                 log_perror("execlp");
632                 log(ERROR, "re-exec of %s failed. Waiting 0.2 seconds and trying again...", argv0_canon);
633                 shut_down_logging();
634                 usleep(200000);
635         }
636 }