858a6d0867000bf9ec9fcb456fa66f621bd4544d
[cubemap] / main.cpp
1 #include <assert.h>
2 #include <errno.h>
3 #include <getopt.h>
4 #include <limits.h>
5 #include <signal.h>
6 #include <stddef.h>
7 #include <stdio.h>
8 #include <stdlib.h>
9 #include <string.h>
10 #include <sys/time.h>
11 #include <sys/wait.h>
12 #include <systemd/sd-daemon.h>
13 #include <unistd.h>
14 #include <algorithm>
15 #include <map>
16 #include <set>
17 #include <string>
18 #include <utility>
19 #include <vector>
20
21 #include "tlse.h"
22
23 #include "acceptor.h"
24 #include "accesslog.h"
25 #include "config.h"
26 #include "input.h"
27 #include "input_stats.h"
28 #include "log.h"
29 #include "sa_compare.h"
30 #include "serverpool.h"
31 #include "state.pb.h"
32 #include "stats.h"
33 #include "stream.h"
34 #include "util.h"
35 #include "version.h"
36
37 using namespace std;
38
39 AccessLogThread *access_log = nullptr;
40 ServerPool *servers = nullptr;
41 volatile bool hupped = false;
42 volatile bool stopped = false;
43
44 typedef pair<string, Input::Encoding> InputKey;
45
46 namespace {
47
48 struct OrderByConnectionTime {
49         bool operator() (const ClientProto &a, const ClientProto &b) const {
50                 if (a.connect_time_sec() != b.connect_time_sec())
51                         return a.connect_time_sec() < b.connect_time_sec();
52                 return a.connect_time_nsec() < b.connect_time_nsec();
53         }
54 };
55
56 // An arbitrary ordering.
57 struct AcceptorConfigCompare {
58         bool operator() (const AcceptorConfig &a, const AcceptorConfig &b) const {
59                 int cmp = a.certificate_chain.compare(b.certificate_chain);
60                 if (cmp != 0) {
61                         return cmp < 0;
62                 }
63
64                 cmp = a.private_key.compare(b.private_key);
65                 if (cmp != 0) {
66                         return cmp < 0;
67                 }
68
69                 return Sockaddr6Compare()(a.addr, b.addr);
70         }
71 };
72
73 }  // namespace
74
75 struct InputWithRefcount {
76         Input *input;
77         int refcount;
78 };
79
80 void hup(int signum)
81 {
82         hupped = true;
83         if (signum == SIGINT) {
84                 stopped = true;
85         }
86 }
87
// Signal handler that deliberately ignores the signal it receives.
void do_nothing(int signum)
{
	(void)signum;  // Intentionally unused.
}
91
92 CubemapStateProto collect_state(const timespec &serialize_start,
93                                 const vector<Acceptor *> acceptors,
94                                 const multimap<InputKey, InputWithRefcount> inputs,
95                                 ServerPool *servers)
96 {
97         CubemapStateProto state = servers->serialize();  // Fills streams() and clients().
98         state.set_serialize_start_sec(serialize_start.tv_sec);
99         state.set_serialize_start_usec(serialize_start.tv_nsec / 1000);
100
101         for (Acceptor *acceptor : acceptors) {  
102                 state.add_acceptors()->MergeFrom(acceptor->serialize());
103         }
104
105         for (const auto &key_and_input_with_refcount : inputs) {
106                 state.add_inputs()->MergeFrom(key_and_input_with_refcount.second.input->serialize());
107         }
108
109         return state;
110 }
111
112 // Find all port statements in the configuration file, and create acceptors for them.
113 vector<Acceptor *> create_acceptors(
114         const Config &config,
115         map<AcceptorConfig, Acceptor *, AcceptorConfigCompare> *deserialized_acceptors)
116 {
117         vector<Acceptor *> acceptors;
118         for (const AcceptorConfig &acceptor_config : config.acceptors) {
119                 Acceptor *acceptor = nullptr;
120                 const auto deserialized_acceptor_it = deserialized_acceptors->find(acceptor_config);
121                 if (deserialized_acceptor_it != deserialized_acceptors->end()) {
122                         acceptor = deserialized_acceptor_it->second;
123                         deserialized_acceptors->erase(deserialized_acceptor_it);
124                 } else {
125                         int server_sock = create_server_socket(acceptor_config.addr, TCP_SOCKET);
126                         acceptor = new Acceptor(server_sock, acceptor_config.addr,
127                                                 acceptor_config.certificate_chain,
128                                                 acceptor_config.private_key);
129                 }
130                 acceptor->run();
131                 acceptors.push_back(acceptor);
132         }
133
134         // Close all acceptors that are no longer in the configuration file.
135         for (auto &config_and_acceptor : *deserialized_acceptors) {
136                 config_and_acceptor.second->close_socket();
137                 delete config_and_acceptor.second;
138         }
139
140         return acceptors;
141 }
142
143 void create_config_input(const string &src, Input::Encoding encoding, multimap<InputKey, InputWithRefcount> *inputs)
144 {
145         if (src.empty()) {
146                 return;
147         }
148         InputKey key(src, encoding);
149         if (inputs->count(key) != 0) {
150                 return;
151         }
152
153         InputWithRefcount iwr;
154         iwr.input = create_input(src, encoding);
155         if (iwr.input == nullptr) {
156                 log(ERROR, "did not understand URL '%s' or source encoding was invalid, clients will not get any data.",
157                         src.c_str());
158                 return;
159         }
160         iwr.refcount = 0;
161         inputs->insert(make_pair(key, iwr));
162 }
163
164 // Find all streams in the configuration file, and create inputs for them.
165 void create_config_inputs(const Config &config, multimap<InputKey, InputWithRefcount> *inputs)
166 {
167         for (const StreamConfig &stream_config : config.streams) {
168                 if (stream_config.src == "delete") {
169                         // Ignored for pre-1.4.0 configuration compatibility.
170                         continue;
171                 }
172                 create_config_input(stream_config.src, Input::Encoding(stream_config.src_encoding), inputs);
173         }
174         for (const UDPStreamConfig &udpstream_config : config.udpstreams) {
175                 create_config_input(udpstream_config.src, Input::INPUT_ENCODING_RAW, inputs);
176         }
177 }
178
179 void create_streams(const Config &config,
180                     const set<string> &deserialized_urls,
181                     multimap<InputKey, InputWithRefcount> *inputs)
182 {
183         // HTTP streams.
184         set<string> expecting_urls = deserialized_urls;
185         for (const StreamConfig &stream_config : config.streams) {
186                 int stream_index;
187
188                 expecting_urls.erase(stream_config.url);
189
190                 if (stream_config.src == "delete") {
191                         // Ignored for pre-1.4.0 configuration compatibility.
192                         continue;
193                 }
194
195                 if (deserialized_urls.count(stream_config.url) == 0) {
196                         stream_index = servers->add_stream(stream_config.url,
197                                                            stream_config.backlog_size,
198                                                            stream_config.prebuffering_bytes,
199                                                            Stream::Encoding(stream_config.encoding),
200                                                            Stream::Encoding(stream_config.src_encoding));
201                 } else {
202                         stream_index = servers->lookup_stream_by_url(stream_config.url);
203                         assert(stream_index != -1);
204                         servers->set_backlog_size(stream_index, stream_config.backlog_size);
205                         servers->set_prebuffering_bytes(stream_index, stream_config.prebuffering_bytes);
206                         servers->set_encoding(stream_index,
207                                               Stream::Encoding(stream_config.encoding));
208                         servers->set_src_encoding(stream_index,
209                                                   Stream::Encoding(stream_config.src_encoding));
210                 }
211
212                 servers->set_pacing_rate(stream_index, stream_config.pacing_rate);
213
214                 string src = stream_config.src;
215                 Input::Encoding src_encoding = Input::Encoding(stream_config.src_encoding);
216                 if (!src.empty()) {
217                         const auto input_it = inputs->find(make_pair(src, src_encoding));
218                         if (input_it != inputs->end()) {
219                                 input_it->second.input->add_destination(stream_index);
220                                 ++input_it->second.refcount;
221                         }
222                 }
223         }
224
225         // Warn about any streams servers we've lost.
226         for (const string &url : expecting_urls) {
227                 log(WARNING, "stream '%s' disappeared from the configuration file. "
228                              "It will not be deleted, but clients will not get any new inputs. "
229                              "If you really meant to delete it, set src=delete and reload.",
230                              url.c_str());
231         }
232
233         // UDP streams.
234         for (const UDPStreamConfig &udpstream_config : config.udpstreams) {
235                 int stream_index = servers->add_udpstream(
236                         udpstream_config.dst,
237                         udpstream_config.pacing_rate,
238                         udpstream_config.ttl,
239                         udpstream_config.multicast_iface_index);
240
241                 string src = udpstream_config.src;
242                 if (!src.empty()) {
243                         auto input_it = inputs->find(make_pair(src, Input::INPUT_ENCODING_RAW));
244                         assert(input_it != inputs->end());
245                         input_it->second.input->add_destination(stream_index);
246                         ++input_it->second.refcount;
247                 }
248         }
249
250         // HTTP gen204 endpoints.
251         for (const Gen204Config &ping_config : config.pings) {
252                 servers->add_gen204(ping_config.url, ping_config.allow_origin);
253         }
254 }
255         
256 void open_logs(const vector<LogConfig> &log_destinations)
257 {
258         for (const LogConfig &log_destination : log_destinations) {
259                 if (log_destination.type == LogConfig::LOG_TYPE_FILE) {
260                         add_log_destination_file(log_destination.filename);
261                 } else if (log_destination.type == LogConfig::LOG_TYPE_CONSOLE) {
262                         add_log_destination_console();
263                 } else if (log_destination.type == LogConfig::LOG_TYPE_SYSLOG) {
264                         add_log_destination_syslog();
265                 } else {
266                         assert(false);
267                 }
268         }
269         start_logging();
270 }
271         
272 bool dry_run_config(const string &argv0, const string &config_filename)
273 {
274         char *argv0_copy = strdup(argv0.c_str());
275         char *config_filename_copy = strdup(config_filename.c_str());
276
277         pid_t pid = fork();
278         switch (pid) {
279         case -1:
280                 log_perror("fork()");
281                 free(argv0_copy);
282                 free(config_filename_copy);
283                 return false;
284         case 0:
285                 // Child.
286                 execlp(argv0_copy, argv0_copy, "--test-config", config_filename_copy, nullptr);
287                 log_perror(argv0_copy);
288                 _exit(1);
289         default:
290                 // Parent.
291                 break;
292         }
293                 
294         free(argv0_copy);
295         free(config_filename_copy);
296
297         int status;
298         pid_t err;
299         do {
300                 err = waitpid(pid, &status, 0);
301         } while (err == -1 && errno == EINTR);
302
303         if (err == -1) {
304                 log_perror("waitpid()");
305                 return false;
306         }       
307
308         return (WIFEXITED(status) && WEXITSTATUS(status) == 0);
309 }
310
311 void find_all_streams(const Config &config, set<string> *all_urls)
312 {
313         for (const StreamConfig &stream_config : config.streams) {
314                 if (stream_config.src == "delete") {
315                         log(WARNING, "stream '%s' has src=delete; ignoring it. Since Cubemap 1.4.0, you do not "
316                                      "need to set src=delete to delete streams anymore; just delete them from "
317                                      "the configuration file.",
318                                      stream_config.url.c_str());
319                 } else {
320                         all_urls->insert(stream_config.url);
321                 }
322         }
323 }
324
325 int main(int argc, char **argv)
326 {
327         signal(SIGHUP, hup);
328         signal(SIGINT, hup);
329         signal(SIGUSR1, do_nothing);  // Used in internal signalling.
330         signal(SIGPIPE, SIG_IGN);
331
332         tls_init();
333         
334         // Parse options.
335         int state_fd = -1;
336         bool test_config = false;
337         for ( ;; ) {
338                 static const option long_options[] = {
339                         { "state", required_argument, 0, 's' },
340                         { "test-config", no_argument, 0, 't' },
341                         { 0, 0, 0, 0 }
342                 };
343                 int option_index = 0;
344                 int c = getopt_long(argc, argv, "s:t", long_options, &option_index);
345      
346                 if (c == -1) {
347                         break;
348                 }
349                 switch (c) {
350                 case 's':
351                         state_fd = atoi(optarg);
352                         break;
353                 case 't':
354                         test_config = true;
355                         break;
356                 default:
357                         fprintf(stderr, "Unknown option '%s'\n", argv[option_index]);
358                         exit(1);
359                 }
360         }
361
362         string config_filename = "cubemap.config";
363         if (optind < argc) {
364                 config_filename = argv[optind++];
365         }
366
367         // Canonicalize argv[0] and config_filename.
368         char argv0_canon[PATH_MAX];
369         char config_filename_canon[PATH_MAX];
370
371         if (realpath("/proc/self/exe", argv0_canon) == nullptr) {
372                 log_perror(argv[0]);
373                 exit(1);
374         }
375         if (realpath(config_filename.c_str(), config_filename_canon) == nullptr) {
376                 log_perror(config_filename.c_str());
377                 exit(1);
378         }
379
380         // Now parse the configuration file.
381         Config config;
382         if (!parse_config(config_filename_canon, &config)) {
383                 exit(1);
384         }
385         if (test_config) {
386                 exit(0);
387         }
388         
389         // Ideally we'd like to daemonize only when we've started up all threads etc.,
390         // but daemon() forks, which is not good in multithreaded software, so we'll
391         // have to do it here.
392         if (config.daemonize) {
393                 if (daemon(0, 0) == -1) {
394                         log_perror("daemon");
395                         exit(1);
396                 }
397         }
398
399 start:
400         // Open logs as soon as possible.
401         open_logs(config.log_destinations);
402
403         log(INFO, "Cubemap " SERVER_VERSION " starting.");
404         if (config.access_log_file.empty()) {
405                 // Create a dummy logger.
406                 access_log = new AccessLogThread();
407         } else {
408                 access_log = new AccessLogThread(config.access_log_file);
409         }
410         access_log->run();
411
412         servers = new ServerPool(config.num_servers);
413
414         // Find all the streams that are to be kept.
415         set<string> all_urls;
416         find_all_streams(config, &all_urls);
417
418         CubemapStateProto loaded_state;
419         timespec serialize_start;
420         set<string> deserialized_urls;
421         map<AcceptorConfig, Acceptor *, AcceptorConfigCompare> deserialized_acceptors;
422         multimap<InputKey, InputWithRefcount> inputs;  // multimap due to older versions without deduplication.
423         if (state_fd != -1) {
424                 log(INFO, "Deserializing state from previous process...");
425                 string serialized;
426                 if (!read_tempfile_and_close(state_fd, &serialized)) {
427                         exit(1);
428                 }
429                 if (!loaded_state.ParseFromString(serialized)) {
430                         log(ERROR, "Failed deserialization of state.");
431                         exit(1);
432                 }
433
434                 serialize_start.tv_sec = loaded_state.serialize_start_sec();
435                 serialize_start.tv_nsec = loaded_state.serialize_start_usec() * 1000ull;
436
437                 // Deserialize the streams.
438                 map<string, string> stream_headers_for_url;  // See below.
439                 for (const StreamProto &stream : loaded_state.streams()) {
440                         if (all_urls.count(stream.url()) == 0) {
441                                 // Delete the stream backlogs.
442                                 log(INFO, "Deleting stream '%s'.", stream.url().c_str());
443                                 for (const int fd : stream.data_fds()) {
444                                         safe_close(fd);
445                                 }
446                         } else {
447                                 vector<int> data_fds;
448                                 for (const int fd : stream.data_fds()) {
449                                         data_fds.push_back(fd);
450                                 }
451
452                                 servers->add_stream_from_serialized(stream, data_fds);
453                                 deserialized_urls.insert(stream.url());
454
455                                 stream_headers_for_url.insert(make_pair(stream.url(), stream.stream_header()));
456                         }
457                 }
458
459                 // Deserialize the inputs. Note that we don't actually add them to any stream yet.
460                 for (const InputProto &serialized_input : loaded_state.inputs()) {
461                         InputWithRefcount iwr;
462                         iwr.input = create_input(serialized_input);
463                         iwr.refcount = 0;
464
465                         Input::Encoding src_encoding = serialized_input.is_metacube_encoded() ?
466                                 Input::INPUT_ENCODING_METACUBE :
467                                 Input::INPUT_ENCODING_RAW;
468                         InputKey key(serialized_input.url(), src_encoding);
469                         inputs.insert(make_pair(key, iwr));
470                 } 
471
472                 // Deserialize the acceptors.
473                 for (const AcceptorProto &serialized_acceptor : loaded_state.acceptors()) {
474                         AcceptorConfig config;
475                         config.addr = extract_address_from_acceptor_proto(serialized_acceptor);
476                         config.certificate_chain = serialized_acceptor.certificate_chain();
477                         config.private_key = serialized_acceptor.private_key();
478                         deserialized_acceptors.insert(make_pair(
479                                 config,
480                                 new Acceptor(serialized_acceptor)));
481                 }
482
483                 log(INFO, "Deserialization done.");
484         }
485
486         // Add any new inputs coming from the config.
487         create_config_inputs(config, &inputs);
488         
489         // Find all streams in the configuration file, create them, and connect to the inputs.
490         create_streams(config, deserialized_urls, &inputs);
491         vector<Acceptor *> acceptors = create_acceptors(config, &deserialized_acceptors);
492
493         // Make all the servers create TLS contexts for every TLS keypair we have.
494         for (Acceptor *acceptor : acceptors) {
495                 if (acceptor->is_tls()) {
496                         servers->create_tls_context_for_acceptor(acceptor);
497                 }
498         }
499         
500         // Put back the existing clients. It doesn't matter which server we
501         // allocate them to, so just do round-robin. However, we need to sort them
502         // by connection time first, since add_client_serialized() expects that.
503         sort(loaded_state.mutable_clients()->begin(),
504              loaded_state.mutable_clients()->end(),
505              OrderByConnectionTime());
506         for (int i = 0; i < loaded_state.clients_size(); ++i) {
507                 if (all_urls.count(loaded_state.clients(i).url()) == 0) {
508                         safe_close(loaded_state.clients(i).sock());
509                 } else {
510                         servers->add_client_from_serialized(loaded_state.clients(i));
511                 }
512         }
513         
514         servers->run();
515
516         // Now delete all inputs that are longer in use, and start the others.
517         for (auto input_it = inputs.begin(); input_it != inputs.end(); ) {
518                 if (input_it->second.refcount == 0) {
519                         if (input_it->first.second == Input::INPUT_ENCODING_RAW) {
520                                 log(WARNING, "Raw input '%s' no longer in use, closing.",
521                                     input_it->first.first.c_str());
522                         } else {
523                                 assert(input_it->first.second == Input::INPUT_ENCODING_METACUBE);
524                                 log(WARNING, "Metacube input '%s' no longer in use, closing.",
525                                     input_it->first.first.c_str());
526                         }
527                         input_it->second.input->close_socket();
528                         delete input_it->second.input;
529                         inputs.erase(input_it++);
530                 } else {
531                         input_it->second.input->run();
532                         ++input_it;
533                 }
534         }
535
536         // Start writing statistics.
537         unique_ptr<StatsThread> stats_thread;
538         if (!config.stats_file.empty()) {
539                 stats_thread.reset(new StatsThread(config.stats_file, config.stats_interval));
540                 stats_thread->run();
541         }
542
543         unique_ptr<InputStatsThread> input_stats_thread;
544         if (!config.input_stats_file.empty()) {
545                 vector<Input*> inputs_no_refcount;
546                 for (const auto &key_and_input_with_refcount : inputs) {
547                         inputs_no_refcount.push_back(key_and_input_with_refcount.second.input);
548                 }
549
550                 input_stats_thread.reset(new InputStatsThread(config.input_stats_file, config.input_stats_interval, inputs_no_refcount));
551                 input_stats_thread->run();
552         }
553
554         timespec server_start;
555         int err = clock_gettime(CLOCK_MONOTONIC, &server_start);
556         assert(err != -1);
557         if (state_fd != -1) {
558                 // Measure time from we started deserializing (below) to now, when basically everything
559                 // is up and running. This is, in other words, a conservative estimate of how long our
560                 // “glitch” period was, not counting of course reconnects if the configuration changed.
561                 double glitch_time = server_start.tv_sec - serialize_start.tv_sec +
562                         1e-9 * (server_start.tv_nsec - serialize_start.tv_nsec);
563                 log(INFO, "Re-exec happened in approx. %.0f ms.", glitch_time * 1000.0);
564         }
565
566         sd_notify(0, "READY=1");
567
568         while (!hupped) {
569                 usleep(100000);
570         }
571
572         if (stopped) {
573                 sd_notify(0, "STOPPING=1");
574         } else {
575                 sd_notify(0, "RELOADING=1");
576         }
577
578         // OK, we've been HUPed. Time to shut down everything, serialize, and re-exec.
579         err = clock_gettime(CLOCK_MONOTONIC, &serialize_start);
580         assert(err != -1);
581
582         if (input_stats_thread != nullptr) {
583                 input_stats_thread->stop();
584                 input_stats_thread.reset();
585         }
586         if (stats_thread != nullptr) {
587                 stats_thread->stop();
588                 stats_thread.reset();
589         }
590         for (Acceptor *acceptor : acceptors) {
591                 acceptor->stop();
592         }
593         for (const auto &key_and_input_with_refcount : inputs) {
594                 key_and_input_with_refcount.second.input->stop();
595         }
596         servers->stop();
597
598         CubemapStateProto state;
599         if (stopped) {
600                 log(INFO, "Shutting down.");
601         } else {
602                 log(INFO, "Serializing state and re-execing...");
603                 state = collect_state(
604                         serialize_start, acceptors, inputs, servers);
605                 string serialized;
606                 state.SerializeToString(&serialized);
607                 state_fd = make_tempfile(serialized);
608                 if (state_fd == -1) {
609                         exit(1);
610                 }
611         }
612         delete servers;
613
614         access_log->stop();
615         delete access_log;
616         shut_down_logging();
617
618         if (stopped) {
619                 exit(0);
620         }
621
622         // OK, so the signal was SIGHUP. Check that the new config is okay, then exec the new binary.
623         if (!dry_run_config(argv0_canon, config_filename_canon)) {
624                 open_logs(config.log_destinations);
625                 log(ERROR, "%s --test-config failed. Restarting old version instead of new.", argv[0]);
626                 hupped = false;
627                 shut_down_logging();
628                 goto start;
629         }
630          
631         char buf[16];
632         sprintf(buf, "%d", state_fd);
633
634         for ( ;; ) {
635                 execlp(argv0_canon, argv0_canon, config_filename_canon, "--state", buf, nullptr);
636                 open_logs(config.log_destinations);
637                 log_perror("execlp");
638                 log(ERROR, "re-exec of %s failed. Waiting 0.2 seconds and trying again...", argv0_canon);
639                 shut_down_logging();
640                 usleep(200000);
641         }
642 }