X-Git-Url: https://git.sesse.net/?a=blobdiff_plain;f=nageru%2Fvideo_encoder.cpp;h=0257d38bbfae3f271a107a936a5f66150ed620bf;hb=68271fb0bddd8a48aa036428f2928a69a5e4e660;hp=c75c4e3f365f851a0aa056fdebb3bacd7701bf9a;hpb=f0db8fcc58dd66a7dfd019f99add721d8161b75a;p=nageru diff --git a/nageru/video_encoder.cpp b/nageru/video_encoder.cpp index c75c4e3..0257d38 100644 --- a/nageru/video_encoder.cpp +++ b/nageru/video_encoder.cpp @@ -4,6 +4,9 @@ #include #include #include +#include +#include +#include #include #include @@ -12,6 +15,9 @@ extern "C" { } #include "audio_encoder.h" +#ifdef HAVE_AV1 +#include "av1_encoder.h" +#endif #include "defs.h" #include "shared/ffmpeg_raii.h" #include "flags.h" @@ -51,6 +57,10 @@ string generate_local_dump_filename(int frame) VideoEncoder::VideoEncoder(ResourcePool *resource_pool, QSurface *surface, const std::string &va_display, int width, int height, HTTPD *httpd, DiskSpaceEstimator *disk_space_estimator) : resource_pool(resource_pool), surface(surface), va_display(va_display), width(width), height(height), httpd(httpd), disk_space_estimator(disk_space_estimator) { + // TODO: If we're outputting AV1, we can't use MPEG-TS currently. + srt_oformat = av_guess_format("mpegts", nullptr, nullptr); + assert(srt_oformat != nullptr); + oformat = av_guess_format(global_flags.stream_mux_name.c_str(), nullptr, nullptr); assert(oformat != nullptr); if (global_flags.stream_audio_codec_name.empty()) { @@ -61,8 +71,14 @@ VideoEncoder::VideoEncoder(ResourcePool *resource_pool, QSurface *surface, const if (global_flags.x264_video_to_http || global_flags.x264_video_to_disk) { x264_encoder.reset(new X264Encoder(oformat, /*use_separate_disk_params=*/false)); } - X264Encoder *http_encoder = x264_encoder.get(); - X264Encoder *disk_encoder = x264_encoder.get(); + VideoCodecInterface *http_encoder = x264_encoder.get(); + VideoCodecInterface *disk_encoder = x264_encoder.get(); +#ifdef HAVE_AV1 + if (global_flags.av1_video_to_http) { + av1_encoder.reset(new AV1Encoder(oformat)); + http_encoder = av1_encoder.get(); + } +#endif if (global_flags.x264_separate_disk_encode) { x264_disk_encoder.reset(new X264Encoder(oformat, /*use_separate_disk_params=*/true)); disk_encoder = x264_disk_encoder.get(); @@ -71,16 +87,34 @@ VideoEncoder::VideoEncoder(ResourcePool *resource_pool, QSurface *surface, const string filename = generate_local_dump_filename(/*frame=*/0); quicksync_encoder.reset(new QuickSyncEncoder(filename, resource_pool, surface, va_display, width, height, oformat, http_encoder, disk_encoder, disk_space_estimator)); - open_output_stream(); - stream_audio_encoder->add_mux(stream_mux.get()); - quicksync_encoder->set_stream_mux(stream_mux.get()); + open_output_streams(); + stream_audio_encoder->add_mux(http_mux.get()); + if (srt_mux != nullptr) { + stream_audio_encoder->add_mux(srt_mux.get()); + } + quicksync_encoder->set_http_mux(http_mux.get()); + if (srt_mux != nullptr) { + quicksync_encoder->set_srt_mux(srt_mux.get()); + } if (global_flags.x264_video_to_http) { - x264_encoder->add_mux(stream_mux.get()); + x264_encoder->add_mux(http_mux.get()); + if (srt_mux != nullptr) { + x264_encoder->add_mux(srt_mux.get()); + } + } +#ifdef HAVE_AV1 + if (global_flags.av1_video_to_http) { + av1_encoder->add_mux(http_mux.get()); + if (srt_mux != nullptr) { + av1_encoder->add_mux(srt_mux.get()); + } } +#endif } VideoEncoder::~VideoEncoder() { + should_quit = true; quicksync_encoder->shutdown(); x264_encoder.reset(nullptr); x264_disk_encoder.reset(nullptr); @@ -102,7 +136,7 @@ void VideoEncoder::do_cut(int frame) // However, since this means both encoders could be sending packets at // the same time, it means pts could come out of order to the stream mux, // and we need to plug it until the shutdown is complete. - stream_mux->plug(); + http_mux->plug(); lock(qs_mu, qs_audio_mu); lock_guard lock1(qs_mu, adopt_lock), lock2(qs_audio_mu, adopt_lock); QuickSyncEncoder *old_encoder = quicksync_encoder.release(); // When we go C++14, we can use move capture instead. @@ -119,7 +153,7 @@ void VideoEncoder::do_cut(int frame) delete old_x264_encoder; delete old_x264_disk_encoder; old_encoder->close_file(); - stream_mux->unplug(); + http_mux->unplug(); // We cannot delete the encoder here, as this thread has no OpenGL context. // We'll deal with it in begin_frame(). @@ -131,7 +165,7 @@ void VideoEncoder::do_cut(int frame) x264_encoder.reset(new X264Encoder(oformat, /*use_separate_disk_params=*/false)); assert(global_flags.x264_video_to_http); if (global_flags.x264_video_to_http) { - x264_encoder->add_mux(stream_mux.get()); + x264_encoder->add_mux(http_mux.get()); } if (overriding_bitrate != 0) { x264_encoder->change_bitrate(overriding_bitrate); @@ -145,7 +179,7 @@ void VideoEncoder::do_cut(int frame) } quicksync_encoder.reset(new QuickSyncEncoder(filename, resource_pool, surface, va_display, width, height, oformat, http_encoder, disk_encoder, disk_space_estimator)); - quicksync_encoder->set_stream_mux(stream_mux.get()); + quicksync_encoder->set_http_mux(http_mux.get()); } void VideoEncoder::change_x264_bitrate(unsigned rate_kbit) @@ -184,38 +218,61 @@ bool VideoEncoder::begin_frame(int64_t pts, int64_t duration, movit::YCbCrLumaCo RefCountedGLsync VideoEncoder::end_frame() { + want_srt_metric_update = true; lock_guard lock(qs_mu); return quicksync_encoder->end_frame(); } -void VideoEncoder::open_output_stream() +void VideoEncoder::open_output_streams() { - AVFormatContext *avctx = avformat_alloc_context(); - avctx->oformat = const_castoformat)>(oformat); // const_cast is a hack to work in FFmpeg both before and after 5.0. + for (bool is_srt : {false, true}) { + if (is_srt && global_flags.srt_destination_host.empty()) { + continue; + } - uint8_t *buf = (uint8_t *)av_malloc(MUX_BUFFER_SIZE); - avctx->pb = avio_alloc_context(buf, MUX_BUFFER_SIZE, 1, this, nullptr, nullptr, nullptr); - avctx->pb->write_data_type = &VideoEncoder::write_packet2_thunk; - avctx->pb->ignore_boundary_point = 1; + AVFormatContext *avctx = avformat_alloc_context(); + avctx->oformat = is_srt ? srt_oformat : oformat; - Mux::Codec video_codec; - if (global_flags.uncompressed_video_to_http) { - video_codec = Mux::CODEC_NV12; - } else { - video_codec = Mux::CODEC_H264; - } + uint8_t *buf = (uint8_t *)av_malloc(MUX_BUFFER_SIZE); + avctx->pb = avio_alloc_context(buf, MUX_BUFFER_SIZE, 1, this, nullptr, nullptr, nullptr); + if (is_srt) { + avctx->pb->write_packet = &VideoEncoder::write_srt_packet_thunk; + } else { + avctx->pb->write_data_type = &VideoEncoder::write_packet2_thunk; + avctx->pb->ignore_boundary_point = 1; + } - avctx->flags = AVFMT_FLAG_CUSTOM_IO; + Mux::Codec video_codec; + if (global_flags.av1_video_to_http) { + video_codec = Mux::CODEC_AV1; + } else { + video_codec = Mux::CODEC_H264; + } - string video_extradata; - if (global_flags.x264_video_to_http || global_flags.x264_video_to_disk) { - video_extradata = x264_encoder->get_global_headers(); - } + avctx->flags = AVFMT_FLAG_CUSTOM_IO; + + string video_extradata; + if (global_flags.x264_video_to_http) { + video_extradata = x264_encoder->get_global_headers(); +#ifdef HAVE_AV1 + } else if (global_flags.av1_video_to_http) { + video_extradata = av1_encoder->get_global_headers(); +#endif + } - stream_mux.reset(new Mux(avctx, width, height, video_codec, video_extradata, stream_audio_encoder->get_codec_parameters().get(), - get_color_space(global_flags.ycbcr_rec709_coefficients), COARSE_TIMEBASE, - /*write_callback=*/nullptr, Mux::WRITE_FOREGROUND, { &stream_mux_metrics })); - stream_mux_metrics.init({{ "destination", "http" }}); + Mux *mux = new Mux(avctx, width, height, video_codec, video_extradata, stream_audio_encoder->get_codec_parameters().get(), + get_color_space(global_flags.ycbcr_rec709_coefficients), COARSE_TIMEBASE, + /*write_callback=*/nullptr, is_srt ? Mux::WRITE_BACKGROUND : Mux::WRITE_FOREGROUND, { is_srt ? &srt_mux_metrics : &http_mux_metrics }); + if (is_srt) { + srt_mux.reset(mux); + srt_mux_metrics.init({{ "destination", "srt" }}); + srt_metrics.init({{ "cardtype", "output" }}); + global_metrics.add("srt_num_connection_attempts", {{ "cardtype", "output" }}, &metric_srt_num_connection_attempts); + } else { + http_mux.reset(mux); + http_mux_metrics.init({{ "destination", "http" }}); + } + } } int VideoEncoder::write_packet2_thunk(void *opaque, uint8_t *buf, int buf_size, AVIODataMarkerType type, int64_t time) @@ -235,11 +292,198 @@ int VideoEncoder::write_packet2(uint8_t *buf, int buf_size, AVIODataMarkerType t } if (type == AVIO_DATA_MARKER_HEADER) { - stream_mux_header.append((char *)buf, buf_size); - httpd->set_header(HTTPD::StreamID{ HTTPD::MAIN_STREAM, 0 }, stream_mux_header); + http_mux_header.append((char *)buf, buf_size); + httpd->set_header(HTTPD::StreamID{ HTTPD::MAIN_STREAM, 0 }, http_mux_header); } else { httpd->add_data(HTTPD::StreamID{ HTTPD::MAIN_STREAM, 0 }, (char *)buf, buf_size, type == AVIO_DATA_MARKER_SYNC_POINT, time, AVRational{ AV_TIME_BASE, 1 }); } return buf_size; } +int VideoEncoder::write_srt_packet_thunk(void *opaque, uint8_t *buf, int buf_size) +{ + VideoEncoder *video_encoder = (VideoEncoder *)opaque; + return video_encoder->write_srt_packet(buf, buf_size); +} + +static string print_addrinfo(const addrinfo *ai) +{ + char hoststr[NI_MAXHOST], portstr[NI_MAXSERV]; + if (getnameinfo(ai->ai_addr, ai->ai_addrlen, hoststr, sizeof(hoststr), portstr, sizeof(portstr), NI_DGRAM | NI_NUMERICHOST | NI_NUMERICSERV) != 0) { + return ""; // Should basically never happen, since we're not doing DNS lookups. + } + + if (ai->ai_family == AF_INET6) { + return string("[") + hoststr + "]:" + portstr; + } else { + return string(hoststr) + ":" + portstr; + } +} + +int VideoEncoder::open_srt_socket() +{ + int sock = srt_create_socket(); + if (sock == -1) { + fprintf(stderr, "srt_create_socket(): %s\n", srt_getlasterror_str()); + return -1; + } + + SRT_TRANSTYPE live = SRTT_LIVE; + if (srt_setsockopt(sock, 0, SRTO_TRANSTYPE, &live, sizeof(live)) < 0) { + fprintf(stderr, "srt_setsockopt(SRTO_TRANSTYPE): %s\n", srt_getlasterror_str()); + srt_close(sock); + return -1; + } + + if (srt_setsockopt(sock, 0, SRTO_LATENCY, &global_flags.srt_output_latency_ms, sizeof(global_flags.srt_output_latency_ms)) < 0) { + fprintf(stderr, "srt_setsockopt(SRTO_LATENCY): %s\n", srt_getlasterror_str()); + srt_close(sock); + return -1; + } + + if (!global_flags.srt_streamid.empty()) { + if (srt_setsockopt(sock, 0, SRTO_STREAMID, global_flags.srt_streamid.data(), global_flags.srt_streamid.size()) < 0) { + fprintf(stderr, "srt_setsockopt(SRTO_STREAMID): %s\n", srt_getlasterror_str()); + srt_close(sock); + return -1; + } + } + + if (!global_flags.srt_passphrase.empty()) { + if (srt_setsockopt(sock, 0, SRTO_PASSPHRASE, global_flags.srt_passphrase.data(), global_flags.srt_passphrase.size()) < 0) { + fprintf(stderr, "srt_setsockopt(SRTO_PASSPHRASE): %s\n", srt_getlasterror_str()); + srt_close(sock); + return -1; + } + } + + return sock; +} + +int VideoEncoder::connect_to_srt() +{ + // We need to specify SOCK_DGRAM as a hint, or we'll get all addresses + // three times (for each of TCP, UDP, raw). + addrinfo hints; + memset(&hints, 0, sizeof(hints)); + hints.ai_flags = AI_ADDRCONFIG; + hints.ai_socktype = SOCK_DGRAM; + + addrinfo *ai; + int ret = getaddrinfo(global_flags.srt_destination_host.c_str(), global_flags.srt_destination_port.c_str(), &hints, &ai); + if (ret != 0) { + fprintf(stderr, "getaddrinfo(%s:%s): %s\n", global_flags.srt_destination_host.c_str(), global_flags.srt_destination_port.c_str(), gai_strerror(ret)); + return -1; + } + + unique_ptr ai_cleanup(ai, &freeaddrinfo); + + for (const addrinfo *cur = ai; cur != nullptr; cur = cur->ai_next) { + // Seemingly, srt_create_socket() isn't universal; once we try to connect, + // it gets locked to either IPv4 or IPv6. So we need to create a new one + // for every address we try. + int sock = open_srt_socket(); + if (sock == -1) { + // Die immediately. + return sock; + } + ++metric_srt_num_connection_attempts; + + // We do a non-blocking connect, so that we can check should_quit + // every now and then. + int blocking = 0; + if (srt_setsockopt(sock, 0, SRTO_RCVSYN, &blocking, sizeof(blocking)) < 0) { + fprintf(stderr, "srt_setsockopt(SRTO_SNDSYN=0): %s\n", srt_getlasterror_str()); + srt_close(sock); + continue; + } + if (srt_connect(sock, cur->ai_addr, cur->ai_addrlen) < 0) { + fprintf(stderr, "srt_connect(%s): %s\n", print_addrinfo(cur).c_str(), srt_getlasterror_str()); + srt_close(sock); + continue; + } + int eid = srt_epoll_create(); + if (eid < 0) { + fprintf(stderr, "srt_epoll_create(): %s\n", srt_getlasterror_str()); + srt_close(sock); + continue; + } + int modes = SRT_EPOLL_ERR | SRT_EPOLL_OUT; + if (srt_epoll_add_usock(eid, sock, &modes) < 0) { + fprintf(stderr, "srt_epoll_usock(): %s\n", srt_getlasterror_str()); + srt_close(sock); + srt_epoll_release(eid); + continue; + } + bool ok; + while (!should_quit.load()) { + SRTSOCKET errfds[1], writefds[1]; + int num_errfds = 1, num_writefds = 1; + int poll_time_ms = 100; + int ret = srt_epoll_wait(eid, errfds, &num_errfds, writefds, &num_writefds, poll_time_ms, 0, 0, 0, 0); + if (ret < 0) { + if (srt_getlasterror(nullptr) == SRT_ETIMEOUT) { + continue; + } else { + fprintf(stderr, "srt_epoll_wait(): %s\n", srt_getlasterror_str()); + srt_close(sock); + srt_epoll_release(eid); + return -1; + } + } else if (ret > 0) { + // The SRT epoll framework is pretty odd, but seemingly, + // this is the way. Getting the same error code as srt_connect() + // would normally return seems to be impossible, though. + ok = (num_errfds == 0); + break; + fprintf(stderr, "num_errfds=%d num_writefds=%d last_err=%s\n", num_errfds, num_writefds, srt_getlasterror_str()); + break; + } + } + srt_epoll_release(eid); + if (should_quit.load()) { + srt_close(sock); + return -1; + } + if (ok) { + fprintf(stderr, "Connected to destination SRT endpoint at %s.\n", print_addrinfo(cur).c_str()); + return sock; + } else { + fprintf(stderr, "srt_connect(%s): %s\n", print_addrinfo(cur).c_str(), srt_getlasterror_str()); + srt_close(sock); + } + } + + // Out of candidates, so give up. + return -1; +} + +int VideoEncoder::write_srt_packet(uint8_t *buf, int buf_size) +{ + if (want_srt_metric_update.exchange(false) && srt_sock != -1) { + srt_metrics.update_srt_stats(srt_sock); + } + while (buf_size > 0 && !should_quit.load()) { + if (srt_sock == -1) { + srt_sock = connect_to_srt(); + if (srt_sock == -1) { + usleep(100000); + continue; + } + srt_metrics.update_srt_stats(srt_sock); + } + int to_send = min(buf_size, SRT_LIVE_DEF_PLSIZE); + int ret = srt_send(srt_sock, (char *)buf, to_send); + if (ret < 0) { + fprintf(stderr, "srt_send(): %s\n", srt_getlasterror_str()); + srt_close(srt_sock); + srt_metrics.metric_srt_uptime_seconds = 0.0 / 0.0; + srt_sock = connect_to_srt(); + continue; + } + buf += ret; + buf_size -= ret; + } + return buf_size; +} +