X-Git-Url: https://git.sesse.net/?p=nageru;a=blobdiff_plain;f=ffmpeg_capture.h;h=8a513df971fa20f2cba71e25ac603242b9be3be3;hp=e6b4ed481f6b151e8a687a1f7b0aec5dab7d0472;hb=703e00da89118df9be0354dda621bed023e6030e;hpb=b6089b76678e76271616131672c5ba454a5d336d diff --git a/ffmpeg_capture.h b/ffmpeg_capture.h index e6b4ed4..8a513df 100644 --- a/ffmpeg_capture.h +++ b/ffmpeg_capture.h @@ -6,19 +6,17 @@ // FFmpeg (thus the name), this means it can handle a very wide array of video // formats, and also things like network streaming and V4L capture, but it is // also significantly less integrated and optimized than the regular capture -// cards. In particular, the frames are always scaled and converted to 8-bit +// cards. In particular, the frames are always scaled and converted to 8-bit // RGBA on the CPU before being sent on to the GPU. // // Since we don't really know much about the video when building the chains, // there are some limitations. In particular, frames are always assumed to be // sRGB even if the video container says something else. We could probably -// try to load the video on startup and pick out the parameters at that point -// (which would probably also allow us to send Y'CbCr video through without -// CPU conversion), but it would require some more plumbing, and it would also -// fail if the file changes parameters midway, which is allowed in some formats. +// try to load the video on startup and pick out the parameters at that point, +// but it would require some more plumbing, and it would also fail if the file +// changes parameters midway, which is allowed in some formats. // -// There is currently no audio support. There is also no support for changing -// the video underway (unlike images), although there really should be. +// You can get out the audio either as decoded or in raw form (Kaeru uses this). 
#include #include @@ -30,7 +28,24 @@ #include #include +#include + +extern "C" { +#include +#include +#include +#include +} + #include "bmusb/bmusb.h" +#include "ffmpeg_raii.h" +#include "ref_counted_frame.h" +#include "quittable_sleeper.h" + +struct AVFormatContext; +struct AVFrame; +struct AVRational; +struct AVPacket; class FFmpegCapture : public bmusb::CaptureInterface { @@ -52,12 +67,33 @@ public: { std::lock_guard lock(queue_mu); command_queue.push_back(QueuedCommand { QueuedCommand::REWIND }); + producer_thread_should_quit.wakeup(); } void change_rate(double new_rate) { std::lock_guard lock(queue_mu); command_queue.push_back(QueuedCommand { QueuedCommand::CHANGE_RATE, new_rate }); + producer_thread_should_quit.wakeup(); + } + + std::string get_filename() const + { + std::lock_guard lock(filename_mu); + return filename; + } + + void change_filename(const std::string &new_filename) + { + std::lock_guard lock(filename_mu); + filename = new_filename; + should_interrupt = true; + } + + // Will stop the stream even if it's hung on blocking I/O. + void disconnect() + { + should_interrupt = true; } // CaptureInterface. @@ -88,11 +124,46 @@ public: return audio_frame_allocator; } - void set_frame_callback(bmusb::frame_callback_t callback) override + // FFmpegCapture-specific overload of set_frame_callback that also gives + // the raw original pts from the video. Negative pts means a dummy frame. + typedef std::function + frame_callback_t; + void set_frame_callback(frame_callback_t callback) { frame_callback = callback; } + void set_frame_callback(bmusb::frame_callback_t callback) override + { + frame_callback = std::bind( + callback, + std::placeholders::_5, + std::placeholders::_6, + std::placeholders::_7, + std::placeholders::_8, + std::placeholders::_9, + std::placeholders::_10, + std::placeholders::_11); + } + + // FFmpegCapture-specific callback that gives the raw audio. 
+ typedef std::function audio_callback_t; + void set_audio_callback(audio_callback_t callback) + { + audio_callback = callback; + } + + // Used to get precise information about the Y'CbCr format used + // for a given frame. Only valid to call during the frame callback, + // and only when receiving a frame with pixel format PixelFormat_8BitYCbCrPlanar. + movit::YCbCrFormat get_current_frame_ycbcr_format() const + { + return current_frame_ycbcr_format; + } + void set_dequeue_thread_callbacks(std::function init, std::function cleanup) override { dequeue_init_callback = init; @@ -108,22 +179,21 @@ public: void configure_card() override; void start_bm_capture() override; void stop_dequeue_thread() override; + bool get_disconnected() const override { return false; } // We never unplug. - // TODO: Specify error status through this. - bool get_disconnected() const override { return false; } - - std::map get_available_video_modes() const; + std::map get_available_video_modes() const override; void set_video_mode(uint32_t video_mode_id) override {} // Ignore. uint32_t get_current_video_mode() const override { return 0; } + static constexpr bmusb::PixelFormat PixelFormat_NV12 = static_cast(100); // In the private range. std::set get_available_pixel_formats() const override { - return std::set{ bmusb::PixelFormat_8BitRGBA }; + return std::set{ bmusb::PixelFormat_8BitBGRA, bmusb::PixelFormat_8BitYCbCrPlanar, PixelFormat_NV12 }; } void set_pixel_format(bmusb::PixelFormat pixel_format) override { - assert(pixel_format == bmusb::PixelFormat_8BitRGBA); + this->pixel_format = pixel_format; } bmusb::PixelFormat get_current_pixel_format() const override { - return bmusb::PixelFormat_8BitRGBA; + return pixel_format; } std::map get_available_video_inputs() const override { @@ -139,13 +209,36 @@ public: private: void producer_thread_func(); + void send_disconnected_frame(); bool play_video(const std::string &pathname); + void internal_rewind(); + // Returns true if there was an error. 
+ bool process_queued_commands(AVFormatContext *format_ctx, const std::string &pathname, timespec last_modified, bool *rewound); + + // Returns nullptr if no frame was decoded (e.g. EOF). + AVFrameWithDeleter decode_frame(AVFormatContext *format_ctx, AVCodecContext *video_codec_ctx, AVCodecContext *audio_codec_ctx, + const std::string &pathname, int video_stream_index, int audio_stream_index, + bmusb::FrameAllocator::Frame *audio_frame, bmusb::AudioFormat *audio_format, int64_t *audio_pts, bool *error); + void convert_audio(const AVFrame *audio_avframe, bmusb::FrameAllocator::Frame *audio_frame, bmusb::AudioFormat *audio_format); + + bmusb::VideoFormat construct_video_format(const AVFrame *frame, AVRational video_timebase); + UniqueFrame make_video_frame(const AVFrame *frame, const std::string &pathname, bool *error); + + static int interrupt_cb_thunk(void *unique); + int interrupt_cb(); + + mutable std::mutex filename_mu; std::string description, filename; uint16_t timecode = 0; unsigned width, height; + bmusb::PixelFormat pixel_format = bmusb::PixelFormat_8BitBGRA; + movit::YCbCrFormat current_frame_ycbcr_format; bool running = false; int card_index = -1; + double rate = 1.0; + std::atomic should_interrupt{false}; + bool last_frame_was_connected = true; bool has_dequeue_callbacks = false; std::function dequeue_init_callback = nullptr; @@ -155,17 +248,33 @@ private: bmusb::FrameAllocator *audio_frame_allocator = nullptr; std::unique_ptr owned_video_frame_allocator; std::unique_ptr owned_audio_frame_allocator; - bmusb::frame_callback_t frame_callback = nullptr; + frame_callback_t frame_callback = nullptr; + audio_callback_t audio_callback = nullptr; - std::atomic producer_thread_should_quit{false}; + SwsContextWithDeleter sws_ctx; + int sws_last_width = -1, sws_last_height = -1, sws_last_src_format = -1; + AVPixelFormat sws_dst_format = AVPixelFormat(-1); // In practice, always initialized. 
+ AVRational video_timebase, audio_timebase; + + QuittableSleeper producer_thread_should_quit; std::thread producer_thread; + int64_t pts_origin, last_pts; + std::chrono::steady_clock::time_point start, next_frame_start, last_frame; + std::mutex queue_mu; struct QueuedCommand { enum Command { REWIND, CHANGE_RATE } command; double new_rate; // For CHANGE_RATE. }; std::vector command_queue; // Protected by queue_mu. + + // Audio resampler. + AVAudioResampleContext *resampler = nullptr; + AVSampleFormat last_src_format, last_dst_format; + int64_t last_channel_layout; + int last_sample_rate; + }; #endif // !defined(_FFMPEG_CAPTURE_H)