]> git.sesse.net Git - nageru/blobdiff - video_stream.cpp
Start hacking in support for interpolated frames in the main application.
[nageru] / video_stream.cpp
index 65f52c094bd70e16d41a09a9afbd0c573964e6e6..a783bdb91fe8246b1b59bb5dd97a75ad09a68b9d 100644 (file)
@@ -5,10 +5,18 @@ extern "C" {
 #include <libavformat/avio.h>
 }
 
+#include <unistd.h>
+
+#include "context.h"
+#include "flow.h"
 #include "httpd.h"
 #include "jpeg_frame_view.h"
+#include "movit/util.h"
 #include "mux.h"
 #include "player.h"
+#include "util.h"
+
+#include <epoxy/glx.h>
 
 using namespace std;
 
@@ -37,6 +45,84 @@ string read_file(const string &filename)
 
 }  // namespace
 
+VideoStream::VideoStream()
+{
+       using namespace movit;
+       // TODO: deduplicate code against JPEGFrameView?
+       ycbcr_convert_chain.reset(new EffectChain(1280, 720));
+       ImageFormat image_format;
+       image_format.color_space = COLORSPACE_sRGB;
+       image_format.gamma_curve = GAMMA_sRGB;
+       ycbcr_format.luma_coefficients = YCBCR_REC_709;
+       ycbcr_format.full_range = false;
+       ycbcr_format.num_levels = 256;
+       ycbcr_format.chroma_subsampling_x = 2;
+       ycbcr_format.chroma_subsampling_y = 1;
+       ycbcr_format.cb_x_position = 0.0f;  // H.264 -- _not_ JPEG, even though our input is MJPEG-encoded
+       ycbcr_format.cb_y_position = 0.5f;  // Irrelevant.
+       ycbcr_format.cr_x_position = 0.0f;
+       ycbcr_format.cr_y_position = 0.5f;
+       ycbcr_input = (movit::YCbCrInput *)ycbcr_convert_chain->add_input(new YCbCrInput(image_format, ycbcr_format, 1280, 720));
+
+       ImageFormat inout_format;
+       inout_format.color_space = COLORSPACE_sRGB;
+       inout_format.gamma_curve = GAMMA_sRGB;
+
+       check_error();
+       ycbcr_convert_chain->add_output(inout_format, OUTPUT_ALPHA_FORMAT_POSTMULTIPLIED);
+       check_error();
+       ycbcr_convert_chain->set_dither_bits(8);
+       check_error();
+       ycbcr_convert_chain->finalize();
+       check_error();
+
+       GLuint input_tex[num_interpolate_slots], gray_tex[num_interpolate_slots];
+       glCreateTextures(GL_TEXTURE_2D_ARRAY, 10, input_tex);
+       glCreateTextures(GL_TEXTURE_2D_ARRAY, 10, gray_tex);
+       check_error();
+       constexpr size_t width = 1280, height = 720;  // FIXME: adjustable width, height
+       int levels = find_num_levels(width, height);
+       for (size_t i = 0; i < num_interpolate_slots; ++i) {
+               glTextureStorage3D(input_tex[i], levels, GL_RGBA8, width, height, 2);
+               check_error();
+               glTextureStorage3D(gray_tex[i], levels, GL_R8, width, height, 2);
+               check_error();
+
+               InterpolatedFrameResources resource;
+               resource.input_tex = input_tex[i];
+               resource.gray_tex = gray_tex[i];
+               glCreateFramebuffers(2, resource.input_fbos);
+               check_error();
+
+               glNamedFramebufferTextureLayer(resource.input_fbos[0], GL_COLOR_ATTACHMENT0, input_tex[i], 0, 0);
+               check_error();
+               glNamedFramebufferTextureLayer(resource.input_fbos[1], GL_COLOR_ATTACHMENT0, input_tex[i], 0, 1);
+               check_error();
+
+               GLuint buf = GL_COLOR_ATTACHMENT0;
+               glNamedFramebufferDrawBuffers(resource.input_fbos[0], 1, &buf);
+               check_error();
+               glNamedFramebufferDrawBuffers(resource.input_fbos[1], 1, &buf);
+               check_error();
+
+               glCreateBuffers(1, &resource.pbo);
+               check_error();
+               glNamedBufferStorage(resource.pbo, width * height * 4, nullptr, GL_MAP_READ_BIT | GL_MAP_PERSISTENT_BIT);
+               check_error();
+               resource.pbo_contents = glMapNamedBufferRange(resource.pbo, 0, width * height * 4, GL_MAP_READ_BIT | GL_MAP_PERSISTENT_BIT); 
+               interpolate_resources.push_back(resource);
+       }
+
+       check_error();
+
+       compute_flow.reset(new DISComputeFlow(width, height, operating_point3));
+       gray.reset(new GrayscaleConversion);  // NOTE: Must come after DISComputeFlow, since it sets up the VBO!
+       interpolate.reset(new Interpolate(width, height, operating_point3));
+       check_error();
+}
+
+VideoStream::~VideoStream() {}
+
 void VideoStream::start()
 {
        AVFormatContext *avctx = avformat_alloc_context();
@@ -68,17 +154,100 @@ void VideoStream::stop()
 
 void VideoStream::schedule_original_frame(int64_t output_pts, unsigned stream_idx, int64_t input_pts)
 {
-       unique_lock<mutex> lock(queue_lock);
        QueuedFrame qf;
+       qf.type = QueuedFrame::ORIGINAL;
        qf.output_pts = output_pts;
        qf.stream_idx = stream_idx;
        qf.input_first_pts = input_pts; 
+
+       unique_lock<mutex> lock(queue_lock);
+       frame_queue.push_back(qf);
+       queue_nonempty.notify_all();
+}
+
+void VideoStream::schedule_interpolated_frame(int64_t output_pts, unsigned stream_idx, int64_t input_first_pts, int64_t input_second_pts, float alpha)
+{
+       // Get the temporary OpenGL resources we need for doing the interpolation.
+       InterpolatedFrameResources resources;
+       {
+               unique_lock<mutex> lock(queue_lock);
+               if (interpolate_resources.empty()) {
+                       fprintf(stderr, "WARNING: Too many interpolated frames already in transit; dropping one.\n");
+                       return;
+               }
+               resources = interpolate_resources.front();
+               interpolate_resources.pop_front();
+       }
+
+       QueuedFrame qf;
+       qf.type = QueuedFrame::INTERPOLATED;
+       qf.output_pts = output_pts;
+       qf.stream_idx = stream_idx;
+       qf.resources = resources;
+
+       check_error();
+
+       // Convert frame0 and frame1 to OpenGL textures.
+       // TODO: Deduplicate against JPEGFrameView::setDecodedFrame?
+       for (size_t frame_no = 0; frame_no < 2; ++frame_no) {
+               shared_ptr<Frame> frame = decode_jpeg(filename_for_frame(stream_idx, frame_no == 1 ? input_second_pts : input_first_pts));
+               ycbcr_format.chroma_subsampling_x = frame->chroma_subsampling_x;
+               ycbcr_format.chroma_subsampling_y = frame->chroma_subsampling_y;
+               ycbcr_input->change_ycbcr_format(ycbcr_format);
+               ycbcr_input->set_width(frame->width);
+               ycbcr_input->set_height(frame->height);
+               ycbcr_input->set_pixel_data(0, frame->y.get());
+               ycbcr_input->set_pixel_data(1, frame->cb.get());
+               ycbcr_input->set_pixel_data(2, frame->cr.get());
+               ycbcr_input->set_pitch(0, frame->pitch_y);
+               ycbcr_input->set_pitch(1, frame->pitch_chroma);
+               ycbcr_input->set_pitch(2, frame->pitch_chroma);
+               ycbcr_convert_chain->render_to_fbo(resources.input_fbos[frame_no], 1280, 720);
+       }
+
+       glGenerateTextureMipmap(resources.input_tex);
+
+       // Compute the interpolated frame.
+       check_error();
+       gray->exec(resources.input_tex, resources.gray_tex, 1280, 720, /*num_layers=*/2);
+       check_error();
+       glGenerateTextureMipmap(resources.gray_tex);
+       check_error();
+       GLuint flow_tex = compute_flow->exec(resources.gray_tex, DISComputeFlow::FORWARD_AND_BACKWARD, DISComputeFlow::DO_NOT_RESIZE_FLOW);
+       check_error();
+
+       qf.output_tex = interpolate->exec(resources.input_tex, flow_tex, 1280, 720, alpha);
+       check_error();
+
+       // Read it down (asynchronously) to the CPU.
+       glPixelStorei(GL_PACK_ROW_LENGTH, 0);
+       glBindBuffer(GL_PIXEL_PACK_BUFFER, resources.pbo);
+       check_error();
+       glGetTextureImage(qf.output_tex, 0, GL_RGBA, GL_UNSIGNED_BYTE, 1280 * 720 * 4, nullptr);
+       check_error();
+       glBindBuffer(GL_PIXEL_PACK_BUFFER, 0);
+
+       // Set a fence we can wait for to make sure the CPU sees the read.
+       glMemoryBarrier(GL_CLIENT_MAPPED_BUFFER_BARRIER_BIT);
+       check_error();
+       qf.fence = RefCountedGLsync(GL_SYNC_GPU_COMMANDS_COMPLETE, /*flags=*/0);
+       check_error();
+
+       unique_lock<mutex> lock(queue_lock);
        frame_queue.push_back(qf);
        queue_nonempty.notify_all();
 }
 
 void VideoStream::encode_thread_func()
 {
+       QSurface *surface = create_surface();
+       QOpenGLContext *context = create_context(surface);
+       bool ok = make_current(context, surface);
+       if (!ok) {
+               fprintf(stderr, "Video stream couldn't get an OpenGL context\n");
+               exit(1);
+       }
+
        for ( ;; ) {
                QueuedFrame qf;
                {
@@ -91,6 +260,7 @@ void VideoStream::encode_thread_func()
                }
 
                if (qf.type == QueuedFrame::ORIGINAL) {
+                       // Send the JPEG frame on, unchanged.
                        string jpeg = read_file(filename_for_frame(qf.stream_idx, qf.input_first_pts));
                        AVPacket pkt;
                        av_init_packet(&pkt);
@@ -98,7 +268,28 @@ void VideoStream::encode_thread_func()
                        pkt.data = (uint8_t *)jpeg.data();
                        pkt.size = jpeg.size();
                        stream_mux->add_packet(pkt, qf.output_pts, qf.output_pts);
-               }               
+               } else if (qf.type == QueuedFrame::INTERPOLATED) {
+                       glClientWaitSync(qf.fence.get(), /*flags=*/0, GL_TIMEOUT_IGNORED);
+
+                       // DEBUG: Writing the frame to disk.
+                       FILE *fp = fopen("inter.ppm", "wb");
+                       fprintf(fp, "P6\n%d %d\n255\n", 1280, 720);
+                       for (size_t y = 0; y < 720; ++y) {
+                               const uint8_t *ptr = (uint8_t *)qf.resources.pbo_contents + (719 - y) * 1280 * 4;
+                               for (size_t x = 0; x < 1280; ++x) {
+                                       putc(ptr[0], fp);
+                                       putc(ptr[1], fp);
+                                       putc(ptr[2], fp);
+                                       ptr += 4;
+                               }
+                       }
+                       fclose(fp);
+                       // TODO: Release flow and output textures.
+
+                       // Put the frame resources back.
+                       unique_lock<mutex> lock(queue_lock);
+                       interpolate_resources.push_back(qf.resources);
+               }
        }
 }