]> git.sesse.net Git - ffmpeg/blob - libavcodec/libschroedingerenc.c
schroenc: Use constant quality for constant quality, not noise threshold
[ffmpeg] / libavcodec / libschroedingerenc.c
1 /*
2  * Dirac encoder support via Schroedinger libraries
3  * Copyright (c) 2008 BBC, Anuradha Suraparaju <asuraparaju at gmail dot com >
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21
22 /**
23 * @file
24 * Dirac encoder support via libschroedinger-1.0 libraries. More details about
25 * the Schroedinger project can be found at http://www.diracvideo.org/.
26 * The library implements Dirac Specification Version 2.2
27 * (http://dirac.sourceforge.net/specification.html).
28 */
29
30 #undef NDEBUG
31 #include <assert.h>
32
33 #include <schroedinger/schro.h>
34 #include <schroedinger/schrodebug.h>
35 #include <schroedinger/schrovideoformat.h>
36
37 #include "avcodec.h"
38 #include "libdirac_libschro.h"
39 #include "libschroedinger.h"
40
41
42 /** libschroedinger encoder private data */
43 typedef struct FfmpegSchroEncoderParams {
44     /** Schroedinger video format */
45     SchroVideoFormat *format;
46
47     /** Schroedinger frame format */
48     SchroFrameFormat frame_format;
49
50     /** frame being encoded */
51     AVFrame picture;
52
53     /** frame size */
54     int frame_size;
55
56     /** Schroedinger encoder handle*/
57     SchroEncoder* encoder;
58
59     /** buffer to store encoder output before writing it to the frame queue*/
60     unsigned char *enc_buf;
61
62     /** Size of encoder buffer*/
63     int enc_buf_size;
64
65     /** queue storing encoded frames */
66     FfmpegDiracSchroQueue enc_frame_queue;
67
68     /** end of sequence signalled */
69     int eos_signalled;
70
71     /** end of sequence pulled */
72     int eos_pulled;
73 } FfmpegSchroEncoderParams;
74
75 /**
76 * Works out Schro-compatible chroma format.
77 */
78 static int SetSchroChromaFormat(AVCodecContext *avccontext)
79 {
80     int num_formats = sizeof(ffmpeg_schro_pixel_format_map) /
81                       sizeof(ffmpeg_schro_pixel_format_map[0]);
82     int idx;
83
84     FfmpegSchroEncoderParams* p_schro_params = avccontext->priv_data;
85
86     for (idx = 0; idx < num_formats; ++idx) {
87         if (ffmpeg_schro_pixel_format_map[idx].ff_pix_fmt ==
88             avccontext->pix_fmt) {
89             p_schro_params->format->chroma_format =
90                             ffmpeg_schro_pixel_format_map[idx].schro_pix_fmt;
91             return 0;
92         }
93     }
94
95     av_log(avccontext, AV_LOG_ERROR,
96            "This codec currently only supports planar YUV 4:2:0, 4:2:2"
97            " and 4:4:4 formats.\n");
98
99     return -1;
100 }
101
102 static int libschroedinger_encode_init(AVCodecContext *avccontext)
103 {
104     FfmpegSchroEncoderParams* p_schro_params = avccontext->priv_data;
105     SchroVideoFormatEnum preset;
106
107     /* Initialize the libraries that libschroedinger depends on. */
108     schro_init();
109
110     /* Create an encoder object. */
111     p_schro_params->encoder = schro_encoder_new();
112
113     if (!p_schro_params->encoder) {
114         av_log(avccontext, AV_LOG_ERROR,
115                "Unrecoverable Error: schro_encoder_new failed. ");
116         return -1;
117     }
118
119     /* Initialize the format. */
120     preset = ff_get_schro_video_format_preset(avccontext);
121     p_schro_params->format =
122                     schro_encoder_get_video_format(p_schro_params->encoder);
123     schro_video_format_set_std_video_format(p_schro_params->format, preset);
124     p_schro_params->format->width  = avccontext->width;
125     p_schro_params->format->height = avccontext->height;
126
127     if (SetSchroChromaFormat(avccontext) == -1)
128         return -1;
129
130     if (ff_get_schro_frame_format(p_schro_params->format->chroma_format,
131                                   &p_schro_params->frame_format) == -1) {
132         av_log(avccontext, AV_LOG_ERROR,
133                "This codec currently supports only planar YUV 4:2:0, 4:2:2"
134                " and 4:4:4 formats.\n");
135         return -1;
136     }
137
138     p_schro_params->format->frame_rate_numerator   = avccontext->time_base.den;
139     p_schro_params->format->frame_rate_denominator = avccontext->time_base.num;
140
141     p_schro_params->frame_size = avpicture_get_size(avccontext->pix_fmt,
142                                                     avccontext->width,
143                                                     avccontext->height);
144
145     avccontext->coded_frame = &p_schro_params->picture;
146
147     if (!avccontext->gop_size) {
148         schro_encoder_setting_set_double(p_schro_params->encoder,
149                                          "gop_structure",
150                                          SCHRO_ENCODER_GOP_INTRA_ONLY);
151
152         if (avccontext->coder_type == FF_CODER_TYPE_VLC)
153             schro_encoder_setting_set_double(p_schro_params->encoder,
154                                              "enable_noarith", 1);
155     } else {
156         avccontext->has_b_frames = 1;
157     }
158
159     /* FIXME - Need to handle SCHRO_ENCODER_RATE_CONTROL_LOW_DELAY. */
160     if (avccontext->flags & CODEC_FLAG_QSCALE) {
161         if (!avccontext->global_quality) {
162             /* lossless coding */
163             schro_encoder_setting_set_double(p_schro_params->encoder,
164                                              "rate_control",
165                                              SCHRO_ENCODER_RATE_CONTROL_LOSSLESS);
166         } else {
167             int quality;
168             schro_encoder_setting_set_double(p_schro_params->encoder,
169                                              "rate_control",
170                                              SCHRO_ENCODER_RATE_CONTROL_CONSTANT_QUALITY);
171
172             quality = avccontext->global_quality / FF_QP2LAMBDA;
173             if (quality > 10)
174                 quality = 10;
175             schro_encoder_setting_set_double(p_schro_params->encoder,
176                                              "quality", quality);
177         }
178     } else {
179         schro_encoder_setting_set_double(p_schro_params->encoder,
180                                          "rate_control",
181                                          SCHRO_ENCODER_RATE_CONTROL_CONSTANT_BITRATE);
182
183         schro_encoder_setting_set_double(p_schro_params->encoder,
184                                          "bitrate",
185                                          avccontext->bit_rate);
186
187     }
188
189     if (avccontext->flags & CODEC_FLAG_INTERLACED_ME)
190         /* All material can be coded as interlaced or progressive
191            irrespective of the type of source material. */
192         schro_encoder_setting_set_double(p_schro_params->encoder,
193                                          "interlaced_coding", 1);
194
195     /* FIXME: Signal range hardcoded to 8-bit data until both libschroedinger
196      * and libdirac support other bit-depth data. */
197     schro_video_format_set_std_signal_range(p_schro_params->format,
198                                             SCHRO_SIGNAL_RANGE_8BIT_VIDEO);
199
200     /* Set the encoder format. */
201     schro_encoder_set_video_format(p_schro_params->encoder,
202                                    p_schro_params->format);
203
204     /* Set the debug level. */
205     schro_debug_set_level(avccontext->debug);
206
207     schro_encoder_start(p_schro_params->encoder);
208
209     /* Initialize the encoded frame queue. */
210     ff_dirac_schro_queue_init(&p_schro_params->enc_frame_queue);
211     return 0;
212 }
213
214 static SchroFrame *libschroedinger_frame_from_data(AVCodecContext *avccontext,
215                                                    void *in_data)
216 {
217     FfmpegSchroEncoderParams* p_schro_params = avccontext->priv_data;
218     SchroFrame *in_frame;
219     /* Input line size may differ from what the codec supports. Especially
220      * when transcoding from one format to another. So use avpicture_layout
221      * to copy the frame. */
222     in_frame = ff_create_schro_frame(avccontext, p_schro_params->frame_format);
223
224     if (in_frame)
225         avpicture_layout((AVPicture *)in_data, avccontext->pix_fmt,
226                           avccontext->width, avccontext->height,
227                           in_frame->components[0].data,
228                           p_schro_params->frame_size);
229
230     return in_frame;
231 }
232
233 static void SchroedingerFreeFrame(void *data)
234 {
235     FfmpegDiracSchroEncodedFrame *enc_frame = data;
236
237     av_freep(&(enc_frame->p_encbuf));
238     av_free(enc_frame);
239 }
240
241 static int libschroedinger_encode_frame(AVCodecContext *avccontext,
242                                         unsigned char *frame,
243                                         int buf_size, void *data)
244 {
245     int enc_size = 0;
246     FfmpegSchroEncoderParams* p_schro_params = avccontext->priv_data;
247     SchroEncoder *encoder = p_schro_params->encoder;
248     struct FfmpegDiracSchroEncodedFrame* p_frame_output = NULL;
249     int go = 1;
250     SchroBuffer *enc_buf;
251     int presentation_frame;
252     int parse_code;
253     int last_frame_in_sequence = 0;
254
255     if (!data) {
256         /* Push end of sequence if not already signalled. */
257         if (!p_schro_params->eos_signalled) {
258             schro_encoder_end_of_stream(encoder);
259             p_schro_params->eos_signalled = 1;
260         }
261     } else {
262         /* Allocate frame data to schro input buffer. */
263         SchroFrame *in_frame = libschroedinger_frame_from_data(avccontext,
264                                                                data);
265         /* Load next frame. */
266         schro_encoder_push_frame(encoder, in_frame);
267     }
268
269     if (p_schro_params->eos_pulled)
270         go = 0;
271
272     /* Now check to see if we have any output from the encoder. */
273     while (go) {
274         SchroStateEnum state;
275         state = schro_encoder_wait(encoder);
276         switch (state) {
277         case SCHRO_STATE_HAVE_BUFFER:
278         case SCHRO_STATE_END_OF_STREAM:
279             enc_buf = schro_encoder_pull(encoder, &presentation_frame);
280             assert(enc_buf->length > 0);
281             assert(enc_buf->length <= buf_size);
282             parse_code = enc_buf->data[4];
283
284             /* All non-frame data is prepended to actual frame data to
285              * be able to set the pts correctly. So we don't write data
286              * to the frame output queue until we actually have a frame
287              */
288             p_schro_params->enc_buf = av_realloc(p_schro_params->enc_buf,
289                                                  p_schro_params->enc_buf_size + enc_buf->length);
290
291             memcpy(p_schro_params->enc_buf + p_schro_params->enc_buf_size,
292                    enc_buf->data, enc_buf->length);
293             p_schro_params->enc_buf_size += enc_buf->length;
294
295
296             if (state == SCHRO_STATE_END_OF_STREAM) {
297                 p_schro_params->eos_pulled = 1;
298                 go = 0;
299             }
300
301             if (!SCHRO_PARSE_CODE_IS_PICTURE(parse_code)) {
302                 schro_buffer_unref(enc_buf);
303                 break;
304             }
305
306             /* Create output frame. */
307             p_frame_output = av_mallocz(sizeof(FfmpegDiracSchroEncodedFrame));
308             /* Set output data. */
309             p_frame_output->size     = p_schro_params->enc_buf_size;
310             p_frame_output->p_encbuf = p_schro_params->enc_buf;
311             if (SCHRO_PARSE_CODE_IS_INTRA(parse_code) &&
312                 SCHRO_PARSE_CODE_IS_REFERENCE(parse_code))
313                 p_frame_output->key_frame = 1;
314
315             /* Parse the coded frame number from the bitstream. Bytes 14
316              * through 17 represesent the frame number. */
317                 p_frame_output->frame_num = (enc_buf->data[13] << 24) +
318                                             (enc_buf->data[14] << 16) +
319                                             (enc_buf->data[15] <<  8) +
320                                              enc_buf->data[16];
321
322             ff_dirac_schro_queue_push_back(&p_schro_params->enc_frame_queue,
323                                            p_frame_output);
324             p_schro_params->enc_buf_size = 0;
325             p_schro_params->enc_buf      = NULL;
326
327             schro_buffer_unref(enc_buf);
328
329             break;
330
331         case SCHRO_STATE_NEED_FRAME:
332             go = 0;
333             break;
334
335         case SCHRO_STATE_AGAIN:
336             break;
337
338         default:
339             av_log(avccontext, AV_LOG_ERROR, "Unknown Schro Encoder state\n");
340             return -1;
341         }
342     }
343
344     /* Copy 'next' frame in queue. */
345
346     if (p_schro_params->enc_frame_queue.size == 1 &&
347         p_schro_params->eos_pulled)
348         last_frame_in_sequence = 1;
349
350     p_frame_output = ff_dirac_schro_queue_pop(&p_schro_params->enc_frame_queue);
351
352     if (!p_frame_output)
353         return 0;
354
355     memcpy(frame, p_frame_output->p_encbuf, p_frame_output->size);
356     avccontext->coded_frame->key_frame = p_frame_output->key_frame;
357     /* Use the frame number of the encoded frame as the pts. It is OK to
358      * do so since Dirac is a constant frame rate codec. It expects input
359      * to be of constant frame rate. */
360     avccontext->coded_frame->pts = p_frame_output->frame_num;
361     enc_size = p_frame_output->size;
362
363     /* Append the end of sequence information to the last frame in the
364      * sequence. */
365     if (last_frame_in_sequence && p_schro_params->enc_buf_size > 0) {
366         memcpy(frame + enc_size, p_schro_params->enc_buf,
367                p_schro_params->enc_buf_size);
368         enc_size += p_schro_params->enc_buf_size;
369         av_freep(&p_schro_params->enc_buf);
370         p_schro_params->enc_buf_size = 0;
371     }
372
373     /* free frame */
374     SchroedingerFreeFrame(p_frame_output);
375
376     return enc_size;
377 }
378
379
380 static int libschroedinger_encode_close(AVCodecContext *avccontext)
381 {
382
383     FfmpegSchroEncoderParams* p_schro_params = avccontext->priv_data;
384
385     /* Close the encoder. */
386     schro_encoder_free(p_schro_params->encoder);
387
388     /* Free data in the output frame queue. */
389     ff_dirac_schro_queue_free(&p_schro_params->enc_frame_queue,
390                               SchroedingerFreeFrame);
391
392
393     /* Free the encoder buffer. */
394     if (p_schro_params->enc_buf_size)
395         av_freep(&p_schro_params->enc_buf);
396
397     /* Free the video format structure. */
398     av_freep(&p_schro_params->format);
399
400     return 0;
401 }
402
403
404 AVCodec libschroedinger_encoder = {
405     "libschroedinger",
406     AVMEDIA_TYPE_VIDEO,
407     CODEC_ID_DIRAC,
408     sizeof(FfmpegSchroEncoderParams),
409     libschroedinger_encode_init,
410     libschroedinger_encode_frame,
411     libschroedinger_encode_close,
412    .capabilities = CODEC_CAP_DELAY,
413    .pix_fmts     = (const enum PixelFormat[]){PIX_FMT_YUV420P, PIX_FMT_YUV422P, PIX_FMT_YUV444P, PIX_FMT_NONE},
414    .long_name    = NULL_IF_CONFIG_SMALL("libschroedinger Dirac 2.2"),
415 };