]> git.sesse.net Git - ffmpeg/blob - libavcodec/vaapi_encode_h264.c
vaapi_encode_h264: Support more complex reference structures
[ffmpeg] / libavcodec / vaapi_encode_h264.c
1 /*
2  * This file is part of FFmpeg.
3  *
4  * FFmpeg is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * FFmpeg is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with FFmpeg; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17  */
18
19 #include <string.h>
20
21 #include <va/va.h>
22 #include <va/va_enc_h264.h>
23
24 #include "libavutil/avassert.h"
25 #include "libavutil/common.h"
26 #include "libavutil/internal.h"
27 #include "libavutil/opt.h"
28
29 #include "avcodec.h"
30 #include "cbs.h"
31 #include "cbs_h264.h"
32 #include "h264.h"
33 #include "h264_levels.h"
34 #include "h264_sei.h"
35 #include "internal.h"
36 #include "vaapi_encode.h"
37
// Bit flags selecting SEI messages.  They are combined into a mask: the
// "sei" field of the encoder context holds the enabled set, and the
// per-picture "sei_needed" field holds the set to emit for that picture.
enum {
    // Buffering period (IDR pictures only) and picture timing messages.
    SEI_TIMING         = 1 << 0,
    // User-data-unregistered identifier message.
    SEI_IDENTIFIER     = 1 << 1,
    // Recovery point message.
    SEI_RECOVERY_POINT = 1 << 2,
};
43
// Random (version 4) ISO 11578 UUID, stored as 16 raw bytes.
// NOTE(review): presumably the UUID written into the identifier
// (user data unregistered) SEI message - confirm against its user.
static const uint8_t vaapi_encode_h264_sei_identifier_uuid[16] = {
    0x59, 0x94, 0x8b, 0x28,
    0x11, 0xec, 0x45, 0xaf,
    0x96, 0x75, 0x19, 0xd4,
    0x1f, 0xea, 0xa9, 0x4d,
};
49
// Per-picture H.264 state, stored in the priv_data of each picture.
typedef struct VAAPIEncodeH264Picture {
    // frame_num: zero on an IDR picture, otherwise the previous picture's
    // value plus one if that previous picture was a reference.
    // pic_order_cnt: display order relative to the last IDR picture.
    int frame_num, pic_order_cnt;

    // Display order of the most recent IDR picture.
    int64_t last_idr_frame;
    // Incremented on each IDR picture, otherwise inherited from the
    // previous picture.
    uint16_t idr_pic_id;

    // primary_pic_type is written to the access unit delimiter and
    // slice_type to the slice header (0/7 for I, 1/5 for P, 2/6 for B).
    int primary_pic_type, slice_type;

    // Delays used to build the picture timing SEI message, counted in
    // frames: cpb_delay is encode order relative to the last IDR, and
    // dpb_delay is the reordering delay plus the maximum B-frame depth.
    int cpb_delay, dpb_delay;
} VAAPIEncodeH264Picture;
63
64 typedef struct VAAPIEncodeH264Context {
65     VAAPIEncodeContext common;
66
67     // User options.
68     int qp;
69     int quality;
70     int coder;
71     int aud;
72     int sei;
73     int profile;
74     int level;
75
76     // Derived settings.
77     int mb_width;
78     int mb_height;
79
80     int fixed_qp_idr;
81     int fixed_qp_p;
82     int fixed_qp_b;
83
84     int dpb_frames;
85
86     // Writer structures.
87     CodedBitstreamContext *cbc;
88     CodedBitstreamFragment current_access_unit;
89
90     H264RawAUD   raw_aud;
91     H264RawSPS   raw_sps;
92     H264RawPPS   raw_pps;
93     H264RawSEI   raw_sei;
94     H264RawSlice raw_slice;
95
96     H264RawSEIBufferingPeriod      sei_buffering_period;
97     H264RawSEIPicTiming            sei_pic_timing;
98     H264RawSEIRecoveryPoint        sei_recovery_point;
99     H264RawSEIUserDataUnregistered sei_identifier;
100     char                          *sei_identifier_string;
101
102     int aud_needed;
103     int sei_needed;
104     int sei_cbr_workaround_needed;
105 } VAAPIEncodeH264Context;
106
107
108 static int vaapi_encode_h264_write_access_unit(AVCodecContext *avctx,
109                                                char *data, size_t *data_len,
110                                                CodedBitstreamFragment *au)
111 {
112     VAAPIEncodeH264Context *priv = avctx->priv_data;
113     int err;
114
115     err = ff_cbs_write_fragment_data(priv->cbc, au);
116     if (err < 0) {
117         av_log(avctx, AV_LOG_ERROR, "Failed to write packed header.\n");
118         return err;
119     }
120
121     if (*data_len < 8 * au->data_size - au->data_bit_padding) {
122         av_log(avctx, AV_LOG_ERROR, "Access unit too large: "
123                "%zu < %zu.\n", *data_len,
124                8 * au->data_size - au->data_bit_padding);
125         return AVERROR(ENOSPC);
126     }
127
128     memcpy(data, au->data, au->data_size);
129     *data_len = 8 * au->data_size - au->data_bit_padding;
130
131     return 0;
132 }
133
134 static int vaapi_encode_h264_add_nal(AVCodecContext *avctx,
135                                      CodedBitstreamFragment *au,
136                                      void *nal_unit)
137 {
138     VAAPIEncodeH264Context *priv = avctx->priv_data;
139     H264RawNALUnitHeader *header = nal_unit;
140     int err;
141
142     err = ff_cbs_insert_unit_content(priv->cbc, au, -1,
143                                      header->nal_unit_type, nal_unit, NULL);
144     if (err < 0) {
145         av_log(avctx, AV_LOG_ERROR, "Failed to add NAL unit: "
146                "type = %d.\n", header->nal_unit_type);
147         return err;
148     }
149
150     return 0;
151 }
152
153 static int vaapi_encode_h264_write_sequence_header(AVCodecContext *avctx,
154                                                    char *data, size_t *data_len)
155 {
156     VAAPIEncodeH264Context *priv = avctx->priv_data;
157     CodedBitstreamFragment   *au = &priv->current_access_unit;
158     int err;
159
160     if (priv->aud_needed) {
161         err = vaapi_encode_h264_add_nal(avctx, au, &priv->raw_aud);
162         if (err < 0)
163             goto fail;
164         priv->aud_needed = 0;
165     }
166
167     err = vaapi_encode_h264_add_nal(avctx, au, &priv->raw_sps);
168     if (err < 0)
169         goto fail;
170
171     err = vaapi_encode_h264_add_nal(avctx, au, &priv->raw_pps);
172     if (err < 0)
173         goto fail;
174
175     err = vaapi_encode_h264_write_access_unit(avctx, data, data_len, au);
176 fail:
177     ff_cbs_fragment_uninit(priv->cbc, au);
178     return err;
179 }
180
181 static int vaapi_encode_h264_write_slice_header(AVCodecContext *avctx,
182                                                 VAAPIEncodePicture *pic,
183                                                 VAAPIEncodeSlice *slice,
184                                                 char *data, size_t *data_len)
185 {
186     VAAPIEncodeH264Context *priv = avctx->priv_data;
187     CodedBitstreamFragment   *au = &priv->current_access_unit;
188     int err;
189
190     if (priv->aud_needed) {
191         err = vaapi_encode_h264_add_nal(avctx, au, &priv->raw_aud);
192         if (err < 0)
193             goto fail;
194         priv->aud_needed = 0;
195     }
196
197     err = vaapi_encode_h264_add_nal(avctx, au, &priv->raw_slice);
198     if (err < 0)
199         goto fail;
200
201     err = vaapi_encode_h264_write_access_unit(avctx, data, data_len, au);
202 fail:
203     ff_cbs_fragment_uninit(priv->cbc, au);
204     return err;
205 }
206
207 static int vaapi_encode_h264_write_extra_header(AVCodecContext *avctx,
208                                                 VAAPIEncodePicture *pic,
209                                                 int index, int *type,
210                                                 char *data, size_t *data_len)
211 {
212     VAAPIEncodeH264Context *priv = avctx->priv_data;
213     CodedBitstreamFragment   *au = &priv->current_access_unit;
214     int err, i;
215
216     if (priv->sei_needed) {
217         H264RawSEI *sei = &priv->raw_sei;
218
219         if (priv->aud_needed) {
220             err = vaapi_encode_h264_add_nal(avctx, au, &priv->raw_aud);
221             if (err < 0)
222                 goto fail;
223             priv->aud_needed = 0;
224         }
225
226         *sei = (H264RawSEI) {
227             .nal_unit_header = {
228                 .nal_unit_type = H264_NAL_SEI,
229             },
230         };
231
232         i = 0;
233
234         if (priv->sei_needed & SEI_IDENTIFIER) {
235             sei->payload[i].payload_type = H264_SEI_TYPE_USER_DATA_UNREGISTERED;
236             sei->payload[i].payload.user_data_unregistered = priv->sei_identifier;
237             ++i;
238         }
239         if (priv->sei_needed & SEI_TIMING) {
240             if (pic->type == PICTURE_TYPE_IDR) {
241                 sei->payload[i].payload_type = H264_SEI_TYPE_BUFFERING_PERIOD;
242                 sei->payload[i].payload.buffering_period = priv->sei_buffering_period;
243                 ++i;
244             }
245             sei->payload[i].payload_type = H264_SEI_TYPE_PIC_TIMING;
246             sei->payload[i].payload.pic_timing = priv->sei_pic_timing;
247             ++i;
248         }
249         if (priv->sei_needed & SEI_RECOVERY_POINT) {
250             sei->payload[i].payload_type = H264_SEI_TYPE_RECOVERY_POINT;
251             sei->payload[i].payload.recovery_point = priv->sei_recovery_point;
252             ++i;
253         }
254
255         sei->payload_count = i;
256         av_assert0(sei->payload_count > 0);
257
258         err = vaapi_encode_h264_add_nal(avctx, au, sei);
259         if (err < 0)
260             goto fail;
261         priv->sei_needed = 0;
262
263         err = vaapi_encode_h264_write_access_unit(avctx, data, data_len, au);
264         if (err < 0)
265             goto fail;
266
267         ff_cbs_fragment_uninit(priv->cbc, au);
268
269         *type = VAEncPackedHeaderRawData;
270         return 0;
271
272 #if !CONFIG_VAAPI_1
273     } else if (priv->sei_cbr_workaround_needed) {
274         // Insert a zero-length header using the old SEI type.  This is
275         // required to avoid triggering broken behaviour on Intel platforms
276         // in CBR mode where an invalid SEI message is generated by the
277         // driver and inserted into the stream.
278         *data_len = 0;
279         *type = VAEncPackedHeaderH264_SEI;
280         priv->sei_cbr_workaround_needed = 0;
281         return 0;
282 #endif
283
284     } else {
285         return AVERROR_EOF;
286     }
287
288 fail:
289     ff_cbs_fragment_uninit(priv->cbc, au);
290     return err;
291 }
292
293 static int vaapi_encode_h264_init_sequence_params(AVCodecContext *avctx)
294 {
295     VAAPIEncodeContext                *ctx = avctx->priv_data;
296     VAAPIEncodeH264Context           *priv = avctx->priv_data;
297     H264RawSPS                        *sps = &priv->raw_sps;
298     H264RawPPS                        *pps = &priv->raw_pps;
299     VAEncSequenceParameterBufferH264 *vseq = ctx->codec_sequence_params;
300     VAEncPictureParameterBufferH264  *vpic = ctx->codec_picture_params;
301
302     memset(&priv->current_access_unit, 0,
303            sizeof(priv->current_access_unit));
304
305     memset(sps, 0, sizeof(*sps));
306     memset(pps, 0, sizeof(*pps));
307
308     sps->nal_unit_header.nal_ref_idc   = 3;
309     sps->nal_unit_header.nal_unit_type = H264_NAL_SPS;
310
311     sps->profile_idc = avctx->profile & 0xff;
312
313     if (avctx->profile == FF_PROFILE_H264_CONSTRAINED_BASELINE ||
314         avctx->profile == FF_PROFILE_H264_MAIN)
315         sps->constraint_set1_flag = 1;
316
317     if (avctx->profile == FF_PROFILE_H264_HIGH)
318         sps->constraint_set3_flag = ctx->gop_size == 1;
319
320     if (avctx->profile == FF_PROFILE_H264_MAIN ||
321         avctx->profile == FF_PROFILE_H264_HIGH) {
322         sps->constraint_set4_flag = 1;
323         sps->constraint_set5_flag = ctx->b_per_p == 0;
324     }
325
326     if (ctx->gop_size == 1)
327         priv->dpb_frames = 0;
328     else
329         priv->dpb_frames = 1 + ctx->max_b_depth;
330
331     if (avctx->level != FF_LEVEL_UNKNOWN) {
332         sps->level_idc = avctx->level;
333     } else {
334         const H264LevelDescriptor *level;
335
336         level = ff_h264_guess_level(sps->profile_idc,
337                                     avctx->bit_rate,
338                                     priv->mb_width  * 16,
339                                     priv->mb_height * 16,
340                                     priv->dpb_frames);
341         if (level) {
342             av_log(avctx, AV_LOG_VERBOSE, "Using level %s.\n", level->name);
343             if (level->constraint_set3_flag)
344                 sps->constraint_set3_flag = 1;
345             sps->level_idc = level->level_idc;
346         } else {
347             av_log(avctx, AV_LOG_WARNING, "Stream will not conform "
348                    "to any level: using level 6.2.\n");
349             sps->level_idc = 62;
350         }
351     }
352
353     sps->seq_parameter_set_id = 0;
354     sps->chroma_format_idc    = 1;
355
356     sps->log2_max_frame_num_minus4 = 4;
357     sps->pic_order_cnt_type        = 0;
358     sps->log2_max_pic_order_cnt_lsb_minus4 = 4;
359
360     sps->max_num_ref_frames = priv->dpb_frames;
361
362     sps->pic_width_in_mbs_minus1        = priv->mb_width  - 1;
363     sps->pic_height_in_map_units_minus1 = priv->mb_height - 1;
364
365     sps->frame_mbs_only_flag = 1;
366     sps->direct_8x8_inference_flag = 1;
367
368     if (avctx->width  != 16 * priv->mb_width ||
369         avctx->height != 16 * priv->mb_height) {
370         sps->frame_cropping_flag = 1;
371
372         sps->frame_crop_left_offset   = 0;
373         sps->frame_crop_right_offset  =
374             (16 * priv->mb_width - avctx->width) / 2;
375         sps->frame_crop_top_offset    = 0;
376         sps->frame_crop_bottom_offset =
377             (16 * priv->mb_height - avctx->height) / 2;
378     } else {
379         sps->frame_cropping_flag = 0;
380     }
381
382     sps->vui_parameters_present_flag = 1;
383
384     if (avctx->sample_aspect_ratio.num != 0 &&
385         avctx->sample_aspect_ratio.den != 0) {
386         static const AVRational sar_idc[] = {
387             {   0,  0 },
388             {   1,  1 }, {  12, 11 }, {  10, 11 }, {  16, 11 },
389             {  40, 33 }, {  24, 11 }, {  20, 11 }, {  32, 11 },
390             {  80, 33 }, {  18, 11 }, {  15, 11 }, {  64, 33 },
391             { 160, 99 }, {   4,  3 }, {   3,  2 }, {   2,  1 },
392         };
393         int num, den, i;
394         av_reduce(&num, &den, avctx->sample_aspect_ratio.num,
395                   avctx->sample_aspect_ratio.den, 65535);
396         for (i = 0; i < FF_ARRAY_ELEMS(sar_idc); i++) {
397             if (num == sar_idc[i].num &&
398                 den == sar_idc[i].den) {
399                 sps->vui.aspect_ratio_idc = i;
400                 break;
401             }
402         }
403         if (i >= FF_ARRAY_ELEMS(sar_idc)) {
404             sps->vui.aspect_ratio_idc = 255;
405             sps->vui.sar_width  = num;
406             sps->vui.sar_height = den;
407         }
408         sps->vui.aspect_ratio_info_present_flag = 1;
409     }
410
411     if (avctx->color_range     != AVCOL_RANGE_UNSPECIFIED ||
412         avctx->color_primaries != AVCOL_PRI_UNSPECIFIED ||
413         avctx->color_trc       != AVCOL_TRC_UNSPECIFIED ||
414         avctx->colorspace      != AVCOL_SPC_UNSPECIFIED) {
415         sps->vui.video_signal_type_present_flag = 1;
416         sps->vui.video_format      = 5; // Unspecified.
417         sps->vui.video_full_range_flag =
418             avctx->color_range == AVCOL_RANGE_JPEG;
419
420         if (avctx->color_primaries != AVCOL_PRI_UNSPECIFIED ||
421             avctx->color_trc       != AVCOL_TRC_UNSPECIFIED ||
422             avctx->colorspace      != AVCOL_SPC_UNSPECIFIED) {
423             sps->vui.colour_description_present_flag = 1;
424             sps->vui.colour_primaries         = avctx->color_primaries;
425             sps->vui.transfer_characteristics = avctx->color_trc;
426             sps->vui.matrix_coefficients      = avctx->colorspace;
427         }
428     } else {
429         sps->vui.video_format             = 5;
430         sps->vui.video_full_range_flag    = 0;
431         sps->vui.colour_primaries         = avctx->color_primaries;
432         sps->vui.transfer_characteristics = avctx->color_trc;
433         sps->vui.matrix_coefficients      = avctx->colorspace;
434     }
435
436     if (avctx->chroma_sample_location != AVCHROMA_LOC_UNSPECIFIED) {
437         sps->vui.chroma_loc_info_present_flag = 1;
438         sps->vui.chroma_sample_loc_type_top_field    =
439         sps->vui.chroma_sample_loc_type_bottom_field =
440             avctx->chroma_sample_location - 1;
441     }
442
443     sps->vui.timing_info_present_flag = 1;
444     if (avctx->framerate.num > 0 && avctx->framerate.den > 0) {
445         sps->vui.num_units_in_tick = avctx->framerate.den;
446         sps->vui.time_scale        = 2 * avctx->framerate.num;
447         sps->vui.fixed_frame_rate_flag = 1;
448     } else {
449         sps->vui.num_units_in_tick = avctx->time_base.num;
450         sps->vui.time_scale        = 2 * avctx->time_base.den;
451         sps->vui.fixed_frame_rate_flag = 0;
452     }
453
454     if (priv->sei & SEI_TIMING) {
455         H264RawHRD *hrd = &sps->vui.nal_hrd_parameters;
456         H264RawSEIBufferingPeriod *bp = &priv->sei_buffering_period;
457
458         sps->vui.nal_hrd_parameters_present_flag = 1;
459
460         hrd->cpb_cnt_minus1 = 0;
461
462         // Try to scale these to a sensible range so that the
463         // golomb encode of the value is not overlong.
464         hrd->bit_rate_scale =
465             av_clip_uintp2(av_log2(ctx->va_bit_rate) - 15 - 6, 4);
466         hrd->bit_rate_value_minus1[0] =
467             (ctx->va_bit_rate >> hrd->bit_rate_scale + 6) - 1;
468
469         hrd->cpb_size_scale =
470             av_clip_uintp2(av_log2(ctx->hrd_params.hrd.buffer_size) - 15 - 4, 4);
471         hrd->cpb_size_value_minus1[0] =
472             (ctx->hrd_params.hrd.buffer_size >> hrd->cpb_size_scale + 4) - 1;
473
474         // CBR mode as defined for the HRD cannot be achieved without filler
475         // data, so this flag cannot be set even with VAAPI CBR modes.
476         hrd->cbr_flag[0] = 0;
477
478         hrd->initial_cpb_removal_delay_length_minus1 = 23;
479         hrd->cpb_removal_delay_length_minus1         = 23;
480         hrd->dpb_output_delay_length_minus1          = 7;
481         hrd->time_offset_length                      = 0;
482
483         bp->seq_parameter_set_id = sps->seq_parameter_set_id;
484
485         // This calculation can easily overflow 32 bits.
486         bp->nal.initial_cpb_removal_delay[0] = 90000 *
487             (uint64_t)ctx->hrd_params.hrd.initial_buffer_fullness /
488             ctx->hrd_params.hrd.buffer_size;
489         bp->nal.initial_cpb_removal_delay_offset[0] = 0;
490     } else {
491         sps->vui.nal_hrd_parameters_present_flag = 0;
492         sps->vui.low_delay_hrd_flag = 1 - sps->vui.fixed_frame_rate_flag;
493     }
494
495     sps->vui.bitstream_restriction_flag    = 1;
496     sps->vui.motion_vectors_over_pic_boundaries_flag = 1;
497     sps->vui.log2_max_mv_length_horizontal = 15;
498     sps->vui.log2_max_mv_length_vertical   = 15;
499     sps->vui.max_num_reorder_frames        = ctx->max_b_depth;
500     sps->vui.max_dec_frame_buffering       = ctx->max_b_depth + 1;
501
502     pps->nal_unit_header.nal_ref_idc = 3;
503     pps->nal_unit_header.nal_unit_type = H264_NAL_PPS;
504
505     pps->pic_parameter_set_id = 0;
506     pps->seq_parameter_set_id = 0;
507
508     pps->entropy_coding_mode_flag =
509         !(sps->profile_idc == FF_PROFILE_H264_BASELINE ||
510           sps->profile_idc == FF_PROFILE_H264_EXTENDED ||
511           sps->profile_idc == FF_PROFILE_H264_CAVLC_444);
512     if (!priv->coder && pps->entropy_coding_mode_flag)
513         pps->entropy_coding_mode_flag = 0;
514
515     pps->num_ref_idx_l0_default_active_minus1 = 0;
516     pps->num_ref_idx_l1_default_active_minus1 = 0;
517
518     pps->pic_init_qp_minus26 = priv->fixed_qp_idr - 26;
519
520     if (sps->profile_idc == FF_PROFILE_H264_BASELINE ||
521         sps->profile_idc == FF_PROFILE_H264_EXTENDED ||
522         sps->profile_idc == FF_PROFILE_H264_MAIN) {
523         pps->more_rbsp_data = 0;
524     } else {
525         pps->more_rbsp_data = 1;
526
527         pps->transform_8x8_mode_flag = 1;
528     }
529
530     *vseq = (VAEncSequenceParameterBufferH264) {
531         .seq_parameter_set_id = sps->seq_parameter_set_id,
532         .level_idc        = sps->level_idc,
533         .intra_period     = ctx->gop_size,
534         .intra_idr_period = ctx->gop_size,
535         .ip_period        = ctx->b_per_p + 1,
536
537         .bits_per_second       = ctx->va_bit_rate,
538         .max_num_ref_frames    = sps->max_num_ref_frames,
539         .picture_width_in_mbs  = sps->pic_width_in_mbs_minus1 + 1,
540         .picture_height_in_mbs = sps->pic_height_in_map_units_minus1 + 1,
541
542         .seq_fields.bits = {
543             .chroma_format_idc                 = sps->chroma_format_idc,
544             .frame_mbs_only_flag               = sps->frame_mbs_only_flag,
545             .mb_adaptive_frame_field_flag      = sps->mb_adaptive_frame_field_flag,
546             .seq_scaling_matrix_present_flag   = sps->seq_scaling_matrix_present_flag,
547             .direct_8x8_inference_flag         = sps->direct_8x8_inference_flag,
548             .log2_max_frame_num_minus4         = sps->log2_max_frame_num_minus4,
549             .pic_order_cnt_type                = sps->pic_order_cnt_type,
550             .log2_max_pic_order_cnt_lsb_minus4 = sps->log2_max_pic_order_cnt_lsb_minus4,
551             .delta_pic_order_always_zero_flag  = sps->delta_pic_order_always_zero_flag,
552         },
553
554         .bit_depth_luma_minus8   = sps->bit_depth_luma_minus8,
555         .bit_depth_chroma_minus8 = sps->bit_depth_chroma_minus8,
556
557         .frame_cropping_flag      = sps->frame_cropping_flag,
558         .frame_crop_left_offset   = sps->frame_crop_left_offset,
559         .frame_crop_right_offset  = sps->frame_crop_right_offset,
560         .frame_crop_top_offset    = sps->frame_crop_top_offset,
561         .frame_crop_bottom_offset = sps->frame_crop_bottom_offset,
562
563         .vui_parameters_present_flag = sps->vui_parameters_present_flag,
564
565         .vui_fields.bits = {
566             .aspect_ratio_info_present_flag = sps->vui.aspect_ratio_info_present_flag,
567             .timing_info_present_flag       = sps->vui.timing_info_present_flag,
568             .bitstream_restriction_flag     = sps->vui.bitstream_restriction_flag,
569             .log2_max_mv_length_horizontal  = sps->vui.log2_max_mv_length_horizontal,
570             .log2_max_mv_length_vertical    = sps->vui.log2_max_mv_length_vertical,
571         },
572
573         .aspect_ratio_idc  = sps->vui.aspect_ratio_idc,
574         .sar_width         = sps->vui.sar_width,
575         .sar_height        = sps->vui.sar_height,
576         .num_units_in_tick = sps->vui.num_units_in_tick,
577         .time_scale        = sps->vui.time_scale,
578     };
579
580     *vpic = (VAEncPictureParameterBufferH264) {
581         .CurrPic = {
582             .picture_id = VA_INVALID_ID,
583             .flags      = VA_PICTURE_H264_INVALID,
584         },
585
586         .coded_buf = VA_INVALID_ID,
587
588         .pic_parameter_set_id = pps->pic_parameter_set_id,
589         .seq_parameter_set_id = pps->seq_parameter_set_id,
590
591         .pic_init_qp                  = pps->pic_init_qp_minus26 + 26,
592         .num_ref_idx_l0_active_minus1 = pps->num_ref_idx_l0_default_active_minus1,
593         .num_ref_idx_l1_active_minus1 = pps->num_ref_idx_l1_default_active_minus1,
594
595         .chroma_qp_index_offset        = pps->chroma_qp_index_offset,
596         .second_chroma_qp_index_offset = pps->second_chroma_qp_index_offset,
597
598         .pic_fields.bits = {
599             .entropy_coding_mode_flag        = pps->entropy_coding_mode_flag,
600             .weighted_pred_flag              = pps->weighted_pred_flag,
601             .weighted_bipred_idc             = pps->weighted_bipred_idc,
602             .constrained_intra_pred_flag     = pps->constrained_intra_pred_flag,
603             .transform_8x8_mode_flag         = pps->transform_8x8_mode_flag,
604             .deblocking_filter_control_present_flag =
605                 pps->deblocking_filter_control_present_flag,
606             .redundant_pic_cnt_present_flag  = pps->redundant_pic_cnt_present_flag,
607             .pic_order_present_flag          =
608                 pps->bottom_field_pic_order_in_frame_present_flag,
609             .pic_scaling_matrix_present_flag = pps->pic_scaling_matrix_present_flag,
610         },
611     };
612
613     return 0;
614 }
615
616 static int vaapi_encode_h264_init_picture_params(AVCodecContext *avctx,
617                                                  VAAPIEncodePicture *pic)
618 {
619     VAAPIEncodeContext               *ctx = avctx->priv_data;
620     VAAPIEncodeH264Context          *priv = avctx->priv_data;
621     VAAPIEncodeH264Picture          *hpic = pic->priv_data;
622     VAAPIEncodePicture              *prev = pic->prev;
623     VAAPIEncodeH264Picture         *hprev = prev ? prev->priv_data : NULL;
624     VAEncPictureParameterBufferH264 *vpic = pic->codec_picture_params;
625     int i;
626
627     memset(&priv->current_access_unit, 0,
628            sizeof(priv->current_access_unit));
629
630     if (pic->type == PICTURE_TYPE_IDR) {
631         av_assert0(pic->display_order == pic->encode_order);
632
633         hpic->frame_num      = 0;
634         hpic->last_idr_frame = pic->display_order;
635         hpic->idr_pic_id     = hprev ? hprev->idr_pic_id + 1 : 0;
636
637         hpic->primary_pic_type = 0;
638         hpic->slice_type       = 7;
639     } else {
640         av_assert0(prev);
641
642         hpic->frame_num = hprev->frame_num + prev->is_reference;
643
644         hpic->last_idr_frame = hprev->last_idr_frame;
645         hpic->idr_pic_id     = hprev->idr_pic_id;
646
647         if (pic->type == PICTURE_TYPE_I) {
648             hpic->slice_type       = 7;
649             hpic->primary_pic_type = 0;
650         } else if (pic->type == PICTURE_TYPE_P) {
651             hpic->slice_type       = 5;
652             hpic->primary_pic_type = 1;
653         } else {
654             hpic->slice_type       = 6;
655             hpic->primary_pic_type = 2;
656         }
657     }
658     hpic->pic_order_cnt = pic->display_order - hpic->last_idr_frame;
659     hpic->dpb_delay     = pic->display_order - pic->encode_order + ctx->max_b_depth;
660     hpic->cpb_delay     = pic->encode_order - hpic->last_idr_frame;
661
662     if (priv->aud) {
663         priv->aud_needed = 1;
664         priv->raw_aud = (H264RawAUD) {
665             .nal_unit_header = {
666                 .nal_unit_type = H264_NAL_AUD,
667             },
668             .primary_pic_type  = hpic->primary_pic_type,
669         };
670     } else {
671         priv->aud_needed = 0;
672     }
673
674     priv->sei_needed = 0;
675
676     if (priv->sei & SEI_IDENTIFIER && pic->encode_order == 0)
677         priv->sei_needed |= SEI_IDENTIFIER;
678 #if !CONFIG_VAAPI_1
679     if (ctx->va_rc_mode == VA_RC_CBR)
680         priv->sei_cbr_workaround_needed = 1;
681 #endif
682
683     if (priv->sei & SEI_TIMING) {
684         priv->sei_pic_timing = (H264RawSEIPicTiming) {
685             .cpb_removal_delay = 2 * hpic->cpb_delay,
686             .dpb_output_delay  = 2 * hpic->dpb_delay,
687         };
688
689         priv->sei_needed |= SEI_TIMING;
690     }
691
692     if (priv->sei & SEI_RECOVERY_POINT && pic->type == PICTURE_TYPE_I) {
693         priv->sei_recovery_point = (H264RawSEIRecoveryPoint) {
694             .recovery_frame_cnt = 0,
695             .exact_match_flag   = 1,
696             .broken_link_flag   = ctx->b_per_p > 0,
697         };
698
699         priv->sei_needed |= SEI_RECOVERY_POINT;
700     }
701
702     vpic->CurrPic = (VAPictureH264) {
703         .picture_id          = pic->recon_surface,
704         .frame_idx           = hpic->frame_num,
705         .flags               = 0,
706         .TopFieldOrderCnt    = hpic->pic_order_cnt,
707         .BottomFieldOrderCnt = hpic->pic_order_cnt,
708     };
709
710     for (i = 0; i < pic->nb_refs; i++) {
711         VAAPIEncodePicture      *ref = pic->refs[i];
712         VAAPIEncodeH264Picture *href;
713
714         av_assert0(ref && ref->encode_order < pic->encode_order);
715         href = ref->priv_data;
716
717         vpic->ReferenceFrames[i] = (VAPictureH264) {
718             .picture_id          = ref->recon_surface,
719             .frame_idx           = href->frame_num,
720             .flags               = VA_PICTURE_H264_SHORT_TERM_REFERENCE,
721             .TopFieldOrderCnt    = href->pic_order_cnt,
722             .BottomFieldOrderCnt = href->pic_order_cnt,
723         };
724     }
725     for (; i < FF_ARRAY_ELEMS(vpic->ReferenceFrames); i++) {
726         vpic->ReferenceFrames[i] = (VAPictureH264) {
727             .picture_id = VA_INVALID_ID,
728             .flags      = VA_PICTURE_H264_INVALID,
729         };
730     }
731
732     vpic->coded_buf = pic->output_buffer;
733
734     vpic->frame_num = hpic->frame_num;
735
736     vpic->pic_fields.bits.idr_pic_flag       = (pic->type == PICTURE_TYPE_IDR);
737     vpic->pic_fields.bits.reference_pic_flag = (pic->type != PICTURE_TYPE_B);
738
739     return 0;
740 }
741
742 static void vaapi_encode_h264_default_ref_pic_list(AVCodecContext *avctx,
743                                                    VAAPIEncodePicture *pic,
744                                                    VAAPIEncodePicture **rpl0,
745                                                    VAAPIEncodePicture **rpl1,
746                                                    int *rpl_size)
747 {
748     VAAPIEncodePicture *prev;
749     VAAPIEncodeH264Picture *hp, *hn, *hc;
750     int i, j, n = 0;
751
752     prev = pic->prev;
753     av_assert0(prev);
754     hp = pic->priv_data;
755
756     for (i = 0; i < pic->prev->nb_dpb_pics; i++) {
757         hn = prev->dpb[i]->priv_data;
758         av_assert0(hn->frame_num < hp->frame_num);
759
760         if (pic->type == PICTURE_TYPE_P) {
761             for (j = n; j > 0; j--) {
762                 hc = rpl0[j - 1]->priv_data;
763                 av_assert0(hc->frame_num != hn->frame_num);
764                 if (hc->frame_num > hn->frame_num)
765                     break;
766                 rpl0[j] = rpl0[j - 1];
767             }
768             rpl0[j] = prev->dpb[i];
769
770         } else if (pic->type == PICTURE_TYPE_B) {
771             for (j = n; j > 0; j--) {
772                 hc = rpl0[j - 1]->priv_data;
773                 av_assert0(hc->pic_order_cnt != hp->pic_order_cnt);
774                 if (hc->pic_order_cnt < hp->pic_order_cnt) {
775                     if (hn->pic_order_cnt > hp->pic_order_cnt ||
776                         hn->pic_order_cnt < hc->pic_order_cnt)
777                         break;
778                 } else {
779                     if (hn->pic_order_cnt > hc->pic_order_cnt)
780                         break;
781                 }
782                 rpl0[j] = rpl0[j - 1];
783             }
784             rpl0[j] = prev->dpb[i];
785
786             for (j = n; j > 0; j--) {
787                 hc = rpl1[j - 1]->priv_data;
788                 av_assert0(hc->pic_order_cnt != hp->pic_order_cnt);
789                 if (hc->pic_order_cnt > hp->pic_order_cnt) {
790                     if (hn->pic_order_cnt < hp->pic_order_cnt ||
791                         hn->pic_order_cnt > hc->pic_order_cnt)
792                         break;
793                 } else {
794                     if (hn->pic_order_cnt < hc->pic_order_cnt)
795                         break;
796                 }
797                 rpl1[j] = rpl1[j - 1];
798             }
799             rpl1[j] = prev->dpb[i];
800         }
801
802         ++n;
803     }
804
805     if (pic->type == PICTURE_TYPE_B) {
806         for (i = 0; i < n; i++) {
807             if (rpl0[i] != rpl1[i])
808                 break;
809         }
810         if (i == n)
811             FFSWAP(VAAPIEncodePicture*, rpl1[0], rpl1[1]);
812     }
813
814     if (pic->type == PICTURE_TYPE_P ||
815         pic->type == PICTURE_TYPE_B) {
816         av_log(avctx, AV_LOG_DEBUG, "Default RefPicList0 for fn=%d/poc=%d:",
817                hp->frame_num, hp->pic_order_cnt);
818         for (i = 0; i < n; i++) {
819             hn = rpl0[i]->priv_data;
820             av_log(avctx, AV_LOG_DEBUG, "  fn=%d/poc=%d",
821                    hn->frame_num, hn->pic_order_cnt);
822         }
823         av_log(avctx, AV_LOG_DEBUG, "\n");
824     }
825     if (pic->type == PICTURE_TYPE_B) {
826         av_log(avctx, AV_LOG_DEBUG, "Default RefPicList1 for fn=%d/poc=%d:",
827                hp->frame_num, hp->pic_order_cnt);
828         for (i = 0; i < n; i++) {
829             hn = rpl1[i]->priv_data;
830             av_log(avctx, AV_LOG_DEBUG, "  fn=%d/poc=%d",
831                    hn->frame_num, hn->pic_order_cnt);
832         }
833         av_log(avctx, AV_LOG_DEBUG, "\n");
834     }
835
836     *rpl_size = n;
837 }
838
839 static int vaapi_encode_h264_init_slice_params(AVCodecContext *avctx,
840                                                VAAPIEncodePicture *pic,
841                                                VAAPIEncodeSlice *slice)
842 {
843     VAAPIEncodeH264Context          *priv = avctx->priv_data;
844     VAAPIEncodeH264Picture          *hpic = pic->priv_data;
845     VAAPIEncodePicture              *prev = pic->prev;
846     H264RawSPS                       *sps = &priv->raw_sps;
847     H264RawPPS                       *pps = &priv->raw_pps;
848     H264RawSliceHeader                *sh = &priv->raw_slice.header;
849     VAEncPictureParameterBufferH264 *vpic = pic->codec_picture_params;
850     VAEncSliceParameterBufferH264 *vslice = slice->codec_slice_params;
851     int i, j;
852
853     if (pic->type == PICTURE_TYPE_IDR) {
854         sh->nal_unit_header.nal_unit_type = H264_NAL_IDR_SLICE;
855         sh->nal_unit_header.nal_ref_idc   = 3;
856     } else {
857         sh->nal_unit_header.nal_unit_type = H264_NAL_SLICE;
858         sh->nal_unit_header.nal_ref_idc   = pic->is_reference;
859     }
860
861     sh->first_mb_in_slice = slice->block_start;
862     sh->slice_type        = hpic->slice_type;
863
864     sh->pic_parameter_set_id = pps->pic_parameter_set_id;
865
866     sh->frame_num = hpic->frame_num &
867         ((1 << (4 + sps->log2_max_frame_num_minus4)) - 1);
868     sh->idr_pic_id = hpic->idr_pic_id;
869     sh->pic_order_cnt_lsb = hpic->pic_order_cnt &
870         ((1 << (4 + sps->log2_max_pic_order_cnt_lsb_minus4)) - 1);
871
872     sh->direct_spatial_mv_pred_flag = 1;
873
874     if (pic->type == PICTURE_TYPE_B)
875         sh->slice_qp_delta = priv->fixed_qp_b - (pps->pic_init_qp_minus26 + 26);
876     else if (pic->type == PICTURE_TYPE_P)
877         sh->slice_qp_delta = priv->fixed_qp_p - (pps->pic_init_qp_minus26 + 26);
878     else
879         sh->slice_qp_delta = priv->fixed_qp_idr - (pps->pic_init_qp_minus26 + 26);
880
881     if (pic->is_reference && pic->type != PICTURE_TYPE_IDR) {
882         VAAPIEncodePicture *discard_list[MAX_DPB_SIZE];
883         int discard = 0, keep = 0;
884
885         // Discard everything which is in the DPB of the previous frame but
886         // not in the DPB of this one.
887         for (i = 0; i < prev->nb_dpb_pics; i++) {
888             for (j = 0; j < pic->nb_dpb_pics; j++) {
889                 if (prev->dpb[i] == pic->dpb[j])
890                     break;
891             }
892             if (j == pic->nb_dpb_pics) {
893                 discard_list[discard] = prev->dpb[i];
894                 ++discard;
895             } else {
896                 ++keep;
897             }
898         }
899         av_assert0(keep <= priv->dpb_frames);
900
901         if (discard == 0) {
902             sh->adaptive_ref_pic_marking_mode_flag = 0;
903         } else {
904             sh->adaptive_ref_pic_marking_mode_flag = 1;
905             for (i = 0; i < discard; i++) {
906                 VAAPIEncodeH264Picture *old = discard_list[i]->priv_data;
907                 av_assert0(old->frame_num < hpic->frame_num);
908                 sh->mmco[i].memory_management_control_operation = 1;
909                 sh->mmco[i].difference_of_pic_nums_minus1 =
910                     hpic->frame_num - old->frame_num - 1;
911             }
912             sh->mmco[i].memory_management_control_operation = 0;
913         }
914     }
915
916     // If the intended references are not the first entries of RefPicListN
917     // by default, use ref-pic-list-modification to move them there.
918     if (pic->type == PICTURE_TYPE_P || pic->type == PICTURE_TYPE_B) {
919         VAAPIEncodePicture *def_l0[MAX_DPB_SIZE], *def_l1[MAX_DPB_SIZE];
920         VAAPIEncodeH264Picture *href;
921         int n;
922
923         vaapi_encode_h264_default_ref_pic_list(avctx, pic,
924                                                def_l0, def_l1, &n);
925
926         if (pic->type == PICTURE_TYPE_P) {
927             int need_rplm = 0;
928             for (i = 0; i < pic->nb_refs; i++) {
929                 av_assert0(pic->refs[i]);
930                 if (pic->refs[i] != def_l0[i])
931                     need_rplm = 1;
932             }
933
934             sh->ref_pic_list_modification_flag_l0 = need_rplm;
935             if (need_rplm) {
936                 int pic_num = hpic->frame_num;
937                 for (i = 0; i < pic->nb_refs; i++) {
938                     href = pic->refs[i]->priv_data;
939                     av_assert0(href->frame_num != pic_num);
940                     if (href->frame_num < pic_num) {
941                         sh->rplm_l0[i].modification_of_pic_nums_idc = 0;
942                         sh->rplm_l0[i].abs_diff_pic_num_minus1 =
943                             pic_num - href->frame_num - 1;
944                     } else {
945                         sh->rplm_l0[i].modification_of_pic_nums_idc = 1;
946                         sh->rplm_l0[i].abs_diff_pic_num_minus1 =
947                             href->frame_num - pic_num - 1;
948                     }
949                     pic_num = href->frame_num;
950                 }
951                 sh->rplm_l0[i].modification_of_pic_nums_idc = 3;
952             }
953
954         } else {
955             int need_rplm_l0 = 0, need_rplm_l1 = 0;
956             int n0 = 0, n1 = 0;
957             for (i = 0; i < pic->nb_refs; i++) {
958                 av_assert0(pic->refs[i]);
959                 href = pic->refs[i]->priv_data;
960                 av_assert0(href->pic_order_cnt != hpic->pic_order_cnt);
961                 if (href->pic_order_cnt < hpic->pic_order_cnt) {
962                     if (pic->refs[i] != def_l0[n0])
963                         need_rplm_l0 = 1;
964                     ++n0;
965                 } else {
966                     if (pic->refs[i] != def_l1[n1])
967                         need_rplm_l1 = 1;
968                     ++n1;
969                 }
970             }
971
972             sh->ref_pic_list_modification_flag_l0 = need_rplm_l0;
973             if (need_rplm_l0) {
974                 int pic_num = hpic->frame_num;
975                 for (i = j = 0; i < pic->nb_refs; i++) {
976                     href = pic->refs[i]->priv_data;
977                     if (href->pic_order_cnt > hpic->pic_order_cnt)
978                         continue;
979                     av_assert0(href->frame_num != pic_num);
980                     if (href->frame_num < pic_num) {
981                         sh->rplm_l0[j].modification_of_pic_nums_idc = 0;
982                         sh->rplm_l0[j].abs_diff_pic_num_minus1 =
983                             pic_num - href->frame_num - 1;
984                     } else {
985                         sh->rplm_l0[j].modification_of_pic_nums_idc = 1;
986                         sh->rplm_l0[j].abs_diff_pic_num_minus1 =
987                             href->frame_num - pic_num - 1;
988                     }
989                     pic_num = href->frame_num;
990                     ++j;
991                 }
992                 av_assert0(j == n0);
993                 sh->rplm_l0[j].modification_of_pic_nums_idc = 3;
994             }
995
996             sh->ref_pic_list_modification_flag_l1 = need_rplm_l1;
997             if (need_rplm_l1) {
998                 int pic_num = hpic->frame_num;
999                 for (i = j = 0; i < pic->nb_refs; i++) {
1000                     href = pic->refs[i]->priv_data;
1001                     if (href->pic_order_cnt < hpic->pic_order_cnt)
1002                         continue;
1003                     av_assert0(href->frame_num != pic_num);
1004                     if (href->frame_num < pic_num) {
1005                         sh->rplm_l1[j].modification_of_pic_nums_idc = 0;
1006                         sh->rplm_l1[j].abs_diff_pic_num_minus1 =
1007                             pic_num - href->frame_num - 1;
1008                     } else {
1009                         sh->rplm_l1[j].modification_of_pic_nums_idc = 1;
1010                         sh->rplm_l1[j].abs_diff_pic_num_minus1 =
1011                             href->frame_num - pic_num - 1;
1012                     }
1013                     pic_num = href->frame_num;
1014                     ++j;
1015                 }
1016                 av_assert0(j == n1);
1017                 sh->rplm_l1[j].modification_of_pic_nums_idc = 3;
1018             }
1019         }
1020     }
1021
1022     vslice->macroblock_address = slice->block_start;
1023     vslice->num_macroblocks    = slice->block_size;
1024
1025     vslice->macroblock_info = VA_INVALID_ID;
1026
1027     vslice->slice_type           = sh->slice_type % 5;
1028     vslice->pic_parameter_set_id = sh->pic_parameter_set_id;
1029     vslice->idr_pic_id           = sh->idr_pic_id;
1030
1031     vslice->pic_order_cnt_lsb = sh->pic_order_cnt_lsb;
1032
1033     vslice->direct_spatial_mv_pred_flag = sh->direct_spatial_mv_pred_flag;
1034
1035     for (i = 0; i < FF_ARRAY_ELEMS(vslice->RefPicList0); i++) {
1036         vslice->RefPicList0[i].picture_id = VA_INVALID_ID;
1037         vslice->RefPicList0[i].flags      = VA_PICTURE_H264_INVALID;
1038         vslice->RefPicList1[i].picture_id = VA_INVALID_ID;
1039         vslice->RefPicList1[i].flags      = VA_PICTURE_H264_INVALID;
1040     }
1041
1042     av_assert0(pic->nb_refs <= 2);
1043     if (pic->nb_refs >= 1) {
1044         // Backward reference for P- or B-frame.
1045         av_assert0(pic->type == PICTURE_TYPE_P ||
1046                    pic->type == PICTURE_TYPE_B);
1047         vslice->RefPicList0[0] = vpic->ReferenceFrames[0];
1048     }
1049     if (pic->nb_refs >= 2) {
1050         // Forward reference for B-frame.
1051         av_assert0(pic->type == PICTURE_TYPE_B);
1052         vslice->RefPicList1[0] = vpic->ReferenceFrames[1];
1053     }
1054
1055     vslice->slice_qp_delta = sh->slice_qp_delta;
1056
1057     return 0;
1058 }
1059
1060 static av_cold int vaapi_encode_h264_configure(AVCodecContext *avctx)
1061 {
1062     VAAPIEncodeContext      *ctx = avctx->priv_data;
1063     VAAPIEncodeH264Context *priv = avctx->priv_data;
1064     int err;
1065
1066     err = ff_cbs_init(&priv->cbc, AV_CODEC_ID_H264, avctx);
1067     if (err < 0)
1068         return err;
1069
1070     priv->mb_width  = FFALIGN(avctx->width,  16) / 16;
1071     priv->mb_height = FFALIGN(avctx->height, 16) / 16;
1072
1073     if (ctx->va_rc_mode == VA_RC_CQP) {
1074         priv->fixed_qp_p = priv->qp;
1075         if (avctx->i_quant_factor > 0.0)
1076             priv->fixed_qp_idr = (int)((priv->fixed_qp_p * avctx->i_quant_factor +
1077                                         avctx->i_quant_offset) + 0.5);
1078         else
1079             priv->fixed_qp_idr = priv->fixed_qp_p;
1080         if (avctx->b_quant_factor > 0.0)
1081             priv->fixed_qp_b = (int)((priv->fixed_qp_p * avctx->b_quant_factor +
1082                                       avctx->b_quant_offset) + 0.5);
1083         else
1084             priv->fixed_qp_b = priv->fixed_qp_p;
1085
1086         priv->sei &= ~SEI_TIMING;
1087
1088         av_log(avctx, AV_LOG_DEBUG, "Using fixed QP = "
1089                "%d / %d / %d for IDR- / P- / B-frames.\n",
1090                priv->fixed_qp_idr, priv->fixed_qp_p, priv->fixed_qp_b);
1091
1092     } else if (ctx->va_rc_mode == VA_RC_CBR ||
1093                ctx->va_rc_mode == VA_RC_VBR) {
1094         // These still need to be  set for pic_init_qp/slice_qp_delta.
1095         priv->fixed_qp_idr = 26;
1096         priv->fixed_qp_p   = 26;
1097         priv->fixed_qp_b   = 26;
1098
1099     } else {
1100         av_assert0(0 && "Invalid RC mode.");
1101     }
1102
1103     if (priv->sei & SEI_IDENTIFIER) {
1104         const char *lavc  = LIBAVCODEC_IDENT;
1105         const char *vaapi = VA_VERSION_S;
1106         const char *driver;
1107         int len;
1108
1109         memcpy(priv->sei_identifier.uuid_iso_iec_11578,
1110                vaapi_encode_h264_sei_identifier_uuid,
1111                sizeof(priv->sei_identifier.uuid_iso_iec_11578));
1112
1113         driver = vaQueryVendorString(ctx->hwctx->display);
1114         if (!driver)
1115             driver = "unknown driver";
1116
1117         len = snprintf(NULL, 0, "%s / VAAPI %s / %s", lavc, vaapi, driver);
1118         if (len >= 0) {
1119             priv->sei_identifier_string = av_malloc(len + 1);
1120             if (!priv->sei_identifier_string)
1121                 return AVERROR(ENOMEM);
1122
1123             snprintf(priv->sei_identifier_string, len + 1,
1124                      "%s / VAAPI %s / %s", lavc, vaapi, driver);
1125
1126             priv->sei_identifier.data        = priv->sei_identifier_string;
1127             priv->sei_identifier.data_length = len + 1;
1128         }
1129     }
1130
1131     return 0;
1132 }
1133
1134 static const VAAPIEncodeProfile vaapi_encode_h264_profiles[] = {
1135     { FF_PROFILE_H264_HIGH, 8, 3, 1, 1, VAProfileH264High },
1136     { FF_PROFILE_H264_MAIN, 8, 3, 1, 1, VAProfileH264Main },
1137     { FF_PROFILE_H264_CONSTRAINED_BASELINE,
1138                             8, 3, 1, 1, VAProfileH264ConstrainedBaseline },
1139     { FF_PROFILE_UNKNOWN }
1140 };
1141
1142 static const VAAPIEncodeType vaapi_encode_type_h264 = {
1143     .profiles              = vaapi_encode_h264_profiles,
1144
1145     .flags                 = FLAG_SLICE_CONTROL |
1146                              FLAG_B_PICTURES |
1147                              FLAG_B_PICTURE_REFERENCES |
1148                              FLAG_NON_IDR_KEY_PICTURES,
1149
1150     .configure             = &vaapi_encode_h264_configure,
1151
1152     .picture_priv_data_size = sizeof(VAAPIEncodeH264Picture),
1153
1154     .sequence_params_size  = sizeof(VAEncSequenceParameterBufferH264),
1155     .init_sequence_params  = &vaapi_encode_h264_init_sequence_params,
1156
1157     .picture_params_size   = sizeof(VAEncPictureParameterBufferH264),
1158     .init_picture_params   = &vaapi_encode_h264_init_picture_params,
1159
1160     .slice_params_size     = sizeof(VAEncSliceParameterBufferH264),
1161     .init_slice_params     = &vaapi_encode_h264_init_slice_params,
1162
1163     .sequence_header_type  = VAEncPackedHeaderSequence,
1164     .write_sequence_header = &vaapi_encode_h264_write_sequence_header,
1165
1166     .slice_header_type     = VAEncPackedHeaderH264_Slice,
1167     .write_slice_header    = &vaapi_encode_h264_write_slice_header,
1168
1169     .write_extra_header    = &vaapi_encode_h264_write_extra_header,
1170 };
1171
1172 static av_cold int vaapi_encode_h264_init(AVCodecContext *avctx)
1173 {
1174     VAAPIEncodeContext      *ctx = avctx->priv_data;
1175     VAAPIEncodeH264Context *priv = avctx->priv_data;
1176
1177     ctx->codec = &vaapi_encode_type_h264;
1178
1179     if (avctx->profile == FF_PROFILE_UNKNOWN)
1180         avctx->profile = priv->profile;
1181     if (avctx->level == FF_LEVEL_UNKNOWN)
1182         avctx->level = priv->level;
1183     if (avctx->compression_level == FF_COMPRESSION_DEFAULT)
1184         avctx->compression_level = priv->quality;
1185
1186     // Reject unsupported profiles.
1187     switch (avctx->profile) {
1188     case FF_PROFILE_H264_BASELINE:
1189         av_log(avctx, AV_LOG_WARNING, "H.264 baseline profile is not "
1190                "supported, using constrained baseline profile instead.\n");
1191         avctx->profile = FF_PROFILE_H264_CONSTRAINED_BASELINE;
1192         break;
1193     case FF_PROFILE_H264_EXTENDED:
1194         av_log(avctx, AV_LOG_ERROR, "H.264 extended profile "
1195                "is not supported.\n");
1196         return AVERROR_PATCHWELCOME;
1197     case FF_PROFILE_H264_HIGH_10:
1198     case FF_PROFILE_H264_HIGH_10_INTRA:
1199         av_log(avctx, AV_LOG_ERROR, "H.264 10-bit profiles "
1200                "are not supported.\n");
1201         return AVERROR_PATCHWELCOME;
1202     case FF_PROFILE_H264_HIGH_422:
1203     case FF_PROFILE_H264_HIGH_422_INTRA:
1204     case FF_PROFILE_H264_HIGH_444:
1205     case FF_PROFILE_H264_HIGH_444_PREDICTIVE:
1206     case FF_PROFILE_H264_HIGH_444_INTRA:
1207     case FF_PROFILE_H264_CAVLC_444:
1208         av_log(avctx, AV_LOG_ERROR, "H.264 non-4:2:0 profiles "
1209                "are not supported.\n");
1210         return AVERROR_PATCHWELCOME;
1211     }
1212
1213     if (avctx->level != FF_LEVEL_UNKNOWN && avctx->level & ~0xff) {
1214         av_log(avctx, AV_LOG_ERROR, "Invalid level %d: must fit "
1215                "in 8-bit unsigned integer.\n", avctx->level);
1216         return AVERROR(EINVAL);
1217     }
1218
1219     ctx->desired_packed_headers =
1220         VA_ENC_PACKED_HEADER_SEQUENCE | // SPS and PPS.
1221         VA_ENC_PACKED_HEADER_SLICE    | // Slice headers.
1222         VA_ENC_PACKED_HEADER_MISC;      // SEI.
1223
1224     ctx->surface_width  = FFALIGN(avctx->width,  16);
1225     ctx->surface_height = FFALIGN(avctx->height, 16);
1226
1227     ctx->slice_block_height = ctx->slice_block_width = 16;
1228
1229     return ff_vaapi_encode_init(avctx);
1230 }
1231
1232 static av_cold int vaapi_encode_h264_close(AVCodecContext *avctx)
1233 {
1234     VAAPIEncodeH264Context *priv = avctx->priv_data;
1235
1236     ff_cbs_close(&priv->cbc);
1237     av_freep(&priv->sei_identifier_string);
1238
1239     return ff_vaapi_encode_close(avctx);
1240 }
1241
1242 #define OFFSET(x) offsetof(VAAPIEncodeH264Context, x)
1243 #define FLAGS (AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM)
1244 static const AVOption vaapi_encode_h264_options[] = {
1245     VAAPI_ENCODE_COMMON_OPTIONS,
1246
1247     { "qp", "Constant QP (for P-frames; scaled by qfactor/qoffset for I/B)",
1248       OFFSET(qp), AV_OPT_TYPE_INT, { .i64 = 20 }, 0, 52, FLAGS },
1249     { "quality", "Set encode quality (trades off against speed, higher is faster)",
1250       OFFSET(quality), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT_MAX, FLAGS },
1251     { "coder", "Entropy coder type",
1252       OFFSET(coder), AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, FLAGS, "coder" },
1253         { "cavlc", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, INT_MIN, INT_MAX, FLAGS, "coder" },
1254         { "cabac", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, INT_MIN, INT_MAX, FLAGS, "coder" },
1255         { "vlc",   NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, INT_MIN, INT_MAX, FLAGS, "coder" },
1256         { "ac",    NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, INT_MIN, INT_MAX, FLAGS, "coder" },
1257
1258     { "aud", "Include AUD",
1259       OFFSET(aud), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, FLAGS },
1260
1261     { "sei", "Set SEI to include",
1262       OFFSET(sei), AV_OPT_TYPE_FLAGS,
1263       { .i64 = SEI_IDENTIFIER | SEI_TIMING | SEI_RECOVERY_POINT },
1264       0, INT_MAX, FLAGS, "sei" },
1265     { "identifier", "Include encoder version identifier",
1266       0, AV_OPT_TYPE_CONST, { .i64 = SEI_IDENTIFIER },
1267       INT_MIN, INT_MAX, FLAGS, "sei" },
1268     { "timing", "Include timing parameters (buffering_period and pic_timing)",
1269       0, AV_OPT_TYPE_CONST, { .i64 = SEI_TIMING },
1270       INT_MIN, INT_MAX, FLAGS, "sei" },
1271     { "recovery_point", "Include recovery points where appropriate",
1272       0, AV_OPT_TYPE_CONST, { .i64 = SEI_RECOVERY_POINT },
1273       INT_MIN, INT_MAX, FLAGS, "sei" },
1274
1275     { "profile", "Set profile (profile_idc and constraint_set*_flag)",
1276       OFFSET(profile), AV_OPT_TYPE_INT,
1277       { .i64 = FF_PROFILE_UNKNOWN }, FF_PROFILE_UNKNOWN, 0xffff, FLAGS, "profile" },
1278
1279 #define PROFILE(name, value)  name, NULL, 0, AV_OPT_TYPE_CONST, \
1280       { .i64 = value }, 0, 0, FLAGS, "profile"
1281     { PROFILE("constrained_baseline", FF_PROFILE_H264_CONSTRAINED_BASELINE) },
1282     { PROFILE("main",                 FF_PROFILE_H264_MAIN) },
1283     { PROFILE("high",                 FF_PROFILE_H264_HIGH) },
1284 #undef PROFILE
1285
1286     { "level", "Set level (level_idc)",
1287       OFFSET(level), AV_OPT_TYPE_INT,
1288       { .i64 = FF_LEVEL_UNKNOWN }, FF_LEVEL_UNKNOWN, 0xff, FLAGS, "level" },
1289
1290 #define LEVEL(name, value) name, NULL, 0, AV_OPT_TYPE_CONST, \
1291       { .i64 = value }, 0, 0, FLAGS, "level"
1292     { LEVEL("1",   10) },
1293     { LEVEL("1.1", 11) },
1294     { LEVEL("1.2", 12) },
1295     { LEVEL("1.3", 13) },
1296     { LEVEL("2",   20) },
1297     { LEVEL("2.1", 21) },
1298     { LEVEL("2.2", 22) },
1299     { LEVEL("3",   30) },
1300     { LEVEL("3.1", 31) },
1301     { LEVEL("3.2", 32) },
1302     { LEVEL("4",   40) },
1303     { LEVEL("4.1", 41) },
1304     { LEVEL("4.2", 42) },
1305     { LEVEL("5",   50) },
1306     { LEVEL("5.1", 51) },
1307     { LEVEL("5.2", 52) },
1308     { LEVEL("6",   60) },
1309     { LEVEL("6.1", 61) },
1310     { LEVEL("6.2", 62) },
1311 #undef LEVEL
1312
1313     { NULL },
1314 };
1315
1316 static const AVCodecDefault vaapi_encode_h264_defaults[] = {
1317     { "b",              "0"   },
1318     { "bf",             "2"   },
1319     { "g",              "120" },
1320     { "i_qfactor",      "1"   },
1321     { "i_qoffset",      "0"   },
1322     { "b_qfactor",      "6/5" },
1323     { "b_qoffset",      "0"   },
1324     { "qmin",           "-1"  },
1325     { "qmax",           "-1"  },
1326     { NULL },
1327 };
1328
1329 static const AVClass vaapi_encode_h264_class = {
1330     .class_name = "h264_vaapi",
1331     .item_name  = av_default_item_name,
1332     .option     = vaapi_encode_h264_options,
1333     .version    = LIBAVUTIL_VERSION_INT,
1334 };
1335
1336 AVCodec ff_h264_vaapi_encoder = {
1337     .name           = "h264_vaapi",
1338     .long_name      = NULL_IF_CONFIG_SMALL("H.264/AVC (VAAPI)"),
1339     .type           = AVMEDIA_TYPE_VIDEO,
1340     .id             = AV_CODEC_ID_H264,
1341     .priv_data_size = sizeof(VAAPIEncodeH264Context),
1342     .init           = &vaapi_encode_h264_init,
1343     .send_frame     = &ff_vaapi_encode_send_frame,
1344     .receive_packet = &ff_vaapi_encode_receive_packet,
1345     .close          = &vaapi_encode_h264_close,
1346     .priv_class     = &vaapi_encode_h264_class,
1347     .capabilities   = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_HARDWARE,
1348     .defaults       = vaapi_encode_h264_defaults,
1349     .pix_fmts = (const enum AVPixelFormat[]) {
1350         AV_PIX_FMT_VAAPI,
1351         AV_PIX_FMT_NONE,
1352     },
1353     .wrapper_name   = "vaapi",
1354 };