2 * Copyright © 2011 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the
6 * "Software"), to deal in the Software without restriction, including
7 * without limitation the rights to use, copy, modify, merge, publish,
8 * distribute, sub license, and/or sell copies of the Software, and to
9 * permit persons to whom the Software is furnished to do so, subject to
10 * the following conditions:
12 * The above copyright notice and this permission notice (including the
13 * next paragraph) shall be included in all copies or substantial portions
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
17 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
19 * IN NO EVENT SHALL PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR
20 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
21 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
22 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
#include <assert.h>
#include <stdlib.h>

#include <va/va_enc_h264.h>
#include <va/va_enc_mpeg2.h>

#include "i965_encoder_utils.h"
/* Number of buffer words a bitstream starts with and grows by. */
#define BITSTREAM_ALLOCATE_STEPPING     4096

/* nal_ref_idc values written into the NAL unit header. */
#define NAL_REF_IDC_NONE        0
#define NAL_REF_IDC_LOW         1
#define NAL_REF_IDC_MEDIUM      2
#define NAL_REF_IDC_HIGH        3

/* Base slice_type codes. */
#define SLICE_TYPE_P            0
#define SLICE_TYPE_B            1
#define SLICE_TYPE_I            2

/*
 * Slice type predicates.  Each accepts the base code or the base code plus 5.
 * The argument is fully parenthesized so that expressions such as
 * IS_B_SLICE(flags & 0xf) are evaluated as written.  The argument is still
 * evaluated twice, so it must not have side effects.
 */
#define IS_I_SLICE(type) (SLICE_TYPE_I == (type) || SLICE_TYPE_I == ((type) - 5))
#define IS_P_SLICE(type) (SLICE_TYPE_P == (type) || SLICE_TYPE_P == ((type) - 5))
#define IS_B_SLICE(type) (SLICE_TYPE_B == (type) || SLICE_TYPE_B == ((type) - 5))

#define ENTROPY_MODE_CAVLC      0
#define ENTROPY_MODE_CABAC      1

#define PROFILE_IDC_BASELINE    66
#define PROFILE_IDC_MAIN        77
#define PROFILE_IDC_HIGH        100
/*
 * Growable bit writer used to assemble packed headers.
 *
 * The members below are the ones the writer functions in this file access;
 * their types follow from that use (words are passed to swap32() and sized
 * with sizeof(unsigned int); bit_offset is copied into int locals).
 */
struct __avc_bitstream {
    unsigned int *buffer;       /* word storage, allocated by avc_bitstream_start() */
    int bit_offset;             /* number of bits written so far */
    int max_size_in_dword;      /* current capacity of buffer, in words */
};

typedef struct __avc_bitstream avc_bitstream;
/*
 * Build a word from the four bytes of `val` as they lie in memory, with the
 * first byte most significant.  Storing the result back to memory therefore
 * yields the bytes of `val` in most-significant-first order on any host.
 *
 * Each byte is widened to unsigned int before shifting: a plain
 * `pval[0] << 24` promotes to int and shifts into the sign bit for bytes
 * >= 0x80, which is undefined behaviour.
 */
static unsigned int
swap32(unsigned int val)
{
    const unsigned char *pval = (const unsigned char *)&val;

    return (((unsigned int)pval[0] << 24) |
            ((unsigned int)pval[1] << 16) |
            ((unsigned int)pval[2] << 8)  |
            ((unsigned int)pval[3] << 0));
}
83 avc_bitstream_start(avc_bitstream *bs)
85 bs->max_size_in_dword = BITSTREAM_ALLOCATE_STEPPING;
86 bs->buffer = calloc(bs->max_size_in_dword * sizeof(int), 1);
91 avc_bitstream_end(avc_bitstream *bs)
93 int pos = (bs->bit_offset >> 5);
94 int bit_offset = (bs->bit_offset & 0x1f);
95 int bit_left = 32 - bit_offset;
98 bs->buffer[pos] = swap32((bs->buffer[pos] << bit_left));
105 avc_bitstream_put_ui(avc_bitstream *bs, unsigned int val, int size_in_bits)
107 int pos = (bs->bit_offset >> 5);
108 int bit_offset = (bs->bit_offset & 0x1f);
109 int bit_left = 32 - bit_offset;
114 if (size_in_bits < 32)
115 val &= (( 1 << size_in_bits) - 1);
117 bs->bit_offset += size_in_bits;
119 if (bit_left > size_in_bits) {
120 bs->buffer[pos] = (bs->buffer[pos] << size_in_bits | val);
122 size_in_bits -= bit_left;
123 bs->buffer[pos] = (bs->buffer[pos] << bit_left) | (val >> size_in_bits);
124 bs->buffer[pos] = swap32(bs->buffer[pos]);
126 if (pos + 1 == bs->max_size_in_dword) {
127 bs->max_size_in_dword += BITSTREAM_ALLOCATE_STEPPING;
128 bs->buffer = realloc(bs->buffer, bs->max_size_in_dword * sizeof(unsigned int));
134 bs->buffer[pos + 1] = val;
139 avc_bitstream_put_ue(avc_bitstream *bs, unsigned int val)
141 int size_in_bits = 0;
149 avc_bitstream_put_ui(bs, 0, size_in_bits - 1); // leading zero
150 avc_bitstream_put_ui(bs, val, size_in_bits);
154 avc_bitstream_put_se(avc_bitstream *bs, int val)
156 unsigned int new_val;
161 new_val = 2 * val - 1;
163 avc_bitstream_put_ue(bs, new_val);
167 avc_bitstream_byte_aligning(avc_bitstream *bs, int bit)
169 int bit_offset = (bs->bit_offset & 0x7);
170 int bit_left = 8 - bit_offset;
176 assert(bit == 0 || bit == 1);
179 new_val = (1 << bit_left) - 1;
183 avc_bitstream_put_ui(bs, new_val, bit_left);
185 static void avc_rbsp_trailing_bits(avc_bitstream *bs)
187 avc_bitstream_put_ui(bs, 1, 1);
188 avc_bitstream_byte_aligning(bs, 0);
190 static void nal_start_code_prefix(avc_bitstream *bs)
192 avc_bitstream_put_ui(bs, 0x00000001, 32);
195 static void nal_header(avc_bitstream *bs, int nal_ref_idc, int nal_unit_type)
197 avc_bitstream_put_ui(bs, 0, 1); /* forbidden_zero_bit: 0 */
198 avc_bitstream_put_ui(bs, nal_ref_idc, 2);
199 avc_bitstream_put_ui(bs, nal_unit_type, 5);
/*
 * Write the H.264 slice header fields for one slice into `bs`, taking the
 * values from the sequence, picture and slice parameter buffers.  Fields are
 * emitted through the avc_bitstream_put_ui/ue/se writers in the order of the
 * calls below.
 *
 * NOTE(review): every line of this listing starts with a source line number
 * and the numbers are not contiguous, so some lines of this function are not
 * visible here (for example whatever follows the frame_mbs_only_flag test
 * and the weighted-prediction FIXME).  Confirm against the complete file
 * before relying on this description.
 */
203 slice_header(avc_bitstream *bs,
204 VAEncSequenceParameterBufferH264 *sps_param,
205 VAEncPictureParameterBufferH264 *pic_param,
206 VAEncSliceParameterBufferH264 *slice_param)
208 int first_mb_in_slice = slice_param->macroblock_address;
210 avc_bitstream_put_ue(bs, first_mb_in_slice); /* first_mb_in_slice: 0 */
211 avc_bitstream_put_ue(bs, slice_param->slice_type); /* slice_type */
212 avc_bitstream_put_ue(bs, slice_param->pic_parameter_set_id); /* pic_parameter_set_id: 0 */
/* frame_num is a fixed-width field of log2_max_frame_num_minus4 + 4 bits */
213 avc_bitstream_put_ui(bs, pic_param->frame_num, sps_param->seq_fields.bits.log2_max_frame_num_minus4 + 4); /* frame_num */
215 /* frame_mbs_only_flag == 1 */
/* branch taken when frame_mbs_only_flag is 0; its body is not visible in this listing */
216 if (!sps_param->seq_fields.bits.frame_mbs_only_flag) {
/* idr_pic_id is written only for IDR pictures */
221 if (pic_param->pic_fields.bits.idr_pic_flag)
222 avc_bitstream_put_ue(bs, slice_param->idr_pic_id); /* idr_pic_id: 0 */
/* POC type 0: TopFieldOrderCnt goes out in log2_max_pic_order_cnt_lsb_minus4 + 4 bits */
224 if (sps_param->seq_fields.bits.pic_order_cnt_type == 0) {
225 avc_bitstream_put_ui(bs, pic_param->CurrPic.TopFieldOrderCnt, sps_param->seq_fields.bits.log2_max_pic_order_cnt_lsb_minus4 + 4);
226 /* pic_order_present_flag == 0 */
232 /* redundant_pic_cnt_present_flag == 0 */
/* P slices: override flag, optional list-0 count, then a 0 reordering flag */
235 if (IS_P_SLICE(slice_param->slice_type)) {
236 avc_bitstream_put_ui(bs, slice_param->num_ref_idx_active_override_flag, 1); /* num_ref_idx_active_override_flag: */
238 if (slice_param->num_ref_idx_active_override_flag)
239 avc_bitstream_put_ue(bs, slice_param->num_ref_idx_l0_active_minus1);
241 /* ref_pic_list_reordering */
242 avc_bitstream_put_ui(bs, 0, 1); /* ref_pic_list_reordering_flag_l0: 0 */
/* B slices: direct-mode flag first, then the same fields for both lists */
243 } else if (IS_B_SLICE(slice_param->slice_type)) {
244 avc_bitstream_put_ui(bs, slice_param->direct_spatial_mv_pred_flag, 1); /* direct_spatial_mv_pred: 1 */
246 avc_bitstream_put_ui(bs, slice_param->num_ref_idx_active_override_flag, 1); /* num_ref_idx_active_override_flag: */
248 if (slice_param->num_ref_idx_active_override_flag) {
249 avc_bitstream_put_ue(bs, slice_param->num_ref_idx_l0_active_minus1);
250 avc_bitstream_put_ue(bs, slice_param->num_ref_idx_l1_active_minus1);
253 /* ref_pic_list_reordering */
254 avc_bitstream_put_ui(bs, 0, 1); /* ref_pic_list_reordering_flag_l0: 0 */
255 avc_bitstream_put_ui(bs, 0, 1); /* ref_pic_list_reordering_flag_l1: 0 */
/* condition selecting explicit weighted prediction; no table is written in the visible code */
258 if ((pic_param->pic_fields.bits.weighted_pred_flag &&
259 IS_P_SLICE(slice_param->slice_type)) ||
260 ((pic_param->pic_fields.bits.weighted_bipred_idc == 1) &&
261 IS_B_SLICE(slice_param->slice_type))) {
262 /* FIXME: fill weight/offset table */
266 /* dec_ref_pic_marking */
267 if (pic_param->pic_fields.bits.reference_pic_flag) { /* nal_ref_idc != 0 */
/* all three marking flags are fixed at 0 */
268 unsigned char no_output_of_prior_pics_flag = 0;
269 unsigned char long_term_reference_flag = 0;
270 unsigned char adaptive_ref_pic_marking_mode_flag = 0;
272 if (pic_param->pic_fields.bits.idr_pic_flag) {
273 avc_bitstream_put_ui(bs, no_output_of_prior_pics_flag, 1); /* no_output_of_prior_pics_flag: 0 */
274 avc_bitstream_put_ui(bs, long_term_reference_flag, 1); /* long_term_reference_flag: 0 */
276 avc_bitstream_put_ui(bs, adaptive_ref_pic_marking_mode_flag, 1); /* adaptive_ref_pic_marking_mode_flag: 0 */
/* cabac_init_idc is written only when entropy_coding_mode_flag is set and the slice is not I */
280 if (pic_param->pic_fields.bits.entropy_coding_mode_flag &&
281 !IS_I_SLICE(slice_param->slice_type))
282 avc_bitstream_put_ue(bs, slice_param->cabac_init_idc); /* cabac_init_idc: 0 */
284 avc_bitstream_put_se(bs, slice_param->slice_qp_delta); /* slice_qp_delta: 0 */
286 /* ignore for SP/SI */
/* deblocking fields; the two offsets are skipped when the idc is 1 */
288 if (pic_param->pic_fields.bits.deblocking_filter_control_present_flag) {
289 avc_bitstream_put_ue(bs, slice_param->disable_deblocking_filter_idc); /* disable_deblocking_filter_idc: 0 */
291 if (slice_param->disable_deblocking_filter_idc != 1) {
292 avc_bitstream_put_se(bs, slice_param->slice_alpha_c0_offset_div2); /* slice_alpha_c0_offset_div2: 2 */
293 avc_bitstream_put_se(bs, slice_param->slice_beta_offset_div2); /* slice_beta_offset_div2: 2 */
/* with entropy_coding_mode_flag set, pad the header to a byte boundary with fill value 1 */
297 if (pic_param->pic_fields.bits.entropy_coding_mode_flag) {
298 avc_bitstream_byte_aligning(bs, 1);
/*
 * Build a packed H.264 slice header: start code, NAL unit header and the
 * fields written by slice_header().
 *
 * sps_param, pic_param, slice_param  parameter buffers describing the slice
 * slice_header_buffer                receives a pointer to the buffer that
 *                                    avc_bitstream_start() allocated
 *
 * Returns the bitstream's final bit_offset.
 *
 * NOTE(review): nothing in the visible code frees the buffer, so the caller
 * presumably owns it -- confirm.  The line numbers embedded in this listing
 * are not contiguous; lines inside the P and B branches are not visible.
 */
303 build_avc_slice_header(VAEncSequenceParameterBufferH264 *sps_param,
304 VAEncPictureParameterBufferH264 *pic_param,
305 VAEncSliceParameterBufferH264 *slice_param,
306 unsigned char **slice_header_buffer)
/* normalise the two picture flags to 0/1 */
309 int is_idr = !!pic_param->pic_fields.bits.idr_pic_flag;
310 int is_ref = !!pic_param->pic_fields.bits.reference_pic_flag;
312 avc_bitstream_start(&bs);
313 nal_start_code_prefix(&bs);
/* I slices: highest nal_ref_idc; the NAL type depends on idr_pic_flag */
315 if (IS_I_SLICE(slice_param->slice_type)) {
316 nal_header(&bs, NAL_REF_IDC_HIGH, is_idr ? NAL_IDR : NAL_NON_IDR);
/* P slices: medium nal_ref_idc, always non-IDR */
317 } else if (IS_P_SLICE(slice_param->slice_type)) {
319 nal_header(&bs, NAL_REF_IDC_MEDIUM, NAL_NON_IDR);
/* anything else must be a B slice; nal_ref_idc is non-zero only if it is a reference */
321 assert(IS_B_SLICE(slice_param->slice_type));
323 nal_header(&bs, is_ref ? NAL_REF_IDC_LOW : NAL_REF_IDC_NONE, NAL_NON_IDR);
326 slice_header(&bs, sps_param, pic_param, slice_param);
/* flush the last partial word before handing the buffer out */
328 avc_bitstream_end(&bs);
329 *slice_header_buffer = (unsigned char *)bs.buffer;
331 return bs.bit_offset;
335 build_avc_sei_buffering_period(int cpb_removal_length,
336 unsigned int init_cpb_removal_delay,
337 unsigned int init_cpb_removal_delay_offset,
338 unsigned char **sei_buffer)
340 unsigned char *byte_buf;
343 avc_bitstream nal_bs;
344 avc_bitstream sei_bs;
346 avc_bitstream_start(&sei_bs);
347 avc_bitstream_put_ue(&sei_bs, 0); /*seq_parameter_set_id*/
348 avc_bitstream_put_ui(&sei_bs, init_cpb_removal_delay, cpb_removal_length);
349 avc_bitstream_put_ui(&sei_bs, init_cpb_removal_delay_offset, cpb_removal_length);
350 if ( sei_bs.bit_offset & 0x7) {
351 avc_bitstream_put_ui(&sei_bs, 1, 1);
353 avc_bitstream_end(&sei_bs);
354 byte_size = (sei_bs.bit_offset + 7) / 8;
356 avc_bitstream_start(&nal_bs);
357 nal_start_code_prefix(&nal_bs);
358 nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
360 avc_bitstream_put_ui(&nal_bs, 0, 8);
361 avc_bitstream_put_ui(&nal_bs, byte_size, 8);
363 byte_buf = (unsigned char *)sei_bs.buffer;
364 for(i = 0; i < byte_size; i++) {
365 avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
369 avc_rbsp_trailing_bits(&nal_bs);
370 avc_bitstream_end(&nal_bs);
372 *sei_buffer = (unsigned char *)nal_bs.buffer;
374 return nal_bs.bit_offset;
378 build_avc_sei_pic_timing(unsigned int cpb_removal_length, unsigned int cpb_removal_delay,
379 unsigned int dpb_output_length, unsigned int dpb_output_delay,
380 unsigned char **sei_buffer)
382 unsigned char *byte_buf;
385 avc_bitstream nal_bs;
386 avc_bitstream sei_bs;
388 avc_bitstream_start(&sei_bs);
389 avc_bitstream_put_ui(&sei_bs, cpb_removal_delay, cpb_removal_length);
390 avc_bitstream_put_ui(&sei_bs, dpb_output_delay, dpb_output_length);
391 if ( sei_bs.bit_offset & 0x7) {
392 avc_bitstream_put_ui(&sei_bs, 1, 1);
394 avc_bitstream_end(&sei_bs);
395 byte_size = (sei_bs.bit_offset + 7) / 8;
397 avc_bitstream_start(&nal_bs);
398 nal_start_code_prefix(&nal_bs);
399 nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
401 avc_bitstream_put_ui(&nal_bs, 0x01, 8);
402 avc_bitstream_put_ui(&nal_bs, byte_size, 8);
404 byte_buf = (unsigned char *)sei_bs.buffer;
405 for(i = 0; i < byte_size; i++) {
406 avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
410 avc_rbsp_trailing_bits(&nal_bs);
411 avc_bitstream_end(&nal_bs);
413 *sei_buffer = (unsigned char *)nal_bs.buffer;
415 return nal_bs.bit_offset;
420 build_avc_sei_buffer_timing(unsigned int init_cpb_removal_length,
421 unsigned int init_cpb_removal_delay,
422 unsigned int init_cpb_removal_delay_offset,
423 unsigned int cpb_removal_length,
424 unsigned int cpb_removal_delay,
425 unsigned int dpb_output_length,
426 unsigned int dpb_output_delay,
427 unsigned char **sei_buffer)
429 unsigned char *byte_buf;
430 int bp_byte_size, i, pic_byte_size;
432 avc_bitstream nal_bs;
433 avc_bitstream sei_bp_bs, sei_pic_bs;
435 avc_bitstream_start(&sei_bp_bs);
436 avc_bitstream_put_ue(&sei_bp_bs, 0); /*seq_parameter_set_id*/
437 avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay, cpb_removal_length);
438 avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay_offset, cpb_removal_length);
439 if ( sei_bp_bs.bit_offset & 0x7) {
440 avc_bitstream_put_ui(&sei_bp_bs, 1, 1);
442 avc_bitstream_end(&sei_bp_bs);
443 bp_byte_size = (sei_bp_bs.bit_offset + 7) / 8;
445 avc_bitstream_start(&sei_pic_bs);
446 avc_bitstream_put_ui(&sei_pic_bs, cpb_removal_delay, cpb_removal_length);
447 avc_bitstream_put_ui(&sei_pic_bs, dpb_output_delay, dpb_output_length);
448 if ( sei_pic_bs.bit_offset & 0x7) {
449 avc_bitstream_put_ui(&sei_pic_bs, 1, 1);
451 avc_bitstream_end(&sei_pic_bs);
452 pic_byte_size = (sei_pic_bs.bit_offset + 7) / 8;
454 avc_bitstream_start(&nal_bs);
455 nal_start_code_prefix(&nal_bs);
456 nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
458 /* Write the SEI buffer period data */
459 avc_bitstream_put_ui(&nal_bs, 0, 8);
460 avc_bitstream_put_ui(&nal_bs, bp_byte_size, 8);
462 byte_buf = (unsigned char *)sei_bp_bs.buffer;
463 for(i = 0; i < bp_byte_size; i++) {
464 avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
467 /* write the SEI timing data */
468 avc_bitstream_put_ui(&nal_bs, 0x01, 8);
469 avc_bitstream_put_ui(&nal_bs, pic_byte_size, 8);
471 byte_buf = (unsigned char *)sei_pic_bs.buffer;
472 for(i = 0; i < pic_byte_size; i++) {
473 avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
477 avc_rbsp_trailing_bits(&nal_bs);
478 avc_bitstream_end(&nal_bs);
480 *sei_buffer = (unsigned char *)nal_bs.buffer;
482 return nal_bs.bit_offset;
486 build_mpeg2_slice_header(VAEncSequenceParameterBufferMPEG2 *sps_param,
487 VAEncPictureParameterBufferMPEG2 *pic_param,
488 VAEncSliceParameterBufferMPEG2 *slice_param,
489 unsigned char **slice_header_buffer)
493 avc_bitstream_start(&bs);
494 avc_bitstream_end(&bs);
495 *slice_header_buffer = (unsigned char *)bs.buffer;
497 return bs.bit_offset;