Support B frame for reference frame
[platform/upstream/libva-intel-driver.git] / src / i965_encoder_utils.c
1 /*
2  * Copyright © 2011 Intel Corporation
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the
6  * "Software"), to deal in the Software without restriction, including
7  * without limitation the rights to use, copy, modify, merge, publish,
8  * distribute, sub license, and/or sell copies of the Software, and to
9  * permit persons to whom the Software is furnished to do so, subject to
10  * the following conditions:
11  *
12  * The above copyright notice and this permission notice (including the
13  * next paragraph) shall be included in all copies or substantial portions
14  * of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
17  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
19  * IN NO EVENT SHALL PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR
20  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
21  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
22  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
23  *
24  */
25
26 #include <stdlib.h>
27 #include <assert.h>
28
29 #include <va/va.h>
30 #include <va/va_enc_h264.h>
31 #include <va/va_enc_mpeg2.h>
32
33 #include "i965_encoder_utils.h"
34
/*
 * Size of the bitstream buffer, in 32-bit words, at creation time; the
 * buffer also grows by this many words each time it fills up.
 */
#define BITSTREAM_ALLOCATE_STEPPING     4096

/* Values written into the 2-bit nal_ref_idc field of a NAL unit header. */
#define NAL_REF_IDC_NONE        0
#define NAL_REF_IDC_LOW         1
#define NAL_REF_IDC_MEDIUM      2
#define NAL_REF_IDC_HIGH        3

/* Values written into the 5-bit nal_unit_type field of a NAL unit header. */
#define NAL_NON_IDR             1
#define NAL_IDR                 5
#define NAL_SPS                 7
#define NAL_PPS                 8
#define NAL_SEI                 6

/* Base slice_type codes. */
#define SLICE_TYPE_P            0
#define SLICE_TYPE_B            1
#define SLICE_TYPE_I            2

/*
 * Slice type predicates. A slice_type may be given either as the base
 * code or as the base code plus 5; both forms are accepted. The macro
 * argument is fully parenthesized so that an expression argument (for
 * example a conditional expression) is evaluated as a unit before the
 * subtraction. Note that the argument is evaluated twice.
 */
#define IS_I_SLICE(type) (SLICE_TYPE_I == (type) || SLICE_TYPE_I == ((type) - 5))
#define IS_P_SLICE(type) (SLICE_TYPE_P == (type) || SLICE_TYPE_P == ((type) - 5))
#define IS_B_SLICE(type) (SLICE_TYPE_B == (type) || SLICE_TYPE_B == ((type) - 5))

/* entropy_coding_mode_flag values. */
#define ENTROPY_MODE_CAVLC      0
#define ENTROPY_MODE_CABAC      1

/* profile_idc values. */
#define PROFILE_IDC_BASELINE    66
#define PROFILE_IDC_MAIN        77
#define PROFILE_IDC_HIGH        100
62
/*
 * Growable bit writer used to assemble packed headers.
 *
 * Bits are accumulated in 32-bit words. The word currently being filled
 * keeps its bits right-aligned; a word is byte-swapped with swap32() once
 * it is complete (or when the stream is ended).
 */
typedef struct __avc_bitstream {
    unsigned int *buffer;       /* heap storage, max_size_in_dword words */
    int bit_offset;             /* total number of bits written so far */
    int max_size_in_dword;      /* capacity of buffer in 32-bit words */
} avc_bitstream;
70
/*
 * Reassemble the bytes of val, taken in memory order, as a big-endian
 * 32-bit number: the byte at the lowest address becomes the most
 * significant byte of the result. On a little-endian host this reverses
 * the byte order; on a big-endian host it returns val unchanged.
 *
 * Each byte is widened to unsigned int before shifting so that a byte
 * value >= 0x80 is never shifted into the sign bit of a promoted int.
 */
static unsigned int
swap32(unsigned int val)
{
    const unsigned char *pval = (const unsigned char *)&val;

    return (((unsigned int)pval[0] << 24) |
            ((unsigned int)pval[1] << 16) |
            ((unsigned int)pval[2] << 8)  |
            ((unsigned int)pval[3] << 0));
}
81
82 static void
83 avc_bitstream_start(avc_bitstream *bs)
84 {
85     bs->max_size_in_dword = BITSTREAM_ALLOCATE_STEPPING;
86     bs->buffer = calloc(bs->max_size_in_dword * sizeof(int), 1);
87     bs->bit_offset = 0;
88 }
89
90 static void
91 avc_bitstream_end(avc_bitstream *bs)
92 {
93     int pos = (bs->bit_offset >> 5);
94     int bit_offset = (bs->bit_offset & 0x1f);
95     int bit_left = 32 - bit_offset;
96
97     if (bit_offset) {
98         bs->buffer[pos] = swap32((bs->buffer[pos] << bit_left));
99     }
100
101     // free(bs->buffer);
102 }
103
104 static void
105 avc_bitstream_put_ui(avc_bitstream *bs, unsigned int val, int size_in_bits)
106 {
107     int pos = (bs->bit_offset >> 5);
108     int bit_offset = (bs->bit_offset & 0x1f);
109     int bit_left = 32 - bit_offset;
110
111     if (!size_in_bits)
112         return;
113
114     if (size_in_bits < 32)
115         val &= (( 1 << size_in_bits) - 1);
116
117     bs->bit_offset += size_in_bits;
118
119     if (bit_left > size_in_bits) {
120         bs->buffer[pos] = (bs->buffer[pos] << size_in_bits | val);
121     } else {
122         size_in_bits -= bit_left;
123         bs->buffer[pos] = (bs->buffer[pos] << bit_left) | (val >> size_in_bits);
124         bs->buffer[pos] = swap32(bs->buffer[pos]);
125
126         if (pos + 1 == bs->max_size_in_dword) {
127             bs->max_size_in_dword += BITSTREAM_ALLOCATE_STEPPING;
128             bs->buffer = realloc(bs->buffer, bs->max_size_in_dword * sizeof(unsigned int));
129             
130             if (!bs->buffer)
131                 return;
132         }
133
134         bs->buffer[pos + 1] = val;
135     }
136 }
137
138 static void
139 avc_bitstream_put_ue(avc_bitstream *bs, unsigned int val)
140 {
141     int size_in_bits = 0;
142     int tmp_val = ++val;
143
144     while (tmp_val) {
145         tmp_val >>= 1;
146         size_in_bits++;
147     }
148
149     avc_bitstream_put_ui(bs, 0, size_in_bits - 1); // leading zero
150     avc_bitstream_put_ui(bs, val, size_in_bits);
151 }
152
153 static void
154 avc_bitstream_put_se(avc_bitstream *bs, int val)
155 {
156     unsigned int new_val;
157
158     if (val <= 0)
159         new_val = -2 * val;
160     else
161         new_val = 2 * val - 1;
162
163     avc_bitstream_put_ue(bs, new_val);
164 }
165
166 static void
167 avc_bitstream_byte_aligning(avc_bitstream *bs, int bit)
168 {
169     int bit_offset = (bs->bit_offset & 0x7);
170     int bit_left = 8 - bit_offset;
171     int new_val;
172
173     if (!bit_offset)
174         return;
175
176     assert(bit == 0 || bit == 1);
177
178     if (bit)
179         new_val = (1 << bit_left) - 1;
180     else
181         new_val = 0;
182
183     avc_bitstream_put_ui(bs, new_val, bit_left);
184 }
185 static void avc_rbsp_trailing_bits(avc_bitstream *bs)
186 {
187     avc_bitstream_put_ui(bs, 1, 1);
188     avc_bitstream_byte_aligning(bs, 0);
189 }
190 static void nal_start_code_prefix(avc_bitstream *bs)
191 {
192     avc_bitstream_put_ui(bs, 0x00000001, 32);
193 }
194
195 static void nal_header(avc_bitstream *bs, int nal_ref_idc, int nal_unit_type)
196 {
197     avc_bitstream_put_ui(bs, 0, 1);                /* forbidden_zero_bit: 0 */
198     avc_bitstream_put_ui(bs, nal_ref_idc, 2);
199     avc_bitstream_put_ui(bs, nal_unit_type, 5);
200 }
201
202 static void 
203 slice_header(avc_bitstream *bs,
204              VAEncSequenceParameterBufferH264 *sps_param,
205              VAEncPictureParameterBufferH264 *pic_param,
206              VAEncSliceParameterBufferH264 *slice_param)
207 {
208     int first_mb_in_slice = slice_param->macroblock_address;
209
210     avc_bitstream_put_ue(bs, first_mb_in_slice);        /* first_mb_in_slice: 0 */
211     avc_bitstream_put_ue(bs, slice_param->slice_type);  /* slice_type */
212     avc_bitstream_put_ue(bs, slice_param->pic_parameter_set_id);        /* pic_parameter_set_id: 0 */
213     avc_bitstream_put_ui(bs, pic_param->frame_num, sps_param->seq_fields.bits.log2_max_frame_num_minus4 + 4); /* frame_num */
214
215     /* frame_mbs_only_flag == 1 */
216     if (!sps_param->seq_fields.bits.frame_mbs_only_flag) {
217         /* FIXME: */
218         assert(0);
219     }
220
221     if (pic_param->pic_fields.bits.idr_pic_flag)
222         avc_bitstream_put_ue(bs, slice_param->idr_pic_id);              /* idr_pic_id: 0 */
223
224     if (sps_param->seq_fields.bits.pic_order_cnt_type == 0) {
225         avc_bitstream_put_ui(bs, pic_param->CurrPic.TopFieldOrderCnt, sps_param->seq_fields.bits.log2_max_pic_order_cnt_lsb_minus4 + 4);
226         /* pic_order_present_flag == 0 */
227     } else {
228         /* FIXME: */
229         assert(0);
230     }
231
232     /* redundant_pic_cnt_present_flag == 0 */
233     
234     /* slice type */
235     if (IS_P_SLICE(slice_param->slice_type)) {
236         avc_bitstream_put_ui(bs, 0, 1);            /* num_ref_idx_active_override_flag: 0 */
237
238         /* ref_pic_list_reordering */
239         avc_bitstream_put_ui(bs, 0, 1);            /* ref_pic_list_reordering_flag_l0: 0 */
240     } else if (IS_B_SLICE(slice_param->slice_type)) {
241         avc_bitstream_put_ui(bs, slice_param->direct_spatial_mv_pred_flag, 1);            /* direct_spatial_mv_pred: 1 */
242         avc_bitstream_put_ui(bs, 0, 1);            /* num_ref_idx_active_override_flag: 0 */
243
244         /* ref_pic_list_reordering */
245         avc_bitstream_put_ui(bs, 0, 1);            /* ref_pic_list_reordering_flag_l0: 0 */
246         avc_bitstream_put_ui(bs, 0, 1);            /* ref_pic_list_reordering_flag_l1: 0 */
247     } 
248
249     if ((pic_param->pic_fields.bits.weighted_pred_flag && 
250          IS_P_SLICE(slice_param->slice_type)) ||
251         ((pic_param->pic_fields.bits.weighted_bipred_idc == 1) &&
252          IS_B_SLICE(slice_param->slice_type))) {
253         /* FIXME: fill weight/offset table */
254         assert(0);
255     }
256
257     /* dec_ref_pic_marking */
258     if (pic_param->pic_fields.bits.reference_pic_flag) {     /* nal_ref_idc != 0 */
259         unsigned char no_output_of_prior_pics_flag = 0;
260         unsigned char long_term_reference_flag = 0;
261         unsigned char adaptive_ref_pic_marking_mode_flag = 0;
262
263         if (pic_param->pic_fields.bits.idr_pic_flag) {
264             avc_bitstream_put_ui(bs, no_output_of_prior_pics_flag, 1);            /* no_output_of_prior_pics_flag: 0 */
265             avc_bitstream_put_ui(bs, long_term_reference_flag, 1);            /* long_term_reference_flag: 0 */
266         } else {
267             avc_bitstream_put_ui(bs, adaptive_ref_pic_marking_mode_flag, 1);            /* adaptive_ref_pic_marking_mode_flag: 0 */
268         }
269     }
270
271     if (pic_param->pic_fields.bits.entropy_coding_mode_flag &&
272         !IS_I_SLICE(slice_param->slice_type))
273         avc_bitstream_put_ue(bs, slice_param->cabac_init_idc);               /* cabac_init_idc: 0 */
274
275     avc_bitstream_put_se(bs, slice_param->slice_qp_delta);                   /* slice_qp_delta: 0 */
276
277     /* ignore for SP/SI */
278
279     if (pic_param->pic_fields.bits.deblocking_filter_control_present_flag) {
280         avc_bitstream_put_ue(bs, slice_param->disable_deblocking_filter_idc);           /* disable_deblocking_filter_idc: 0 */
281
282         if (slice_param->disable_deblocking_filter_idc != 1) {
283             avc_bitstream_put_se(bs, slice_param->slice_alpha_c0_offset_div2);          /* slice_alpha_c0_offset_div2: 2 */
284             avc_bitstream_put_se(bs, slice_param->slice_beta_offset_div2);              /* slice_beta_offset_div2: 2 */
285         }
286     }
287
288     if (pic_param->pic_fields.bits.entropy_coding_mode_flag) {
289         avc_bitstream_byte_aligning(bs, 1);
290     }
291 }
292
293 int 
294 build_avc_slice_header(VAEncSequenceParameterBufferH264 *sps_param,
295                        VAEncPictureParameterBufferH264 *pic_param,
296                        VAEncSliceParameterBufferH264 *slice_param,
297                        unsigned char **slice_header_buffer)
298 {
299     avc_bitstream bs;
300     int is_idr = !!pic_param->pic_fields.bits.idr_pic_flag;
301     int is_ref = !!pic_param->pic_fields.bits.reference_pic_flag;
302
303     avc_bitstream_start(&bs);
304     nal_start_code_prefix(&bs);
305
306     if (IS_I_SLICE(slice_param->slice_type)) {
307         nal_header(&bs, NAL_REF_IDC_HIGH, is_idr ? NAL_IDR : NAL_NON_IDR);
308     } else if (IS_P_SLICE(slice_param->slice_type)) {
309         assert(!is_idr);
310         nal_header(&bs, NAL_REF_IDC_MEDIUM, NAL_NON_IDR);
311     } else {
312         assert(IS_B_SLICE(slice_param->slice_type));
313         assert(!is_idr);
314         nal_header(&bs, is_ref ? NAL_REF_IDC_LOW : NAL_REF_IDC_NONE, NAL_NON_IDR);
315     }
316
317     slice_header(&bs, sps_param, pic_param, slice_param);
318
319     avc_bitstream_end(&bs);
320     *slice_header_buffer = (unsigned char *)bs.buffer;
321
322     return bs.bit_offset;
323 }
324
325 int 
326 build_avc_sei_buffering_period(int cpb_removal_length,
327                                unsigned int init_cpb_removal_delay, 
328                                unsigned int init_cpb_removal_delay_offset,
329                                unsigned char **sei_buffer) 
330 {
331     unsigned char *byte_buf;
332     int byte_size, i;
333
334     avc_bitstream nal_bs;
335     avc_bitstream sei_bs;
336
337     avc_bitstream_start(&sei_bs);
338     avc_bitstream_put_ue(&sei_bs, 0);       /*seq_parameter_set_id*/
339     avc_bitstream_put_ui(&sei_bs, init_cpb_removal_delay, cpb_removal_length); 
340     avc_bitstream_put_ui(&sei_bs, init_cpb_removal_delay_offset, cpb_removal_length); 
341     if ( sei_bs.bit_offset & 0x7) {
342         avc_bitstream_put_ui(&sei_bs, 1, 1);
343     }
344     avc_bitstream_end(&sei_bs);
345     byte_size = (sei_bs.bit_offset + 7) / 8;
346     
347     avc_bitstream_start(&nal_bs);
348     nal_start_code_prefix(&nal_bs);
349     nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
350     
351     avc_bitstream_put_ui(&nal_bs, 0, 8);
352     avc_bitstream_put_ui(&nal_bs, byte_size, 8);
353     
354     byte_buf = (unsigned char *)sei_bs.buffer;
355     for(i = 0; i < byte_size; i++) {
356         avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
357     }
358     free(byte_buf);
359
360     avc_rbsp_trailing_bits(&nal_bs);
361     avc_bitstream_end(&nal_bs);
362
363     *sei_buffer = (unsigned char *)nal_bs.buffer; 
364    
365     return nal_bs.bit_offset;
366 }
367
368 int 
369 build_avc_sei_pic_timing(unsigned int cpb_removal_length, unsigned int cpb_removal_delay, 
370                          unsigned int dpb_output_length, unsigned int dpb_output_delay,
371                          unsigned char **sei_buffer)
372 {
373     unsigned char *byte_buf;
374     int byte_size, i;
375
376     avc_bitstream nal_bs;
377     avc_bitstream sei_bs;
378
379     avc_bitstream_start(&sei_bs);
380     avc_bitstream_put_ui(&sei_bs, cpb_removal_delay, cpb_removal_length); 
381     avc_bitstream_put_ui(&sei_bs, dpb_output_delay, dpb_output_length); 
382     if ( sei_bs.bit_offset & 0x7) {
383         avc_bitstream_put_ui(&sei_bs, 1, 1);
384     }
385     avc_bitstream_end(&sei_bs);
386     byte_size = (sei_bs.bit_offset + 7) / 8;
387     
388     avc_bitstream_start(&nal_bs);
389     nal_start_code_prefix(&nal_bs);
390     nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
391     
392     avc_bitstream_put_ui(&nal_bs, 0x01, 8);
393     avc_bitstream_put_ui(&nal_bs, byte_size, 8);
394     
395     byte_buf = (unsigned char *)sei_bs.buffer;
396     for(i = 0; i < byte_size; i++) {
397         avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
398     }
399     free(byte_buf);
400
401     avc_rbsp_trailing_bits(&nal_bs);
402     avc_bitstream_end(&nal_bs);
403
404     *sei_buffer = (unsigned char *)nal_bs.buffer; 
405    
406     return nal_bs.bit_offset;
407 }
408
409
410 int 
411 build_avc_sei_buffer_timing(unsigned int init_cpb_removal_length,
412                                 unsigned int init_cpb_removal_delay,
413                                 unsigned int init_cpb_removal_delay_offset,
414                                 unsigned int cpb_removal_length,
415                                 unsigned int cpb_removal_delay,
416                                 unsigned int dpb_output_length,
417                                 unsigned int dpb_output_delay,
418                                 unsigned char **sei_buffer)
419 {
420     unsigned char *byte_buf;
421     int bp_byte_size, i, pic_byte_size;
422
423     avc_bitstream nal_bs;
424     avc_bitstream sei_bp_bs, sei_pic_bs;
425
426     avc_bitstream_start(&sei_bp_bs);
427     avc_bitstream_put_ue(&sei_bp_bs, 0);       /*seq_parameter_set_id*/
428     avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay, cpb_removal_length); 
429     avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay_offset, cpb_removal_length); 
430     if ( sei_bp_bs.bit_offset & 0x7) {
431         avc_bitstream_put_ui(&sei_bp_bs, 1, 1);
432     }
433     avc_bitstream_end(&sei_bp_bs);
434     bp_byte_size = (sei_bp_bs.bit_offset + 7) / 8;
435     
436     avc_bitstream_start(&sei_pic_bs);
437     avc_bitstream_put_ui(&sei_pic_bs, cpb_removal_delay, cpb_removal_length); 
438     avc_bitstream_put_ui(&sei_pic_bs, dpb_output_delay, dpb_output_length); 
439     if ( sei_pic_bs.bit_offset & 0x7) {
440         avc_bitstream_put_ui(&sei_pic_bs, 1, 1);
441     }
442     avc_bitstream_end(&sei_pic_bs);
443     pic_byte_size = (sei_pic_bs.bit_offset + 7) / 8;
444     
445     avc_bitstream_start(&nal_bs);
446     nal_start_code_prefix(&nal_bs);
447     nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
448
449         /* Write the SEI buffer period data */    
450     avc_bitstream_put_ui(&nal_bs, 0, 8);
451     avc_bitstream_put_ui(&nal_bs, bp_byte_size, 8);
452     
453     byte_buf = (unsigned char *)sei_bp_bs.buffer;
454     for(i = 0; i < bp_byte_size; i++) {
455         avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
456     }
457     free(byte_buf);
458         /* write the SEI timing data */
459     avc_bitstream_put_ui(&nal_bs, 0x01, 8);
460     avc_bitstream_put_ui(&nal_bs, pic_byte_size, 8);
461     
462     byte_buf = (unsigned char *)sei_pic_bs.buffer;
463     for(i = 0; i < pic_byte_size; i++) {
464         avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
465     }
466     free(byte_buf);
467
468     avc_rbsp_trailing_bits(&nal_bs);
469     avc_bitstream_end(&nal_bs);
470
471     *sei_buffer = (unsigned char *)nal_bs.buffer; 
472    
473     return nal_bs.bit_offset;
474 }
475
476 int 
477 build_mpeg2_slice_header(VAEncSequenceParameterBufferMPEG2 *sps_param,
478                          VAEncPictureParameterBufferMPEG2 *pic_param,
479                          VAEncSliceParameterBufferMPEG2 *slice_param,
480                          unsigned char **slice_header_buffer)
481 {
482     avc_bitstream bs;
483
484     avc_bitstream_start(&bs);
485     avc_bitstream_end(&bs);
486     *slice_header_buffer = (unsigned char *)bs.buffer;
487
488     return bs.bit_offset;
489 }