OSDN Git Service

android: remove redundant -DANDROID
[android-x86/hardware-intel-common-vaapi.git] / src / i965_encoder_utils.c
index 3a93d8d..8c9b83c 100644 (file)
 #include <assert.h>
 
 #include <va/va.h>
-
+#include <va/va_enc_h264.h>
+#include <va/va_enc_mpeg2.h>
+#include <va/va_enc_vp8.h>
+#include <va/va_enc_hevc.h>
+#include <math.h>
+#include "gen6_mfc.h"
 #include "i965_encoder_utils.h"
 
 #define BITSTREAM_ALLOCATE_STEPPING     4096
@@ -41,6 +46,7 @@
 #define NAL_IDR                 5
 #define NAL_SPS                 7
 #define NAL_PPS                 8
+#define NAL_SEI                 6
 
 #define SLICE_TYPE_P            0
 #define SLICE_TYPE_B            1
 #define PROFILE_IDC_MAIN        77
 #define PROFILE_IDC_HIGH        100
 
+/*HEVC*/
+#define VPS_NUT     32
+#define SPS_NUT     33
+#define PPS_NUT     34
+#define IDR_WRADL_NUT   19
+#define IDR_NLP_NUT 20
+#define SLICE_TRAIL_N_NUT   0
+#define SLICE_TRAIL_R_NUT   1
+#define PREFIX_SEI_NUT  39
+#define SUFFIX_SEI_NUT  40
+
 struct __avc_bitstream {
     unsigned int *buffer;
     int bit_offset;
@@ -65,7 +82,7 @@ struct __avc_bitstream {
 
 typedef struct __avc_bitstream avc_bitstream;
 
-static unsigned int 
+static unsigned int
 swap32(unsigned int val)
 {
     unsigned char *pval = (unsigned char *)&val;
@@ -97,7 +114,7 @@ avc_bitstream_end(avc_bitstream *bs)
 
     // free(bs->buffer);
 }
+
 static void
 avc_bitstream_put_ui(avc_bitstream *bs, unsigned int val, int size_in_bits)
 {
@@ -109,7 +126,7 @@ avc_bitstream_put_ui(avc_bitstream *bs, unsigned int val, int size_in_bits)
         return;
 
     if (size_in_bits < 32)
-        val &= (( 1 << size_in_bits) - 1);
+        val &= ((1 << size_in_bits) - 1);
 
     bs->bit_offset += size_in_bits;
 
@@ -117,12 +134,19 @@ avc_bitstream_put_ui(avc_bitstream *bs, unsigned int val, int size_in_bits)
         bs->buffer[pos] = (bs->buffer[pos] << size_in_bits | val);
     } else {
         size_in_bits -= bit_left;
-        bs->buffer[pos] = (bs->buffer[pos] << bit_left) | (val >> size_in_bits);
+        if (bit_left == 32) {
+            bs->buffer[pos] = val;
+        } else {
+            bs->buffer[pos] = (bs->buffer[pos] << bit_left) | (val >> size_in_bits);
+        }
         bs->buffer[pos] = swap32(bs->buffer[pos]);
 
         if (pos + 1 == bs->max_size_in_dword) {
             bs->max_size_in_dword += BITSTREAM_ALLOCATE_STEPPING;
             bs->buffer = realloc(bs->buffer, bs->max_size_in_dword * sizeof(unsigned int));
+
+            if (!bs->buffer)
+                return;
         }
 
         bs->buffer[pos + 1] = val;
@@ -176,7 +200,11 @@ avc_bitstream_byte_aligning(avc_bitstream *bs, int bit)
 
     avc_bitstream_put_ui(bs, new_val, bit_left);
 }
-
+static void avc_rbsp_trailing_bits(avc_bitstream *bs)
+{
+    avc_bitstream_put_ui(bs, 1, 1);
+    avc_bitstream_byte_aligning(bs, 0);
+}
 static void nal_start_code_prefix(avc_bitstream *bs)
 {
     avc_bitstream_put_ui(bs, 0x00000001, 32);
@@ -189,31 +217,30 @@ static void nal_header(avc_bitstream *bs, int nal_ref_idc, int nal_unit_type)
     avc_bitstream_put_ui(bs, nal_unit_type, 5);
 }
 
-static void 
+static void
 slice_header(avc_bitstream *bs,
              VAEncSequenceParameterBufferH264 *sps_param,
              VAEncPictureParameterBufferH264 *pic_param,
-             VAEncSliceParameterBufferH264 *slice_param,
-             VAEncH264DecRefPicMarkingBuffer *dec_ref_pic_marking_param)
+             VAEncSliceParameterBufferH264 *slice_param)
 {
-    int first_mb_in_slice = slice_param->starting_macroblock_address;
+    int first_mb_in_slice = slice_param->macroblock_address;
 
     avc_bitstream_put_ue(bs, first_mb_in_slice);        /* first_mb_in_slice: 0 */
     avc_bitstream_put_ue(bs, slice_param->slice_type);  /* slice_type */
     avc_bitstream_put_ue(bs, slice_param->pic_parameter_set_id);        /* pic_parameter_set_id: 0 */
-    avc_bitstream_put_ui(bs, pic_param->frame_num, sps_param->log2_max_frame_num_minus4 + 4); /* frame_num */
+    avc_bitstream_put_ui(bs, pic_param->frame_num, sps_param->seq_fields.bits.log2_max_frame_num_minus4 + 4); /* frame_num */
 
     /* frame_mbs_only_flag == 1 */
-    if (!sps_param->frame_mbs_only_flag) {
+    if (!sps_param->seq_fields.bits.frame_mbs_only_flag) {
         /* FIXME: */
         assert(0);
     }
 
     if (pic_param->pic_fields.bits.idr_pic_flag)
-        avc_bitstream_put_ue(bs, slice_param->idr_pic_id);             /* idr_pic_id: 0 */
+        avc_bitstream_put_ue(bs, slice_param->idr_pic_id);      /* idr_pic_id: 0 */
 
-    if (sps_param->pic_order_cnt_type == 0) {
-        avc_bitstream_put_ui(bs, pic_param->CurrPic.TopFieldOrderCnt, sps_param->log2_max_pic_order_cnt_lsb_minus4 + 4);
+    if (sps_param->seq_fields.bits.pic_order_cnt_type == 0) {
+        avc_bitstream_put_ui(bs, pic_param->CurrPic.TopFieldOrderCnt, sps_param->seq_fields.bits.log2_max_pic_order_cnt_lsb_minus4 + 4);
         /* pic_order_present_flag == 0 */
     } else {
         /* FIXME: */
@@ -221,26 +248,32 @@ slice_header(avc_bitstream *bs,
     }
 
     /* redundant_pic_cnt_present_flag == 0 */
-    
+
     /* slice type */
     if (IS_P_SLICE(slice_param->slice_type)) {
-        avc_bitstream_put_ui(bs, 0, 1);            /* num_ref_idx_active_override_flag: 0 */
+        avc_bitstream_put_ui(bs, slice_param->num_ref_idx_active_override_flag, 1);            /* num_ref_idx_active_override_flag: */
+
+        if (slice_param->num_ref_idx_active_override_flag)
+            avc_bitstream_put_ue(bs, slice_param->num_ref_idx_l0_active_minus1);
 
         /* ref_pic_list_reordering */
-        assert(slice_param->ref_pic_list_modification_flag_l0 == 0);
-        avc_bitstream_put_ui(bs, slice_param->ref_pic_list_modification_flag_l0, 1);            /* ref_pic_list_reordering_flag_l0: 0 */
+        avc_bitstream_put_ui(bs, 0, 1);            /* ref_pic_list_reordering_flag_l0: 0 */
     } else if (IS_B_SLICE(slice_param->slice_type)) {
         avc_bitstream_put_ui(bs, slice_param->direct_spatial_mv_pred_flag, 1);            /* direct_spatial_mv_pred: 1 */
-        avc_bitstream_put_ui(bs, 0, 1);            /* num_ref_idx_active_override_flag: 0 */
+
+        avc_bitstream_put_ui(bs, slice_param->num_ref_idx_active_override_flag, 1);       /* num_ref_idx_active_override_flag: */
+
+        if (slice_param->num_ref_idx_active_override_flag) {
+            avc_bitstream_put_ue(bs, slice_param->num_ref_idx_l0_active_minus1);
+            avc_bitstream_put_ue(bs, slice_param->num_ref_idx_l1_active_minus1);
+        }
 
         /* ref_pic_list_reordering */
-        assert(slice_param->ref_pic_list_modification_flag_l0 == 0);
-        assert(slice_param->ref_pic_list_modification_flag_l1 == 0);
-        avc_bitstream_put_ui(bs, slice_param->ref_pic_list_modification_flag_l0, 1);            /* ref_pic_list_reordering_flag_l0: 0 */
-        avc_bitstream_put_ui(bs, slice_param->ref_pic_list_modification_flag_l1, 1);            /* ref_pic_list_reordering_flag_l1: 0 */
-    } 
+        avc_bitstream_put_ui(bs, 0, 1);            /* ref_pic_list_reordering_flag_l0: 0 */
+        avc_bitstream_put_ui(bs, 0, 1);            /* ref_pic_list_reordering_flag_l1: 0 */
+    }
 
-    if ((pic_param->pic_fields.bits.weighted_pred_flag && 
+    if ((pic_param->pic_fields.bits.weighted_pred_flag &&
          IS_P_SLICE(slice_param->slice_type)) ||
         ((pic_param->pic_fields.bits.weighted_bipred_idc == 1) &&
          IS_B_SLICE(slice_param->slice_type))) {
@@ -254,14 +287,6 @@ slice_header(avc_bitstream *bs,
         unsigned char long_term_reference_flag = 0;
         unsigned char adaptive_ref_pic_marking_mode_flag = 0;
 
-        if (dec_ref_pic_marking_param) {
-            no_output_of_prior_pics_flag = dec_ref_pic_marking_param->no_output_of_prior_pics_flag;
-            long_term_reference_flag = dec_ref_pic_marking_param->long_term_reference_flag;
-            adaptive_ref_pic_marking_mode_flag = dec_ref_pic_marking_param->adaptive_ref_pic_marking_mode_flag;
-            /* FIXME: XXX */
-            assert(adaptive_ref_pic_marking_mode_flag == 0);
-        }
-
         if (pic_param->pic_fields.bits.idr_pic_flag) {
             avc_bitstream_put_ui(bs, no_output_of_prior_pics_flag, 1);            /* no_output_of_prior_pics_flag: 0 */
             avc_bitstream_put_ui(bs, long_term_reference_flag, 1);            /* long_term_reference_flag: 0 */
@@ -292,15 +317,15 @@ slice_header(avc_bitstream *bs,
     }
 }
 
-int 
+int
 build_avc_slice_header(VAEncSequenceParameterBufferH264 *sps_param,
                        VAEncPictureParameterBufferH264 *pic_param,
                        VAEncSliceParameterBufferH264 *slice_param,
-                       VAEncH264DecRefPicMarkingBuffer *dec_ref_pic_marking_param,
                        unsigned char **slice_header_buffer)
 {
     avc_bitstream bs;
     int is_idr = !!pic_param->pic_fields.bits.idr_pic_flag;
+    int is_ref = !!pic_param->pic_fields.bits.reference_pic_flag;
 
     avc_bitstream_start(&bs);
     nal_start_code_prefix(&bs);
@@ -308,16 +333,841 @@ build_avc_slice_header(VAEncSequenceParameterBufferH264 *sps_param,
     if (IS_I_SLICE(slice_param->slice_type)) {
         nal_header(&bs, NAL_REF_IDC_HIGH, is_idr ? NAL_IDR : NAL_NON_IDR);
     } else if (IS_P_SLICE(slice_param->slice_type)) {
-        nal_header(&bs, NAL_REF_IDC_MEDIUM, is_idr ? NAL_IDR : NAL_NON_IDR);
+        assert(!is_idr);
+        nal_header(&bs, NAL_REF_IDC_MEDIUM, NAL_NON_IDR);
     } else {
         assert(IS_B_SLICE(slice_param->slice_type));
-        nal_header(&bs, NAL_REF_IDC_NONE, is_idr ? NAL_IDR : NAL_NON_IDR);
+        assert(!is_idr);
+        nal_header(&bs, is_ref ? NAL_REF_IDC_LOW : NAL_REF_IDC_NONE, NAL_NON_IDR);
     }
 
-    slice_header(&bs, sps_param, pic_param, slice_param, dec_ref_pic_marking_param);
+    slice_header(&bs, sps_param, pic_param, slice_param);
 
     avc_bitstream_end(&bs);
     *slice_header_buffer = (unsigned char *)bs.buffer;
 
     return bs.bit_offset;
 }
+
+int
+build_avc_sei_buffering_period(int cpb_removal_length,
+                               unsigned int init_cpb_removal_delay,
+                               unsigned int init_cpb_removal_delay_offset,
+                               unsigned char **sei_buffer)
+{
+    unsigned char *byte_buf;
+    int byte_size, i;
+
+    avc_bitstream nal_bs;
+    avc_bitstream sei_bs;
+
+    avc_bitstream_start(&sei_bs);
+    avc_bitstream_put_ue(&sei_bs, 0);       /*seq_parameter_set_id*/
+    avc_bitstream_put_ui(&sei_bs, init_cpb_removal_delay, cpb_removal_length);
+    avc_bitstream_put_ui(&sei_bs, init_cpb_removal_delay_offset, cpb_removal_length);
+    if (sei_bs.bit_offset & 0x7) {
+        avc_bitstream_put_ui(&sei_bs, 1, 1);
+    }
+    avc_bitstream_end(&sei_bs);
+    byte_size = (sei_bs.bit_offset + 7) / 8;
+
+    avc_bitstream_start(&nal_bs);
+    nal_start_code_prefix(&nal_bs);
+    nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
+
+    avc_bitstream_put_ui(&nal_bs, 0, 8);
+    avc_bitstream_put_ui(&nal_bs, byte_size, 8);
+
+    byte_buf = (unsigned char *)sei_bs.buffer;
+    for (i = 0; i < byte_size; i++) {
+        avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
+    }
+    free(byte_buf);
+
+    avc_rbsp_trailing_bits(&nal_bs);
+    avc_bitstream_end(&nal_bs);
+
+    *sei_buffer = (unsigned char *)nal_bs.buffer;
+
+    return nal_bs.bit_offset;
+}
+
+int
+build_avc_sei_pic_timing(unsigned int cpb_removal_length, unsigned int cpb_removal_delay,
+                         unsigned int dpb_output_length, unsigned int dpb_output_delay,
+                         unsigned char **sei_buffer)
+{
+    unsigned char *byte_buf;
+    int byte_size, i;
+
+    avc_bitstream nal_bs;
+    avc_bitstream sei_bs;
+
+    avc_bitstream_start(&sei_bs);
+    avc_bitstream_put_ui(&sei_bs, cpb_removal_delay, cpb_removal_length);
+    avc_bitstream_put_ui(&sei_bs, dpb_output_delay, dpb_output_length);
+    if (sei_bs.bit_offset & 0x7) {
+        avc_bitstream_put_ui(&sei_bs, 1, 1);
+    }
+    avc_bitstream_end(&sei_bs);
+    byte_size = (sei_bs.bit_offset + 7) / 8;
+
+    avc_bitstream_start(&nal_bs);
+    nal_start_code_prefix(&nal_bs);
+    nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
+
+    avc_bitstream_put_ui(&nal_bs, 0x01, 8);
+    avc_bitstream_put_ui(&nal_bs, byte_size, 8);
+
+    byte_buf = (unsigned char *)sei_bs.buffer;
+    for (i = 0; i < byte_size; i++) {
+        avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
+    }
+    free(byte_buf);
+
+    avc_rbsp_trailing_bits(&nal_bs);
+    avc_bitstream_end(&nal_bs);
+
+    *sei_buffer = (unsigned char *)nal_bs.buffer;
+
+    return nal_bs.bit_offset;
+}
+
+
+int
+build_avc_sei_buffer_timing(unsigned int init_cpb_removal_length,
+                            unsigned int init_cpb_removal_delay,
+                            unsigned int init_cpb_removal_delay_offset,
+                            unsigned int cpb_removal_length,
+                            unsigned int cpb_removal_delay,
+                            unsigned int dpb_output_length,
+                            unsigned int dpb_output_delay,
+                            unsigned char **sei_buffer)
+{
+    unsigned char *byte_buf;
+    int bp_byte_size, i, pic_byte_size;
+
+    avc_bitstream nal_bs;
+    avc_bitstream sei_bp_bs, sei_pic_bs;
+
+    avc_bitstream_start(&sei_bp_bs);
+    avc_bitstream_put_ue(&sei_bp_bs, 0);       /*seq_parameter_set_id*/
+    avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay, cpb_removal_length);
+    avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay_offset, cpb_removal_length);
+    if (sei_bp_bs.bit_offset & 0x7) {
+        avc_bitstream_put_ui(&sei_bp_bs, 1, 1);
+    }
+    avc_bitstream_end(&sei_bp_bs);
+    bp_byte_size = (sei_bp_bs.bit_offset + 7) / 8;
+
+    avc_bitstream_start(&sei_pic_bs);
+    avc_bitstream_put_ui(&sei_pic_bs, cpb_removal_delay, cpb_removal_length);
+    avc_bitstream_put_ui(&sei_pic_bs, dpb_output_delay, dpb_output_length);
+    if (sei_pic_bs.bit_offset & 0x7) {
+        avc_bitstream_put_ui(&sei_pic_bs, 1, 1);
+    }
+    avc_bitstream_end(&sei_pic_bs);
+    pic_byte_size = (sei_pic_bs.bit_offset + 7) / 8;
+
+    avc_bitstream_start(&nal_bs);
+    nal_start_code_prefix(&nal_bs);
+    nal_header(&nal_bs, NAL_REF_IDC_NONE, NAL_SEI);
+
+    /* Write the SEI buffer period data */
+    avc_bitstream_put_ui(&nal_bs, 0, 8);
+    avc_bitstream_put_ui(&nal_bs, bp_byte_size, 8);
+
+    byte_buf = (unsigned char *)sei_bp_bs.buffer;
+    for (i = 0; i < bp_byte_size; i++) {
+        avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
+    }
+    free(byte_buf);
+    /* write the SEI timing data */
+    avc_bitstream_put_ui(&nal_bs, 0x01, 8);
+    avc_bitstream_put_ui(&nal_bs, pic_byte_size, 8);
+
+    byte_buf = (unsigned char *)sei_pic_bs.buffer;
+    for (i = 0; i < pic_byte_size; i++) {
+        avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
+    }
+    free(byte_buf);
+
+    avc_rbsp_trailing_bits(&nal_bs);
+    avc_bitstream_end(&nal_bs);
+
+    *sei_buffer = (unsigned char *)nal_bs.buffer;
+
+    return nal_bs.bit_offset;
+}
+
+int
+build_mpeg2_slice_header(VAEncSequenceParameterBufferMPEG2 *sps_param,
+                         VAEncPictureParameterBufferMPEG2 *pic_param,
+                         VAEncSliceParameterBufferMPEG2 *slice_param,
+                         unsigned char **slice_header_buffer)
+{
+    avc_bitstream bs;
+
+    avc_bitstream_start(&bs);
+    avc_bitstream_end(&bs);
+    *slice_header_buffer = (unsigned char *)bs.buffer;
+
+    return bs.bit_offset;
+}
+
+static void binarize_qindex_delta(avc_bitstream *bs, int qindex_delta)
+{
+    if (qindex_delta == 0)
+        avc_bitstream_put_ui(bs, 0, 1);
+    else {
+        avc_bitstream_put_ui(bs, 1, 1);
+        avc_bitstream_put_ui(bs, abs(qindex_delta), 4);
+
+        if (qindex_delta < 0)
+            avc_bitstream_put_ui(bs, 1, 1);
+        else
+            avc_bitstream_put_ui(bs, 0, 1);
+    }
+}
+
+void binarize_vp8_frame_header(VAEncSequenceParameterBufferVP8 *seq_param,
+                               VAEncPictureParameterBufferVP8 *pic_param,
+                               VAQMatrixBufferVP8 *q_matrix,
+                               struct gen6_mfc_context *mfc_context,
+                               struct intel_encoder_context *encoder_context)
+{
+    avc_bitstream bs;
+    int i, j;
+    int is_intra_frame = !pic_param->pic_flags.bits.frame_type;
+    int log2num = pic_param->pic_flags.bits.num_token_partitions;
+
+    /* modify picture paramters */
+    pic_param->pic_flags.bits.loop_filter_adj_enable = 1;
+    pic_param->pic_flags.bits.mb_no_coeff_skip = 1;
+    pic_param->pic_flags.bits.forced_lf_adjustment = 1;
+    pic_param->pic_flags.bits.refresh_entropy_probs = 1;
+    pic_param->pic_flags.bits.segmentation_enabled = 0;
+
+    pic_param->pic_flags.bits.loop_filter_type = pic_param->pic_flags.bits.version / 2;
+    if (pic_param->pic_flags.bits.version > 1)
+        pic_param->loop_filter_level[0] = 0;
+
+    avc_bitstream_start(&bs);
+
+    if (is_intra_frame) {
+        avc_bitstream_put_ui(&bs, 0, 1);
+        avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.clamping_type , 1);
+    }
+
+    avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.segmentation_enabled, 1);
+
+    if (pic_param->pic_flags.bits.segmentation_enabled) {
+        avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.update_mb_segmentation_map, 1);
+        avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.update_segment_feature_data, 1);
+        if (pic_param->pic_flags.bits.update_segment_feature_data) {
+            /*add it later*/
+            assert(0);
+        }
+        if (pic_param->pic_flags.bits.update_mb_segmentation_map) {
+            for (i = 0; i < 3; i++) {
+                if (mfc_context->vp8_state.mb_segment_tree_probs[i] == 255)
+                    avc_bitstream_put_ui(&bs, 0, 1);
+                else {
+                    avc_bitstream_put_ui(&bs, 1, 1);
+                    avc_bitstream_put_ui(&bs, mfc_context->vp8_state.mb_segment_tree_probs[i], 8);
+                }
+            }
+        }
+    }
+
+    avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.loop_filter_type, 1);
+    avc_bitstream_put_ui(&bs, pic_param->loop_filter_level[0], 6);
+    avc_bitstream_put_ui(&bs, pic_param->sharpness_level, 3);
+
+    mfc_context->vp8_state.frame_header_lf_update_pos = bs.bit_offset;
+
+    if (pic_param->pic_flags.bits.forced_lf_adjustment) {
+        avc_bitstream_put_ui(&bs, 1, 1);//mode_ref_lf_delta_enable = 1
+        avc_bitstream_put_ui(&bs, 1, 1);//mode_ref_lf_delta_update = 1
+
+        for (i = 0; i < 4; i++) {
+            avc_bitstream_put_ui(&bs, 1, 1);
+            if (pic_param->ref_lf_delta[i] > 0) {
+                avc_bitstream_put_ui(&bs, (abs(pic_param->ref_lf_delta[i]) & 0x3F), 6);
+                avc_bitstream_put_ui(&bs, 0, 1);
+            } else {
+                avc_bitstream_put_ui(&bs, (abs(pic_param->ref_lf_delta[i]) & 0x3F), 6);
+                avc_bitstream_put_ui(&bs, 1, 1);
+            }
+        }
+
+        for (i = 0; i < 4; i++) {
+            avc_bitstream_put_ui(&bs, 1, 1);
+            if (pic_param->mode_lf_delta[i] > 0) {
+                avc_bitstream_put_ui(&bs, (abs(pic_param->mode_lf_delta[i]) & 0x3F), 6);
+                avc_bitstream_put_ui(&bs, 0, 1);
+            } else {
+                avc_bitstream_put_ui(&bs, (abs(pic_param->mode_lf_delta[i]) & 0x3F), 6);
+                avc_bitstream_put_ui(&bs, 1, 1);
+            }
+        }
+
+    } else {
+        avc_bitstream_put_ui(&bs, 0, 1);//mode_ref_lf_delta_enable = 0
+    }
+
+    avc_bitstream_put_ui(&bs, log2num, 2);
+
+    mfc_context->vp8_state.frame_header_qindex_update_pos = bs.bit_offset;
+
+    avc_bitstream_put_ui(&bs, q_matrix->quantization_index[0], 7);
+
+    for (i = 0; i < 5; i++)
+        binarize_qindex_delta(&bs, q_matrix->quantization_index_delta[i]);
+
+    if (!is_intra_frame) {
+        avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.refresh_golden_frame, 1);
+        avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.refresh_alternate_frame, 1);
+
+        if (!pic_param->pic_flags.bits.refresh_golden_frame)
+            avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.copy_buffer_to_golden, 2);
+
+        if (!pic_param->pic_flags.bits.refresh_alternate_frame)
+            avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.copy_buffer_to_alternate, 2);
+
+        avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.sign_bias_golden, 1);
+        avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.sign_bias_alternate, 1);
+    }
+
+    avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.refresh_entropy_probs, 1);
+
+    if (!is_intra_frame)
+        avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.refresh_last, 1);
+
+    mfc_context->vp8_state.frame_header_token_update_pos = bs.bit_offset;
+
+    for (i = 0; i < 4 * 8 * 3 * 11; i++)
+        avc_bitstream_put_ui(&bs, 0, 1); //don't update coeff_probs
+
+    avc_bitstream_put_ui(&bs, pic_param->pic_flags.bits.mb_no_coeff_skip, 1);
+    if (pic_param->pic_flags.bits.mb_no_coeff_skip)
+        avc_bitstream_put_ui(&bs, mfc_context->vp8_state.prob_skip_false, 8);
+
+    if (!is_intra_frame) {
+        avc_bitstream_put_ui(&bs, mfc_context->vp8_state.prob_intra, 8);
+        avc_bitstream_put_ui(&bs, mfc_context->vp8_state.prob_last, 8);
+        avc_bitstream_put_ui(&bs, mfc_context->vp8_state.prob_gf, 8);
+
+        avc_bitstream_put_ui(&bs, 1, 1); //y_mode_update_flag = 1
+        for (i = 0; i < 4; i++) {
+            avc_bitstream_put_ui(&bs, mfc_context->vp8_state.y_mode_probs[i], 8);
+        }
+
+        avc_bitstream_put_ui(&bs, 1, 1); //uv_mode_update_flag = 1
+        for (i = 0; i < 3; i++) {
+            avc_bitstream_put_ui(&bs, mfc_context->vp8_state.uv_mode_probs[i], 8);
+        }
+
+        mfc_context->vp8_state.frame_header_bin_mv_upate_pos = bs.bit_offset;
+
+        for (i = 0; i < 2 ; i++) {
+            for (j = 0; j < 19; j++) {
+                avc_bitstream_put_ui(&bs, 0, 1);
+                //avc_bitstream_put_ui(&bs, mfc_context->vp8_state.mv_probs[i][j], 7);
+            }
+        }
+    }
+
+    avc_bitstream_end(&bs);
+
+    mfc_context->vp8_state.vp8_frame_header = (unsigned char *)bs.buffer;
+    mfc_context->vp8_state.frame_header_bit_count = bs.bit_offset;
+}
+
+/* HEVC to do for internal header generated*/
+
+void nal_header_hevc(avc_bitstream *bs, int nal_unit_type, int temporalid)
+{
+    /* forbidden_zero_bit: 0 */
+    avc_bitstream_put_ui(bs, 0, 1);
+    /* nal unit_type */
+    avc_bitstream_put_ui(bs, nal_unit_type, 6);
+    /* layer_id. currently it is zero */
+    avc_bitstream_put_ui(bs, 0, 6);
+    /* teporalid + 1 .*/
+    avc_bitstream_put_ui(bs, temporalid + 1, 3);
+}
+
+int build_hevc_sei_buffering_period(int init_cpb_removal_delay_length,
+                                    unsigned int init_cpb_removal_delay,
+                                    unsigned int init_cpb_removal_delay_offset,
+                                    unsigned char **sei_buffer)
+{
+    unsigned char *byte_buf;
+    int bp_byte_size, i;
+    //unsigned int cpb_removal_delay;
+
+    avc_bitstream nal_bs;
+    avc_bitstream sei_bp_bs;
+
+    avc_bitstream_start(&sei_bp_bs);
+    avc_bitstream_put_ue(&sei_bp_bs, 0);       /*seq_parameter_set_id*/
+    /* SEI buffer period info */
+    /* NALHrdBpPresentFlag == 1 */
+    avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay, init_cpb_removal_delay_length);
+    avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay_offset, init_cpb_removal_delay_length);
+    if (sei_bp_bs.bit_offset & 0x7) {
+        avc_bitstream_put_ui(&sei_bp_bs, 1, 1);
+    }
+    avc_bitstream_end(&sei_bp_bs);
+    bp_byte_size = (sei_bp_bs.bit_offset + 7) / 8;
+
+    avc_bitstream_start(&nal_bs);
+    nal_start_code_prefix(&nal_bs);
+    nal_header_hevc(&nal_bs, PREFIX_SEI_NUT , 0);
+
+    /* Write the SEI buffer period data */
+    avc_bitstream_put_ui(&nal_bs, 0, 8);
+    avc_bitstream_put_ui(&nal_bs, bp_byte_size, 8);
+
+    byte_buf = (unsigned char *)sei_bp_bs.buffer;
+    for (i = 0; i < bp_byte_size; i++) {
+        avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
+    }
+    free(byte_buf);
+
+    avc_rbsp_trailing_bits(&nal_bs);
+    avc_bitstream_end(&nal_bs);
+
+    *sei_buffer = (unsigned char *)nal_bs.buffer;
+
+    return nal_bs.bit_offset;
+}
+
+int build_hevc_idr_sei_buffer_timing(unsigned int init_cpb_removal_delay_length,
+                                     unsigned int init_cpb_removal_delay,
+                                     unsigned int init_cpb_removal_delay_offset,
+                                     unsigned int cpb_removal_length,
+                                     unsigned int cpb_removal_delay,
+                                     unsigned int dpb_output_length,
+                                     unsigned int dpb_output_delay,
+                                     unsigned char **sei_buffer)
+{
+    unsigned char *byte_buf;
+    int bp_byte_size, i, pic_byte_size;
+    //unsigned int cpb_removal_delay;
+
+    avc_bitstream nal_bs;
+    avc_bitstream sei_bp_bs, sei_pic_bs;
+
+    avc_bitstream_start(&sei_bp_bs);
+    avc_bitstream_put_ue(&sei_bp_bs, 0);       /*seq_parameter_set_id*/
+    /* SEI buffer period info */
+    /* NALHrdBpPresentFlag == 1 */
+    avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay, init_cpb_removal_delay_length);
+    avc_bitstream_put_ui(&sei_bp_bs, init_cpb_removal_delay_offset, init_cpb_removal_delay_length);
+    if (sei_bp_bs.bit_offset & 0x7) {
+        avc_bitstream_put_ui(&sei_bp_bs, 1, 1);
+    }
+    avc_bitstream_end(&sei_bp_bs);
+    bp_byte_size = (sei_bp_bs.bit_offset + 7) / 8;
+
+    /* SEI pic timing info */
+    avc_bitstream_start(&sei_pic_bs);
+    /* The info of CPB and DPB delay is controlled by CpbDpbDelaysPresentFlag,
+    * which is derived as 1 if one of the following conditions is true:
+    * nal_hrd_parameters_present_flag is present in the avc_bitstream and is equal to 1,
+    * vcl_hrd_parameters_present_flag is present in the avc_bitstream and is equal to 1,
+    */
+    //cpb_removal_delay = (hevc_context.current_cpb_removal - hevc_context.prev_idr_cpb_removal);
+    avc_bitstream_put_ui(&sei_pic_bs, cpb_removal_delay, cpb_removal_length);
+    avc_bitstream_put_ui(&sei_pic_bs, dpb_output_delay, dpb_output_length);
+    if (sei_pic_bs.bit_offset & 0x7) {
+        avc_bitstream_put_ui(&sei_pic_bs, 1, 1);
+    }
+    /* The pic_structure_present_flag determines whether the pic_structure
+    * info is written into the SEI pic timing info.
+    * Currently it is set to zero.
+    */
+    avc_bitstream_end(&sei_pic_bs);
+    pic_byte_size = (sei_pic_bs.bit_offset + 7) / 8;
+
+    avc_bitstream_start(&nal_bs);
+    nal_start_code_prefix(&nal_bs);
+    nal_header_hevc(&nal_bs, PREFIX_SEI_NUT , 0);
+
+    /* Write the SEI buffer period data */
+    avc_bitstream_put_ui(&nal_bs, 0, 8);
+    avc_bitstream_put_ui(&nal_bs, bp_byte_size, 8);
+
+    byte_buf = (unsigned char *)sei_bp_bs.buffer;
+    for (i = 0; i < bp_byte_size; i++) {
+        avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
+    }
+    free(byte_buf);
+    /* write the SEI pic timing data */
+    avc_bitstream_put_ui(&nal_bs, 0x01, 8);
+    avc_bitstream_put_ui(&nal_bs, pic_byte_size, 8);
+
+    byte_buf = (unsigned char *)sei_pic_bs.buffer;
+    for (i = 0; i < pic_byte_size; i++) {
+        avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
+    }
+    free(byte_buf);
+
+    avc_rbsp_trailing_bits(&nal_bs);
+    avc_bitstream_end(&nal_bs);
+
+    *sei_buffer = (unsigned char *)nal_bs.buffer;
+
+    return nal_bs.bit_offset;
+}
+
+int build_hevc_sei_pic_timing(unsigned int cpb_removal_length, unsigned int cpb_removal_delay,
+                              unsigned int dpb_output_length, unsigned int dpb_output_delay,
+                              unsigned char **sei_buffer)
+{
+    unsigned char *byte_buf;
+    int i, pic_byte_size;
+    //unsigned int cpb_removal_delay;
+
+    avc_bitstream nal_bs;
+    avc_bitstream sei_pic_bs;
+
+    avc_bitstream_start(&sei_pic_bs);
+    /* The info of CPB and DPB delay is controlled by CpbDpbDelaysPresentFlag,
+    * which is derived as 1 if one of the following conditions is true:
+    * nal_hrd_parameters_present_flag is present in the avc_bitstream and is equal to 1,
+    * vcl_hrd_parameters_present_flag is present in the avc_bitstream and is equal to 1,
+    */
+    //cpb_removal_delay = (hevc_context.current_cpb_removal - hevc_context.current_idr_cpb_removal);
+    avc_bitstream_put_ui(&sei_pic_bs, cpb_removal_delay, cpb_removal_length);
+    avc_bitstream_put_ui(&sei_pic_bs, dpb_output_delay,  dpb_output_length);
+    if (sei_pic_bs.bit_offset & 0x7) {
+        avc_bitstream_put_ui(&sei_pic_bs, 1, 1);
+    }
+
+    /* The pic_structure_present_flag determines whether the pic_structure
+    * info is written into the SEI pic timing info.
+    * Currently it is set to zero.
+    */
+    avc_bitstream_end(&sei_pic_bs);
+    pic_byte_size = (sei_pic_bs.bit_offset + 7) / 8;
+
+    avc_bitstream_start(&nal_bs);
+    nal_start_code_prefix(&nal_bs);
+    nal_header_hevc(&nal_bs, PREFIX_SEI_NUT , 0);
+
+    /* write the SEI Pic timing data */
+    avc_bitstream_put_ui(&nal_bs, 0x01, 8);
+    avc_bitstream_put_ui(&nal_bs, pic_byte_size, 8);
+
+    byte_buf = (unsigned char *)sei_pic_bs.buffer;
+    for (i = 0; i < pic_byte_size; i++) {
+        avc_bitstream_put_ui(&nal_bs, byte_buf[i], 8);
+    }
+    free(byte_buf);
+
+    avc_rbsp_trailing_bits(&nal_bs);
+    avc_bitstream_end(&nal_bs);
+
+    *sei_buffer = (unsigned char *)nal_bs.buffer;
+
+    return nal_bs.bit_offset;
+}
+
+typedef struct _RefPicSet {
+    unsigned char    num_negative_pics;
+    unsigned char    num_positive_pics;
+    unsigned char    delta_poc_s0_minus1[8];
+    unsigned char    used_by_curr_pic_s0_flag[8];
+    unsigned char    delta_poc_s1_minus1[8];
+    unsigned char    used_by_curr_pic_s1_flag[8];
+    unsigned int     inter_ref_pic_set_prediction_flag;
+} hevcRefPicSet;
+
+void hevc_short_term_ref_pic_set(avc_bitstream *bs, VAEncSliceParameterBufferHEVC *slice_param, int curPicOrderCnt)
+{
+    hevcRefPicSet hevc_rps;
+    int rps_idx = 1, ref_idx = 0;
+    int i = 0;
+
+    hevc_rps.inter_ref_pic_set_prediction_flag = 0;
+    /* s0: between I and P/B; s1 : between P and B */
+    hevc_rps.num_negative_pics               = (slice_param->slice_type != HEVC_SLICE_I) ? 1 : 0;
+    hevc_rps.num_positive_pics               = (slice_param->slice_type == HEVC_SLICE_B) ? 1 : 0;
+    hevc_rps.delta_poc_s0_minus1[0]          = 0;
+    hevc_rps.used_by_curr_pic_s0_flag[0]     = 0;
+    hevc_rps.delta_poc_s1_minus1[0]          = 0;
+    hevc_rps.used_by_curr_pic_s1_flag[0]     = 0;
+    if (slice_param->num_ref_idx_l0_active_minus1 == 0) {
+        hevc_rps.delta_poc_s0_minus1[0]          = (slice_param->slice_type == HEVC_SLICE_I) ? 0 : (curPicOrderCnt - slice_param->ref_pic_list0[0].pic_order_cnt - 1); //0;
+        hevc_rps.used_by_curr_pic_s0_flag[0]     = 1;
+    }
+    if (slice_param->num_ref_idx_l1_active_minus1 == 0) {
+        hevc_rps.delta_poc_s1_minus1[0]          = (slice_param->slice_type == HEVC_SLICE_I) ? 0 : (slice_param->ref_pic_list1[0].pic_order_cnt - curPicOrderCnt - 1);
+        hevc_rps.used_by_curr_pic_s1_flag[0]     = 1;
+    }
+
+    if (rps_idx)
+        avc_bitstream_put_ui(bs, hevc_rps.inter_ref_pic_set_prediction_flag, 1);
+
+    if (hevc_rps.inter_ref_pic_set_prediction_flag) {
+        /* not support */
+        /* to do */
+    } else {
+        avc_bitstream_put_ue(bs, hevc_rps.num_negative_pics);
+        avc_bitstream_put_ue(bs, hevc_rps.num_positive_pics);
+
+        for (i = 0; i < hevc_rps.num_negative_pics; i++) {
+            avc_bitstream_put_ue(bs, hevc_rps.delta_poc_s0_minus1[ref_idx]);
+            avc_bitstream_put_ui(bs, hevc_rps.used_by_curr_pic_s0_flag[ref_idx], 1);
+        }
+        for (i = 0; i < hevc_rps.num_positive_pics; i++) {
+            avc_bitstream_put_ue(bs, hevc_rps.delta_poc_s1_minus1[ref_idx]);
+            avc_bitstream_put_ui(bs, hevc_rps.used_by_curr_pic_s1_flag[ref_idx], 1);
+        }
+    }
+
+    return;
+}
+
+static void slice_rbsp(avc_bitstream *bs,
+                       int slice_index,
+                       VAEncSequenceParameterBufferHEVC *seq_param,
+                       VAEncPictureParameterBufferHEVC *pic_param,
+                       VAEncSliceParameterBufferHEVC *slice_param)
+{
+    int log2_cu_size = seq_param->log2_min_luma_coding_block_size_minus3 + 3;
+    int log2_ctb_size = seq_param->log2_diff_max_min_luma_coding_block_size + log2_cu_size;
+    int ctb_size = 1 << log2_ctb_size;
+
+    int picture_width_in_ctb = (seq_param->pic_width_in_luma_samples + ctb_size - 1) / ctb_size;
+    int picture_height_in_ctb = (seq_param->pic_height_in_luma_samples + ctb_size - 1) / ctb_size;
+
+    /* first_slice_segment_in_pic_flag */
+    if (slice_index == 0) {
+        avc_bitstream_put_ui(bs, 1, 1);
+    } else {
+        avc_bitstream_put_ui(bs, 0, 1);
+    }
+
+    /* no_output_of_prior_pics_flag */
+    if (pic_param->pic_fields.bits.idr_pic_flag)
+        avc_bitstream_put_ui(bs, 1, 1);
+
+    /* slice_pic_parameter_set_id */
+    avc_bitstream_put_ue(bs, 0);
+
+    /* not the first slice */
+    if (slice_index) {
+        /* TBD */
+        int bit_size;
+
+        float num_ctus;
+
+        num_ctus = picture_width_in_ctb * picture_height_in_ctb;
+        bit_size = ceilf(log2f(num_ctus));
+
+        if (pic_param->pic_fields.bits.dependent_slice_segments_enabled_flag) {
+            avc_bitstream_put_ui(bs,
+                                 slice_param->slice_fields.bits.dependent_slice_segment_flag, 1);
+        }
+        /* slice_segment_address is based on Ceil(log2(PictureSizeinCtbs)) */
+        avc_bitstream_put_ui(bs, slice_param->slice_segment_address, bit_size);
+    }
+    if (!slice_param->slice_fields.bits.dependent_slice_segment_flag) {
+        /* slice_reserved_flag */
+
+        /* slice_type */
+        avc_bitstream_put_ue(bs, slice_param->slice_type);
+        /* use the inferred the value of pic_output_flag */
+
+        /* colour_plane_id */
+        if (seq_param->seq_fields.bits.separate_colour_plane_flag) {
+            avc_bitstream_put_ui(bs, slice_param->slice_fields.bits.colour_plane_id, 1);
+        }
+
+        if (!pic_param->pic_fields.bits.idr_pic_flag) {
+            int Log2MaxPicOrderCntLsb = 8;
+            avc_bitstream_put_ui(bs, pic_param->decoded_curr_pic.pic_order_cnt, Log2MaxPicOrderCntLsb);
+
+            //if (!slice_param->short_term_ref_pic_set_sps_flag)
+            {
+                /* short_term_ref_pic_set_sps_flag.
+                * Use zero and then pass the RPS from slice_header
+                */
+                avc_bitstream_put_ui(bs, 0, 1);
+                /* TBD
+                * Add the short_term reference picture set
+                */
+                hevc_short_term_ref_pic_set(bs, slice_param, pic_param->decoded_curr_pic.pic_order_cnt);
+            }
+            /* long term reference present flag. unpresent */
+            /* TBD */
+
+            /* sps temporal MVP*/
+            if (seq_param->seq_fields.bits.sps_temporal_mvp_enabled_flag) {
+                avc_bitstream_put_ui(bs,
+                                     slice_param->slice_fields.bits.slice_temporal_mvp_enabled_flag, 1);
+            }
+        }
+
+        /* long term reference present flag. unpresent */
+
+        /* sample adaptive offset enabled flag */
+        if (seq_param->seq_fields.bits.sample_adaptive_offset_enabled_flag) {
+            avc_bitstream_put_ui(bs, slice_param->slice_fields.bits.slice_sao_luma_flag, 1);
+            avc_bitstream_put_ui(bs, slice_param->slice_fields.bits.slice_sao_chroma_flag, 1);
+        }
+
+        if (slice_param->slice_type != HEVC_SLICE_I) {
+            /* num_ref_idx_active_override_flag. 0 */
+            avc_bitstream_put_ui(bs, 0, 1);
+            /* lists_modification_flag is unpresent NumPocTotalCurr > 1 ,here it is 1*/
+
+            /* No reference picture set modification */
+
+            /* MVD_l1_zero_flag */
+            if (slice_param->slice_type == HEVC_SLICE_B)
+                avc_bitstream_put_ui(bs, slice_param->slice_fields.bits.mvd_l1_zero_flag, 1);
+
+            /* cabac_init_present_flag. 0 */
+
+            /* slice_temporal_mvp_enabled_flag. */
+            if (slice_param->slice_fields.bits.slice_temporal_mvp_enabled_flag) {
+                if (slice_param->slice_type == HEVC_SLICE_B)
+                    avc_bitstream_put_ui(bs, slice_param->slice_fields.bits.collocated_from_l0_flag, 1);
+                /*
+                * TBD: Add the collocated_ref_idx.
+                */
+            }
+            if (((pic_param->pic_fields.bits.weighted_pred_flag) &&
+                 (slice_param->slice_type == HEVC_SLICE_P)) ||
+                ((pic_param->pic_fields.bits.weighted_bipred_flag) &&
+                 (slice_param->slice_type == HEVC_SLICE_B))) {
+                /* TBD:
+                * add the weighted table
+                */
+            }
+            avc_bitstream_put_ue(bs, 5 - slice_param->max_num_merge_cand);
+        }
+        /* slice_qp_delta */
+        avc_bitstream_put_ue(bs, slice_param->slice_qp_delta);
+
+        /* slice_cb/cr_qp_offset is controlled by pps_slice_chroma_qp_offsets_present_flag
+        * The present flag is set to 1.
+        */
+        avc_bitstream_put_ue(bs, slice_param->slice_cb_qp_offset);
+        avc_bitstream_put_ue(bs, slice_param->slice_cr_qp_offset);
+
+        /*
+        * deblocking_filter_override_flag is controlled by
+        * deblocking_filter_override_enabled_flag.
+        * The override_enabled_flag is zero.
+        * deblocking_filter_override_flag is zero. then
+        * slice_deblocking_filter_disabled_flag is also zero
+        * (It is inferred to be equal to pps_deblocking_filter_disabled_flag.
+        */
+
+        /* slice_loop_filter_across_slices_enabled_flag is controlled
+        * by pps_loop_filter_across_slices_enabled_flag &&
+        * (slice_sao_luma_flag | | slice_sao_chroma_flag | |
+        *  !slice_deblocking_filter_disabled_flag ))
+        *
+        */
+    }
+
+    if (pic_param->pic_fields.bits.tiles_enabled_flag ||
+        pic_param->pic_fields.bits.entropy_coding_sync_enabled_flag) {
+        /* TBD.
+        * Add the Entry-points && tile definition.
+        */
+    }
+
+    /* slice_segment_header_extension_present_flag. Not present */
+
+    /* byte_alignment */
+    avc_rbsp_trailing_bits(bs);
+}
+
+int get_hevc_slice_nalu_type(VAEncPictureParameterBufferHEVC *pic_param)
+{
+    if (pic_param->pic_fields.bits.idr_pic_flag)
+        return IDR_WRADL_NUT;
+    else if (pic_param->pic_fields.bits.reference_pic_flag)
+        return SLICE_TRAIL_R_NUT;
+    else
+        return SLICE_TRAIL_N_NUT;
+}
+
+int build_hevc_slice_header(VAEncSequenceParameterBufferHEVC *seq_param,
+                            VAEncPictureParameterBufferHEVC *pic_param,
+                            VAEncSliceParameterBufferHEVC *slice_param,
+                            unsigned char **header_buffer,
+                            int slice_index)
+{
+    avc_bitstream bs;
+
+    avc_bitstream_start(&bs);
+    nal_start_code_prefix(&bs);
+    nal_header_hevc(&bs, get_hevc_slice_nalu_type(pic_param), 0);
+    slice_rbsp(&bs, slice_index, seq_param, pic_param, slice_param);
+    avc_bitstream_end(&bs);
+
+    *header_buffer = (unsigned char *)bs.buffer;
+    return bs.bit_offset;
+}
+
+int
+intel_avc_find_skipemulcnt(unsigned char *buf, int bits_length)
+{
+    int i, found;
+    int leading_zero_cnt, byte_length, zero_byte;
+    int nal_unit_type;
+    int skip_cnt = 0;
+
+#define NAL_UNIT_TYPE_MASK 0x1f
+#define HW_MAX_SKIP_LENGTH 15
+
+    byte_length = ALIGN(bits_length, 32) >> 3;
+
+
+    leading_zero_cnt = 0;
+    found = 0;
+    for (i = 0; i < byte_length - 4; i++) {
+        if (((buf[i] == 0) && (buf[i + 1] == 0) && (buf[i + 2] == 1)) ||
+            ((buf[i] == 0) && (buf[i + 1] == 0) && (buf[i + 2] == 0) && (buf[i + 3] == 1))) {
+            found = 1;
+            break;
+        }
+        leading_zero_cnt++;
+    }
+    if (!found) {
+        /* warning message is complained. But anyway it will be inserted. */
+        WARN_ONCE("Invalid packed header data. "
+                  "Can't find the 000001 start_prefix code\n");
+        return 0;
+    }
+    i = leading_zero_cnt;
+
+    zero_byte = 0;
+    if (!((buf[i] == 0) && (buf[i + 1] == 0) && (buf[i + 2] == 1)))
+        zero_byte = 1;
+
+    skip_cnt = leading_zero_cnt + zero_byte + 3;
+
+    /* the unit header byte is accounted */
+    nal_unit_type = (buf[skip_cnt]) & NAL_UNIT_TYPE_MASK;
+    skip_cnt += 1;
+
+    if (nal_unit_type == 14 || nal_unit_type == 20 || nal_unit_type == 21) {
+        /* more unit header bytes are accounted for MVC/SVC */
+        skip_cnt += 3;
+    }
+    if (skip_cnt > HW_MAX_SKIP_LENGTH) {
+        WARN_ONCE("Too many leading zeros are padded for packed data. "
+                  "It is beyond the HW range.!!!\n");
+    }
+    return skip_cnt;
+}