/******************************************************************************
 *
 * Copyright (C) 2015 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 *****************************************************************************
 * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
*/
/*!
 ***************************************************************************
 * \file ih264d_parse_cavlc.c
 *
 * \brief
 *    This file contains UVLC related functions.
 *
 * \date
 *    20/11/2002
 *
 * \author  NS
 ***************************************************************************
 */

#include <string.h>
#include <stdio.h>

#include "ih264d_bitstrm.h"
#include "ih264d_parse_cavlc.h"
#include "ih264d_error_handler.h"
#include "ih264d_defs.h"
#include "ih264d_debug.h"
#include "ih264d_cabac.h"
#include "ih264d_structs.h"
#include "ih264d_tables.h"
#include "ih264d_tables.h"
#include "ih264d_mb_utils.h"

void ih264d_unpack_coeff4x4_dc_4x4blk(tu_sblk4x4_coeff_data_t *ps_tu_4x4,
                                      WORD16 *pi2_out_coeff_data,
                                      UWORD8 *pu1_inv_scan);

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_uev                                                  */
/*                                                                           */
/*  Description   : Reads the unsigned Exp Golomb codec syntax from the      */
/*                  ps_bitstrm as specified in section 9.1 of H264 standard      */
/*                  It also increases bitstream u4_ofst by the number of bits */
/*                  parsed for UEV decode operation                          */
/*                                                                           */
/*  Inputs        : bitstream base pointer and bitsream u4_ofst in bits       */
/*  Globals       : None                                                     */
/*  Processing    :                                                          */
/*  Outputs       : UEV decoded syntax element and incremented ps_bitstrm u4_ofst */
/*  Returns       : UEV decoded syntax element                               */
/*                                                                           */
/*  Issues        : Does not check if ps_bitstrm u4_ofst exceeds max ps_bitstrm i4_size  */
/*                  for performamce. Caller might have to do error resilence */
/*                  check for bitstream overflow                             */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         19 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
UWORD32 ih264d_uev(UWORD32 *pu4_bitstrm_ofst, UWORD32 *pu4_bitstrm_buf)
{
    UWORD32 u4_bitstream_offset = *pu4_bitstrm_ofst;
    UWORD32 u4_word, u4_ldz;

    /***************************************************************/
    /* Find leading zeros in next 32 bits                          */
    /***************************************************************/
    NEXTBITS_32(u4_word, u4_bitstream_offset, pu4_bitstrm_buf);
    u4_ldz = CLZ(u4_word);
    /* Flush the ps_bitstrm */
    u4_bitstream_offset += (u4_ldz + 1);
    /* Read the suffix from the ps_bitstrm */
    u4_word = 0;
    if(u4_ldz)
        GETBITS(u4_word, u4_bitstream_offset, pu4_bitstrm_buf, u4_ldz);
    *pu4_bitstrm_ofst = u4_bitstream_offset;
    return ((1 << u4_ldz) + u4_word - 1);
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_sev                                                  */
/*                                                                           */
/*  Description   : Reads the signed Exp Golomb codec syntax from the ps_bitstrm */
/*                  as specified in section 9.1 of H264 standard.            */
/*                  It also increases bitstream u4_ofst by the number of bits */
/*                  parsed for SEV decode operation                          */
/*                                                                           */
/*  Inputs        : bitstream base pointer and bitsream u4_ofst in bits       */
/*  Globals       : None                                                     */
/*  Processing    :                                                          */
/*  Outputs       : SEV decoded syntax element and incremented ps_bitstrm u4_ofst */
/*  Returns       : SEV decoded syntax element                               */
/*                                                                           */
/*  Issues        : Does not check if ps_bitstrm u4_ofst exceeds max ps_bitstrm i4_size  */
/*                  for performamce. Caller might have to do error resilence */
/*                  check for bitstream overflow                             */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         19 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
WORD32 ih264d_sev(UWORD32 *pu4_bitstrm_ofst, UWORD32 *pu4_bitstrm_buf)
{
    UWORD32 u4_bitstream_offset = *pu4_bitstrm_ofst;
    UWORD32 u4_word, u4_ldz, u4_abs_val;

    /***************************************************************/
    /* Find leading zeros in next 32 bits                          */
    /***************************************************************/
    NEXTBITS_32(u4_word, u4_bitstream_offset, pu4_bitstrm_buf);
    u4_ldz = CLZ(u4_word);

    /* Flush the ps_bitstrm */
    u4_bitstream_offset += (u4_ldz + 1);

    /* Read the suffix from the ps_bitstrm */
    u4_word = 0;
    if(u4_ldz)
        GETBITS(u4_word, u4_bitstream_offset, pu4_bitstrm_buf, u4_ldz);

    *pu4_bitstrm_ofst = u4_bitstream_offset;
    u4_abs_val = ((1 << u4_ldz) + u4_word) >> 1;

    if(u4_word & 0x1)
        return (-(WORD32)u4_abs_val);
    else
        return (u4_abs_val);
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : get_tev_range_1                                          */
/*                                                                           */
/*  Description   : Reads the TEV Exp Golomb codec syntax from the ps_bitstrm    */
/*                  as specified in section 9.1 of H264 standard. This will  */
/*                  called only when the input range is 1 for TEV decode.    */
/*                  If range is more than 1, then UEV decode is done         */
/*                                                                           */
/*  Inputs        : bitstream base pointer and bitsream u4_ofst in bits       */
/*  Globals       : None                                                     */
/*  Processing    :                                                          */
/*  Outputs       : TEV decoded syntax element and incremented ps_bitstrm u4_ofst */
/*  Returns       : TEV decoded syntax element                               */
/*                                                                           */
/*  Issues        : Does not check if ps_bitstrm u4_ofst exceeds max ps_bitstrm i4_size  */
/*                  for performamce. Caller might have to do error resilence */
/*                  check for bitstream overflow                             */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         19 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
UWORD32 ih264d_tev_range1(UWORD32 *pu4_bitstrm_ofst, UWORD32 *pu4_bitstrm_buf)
{
    UWORD32 u4_code;
    GETBIT(u4_code, *pu4_bitstrm_ofst, pu4_bitstrm_buf);
    return (!u4_code);
}

/*!
 **************************************************************************
 * \if Function name : ih264d_uvlc \endif
 *
 * \brief
 *
 *    Reads the unsigned/signed/truncated integer Exp-Golomb-coded syntax element
 *    with the left bit first. The parsing process for this descriptor is specified
 *    in subclause 9.1.
 *
 * \param ps_bitstrm       : Pointer to Bitstream Structure .
 * \param u4_range           : Range value in case of Truncated Exp-Golomb-code
 * \param pi_bitstrm_ofst : Pointer to the local copy of Bitstream u4_ofst
 * \param u1_flag            : Flag indicating the case of UEV,SEV or TEV
 * \param u4_bitstrm_ofst : Local copy of Bitstream u4_ofst
 * \param pu4_bitstrm_buf : Pointer to the Bitstream buffer
 *
 * \return
 *    Returns Code Value.
 *
 **************************************************************************
 */

WORD32 ih264d_uvlc(dec_bit_stream_t *ps_bitstrm,
                   UWORD32 u4_range,
                   UWORD32 *pi_bitstrm_ofst,
                   UWORD8 u1_flag,
                   UWORD32 u4_bitstrm_ofst,
                   UWORD32 *pu4_bitstrm_buf)
{
    UWORD32 word, word2, cur_bit, cur_word, code_val, code_num, clz;

    SWITCHOFFTRACE;
    cur_bit = u4_bitstrm_ofst & 0x1F;
    cur_word = u4_bitstrm_ofst >> 5;
    word = pu4_bitstrm_buf[cur_word];
    word2 = pu4_bitstrm_buf[cur_word + 1];

    if(cur_bit != 0)
    {
        word <<= cur_bit;
        word2 >>= (32 - cur_bit);
        word |= word2;
    }

    if(u1_flag == TEV && u4_range == 1)
    {
        word >>= 31;
        word = 1 - word;
        (*pi_bitstrm_ofst)++;
        ps_bitstrm->u4_ofst = *pi_bitstrm_ofst;
        return (WORD32)word;
    }

    //finding clz
    {
        UWORD32 ui32_code, ui32_mask;

        ui32_code = word;
        ui32_mask = 0x80000000;
        clz = 0;

        /* DSP implements this with LMBD instruction */
        /* so there we don't need to break the loop */
        while(!(ui32_code & ui32_mask))
        {
            clz++;
            ui32_mask >>= 1;
            if(0 == ui32_mask)
                break;
        }
    }

    if(clz == 0)
    {
        *pi_bitstrm_ofst = *pi_bitstrm_ofst + (2 * clz) + 1;
        ps_bitstrm->u4_ofst = *pi_bitstrm_ofst;
        return 0;
    }

    word <<= (clz + 1);
    word >>= (32 - clz);
    code_num = (1 << clz) + word - 1;
    *pi_bitstrm_ofst = *pi_bitstrm_ofst + (2 * clz) + 1;
    ps_bitstrm->u4_ofst = *pi_bitstrm_ofst;

    if(u1_flag == TEV || u1_flag == UEV)
        return (WORD32)code_num;

    code_val = (code_num + 1) >> 1;
    if(!(code_num & 0x01))
        return -((WORD32)code_val);
    return (WORD32)code_val;

}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_cavlc_4x4res_block_totalcoeff_1                          */
/*                                                                           */
/*  Description   : This function does cavlc decoding of 4x4 block residual  */
/*                  coefficient when total coeff is equal to 1. The parsing  */
/*                  is done as defined in section 9.2.2 and 9.2.3 of the     */
/*                  H264 standard.                                           */
/*                                                                           */
/*  Inputs        : <What inputs does the function take?>                    */
/*  Globals       : <Does it use any global variables?>                      */
/*  Processing    : <Describe how the function operates - include algorithm  */
/*                  description>                                             */
/*  Outputs       : <What does the function produce?>                        */
/*  Returns       : <What does the function return?>                         */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         25 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
WORD32 ih264d_cavlc_4x4res_block_totalcoeff_1(UWORD32 u4_isdc,
                                           UWORD32 u4_total_coeff_trail_one,
                                           dec_bit_stream_t *ps_bitstrm)
{

    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 u4_bitstream_offset = ps_bitstrm->u4_ofst;
    UWORD32 u4_trailing_ones = u4_total_coeff_trail_one & 0xFFFF;
    WORD32 i2_level;
    UWORD32 u4_tot_zero, u4_ldz, u4_scan_pos;

    tu_sblk4x4_coeff_data_t *ps_tu_4x4;
    WORD16 *pi2_coeff_data;
    dec_struct_t *ps_dec = (dec_struct_t *)ps_bitstrm->pv_codec_handle;

    ps_tu_4x4 = (tu_sblk4x4_coeff_data_t *)ps_dec->pv_parse_tu_coeff_data;
    ps_tu_4x4->u2_sig_coeff_map = 0;
    pi2_coeff_data = &ps_tu_4x4->ai2_level[0];


    if(u4_trailing_ones)
    {
        UWORD32 u4_sign;
        /****************************************************************/
        /* Decode Trailing One as in section 9.2.2                      */
        /****************************************************************/
        GETBIT(u4_sign, u4_bitstream_offset, pu4_bitstrm_buf);
        i2_level = u4_sign ? -1 : 1;
    }
    else
    {
        /****************************************************************/
        /* Decoding Level based on prefix and suffix  as in 9.2.2       */
        /****************************************************************/
        UWORD32 u4_lev_suffix, u4_lev_suffix_size;
        WORD32 u2_lev_code, u2_abs_value;
        UWORD32 u4_lev_prefix;
        /***************************************************************/
        /* Find leading zeros in next 32 bits                          */
        /***************************************************************/
        FIND_ONE_IN_STREAM_32(u4_lev_prefix, u4_bitstream_offset,
                              pu4_bitstrm_buf);
        u2_lev_code = (2 + MIN(u4_lev_prefix, 15));

        if(14 == u4_lev_prefix)
            u4_lev_suffix_size = 4;
        else if(15 <= u4_lev_prefix)
        {
            u2_lev_code += 15;
            u4_lev_suffix_size = u4_lev_prefix - 3;
        }
        else
            u4_lev_suffix_size = 0;

        //HP_LEVEL_PREFIX
        if(16 <= u4_lev_prefix)
        {
            u2_lev_code += ((1 << (u4_lev_prefix - 3)) - 4096);
        }
        if(u4_lev_suffix_size)
        {
            GETBITS(u4_lev_suffix, u4_bitstream_offset, pu4_bitstrm_buf,
                    u4_lev_suffix_size);
            u2_lev_code += u4_lev_suffix;
        }

        u2_abs_value = (u2_lev_code + 2) >> 1;
        /*********************************************************/
        /* If Level code is odd, level is negative else positive */
        /*********************************************************/
        i2_level = (u2_lev_code & 1) ? -u2_abs_value : u2_abs_value;

    }

    /****************************************************************/
    /* Decoding total zeros as in section 9.2.3, table 9.7          */
    /****************************************************************/
    FIND_ONE_IN_STREAM_LEN(u4_ldz, u4_bitstream_offset, pu4_bitstrm_buf, 8);

    if(u4_ldz)
    {
        GETBIT(u4_tot_zero, u4_bitstream_offset, pu4_bitstrm_buf);
        u4_tot_zero = (u4_ldz << 1) - u4_tot_zero;
    }
    else
        u4_tot_zero = 0;

    /***********************************************************************/
    /* Inverse scan and store  residual coeff. Update the bitstream u4_ofst */
    /***********************************************************************/
    u4_scan_pos = u4_tot_zero + u4_isdc;
    if(u4_scan_pos > 15)
        return -1;

    SET_BIT(ps_tu_4x4->u2_sig_coeff_map, u4_scan_pos);
    *pi2_coeff_data++ = i2_level;


    {
        WORD32 offset;
        offset = (UWORD8 *)pi2_coeff_data - (UWORD8 *)ps_tu_4x4;
        offset = ALIGN4(offset);
        ps_dec->pv_parse_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_parse_tu_coeff_data + offset);
    }

    ps_bitstrm->u4_ofst = u4_bitstream_offset;
    return 0;
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_cavlc_4x4res_block_totalcoeff_2to10                      */
/*                                                                           */
/*  Description   : This function does cavlc decoding of 4x4 block residual  */
/*                  coefficient when total coeffs are between two and ten    */
/*                  inclusive. Parsing is done as defined in section 9.2.2   */
/*                  and 9.2.3 the H264 standard.                             */
/*                                                                           */
/*  Inputs        : <What inputs does the function take?>                    */
/*  Globals       : <Does it use any global variables?>                      */
/*  Processing    : <Describe how the function operates - include algorithm  */
/*                  description>                                             */
/*  Outputs       : <What does the function produce?>                        */
/*  Returns       : <What does the function return?>                         */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         25 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/

WORD32 ih264d_cavlc_4x4res_block_totalcoeff_2to10(UWORD32 u4_isdc,
                                               UWORD32 u4_total_coeff_trail_one, /*!<TotalCoefficients<<16+trailingones*/
                                               dec_bit_stream_t *ps_bitstrm)
{
    UWORD32 u4_total_zeroes;
    WORD32 i;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 u4_bitstream_offset = ps_bitstrm->u4_ofst;
    UWORD32 u4_trailing_ones = u4_total_coeff_trail_one & 0xFFFF;
    UWORD32 u4_total_coeff = u4_total_coeff_trail_one >> 16;
    // To avoid error check at 4x4 level, allocating for 3 extra levels(16+3)
    // since u4_trailing_ones can at the max be 3. This will be required when
    // u4_total_coeff is less than u4_trailing_ones
    WORD16 ai2_level_arr[19];
    WORD16 *i2_level_arr = &ai2_level_arr[3];

    tu_sblk4x4_coeff_data_t *ps_tu_4x4;
    WORD16 *pi2_coeff_data;
    dec_struct_t *ps_dec = (dec_struct_t *)ps_bitstrm->pv_codec_handle;

    ps_tu_4x4 = (tu_sblk4x4_coeff_data_t *)ps_dec->pv_parse_tu_coeff_data;
    ps_tu_4x4->u2_sig_coeff_map = 0;
    pi2_coeff_data = &ps_tu_4x4->ai2_level[0];

    i = u4_total_coeff - 1;

    if(u4_trailing_ones)
    {
        /*********************************************************************/
        /* Decode Trailing Ones                                              */
        /* read the sign of T1's and put them in level array                 */
        /*********************************************************************/
        UWORD32 u4_signs, u4_cnt = u4_trailing_ones;
        WORD16 (*ppi2_trlone_lkup)[3] =
                        (WORD16 (*)[3])gai2_ih264d_trailing_one_level;
        WORD16 *pi2_trlone_lkup;

        GETBITS(u4_signs, u4_bitstream_offset, pu4_bitstrm_buf, u4_cnt);

        pi2_trlone_lkup = ppi2_trlone_lkup[(1 << u4_cnt) - 2 + u4_signs];

        while(u4_cnt)
        {
            i2_level_arr[i--] = *pi2_trlone_lkup++;
            u4_cnt--;
        }
    }

    /****************************************************************/
    /* Decoding Levels Begins                                       */
    /****************************************************************/
    if(i >= 0)
    {
        /****************************************************************/
        /* First level is decoded outside the loop as it has lot of     */
        /* special cases.                                               */
        /****************************************************************/
        UWORD32 u4_lev_suffix, u4_suffix_len, u4_lev_suffix_size;
        WORD32 u2_lev_code, u2_abs_value;
        UWORD32 u4_lev_prefix;

        /***************************************************************/
        /* u4_suffix_len = 0,  Find leading zeros in next 32 bits      */
        /***************************************************************/
        FIND_ONE_IN_STREAM_32(u4_lev_prefix, u4_bitstream_offset,
                              pu4_bitstrm_buf);

        /*********************************************************/
        /* Special decoding case when trailing ones are 3        */
        /*********************************************************/
        u2_lev_code = MIN(15, u4_lev_prefix);

        u2_lev_code += (3 == u4_trailing_ones) ? 0 : 2;

        if(14 == u4_lev_prefix)
            u4_lev_suffix_size = 4;
        else if(15 <= u4_lev_prefix)
        {
            u2_lev_code += 15;
            u4_lev_suffix_size = u4_lev_prefix - 3;
        }
        else
            u4_lev_suffix_size = 0;

        //HP_LEVEL_PREFIX
        if(16 <= u4_lev_prefix)
        {
            u2_lev_code += ((1 << (u4_lev_prefix - 3)) - 4096);
        }
        if(u4_lev_suffix_size)
        {
            GETBITS(u4_lev_suffix, u4_bitstream_offset, pu4_bitstrm_buf,
                    u4_lev_suffix_size);
            u2_lev_code += u4_lev_suffix;
        }

        u2_abs_value = (u2_lev_code + 2) >> 1;
        /*********************************************************/
        /* If Level code is odd, level is negative else positive */
        /*********************************************************/
        i2_level_arr[i--] = (u2_lev_code & 1) ? -u2_abs_value : u2_abs_value;

        u4_suffix_len = (u2_abs_value > 3) ? 2 : 1;

        /*********************************************************/
        /* Now loop over the remaining levels                    */
        /*********************************************************/
        while(i >= 0)
        {

            /***************************************************************/
            /* Find leading zeros in next 32 bits                          */
            /***************************************************************/
            FIND_ONE_IN_STREAM_32(u4_lev_prefix, u4_bitstream_offset,
                                  pu4_bitstrm_buf);

            u4_lev_suffix_size =
                            (15 <= u4_lev_prefix) ?
                                            (u4_lev_prefix - 3) : u4_suffix_len;

            /*********************************************************/
            /* Compute level code using prefix and suffix            */
            /*********************************************************/
            GETBITS(u4_lev_suffix, u4_bitstream_offset, pu4_bitstrm_buf,
                    u4_lev_suffix_size);
            u2_lev_code = (MIN(15,u4_lev_prefix) << u4_suffix_len)
                            + u4_lev_suffix;

            //HP_LEVEL_PREFIX
            if(16 <= u4_lev_prefix)
            {
                u2_lev_code += ((1 << (u4_lev_prefix - 3)) - 4096);
            }
            u2_abs_value = (u2_lev_code + 2) >> 1;

            /*********************************************************/
            /* If Level code is odd, level is negative else positive */
            /*********************************************************/
            i2_level_arr[i--] =
                            (u2_lev_code & 1) ? -u2_abs_value : u2_abs_value;

            /*********************************************************/
            /* Increment suffix length if required                   */
            /*********************************************************/
            u4_suffix_len +=
                            (u4_suffix_len < 6) ?
                                            (u2_abs_value
                                                            > (3
                                                                            << (u4_suffix_len
                                                                                            - 1))) :
                                            0;
        }

        /****************************************************************/
        /* Decoding Levels Ends                                         */
        /****************************************************************/
    }

    /****************************************************************/
    /* Decoding total zeros as in section 9.2.3, table 9.7          */
    /****************************************************************/
    {
        UWORD32 u4_index;
        const UWORD8 (*ppu1_total_zero_lkup)[64] =
                        (const UWORD8 (*)[64])gau1_ih264d_table_total_zero_2to10;

        NEXTBITS(u4_index, u4_bitstream_offset, pu4_bitstrm_buf, 6);
        u4_total_zeroes = ppu1_total_zero_lkup[u4_total_coeff - 2][u4_index];

        FLUSHBITS(u4_bitstream_offset, (u4_total_zeroes >> 4));
        u4_total_zeroes &= 0xf;
    }

    /**************************************************************/
    /* Decode the runs and form the coefficient buffer            */
    /**************************************************************/
    {
        const UWORD8 *pu1_table_runbefore;
        UWORD32 u4_run;
        WORD32 k;
        WORD32 u4_scan_pos = u4_total_coeff + u4_total_zeroes - 1 + u4_isdc;
        WORD32 u4_zeroes_left = u4_total_zeroes;
        k = u4_total_coeff - 1;

        /**************************************************************/
        /* Decoding Runs Begin for zeros left > 6                     */
        /**************************************************************/
        while((u4_zeroes_left > 6) && k)
        {
            UWORD32 u4_code;

            NEXTBITS(u4_code, u4_bitstream_offset, pu4_bitstrm_buf, 3);

            if(u4_code != 0)
            {
                FLUSHBITS(u4_bitstream_offset, 3);
                u4_run = (7 - u4_code);
            }
            else
            {

                FIND_ONE_IN_STREAM_LEN(u4_code, u4_bitstream_offset,
                                       pu4_bitstrm_buf, 11);
                u4_run = (4 + u4_code);
            }

            SET_BIT(ps_tu_4x4->u2_sig_coeff_map, u4_scan_pos);
            *pi2_coeff_data++ = i2_level_arr[k--];
            u4_zeroes_left -= (WORD32)u4_run;
            u4_scan_pos -= (WORD32)(u4_run + 1);
        }

        if (u4_zeroes_left < 0 || u4_scan_pos < 0)
            return -1;

        /**************************************************************/
        /* Decoding Runs for 0 < zeros left <=6                       */
        /**************************************************************/
        pu1_table_runbefore = (UWORD8 *)gau1_ih264d_table_run_before;
        while((u4_zeroes_left > 0) && k)
        {
            UWORD32 u4_code;
            NEXTBITS(u4_code, u4_bitstream_offset, pu4_bitstrm_buf, 3);

            u4_code = pu1_table_runbefore[u4_code + (u4_zeroes_left << 3)];
            u4_run = u4_code >> 2;

            FLUSHBITS(u4_bitstream_offset, (u4_code & 0x03));

            SET_BIT(ps_tu_4x4->u2_sig_coeff_map, u4_scan_pos);
            *pi2_coeff_data++ = i2_level_arr[k--];
            u4_zeroes_left -= (WORD32)u4_run;
            u4_scan_pos -= (WORD32)(u4_run + 1);
        }
        if (u4_zeroes_left < 0 || u4_scan_pos < 0)
            return -1;
        /**************************************************************/
        /* Decoding Runs End                                          */
        /**************************************************************/

        /**************************************************************/
        /* Copy the remaining coefficients                            */
        /**************************************************************/
        while(k >= 0)
        {

            SET_BIT(ps_tu_4x4->u2_sig_coeff_map, u4_scan_pos);
            *pi2_coeff_data++ = i2_level_arr[k--];
            u4_scan_pos--;
        }
    }

    {
        WORD32 offset;
        offset = (UWORD8 *)pi2_coeff_data - (UWORD8 *)ps_tu_4x4;
        offset = ALIGN4(offset);
        ps_dec->pv_parse_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_parse_tu_coeff_data + offset);
    }

    ps_bitstrm->u4_ofst = u4_bitstream_offset;
    return 0;
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_cavlc_4x4res_block_totalcoeff_11to16                     */
/*                                                                           */
/*  Description   : This function does cavlc decoding of 4x4 block residual  */
/*                  coefficient when total coeffs are greater than ten.      */
/*                  Parsing is done as defined in section 9.2.2 and 9.2.3 of */
/*                  the H264 standard.                                       */
/*                                                                           */
/*  Inputs        : <What inputs does the function take?>                    */
/*  Globals       : <Does it use any global variables?>                      */
/*  Processing    : <Describe how the function operates - include algorithm  */
/*                  description>                                             */
/*  Outputs       : <What does the function produce?>                        */
/*  Returns       : <What does the function return?>                         */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         25 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/

WORD32 ih264d_cavlc_4x4res_block_totalcoeff_11to16(UWORD32 u4_isdc,
                                                UWORD32 u4_total_coeff_trail_one, /*!<TotalCoefficients<<16+trailingones*/
                                                dec_bit_stream_t *ps_bitstrm )
{
    UWORD32 u4_total_zeroes;
    WORD32 i;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 u4_bitstream_offset = ps_bitstrm->u4_ofst;
    UWORD32 u4_trailing_ones = u4_total_coeff_trail_one & 0xFFFF;
    UWORD32 u4_total_coeff = u4_total_coeff_trail_one >> 16;
    // To avoid error check at 4x4 level, allocating for 3 extra levels(16+3)
    // since u4_trailing_ones can at the max be 3. This will be required when
    // u4_total_coeff is less than u4_trailing_ones
    WORD16 ai2_level_arr[19];//
    WORD16 *i2_level_arr = &ai2_level_arr[3];

    tu_sblk4x4_coeff_data_t *ps_tu_4x4;
    WORD16 *pi2_coeff_data;
    dec_struct_t *ps_dec = (dec_struct_t *)ps_bitstrm->pv_codec_handle;

    ps_tu_4x4 = (tu_sblk4x4_coeff_data_t *)ps_dec->pv_parse_tu_coeff_data;
    ps_tu_4x4->u2_sig_coeff_map = 0;
    pi2_coeff_data = &ps_tu_4x4->ai2_level[0];

    i = u4_total_coeff - 1;
    if(u4_trailing_ones)
    {
        /*********************************************************************/
        /* Decode Trailing Ones                                              */
        /* read the sign of T1's and put them in level array                 */
        /*********************************************************************/
        UWORD32 u4_signs, u4_cnt = u4_trailing_ones;
        WORD16 (*ppi2_trlone_lkup)[3] =
                        (WORD16 (*)[3])gai2_ih264d_trailing_one_level;
        WORD16 *pi2_trlone_lkup;

        GETBITS(u4_signs, u4_bitstream_offset, pu4_bitstrm_buf, u4_cnt);

        pi2_trlone_lkup = ppi2_trlone_lkup[(1 << u4_cnt) - 2 + u4_signs];

        while(u4_cnt)
        {
            i2_level_arr[i--] = *pi2_trlone_lkup++;
            u4_cnt--;
        }
    }

    /****************************************************************/
    /* Decoding Levels Begins                                       */
    /****************************************************************/
    if(i >= 0)
    {
        /****************************************************************/
        /* First level is decoded outside the loop as it has lot of     */
        /* special cases.                                               */
        /****************************************************************/
        UWORD32 u4_lev_suffix, u4_suffix_len, u4_lev_suffix_size;
        UWORD16 u2_lev_code, u2_abs_value;
        UWORD32 u4_lev_prefix;

        if(u4_trailing_ones < 3)
        {
            /*********************************************************/
            /* u4_suffix_len = 1                                     */
            /*********************************************************/
            /***************************************************************/
            /* Find leading zeros in next 32 bits                          */
            /***************************************************************/
            FIND_ONE_IN_STREAM_32(u4_lev_prefix, u4_bitstream_offset,
                                  pu4_bitstrm_buf);

            u4_lev_suffix_size =
                            (15 <= u4_lev_prefix) ? (u4_lev_prefix - 3) : 1;

            GETBITS(u4_lev_suffix, u4_bitstream_offset, pu4_bitstrm_buf,
                    u4_lev_suffix_size);
            u2_lev_code = 2 + (MIN(u4_lev_prefix,15) << 1) + u4_lev_suffix;

            //HP_LEVEL_PREFIX
            if(16 <= u4_lev_prefix)
            {
                u2_lev_code += ((1 << (u4_lev_prefix - 3)) - 4096);
            }
        }
        else
        {
            /*********************************************************/
            /*u4_suffix_len = 0                                      */
            /*********************************************************/
            /***************************************************************/
            /* Find leading zeros in next 32 bits                          */
            /***************************************************************/
            FIND_ONE_IN_STREAM_32(u4_lev_prefix, u4_bitstream_offset,
                                  pu4_bitstrm_buf);

            /*********************************************************/
            /* Special decoding case when trailing ones are 3        */
            /*********************************************************/
            u2_lev_code = MIN(15, u4_lev_prefix);

            u2_lev_code += (3 == u4_trailing_ones) ? 0 : (2);

            if(14 == u4_lev_prefix)
                u4_lev_suffix_size = 4;
            else if(15 <= u4_lev_prefix)
            {
                u2_lev_code += 15;
                u4_lev_suffix_size = (u4_lev_prefix - 3);
            }
            else
                u4_lev_suffix_size = 0;

            //HP_LEVEL_PREFIX
            if(16 <= u4_lev_prefix)
            {
                u2_lev_code += ((1 << (u4_lev_prefix - 3)) - 4096);
            }
            if(u4_lev_suffix_size)
            {
                GETBITS(u4_lev_suffix, u4_bitstream_offset, pu4_bitstrm_buf,
                        u4_lev_suffix_size);
                u2_lev_code += u4_lev_suffix;
            }
        }

        u2_abs_value = (u2_lev_code + 2) >> 1;
        /*********************************************************/
        /* If Level code is odd, level is negative else positive */
        /*********************************************************/
        i2_level_arr[i--] = (u2_lev_code & 1) ? -u2_abs_value : u2_abs_value;

        u4_suffix_len = (u2_abs_value > 3) ? 2 : 1;

        /*********************************************************/
        /* Now loop over the remaining levels                    */
        /*********************************************************/
        while(i >= 0)
        {

            /***************************************************************/
            /* Find leading zeros in next 32 bits                          */
            /***************************************************************/
            FIND_ONE_IN_STREAM_32(u4_lev_prefix, u4_bitstream_offset,
                                  pu4_bitstrm_buf);

            u4_lev_suffix_size =
                            (15 <= u4_lev_prefix) ?
                                            (u4_lev_prefix - 3) : u4_suffix_len;

            /*********************************************************/
            /* Compute level code using prefix and suffix            */
            /*********************************************************/
            GETBITS(u4_lev_suffix, u4_bitstream_offset, pu4_bitstrm_buf,
                    u4_lev_suffix_size);
            u2_lev_code = (MIN(15,u4_lev_prefix) << u4_suffix_len)
                            + u4_lev_suffix;

            //HP_LEVEL_PREFIX
            if(16 <= u4_lev_prefix)
            {
                u2_lev_code += ((1 << (u4_lev_prefix - 3)) - 4096);
            }
            u2_abs_value = (u2_lev_code + 2) >> 1;

            /*********************************************************/
            /* If Level code is odd, level is negative else positive */
            /*********************************************************/
            i2_level_arr[i--] =
                            (u2_lev_code & 1) ? -u2_abs_value : u2_abs_value;

            /*********************************************************/
            /* Increment suffix length if required                   */
            /*********************************************************/
            u4_suffix_len +=
                            (u4_suffix_len < 6) ?
                                            (u2_abs_value
                                                            > (3
                                                                            << (u4_suffix_len
                                                                                            - 1))) :
                                            0;
        }

        /****************************************************************/
        /* Decoding Levels Ends                                         */
        /****************************************************************/
    }

    if(u4_total_coeff < (16 - u4_isdc))
    {
        UWORD32 u4_index;
        const UWORD8 (*ppu1_total_zero_lkup)[16] =
                        (const UWORD8 (*)[16])gau1_ih264d_table_total_zero_11to15;

        NEXTBITS(u4_index, u4_bitstream_offset, pu4_bitstrm_buf, 4);
        u4_total_zeroes = ppu1_total_zero_lkup[u4_total_coeff - 11][u4_index];

        FLUSHBITS(u4_bitstream_offset, (u4_total_zeroes >> 4));
        u4_total_zeroes &= 0xf;
    }
    else
        u4_total_zeroes = 0;

    /**************************************************************/
    /* Decode the runs and form the coefficient buffer            */
    /**************************************************************/
    {
        const UWORD8 *pu1_table_runbefore;
        UWORD32 u4_run;
        WORD32 k;
        WORD32 u4_scan_pos = u4_total_coeff + u4_total_zeroes - 1 + u4_isdc;
        WORD32 u4_zeroes_left = u4_total_zeroes;
        k = u4_total_coeff - 1;

        /**************************************************************/
        /* Decoding Runs for 0 < zeros left <=6                       */
        /**************************************************************/
        pu1_table_runbefore = (UWORD8 *)gau1_ih264d_table_run_before;
        while((u4_zeroes_left > 0) && k)
        {
            UWORD32 u4_code;
            NEXTBITS(u4_code, u4_bitstream_offset, pu4_bitstrm_buf, 3);

            u4_code = pu1_table_runbefore[u4_code + (u4_zeroes_left << 3)];
            u4_run = u4_code >> 2;

            FLUSHBITS(u4_bitstream_offset, (u4_code & 0x03));
            SET_BIT(ps_tu_4x4->u2_sig_coeff_map, u4_scan_pos);
            *pi2_coeff_data++ = i2_level_arr[k--];
            u4_zeroes_left -= (WORD32)u4_run;
            u4_scan_pos -= (WORD32)(u4_run + 1);
        }
        if (u4_zeroes_left < 0 || u4_scan_pos < 0)
          return -1;

        /**************************************************************/
        /* Decoding Runs End                                          */
        /**************************************************************/

        /**************************************************************/
        /* Copy the remaining coefficients                            */
        /**************************************************************/
        while(k >= 0)
        {
            SET_BIT(ps_tu_4x4->u2_sig_coeff_map, u4_scan_pos);
            *pi2_coeff_data++ = i2_level_arr[k--];
            u4_scan_pos--;
        }
    }

    {
        WORD32 offset;
        offset = (UWORD8 *)pi2_coeff_data - (UWORD8 *)ps_tu_4x4;
        offset = ALIGN4(offset);
        ps_dec->pv_parse_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_parse_tu_coeff_data + offset);
    }

    ps_bitstrm->u4_ofst = u4_bitstream_offset;
    return 0;
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_rest_of_residual_cav_chroma_dc_block              */
/*                                                                           */
/*  Description   : This function does the Cavlc parsing of the bitstream    */
/*                  for chroma dc coefficients                               */
/*  Inputs        : <What inputs does the function take?>                    */
/*  Globals       : <Does it use any global variables?>                      */
/*  Processing    : <Describe how the function operates - include algorithm  */
/*                  description>                                             */
/*  Outputs       : <What does the function produce?>                        */
/*  Returns       : <What does the function return?>                         */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         15 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
void ih264d_rest_of_residual_cav_chroma_dc_block(UWORD32 u4_total_coeff_trail_one,
                                                 dec_bit_stream_t *ps_bitstrm)
{
    UWORD32 u4_total_zeroes;
    WORD16 i;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 u4_bitstream_offset = ps_bitstrm->u4_ofst;
    UWORD32 u4_trailing_ones = u4_total_coeff_trail_one & 0xFFFF;
    UWORD32 u4_total_coeff = u4_total_coeff_trail_one >> 16;
    // To avoid error check at 4x4 level, allocating for 3 extra levels(4+3)
    // since u4_trailing_ones can at the max be 3. This will be required when
    // u4_total_coeff is less than u4_trailing_ones
    WORD16 ai2_level_arr[7];//
    WORD16 *i2_level_arr = &ai2_level_arr[3];

    tu_sblk4x4_coeff_data_t *ps_tu_4x4;
    WORD16 *pi2_coeff_data;
    dec_struct_t *ps_dec = (dec_struct_t *)ps_bitstrm->pv_codec_handle;

    ps_tu_4x4 = (tu_sblk4x4_coeff_data_t *)ps_dec->pv_parse_tu_coeff_data;
    ps_tu_4x4->u2_sig_coeff_map = 0;
    pi2_coeff_data = &ps_tu_4x4->ai2_level[0];

    i = u4_total_coeff - 1;
    if(u4_trailing_ones)
    {
        /*********************************************************************/
        /* Decode Trailing Ones                                              */
        /* read the sign of T1's and put them in level array                 */
        /*********************************************************************/
        UWORD32 u4_signs, u4_cnt = u4_trailing_ones;
        WORD16 (*ppi2_trlone_lkup)[3] =
                        (WORD16 (*)[3])gai2_ih264d_trailing_one_level;
        WORD16 *pi2_trlone_lkup;

        GETBITS(u4_signs, u4_bitstream_offset, pu4_bitstrm_buf, u4_cnt);

        pi2_trlone_lkup = ppi2_trlone_lkup[(1 << u4_cnt) - 2 + u4_signs];

        while(u4_cnt)
        {
            i2_level_arr[i--] = *pi2_trlone_lkup++;
            u4_cnt--;
        }
    }

    /****************************************************************/
    /* Decoding Levels Begins                                       */
    /****************************************************************/
    if(i >= 0)
    {
        /****************************************************************/
        /* First level is decoded outside the loop as it has lot of     */
        /* special cases.                                               */
        /****************************************************************/
        UWORD32 u4_lev_suffix, u4_suffix_len, u4_lev_suffix_size;
        UWORD16 u2_lev_code, u2_abs_value;
        UWORD32 u4_lev_prefix;

        /***************************************************************/
        /* u4_suffix_len = 0,  Find leading zeros in next 32 bits      */
        /***************************************************************/
        FIND_ONE_IN_STREAM_32(u4_lev_prefix, u4_bitstream_offset,
                              pu4_bitstrm_buf);

        /*********************************************************/
        /* Special decoding case when trailing ones are 3        */
        /*********************************************************/
        u2_lev_code = MIN(15, u4_lev_prefix);

        u2_lev_code += (3 == u4_trailing_ones) ? 0 : (2);

        if(14 == u4_lev_prefix)
            u4_lev_suffix_size = 4;
        else if(15 <= u4_lev_prefix)
        {
            u2_lev_code += 15;
            u4_lev_suffix_size = u4_lev_prefix - 3;
        }
        else
            u4_lev_suffix_size = 0;

        //HP_LEVEL_PREFIX
        if(16 <= u4_lev_prefix)
        {
            u2_lev_code += ((1 << (u4_lev_prefix - 3)) - 4096);
        }
        if(u4_lev_suffix_size)
        {
            GETBITS(u4_lev_suffix, u4_bitstream_offset, pu4_bitstrm_buf,
                    u4_lev_suffix_size);
            u2_lev_code += u4_lev_suffix;
        }

        u2_abs_value = (u2_lev_code + 2) >> 1;
        /*********************************************************/
        /* If Level code is odd, level is negative else positive */
        /*********************************************************/
        i2_level_arr[i--] = (u2_lev_code & 1) ? -u2_abs_value : u2_abs_value;

        u4_suffix_len = (u2_abs_value > 3) ? 2 : 1;

        /*********************************************************/
        /* Now loop over the remaining levels                    */
        /*********************************************************/
        while(i >= 0)
        {

            /***************************************************************/
            /* Find leading zeros in next 32 bits                          */
            /***************************************************************/
            FIND_ONE_IN_STREAM_32(u4_lev_prefix, u4_bitstream_offset,
                                  pu4_bitstrm_buf);

            u4_lev_suffix_size =
                            (15 <= u4_lev_prefix) ?
                                            (u4_lev_prefix - 3) : u4_suffix_len;

            /*********************************************************/
            /* Compute level code using prefix and suffix            */
            /*********************************************************/
            GETBITS(u4_lev_suffix, u4_bitstream_offset, pu4_bitstrm_buf,
                    u4_lev_suffix_size);
            u2_lev_code = (MIN(u4_lev_prefix,15) << u4_suffix_len)
                            + u4_lev_suffix;

            //HP_LEVEL_PREFIX
            if(16 <= u4_lev_prefix)
            {
                u2_lev_code += ((1 << (u4_lev_prefix - 3)) - 4096);
            }
            u2_abs_value = (u2_lev_code + 2) >> 1;

            /*********************************************************/
            /* If Level code is odd, level is negative else positive */
            /*********************************************************/
            i2_level_arr[i--] =
                            (u2_lev_code & 1) ? -u2_abs_value : u2_abs_value;

            /*********************************************************/
            /* Increment suffix length if required                   */
            /*********************************************************/
            u4_suffix_len += (u2_abs_value > (3 << (u4_suffix_len - 1)));
        }

        /****************************************************************/
        /* Decoding Levels Ends                                         */
        /****************************************************************/
    }

    if(u4_total_coeff < 4)
    {
        UWORD32 u4_max_ldz = (4 - u4_total_coeff);
        FIND_ONE_IN_STREAM_LEN(u4_total_zeroes, u4_bitstream_offset,
                               pu4_bitstrm_buf, u4_max_ldz);
    }
    else
        u4_total_zeroes = 0;

    /**************************************************************/
    /* Decode the runs and form the coefficient buffer            */
    /**************************************************************/
    {
        const UWORD8 *pu1_table_runbefore;
        UWORD32 u4_run;
        WORD32 u4_scan_pos = (u4_total_coeff + u4_total_zeroes - 1);
        UWORD32 u4_zeroes_left = u4_total_zeroes;
        i = u4_total_coeff - 1;

        /**************************************************************/
        /* Decoding Runs for 0 < zeros left <=6                       */
        /**************************************************************/
        pu1_table_runbefore = (UWORD8 *)gau1_ih264d_table_run_before;
        while(u4_zeroes_left && i)
        {
            UWORD32 u4_code;
            NEXTBITS(u4_code, u4_bitstream_offset, pu4_bitstrm_buf, 3);

            u4_code = pu1_table_runbefore[u4_code + (u4_zeroes_left << 3)];
            u4_run = u4_code >> 2;

            FLUSHBITS(u4_bitstream_offset, (u4_code & 0x03));
            SET_BIT(ps_tu_4x4->u2_sig_coeff_map, u4_scan_pos);
            *pi2_coeff_data++ = i2_level_arr[i--];
            u4_zeroes_left -= (WORD32)u4_run;
            u4_scan_pos -= (WORD32)(u4_run + 1);
        }
        /**************************************************************/
        /* Decoding Runs End                                          */
        /**************************************************************/

        /**************************************************************/
        /* Copy the remaining coefficients                            */
        /**************************************************************/
        while(i >= 0)
        {
            SET_BIT(ps_tu_4x4->u2_sig_coeff_map, u4_scan_pos);
            *pi2_coeff_data++ = i2_level_arr[i--];
            u4_scan_pos--;
        }
    }

    {
        WORD32 offset;
        offset = (UWORD8 *)pi2_coeff_data - (UWORD8 *)ps_tu_4x4;
        offset = ALIGN4(offset);
        ps_dec->pv_parse_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_parse_tu_coeff_data + offset);
    }

    ps_bitstrm->u4_ofst = u4_bitstream_offset;
}

/*!
 **************************************************************************
 * \if Function name : CavlcParsingInvScanInvQuant \endif
 *
 * \brief
 *    This function do cavlc parsing of coefficient tokens for any block
 *    type except chromDc and depending
 *    on whenther any coefficients to be parsed calls module
 *    RestOfResidualBlockCavlc.
 *
 * \return
 *    Returns total number of non-zero coefficients.
 *
 **************************************************************************
 */

WORD32 ih264d_cavlc_parse4x4coeff_n0to7(WORD16 *pi2_coeff_block,
                                        UWORD32 u4_isdc, /* is it a DC block */
                                        WORD32 u4_n,
                                        dec_struct_t *ps_dec,
                                        UWORD32 *pu4_total_coeff)
{
    dec_bit_stream_t *ps_bitstrm = ps_dec->ps_bitstrm;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 u4_bitstream_offset = ps_bitstrm->u4_ofst;
    UWORD32 u4_code, u4_index, u4_ldz;
    const UWORD16 *pu2_code = (const UWORD16*)gau2_ih264d_code_gx;
    const UWORD16 *pu2_offset_num_vlc =
                    (const UWORD16 *)gau2_ih264d_offset_num_vlc_tab;
    UWORD32 u4_offset_num_vlc = pu2_offset_num_vlc[u4_n];


    UNUSED(pi2_coeff_block);
    *pu4_total_coeff = 0;
    FIND_ONE_IN_STREAM_32(u4_ldz, u4_bitstream_offset, pu4_bitstrm_buf);
    NEXTBITS(u4_index, u4_bitstream_offset, pu4_bitstrm_buf, 3);
    u4_index += (u4_ldz << 3);
    u4_index += u4_offset_num_vlc;

    u4_index = MIN(u4_index, 303);
    u4_code = pu2_code[u4_index];

    FLUSHBITS(u4_bitstream_offset, (u4_code & 0x03));
    ps_bitstrm->u4_ofst = u4_bitstream_offset;
    *pu4_total_coeff = (u4_code >> 4);

    if(*pu4_total_coeff)
    {
        UWORD32 u4_trailing_ones, u4_offset, u4_total_coeff_tone;
        const UWORD8 *pu1_offset =
                        (UWORD8 *)gau1_ih264d_total_coeff_fn_ptr_offset;
        WORD32 ret;
        u4_trailing_ones = ((u4_code >> 2) & 0x03);
        u4_offset = pu1_offset[*pu4_total_coeff - 1];
        u4_total_coeff_tone = (*pu4_total_coeff << 16) | u4_trailing_ones;

        ret = ps_dec->pf_cavlc_4x4res_block[u4_offset](u4_isdc,
                                                       u4_total_coeff_tone,
                                                       ps_bitstrm);
        if(ret != 0)
            return ERROR_CAVLC_NUM_COEFF_T;
    }

    return OK;
}

WORD32 ih264d_cavlc_parse4x4coeff_n8(WORD16 *pi2_coeff_block,
                                     UWORD32 u4_isdc, /* is it a DC block */
                                     WORD32 u4_n,
                                     dec_struct_t *ps_dec,
                                     UWORD32 *pu4_total_coeff)
{

    dec_bit_stream_t *ps_bitstrm = ps_dec->ps_bitstrm;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 u4_bitstream_offset = ps_bitstrm->u4_ofst;
    UWORD32 u4_code;
    UNUSED(u4_n);
    UNUSED(pi2_coeff_block);
    GETBITS(u4_code, u4_bitstream_offset, pu4_bitstrm_buf, 6);
    ps_bitstrm->u4_ofst = u4_bitstream_offset;
    *pu4_total_coeff = 0;

    if(u4_code != 3)
    {
        UWORD8 *pu1_offset = (UWORD8 *)gau1_ih264d_total_coeff_fn_ptr_offset;
        UWORD32 u4_trailing_ones, u4_offset, u4_total_coeff_tone;

        *pu4_total_coeff = (u4_code >> 2) + 1;
        u4_trailing_ones = u4_code & 0x03;
        u4_offset = pu1_offset[*pu4_total_coeff - 1];
        u4_total_coeff_tone = (*pu4_total_coeff << 16) | u4_trailing_ones;

        ps_dec->pf_cavlc_4x4res_block[u4_offset](u4_isdc,
                                                 u4_total_coeff_tone,
                                                 ps_bitstrm);
    }

    return OK;
}

/*!
 **************************************************************************
 * \if Function name : ih264d_cavlc_parse_chroma_dc \endif
 *
 * \brief
 *    This function do cavlc parsing of coefficient tokens chromDc block
 *    and depending  on whenther any coefficients to be parsed calls module
 *    ih264d_rest_of_residual_cav_chroma_dc_block.
 *
 * \return
 *    Returns total number of non-zero coefficients.
 *
 **************************************************************************
 */

void ih264d_cavlc_parse_chroma_dc(dec_mb_info_t *ps_cur_mb_info,
                                  WORD16 *pi2_coeff_block,
                                  dec_bit_stream_t *ps_bitstrm,
                                  UWORD32 u4_scale_u,
                                  UWORD32 u4_scale_v,
                                  WORD32 i4_mb_inter_inc)
{
    UWORD32 u4_total_coeff, u4_trailing_ones, u4_total_coeff_tone, u4_code;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 u4_bitstream_offset = ps_bitstrm->u4_ofst;
    const UWORD8 *pu1_cav_chromdc = (const UWORD8*)gau1_ih264d_cav_chromdc_vld;
    UNUSED(i4_mb_inter_inc);
    /******************************************************************/
    /*  Chroma DC Block for U component                               */
    /******************************************************************/
    NEXTBITS(u4_code, u4_bitstream_offset, pu4_bitstrm_buf, 8);

    u4_code = pu1_cav_chromdc[u4_code];

    FLUSHBITS(u4_bitstream_offset, ((u4_code & 0x7) + 1));
    ps_bitstrm->u4_ofst = u4_bitstream_offset;

    u4_total_coeff = (u4_code >> 5);

    if(u4_total_coeff)
    {
        WORD32 i_z0, i_z1, i_z2, i_z3;
        tu_sblk4x4_coeff_data_t *ps_tu_4x4;
        dec_struct_t *ps_dec = (dec_struct_t *)ps_bitstrm->pv_codec_handle;
        WORD16 ai2_dc_coef[4];
        UWORD8 pu1_inv_scan[4] =
                        { 0, 1, 2, 3 };
        WORD16 *pi2_coeff_data =
                                    (WORD16 *)ps_dec->pv_parse_tu_coeff_data;

        ps_tu_4x4 = (tu_sblk4x4_coeff_data_t *)ps_dec->pv_parse_tu_coeff_data;

        u4_trailing_ones = ((u4_code >> 3) & 0x3);
        u4_total_coeff_tone = (u4_total_coeff << 16) | u4_trailing_ones;
        ih264d_rest_of_residual_cav_chroma_dc_block(u4_total_coeff_tone,
                                                    ps_bitstrm);

        ai2_dc_coef[0] = 0;
        ai2_dc_coef[1] = 0;
        ai2_dc_coef[2] = 0;
        ai2_dc_coef[3] = 0;

        ih264d_unpack_coeff4x4_dc_4x4blk(ps_tu_4x4,
                                         ai2_dc_coef,
                                         pu1_inv_scan);
        /*-------------------------------------------------------------------*/
        /* Inverse 2x2 transform and scaling  of chroma DC                   */
        /*-------------------------------------------------------------------*/
        i_z0 = (ai2_dc_coef[0] + ai2_dc_coef[2]);
        i_z1 = (ai2_dc_coef[0] - ai2_dc_coef[2]);
        i_z2 = (ai2_dc_coef[1] - ai2_dc_coef[3]);
        i_z3 = (ai2_dc_coef[1] + ai2_dc_coef[3]);

        /*-----------------------------------------------------------*/
        /* Scaling and storing the values back                       */
        /*-----------------------------------------------------------*/
        *pi2_coeff_data++ = (WORD16)(((i_z0 + i_z3) * (WORD32)u4_scale_u) >> 5);
        *pi2_coeff_data++ = (WORD16)(((i_z0 - i_z3) * (WORD32)u4_scale_u) >> 5);
        *pi2_coeff_data++ = (WORD16)(((i_z1 + i_z2) * (WORD32)u4_scale_u) >> 5);
        *pi2_coeff_data++ = (WORD16)(((i_z1 - i_z2) * (WORD32)u4_scale_u) >> 5);

        ps_dec->pv_parse_tu_coeff_data = (void *)pi2_coeff_data;

        SET_BIT(ps_cur_mb_info->u1_yuv_dc_block_flag,1);
    }

    /******************************************************************/
    /*  Chroma DC Block for V component                               */
    /******************************************************************/
    pi2_coeff_block += 64;
    u4_bitstream_offset = ps_bitstrm->u4_ofst;

    NEXTBITS(u4_code, u4_bitstream_offset, pu4_bitstrm_buf, 8);

    u4_code = pu1_cav_chromdc[u4_code];

    FLUSHBITS(u4_bitstream_offset, ((u4_code & 0x7) + 1));
    ps_bitstrm->u4_ofst = u4_bitstream_offset;

    u4_total_coeff = (u4_code >> 5);

    if(u4_total_coeff)
    {
        WORD32 i_z0, i_z1, i_z2, i_z3;
        tu_sblk4x4_coeff_data_t *ps_tu_4x4;
        dec_struct_t *ps_dec = (dec_struct_t *)ps_bitstrm->pv_codec_handle;
        WORD16 ai2_dc_coef[4];
        UWORD8 pu1_inv_scan[4] =
                        { 0, 1, 2, 3 };
        WORD16 *pi2_coeff_data =
                                    (WORD16 *)ps_dec->pv_parse_tu_coeff_data;

        ps_tu_4x4 = (tu_sblk4x4_coeff_data_t *)ps_dec->pv_parse_tu_coeff_data;

        u4_trailing_ones = ((u4_code >> 3) & 0x3);
        u4_total_coeff_tone = (u4_total_coeff << 16) | u4_trailing_ones;
        ih264d_rest_of_residual_cav_chroma_dc_block(u4_total_coeff_tone,
                                                    ps_bitstrm);

        ai2_dc_coef[0] = 0;
        ai2_dc_coef[1] = 0;
        ai2_dc_coef[2] = 0;
        ai2_dc_coef[3] = 0;

        ih264d_unpack_coeff4x4_dc_4x4blk(ps_tu_4x4,
                                         ai2_dc_coef,
                                         pu1_inv_scan);

        /*-------------------------------------------------------------------*/
        /* Inverse 2x2 transform and scaling  of chroma DC                   */
        /*-------------------------------------------------------------------*/
        i_z0 = (ai2_dc_coef[0] + ai2_dc_coef[2]);
        i_z1 = (ai2_dc_coef[0] - ai2_dc_coef[2]);
        i_z2 = (ai2_dc_coef[1] - ai2_dc_coef[3]);
        i_z3 = (ai2_dc_coef[1] + ai2_dc_coef[3]);

        /*-----------------------------------------------------------*/
        /* Scaling and storing the values back                       */
        /*-----------------------------------------------------------*/
        *pi2_coeff_data++ = (WORD16)(((i_z0 + i_z3) * (WORD32)u4_scale_v) >> 5);
        *pi2_coeff_data++ = (WORD16)(((i_z0 - i_z3) * (WORD32)u4_scale_v) >> 5);
        *pi2_coeff_data++ = (WORD16)(((i_z1 + i_z2) * (WORD32)u4_scale_v) >> 5);
        *pi2_coeff_data++ = (WORD16)(((i_z1 - i_z2) * (WORD32)u4_scale_v) >> 5);

        ps_dec->pv_parse_tu_coeff_data = (void *)pi2_coeff_data;

        SET_BIT(ps_cur_mb_info->u1_yuv_dc_block_flag,2);
    }
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_parse_pmb_ref_index_cavlc_range1                         */
/*                                                                           */
/*  Description   : This function does the Cavlc  TEV range =1 parsing of    */
/*                  reference index  for a P MB. Range is 1 when             */
/*                  num_ref_idx_active_minus1 is 0                           */
/*                                                                           */
/*  Inputs        : <What inputs does the function take?>                    */
/*  Globals       : <Does it use any global variables?>                      */
/*  Processing    : <Describe how the function operates - include algorithm  */
/*                  description>                                             */
/*  Outputs       : <What does the function produce?>                        */
/*  Returns       : <What does the function return?>                         */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         19 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
void ih264d_parse_pmb_ref_index_cavlc_range1(UWORD32 u4_num_part, /* Number of partitions in MB      */
                                             dec_bit_stream_t *ps_bitstrm, /* Pointer to bitstream Structure. */
                                             WORD8 *pi1_ref_idx, /* pointer to reference index array */
                                             UWORD32 u4_num_ref_idx_active_minus1 /* Not used for range 1    */
                                             )
{
    UWORD32 u4_i;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 *pu4_bitstream_off = &ps_bitstrm->u4_ofst;
    UNUSED(u4_num_ref_idx_active_minus1);
    for(u4_i = 0; u4_i < u4_num_part; u4_i++)
    {
        UWORD32 u4_ref_idx;
        u4_ref_idx = ih264d_tev_range1(pu4_bitstream_off, pu4_bitstrm_buf);

        /* Storing Reference Idx Information */
        pi1_ref_idx[u4_i] = (WORD8)u4_ref_idx;
    }
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_parse_pmb_ref_index_cavlc                                */
/*                                                                           */
/*  Description   : This function does the Cavlc  TEV range > 1 parsing of   */
/*                  reference index  for a P MB.                             */
/*                  Range > 1 when num_ref_idx_active_minus1 > 0             */
/*                                                                           */
/*  Inputs        : <What inputs does the function take?>                    */
/*  Globals       : <Does it use any global variables?>                      */
/*  Processing    : <Describe how the function operates - include algorithm  */
/*                  description>                                             */
/*  Outputs       : <What does the function produce?>                        */
/*  Returns       : <What does the function return?>                         */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         19 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/

WORD32 ih264d_parse_pmb_ref_index_cavlc(UWORD32 u4_num_part, /* Number of partitions in MB      */
                                      dec_bit_stream_t *ps_bitstrm, /* Pointer to bitstream Structure. */
                                      WORD8 *pi1_ref_idx, /* pointer to reference index array */
                                      UWORD32 u4_num_ref_idx_active_minus1 /* Number of active references - 1  */
                                      )
{
    UWORD32 u4_i;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 *pu4_bitstream_off = &ps_bitstrm->u4_ofst;

    for(u4_i = 0; u4_i < u4_num_part; u4_i++)
    {
        UWORD32 u4_ref_idx;
//Inlined ih264d_uev
        UWORD32 u4_bitstream_offset = *pu4_bitstream_off;
        UWORD32 u4_word, u4_ldz;

        /***************************************************************/
        /* Find leading zeros in next 32 bits                          */
        /***************************************************************/
        NEXTBITS_32(u4_word, u4_bitstream_offset, pu4_bitstrm_buf);
        u4_ldz = CLZ(u4_word);
        /* Flush the ps_bitstrm */
        u4_bitstream_offset += (u4_ldz + 1);
        /* Read the suffix from the ps_bitstrm */
        u4_word = 0;
        if(u4_ldz)
            GETBITS(u4_word, u4_bitstream_offset, pu4_bitstrm_buf, u4_ldz);
        *pu4_bitstream_off = u4_bitstream_offset;
        u4_ref_idx = ((1 << u4_ldz) + u4_word - 1);
//Inlined ih264d_uev

        if(u4_ref_idx > u4_num_ref_idx_active_minus1)
            return ERROR_REF_IDX;

        /* Storing Reference Idx Information */
        pi1_ref_idx[u4_i] = (WORD8)u4_ref_idx;
    }
    return OK;
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_parse_bmb_ref_index_cavlc_range1                         */
/*                                                                           */
/*  Description   : This function does the Cavlc  TEV range =1 parsing of    */
/*                  reference index  for a B MB. Range is 1 when             */
/*                  num_ref_idx_active_minus1 is 0                           */
/*                                                                           */
/*  Inputs        : <What inputs does the function take?>                    */
/*  Globals       : <Does it use any global variables?>                      */
/*  Processing    : <Describe how the function operates - include algorithm  */
/*                  description>                                             */
/*  Outputs       : <What does the function produce?>                        */
/*  Returns       : <What does the function return?>                         */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         19 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
void ih264d_parse_bmb_ref_index_cavlc_range1(UWORD32 u4_num_part, /* Number of partitions in MB      */
                                             dec_bit_stream_t *ps_bitstrm, /* Pointer to bitstream Structure. */
                                             WORD8 *pi1_ref_idx, /* pointer to reference index array */
                                             UWORD32 u4_num_ref_idx_active_minus1 /* Not used for range 1    */
                                             )
{
    UWORD32 u4_i;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 *pu4_bitstream_off = &ps_bitstrm->u4_ofst;
    UNUSED(u4_num_ref_idx_active_minus1);
    for(u4_i = 0; u4_i < u4_num_part; u4_i++)
    {
        if(pi1_ref_idx[u4_i] > -1)
        {
            UWORD32 u4_ref_idx;

            u4_ref_idx = ih264d_tev_range1(pu4_bitstream_off, pu4_bitstrm_buf);

            /* Storing Reference Idx Information */
            pi1_ref_idx[u4_i] = (WORD8)u4_ref_idx;
        }
    }
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_parse_bmb_ref_index_cavlc                                */
/*                                                                           */
/*  Description   : This function does the Cavlc  TEV range > 1 parsing of   */
/*                  reference index  for a B MB.                             */
/*                  Range > 1 when num_ref_idx_active_minus1 > 0             */
/*                                                                           */
/*  Inputs        : <What inputs does the function take?>                    */
/*  Globals       : <Does it use any global variables?>                      */
/*  Processing    : <Describe how the function operates - include algorithm  */
/*                  description>                                             */
/*  Outputs       : <What does the function produce?>                        */
/*  Returns       : <What does the function return?>                         */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         19 09 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
WORD32 ih264d_parse_bmb_ref_index_cavlc(UWORD32 u4_num_part, /* Number of partitions in MB      */
                                      dec_bit_stream_t *ps_bitstrm, /* Pointer to bitstream Structure. */
                                      WORD8 *pi1_ref_idx, /* pointer to reference index array */
                                      UWORD32 u4_num_ref_idx_active_minus1 /* Number of active references - 1  */
                                      )
{
    UWORD32 u4_i;
    UWORD32 *pu4_bitstrm_buf = ps_bitstrm->pu4_buffer;
    UWORD32 *pu4_bitstream_off = &ps_bitstrm->u4_ofst;

    for(u4_i = 0; u4_i < u4_num_part; u4_i++)
    {
        if(pi1_ref_idx[u4_i] > -1)
        {
            UWORD32 u4_ref_idx;
//inlining ih264d_uev
            UWORD32 u4_bitstream_offset = *pu4_bitstream_off;
            UWORD32 u4_word, u4_ldz;

            /***************************************************************/
            /* Find leading zeros in next 32 bits                          */
            /***************************************************************/
            NEXTBITS_32(u4_word, u4_bitstream_offset, pu4_bitstrm_buf);
            u4_ldz = CLZ(u4_word);
            /* Flush the ps_bitstrm */
            u4_bitstream_offset += (u4_ldz + 1);
            /* Read the suffix from the ps_bitstrm */
            u4_word = 0;
            if(u4_ldz)
                GETBITS(u4_word, u4_bitstream_offset, pu4_bitstrm_buf, u4_ldz);
            *pu4_bitstream_off = u4_bitstream_offset;
            u4_ref_idx = ((1 << u4_ldz) + u4_word - 1);
//inlining ih264d_uev
            if(u4_ref_idx > u4_num_ref_idx_active_minus1)
                return ERROR_REF_IDX;

            /* Storing Reference Idx Information */
            pi1_ref_idx[u4_i] = (WORD8)u4_ref_idx;
        }
    }
    return OK;
}
/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_cavlc_parse_8x8block_both_available                      */
/*                                                                           */
/*  Description   : This function does the residual parsing of 4 subblocks   */
/*                  in a 8x8 block when both top and left are available      */
/*                                                                           */
/*  Inputs        : pi2_coeff_block : pointer to residual block where        */
/*                  decoded and inverse scan coefficients are updated        */
/*                                                                           */
/*                  u4_sub_block_strd : indicates the number of sublocks    */
/*                  in a row. It is 4 for luma and 2 for chroma.             */
/*                                                                           */
/*                  u4_isdc : required to indicate 4x4 parse modules if the  */
/*                  current  Mb is I_16x16/chroma DC coded.                  */
/*                                                                           */
/*                  ps_dec : pointer to Decstruct (decoder context)          */
/*                                                                           */
/*                  pu1_top_nnz : top nnz pointer                            */
/*                                                                           */
/*                  pu1_left_nnz : left nnz pointer                          */
/*                                                                           */
/*  Globals       : No                                                       */
/*  Processing    : Parsing for four subblocks in unrolled, top and left nnz */
/*                  are updated on the fly. csbp is set in accordance to     */
/*                  decoded numcoeff for the subblock index in raster order  */
/*                                                                           */
/*  Outputs       : The updated residue buffer, nnzs and csbp current block  */
/*                                                                           */
/*  Returns       : Returns the coded sub block pattern csbp for the block   */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         09 10 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
WORD32 ih264d_cavlc_parse_8x8block_both_available(WORD16 *pi2_coeff_block,
                                                  UWORD32 u4_sub_block_strd,
                                                  UWORD32 u4_isdc,
                                                  dec_struct_t * ps_dec,
                                                  UWORD8 *pu1_top_nnz,
                                                  UWORD8 *pu1_left_nnz,
                                                  UWORD8 u1_tran_form8x8,
                                                  UWORD8 u1_mb_field_decodingflag,
                                                  UWORD32 *pu4_csbp)
{
    UWORD32 u4_num_coeff, u4_n, u4_subblock_coded;
    UWORD32 u4_top0, u4_top1;
    UWORD32 *pu4_dummy;
    WORD32 (**pf_cavlc_parse4x4coeff)(WORD16 *pi2_coeff_block,
                                      UWORD32 u4_isdc,
                                      WORD32 u4_n,
                                      struct _DecStruct *ps_dec,
                                      UWORD32 *pu4_dummy) =
                                      ps_dec->pf_cavlc_parse4x4coeff;
    UWORD32 u4_idx = 0;
    UWORD8 *puc_temp;
    WORD32 ret;

    *pu4_csbp = 0;
    /* need to change the inverse scan matrices here */
    puc_temp = ps_dec->pu1_inv_scan;

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 0                    */
    /*------------------------------------------------------*/
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[0];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[0];
        }
    }
    u4_n = (pu1_top_nnz[0] + pu1_left_nnz[0] + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    u4_top0 = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 1                    */
    /*------------------------------------------------------*/
    u4_idx++;
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[1];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[1];
        }
    }
    else
    {
        pi2_coeff_block += NUM_COEFFS_IN_4x4BLK;
    }
    u4_n = (pu1_top_nnz[1] + u4_num_coeff + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    u4_top1 = pu1_left_nnz[0] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 2                    */
    /*------------------------------------------------------*/
    u4_idx += (u4_sub_block_strd - 1);
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[2];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[2];
        }
    }
    else
    {
        pi2_coeff_block += ((u4_sub_block_strd - 1) * NUM_COEFFS_IN_4x4BLK);
    }
    u4_n = (u4_top0 + pu1_left_nnz[1] + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    pu1_top_nnz[0] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 3                    */
    /*------------------------------------------------------*/
    u4_idx++;
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[3];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[3];
        }
    }
    else
    {
        pi2_coeff_block += NUM_COEFFS_IN_4x4BLK;
    }
    u4_n = (u4_top1 + u4_num_coeff + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    pu1_top_nnz[1] = pu1_left_nnz[1] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    ps_dec->pu1_inv_scan = puc_temp;

    return OK;
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_cavlc_parse_8x8block_left_available                      */
/*                                                                           */
/*  Description   : This function does the residual parsing of 4 subblocks   */
/*                  in a 8x8 block when only left is available for block     */
/*                                                                           */
/*  Inputs        : pi2_coeff_block : pointer to residual block where        */
/*                  decoded and inverse scan coefficients are updated        */
/*                                                                           */
/*                  u4_sub_block_strd : indicates the number of sublocks    */
/*                  in a row. It is 4 for luma and 2 for chroma.             */
/*                                                                           */
/*                  u4_isdc : required to indicate 4x4 parse modules if the  */
/*                  current  Mb is I_16x16/chroma DC coded.                  */
/*                                                                           */
/*                  ps_dec : pointer to Decstruct (decoder context)          */
/*                                                                           */
/*                  pu1_top_nnz : top nnz pointer                            */
/*                                                                           */
/*                  pu1_left_nnz : left nnz pointer                          */
/*                                                                           */
/*  Globals       : No                                                       */
/*  Processing    : Parsing for four subblocks in unrolled, top and left nnz */
/*                  are updated on the fly. csbp is set in accordance to     */
/*                  decoded numcoeff for the subblock index in raster order  */
/*                                                                           */
/*  Outputs       : The updated residue buffer, nnzs and csbp current block  */
/*                                                                           */
/*  Returns       : Returns the coded sub block pattern csbp for the block   */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         09 10 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
WORD32 ih264d_cavlc_parse_8x8block_left_available(WORD16 *pi2_coeff_block,
                                                  UWORD32 u4_sub_block_strd,
                                                  UWORD32 u4_isdc,
                                                  dec_struct_t * ps_dec,
                                                  UWORD8 *pu1_top_nnz,
                                                  UWORD8 *pu1_left_nnz,
                                                  UWORD8 u1_tran_form8x8,
                                                  UWORD8 u1_mb_field_decodingflag,
                                                  UWORD32 *pu4_csbp)
{
    UWORD32 u4_num_coeff, u4_n, u4_subblock_coded;
    UWORD32 u4_top0, u4_top1;
    UWORD32 *pu4_dummy;
    WORD32 (**pf_cavlc_parse4x4coeff)(WORD16 *pi2_coeff_block,
                                      UWORD32 u4_isdc,
                                      WORD32 u4_n,
                                      struct _DecStruct *ps_dec,
                                      UWORD32 *pu4_dummy) =
                                      ps_dec->pf_cavlc_parse4x4coeff;
    UWORD32 u4_idx = 0;
    UWORD8 *puc_temp;
    WORD32 ret;

    *pu4_csbp = 0;
    puc_temp = ps_dec->pu1_inv_scan;

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 0                    */
    /*------------------------------------------------------*/
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[0];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[0];
        }
    }
    u4_n = pu1_left_nnz[0];
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    u4_top0 = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 1                    */
    /*------------------------------------------------------*/
    u4_idx++;
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[1];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[1];
        }
    }
    else
    {
        pi2_coeff_block += NUM_COEFFS_IN_4x4BLK;
    }
    u4_n = u4_num_coeff;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    u4_top1 = pu1_left_nnz[0] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 2                    */
    /*------------------------------------------------------*/
    u4_idx += (u4_sub_block_strd - 1);
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[2];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[2];
        }
    }
    else
    {
        pi2_coeff_block += ((u4_sub_block_strd - 1) * NUM_COEFFS_IN_4x4BLK);
    }
    u4_n = (u4_top0 + pu1_left_nnz[1] + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    pu1_top_nnz[0] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 3                    */
    /*------------------------------------------------------*/
    u4_idx++;
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[3];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[3];
        }
    }
    else
    {
        pi2_coeff_block += NUM_COEFFS_IN_4x4BLK;
    }
    u4_n = (u4_top1 + u4_num_coeff + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    pu1_top_nnz[1] = pu1_left_nnz[1] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    ps_dec->pu1_inv_scan = puc_temp;

    return OK;
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_cavlc_parse_8x8block_top_available                       */
/*                                                                           */
/*  Description   : This function does the residual parsing of 4 subblocks   */
/*                  in a 8x8 block when only top is available for block      */
/*                                                                           */
/*  Inputs        : pi2_coeff_block : pointer to residual block where        */
/*                  decoded and inverse scan coefficients are updated        */
/*                                                                           */
/*                  u4_sub_block_strd : indicates the number of sublocks    */
/*                  in a row. It is 4 for luma and 2 for chroma.             */
/*                                                                           */
/*                  u4_isdc : required to indicate 4x4 parse modules if the  */
/*                  current  Mb is I_16x16/chroma DC coded.                  */
/*                                                                           */
/*                  ps_dec : pointer to Decstruct (decoder context)          */
/*                                                                           */
/*                  pu1_top_nnz : top nnz pointer                            */
/*                                                                           */
/*                  pu1_left_nnz : left nnz pointer                          */
/*                                                                           */
/*  Globals       : No                                                       */
/*  Processing    : Parsing for four subblocks in unrolled, top and left nnz */
/*                  are updated on the fly. csbp is set in accordance to     */
/*                  decoded numcoeff for the subblock index in raster order  */
/*                                                                           */
/*  Outputs       : The updated residue buffer, nnzs and csbp current block  */
/*                                                                           */
/*  Returns       : Returns the coded sub block pattern csbp for the block   */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         09 10 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
WORD32 ih264d_cavlc_parse_8x8block_top_available(WORD16 *pi2_coeff_block,
                                                 UWORD32 u4_sub_block_strd,
                                                 UWORD32 u4_isdc,
                                                 dec_struct_t * ps_dec,
                                                 UWORD8 *pu1_top_nnz,
                                                 UWORD8 *pu1_left_nnz,
                                                 UWORD8 u1_tran_form8x8,
                                                 UWORD8 u1_mb_field_decodingflag,
                                                 UWORD32 *pu4_csbp)
{
    UWORD32 u4_num_coeff, u4_n, u4_subblock_coded;
    UWORD32 u4_top0, u4_top1;
    UWORD32 *pu4_dummy;
    WORD32 (**pf_cavlc_parse4x4coeff)(WORD16 *pi2_coeff_block,
                                      UWORD32 u4_isdc,
                                      WORD32 u4_n,
                                      struct _DecStruct *ps_dec,
                                      UWORD32 *pu4_dummy) =
                                      ps_dec->pf_cavlc_parse4x4coeff;
    UWORD32 u4_idx = 0;
    UWORD8 *puc_temp;
    WORD32 ret;

    *pu4_csbp = 0;
    puc_temp = ps_dec->pu1_inv_scan;

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 0                    */
    /*------------------------------------------------------*/
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[0];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[0];
        }
    }
    u4_n = pu1_top_nnz[0];
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    u4_top0 = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 1                    */
    /*------------------------------------------------------*/
    u4_idx++;
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[1];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[1];
        }
    }
    else
    {
        pi2_coeff_block += NUM_COEFFS_IN_4x4BLK;
    }
    u4_n = (pu1_top_nnz[1] + u4_num_coeff + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    u4_top1 = pu1_left_nnz[0] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 2                    */
    /*------------------------------------------------------*/
    u4_idx += (u4_sub_block_strd - 1);
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[2];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[2];
        }
    }
    else
    {
        pi2_coeff_block += ((u4_sub_block_strd - 1) * NUM_COEFFS_IN_4x4BLK);
    }
    u4_n = u4_top0;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    pu1_top_nnz[0] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 3                    */
    /*------------------------------------------------------*/
    u4_idx++;
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[3];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[3];
        }
    }
    else
    {
        pi2_coeff_block += NUM_COEFFS_IN_4x4BLK;
    }
    u4_n = (u4_top1 + u4_num_coeff + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    pu1_top_nnz[1] = pu1_left_nnz[1] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    ps_dec->pu1_inv_scan = puc_temp;

    return OK;
}

/*****************************************************************************/
/*                                                                           */
/*  Function Name : ih264d_cavlc_parse_8x8block_none_available                      */
/*                                                                           */
/*  Description   : This function does the residual parsing of 4 subblocks   */
/*                  in a 8x8 block when none of the neigbours are available  */
/*                                                                           */
/*  Inputs        : pi2_coeff_block : pointer to residual block where        */
/*                  decoded and inverse scan coefficients are updated        */
/*                                                                           */
/*                  u4_sub_block_strd : indicates the number of sublocks    */
/*                  in a row. It is 4 for luma and 2 for chroma.             */
/*                                                                           */
/*                  u4_isdc : required to indicate 4x4 parse modules if the  */
/*                  current  Mb is I_16x16/chroma DC coded.                  */
/*                                                                           */
/*                  ps_dec : pointer to Decstruct (decoder context)          */
/*                                                                           */
/*                  pu1_top_nnz : top nnz pointer                            */
/*                                                                           */
/*                  pu1_left_nnz : left nnz pointer                          */
/*                                                                           */
/*  Globals       : No                                                       */
/*  Processing    : Parsing for four subblocks in unrolled, top and left nnz */
/*                  are updated on the fly. csbp is set in accordance to     */
/*                  decoded numcoeff for the subblock index in raster order  */
/*                                                                           */
/*  Outputs       : The updated residue buffer, nnzs and csbp current block  */
/*                                                                           */
/*  Returns       : Returns the coded sub block pattern csbp for the block   */
/*                                                                           */
/*  Issues        : <List any issues or problems with this function>         */
/*                                                                           */
/*  Revision History:                                                        */
/*                                                                           */
/*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
/*         09 10 2008   Jay          Draft                                   */
/*                                                                           */
/*****************************************************************************/
WORD32 ih264d_cavlc_parse_8x8block_none_available(WORD16 *pi2_coeff_block,
                                                  UWORD32 u4_sub_block_strd,
                                                  UWORD32 u4_isdc,
                                                  dec_struct_t * ps_dec,
                                                  UWORD8 *pu1_top_nnz,
                                                  UWORD8 *pu1_left_nnz,
                                                  UWORD8 u1_tran_form8x8,
                                                  UWORD8 u1_mb_field_decodingflag,
                                                  UWORD32 *pu4_csbp)
{
    UWORD32 u4_num_coeff, u4_n, u4_subblock_coded;
    UWORD32 u4_top0, u4_top1;
    UWORD32 *pu4_dummy;
    WORD32 (**pf_cavlc_parse4x4coeff)(WORD16 *pi2_coeff_block,
                                      UWORD32 u4_isdc,
                                      WORD32 u4_n,
                                      struct _DecStruct *ps_dec,
                                      UWORD32 *pu4_dummy) =
                                      ps_dec->pf_cavlc_parse4x4coeff;
    UWORD32 u4_idx = 0;
    UWORD8 *puc_temp;
    WORD32 ret;

    *pu4_csbp = 0;
    puc_temp = ps_dec->pu1_inv_scan;

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 0                    */
    /*------------------------------------------------------*/
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[0];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[0];
        }
    }
    ret = pf_cavlc_parse4x4coeff[0](pi2_coeff_block, u4_isdc, 0,
                                    ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    u4_top0 = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 1                    */
    /*------------------------------------------------------*/
    u4_idx++;
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[1];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[1];
        }
    }
    else
    {
        pi2_coeff_block += NUM_COEFFS_IN_4x4BLK;
    }
    u4_n = u4_num_coeff;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    u4_top1 = pu1_left_nnz[0] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 2                    */
    /*------------------------------------------------------*/
    u4_idx += (u4_sub_block_strd - 1);
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[2];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[2];
        }
    }
    else
    {
        pi2_coeff_block += ((u4_sub_block_strd - 1) * NUM_COEFFS_IN_4x4BLK);
    }
    u4_n = u4_top0;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    pu1_top_nnz[0] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    /*------------------------------------------------------*/
    /* Residual 4x4 decoding: SubBlock 3                    */
    /*------------------------------------------------------*/
    u4_idx++;
    if(u1_tran_form8x8)
    {
        if(!u1_mb_field_decodingflag)
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[3];
        }
        else
        {
            ps_dec->pu1_inv_scan =
                            (UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[3];
        }
    }
    else
    {
        pi2_coeff_block += NUM_COEFFS_IN_4x4BLK;
    }
    u4_n = (u4_top1 + u4_num_coeff + 1) >> 1;
    ret = pf_cavlc_parse4x4coeff[(u4_n > 7)](pi2_coeff_block, u4_isdc,
                                             u4_n, ps_dec, &u4_num_coeff);
    if(ret != OK)
        return ret;

    pu1_top_nnz[1] = pu1_left_nnz[1] = u4_num_coeff;
    u4_subblock_coded = (u4_num_coeff != 0);
    INSERT_BIT(*pu4_csbp, u4_idx, u4_subblock_coded);

    ps_dec->pu1_inv_scan = puc_temp;

    return OK;
}

/*!
 **************************************************************************
 * \if Function name : ih264d_parse_residual4x4_cavlc \endif
 *
 * \brief
 *    This function parses CAVLC syntax of a Luma and Chroma AC Residuals.
 *
 * \return
 *    0 on Success and Error code otherwise
 **************************************************************************
 */

WORD32 ih264d_parse_residual4x4_cavlc(dec_struct_t * ps_dec,
                                      dec_mb_info_t *ps_cur_mb_info,
                                      UWORD8 u1_offset)
{
    UWORD8 u1_cbp = ps_cur_mb_info->u1_cbp;
    UWORD16 ui16_csbp = 0;
    UWORD32 u4_nbr_avl;
    WORD16 *pi2_residual_buf;

    UWORD8 u1_is_top_mb_avail;
    UWORD8 u1_is_left_mb_avail;

    UWORD8 *pu1_top_nnz = ps_cur_mb_info->ps_curmb->pu1_nnz_y;
    UWORD8 *pu1_left_nnz = ps_dec->pu1_left_nnz_y;
    WORD16 *pi2_coeff_block = NULL;
    UWORD32 *pu4_dummy;
    WORD32 ret;

    WORD32 (**pf_cavlc_parse_8x8block)(WORD16 *pi2_coeff_block,
                                       UWORD32 u4_sub_block_strd,
                                       UWORD32 u4_isdc,
                                       struct _DecStruct *ps_dec,
                                       UWORD8 *pu1_top_nnz,
                                       UWORD8 *pu1_left_nnz,
                                       UWORD8 u1_tran_form8x8,
                                       UWORD8 u1_mb_field_decodingflag,
                                       UWORD32 *pu4_dummy) = ps_dec->pf_cavlc_parse_8x8block;


    {
        UWORD8 uc_temp = ps_dec->u1_mb_ngbr_availablity;
        u1_is_top_mb_avail = BOOLEAN(uc_temp & TOP_MB_AVAILABLE_MASK);
        u1_is_left_mb_avail = BOOLEAN(uc_temp & LEFT_MB_AVAILABLE_MASK);
        u4_nbr_avl = (u1_is_top_mb_avail << 1) | u1_is_left_mb_avail;
    }

    ps_cur_mb_info->u1_qp_div6 = ps_dec->u1_qp_y_div6;
    ps_cur_mb_info->u1_qp_rem6 = ps_dec->u1_qp_y_rem6;
    ps_cur_mb_info->u1_qpc_div6 = ps_dec->u1_qp_u_div6;
    ps_cur_mb_info->u1_qpc_rem6 = ps_dec->u1_qp_u_rem6;
    ps_cur_mb_info->u1_qpcr_div6 = ps_dec->u1_qp_v_div6;
    ps_cur_mb_info->u1_qpcr_rem6 = ps_dec->u1_qp_v_rem6;

    if(u1_cbp & 0xf)
    {
        pu1_top_nnz[0] = ps_cur_mb_info->ps_top_mb->pu1_nnz_y[0];
        pu1_top_nnz[1] = ps_cur_mb_info->ps_top_mb->pu1_nnz_y[1];
        pu1_top_nnz[2] = ps_cur_mb_info->ps_top_mb->pu1_nnz_y[2];
        pu1_top_nnz[3] = ps_cur_mb_info->ps_top_mb->pu1_nnz_y[3];

        /*******************************************************************/
        /* Block 0 residual decoding, check cbp and proceed (subblock = 0) */
        /*******************************************************************/
        if(!(u1_cbp & 0x1))
        {
            *(UWORD16 *)(pu1_top_nnz) = 0;
            *(UWORD16 *)(pu1_left_nnz) = 0;

        }
        else
        {
            UWORD32 u4_temp;
            ret = pf_cavlc_parse_8x8block[u4_nbr_avl](
                        pi2_coeff_block, 4, u1_offset, ps_dec, pu1_top_nnz,
                        pu1_left_nnz, ps_cur_mb_info->u1_tran_form8x8,
                        ps_cur_mb_info->u1_mb_field_decodingflag, &u4_temp);
            if(ret != OK)
                return ret;
            ui16_csbp = u4_temp;
        }

        /*******************************************************************/
        /* Block 1 residual decoding, check cbp and proceed (subblock = 2) */
        /*******************************************************************/
        if(ps_cur_mb_info->u1_tran_form8x8)
        {
            pi2_coeff_block += 64;
        }
        else
        {
            pi2_coeff_block += (2 * NUM_COEFFS_IN_4x4BLK);
        }

        if(!(u1_cbp & 0x2))
        {
            *(UWORD16 *)(pu1_top_nnz + 2) = 0;
            *(UWORD16 *)(pu1_left_nnz) = 0;
        }
        else
        {
            UWORD32 u4_temp = (u4_nbr_avl | 0x1);
            ret = pf_cavlc_parse_8x8block[u4_temp](
                        pi2_coeff_block, 4, u1_offset, ps_dec,
                        (pu1_top_nnz + 2), pu1_left_nnz,
                        ps_cur_mb_info->u1_tran_form8x8,
                        ps_cur_mb_info->u1_mb_field_decodingflag, &u4_temp);
            if(ret != OK)
                return ret;
            ui16_csbp |= (u4_temp << 2);
        }

        /*******************************************************************/
        /* Block 2 residual decoding, check cbp and proceed (subblock = 8) */
        /*******************************************************************/
        if(ps_cur_mb_info->u1_tran_form8x8)
        {
            pi2_coeff_block += 64;
        }
        else
        {
            pi2_coeff_block += (6 * NUM_COEFFS_IN_4x4BLK);
        }

        if(!(u1_cbp & 0x4))
        {
            *(UWORD16 *)(pu1_top_nnz) = 0;
            *(UWORD16 *)(pu1_left_nnz + 2) = 0;
        }
        else
        {
            UWORD32 u4_temp = (u4_nbr_avl | 0x2);
            ret = pf_cavlc_parse_8x8block[u4_temp](
                        pi2_coeff_block, 4, u1_offset, ps_dec, pu1_top_nnz,
                        (pu1_left_nnz + 2), ps_cur_mb_info->u1_tran_form8x8,
                        ps_cur_mb_info->u1_mb_field_decodingflag, &u4_temp);
            if(ret != OK)
                return ret;
            ui16_csbp |= (u4_temp << 8);
        }

        /*******************************************************************/
        /* Block 3 residual decoding, check cbp and proceed (subblock = 10)*/
        /*******************************************************************/
        if(ps_cur_mb_info->u1_tran_form8x8)
        {
            pi2_coeff_block += 64;
        }
        else
        {
            pi2_coeff_block += (2 * NUM_COEFFS_IN_4x4BLK);
        }

        if(!(u1_cbp & 0x8))
        {
            *(UWORD16 *)(pu1_top_nnz + 2) = 0;
            *(UWORD16 *)(pu1_left_nnz + 2) = 0;
        }
        else
        {
            UWORD32 u4_temp;
            ret = pf_cavlc_parse_8x8block[0x3](
                        pi2_coeff_block, 4, u1_offset, ps_dec,
                        (pu1_top_nnz + 2), (pu1_left_nnz + 2),
                        ps_cur_mb_info->u1_tran_form8x8,
                        ps_cur_mb_info->u1_mb_field_decodingflag, &u4_temp);
            if(ret != OK)
                return ret;
            ui16_csbp |= (u4_temp << 10);
        }
    }
    else
    {
        *(UWORD32 *)(pu1_top_nnz) = 0;
        *(UWORD32 *)(pu1_left_nnz) = 0;
    }

    ps_cur_mb_info->u2_luma_csbp = ui16_csbp;
    ps_cur_mb_info->ps_curmb->u2_luma_csbp = ui16_csbp;

    {
        UWORD16 u2_chroma_csbp = 0;
        ps_cur_mb_info->u2_chroma_csbp = 0;
        pu1_top_nnz = ps_cur_mb_info->ps_curmb->pu1_nnz_uv;
        pu1_left_nnz = ps_dec->pu1_left_nnz_uv;

        u1_cbp >>= 4;
        /*--------------------------------------------------------------------*/
        /* if Chroma Component not present OR no ac values present            */
        /* Set the values of N to zero                                        */
        /*--------------------------------------------------------------------*/
        if(u1_cbp == CBPC_ALLZERO || u1_cbp == CBPC_ACZERO)
        {
            *(UWORD32 *)(pu1_top_nnz) = 0;
            *(UWORD32 *)(pu1_left_nnz) = 0;
        }

        if(u1_cbp == CBPC_ALLZERO)
        {
            return (0);
        }
        /*--------------------------------------------------------------------*/
        /* Decode Chroma DC values                                            */
        /*--------------------------------------------------------------------*/
        {
            WORD32 u4_scale_u;
            WORD32 u4_scale_v;
            WORD32 i4_mb_inter_inc;
            u4_scale_u = ps_dec->pu2_quant_scale_u[0] << ps_dec->u1_qp_u_div6;
            u4_scale_v = ps_dec->pu2_quant_scale_v[0] << ps_dec->u1_qp_v_div6;
            i4_mb_inter_inc = (!((ps_cur_mb_info->ps_curmb->u1_mb_type == I_4x4_MB)
                            || (ps_cur_mb_info->ps_curmb->u1_mb_type == I_16x16_MB)))
                            * 3;

            if(ps_dec->s_high_profile.u1_scaling_present)
            {
                u4_scale_u *=
                                ps_dec->s_high_profile.i2_scalinglist4x4[i4_mb_inter_inc
                                                + 1][0];
                u4_scale_v *=
                                ps_dec->s_high_profile.i2_scalinglist4x4[i4_mb_inter_inc
                                                + 2][0];

            }
            else
            {
                u4_scale_u <<= 4;
                u4_scale_v <<= 4;
            }

            ih264d_cavlc_parse_chroma_dc(ps_cur_mb_info,pi2_coeff_block, ps_dec->ps_bitstrm,
                                         u4_scale_u, u4_scale_v,
                                         i4_mb_inter_inc);
        }

        if(u1_cbp == CBPC_ACZERO)
            return (0);

        pu1_top_nnz[0] = ps_cur_mb_info->ps_top_mb->pu1_nnz_uv[0];
        pu1_top_nnz[1] = ps_cur_mb_info->ps_top_mb->pu1_nnz_uv[1];
        pu1_top_nnz[2] = ps_cur_mb_info->ps_top_mb->pu1_nnz_uv[2];
        pu1_top_nnz[3] = ps_cur_mb_info->ps_top_mb->pu1_nnz_uv[3];
        /*--------------------------------------------------------------------*/
        /* Decode Chroma AC values                                            */
        /*--------------------------------------------------------------------*/
        {
            UWORD32 u4_temp;
            /*****************************************************************/
            /* U Block  residual decoding, check cbp and proceed (subblock=0)*/
            /*****************************************************************/
            ret = pf_cavlc_parse_8x8block[u4_nbr_avl](
                        pi2_coeff_block, 2, 1, ps_dec, pu1_top_nnz,
                        pu1_left_nnz, 0, 0, &u4_temp);
            if(ret != OK)
                return ret;
            u2_chroma_csbp = u4_temp;

            pi2_coeff_block += MB_CHROM_SIZE;
            /*****************************************************************/
            /* V Block  residual decoding, check cbp and proceed (subblock=1)*/
            /*****************************************************************/
            ret = pf_cavlc_parse_8x8block[u4_nbr_avl](pi2_coeff_block, 2, 1,
                                                      ps_dec,
                                                      (pu1_top_nnz + 2),
                                                      (pu1_left_nnz + 2), 0,
                                                      0, &u4_temp);
            if(ret != OK)
                return ret;
            u2_chroma_csbp |= (u4_temp << 4);
        }

        ps_cur_mb_info->u2_chroma_csbp = u2_chroma_csbp;
    }
    return OK;
}