mirror of
https://github.com/cemu-project/Cemu.git
synced 2025-01-10 00:49:22 +01:00
2023 lines
78 KiB
C
2023 lines
78 KiB
C
/******************************************************************************
|
|
*
|
|
* Copyright (C) 2015 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at:
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*
|
|
*****************************************************************************
|
|
* Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
|
|
*/
|
|
/*!
|
|
**************************************************************************
|
|
* \file ih264d_process_intra_mb.c
|
|
*
|
|
* \brief
|
|
* Contains routines that decode an I slice type
|
|
*
|
|
* Detailed_description
|
|
*
|
|
* \date
|
|
* 07/07/2003
|
|
*
|
|
* \author NS
|
|
**************************************************************************
|
|
*/
|
|
|
|
#include <string.h>
|
|
#include "ih264d_bitstrm.h"
|
|
#include "ih264d_defs.h"
|
|
#include "ih264d_debug.h"
|
|
#include "ih264d_tables.h"
|
|
#include "ih264d_structs.h"
|
|
#include "ih264d_defs.h"
|
|
#include "ih264d_parse_cavlc.h"
|
|
#include "ih264d_mb_utils.h"
|
|
#include "ih264d_parse_slice.h"
|
|
#include "ih264d_process_intra_mb.h"
|
|
#include "ih264d_error_handler.h"
|
|
#include "ih264d_quant_scaling.h"
|
|
#include "ih264d_tables.h"
|
|
|
|
/*!
|
|
**************************************************************************
|
|
* \if Function name : ih264d_itrans_recon_luma_dc \endif
|
|
*
|
|
* \brief
|
|
* This function does InvTransform, scaling and reconstruction of Luma DC.
|
|
*
|
|
* \return
|
|
* 0 on Success and Error code otherwise
|
|
**************************************************************************
|
|
*/
|
|
void ih264d_itrans_recon_luma_dc(dec_struct_t *ps_dec,
|
|
WORD16* pi2_src,
|
|
WORD16* pi2_coeff_block,
|
|
const UWORD16 *pu2_weigh_mat)
|
|
{
|
|
WORD32 i;
|
|
WORD16 pi2_out[16];
|
|
WORD32 pi4_tmp[16];
|
|
WORD16 *pi2_out_ptr = &pi2_out[0];
|
|
PROFILE_DISABLE_IQ_IT_RECON_RETURN()
|
|
ps_dec->pf_ihadamard_scaling_4x4(pi2_src, pi2_out,
|
|
ps_dec->pu2_quant_scale_y, pu2_weigh_mat,
|
|
ps_dec->u1_qp_y_div6, pi4_tmp);
|
|
for(i = 0; i < 4; i++)
|
|
{
|
|
pi2_coeff_block[0] = pi2_out_ptr[0];
|
|
pi2_coeff_block[4 * 16] = pi2_out_ptr[4];
|
|
pi2_coeff_block[8 * 16] = pi2_out_ptr[8];
|
|
pi2_coeff_block[12 * 16] = pi2_out_ptr[12];
|
|
|
|
pi2_out_ptr++; /* Point to next column */
|
|
pi2_coeff_block += 16;
|
|
}
|
|
}
|
|
/*!
|
|
**************************************************************************
|
|
* \if Function name : ih264d_read_intra_pred_modes \endif
|
|
*
|
|
* \brief
|
|
* Reads the intra pred mode related values of I4x4 MB from bitstream.
|
|
*
|
|
* This function will read the prev intra pred mode flags and
|
|
* stores it in pu1_prev_intra4x4_pred_mode_flag. If the u4_flag
|
|
* indicates that most probable mode is not intra pred mode, then
|
|
* the rem_intra4x4_pred_mode is read and stored in
|
|
* pu1_rem_intra4x4_pred_mode array.
|
|
*
|
|
*
|
|
* \return
|
|
* 0 on success and Error code otherwise
|
|
*
|
|
**************************************************************************
|
|
*/
|
|
WORD32 ih264d_read_intra_pred_modes(dec_struct_t * ps_dec,
|
|
UWORD8 * pu1_prev_intra4x4_pred_mode_flag,
|
|
UWORD8 * pu1_rem_intra4x4_pred_mode,
|
|
UWORD32 u4_trans_form8x8)
|
|
{
|
|
WORD32 i4x4_luma_blk_idx = 0, i8x8_luma_blk_idx = 0;
|
|
|
|
dec_bit_stream_t * ps_bitstrm = ps_dec->ps_bitstrm;
|
|
|
|
if(!u4_trans_form8x8)
|
|
{
|
|
for(i4x4_luma_blk_idx = 0; i4x4_luma_blk_idx < 16; ++i4x4_luma_blk_idx)
|
|
{
|
|
UWORD32 u4_temp;
|
|
SWITCHOFFTRACE;
|
|
|
|
GETBIT(u4_temp, ps_bitstrm->u4_ofst, ps_bitstrm->pu4_buffer);
|
|
*pu1_prev_intra4x4_pred_mode_flag = (UWORD8)u4_temp;
|
|
if(!(*pu1_prev_intra4x4_pred_mode_flag))
|
|
{
|
|
GETBITS(u4_temp, ps_bitstrm->u4_ofst, ps_bitstrm->pu4_buffer, 3);
|
|
|
|
*(pu1_rem_intra4x4_pred_mode) = (UWORD8)u4_temp;
|
|
}
|
|
|
|
pu1_prev_intra4x4_pred_mode_flag++;
|
|
pu1_rem_intra4x4_pred_mode++;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
/**********************************************************************/
|
|
/* prev_intra4x4_pred_modes to be interpreted as */
|
|
/* prev_intra8x8_pred_modes in case of transform 8x8 */
|
|
/**********************************************************************/
|
|
for(i8x8_luma_blk_idx = 0; i8x8_luma_blk_idx < 4; i8x8_luma_blk_idx++)
|
|
{
|
|
UWORD32 u4_temp;
|
|
GETBIT(u4_temp, ps_bitstrm->u4_ofst, ps_bitstrm->pu4_buffer);
|
|
*pu1_prev_intra4x4_pred_mode_flag = (UWORD8)u4_temp;
|
|
if(!(*pu1_prev_intra4x4_pred_mode_flag))
|
|
{
|
|
GETBITS(u4_temp, ps_bitstrm->u4_ofst, ps_bitstrm->pu4_buffer, 3);
|
|
|
|
(*pu1_rem_intra4x4_pred_mode) = (UWORD8)u4_temp;
|
|
}
|
|
pu1_prev_intra4x4_pred_mode_flag++;
|
|
pu1_rem_intra4x4_pred_mode++;
|
|
}
|
|
}
|
|
return (0);
|
|
}
|
|
WORD32 ih264d_unpack_coeff4x4_4x4blk(dec_struct_t * ps_dec,
|
|
WORD16 *pi2_out_coeff_data,
|
|
UWORD8 *pu1_inv_scan)
|
|
{
|
|
tu_sblk4x4_coeff_data_t *ps_tu_4x4 = (tu_sblk4x4_coeff_data_t *)ps_dec->pv_proc_tu_coeff_data;
|
|
UWORD16 u2_sig_coeff_map = ps_tu_4x4->u2_sig_coeff_map;
|
|
WORD32 idx = 0;
|
|
WORD16 *pi2_coeff_data = &ps_tu_4x4->ai2_level[0];
|
|
WORD32 dc_only_flag = 0;
|
|
WORD32 num_coeff = 0;
|
|
|
|
PROFILE_DISABLE_UNPACK_LUMA()
|
|
while(u2_sig_coeff_map)
|
|
{
|
|
idx = CLZ(u2_sig_coeff_map);
|
|
|
|
idx = 31 - idx;
|
|
RESET_BIT(u2_sig_coeff_map,idx);
|
|
|
|
idx = pu1_inv_scan[idx];
|
|
pi2_out_coeff_data[idx] = *pi2_coeff_data++;
|
|
num_coeff++;
|
|
}
|
|
|
|
if((num_coeff == 1) && (idx == 0))
|
|
{
|
|
dc_only_flag = 1;
|
|
}
|
|
|
|
{
|
|
WORD32 offset;
|
|
offset = (UWORD8 *)pi2_coeff_data - (UWORD8 *)ps_tu_4x4;
|
|
offset = ALIGN4(offset);
|
|
ps_dec->pv_proc_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_proc_tu_coeff_data + offset);
|
|
}
|
|
|
|
return dc_only_flag;
|
|
}
|
|
|
|
UWORD32 ih264d_unpack_coeff4x4_8x8blk(dec_struct_t * ps_dec,
|
|
dec_mb_info_t * ps_cur_mb_info,
|
|
UWORD16 ui2_luma_csbp,
|
|
WORD16 *pi2_out_coeff_data)
|
|
{
|
|
UWORD8 *pu1_inv_scan;
|
|
UWORD8 u1_mb_field_decoding_flag = ps_cur_mb_info->u1_mb_field_decodingflag;
|
|
UWORD8 u1_field_coding_flag = ps_cur_mb_info->ps_curmb->u1_mb_fld;
|
|
UWORD32 u4_luma_dc_only_csbp = 0;
|
|
WORD32 dc_only_flag = 0;
|
|
|
|
PROFILE_DISABLE_UNPACK_LUMA()
|
|
if(u1_field_coding_flag || u1_mb_field_decoding_flag)
|
|
{
|
|
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan_fld;
|
|
}
|
|
else
|
|
{
|
|
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan;
|
|
}
|
|
|
|
// sub 0
|
|
if(ui2_luma_csbp & 0x1)
|
|
{
|
|
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
|
|
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
|
|
INSERT_BIT(u4_luma_dc_only_csbp, 0, dc_only_flag);
|
|
}
|
|
|
|
pi2_out_coeff_data += 16;
|
|
// sub 1
|
|
if(ui2_luma_csbp & 0x2)
|
|
{
|
|
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
|
|
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
INSERT_BIT(u4_luma_dc_only_csbp, 1, dc_only_flag);
|
|
}
|
|
|
|
pi2_out_coeff_data += 16 + 32;
|
|
// sub 2
|
|
if(ui2_luma_csbp & 0x10)
|
|
{
|
|
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
|
|
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
INSERT_BIT(u4_luma_dc_only_csbp, 4, dc_only_flag);
|
|
}
|
|
|
|
pi2_out_coeff_data += 16;
|
|
// sub 3
|
|
if(ui2_luma_csbp & 0x20)
|
|
{
|
|
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
|
|
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
INSERT_BIT(u4_luma_dc_only_csbp, 5, dc_only_flag);
|
|
}
|
|
return u4_luma_dc_only_csbp;
|
|
}
|
|
WORD32 ih264d_unpack_coeff8x8_8x8blk_cavlc(dec_struct_t * ps_dec,
|
|
dec_mb_info_t * ps_cur_mb_info,
|
|
UWORD16 ui2_luma_csbp,
|
|
WORD16 *pi2_out_coeff_data)
|
|
{
|
|
UWORD8 *pu1_inv_scan;
|
|
UWORD8 u1_mb_field_decoding_flag = ps_cur_mb_info->u1_mb_field_decodingflag;
|
|
UWORD8 u1_field_coding_flag = ps_cur_mb_info->ps_curmb->u1_mb_fld;
|
|
WORD32 dc_only_flag = 0;
|
|
|
|
PROFILE_DISABLE_UNPACK_LUMA()
|
|
if(ui2_luma_csbp & 0x33)
|
|
{
|
|
memset(pi2_out_coeff_data,0,64*sizeof(WORD16));
|
|
}
|
|
|
|
if(!u1_mb_field_decoding_flag)
|
|
{
|
|
pu1_inv_scan =
|
|
(UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[0];
|
|
}
|
|
else
|
|
{
|
|
pu1_inv_scan =
|
|
(UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[0];
|
|
}
|
|
// sub 0
|
|
if(ui2_luma_csbp & 0x1)
|
|
{
|
|
dc_only_flag = ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
}
|
|
|
|
if(!u1_mb_field_decoding_flag)
|
|
{
|
|
pu1_inv_scan =
|
|
(UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[1];
|
|
}
|
|
else
|
|
{
|
|
pu1_inv_scan =
|
|
(UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[1];
|
|
}
|
|
// sub 1
|
|
if(ui2_luma_csbp & 0x2)
|
|
{
|
|
dc_only_flag = 0;
|
|
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
}
|
|
|
|
if(!u1_mb_field_decoding_flag)
|
|
{
|
|
pu1_inv_scan =
|
|
(UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[2];
|
|
}
|
|
else
|
|
{
|
|
pu1_inv_scan =
|
|
(UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[2];
|
|
}
|
|
// sub 2
|
|
if(ui2_luma_csbp & 0x10)
|
|
{
|
|
dc_only_flag = 0;
|
|
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
}
|
|
|
|
if(!u1_mb_field_decoding_flag)
|
|
{
|
|
pu1_inv_scan =
|
|
(UWORD8*)gau1_ih264d_inv_scan_prog8x8_cavlc[3];
|
|
}
|
|
else
|
|
{
|
|
pu1_inv_scan =
|
|
(UWORD8*)gau1_ih264d_inv_scan_int8x8_cavlc[3];
|
|
}
|
|
// sub 3
|
|
if(ui2_luma_csbp & 0x20)
|
|
{
|
|
dc_only_flag = 0;
|
|
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
}
|
|
return dc_only_flag;
|
|
}
|
|
void ih264d_unpack_coeff4x4_8x8blk_chroma(dec_struct_t * ps_dec,
|
|
dec_mb_info_t * ps_cur_mb_info,
|
|
UWORD16 ui2_chroma_csbp,
|
|
WORD16 *pi2_out_coeff_data)
|
|
{
|
|
UWORD8 *pu1_inv_scan;
|
|
UWORD8 u1_mb_field_decoding_flag = ps_cur_mb_info->u1_mb_field_decodingflag;
|
|
UWORD8 u1_field_coding_flag = ps_cur_mb_info->ps_curmb->u1_mb_fld;
|
|
|
|
PROFILE_DISABLE_UNPACK_CHROMA()
|
|
if(u1_field_coding_flag || u1_mb_field_decoding_flag)
|
|
{
|
|
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan_fld;
|
|
}
|
|
else
|
|
{
|
|
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan;
|
|
}
|
|
|
|
if(ui2_chroma_csbp & 0x1)
|
|
{
|
|
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
|
|
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
}
|
|
pi2_out_coeff_data += 16;
|
|
if(ui2_chroma_csbp & 0x2)
|
|
{
|
|
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
|
|
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
}
|
|
|
|
pi2_out_coeff_data += 16;
|
|
if(ui2_chroma_csbp & 0x4)
|
|
{
|
|
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
|
|
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
}
|
|
|
|
pi2_out_coeff_data += 16;
|
|
if(ui2_chroma_csbp & 0x8)
|
|
{
|
|
memset(pi2_out_coeff_data,0,16*sizeof(WORD16));
|
|
ih264d_unpack_coeff4x4_4x4blk(ps_dec,
|
|
pi2_out_coeff_data,
|
|
pu1_inv_scan);
|
|
}
|
|
}
|
|
UWORD32 ih264d_unpack_luma_coeff4x4_mb(dec_struct_t * ps_dec,
|
|
dec_mb_info_t * ps_cur_mb_info,
|
|
UWORD8 intra_flag)
|
|
{
|
|
UWORD8 u1_mb_type = ps_cur_mb_info->u1_mb_type;
|
|
UWORD16 ui2_luma_csbp = ps_cur_mb_info->u2_luma_csbp;
|
|
UWORD8 *pu1_inv_scan = ps_dec->pu1_inv_scan;
|
|
WORD16 *pi2_coeff_data = ps_dec->pi2_coeff_data;
|
|
|
|
PROFILE_DISABLE_UNPACK_LUMA()
|
|
if(!ps_cur_mb_info->u1_tran_form8x8)
|
|
{
|
|
UWORD32 u4_luma_dc_only_csbp = 0;
|
|
UWORD32 u4_temp = 0;
|
|
WORD16* pi2_dc_val = NULL;
|
|
/*
|
|
* Reserve the pointer to dc vals. The dc vals will be copied
|
|
* after unpacking of ac vals since memset to 0 inside.
|
|
*/
|
|
if(intra_flag && (u1_mb_type != I_4x4_MB))
|
|
{
|
|
if(CHECKBIT(ps_cur_mb_info->u1_yuv_dc_block_flag,0))
|
|
{
|
|
pi2_dc_val = (WORD16 *)ps_dec->pv_proc_tu_coeff_data;
|
|
|
|
ps_dec->pv_proc_tu_coeff_data = (void *)(pi2_dc_val + 16);
|
|
}
|
|
}
|
|
|
|
if(ui2_luma_csbp)
|
|
{
|
|
pi2_coeff_data = ps_dec->pi2_coeff_data;
|
|
u4_temp = ih264d_unpack_coeff4x4_8x8blk(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_luma_csbp,
|
|
pi2_coeff_data);
|
|
u4_luma_dc_only_csbp = u4_temp;
|
|
|
|
pi2_coeff_data += 32;
|
|
|
|
ui2_luma_csbp = ui2_luma_csbp >> 2;
|
|
u4_temp = ih264d_unpack_coeff4x4_8x8blk(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_luma_csbp,
|
|
pi2_coeff_data);
|
|
|
|
u4_luma_dc_only_csbp |= (u4_temp << 2);
|
|
|
|
pi2_coeff_data += 32 + 64;
|
|
|
|
ui2_luma_csbp = ui2_luma_csbp >> 6;
|
|
u4_temp = ih264d_unpack_coeff4x4_8x8blk(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_luma_csbp,
|
|
pi2_coeff_data);
|
|
|
|
u4_luma_dc_only_csbp |= (u4_temp << 8);
|
|
|
|
pi2_coeff_data += 32;
|
|
|
|
ui2_luma_csbp = ui2_luma_csbp >> 2;
|
|
u4_temp = ih264d_unpack_coeff4x4_8x8blk(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_luma_csbp,
|
|
pi2_coeff_data);
|
|
u4_luma_dc_only_csbp |= (u4_temp << 10);
|
|
}
|
|
|
|
if(pi2_dc_val != NULL)
|
|
{
|
|
WORD32 i;
|
|
pi2_coeff_data = ps_dec->pi2_coeff_data;
|
|
for(i = 0; i < 4; i++)
|
|
{
|
|
pi2_coeff_data[0] = pi2_dc_val[0];
|
|
pi2_coeff_data[4 * 16] = pi2_dc_val[4];
|
|
pi2_coeff_data[8 * 16] = pi2_dc_val[8];
|
|
pi2_coeff_data[12 * 16] = pi2_dc_val[12];
|
|
|
|
pi2_dc_val++; /* Point to next column */
|
|
pi2_coeff_data += 16;
|
|
}
|
|
u4_luma_dc_only_csbp = ps_cur_mb_info->u2_luma_csbp ^ 0xFFFF;
|
|
}
|
|
return u4_luma_dc_only_csbp;
|
|
}
|
|
else
|
|
{
|
|
UWORD32 u4_luma_dc_only_cbp = 0;
|
|
WORD32 dc_only_flag;
|
|
if(ui2_luma_csbp)
|
|
{
|
|
pi2_coeff_data = ps_dec->pi2_coeff_data;
|
|
dc_only_flag = ih264d_unpack_coeff8x8_8x8blk_cavlc(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_luma_csbp,
|
|
pi2_coeff_data);
|
|
INSERT_BIT(u4_luma_dc_only_cbp, 0, dc_only_flag);
|
|
|
|
pi2_coeff_data += 64;
|
|
|
|
ui2_luma_csbp = ui2_luma_csbp >> 2;
|
|
dc_only_flag = ih264d_unpack_coeff8x8_8x8blk_cavlc(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_luma_csbp,
|
|
pi2_coeff_data);
|
|
|
|
INSERT_BIT(u4_luma_dc_only_cbp, 1, dc_only_flag);
|
|
|
|
pi2_coeff_data += 64;
|
|
|
|
ui2_luma_csbp = ui2_luma_csbp >> 6;
|
|
dc_only_flag = ih264d_unpack_coeff8x8_8x8blk_cavlc(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_luma_csbp,
|
|
pi2_coeff_data);
|
|
|
|
INSERT_BIT(u4_luma_dc_only_cbp, 2, dc_only_flag);
|
|
|
|
pi2_coeff_data += 64;
|
|
ui2_luma_csbp = ui2_luma_csbp >> 2;
|
|
dc_only_flag = ih264d_unpack_coeff8x8_8x8blk_cavlc(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_luma_csbp,
|
|
pi2_coeff_data);
|
|
INSERT_BIT(u4_luma_dc_only_cbp, 3, dc_only_flag);
|
|
}
|
|
return u4_luma_dc_only_cbp;
|
|
}
|
|
|
|
}
|
|
|
|
void ih264d_unpack_chroma_coeff4x4_mb(dec_struct_t * ps_dec,
|
|
dec_mb_info_t * ps_cur_mb_info)
|
|
{
|
|
UWORD8 u1_mb_type = ps_cur_mb_info->u1_mb_type;
|
|
UWORD16 ui2_chroma_csbp = ps_cur_mb_info->u2_chroma_csbp;
|
|
UWORD8 *pu1_inv_scan = ps_dec->pu1_inv_scan;
|
|
WORD16 *pi2_coeff_data = ps_dec->pi2_coeff_data;
|
|
WORD32 i;
|
|
WORD16 *pi2_dc_val_u = NULL;
|
|
WORD16 *pi2_dc_val_v = NULL;
|
|
|
|
PROFILE_DISABLE_UNPACK_CHROMA()
|
|
if((ps_cur_mb_info->u1_cbp >> 4) == CBPC_ALLZERO)
|
|
return;
|
|
|
|
/*
|
|
* Reserve the pointers to dc vals. The dc vals will be copied
|
|
* after unpacking of ac vals since memset to 0 inside.
|
|
*/
|
|
if(CHECKBIT(ps_cur_mb_info->u1_yuv_dc_block_flag,1))
|
|
{
|
|
pi2_dc_val_u = (WORD16 *)ps_dec->pv_proc_tu_coeff_data;
|
|
|
|
ps_dec->pv_proc_tu_coeff_data = (void *)(pi2_dc_val_u + 4);
|
|
}
|
|
if(CHECKBIT(ps_cur_mb_info->u1_yuv_dc_block_flag,2))
|
|
{
|
|
pi2_dc_val_v = (WORD16 *)ps_dec->pv_proc_tu_coeff_data;
|
|
|
|
ps_dec->pv_proc_tu_coeff_data = (void *)(pi2_dc_val_v + 4);
|
|
}
|
|
|
|
if((ps_cur_mb_info->u1_cbp >> 4) == CBPC_NONZERO)
|
|
{
|
|
pi2_coeff_data = ps_dec->pi2_coeff_data;
|
|
ih264d_unpack_coeff4x4_8x8blk_chroma(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_chroma_csbp,
|
|
pi2_coeff_data);
|
|
|
|
pi2_coeff_data += 64;
|
|
ui2_chroma_csbp = ui2_chroma_csbp >> 4;
|
|
ih264d_unpack_coeff4x4_8x8blk_chroma(ps_dec,
|
|
ps_cur_mb_info,
|
|
ui2_chroma_csbp,
|
|
pi2_coeff_data);
|
|
|
|
}
|
|
|
|
pi2_coeff_data = ps_dec->pi2_coeff_data;
|
|
if(pi2_dc_val_u != NULL)
|
|
{
|
|
pi2_coeff_data[0] = *pi2_dc_val_u++;
|
|
pi2_coeff_data[1 * 16] = *pi2_dc_val_u++;
|
|
pi2_coeff_data[2 * 16] = *pi2_dc_val_u++;
|
|
pi2_coeff_data[3 * 16] = *pi2_dc_val_u++;
|
|
}
|
|
else
|
|
{
|
|
pi2_coeff_data[0] = 0;
|
|
pi2_coeff_data[1 * 16] = 0;
|
|
pi2_coeff_data[2 * 16] = 0;
|
|
pi2_coeff_data[3 * 16] = 0;
|
|
}
|
|
pi2_coeff_data += 64;
|
|
if(pi2_dc_val_v != NULL)
|
|
{
|
|
pi2_coeff_data[0] = *pi2_dc_val_v++;
|
|
pi2_coeff_data[1 * 16] = *pi2_dc_val_v++;
|
|
pi2_coeff_data[2 * 16] = *pi2_dc_val_v++;
|
|
pi2_coeff_data[3 * 16] = *pi2_dc_val_v++;
|
|
}
|
|
else
|
|
{
|
|
pi2_coeff_data[0] = 0;
|
|
pi2_coeff_data[1 * 16] = 0;
|
|
pi2_coeff_data[2 * 16] = 0;
|
|
pi2_coeff_data[3 * 16] = 0;
|
|
}
|
|
}
|
|
UWORD32 ih264d_unpack_luma_coeff8x8_mb(dec_struct_t * ps_dec,
|
|
dec_mb_info_t * ps_cur_mb_info)
|
|
{
|
|
WORD32 blk_8x8_cnt;
|
|
WORD16 *pi2_out_coeff_data = ps_dec->pi2_coeff_data;
|
|
UWORD8 u1_field_coding_flag = ps_cur_mb_info->ps_curmb->u1_mb_fld;
|
|
UWORD8 *pu1_inv_scan;
|
|
UWORD32 u4_luma_dc_only_cbp = 0;
|
|
|
|
PROFILE_DISABLE_UNPACK_LUMA()
|
|
if(!u1_field_coding_flag)
|
|
{
|
|
/*******************************************************************/
|
|
/* initializing inverse scan matrices */
|
|
/*******************************************************************/
|
|
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan_prog8x8_cabac;
|
|
}
|
|
else
|
|
{
|
|
/*******************************************************************/
|
|
/* initializing inverse scan matrices */
|
|
/*******************************************************************/
|
|
pu1_inv_scan = (UWORD8 *)gau1_ih264d_inv_scan_int8x8_cabac;
|
|
}
|
|
|
|
for(blk_8x8_cnt = 0; blk_8x8_cnt < 4; blk_8x8_cnt++)
|
|
{
|
|
if(CHECKBIT(ps_cur_mb_info->u1_cbp, blk_8x8_cnt))
|
|
{
|
|
tu_blk8x8_coeff_data_t *ps_tu_8x8 = (tu_blk8x8_coeff_data_t *)ps_dec->pv_proc_tu_coeff_data;
|
|
UWORD32 u4_sig_coeff_map;
|
|
WORD32 idx = 0;
|
|
WORD16 *pi2_coeff_data = &ps_tu_8x8->ai2_level[0];
|
|
WORD32 num_coeff = 0;
|
|
|
|
/* memset 64 coefficient to zero */
|
|
memset(pi2_out_coeff_data,0,64*sizeof(WORD16));
|
|
|
|
u4_sig_coeff_map = ps_tu_8x8->au4_sig_coeff_map[1];
|
|
|
|
while(u4_sig_coeff_map)
|
|
{
|
|
idx = CLZ(u4_sig_coeff_map);
|
|
|
|
idx = 31 - idx;
|
|
RESET_BIT(u4_sig_coeff_map,idx);
|
|
|
|
idx = pu1_inv_scan[idx + 32];
|
|
pi2_out_coeff_data[idx] = *pi2_coeff_data++;
|
|
num_coeff++;
|
|
}
|
|
|
|
u4_sig_coeff_map = ps_tu_8x8->au4_sig_coeff_map[0];
|
|
while(u4_sig_coeff_map)
|
|
{
|
|
idx = CLZ(u4_sig_coeff_map);
|
|
|
|
idx = 31 - idx;
|
|
RESET_BIT(u4_sig_coeff_map,idx);
|
|
|
|
idx = pu1_inv_scan[idx];
|
|
pi2_out_coeff_data[idx] = *pi2_coeff_data++;
|
|
num_coeff++;
|
|
}
|
|
|
|
if((num_coeff == 1) && (idx == 0))
|
|
{
|
|
SET_BIT(u4_luma_dc_only_cbp,blk_8x8_cnt);
|
|
}
|
|
|
|
|
|
{
|
|
WORD32 offset;
|
|
offset = (UWORD8 *)pi2_coeff_data - (UWORD8 *)ps_tu_8x8;
|
|
offset = ALIGN4(offset);
|
|
ps_dec->pv_proc_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_proc_tu_coeff_data + offset);
|
|
}
|
|
}
|
|
pi2_out_coeff_data += 64;
|
|
}
|
|
|
|
return u4_luma_dc_only_cbp;
|
|
}
|
|
/*!
|
|
**************************************************************************
|
|
* \if Function name : ih264d_process_intra_mb \endif
|
|
*
|
|
* \brief
|
|
* This function decodes an I MB. Intraprediction is carried out followed
|
|
* by InvTransform. Both IntraPrediction and Reconstruction are carried out
|
|
* in the row buffer itself.
|
|
*
|
|
*
|
|
* \return
|
|
* 0 on Success and Error code otherwise
|
|
**************************************************************************
|
|
*/
|
|
WORD32 ih264d_process_intra_mb(dec_struct_t * ps_dec,
|
|
dec_mb_info_t * ps_cur_mb_info,
|
|
UWORD8 u1_mb_num)
|
|
{
|
|
UWORD8 u1_mb_type = ps_cur_mb_info->u1_mb_type;
|
|
UWORD8 uc_temp = ps_cur_mb_info->u1_mb_ngbr_availablity;
|
|
UWORD8 u1_top_available = BOOLEAN(uc_temp & TOP_MB_AVAILABLE_MASK);
|
|
UWORD8 u1_left_available = BOOLEAN(uc_temp & LEFT_MB_AVAILABLE_MASK);
|
|
UWORD8 u1_use_top_right_mb = BOOLEAN(uc_temp & TOP_RIGHT_MB_AVAILABLE_MASK);
|
|
UWORD8 u1_use_top_left_mb = BOOLEAN(uc_temp & TOP_LEFT_MB_AVAILABLE_MASK);
|
|
UWORD8 uc_useTopMB = u1_top_available;
|
|
UWORD16 u2_use_left_mb = u1_left_available;
|
|
UWORD16 u2_use_left_mb_pack;
|
|
UWORD8 *pu1_luma_pred_buffer;
|
|
/* CHANGED CODE */
|
|
UWORD8 *pu1_luma_rec_buffer;
|
|
UWORD8 *puc_top;
|
|
|
|
mb_neigbour_params_t *ps_left_mb;
|
|
mb_neigbour_params_t *ps_top_mb;
|
|
mb_neigbour_params_t *ps_top_right_mb;
|
|
mb_neigbour_params_t *ps_curmb;
|
|
|
|
UWORD16 u2_mbx = ps_cur_mb_info->u2_mbx;
|
|
UWORD32 ui_pred_width, ui_rec_width;
|
|
WORD16 *pi2_y_coeff;
|
|
UWORD8 u1_mbaff, u1_topmb, u1_mb_field_decoding_flag;
|
|
UWORD32 u4_num_pmbair;
|
|
UWORD16 ui2_luma_csbp = ps_cur_mb_info->u2_luma_csbp;
|
|
UWORD8 *pu1_yleft, *pu1_ytop_left;
|
|
/* Chroma variables*/
|
|
UWORD8 *pu1_top_u;
|
|
UWORD8 *pu1_uleft;
|
|
UWORD8 *pu1_u_top_left;
|
|
/* CHANGED CODE */
|
|
UWORD8 *pu1_mb_cb_rei1_buffer, *pu1_mb_cr_rei1_buffer;
|
|
UWORD32 u4_recwidth_cr;
|
|
/* CHANGED CODE */
|
|
tfr_ctxt_t *ps_frame_buf = ps_dec->ps_frame_buf_ip_recon;
|
|
UWORD32 u4_luma_dc_only_csbp = 0;
|
|
UWORD32 u4_luma_dc_only_cbp = 0;
|
|
|
|
UWORD8 *pu1_prev_intra4x4_pred_mode_data = (UWORD8 *)ps_dec->pv_proc_tu_coeff_data; //Pointer to keep track of intra4x4_pred_mode data in pv_proc_tu_coeff_data buffer
|
|
u1_mbaff = ps_dec->ps_cur_slice->u1_mbaff_frame_flag;
|
|
u1_topmb = ps_cur_mb_info->u1_topmb;
|
|
u4_num_pmbair = (u1_mb_num >> u1_mbaff);
|
|
|
|
|
|
/*--------------------------------------------------------------------*/
|
|
/* Find the current MB's mb params */
|
|
/*--------------------------------------------------------------------*/
|
|
u1_mb_field_decoding_flag = ps_cur_mb_info->u1_mb_field_decodingflag;
|
|
|
|
ps_curmb = ps_cur_mb_info->ps_curmb;
|
|
ps_top_mb = ps_cur_mb_info->ps_top_mb;
|
|
ps_left_mb = ps_cur_mb_info->ps_left_mb;
|
|
ps_top_right_mb = ps_cur_mb_info->ps_top_right_mb;
|
|
|
|
/*--------------------------------------------------------------------*/
|
|
/* Check whether neighbouring MB is Inter MB and */
|
|
/* constrained intra pred is 1. */
|
|
/*--------------------------------------------------------------------*/
|
|
u2_use_left_mb_pack = (u2_use_left_mb << 8) + u2_use_left_mb;
|
|
|
|
if(ps_dec->ps_cur_pps->u1_constrained_intra_pred_flag)
|
|
{
|
|
UWORD8 u1_left = (UWORD8)u2_use_left_mb;
|
|
|
|
uc_useTopMB = uc_useTopMB
|
|
&& ((ps_top_mb->u1_mb_type != P_MB)
|
|
&& (ps_top_mb->u1_mb_type != B_MB));
|
|
u2_use_left_mb = u2_use_left_mb
|
|
&& ((ps_left_mb->u1_mb_type != P_MB)
|
|
&& (ps_left_mb->u1_mb_type != B_MB));
|
|
|
|
u2_use_left_mb_pack = (u2_use_left_mb << 8) + u2_use_left_mb;
|
|
if(u1_mbaff)
|
|
{
|
|
if(u1_mb_field_decoding_flag ^ ps_left_mb->u1_mb_fld)
|
|
{
|
|
u1_left = u1_left
|
|
&& (((ps_left_mb + 1)->u1_mb_type != P_MB)
|
|
&& ((ps_left_mb + 1)->u1_mb_type
|
|
!= B_MB));
|
|
u2_use_left_mb = u2_use_left_mb && u1_left;
|
|
if(u1_mb_field_decoding_flag)
|
|
u2_use_left_mb_pack = (u1_left << 8)
|
|
+ (u2_use_left_mb_pack & 0xff);
|
|
else
|
|
u2_use_left_mb_pack = (u2_use_left_mb << 8)
|
|
+ (u2_use_left_mb);
|
|
}
|
|
}
|
|
u1_use_top_right_mb =
|
|
u1_use_top_right_mb
|
|
&& ((ps_top_right_mb->u1_mb_type != P_MB)
|
|
&& (ps_top_right_mb->u1_mb_type
|
|
!= B_MB));
|
|
|
|
u1_use_top_left_mb =
|
|
u1_use_top_left_mb
|
|
&& ((ps_cur_mb_info->u1_topleft_mbtype != P_MB)
|
|
&& (ps_cur_mb_info->u1_topleft_mbtype
|
|
!= B_MB));
|
|
}
|
|
|
|
/*********************Common pointer calculations *************************/
|
|
/* CHANGED CODE */
|
|
pu1_luma_pred_buffer = ps_dec->pu1_y;
|
|
pu1_luma_rec_buffer = ps_frame_buf->pu1_dest_y + (u4_num_pmbair << 4);
|
|
pu1_mb_cb_rei1_buffer = ps_frame_buf->pu1_dest_u
|
|
+ (u4_num_pmbair << 3) * YUV420SP_FACTOR;
|
|
pu1_mb_cr_rei1_buffer = ps_frame_buf->pu1_dest_v + (u4_num_pmbair << 3);
|
|
ui_pred_width = MB_SIZE;
|
|
ui_rec_width = ps_dec->u2_frm_wd_y << u1_mb_field_decoding_flag;
|
|
u4_recwidth_cr = ps_dec->u2_frm_wd_uv << u1_mb_field_decoding_flag;
|
|
/************* Current and top luma pointer *****************/
|
|
|
|
if(u1_mbaff)
|
|
{
|
|
if(u1_topmb == 0)
|
|
{
|
|
pu1_luma_rec_buffer += (
|
|
u1_mb_field_decoding_flag ?
|
|
(ui_rec_width >> 1) :
|
|
(ui_rec_width << 4));
|
|
pu1_mb_cb_rei1_buffer += (
|
|
u1_mb_field_decoding_flag ?
|
|
(u4_recwidth_cr >> 1) :
|
|
(u4_recwidth_cr << 3));
|
|
pu1_mb_cr_rei1_buffer += (
|
|
u1_mb_field_decoding_flag ?
|
|
(u4_recwidth_cr >> 1) :
|
|
(u4_recwidth_cr << 3));
|
|
}
|
|
}
|
|
|
|
/* CHANGED CODE */
|
|
if(ps_dec->u4_use_intrapred_line_copy == 1)
|
|
{
|
|
puc_top = ps_dec->pu1_prev_y_intra_pred_line + (ps_cur_mb_info->u2_mbx << 4);
|
|
pu1_top_u = ps_dec->pu1_prev_u_intra_pred_line
|
|
+ (ps_cur_mb_info->u2_mbx << 3) * YUV420SP_FACTOR;
|
|
}
|
|
else
|
|
{
|
|
puc_top = pu1_luma_rec_buffer - ui_rec_width;
|
|
pu1_top_u = pu1_mb_cb_rei1_buffer - u4_recwidth_cr;
|
|
}
|
|
/* CHANGED CODE */
|
|
|
|
/************* Left pointer *****************/
|
|
pu1_yleft = pu1_luma_rec_buffer - 1;
|
|
pu1_uleft = pu1_mb_cb_rei1_buffer - 1 * YUV420SP_FACTOR;
|
|
|
|
/**************Top Left pointer calculation**********/
|
|
pu1_ytop_left = puc_top - 1;
|
|
pu1_u_top_left = pu1_top_u - 1 * YUV420SP_FACTOR;
|
|
|
|
/* CHANGED CODE */
|
|
PROFILE_DISABLE_INTRA_PRED()
|
|
{
|
|
pu1_prev_intra4x4_pred_mode_data = (UWORD8 *)ps_dec->pv_proc_tu_coeff_data;
|
|
if(u1_mb_type == I_4x4_MB && ps_cur_mb_info->u1_tran_form8x8 == 0)
|
|
{
|
|
ps_dec->pv_proc_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_proc_tu_coeff_data + 32);
|
|
|
|
}
|
|
else if (u1_mb_type == I_4x4_MB && ps_cur_mb_info->u1_tran_form8x8 == 1)
|
|
{
|
|
ps_dec->pv_proc_tu_coeff_data = (void *)((UWORD8 *)ps_dec->pv_proc_tu_coeff_data + 8);
|
|
}
|
|
}
|
|
if(!ps_cur_mb_info->u1_tran_form8x8)
|
|
{
|
|
u4_luma_dc_only_csbp = ih264d_unpack_luma_coeff4x4_mb(ps_dec,
|
|
ps_cur_mb_info,
|
|
1);
|
|
}
|
|
else
|
|
{
|
|
if(!ps_dec->ps_cur_pps->u1_entropy_coding_mode)
|
|
{
|
|
u4_luma_dc_only_cbp = ih264d_unpack_luma_coeff4x4_mb(ps_dec,
|
|
ps_cur_mb_info,
|
|
1);
|
|
}
|
|
else
|
|
{
|
|
u4_luma_dc_only_cbp = ih264d_unpack_luma_coeff8x8_mb(ps_dec,
|
|
ps_cur_mb_info);
|
|
}
|
|
}
|
|
|
|
pi2_y_coeff = ps_dec->pi2_coeff_data;
|
|
|
|
if(u1_mb_type != I_4x4_MB)
|
|
{
|
|
UWORD8 u1_intrapred_mode = MB_TYPE_TO_INTRA_16x16_MODE(u1_mb_type);
|
|
/*--------------------------------------------------------------------*/
|
|
/* 16x16 IntraPrediction */
|
|
/*--------------------------------------------------------------------*/
|
|
{
|
|
UWORD8 u1_packed_modes = (u1_top_available << 1)
|
|
+ u1_left_available;
|
|
UWORD8 u1_err_code =
|
|
(u1_intrapred_mode & 1) ?
|
|
u1_intrapred_mode :
|
|
(u1_intrapred_mode ^ 2);
|
|
|
|
if((u1_err_code & u1_packed_modes) ^ u1_err_code)
|
|
{
|
|
u1_intrapred_mode = 0;
|
|
ps_dec->i4_error_code = ERROR_INTRAPRED;
|
|
}
|
|
}
|
|
{
|
|
/* Align the size to multiple of 8, so that SIMD functions
|
|
can read 64 bits at a time. Only 33 bytes are actaully used */
|
|
UWORD8 au1_ngbr_pels[40];
|
|
/* Get neighbour pixels */
|
|
/* left pels */
|
|
if(u2_use_left_mb)
|
|
{
|
|
WORD32 i;
|
|
for(i = 0; i < 16; i++)
|
|
au1_ngbr_pels[16 - 1 - i] = pu1_yleft[i * ui_rec_width];
|
|
}
|
|
else
|
|
{
|
|
memset(au1_ngbr_pels, 0, 16);
|
|
}
|
|
|
|
/* top left pels */
|
|
au1_ngbr_pels[16] = *pu1_ytop_left;
|
|
|
|
/* top pels */
|
|
if(uc_useTopMB)
|
|
{
|
|
memcpy(au1_ngbr_pels + 16 + 1, puc_top, 16);
|
|
}
|
|
else
|
|
{
|
|
memset(au1_ngbr_pels + 16 + 1, 0, 16);
|
|
}
|
|
PROFILE_DISABLE_INTRA_PRED()
|
|
ps_dec->apf_intra_pred_luma_16x16[u1_intrapred_mode](
|
|
au1_ngbr_pels, pu1_luma_rec_buffer, 1, ui_rec_width,
|
|
((uc_useTopMB << 2) | u2_use_left_mb));
|
|
}
|
|
{
|
|
UWORD32 i;
|
|
WORD16 ai2_tmp[16];
|
|
for(i = 0; i < 16; i++)
|
|
{
|
|
WORD16 *pi2_level = pi2_y_coeff + (i << 4);
|
|
UWORD8 *pu1_pred_sblk = pu1_luma_rec_buffer
|
|
+ ((i & 0x3) * BLK_SIZE)
|
|
+ (i >> 2) * (ui_rec_width << 2);
|
|
PROFILE_DISABLE_IQ_IT_RECON()
|
|
{
|
|
if(CHECKBIT(ps_cur_mb_info->u2_luma_csbp, i))
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_luma_4x4(
|
|
pi2_level,
|
|
pu1_pred_sblk,
|
|
pu1_pred_sblk,
|
|
ui_rec_width,
|
|
ui_rec_width,
|
|
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qp_rem6],
|
|
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[0],
|
|
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 1,
|
|
pi2_level);
|
|
}
|
|
else if((CHECKBIT(u4_luma_dc_only_csbp, i)) && pi2_level[0] != 0)
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_luma_4x4_dc(
|
|
pi2_level,
|
|
pu1_pred_sblk,
|
|
pu1_pred_sblk,
|
|
ui_rec_width,
|
|
ui_rec_width,
|
|
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qp_rem6],
|
|
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[0],
|
|
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 1,
|
|
pi2_level);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
else if(!ps_cur_mb_info->u1_tran_form8x8)
|
|
{
|
|
UWORD8 u1_is_left_sub_block, u1_is_top_sub_block = uc_useTopMB;
|
|
UWORD8 u1_sub_blk_x, u1_sub_blk_y, u1_sub_mb_num;
|
|
WORD8 i1_top_pred_mode;
|
|
WORD8 i1_left_pred_mode;
|
|
UWORD8 *pu1_top, *pu1_left, *pu1_top_left, *pu1_top_right;
|
|
WORD8 *pi1_cur_pred_mode, *pi1_left_pred_mode, *pc_topPredMode;
|
|
UWORD16 ui2_left_pred_buf_width = 0xffff;
|
|
WORD8 i1_intra_pred;
|
|
UWORD8 *pu1_prev_intra4x4_pred_mode_flag = pu1_prev_intra4x4_pred_mode_data;
|
|
UWORD8 *pu1_rem_intra4x4_pred_mode = pu1_prev_intra4x4_pred_mode_data + 16;
|
|
WORD16 *pi2_y_coeff1;
|
|
UWORD8 u1_cur_sub_block;
|
|
UWORD16 ui2_top_rt_mask;
|
|
|
|
/*--------------------------------------------------------------------*/
|
|
/* 4x4 IntraPrediction */
|
|
/*--------------------------------------------------------------------*/
|
|
/* Calculation of Top Right subblock mask */
|
|
/* */
|
|
/* (a) Set it to default mask */
|
|
/* [It has 0 for sublocks which will never have top-right sub block] */
|
|
/* */
|
|
/* (b) If top MB is not available */
|
|
/* Clear the bits of the first row sub blocks */
|
|
/* */
|
|
/* (c) Set/Clear bit for top-right sublock of MB */
|
|
/* [5 sub-block in decoding order] based on TOP RIGHT MB availablity */
|
|
/*--------------------------------------------------------------------*/
|
|
|
|
pu1_top = puc_top;
|
|
|
|
ui2_top_rt_mask = (u1_use_top_right_mb << 3) | (0x5750);
|
|
if(uc_useTopMB)
|
|
ui2_top_rt_mask |= 0x7;
|
|
|
|
/*Top Related initialisations*/
|
|
|
|
|
|
pi1_cur_pred_mode = ps_cur_mb_info->ps_curmb->pi1_intrapredmodes;
|
|
pc_topPredMode = ps_cur_mb_info->ps_top_mb->pi1_intrapredmodes;
|
|
/*--------------------------------------
|
|
if(u1_mbaff)
|
|
{
|
|
|
|
pi1_cur_pred_mode += (u2_mbx << 2);
|
|
pc_topPredMode = pi1_cur_pred_mode + ps_cur_mb_info->i1_offset;
|
|
pi1_cur_pred_mode += (u1_topmb) ? 0: 4;
|
|
}*/
|
|
|
|
if(u1_top_available)
|
|
{
|
|
if(ps_top_mb->u1_mb_type == I_4x4_MB)
|
|
*(WORD32*)pi1_cur_pred_mode = *(WORD32*)pc_topPredMode;
|
|
else
|
|
*(WORD32*)pi1_cur_pred_mode =
|
|
(uc_useTopMB) ? DC_DC_DC_DC : NOT_VALID;
|
|
}
|
|
else
|
|
*(WORD32*)pi1_cur_pred_mode = NOT_VALID;
|
|
/* CHANGED CODE */
|
|
|
|
/* CHANGED CODE */
|
|
|
|
/*Left Related initialisations*/
|
|
pi1_left_pred_mode = ps_dec->pi1_left_pred_mode;
|
|
if(!u1_mbaff)
|
|
{
|
|
|
|
if(u1_left_available)
|
|
{
|
|
|
|
if(ps_left_mb->u1_mb_type != I_4x4_MB)
|
|
*(WORD32*)pi1_left_pred_mode =
|
|
(u2_use_left_mb_pack) ?
|
|
DC_DC_DC_DC :
|
|
NOT_VALID;
|
|
|
|
}
|
|
else
|
|
{
|
|
|
|
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
|
|
}
|
|
|
|
}
|
|
else
|
|
{
|
|
UWORD8 u1_curMbfld = ps_cur_mb_info->u1_mb_field_decodingflag;
|
|
UWORD8 u1_leftMbfld = ps_left_mb->u1_mb_fld;
|
|
|
|
if(u1_curMbfld ^ u1_leftMbfld)
|
|
{
|
|
|
|
if(u1_topmb
|
|
| ((u1_topmb == 0)
|
|
&& ((ps_curmb - 1)->u1_mb_type
|
|
!= I_4x4_MB)))
|
|
{
|
|
if(u1_left_available)
|
|
{
|
|
if(ps_left_mb->u1_mb_type != I_4x4_MB)
|
|
{
|
|
if(CHECKBIT(u2_use_left_mb_pack,0) == 0)
|
|
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
|
|
else
|
|
*(WORD32*)pi1_left_pred_mode = DC_DC_DC_DC;
|
|
}
|
|
}
|
|
else
|
|
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
|
|
|
|
if(u1_curMbfld)
|
|
{
|
|
if(u1_left_available)
|
|
{
|
|
if((ps_left_mb + 1)->u1_mb_type != I_4x4_MB)
|
|
{
|
|
if(u2_use_left_mb_pack >> 8)
|
|
*(WORD32*)(pi1_left_pred_mode + 4) =
|
|
DC_DC_DC_DC;
|
|
else
|
|
*(WORD32*)(pi1_left_pred_mode + 4) =
|
|
NOT_VALID;
|
|
}
|
|
}
|
|
else
|
|
*(WORD32*)(pi1_left_pred_mode + 4) = NOT_VALID;
|
|
pi1_left_pred_mode[1] = pi1_left_pred_mode[2];
|
|
pi1_left_pred_mode[2] = pi1_left_pred_mode[4];
|
|
pi1_left_pred_mode[3] = pi1_left_pred_mode[6];
|
|
*(WORD32*)(pi1_left_pred_mode + 4) =
|
|
*(WORD32*)pi1_left_pred_mode;
|
|
}
|
|
else
|
|
{
|
|
|
|
pi1_left_pred_mode[7] = pi1_left_pred_mode[3];
|
|
pi1_left_pred_mode[6] = pi1_left_pred_mode[3];
|
|
pi1_left_pred_mode[5] = pi1_left_pred_mode[2];
|
|
pi1_left_pred_mode[4] = pi1_left_pred_mode[2];
|
|
pi1_left_pred_mode[3] = pi1_left_pred_mode[1];
|
|
pi1_left_pred_mode[2] = pi1_left_pred_mode[1];
|
|
pi1_left_pred_mode[1] = pi1_left_pred_mode[0];
|
|
}
|
|
}
|
|
pi1_left_pred_mode += (u1_topmb) ? 0 : 4;
|
|
}
|
|
else
|
|
{
|
|
|
|
pi1_left_pred_mode += (u1_topmb) ? 0 : 4;
|
|
if(u1_left_available)
|
|
{
|
|
|
|
if(ps_left_mb->u1_mb_type != I_4x4_MB)
|
|
*(WORD32*)pi1_left_pred_mode =
|
|
(u2_use_left_mb_pack) ?
|
|
DC_DC_DC_DC :
|
|
NOT_VALID;
|
|
}
|
|
else
|
|
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
|
|
}
|
|
}
|
|
/* One time pointer initialisations*/
|
|
pi2_y_coeff1 = pi2_y_coeff;
|
|
pu1_top_left = pu1_ytop_left;
|
|
|
|
/* Scan the sub-blocks in Raster Scan Order */
|
|
for(u1_sub_mb_num = 0; u1_sub_mb_num < 16; u1_sub_mb_num++)
|
|
{
|
|
/* Align the size to multiple of 8, so that SIMD functions
|
|
can read 64 bits at a time. Only 13 bytes are actually used */
|
|
UWORD8 au1_ngbr_pels[16];
|
|
|
|
u1_sub_blk_x = u1_sub_mb_num & 0x3;
|
|
u1_sub_blk_y = u1_sub_mb_num >> 2;
|
|
i1_top_pred_mode = pi1_cur_pred_mode[u1_sub_blk_x];
|
|
i1_left_pred_mode = pi1_left_pred_mode[u1_sub_blk_y];
|
|
u1_use_top_right_mb = (!!CHECKBIT(ui2_top_rt_mask, u1_sub_mb_num));
|
|
|
|
/*********** left subblock availability**********/
|
|
if(u1_sub_blk_x)
|
|
u1_is_left_sub_block = 1;
|
|
else
|
|
u1_is_left_sub_block =
|
|
(u1_sub_blk_y < 2) ?
|
|
(CHECKBIT(u2_use_left_mb_pack,
|
|
0)) :
|
|
(u2_use_left_mb_pack >> 8);
|
|
|
|
/* CHANGED CODE */
|
|
if(u1_sub_blk_y)
|
|
u1_is_top_sub_block = 1;
|
|
|
|
/* CHANGED CODE */
|
|
/***************** Top *********************/
|
|
if(ps_dec->u4_use_intrapred_line_copy == 1)
|
|
{
|
|
|
|
if(u1_sub_blk_y)
|
|
pu1_top = pu1_luma_rec_buffer - ui_rec_width;
|
|
else
|
|
pu1_top = puc_top + (u1_sub_blk_x << 2);
|
|
}
|
|
else
|
|
{
|
|
pu1_top = pu1_luma_rec_buffer - ui_rec_width;
|
|
}
|
|
/***************** Top Right *********************/
|
|
pu1_top_right = pu1_top + 4;
|
|
/***************** Top Left *********************/
|
|
pu1_top_left = pu1_top - 1;
|
|
/***************** Left *********************/
|
|
pu1_left = pu1_luma_rec_buffer - 1;
|
|
/* CHANGED CODE */
|
|
|
|
/*---------------------------------------------------------------*/
|
|
/* Calculation of Intra prediction mode */
|
|
/*---------------------------------------------------------------*/
|
|
i1_intra_pred = ((i1_left_pred_mode < 0) | (i1_top_pred_mode < 0)) ?
|
|
DC : MIN(i1_left_pred_mode, i1_top_pred_mode);
|
|
{
|
|
UWORD8 u1_packed_modes = (u1_is_top_sub_block << 1)
|
|
+ u1_is_left_sub_block;
|
|
UWORD8 *pu1_intra_err_codes =
|
|
(UWORD8 *)gau1_ih264d_intra_pred_err_code;
|
|
UWORD8 uc_b2b0 = ((u1_sub_mb_num & 4) >> 1) | (u1_sub_mb_num & 1);
|
|
UWORD8 uc_b3b1 = ((u1_sub_mb_num & 8) >> 2)
|
|
| ((u1_sub_mb_num & 2) >> 1);
|
|
|
|
u1_cur_sub_block = (uc_b3b1 << 2) + uc_b2b0;
|
|
PROFILE_DISABLE_INTRA_PRED()
|
|
if(!pu1_prev_intra4x4_pred_mode_flag[u1_cur_sub_block])
|
|
{
|
|
i1_intra_pred =
|
|
pu1_rem_intra4x4_pred_mode[u1_cur_sub_block]
|
|
+ (pu1_rem_intra4x4_pred_mode[u1_cur_sub_block]
|
|
>= i1_intra_pred);
|
|
}
|
|
i1_intra_pred = CLIP3(0, 8, i1_intra_pred);
|
|
{
|
|
UWORD8 u1_err_code = pu1_intra_err_codes[i1_intra_pred];
|
|
|
|
if((u1_err_code & u1_packed_modes) ^ u1_err_code)
|
|
{
|
|
i1_intra_pred = 0;
|
|
ps_dec->i4_error_code = ERROR_INTRAPRED;
|
|
}
|
|
|
|
}
|
|
}
|
|
{
|
|
/* Get neighbour pixels */
|
|
/* left pels */
|
|
if(u1_is_left_sub_block)
|
|
{
|
|
WORD32 i;
|
|
for(i = 0; i < 4; i++)
|
|
au1_ngbr_pels[4 - 1 - i] = pu1_left[i * ui_rec_width];
|
|
}
|
|
else
|
|
{
|
|
memset(au1_ngbr_pels, 0, 4);
|
|
}
|
|
|
|
/* top left pels */
|
|
au1_ngbr_pels[4] = *pu1_top_left;
|
|
|
|
/* top pels */
|
|
if(u1_is_top_sub_block)
|
|
{
|
|
memcpy(au1_ngbr_pels + 4 + 1, pu1_top, 4);
|
|
}
|
|
else
|
|
{
|
|
memset(au1_ngbr_pels + 4 + 1, 0, 4);
|
|
}
|
|
|
|
/* top right pels */
|
|
if(u1_use_top_right_mb)
|
|
{
|
|
memcpy(au1_ngbr_pels + 4 * 2 + 1, pu1_top_right, 4);
|
|
}
|
|
else if(u1_is_top_sub_block)
|
|
{
|
|
memset(au1_ngbr_pels + 4 * 2 + 1, au1_ngbr_pels[4 * 2], 4);
|
|
}
|
|
}
|
|
PROFILE_DISABLE_INTRA_PRED()
|
|
ps_dec->apf_intra_pred_luma_4x4[i1_intra_pred](
|
|
au1_ngbr_pels, pu1_luma_rec_buffer, 1,
|
|
ui_rec_width,
|
|
((u1_is_top_sub_block << 2) | u1_is_left_sub_block));
|
|
|
|
/* CHANGED CODE */
|
|
if(CHECKBIT(ui2_luma_csbp, u1_sub_mb_num))
|
|
{
|
|
WORD16 ai2_tmp[16];
|
|
PROFILE_DISABLE_IQ_IT_RECON()
|
|
{
|
|
if(CHECKBIT(u4_luma_dc_only_csbp, u1_sub_mb_num))
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_luma_4x4_dc(
|
|
pi2_y_coeff1,
|
|
pu1_luma_rec_buffer,
|
|
pu1_luma_rec_buffer,
|
|
ui_rec_width,
|
|
ui_rec_width,
|
|
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qp_rem6],
|
|
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[0],
|
|
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 0,
|
|
NULL);
|
|
}
|
|
else
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_luma_4x4(
|
|
pi2_y_coeff1,
|
|
pu1_luma_rec_buffer,
|
|
pu1_luma_rec_buffer,
|
|
ui_rec_width,
|
|
ui_rec_width,
|
|
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qp_rem6],
|
|
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[0],
|
|
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 0,
|
|
NULL);
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
/*---------------------------------------------------------------*/
|
|
/* Update sub block number */
|
|
/*---------------------------------------------------------------*/
|
|
pi2_y_coeff1 += 16;
|
|
pu1_luma_rec_buffer +=
|
|
(u1_sub_blk_x == 3) ? (ui_rec_width << 2) - 12 : 4;
|
|
pu1_luma_pred_buffer +=
|
|
(u1_sub_blk_x == 3) ? (ui_pred_width << 2) - 12 : 4;
|
|
/* CHANGED CODE */
|
|
pi1_cur_pred_mode[u1_sub_blk_x] = i1_intra_pred;
|
|
pi1_left_pred_mode[u1_sub_blk_y] = i1_intra_pred;
|
|
}
|
|
}
|
|
else if((u1_mb_type == I_4x4_MB) && (ps_cur_mb_info->u1_tran_form8x8 == 1))
|
|
{
|
|
UWORD8 u1_is_left_sub_block, u1_is_top_sub_block = uc_useTopMB;
|
|
UWORD8 u1_sub_blk_x, u1_sub_blk_y, u1_sub_mb_num;
|
|
WORD8 i1_top_pred_mode;
|
|
WORD8 i1_left_pred_mode;
|
|
UWORD8 *pu1_top, *pu1_left, *pu1_top_left;
|
|
WORD8 *pi1_cur_pred_mode, *pi1_left_pred_mode, *pc_topPredMode;
|
|
UWORD16 ui2_left_pred_buf_width = 0xffff;
|
|
WORD8 i1_intra_pred;
|
|
UWORD8 *pu1_prev_intra4x4_pred_mode_flag = pu1_prev_intra4x4_pred_mode_data;
|
|
UWORD8 *pu1_rem_intra4x4_pred_mode = pu1_prev_intra4x4_pred_mode_data + 4;
|
|
WORD16 *pi2_y_coeff1;
|
|
UWORD16 ui2_top_rt_mask;
|
|
UWORD32 u4_4x4_left_offset = 0;
|
|
|
|
/*--------------------------------------------------------------------*/
|
|
/* 8x8 IntraPrediction */
|
|
/*--------------------------------------------------------------------*/
|
|
/* Calculation of Top Right subblock mask */
|
|
/* */
|
|
/* (a) Set it to default mask */
|
|
/* [It has 0 for sub-blocks which will never have top-right sub block] */
|
|
/* */
|
|
/* (b) If top MB is not available */
|
|
/* Clear the bits of the first row sub blocks */
|
|
/* */
|
|
/* (c) Set/Clear bit for top-right sub-block of MB */
|
|
/* [5 sub-block in decoding order] based on TOP RIGHT MB availability */
|
|
/* */
|
|
/* ui2_top_rt_mask: marks availability of top right(neighbour) */
|
|
/* in the 8x8 Block ordering */
|
|
/* */
|
|
/* tr0 tr1 */
|
|
/* 0 1 tr3 */
|
|
/* 2 3 */
|
|
/* */
|
|
/* Top rights for 0 is in top MB */
|
|
/* top right of 1 will be in top right MB */
|
|
/* top right of 3 in right MB and hence not available */
|
|
/* This corresponds to ui2_top_rt_mask having default value 0x4 */
|
|
/*--------------------------------------------------------------------*/
|
|
|
|
ui2_top_rt_mask = (u1_use_top_right_mb << 1) | (0x4);
|
|
|
|
if(uc_useTopMB)
|
|
{
|
|
ui2_top_rt_mask |= 0x1;
|
|
}
|
|
|
|
/* Top Related initialisations */
|
|
pi1_cur_pred_mode = ps_cur_mb_info->ps_curmb->pi1_intrapredmodes;
|
|
pc_topPredMode = ps_cur_mb_info->ps_top_mb->pi1_intrapredmodes;
|
|
/*
|
|
if(u1_mbaff)
|
|
{
|
|
pi1_cur_pred_mode += (u2_mbx << 2);
|
|
pc_topPredMode = pi1_cur_pred_mode + ps_cur_mb_info->i1_offset;
|
|
pi1_cur_pred_mode += (u1_topmb) ? 0: 4;
|
|
}
|
|
*/
|
|
if(u1_top_available)
|
|
{
|
|
if(ps_top_mb->u1_mb_type == I_4x4_MB)
|
|
{
|
|
*(WORD32*)pi1_cur_pred_mode = *(WORD32*)pc_topPredMode;
|
|
}
|
|
else
|
|
{
|
|
*(WORD32*)pi1_cur_pred_mode =
|
|
(uc_useTopMB) ? DC_DC_DC_DC : NOT_VALID;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
*(WORD32*)pi1_cur_pred_mode = NOT_VALID;
|
|
}
|
|
|
|
pu1_top = puc_top - 8;
|
|
|
|
/*Left Related initialisations*/
|
|
pi1_left_pred_mode = ps_dec->pi1_left_pred_mode;
|
|
|
|
if(!u1_mbaff)
|
|
{
|
|
if(u1_left_available)
|
|
{
|
|
if(ps_left_mb->u1_mb_type != I_4x4_MB)
|
|
{
|
|
*(WORD32*)pi1_left_pred_mode =
|
|
(u2_use_left_mb_pack) ?
|
|
DC_DC_DC_DC :
|
|
NOT_VALID;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
UWORD8 u1_curMbfld = ps_cur_mb_info->u1_mb_field_decodingflag;
|
|
|
|
UWORD8 u1_leftMbfld = ps_left_mb->u1_mb_fld;
|
|
|
|
if((!u1_curMbfld) && (u1_leftMbfld))
|
|
{
|
|
u4_4x4_left_offset = 1;
|
|
}
|
|
|
|
if(u1_curMbfld ^ u1_leftMbfld)
|
|
{
|
|
|
|
if(u1_topmb
|
|
| ((u1_topmb == 0)
|
|
&& ((ps_curmb - 1)->u1_mb_type
|
|
!= I_4x4_MB)))
|
|
|
|
{
|
|
if(u1_left_available)
|
|
{
|
|
if(ps_left_mb->u1_mb_type != I_4x4_MB)
|
|
{
|
|
if(CHECKBIT(u2_use_left_mb_pack,0) == 0)
|
|
{
|
|
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
|
|
}
|
|
else
|
|
{
|
|
*(WORD32*)pi1_left_pred_mode = DC_DC_DC_DC;
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
|
|
}
|
|
|
|
if(u1_curMbfld)
|
|
{
|
|
if(u1_left_available)
|
|
{
|
|
if((ps_left_mb + 1)->u1_mb_type != I_4x4_MB)
|
|
{
|
|
if(u2_use_left_mb_pack >> 8)
|
|
{
|
|
*(WORD32*)(pi1_left_pred_mode + 4) =
|
|
DC_DC_DC_DC;
|
|
}
|
|
else
|
|
{
|
|
*(WORD32*)(pi1_left_pred_mode + 4) =
|
|
NOT_VALID;
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
*(WORD32*)(pi1_left_pred_mode + 4) = NOT_VALID;
|
|
}
|
|
|
|
pi1_left_pred_mode[1] = pi1_left_pred_mode[2];
|
|
pi1_left_pred_mode[2] = pi1_left_pred_mode[4];
|
|
pi1_left_pred_mode[3] = pi1_left_pred_mode[6];
|
|
*(WORD32*)(pi1_left_pred_mode + 4) =
|
|
*(WORD32*)pi1_left_pred_mode;
|
|
}
|
|
else
|
|
{
|
|
pi1_left_pred_mode[7] = pi1_left_pred_mode[3];
|
|
pi1_left_pred_mode[6] = pi1_left_pred_mode[3];
|
|
pi1_left_pred_mode[5] = pi1_left_pred_mode[2];
|
|
pi1_left_pred_mode[4] = pi1_left_pred_mode[2];
|
|
pi1_left_pred_mode[3] = pi1_left_pred_mode[1];
|
|
pi1_left_pred_mode[2] = pi1_left_pred_mode[1];
|
|
pi1_left_pred_mode[1] = pi1_left_pred_mode[0];
|
|
}
|
|
}
|
|
pi1_left_pred_mode += (u1_topmb) ? 0 : 4;
|
|
}
|
|
else
|
|
{
|
|
pi1_left_pred_mode += (u1_topmb) ? 0 : 4;
|
|
|
|
if(u1_left_available)
|
|
{
|
|
if(ps_left_mb->u1_mb_type != I_4x4_MB)
|
|
{
|
|
*(WORD32*)pi1_left_pred_mode =
|
|
(u2_use_left_mb_pack) ?
|
|
DC_DC_DC_DC :
|
|
NOT_VALID;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
*(WORD32*)pi1_left_pred_mode = NOT_VALID;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* One time pointer initialisations*/
|
|
pi2_y_coeff1 = pi2_y_coeff;
|
|
|
|
if(u1_use_top_left_mb)
|
|
{
|
|
pu1_top_left = pu1_ytop_left;
|
|
}
|
|
else
|
|
{
|
|
pu1_top_left = NULL;
|
|
}
|
|
|
|
/* Scan the sub-blocks in Raster Scan Order */
|
|
for(u1_sub_mb_num = 0; u1_sub_mb_num < 4; u1_sub_mb_num++)
|
|
{
|
|
u1_sub_blk_x = (u1_sub_mb_num & 0x1);
|
|
u1_sub_blk_y = (u1_sub_mb_num >> 1);
|
|
i1_top_pred_mode = pi1_cur_pred_mode[u1_sub_blk_x << 1];
|
|
i1_left_pred_mode = pi1_left_pred_mode[u1_sub_blk_y << 1];
|
|
|
|
if(2 == u1_sub_mb_num)
|
|
{
|
|
i1_left_pred_mode = pi1_left_pred_mode[(u1_sub_blk_y << 1)
|
|
+ u4_4x4_left_offset];
|
|
}
|
|
|
|
u1_use_top_right_mb = (!!CHECKBIT(ui2_top_rt_mask, u1_sub_mb_num));
|
|
|
|
/*********** left subblock availability**********/
|
|
if(u1_sub_blk_x)
|
|
{
|
|
u1_is_left_sub_block = 1;
|
|
}
|
|
else
|
|
{
|
|
u1_is_left_sub_block =
|
|
(u1_sub_blk_y < 1) ?
|
|
(CHECKBIT(u2_use_left_mb_pack,
|
|
0)) :
|
|
(u2_use_left_mb_pack >> 8);
|
|
}
|
|
|
|
/***************** Top *********************/
|
|
if(u1_sub_blk_y)
|
|
{
|
|
u1_is_top_sub_block = 1;
|
|
// sushant
|
|
pu1_top = /*pu1_luma_pred_buffer*/pu1_luma_rec_buffer - ui_rec_width;
|
|
}
|
|
else
|
|
{
|
|
pu1_top += 8;
|
|
}
|
|
|
|
/***************** Left *********************/
|
|
if((u1_sub_blk_x) | (u4_num_pmbair != 0))
|
|
{
|
|
// sushant
|
|
pu1_left = /*pu1_luma_pred_buffer*/pu1_luma_rec_buffer - 1;
|
|
ui2_left_pred_buf_width = ui_rec_width;
|
|
}
|
|
else
|
|
{
|
|
pu1_left = pu1_yleft;
|
|
pu1_yleft += (ui_rec_width << 3);
|
|
ui2_left_pred_buf_width = ui_rec_width;
|
|
}
|
|
|
|
/***************** Top Left *********************/
|
|
if(u1_sub_mb_num)
|
|
{
|
|
pu1_top_left = (u1_sub_blk_x) ?
|
|
pu1_top - 1 : pu1_left - ui_rec_width;
|
|
|
|
if((u1_sub_blk_x && (!u1_is_top_sub_block))
|
|
|| ((!u1_sub_blk_x) && (!u1_is_left_sub_block)))
|
|
{
|
|
pu1_top_left = NULL;
|
|
}
|
|
}
|
|
|
|
/*---------------------------------------------------------------*/
|
|
/* Calculation of Intra prediction mode */
|
|
/*---------------------------------------------------------------*/
|
|
i1_intra_pred = ((i1_left_pred_mode < 0) | (i1_top_pred_mode < 0)) ?
|
|
DC : MIN(i1_left_pred_mode, i1_top_pred_mode);
|
|
{
|
|
UWORD8 u1_packed_modes = (u1_is_top_sub_block << 1)
|
|
+ u1_is_left_sub_block;
|
|
UWORD8 *pu1_intra_err_codes =
|
|
(UWORD8 *)gau1_ih264d_intra_pred_err_code;
|
|
|
|
/********************************************************************/
|
|
/* Same intra4x4_pred_mode array is filled with intra4x4_pred_mode */
|
|
/* for a MB with 8x8 intrapredicition */
|
|
/********************************************************************/
|
|
PROFILE_DISABLE_INTRA_PRED()
|
|
if(!pu1_prev_intra4x4_pred_mode_flag[u1_sub_mb_num])
|
|
{
|
|
i1_intra_pred = pu1_rem_intra4x4_pred_mode[u1_sub_mb_num]
|
|
+ (pu1_rem_intra4x4_pred_mode[u1_sub_mb_num]
|
|
>= i1_intra_pred);
|
|
}
|
|
i1_intra_pred = CLIP3(0, 8, i1_intra_pred);
|
|
{
|
|
UWORD8 u1_err_code = pu1_intra_err_codes[i1_intra_pred];
|
|
|
|
if((u1_err_code & u1_packed_modes) ^ u1_err_code)
|
|
{
|
|
i1_intra_pred = 0;
|
|
ps_dec->i4_error_code = ERROR_INTRAPRED;
|
|
}
|
|
}
|
|
}
|
|
|
|
{
|
|
/* Align the size to multiple of 8, so that SIMD functions
|
|
can read 64 bits at a time. Only 25 bytes are actually used */
|
|
UWORD8 au1_ngbr_pels[32] = {0};
|
|
WORD32 ngbr_avail;
|
|
ngbr_avail = u1_is_left_sub_block << 0;
|
|
ngbr_avail |= u1_is_top_sub_block << 2;
|
|
|
|
if(pu1_top_left)
|
|
ngbr_avail |= 1 << 1;
|
|
|
|
ngbr_avail |= u1_use_top_right_mb << 3;
|
|
PROFILE_DISABLE_INTRA_PRED()
|
|
{
|
|
ps_dec->pf_intra_pred_ref_filtering(pu1_left, pu1_top_left,
|
|
pu1_top, au1_ngbr_pels,
|
|
ui2_left_pred_buf_width,
|
|
ngbr_avail);
|
|
|
|
ps_dec->apf_intra_pred_luma_8x8[i1_intra_pred](
|
|
au1_ngbr_pels, pu1_luma_rec_buffer, 1,
|
|
ui_rec_width,
|
|
((u1_is_top_sub_block << 2) | u1_is_left_sub_block));
|
|
}
|
|
}
|
|
|
|
/* Inverse Transform and Reconstruction */
|
|
if(CHECKBIT(ps_cur_mb_info->u1_cbp, u1_sub_mb_num))
|
|
{
|
|
WORD16 *pi2_scale_matrix_ptr;
|
|
WORD16 ai2_tmp[64];
|
|
|
|
pi2_scale_matrix_ptr =
|
|
ps_dec->s_high_profile.i2_scalinglist8x8[0];
|
|
PROFILE_DISABLE_IQ_IT_RECON()
|
|
{
|
|
if(CHECKBIT(u4_luma_dc_only_cbp, u1_sub_mb_num))
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_luma_8x8_dc(
|
|
pi2_y_coeff1,
|
|
pu1_luma_rec_buffer,
|
|
pu1_luma_rec_buffer,
|
|
ui_rec_width,
|
|
ui_rec_width,
|
|
gau1_ih264d_dequant8x8_cavlc[ps_cur_mb_info->u1_qp_rem6],
|
|
(UWORD16 *)pi2_scale_matrix_ptr,
|
|
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 0,
|
|
NULL);
|
|
}
|
|
else
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_luma_8x8(
|
|
pi2_y_coeff1,
|
|
pu1_luma_rec_buffer,
|
|
pu1_luma_rec_buffer,
|
|
ui_rec_width,
|
|
ui_rec_width,
|
|
gau1_ih264d_dequant8x8_cavlc[ps_cur_mb_info->u1_qp_rem6],
|
|
(UWORD16 *)pi2_scale_matrix_ptr,
|
|
ps_cur_mb_info->u1_qp_div6, ai2_tmp, 0,
|
|
NULL);
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
/*---------------------------------------------------------------*/
|
|
/* Update sub block number */
|
|
/*---------------------------------------------------------------*/
|
|
pi2_y_coeff1 += 64;
|
|
|
|
pu1_luma_rec_buffer +=
|
|
(u1_sub_blk_x == 1) ?
|
|
(ui_rec_width << 3) - (8 * 1) : 8;
|
|
|
|
/*---------------------------------------------------------------*/
|
|
/* Pred mode filled in terms of 4x4 block so replicated in 2 */
|
|
/* locations. */
|
|
/*---------------------------------------------------------------*/
|
|
pi1_cur_pred_mode[u1_sub_blk_x << 1] = i1_intra_pred;
|
|
pi1_cur_pred_mode[(u1_sub_blk_x << 1) + 1] = i1_intra_pred;
|
|
pi1_left_pred_mode[u1_sub_blk_y << 1] = i1_intra_pred;
|
|
pi1_left_pred_mode[(u1_sub_blk_y << 1) + 1] = i1_intra_pred;
|
|
}
|
|
}
|
|
/* Decode Chroma Block */
|
|
ih264d_unpack_chroma_coeff4x4_mb(ps_dec,
|
|
ps_cur_mb_info);
|
|
/*--------------------------------------------------------------------*/
|
|
/* Chroma Blocks decoding */
|
|
/*--------------------------------------------------------------------*/
|
|
{
|
|
UWORD8 u1_intra_chrom_pred_mode;
|
|
UWORD8 u1_chroma_cbp = (UWORD8)(ps_cur_mb_info->u1_cbp >> 4);
|
|
|
|
/*--------------------------------------------------------------------*/
|
|
/* Perform Chroma intra prediction */
|
|
/*--------------------------------------------------------------------*/
|
|
|
|
u1_intra_chrom_pred_mode = CHROMA_TO_LUMA_INTRA_MODE(
|
|
ps_cur_mb_info->u1_chroma_pred_mode);
|
|
|
|
{
|
|
UWORD8 u1_packed_modes = (u1_top_available << 1)
|
|
+ u1_left_available;
|
|
UWORD8 u1_err_code =
|
|
(u1_intra_chrom_pred_mode & 1) ?
|
|
u1_intra_chrom_pred_mode :
|
|
(u1_intra_chrom_pred_mode ^ 2);
|
|
if((u1_err_code & u1_packed_modes) ^ u1_err_code)
|
|
{
|
|
u1_intra_chrom_pred_mode = 0;
|
|
ps_dec->i4_error_code = ERROR_INTRAPRED;
|
|
}
|
|
}
|
|
|
|
/* CHANGED CODE */
|
|
if(u1_chroma_cbp != CBPC_ALLZERO)
|
|
{
|
|
UWORD16 u2_chroma_csbp =
|
|
(u1_chroma_cbp == CBPC_ACZERO) ?
|
|
0 : ps_cur_mb_info->u2_chroma_csbp;
|
|
UWORD32 u4_scale_u;
|
|
UWORD32 u4_scale_v;
|
|
|
|
{
|
|
UWORD16 au2_ngbr_pels[33];
|
|
UWORD8 *pu1_ngbr_pels = (UWORD8 *)au2_ngbr_pels;
|
|
UWORD16 *pu2_left_uv;
|
|
UWORD16 *pu2_topleft_uv;
|
|
WORD32 use_left1 = (u2_use_left_mb_pack & 0x0ff);
|
|
WORD32 use_left2 = (u2_use_left_mb_pack & 0xff00) >> 8;
|
|
|
|
pu2_left_uv = (UWORD16 *)pu1_uleft;
|
|
pu2_topleft_uv = (UWORD16 *)pu1_u_top_left;
|
|
/* Get neighbour pixels */
|
|
/* left pels */
|
|
if(u2_use_left_mb_pack)
|
|
{
|
|
WORD32 i;
|
|
if(use_left1)
|
|
{
|
|
for(i = 0; i < 4; i++)
|
|
au2_ngbr_pels[8 - 1 - i] = pu2_left_uv[i
|
|
* u4_recwidth_cr / YUV420SP_FACTOR];
|
|
}
|
|
else
|
|
{
|
|
memset(au2_ngbr_pels + 4, 0, 4 * sizeof(UWORD16));
|
|
}
|
|
|
|
if(use_left2)
|
|
{
|
|
for(i = 4; i < 8; i++)
|
|
au2_ngbr_pels[8 - 1 - i] = pu2_left_uv[i
|
|
* u4_recwidth_cr / YUV420SP_FACTOR];
|
|
}
|
|
else
|
|
{
|
|
memset(au2_ngbr_pels, 0, 4 * sizeof(UWORD16));
|
|
}
|
|
}
|
|
else
|
|
{
|
|
memset(au2_ngbr_pels, 0, 8 * sizeof(UWORD16));
|
|
}
|
|
|
|
/* top left pels */
|
|
au2_ngbr_pels[8] = *pu2_topleft_uv;
|
|
|
|
/* top pels */
|
|
if(uc_useTopMB)
|
|
{
|
|
memcpy(au2_ngbr_pels + 8 + 1, pu1_top_u,
|
|
8 * sizeof(UWORD16));
|
|
}
|
|
else
|
|
{
|
|
memset(au2_ngbr_pels + 8 + 1, 0, 8 * sizeof(UWORD16));
|
|
}
|
|
|
|
PROFILE_DISABLE_INTRA_PRED()
|
|
ps_dec->apf_intra_pred_chroma[u1_intra_chrom_pred_mode](
|
|
pu1_ngbr_pels,
|
|
pu1_mb_cb_rei1_buffer,
|
|
1,
|
|
u4_recwidth_cr,
|
|
((uc_useTopMB << 2) | (use_left2 << 4)
|
|
| use_left1));
|
|
}
|
|
u4_scale_u = ps_cur_mb_info->u1_qpc_div6;
|
|
u4_scale_v = ps_cur_mb_info->u1_qpcr_div6;
|
|
pi2_y_coeff = ps_dec->pi2_coeff_data;
|
|
|
|
{
|
|
UWORD32 i;
|
|
WORD16 ai2_tmp[16];
|
|
for(i = 0; i < 4; i++)
|
|
{
|
|
WORD16 *pi2_level = pi2_y_coeff + (i << 4);
|
|
UWORD8 *pu1_pred_sblk = pu1_mb_cb_rei1_buffer
|
|
+ ((i & 0x1) * BLK_SIZE * YUV420SP_FACTOR)
|
|
+ (i >> 1) * (u4_recwidth_cr << 2);
|
|
PROFILE_DISABLE_IQ_IT_RECON()
|
|
{
|
|
if(CHECKBIT(u2_chroma_csbp, i))
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_chroma_4x4(
|
|
pi2_level,
|
|
pu1_pred_sblk,
|
|
pu1_pred_sblk,
|
|
u4_recwidth_cr,
|
|
u4_recwidth_cr,
|
|
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qpc_rem6],
|
|
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[1],
|
|
u4_scale_u, ai2_tmp, pi2_level);
|
|
}
|
|
else if(pi2_level[0] != 0)
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_chroma_4x4_dc(
|
|
pi2_level,
|
|
pu1_pred_sblk,
|
|
pu1_pred_sblk,
|
|
u4_recwidth_cr,
|
|
u4_recwidth_cr,
|
|
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qpc_rem6],
|
|
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[1],
|
|
u4_scale_u, ai2_tmp, pi2_level);
|
|
}
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
pi2_y_coeff += MB_CHROM_SIZE;
|
|
u2_chroma_csbp = u2_chroma_csbp >> 4;
|
|
{
|
|
UWORD32 i;
|
|
WORD16 ai2_tmp[16];
|
|
for(i = 0; i < 4; i++)
|
|
{
|
|
WORD16 *pi2_level = pi2_y_coeff + (i << 4);
|
|
UWORD8 *pu1_pred_sblk = pu1_mb_cb_rei1_buffer + 1
|
|
+ ((i & 0x1) * BLK_SIZE * YUV420SP_FACTOR)
|
|
+ (i >> 1) * (u4_recwidth_cr << 2);
|
|
PROFILE_DISABLE_IQ_IT_RECON()
|
|
{
|
|
if(CHECKBIT(u2_chroma_csbp, i))
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_chroma_4x4(
|
|
pi2_level,
|
|
pu1_pred_sblk,
|
|
pu1_pred_sblk,
|
|
u4_recwidth_cr,
|
|
u4_recwidth_cr,
|
|
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qpcr_rem6],
|
|
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[2],
|
|
u4_scale_v, ai2_tmp, pi2_level);
|
|
}
|
|
else if(pi2_level[0] != 0)
|
|
{
|
|
ps_dec->pf_iquant_itrans_recon_chroma_4x4_dc(
|
|
pi2_level,
|
|
pu1_pred_sblk,
|
|
pu1_pred_sblk,
|
|
u4_recwidth_cr,
|
|
u4_recwidth_cr,
|
|
gau2_ih264_iquant_scale_4x4[ps_cur_mb_info->u1_qpcr_rem6],
|
|
(UWORD16 *)ps_dec->s_high_profile.i2_scalinglist4x4[2],
|
|
u4_scale_v, ai2_tmp, pi2_level);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
}
|
|
else
|
|
{
|
|
/* If no inverse transform is needed, pass recon buffer pointer */
|
|
/* to Intraprediction module instead of pred buffer pointer */
|
|
{
|
|
UWORD16 au2_ngbr_pels[33];
|
|
UWORD8 *pu1_ngbr_pels = (UWORD8 *)au2_ngbr_pels;
|
|
UWORD16 *pu2_left_uv;
|
|
UWORD16 *pu2_topleft_uv;
|
|
WORD32 use_left1 = (u2_use_left_mb_pack & 0x0ff);
|
|
WORD32 use_left2 = (u2_use_left_mb_pack & 0xff00) >> 8;
|
|
|
|
pu2_topleft_uv = (UWORD16 *)pu1_u_top_left;
|
|
pu2_left_uv = (UWORD16 *)pu1_uleft;
|
|
|
|
/* Get neighbour pixels */
|
|
/* left pels */
|
|
if(u2_use_left_mb_pack)
|
|
{
|
|
WORD32 i;
|
|
if(use_left1)
|
|
{
|
|
for(i = 0; i < 4; i++)
|
|
au2_ngbr_pels[8 - 1 - i] = pu2_left_uv[i
|
|
* u4_recwidth_cr / YUV420SP_FACTOR];
|
|
}
|
|
else
|
|
{
|
|
memset(au2_ngbr_pels + 4, 0, 4 * sizeof(UWORD16));
|
|
}
|
|
|
|
if(use_left2)
|
|
{
|
|
for(i = 4; i < 8; i++)
|
|
au2_ngbr_pels[8 - 1 - i] = pu2_left_uv[i
|
|
* u4_recwidth_cr / YUV420SP_FACTOR];
|
|
}
|
|
else
|
|
{
|
|
memset(au2_ngbr_pels, 0, 4 * sizeof(UWORD16));
|
|
}
|
|
|
|
}
|
|
else
|
|
{
|
|
memset(au2_ngbr_pels, 0, 8 * sizeof(UWORD16));
|
|
}
|
|
|
|
/* top left pels */
|
|
au2_ngbr_pels[8] = *pu2_topleft_uv;
|
|
|
|
/* top pels */
|
|
if(uc_useTopMB)
|
|
{
|
|
memcpy(au2_ngbr_pels + 8 + 1, pu1_top_u,
|
|
8 * sizeof(UWORD16));
|
|
}
|
|
else
|
|
{
|
|
memset(au2_ngbr_pels + 8 + 1, 0, 8 * sizeof(UWORD16));
|
|
}
|
|
|
|
PROFILE_DISABLE_INTRA_PRED()
|
|
ps_dec->apf_intra_pred_chroma[u1_intra_chrom_pred_mode](
|
|
pu1_ngbr_pels,
|
|
pu1_mb_cb_rei1_buffer,
|
|
1,
|
|
u4_recwidth_cr,
|
|
((uc_useTopMB << 2) | (use_left2 << 4)
|
|
| use_left1));
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
return OK;
|
|
}
|