diff options
Diffstat (limited to 'Src/h264dec/ldecod/src/macroblock.c')
-rw-r--r-- | Src/h264dec/ldecod/src/macroblock.c | 6475 |
1 files changed, 6475 insertions, 0 deletions
diff --git a/Src/h264dec/ldecod/src/macroblock.c b/Src/h264dec/ldecod/src/macroblock.c new file mode 100644 index 00000000..10d083b1 --- /dev/null +++ b/Src/h264dec/ldecod/src/macroblock.c @@ -0,0 +1,6475 @@ + +/*! +*********************************************************************** +* \file macroblock.c +* +* \brief +* Decode a Macroblock +* +* \author +* Main contributors (see contributors.h for copyright, address and affiliation details) +* - Inge Lille-Langøy <inge.lille-langoy@telenor.com> +* - Rickard Sjoberg <rickard.sjoberg@era.ericsson.se> +* - Jani Lainema <jani.lainema@nokia.com> +* - Sebastian Purreiter <sebastian.purreiter@mch.siemens.de> +* - Thomas Wedi <wedi@tnt.uni-hannover.de> +* - Detlev Marpe <marpe@hhi.de> +* - Gabi Blaettermann +* - Ye-Kui Wang <wyk@ieee.org> +* - Lowell Winger <lwinger@lsil.com> +* - Alexis Michael Tourapis <alexismt@ieee.org> +*********************************************************************** +*/ + +#include "contributors.h" + +#include <math.h> + +#include "block.h" +#include "global.h" +#include "mbuffer.h" +#include "elements.h" +#include "errorconcealment.h" +#include "macroblock.h" +#include "fmo.h" +#include "cabac.h" +#include "vlc.h" +#include "image.h" +#include "mb_access.h" +#include "biaridecod.h" +#include "transform8x8.h" +#include "transform.h" +#include "mc_prediction.h" +#include "quant.h" +#include "intra4x4_pred.h" +#include "intra8x8_pred.h" +#include "intra16x16_pred.h" +#include "mv_prediction.h" +#include "optim.h" +#include "mb_prediction.h" +#include <emmintrin.h> +#include <smmintrin.h> + +#if TRACE +#define TRACE_STRING(s) strncpy(currSE.tracestring, s, TRACESTRING_SIZE) +#define TRACE_DECBITS(i) dectracebitcnt(1) +#define TRACE_PRINTF(s) sprintf(type, "%s", s); +#define TRACE_STRING_P(s) strncpy(currSE->tracestring, s, TRACESTRING_SIZE) +#else +#define TRACE_STRING(s) +#define TRACE_DECBITS(i) +#define TRACE_PRINTF(s) +#define TRACE_STRING_P(s) +#endif + +//! look up tables for FRExt_chroma support +void dectracebitcnt(int count); + +static void read_motion_info_from_NAL_p_slice (Macroblock *currMB); +static void read_motion_info_from_NAL_b_slice (Macroblock *currMB); +static void read_ipred_modes (Macroblock *currMB); +static void read_CBP_and_coeffs_from_NAL_CABAC (Macroblock *currMB); +static void read_CBP_and_coeffs_from_NAL_CAVLC (Macroblock *currMB); +static void read_IPCM_coeffs_from_NAL (Slice *currSlice, struct datapartition *dP); +static void read_one_macroblock_i_slice (Macroblock *currMB); +static void read_one_macroblock_p_slice (Macroblock *currMB); +static void read_one_macroblock_b_slice (Macroblock *currMB); +static int decode_one_component_i_slice (Macroblock *currMB, ColorPlane curr_plane, struct video_image *image, StorablePicture *dec_picture); +static int decode_one_component_p_slice (Macroblock *currMB, ColorPlane curr_plane, struct video_image *image, StorablePicture *dec_picture); +static int decode_one_component_b_slice (Macroblock *currMB, ColorPlane curr_plane, struct video_image *image, StorablePicture *dec_picture); +static int decode_one_component_sp_slice (Macroblock *currMB, ColorPlane curr_plane, struct video_image *image, StorablePicture *dec_picture); + +static inline void or_bits(int64 *x, int mask, int position) +{ +#ifdef _M_IX86 + __m64 mmx_x = *(__m64 *)x; + __m64 mmx_mask = _mm_cvtsi32_si64(mask); + mmx_mask=_mm_slli_si64(mmx_mask, position); + mmx_x = _mm_or_si64(mmx_x, mmx_mask); + *(__m64 *)x = mmx_x; +#else + *x |= ((int64) mask << position); +#endif +} + +/*! +************************************************************************ +* \brief +* Set context for reference frames +************************************************************************ +*/ +static inline int BType2CtxRef (int btype) +{ + return (btype >= 4); +} + +/*! +************************************************************************ +* \brief +* Function for reading the reference picture indices using VLC +************************************************************************ +*/ +static char readRefPictureIdx_VLC(SyntaxElement *currSE, DataPartition *dP, int list) +{ +#if TRACE + char tstring[20]; + sprintf( tstring, "ref_idx_l%d", list); + strncpy(currSE->tracestring, tstring, TRACESTRING_SIZE); +#endif + currSE->value2 = list; + readSyntaxElement_UVLC(currSE, dP); + return (char) currSE->value1; +} + +/*! +************************************************************************ +* \brief +* Function for reading the reference picture indices using FLC +************************************************************************ +*/ +static char readRefPictureIdx_FLC(SyntaxElement *currSE, DataPartition *dP, int list) +{ +#if TRACE + char tstring[20]; + sprintf( tstring, "ref_idx_l%d", list); + strncpy(currSE->tracestring, tstring, TRACESTRING_SIZE); +#endif + //currSE->len = 1; + currSE->value1 = 1 - readSyntaxElement_FLC(dP->bitstream, 1); + + return (char) currSE->value1; +} + +/*! +************************************************************************ +* \brief +* Dummy Function for reading the reference picture indices +************************************************************************ +*/ +static char readRefPictureIdx_Null(SyntaxElement *currSE, DataPartition *dP, int list) +{ + return 0; +} + +/*! +************************************************************************ +* \brief +* Function to prepare reference picture indice function pointer +************************************************************************ +*/ +static void prepareListforRefIdx ( Macroblock *currMB, SyntaxElement *currSE, int num_ref_idx_active, int refidx_present) +{ + currMB->readRefPictureIdx = readRefPictureIdx_Null; // Initialize readRefPictureIdx + if(num_ref_idx_active > 1) + { + currSE->mapping = linfo_ue; + if (refidx_present) + { + if (num_ref_idx_active == 2) + currMB->readRefPictureIdx = readRefPictureIdx_FLC; + else + currMB->readRefPictureIdx = readRefPictureIdx_VLC; + } + } +} + +#if defined(_DEBUG) || defined(_M_X64) +void set_chroma_qp(Macroblock* currMB) +{ + // TODO: benski> we could use MMX for this if we could find a formula for QP_SCALE_CR + VideoParameters *p_Vid = currMB->p_Vid; + StorablePicture *dec_picture = p_Vid->dec_picture; + int i; + for (i=0; i<2; ++i) + { + currMB->qpc[i] = iClip3 ( -p_Vid->bitdepth_chroma_qp_scale, 51, currMB->qp + dec_picture->chroma_qp_offset[i] ); + currMB->qpc[i] = currMB->qpc[i] < 0 ? currMB->qpc[i] : QP_SCALE_CR[currMB->qpc[i]]; + currMB->qp_scaled[i + 1] = currMB->qpc[i] + p_Vid->bitdepth_chroma_qp_scale; + } +} +#else +void set_chroma_qp(Macroblock* currMB); +#endif + +/*! +************************************************************************ +* \brief +* updates chroma QP according to luma QP and bit depth +************************************************************************ +*/ +static inline void update_qp(Macroblock *currMB, int qp) +{ + VideoParameters *p_Vid = currMB->p_Vid; + currMB->qp = qp; + currMB->qp_scaled[0] = qp + p_Vid->bitdepth_luma_qp_scale; + set_chroma_qp(currMB); + currMB->is_lossless = (Boolean) ((currMB->qp_scaled[0] == 0) && (p_Vid->lossless_qpprime_flag == 1)); +} + +static void read_delta_quant_CAVLC(SyntaxElement *currSE, DataPartition *dP, Macroblock *currMB, const byte *partMap, int type) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + + dP = &(currSlice->partArr[partMap[type]]); + + + currSE->mapping = linfo_se; + readSyntaxElement_UVLC(currSE, dP); + currMB->delta_quant = (short) currSE->value1; + + + if ((currMB->delta_quant < -(26 + p_Vid->bitdepth_luma_qp_scale/2)) || (currMB->delta_quant > (25 + p_Vid->bitdepth_luma_qp_scale/2))) + error ("mb_qp_delta is out of range", 500); + + p_Vid->qp = ((p_Vid->qp + currMB->delta_quant + 52 + 2*p_Vid->bitdepth_luma_qp_scale)%(52+p_Vid->bitdepth_luma_qp_scale)) - + p_Vid->bitdepth_luma_qp_scale; + update_qp(currMB, p_Vid->qp); +} + +static void inline read_delta_quant_CABAC(SyntaxElement *currSE, DataPartition *dP, Macroblock *currMB, const byte *partMap, int type) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + + dP = &(currSlice->partArr[partMap[type]]); + + currMB->delta_quant = readDquant_CABAC(currSlice, &dP->de_cabac); + + if ((currMB->delta_quant < -(26 + p_Vid->bitdepth_luma_qp_scale/2)) || (currMB->delta_quant > (25 + p_Vid->bitdepth_luma_qp_scale/2))) + error ("mb_qp_delta is out of range", 500); + + p_Vid->qp = ((p_Vid->qp + currMB->delta_quant + 52 + 2*p_Vid->bitdepth_luma_qp_scale)%(52+p_Vid->bitdepth_luma_qp_scale)) - p_Vid->bitdepth_luma_qp_scale; + update_qp(currMB, p_Vid->qp); +} + +/*! +************************************************************************ +* \brief +* Function to read reference picture indice values +************************************************************************ +*/ +static void readMBRefPictureIdx(SyntaxElement *currSE, DataPartition *dP, Macroblock *currMB, PicMotion **motion, int list, int step_v0, int step_h0) +{ + int k, j, j0, i0, i; + char refframe; + + for (j0 = 0; j0 < 4; j0 += step_v0) + { + currMB->subblock_y = j0 << 2; + for (i0 = 0; i0 < 4; i0 += step_h0) + { + currMB->subblock_x = i0 << 2; + k = 2 * (j0 >> 1) + (i0 >> 1); + + if ((currMB->b8pdir[k] == list || currMB->b8pdir[k] == BI_PRED) && currMB->b8mode[k] != 0) + { + refframe = currMB->readRefPictureIdx(currSE, dP, list); + + for (j = j0; j < j0 + step_v0; ++j) + { + for (i=0;i<step_h0;i++) + { + motion[j][currMB->block_x + i0 + i].ref_idx = refframe; + } + } + } + } + } +} + +static void readMBRefPictureIdx_CABAC1(DataPartition *dP, Macroblock *currMB, PicMotion **motion, int list, int step_v0) +{ + int k, j, j0, i0; + char refframe; + + for (j0 = 0; j0 < 4; j0 += step_v0) + { + currMB->subblock_y = j0 << 2; + for (i0 = 0; i0 < 4; i0 += 1) + { + currMB->subblock_x = i0 << 2; + k = 2 * (j0 >> 1) + (i0 >> 1); + + if ((currMB->b8pdir[k] == list || currMB->b8pdir[k] == BI_PRED) && currMB->b8mode[k] != 0) + { + refframe = readRefFrame_CABAC(currMB, &dP->de_cabac, list, i0<<2, j0<<2); + + for (j = j0; j < j0 + step_v0; ++j) + motion[j][currMB->block_x + i0].ref_idx=refframe; + } + } + } +} + +static void readMBRefPictureIdx_CABAC2(DataPartition *dP, Macroblock *currMB, PicMotion **motion, int list, int step_v0) +{ + int k, j, j0; + char refframe; + + for (j0 = 0; j0 < 4; j0 += step_v0) + { + currMB->subblock_y = j0 << 2; + + currMB->subblock_x = 0 << 2; + k = 2 * (j0 >> 1) + (0 >> 1); + + if ((currMB->b8pdir[k] == list || currMB->b8pdir[k] == BI_PRED) && currMB->b8mode[k] != 0) + { + refframe = readRefFrame_CABAC0(currMB, &dP->de_cabac, list, j0<<2); + + for (j = j0; j < j0 + step_v0; ++j) + { + motion[j][currMB->block_x + 0].ref_idx=refframe; + motion[j][currMB->block_x + 1].ref_idx=refframe; + } + } + + // + + currMB->subblock_x = 2 << 2; + k = 2 * (j0 >> 1) + (2 >> 1); + + if ((currMB->b8pdir[k] == list || currMB->b8pdir[k] == BI_PRED) && currMB->b8mode[k] != 0) + { + refframe = readRefFrame_CABAC(currMB, &dP->de_cabac, list, 8, j0<<2); + + for (j = j0; j < j0 + step_v0; ++j) + { + motion[j][currMB->block_x + 2].ref_idx=refframe; + motion[j][currMB->block_x + 3].ref_idx=refframe; + } + } + + } +} + + +static void readMBRefPictureIdx_CABAC4(DataPartition *dP, Macroblock *currMB, PicMotion **motion, int list, int step_v0) +{ + int k, j, j0; + char refframe; + + for (j0 = 0; j0 < 4; j0 += step_v0) + { + currMB->subblock_y = j0 << 2; + currMB->subblock_x = 0; + k = j0 & ~1; + + if ((currMB->b8pdir[k] == list || currMB->b8pdir[k] == BI_PRED) && currMB->b8mode[k] != 0) + { + refframe = readRefFrame_CABAC0(currMB, &dP->de_cabac, list, j0<<2); + for (j = j0; j < j0 + step_v0; ++j) + { + motion[j][currMB->block_x + 0].ref_idx=refframe; + motion[j][currMB->block_x + 1].ref_idx=refframe; + motion[j][currMB->block_x + 2].ref_idx=refframe; + motion[j][currMB->block_x + 3].ref_idx=refframe; + } + } + } +} + +static void readMBRefPictureIdx_CABAC(DataPartition *dP, Macroblock *currMB, PicMotion **motion, int list, int step_v0, int step_h0) +{ + switch(step_h0) + { + case 1: + readMBRefPictureIdx_CABAC1(dP, currMB, motion, list, step_v0); + break; + case 2: + readMBRefPictureIdx_CABAC2(dP, currMB, motion, list, step_v0); + break; + case 4: + readMBRefPictureIdx_CABAC4(dP, currMB, motion, list, step_v0); + break; + } +} + +static void readMBRefPictureIdx_CABAC_NoReference(Macroblock *currMB, PicMotion **motion, int list, int step_v0, int step_h0) +{ + int k, j, j0, i0, i; + + for (j0 = 0; j0 < 4; j0 += step_v0) + { + for (i0 = 0; i0 < 4; i0 += step_h0) + { + k = 2 * (j0 >> 1) + (i0 >> 1); + + if ((currMB->b8pdir[k] == list || currMB->b8pdir[k] == BI_PRED) && currMB->b8mode[k] != 0) + { + for (j = j0; j < j0 + step_v0; ++j) + { + for (i=0;i<step_h0;i++) + { + motion[j][currMB->block_x + i0 + i].ref_idx=0; + } + } + } + } + } +} + +/*! +************************************************************************ +* \brief +* Function to read reference picture indice values +************************************************************************ +*/ +static void readMBMotionVectors(SyntaxElement *currSE, DataPartition *dP, Macroblock *currMB, int list, int step_h0, int step_v0) +{ + int i, j, k, i4, j4, ii, jj, kk, i0, j0; + short curr_mvd[2], curr_mv[2], pred_mv[2]; + MotionVector (*mvd)[4]; + //MotionVector **mv; + int mv_mode, step_h, step_v; + char cur_ref_idx; + VideoParameters *p_Vid = currMB->p_Vid; + StorablePicture *dec_picture = p_Vid->dec_picture; + PicMotionParams *motion = &dec_picture->motion; + PixelPos block[4]; // neighbor blocks + + + for (j0=0; j0<4; j0+=step_v0) + { + for (i0=0; i0<4; i0+=step_h0) + { + kk = 2 * (j0 >> 1) + (i0 >> 1); + if ((currMB->b8pdir[kk]== list || currMB->b8pdir[kk]== BI_PRED) && (currMB->b8mode[kk] !=0))//has forward vector + { + PicMotion **list_motion = motion->motion[list]; + cur_ref_idx = list_motion[currMB->block_y+j0][currMB->block_x+i0].ref_idx; + mv_mode = currMB->b8mode[kk]; + step_h = BLOCK_STEP [mv_mode][0]; + step_v = BLOCK_STEP [mv_mode][1]; + + for (j = j0; j < j0 + step_v0; j += step_v) + { + PicMotion **mv; + currMB->subblock_y = j << 2; // position used for context determination + j4 = currMB->block_y + j; + mv = &list_motion[j4]; + mvd = &currMB->mvd [list][j]; + for (i = i0; i < i0 + step_h0; i += step_h) + { + currMB->subblock_x = i << 2; // position used for context determination + i4 = currMB->block_x + i; + + get_neighbors(currMB, block, BLOCK_SIZE * i, BLOCK_SIZE * j, 4 * step_h); + + // first make mv-prediction + currMB->GetMVPredictor (currMB, block, pred_mv, cur_ref_idx, list_motion, BLOCK_SIZE * i, BLOCK_SIZE * j, 4 * step_h, 4 * step_v); + + for (k=0; k < 2; ++k) + { + currSE->value2 = (k << 1) + list; // identifies the component; only used for context determination + readSyntaxElement_UVLC(currSE, dP); + curr_mvd[k] = (short) currSE->value1; + curr_mv [k] = (short)(curr_mvd[k] + pred_mv[k]); // compute motion vector + } + + // Init motion vectors + for(jj = 0; jj < step_v; ++jj) + { + for(ii = i4; ii < i4 + step_h; ++ii) + { + memcpy(&mv[jj][ii].mv, curr_mv, sizeof(MotionVector)); + } + } + + // Init first line (mvd) + for(ii = i; ii < i + step_h; ++ii) + { + memcpy(mvd[0][ii], curr_mvd, sizeof(MotionVector)); + } + + // now copy all other lines + for(jj = 1; jj < step_v; ++jj) + { + memcpy(mvd[jj][i], mvd[0][i], step_h * sizeof(MotionVector)); + } + } + } + } + } + } +} + +static void readMBMotionVectors_CABAC(DataPartition *dP, Macroblock *currMB, int list, int step_h0, int step_v0) +{ + int i, j, k, i4, j4, ii, jj, kk, i0, j0; + short curr_mvd[2], curr_mv[2], pred_mv[2]; + MotionVector (*mvd)[4]; + //MotionVector **mv; + int mv_mode, step_h, step_v; + char cur_ref_idx; + VideoParameters *p_Vid = currMB->p_Vid; + StorablePicture *dec_picture = p_Vid->dec_picture; + PicMotionParams *motion = &dec_picture->motion; + PixelPos block[4]; // neighbor blocks + + for (j0=0; j0<4; j0+=step_v0) + { + for (i0=0; i0<4; i0+=step_h0) + { + kk = (j0 & ~1) + (i0 >> 1); + if ((currMB->b8pdir[kk]== list || currMB->b8pdir[kk]== BI_PRED) && (currMB->b8mode[kk] !=0))//has forward vector + { + PicMotion **list_motion = motion->motion[list]; + cur_ref_idx = list_motion[currMB->block_y+j0][currMB->block_x+i0].ref_idx; + mv_mode = currMB->b8mode[kk]; + step_h = BLOCK_STEP [mv_mode][0]; + step_v = BLOCK_STEP [mv_mode][1]; + + for (j = j0; j < j0 + step_v0; j += step_v) + { + PicMotion **mv; + int block_j = j << 2; + currMB->subblock_y = block_j; // position used for context determination + j4 = currMB->block_y + j; + mv = &list_motion[j4]; + mvd = &currMB->mvd [list][j]; + for (i = i0; i < i0 + step_h0; i += step_h) + { + int block_i=i << 2; + currMB->subblock_x = block_i; // position used for context determination + i4 = currMB->block_x + i; + + get_neighbors(currMB, block, block_i, block_j, 4 * step_h); + + // first make mv-prediction + currMB->GetMVPredictor (currMB, block, pred_mv, cur_ref_idx, list_motion, block_i, block_j, 4 * step_h, 4 * step_v); + + for (k=0; k < 2; ++k) + { + //currSE.value2 = (k << 1) + list; // identifies the component; only used for context determination + curr_mvd[k] = (short)readMVD_CABAC(currMB, &dP->de_cabac, k, list, block_i, block_j); + curr_mv [k] = (short)(curr_mvd[k] + pred_mv[k]); // compute motion vector + } + + // Init motion vectors + for(jj = 0; jj < step_v; ++jj) + { + for(ii = i4; ii < i4 + step_h; ++ii) + { + *(int32_t *)(&mv[jj][ii].mv) = *(int32_t *)curr_mv; + } + } + + // Init first line (mvd) + for(ii = i; ii < i + step_h; ++ii) + { + *(int32_t *)(mvd[0][ii]) = *(int32_t *)curr_mvd; + } + + // now copy all other lines + for(jj = 1; jj < step_v; ++jj) + { + memcpy_amd(mvd[jj][i], mvd[0][i], step_h * sizeof(MotionVector)); + } + } + } + } + } + } +} + +/*! +************************************************************************ +* \brief +* initializes the current macroblock +************************************************************************ +*/ +void start_macroblock(Slice *currSlice, Macroblock **currMB) +{ + VideoParameters *p_Vid = currSlice->p_Vid; + StorablePicture *dec_picture = p_Vid->dec_picture; + int mb_nr = p_Vid->current_mb_nr; + Macroblock *mb = &p_Vid->mb_data[mb_nr]; // intialization code deleted, see below, StW + *currMB = mb; + + mb->p_Vid = p_Vid; + mb->p_Slice = currSlice; + mb->mbAddrX = mb_nr; + + //assert (mb_nr < (int) p_Vid->PicSizeInMbs); + + /* Update coordinates of the current macroblock */ + if (currSlice->mb_aff_frame_flag) + { + mb->mb_x = (mb_nr) % ((2*p_Vid->width) / MB_BLOCK_SIZE); + mb->mb_y = 2*((mb_nr) / ((2*p_Vid->width) / MB_BLOCK_SIZE)); + + mb->mb_y += (mb->mb_x & 0x01); + mb->mb_x >>= 1; + } + else + { + mb->mb_x = p_Vid->PicPos[mb_nr][0]; + mb->mb_y = p_Vid->PicPos[mb_nr][1]; + } + + /* Define vertical positions */ + mb->block_y = mb->mb_y * BLOCK_SIZE; /* luma block position */ + mb->block_y_aff = mb->block_y; + mb->pix_y = mb->mb_y * MB_BLOCK_SIZE; /* luma macroblock position */ + mb->pix_c_y = mb->mb_y * p_Vid->mb_cr_size_y; /* chroma macroblock position */ + + /* Define horizontal positions */ + mb->block_x = mb->mb_x * BLOCK_SIZE; /* luma block position */ + mb->pix_x = mb->mb_x * MB_BLOCK_SIZE; /* luma pixel position */ + mb->pix_c_x = mb->mb_x * p_Vid->mb_cr_size_x; /* chroma pixel position */ + + // Save the slice number of this macroblock. When the macroblock below + // is coded it will use this to decide if prediction for above is possible + mb->slice_nr = (short) p_Vid->current_slice_nr; + + if (p_Vid->current_slice_nr >= MAX_NUM_SLICES) + { + error ("Maximum number of supported slices exceeded. \nPlease recompile with increased value for MAX_NUM_SLICES", 200); + } + + dec_picture->slice_id[mb->mb_y][mb->mb_x] = (short) p_Vid->current_slice_nr; + dec_picture->max_slice_id = (short) imax(p_Vid->current_slice_nr, dec_picture->max_slice_id); + + CheckAvailabilityOfNeighbors(mb); + + // Select appropriate MV predictor function + init_motion_vector_prediction(*currMB, currSlice->mb_aff_frame_flag); + + set_read_and_store_CBP(currMB, currSlice->active_sps->chroma_format_idc); + + // Reset syntax element entries in MB struct + update_qp(*currMB, p_Vid->qp); + mb->mb_type = 0; + mb->delta_quant = 0; + mb->cbp = 0; + mb->c_ipred_mode = DC_PRED_8; //GB + + if (currSlice->slice_type != I_SLICE) + { + if (currSlice->slice_type != B_SLICE) + memzero64(mb->mvd);//, BLOCK_MULTIPLE * BLOCK_MULTIPLE * 2 * sizeof(short)); + else + memzero128(mb->mvd);//, 2 * BLOCK_MULTIPLE * BLOCK_MULTIPLE * 2 * sizeof(short)); + } + + memzero24(mb->cbp_blk); + memzero24(mb->cbp_bits); + memzero24(mb->cbp_bits_8x8); + + // initialize currSlice->mb_rres + memset(currSlice->mb_rres8, 0, sizeof(currSlice->mb_rres8)); + + // store filtering parameters for this MB + mb->DFDisableIdc = currSlice->DFDisableIdc; + mb->DFAlphaC0Offset = currSlice->DFAlphaC0Offset; + mb->DFBetaOffset = currSlice->DFBetaOffset; + +} + +/*! +************************************************************************ +* \brief +* set coordinates of the next macroblock +* check end_of_slice condition +************************************************************************ +*/ +Boolean exit_macroblock(Slice *currSlice, int eos_bit) +{ + VideoParameters *p_Vid = currSlice->p_Vid; + + //! The if() statement below resembles the original code, which tested + //! p_Vid->current_mb_nr == p_Vid->PicSizeInMbs. Both is, of course, nonsense + //! In an error prone environment, one can only be sure to have a new + //! picture by checking the tr of the next slice header! + + // printf ("exit_macroblock: FmoGetLastMBOfPicture %d, p_Vid->current_mb_nr %d\n", FmoGetLastMBOfPicture(), p_Vid->current_mb_nr); + ++(p_Vid->num_dec_mb); + + if (p_Vid->num_dec_mb == p_Vid->PicSizeInMbs) + { + return TRUE; + } + // ask for last mb in the slice CAVLC + else + { + + p_Vid->current_mb_nr = FmoGetNextMBNr (p_Vid, p_Vid->current_mb_nr); + + if (p_Vid->current_mb_nr == -1) // End of Slice group, MUST be end of slice + { + assert (currSlice->nal_startcode_follows (currSlice, eos_bit) == TRUE); + return TRUE; + } + + if(currSlice->nal_startcode_follows(currSlice, eos_bit) == FALSE) + return FALSE; + + if(currSlice->slice_type == I_SLICE || currSlice->slice_type == SI_SLICE || p_Vid->active_pps->entropy_coding_mode_flag == CABAC) + return TRUE; + if(p_Vid->cod_counter <= 0) + return TRUE; + return FALSE; + } +} + +/*! +************************************************************************ +* \brief +* Interpret the mb mode for P-Frames +************************************************************************ +*/ +static void interpret_mb_mode_P(Macroblock *currMB) +{ + VideoParameters *p_Vid = currMB->p_Vid; + + static const int ICBPTAB[6] = {0,16,32,15,31,47}; + int mbmode = currMB->mb_type; + +#define ZERO_P8x8 (mbmode==5) +#define MODE_IS_P8x8 (mbmode==4 || mbmode==5) +#define MODE_IS_I4x4 (mbmode==6) +#define I16OFFSET (mbmode-7) +#define MODE_IS_IPCM (mbmode==31) + + if(mbmode <4) + { + currMB->mb_type = mbmode; + memset(&currMB->b8mode[0],mbmode,4 * sizeof(char)); + memset(&currMB->b8pdir[0], 0, 4 * sizeof(char)); + } + else if(MODE_IS_P8x8) + { + currMB->mb_type = P8x8; + p_Vid->allrefzero = ZERO_P8x8; + } + else if(MODE_IS_I4x4) + { + currMB->mb_type = I4MB; + memset(&currMB->b8mode[0],IBLOCK, 4 * sizeof(char)); + memset(&currMB->b8pdir[0], -1, 4 * sizeof(char)); + } + else if(MODE_IS_IPCM) + { + currMB->mb_type = IPCM; + currMB->cbp = -1; + currMB->i16mode = 0; + + memset(&currMB->b8mode[0], 0, 4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1, 4 * sizeof(char)); + } + else + { + currMB->mb_type = I16MB; + currMB->cbp = ICBPTAB[(I16OFFSET)>>2]; + currMB->i16mode = (I16OFFSET) & 0x03; + memset(&currMB->b8mode[0], 0, 4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1, 4 * sizeof(char)); + } +} + +/*! +************************************************************************ +* \brief +* Interpret the mb mode for I-Frames +************************************************************************ +*/ +static void interpret_mb_mode_I(Macroblock *currMB) +{ + static const int ICBPTAB[6] = {0,16,32,15,31,47}; + int mbmode = currMB->mb_type; + + if (mbmode==0) + { + currMB->mb_type = I4MB; + memset(&currMB->b8mode[0],IBLOCK,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + } + else if(mbmode==25) + { + currMB->mb_type=IPCM; + currMB->cbp= -1; + currMB->i16mode = 0; + + memset(&currMB->b8mode[0],0,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + } + else + { + currMB->mb_type = I16MB; + currMB->cbp= ICBPTAB[(mbmode-1)>>2]; + currMB->i16mode = (mbmode-1) & 0x03; + memset(&currMB->b8mode[0], 0, 4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1, 4 * sizeof(char)); + } +} + +/*! +************************************************************************ +* \brief +* Interpret the mb mode for B-Frames +************************************************************************ +*/ +static void interpret_mb_mode_B(Macroblock *currMB) +{ + static const int offset2pdir16x16[12] = {0, 0, 1, 2, 0,0,0,0,0,0,0,0}; + static const int offset2pdir16x8[22][2] = {{0,0},{0,0},{0,0},{0,0},{0,0},{0,0},{1,1},{0,0},{0,1},{0,0},{1,0}, + {0,0},{0,2},{0,0},{1,2},{0,0},{2,0},{0,0},{2,1},{0,0},{2,2},{0,0}}; + static const int offset2pdir8x16[22][2] = {{0,0},{0,0},{0,0},{0,0},{0,0},{0,0},{0,0},{1,1},{0,0},{0,1},{0,0}, + {1,0},{0,0},{0,2},{0,0},{1,2},{0,0},{2,0},{0,0},{2,1},{0,0},{2,2}}; + + static const int ICBPTAB[6] = {0,16,32,15,31,47}; + + int i, mbmode; + int mbtype = currMB->mb_type; + + //--- set mbtype, b8type, and b8pdir --- + if (mbtype==0) // direct + { + mbmode=0; + memset(&currMB->b8mode[0],0,4 * sizeof(char)); + memset(&currMB->b8pdir[0],2,4 * sizeof(char)); + } + else if (mbtype==23) // intra4x4 + { + mbmode=I4MB; + memset(&currMB->b8mode[0],IBLOCK,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + } + else if ((mbtype>23) && (mbtype<48) ) // intra16x16 + { + mbmode=I16MB; + memset(&currMB->b8mode[0],0,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + + currMB->cbp = ICBPTAB[(mbtype-24)>>2]; + currMB->i16mode = (mbtype-24) & 0x03; + } + else if (mbtype==22) // 8x8(+split) + { + mbmode=P8x8; // b8mode and pdir is transmitted in additional codewords + } + else if (mbtype<4) // 16x16 + { + mbmode=1; + memset(&currMB->b8mode[0], 1,4 * sizeof(char)); + memset(&currMB->b8pdir[0],offset2pdir16x16[mbtype],4 * sizeof(char)); + } + else if(mbtype==48) + { + mbmode=IPCM; + memset(&currMB->b8mode[0], 0,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + + currMB->cbp= -1; + currMB->i16mode = 0; + } + + else if ((mbtype&0x01)==0) // 16x8 + { + mbmode=2; + memset(&currMB->b8mode[0], 2,4 * sizeof(char)); + for(i=0;i<4;++i) + { + currMB->b8pdir[i] = (char) offset2pdir16x8 [mbtype][i>>1]; + } + } + else + { + mbmode=3; + memset(&currMB->b8mode[0], 3,4 * sizeof(char)); + for(i=0;i<4; ++i) + { + currMB->b8pdir[i] = (char) offset2pdir8x16 [mbtype][i&0x01]; + } + } + currMB->mb_type = mbmode; +} +/*! +************************************************************************ +* \brief +* Interpret the mb mode for SI-Frames +************************************************************************ +*/ +static void interpret_mb_mode_SI(Macroblock *currMB) +{ + VideoParameters *p_Vid = currMB->p_Vid; + const int ICBPTAB[6] = {0,16,32,15,31,47}; + int mbmode = currMB->mb_type; + + if (mbmode==0) + { + currMB->mb_type = SI4MB; + memset(&currMB->b8mode[0],IBLOCK,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + p_Vid->siblock[currMB->mb_y][currMB->mb_x]=1; + } + else if (mbmode==1) + { + currMB->mb_type = I4MB; + memset(&currMB->b8mode[0],IBLOCK,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + } + else if(mbmode==26) + { + currMB->mb_type=IPCM; + currMB->cbp= -1; + currMB->i16mode = 0; + memset(&currMB->b8mode[0],0,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + } + + else + { + currMB->mb_type = I16MB; + currMB->cbp= ICBPTAB[(mbmode-2)>>2]; + currMB->i16mode = (mbmode-2) & 0x03; + memset(&currMB->b8mode[0],0,4 * sizeof(char)); + memset(&currMB->b8pdir[0],-1,4 * sizeof(char)); + } +} + +/*! +************************************************************************ +* \brief +* Set mode interpretation based on slice type +************************************************************************ +*/ +void setup_slice_methods(Slice *currSlice) +{ + switch (currSlice->slice_type) + { + case P_SLICE: + currSlice->interpret_mb_mode = interpret_mb_mode_P; + currSlice->read_motion_info_from_NAL = read_motion_info_from_NAL_p_slice; + currSlice->read_one_macroblock = read_one_macroblock_p_slice; + currSlice->decode_one_component = decode_one_component_p_slice; + break; + case SP_SLICE: + currSlice->interpret_mb_mode = interpret_mb_mode_P; + currSlice->read_motion_info_from_NAL = read_motion_info_from_NAL_p_slice; + currSlice->read_one_macroblock = read_one_macroblock_p_slice; + currSlice->decode_one_component = decode_one_component_sp_slice; + break; + case B_SLICE: + currSlice->interpret_mb_mode = interpret_mb_mode_B; + currSlice->read_motion_info_from_NAL = read_motion_info_from_NAL_b_slice; + currSlice->read_one_macroblock = read_one_macroblock_b_slice; + currSlice->decode_one_component = decode_one_component_b_slice; + break; + case I_SLICE: + currSlice->interpret_mb_mode = interpret_mb_mode_I; + currSlice->read_motion_info_from_NAL = NULL; + currSlice->read_one_macroblock = read_one_macroblock_i_slice; + currSlice->decode_one_component = decode_one_component_i_slice; + break; + case SI_SLICE: + currSlice->interpret_mb_mode = interpret_mb_mode_SI; + currSlice->read_motion_info_from_NAL = NULL; + currSlice->read_one_macroblock = read_one_macroblock_i_slice; + currSlice->decode_one_component = decode_one_component_i_slice; + break; + default: + printf("Unsupported slice type\n"); + break; + } + + if( IS_INDEPENDENT(currSlice->p_Vid) ) + currSlice->compute_colocated = compute_colocated_JV; + else + { + if (currSlice->active_sps->frame_mbs_only_flag) + currSlice->compute_colocated = compute_colocated; + else + currSlice->compute_colocated = compute_colocated_frames_mbs; + } + + switch(currSlice->p_Vid->active_pps->entropy_coding_mode_flag) + { + case CABAC: + currSlice->read_CBP_and_coeffs_from_NAL = read_CBP_and_coeffs_from_NAL_CABAC; + break; + case CAVLC: + currSlice->read_CBP_and_coeffs_from_NAL = read_CBP_and_coeffs_from_NAL_CAVLC; + break; + default: + printf("Unsupported entropy coding mode\n"); + break; + } + +} + +void macroblock_set_dc_pred(VideoParameters *p_Vid, int block_x, int block_y) +{ + int32_t dc_pred = 2 + (2 << 8) + (2 << 16) + (2 << 24); + int32_t *pred = (int32_t *)&p_Vid->ipredmode[block_y][block_x]; + int stride = p_Vid->PicWidthInMbs; + int i; + for (i=0;i<BLOCK_SIZE;i++) + { + *pred = dc_pred; + pred += stride; + } +} +/*! +************************************************************************ +* \brief +* init macroblock I and P frames +************************************************************************ +*/ +#ifdef _M_IX86 +static void init_macroblock(Macroblock *currMB) +{ + VideoParameters *p_Vid = currMB->p_Vid; + int j; + int block_x = currMB->block_x, block_y = currMB->block_y; + PicMotionParams *motion = &p_Vid->dec_picture->motion; + PicMotion **list_motion0, **list_motion1; + __m64 const_0_minus_1 = _mm_setr_pi32(0, -1); + macroblock_set_dc_pred(p_Vid, block_x, block_y); + + // reset vectors and pred. modes + list_motion0 = motion->motion[LIST_0]; + for(j = 0; j < BLOCK_SIZE; j++) + { + PicMotion *block = &list_motion0[block_y+j][block_x]; + block[0].ref_pic_id = UNDEFINED_REFERENCE; + *(__m64 *)&block[0].mv = const_0_minus_1; + + block[1].ref_pic_id = UNDEFINED_REFERENCE; + *(__m64 *)&block[1].mv = const_0_minus_1; + + block[2].ref_pic_id = UNDEFINED_REFERENCE; + *(__m64 *)&block[2].mv = const_0_minus_1; + + + block[3].ref_pic_id = UNDEFINED_REFERENCE; + *(__m64 *)&block[3].mv = const_0_minus_1; + } + + list_motion1 = motion->motion[LIST_1]; + for(j = 0; j < BLOCK_SIZE; j++) + { + PicMotion *block = &list_motion1[block_y+j][block_x]; + + block[0].ref_pic_id = UNDEFINED_REFERENCE; + *(__m64 *)&block[0].mv = const_0_minus_1; + + block[1].ref_pic_id = UNDEFINED_REFERENCE; + *(__m64 *)&block[1].mv = const_0_minus_1; + + block[2].ref_pic_id = UNDEFINED_REFERENCE; + *(__m64 *)&block[2].mv = const_0_minus_1; + + + block[3].ref_pic_id = UNDEFINED_REFERENCE; + *(__m64 *)&block[3].mv = const_0_minus_1; + } + +} + + +#else +static void init_macroblock(Macroblock *currMB) +{ + VideoParameters *p_Vid = currMB->p_Vid; + int i, j; + int block_x = currMB->block_x, block_y = currMB->block_y; + PicMotionParams *motion = &p_Vid->dec_picture->motion; + PicMotion **list_motion0, **list_motion1; + macroblock_set_dc_pred(p_Vid, block_x, block_y); + + // reset vectors and pred. modes + list_motion0 = motion->motion[LIST_0]; + for(j = 0; j < BLOCK_SIZE; j++) + { + PicMotion *block0 = &list_motion0[block_y+j][block_x]; + block0[0].ref_pic_id = UNDEFINED_REFERENCE; + memset(block0[0].mv, 0, sizeof(MotionVector)); + block0[0].ref_idx = -1; + + block0[1].ref_pic_id = UNDEFINED_REFERENCE; + memset(block0[1].mv, 0, sizeof(MotionVector)); + block0[1].ref_idx = -1; + + block0[2].ref_pic_id = UNDEFINED_REFERENCE; + memset(block0[2].mv, 0, sizeof(MotionVector)); + block0[2].ref_idx = -1; + + block0[3].ref_pic_id = UNDEFINED_REFERENCE; + memset(block0[3].mv, 0, sizeof(MotionVector)); + block0[3].ref_idx = -1; + + + } + + list_motion1 = motion->motion[LIST_1]; + for(j = 0; j < BLOCK_SIZE; j++) + { + PicMotion *block1 = &list_motion1[block_y+j][block_x]; + + block1[0].ref_pic_id = UNDEFINED_REFERENCE; + memset(block1[0].mv, 0, sizeof(MotionVector)); + block1[0].ref_idx = -1; + + block1[1].ref_pic_id = UNDEFINED_REFERENCE; + memset(block1[1].mv, 0, sizeof(MotionVector)); + block1[1].ref_idx = -1; + + block1[2].ref_pic_id = UNDEFINED_REFERENCE; + memset(block1[2].mv, 0, sizeof(MotionVector)); + block1[2].ref_idx = -1; + + block1[3].ref_pic_id = UNDEFINED_REFERENCE; + memset(block1[3].mv, 0, sizeof(MotionVector)); + block1[3].ref_idx = -1; + } + +} + + +#endif +/*! +************************************************************************ +* \brief +* Sets mode for 8x8 block +************************************************************************ +*/ +void SetB8Mode (Macroblock* currMB, int value, int i) +{ + Slice* currSlice = currMB->p_Slice; + static const char p_v2b8 [ 5] = {4, 5, 6, 7, IBLOCK}; + static const char p_v2pd [ 5] = {0, 0, 0, 0, -1}; + static const char b_v2b8 [14] = {0, 4, 4, 4, 5, 6, 5, 6, 5, 6, 7, 7, 7, IBLOCK}; + static const char b_v2pd [14] = {2, 0, 1, 2, 0, 0, 1, 1, 2, 2, 0, 1, 2, -1}; + + if (currSlice->slice_type==B_SLICE) + { + currMB->b8mode[i] = b_v2b8[value]; + currMB->b8pdir[i] = b_v2pd[value]; + } + else + { + currMB->b8mode[i] = p_v2b8[value]; + currMB->b8pdir[i] = p_v2pd[value]; + } +} + + +void reset_coeffs(Slice *currSlice) +{ + + VideoParameters *p_Vid = currSlice->p_Vid; + + // reset all coeffs +#ifdef _DEBUG + { + int m; + for (m=0;m<3;m++) + { + int z; + short *b = &currSlice->cof[m][0][0]; + for (z=0;z<256;z++) + { + if (b[z] != 0) + { + DebugBreak(); + } + } + } + } +#endif + + // benski> don't think this is necessary... enable check above to be sure + // memset(currSlice->cof, 0, sizeof(currSlice->cof)); + + // CAVLC + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + memzero48(p_Vid->nz_coeff[p_Vid->current_mb_nr]); +} + +void field_flag_inference(Macroblock *currMB) +{ + VideoParameters *p_Vid = currMB->p_Vid; + if (currMB->mb_avail_left) + { + currMB->mb_field = p_Vid->mb_data[currMB->mb_addr_left].mb_field; + } + else + { + // check top macroblock pair + currMB->mb_field = currMB->mb_avail_up ? p_Vid->mb_data[currMB->mb_addr_up].mb_field : FALSE; + } +} + + +static void skip_macroblock(Macroblock *currMB) +{ + short pred_mv[2]; + int zeroMotionAbove; + int zeroMotionLeft; + PixelPos mb[4]; // neighbor blocks + int i, j; + int a_mv_y = 0; + int a_ref_idx = 0; + int b_mv_y = 0; + int b_ref_idx = 0; + int img_block_y = currMB->block_y; + VideoParameters *p_Vid = currMB->p_Vid; + Slice *currSlice = currMB->p_Slice; + int list_offset = ((currSlice->mb_aff_frame_flag) && (currMB->mb_field)) ? (currMB->mbAddrX & 0x01) ? 4 : 2 : 0; + StorablePicture *dec_picture = p_Vid->dec_picture; + PicMotionParams *motion = &dec_picture->motion; + short *a_mv = NULL; + short *b_mv = NULL; + + get_neighbors0016(currMB, mb); + + if (mb[0].available) + { + a_mv = motion->motion[LIST_0][mb[0].pos_y][mb[0].pos_x].mv; + a_mv_y = a_mv[1]; + a_ref_idx = motion->motion[LIST_0][mb[0].pos_y][mb[0].pos_x].ref_idx; + + if (currMB->mb_field && !p_Vid->mb_data[mb[0].mb_addr].mb_field) + { + a_mv_y /=2; + a_ref_idx *=2; + } + if (!currMB->mb_field && p_Vid->mb_data[mb[0].mb_addr].mb_field) + { + a_mv_y *=2; + a_ref_idx >>=1; + } + } + + if (mb[1].available) + { + b_mv = motion->motion[LIST_0][mb[1].pos_y][mb[1].pos_x].mv; + b_mv_y = b_mv[1]; + b_ref_idx = motion->motion[LIST_0][mb[1].pos_y][mb[1].pos_x].ref_idx; + + if (currMB->mb_field && !p_Vid->mb_data[mb[1].mb_addr].mb_field) + { + b_mv_y /=2; + b_ref_idx *=2; + } + if (!currMB->mb_field && p_Vid->mb_data[mb[1].mb_addr].mb_field) + { + b_mv_y *=2; + b_ref_idx >>=1; + } + } + + zeroMotionLeft = !mb[0].available ? 1 : a_ref_idx==0 && a_mv[0]==0 && a_mv_y==0 ? 1 : 0; + zeroMotionAbove = !mb[1].available ? 1 : b_ref_idx==0 && b_mv[0]==0 && b_mv_y==0 ? 1 : 0; + + currMB->cbp = 0; + reset_coeffs(currSlice); + + if (zeroMotionAbove || zeroMotionLeft) + { + for(j = img_block_y; j < img_block_y + BLOCK_SIZE; ++j) + { + for(i=currMB->block_x;i<currMB->block_x + BLOCK_SIZE; ++i) + { + memset(&motion->motion[LIST_0][j][i].mv, 0, sizeof(MotionVector)); + motion->motion[LIST_0][j][i].ref_idx=0; + motion->motion[LIST_0][j][i].ref_pic_id = dec_picture->ref_pic_num[p_Vid->current_slice_nr][LIST_0 + list_offset][0]; + } + } + } + else + { + currMB->GetMVPredictor (currMB, mb, pred_mv, 0, motion->motion[LIST_0], 0, 0, MB_BLOCK_SIZE, MB_BLOCK_SIZE); + + // Set first block line (position img_block_y) + for(j=img_block_y; j < img_block_y + BLOCK_SIZE; ++j) + { + for(i=currMB->block_x;i<currMB->block_x + BLOCK_SIZE; ++i) + { + memcpy(&motion->motion[LIST_0][j][i].mv, pred_mv, sizeof(MotionVector)); + motion->motion[LIST_0][j][i].ref_idx=0; + motion->motion[LIST_0][j][i].ref_pic_id = dec_picture->ref_pic_num[p_Vid->current_slice_nr][LIST_0 + list_offset][0]; + } + } + } +} + +static void concealIPCMcoeffs(Macroblock *currMB) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + StorablePicture *dec_picture = p_Vid->dec_picture; + int i, j, k; + + for(i=0;i<MB_BLOCK_SIZE;++i) + { + for(j=0;j<MB_BLOCK_SIZE;++j) + { + currSlice->ipcm[0][i][j] = p_Vid->dc_pred_value_comp[0]; + } + } + + if ((dec_picture->chroma_format_idc != YUV400) && !IS_INDEPENDENT(p_Vid)) + { + for (k = 0; k < 2; ++k) + { + for(i=0;i<p_Vid->mb_cr_size_y;++i) + { + for(j=0;j<p_Vid->mb_cr_size_x;++j) + { + currSlice->ipcm[k][i][j] = p_Vid->dc_pred_value_comp[k]; + } + } + } + } +} + +/*! +************************************************************************ +* \brief +* Get the syntax elements from the NAL +************************************************************************ +*/ +static void read_one_macroblock_i_slice(Macroblock *currMB) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + + SyntaxElement currSE; + int mb_nr = currMB->mbAddrX; + + DataPartition *dP; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + StorablePicture *dec_picture = p_Vid->dec_picture; + PicMotionParams *motion = &dec_picture->motion; + + currMB->mb_field = ((mb_nr&0x01) == 0)? FALSE : p_Vid->mb_data[mb_nr-1].mb_field; + + update_qp(currMB, p_Vid->qp); + + // read MB mode ***************************************************************** + dP = &(currSlice->partArr[partMap[SE_MBTYPE]]); + + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + currSE.mapping = linfo_ue; + + // read MB aff + if (currSlice->mb_aff_frame_flag && (mb_nr&0x01)==0) + { + TRACE_STRING("mb_field_decoding_flag"); + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + currMB->mb_field = readSyntaxElement_FLC(dP->bitstream, 1); + } + else + { + currMB->mb_field = readFieldModeInfo_CABAC(currMB, &dP->de_cabac); + } + } + + if(p_Vid->active_pps->entropy_coding_mode_flag == CABAC) + { + CheckAvailabilityOfNeighborsCABAC(currMB); + + // read MB type + currMB->mb_type = readMB_typeInfo_CABAC(currMB, &dP->de_cabac); + } + else + { // CAVLC + // read MB type + readSyntaxElement_UVLC(&currSE, dP); + currMB->mb_type = currSE.value1; + } + + + + currMB->ei_flag = 0; + + motion->mb_field[mb_nr] = (byte) currMB->mb_field; + + currMB->block_y_aff = ((currSlice->mb_aff_frame_flag) && (currMB->mb_field)) ? (mb_nr&0x01) ? (currMB->block_y - 4)>>1 : currMB->block_y >> 1 : currMB->block_y; + + p_Vid->siblock[currMB->mb_y][currMB->mb_x] = 0; + + currSlice->interpret_mb_mode(currMB); + + //init NoMbPartLessThan8x8Flag + currMB->NoMbPartLessThan8x8Flag = TRUE; + + //============= Transform Size Flag for INTRA MBs ============= + //------------------------------------------------------------- + //transform size flag for INTRA_4x4 and INTRA_8x8 modes + if (currMB->mb_type == I4MB && p_Vid->Transform8x8Mode) + { + dP = &(currSlice->partArr[partMap[SE_HEADER]]); + TRACE_STRING("transform_size_8x8_flag"); + + // read CAVLC transform_size_8x8_flag + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + currMB->luma_transform_size_8x8_flag = readSyntaxElement_FLC(dP->bitstream, 1); + } + else + { + currMB->luma_transform_size_8x8_flag = readMB_transform_size_flag_CABAC(currMB, &dP->de_cabac); + } + + if (currMB->luma_transform_size_8x8_flag) + { + currMB->mb_type = I8MB; + memset(&currMB->b8mode, I8MB, 4 * sizeof(char)); + memset(&currMB->b8pdir, -1, 4 * sizeof(char)); + } + } + else + { + currMB->luma_transform_size_8x8_flag = FALSE; + } + + //--- init macroblock data --- + init_macroblock(currMB); + + if(currMB->mb_type != IPCM) + { + // intra prediction modes for a macroblock 4x4 ********************************************** + read_ipred_modes(currMB); + + // read CBP and Coeffs *************************************************************** + currSlice->read_CBP_and_coeffs_from_NAL (currMB); + } + else + { + //read pcm_alignment_zero_bit and pcm_byte[i] + + // here dP is assigned with the same dP as SE_MBTYPE, because IPCM syntax is in the + // same category as MBTYPE + if ( currSlice->dp_mode && currSlice->dpB_NotPresent ) + { + concealIPCMcoeffs(currMB); + } + else + { + dP = &(currSlice->partArr[partMap[SE_LUM_DC_INTRA]]); + read_IPCM_coeffs_from_NAL(currSlice, dP); + } + } + + return; +} + +/*! +************************************************************************ +* \brief +* Get the syntax elements from the NAL +************************************************************************ +*/ +static void read_one_macroblock_p_slice(Macroblock *currMB) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + + int i; + + SyntaxElement currSE; + int mb_nr = currMB->mbAddrX; + + DataPartition *dP; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + Macroblock *topMB = NULL; + int prevMbSkipped = 0; + int check_bottom, read_bottom, read_top; + StorablePicture *dec_picture = p_Vid->dec_picture; + PicMotionParams *motion = &dec_picture->motion; + + if (currSlice->mb_aff_frame_flag) + { + if (mb_nr&0x01) + { + topMB= &p_Vid->mb_data[mb_nr-1]; + prevMbSkipped = (topMB->mb_type == 0); + } + else + prevMbSkipped = 0; + } + + currMB->mb_field = ((mb_nr&0x01) == 0)? FALSE : p_Vid->mb_data[mb_nr-1].mb_field; + + update_qp(currMB, p_Vid->qp); + + // read MB mode ***************************************************************** + dP = &(currSlice->partArr[partMap[SE_MBTYPE]]); + + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + currSE.mapping = linfo_ue; + + if (p_Vid->active_pps->entropy_coding_mode_flag == CABAC) + { + int skip; + // read MB skip_flag + if (currSlice->mb_aff_frame_flag && ((mb_nr&0x01) == 0||prevMbSkipped)) + field_flag_inference(currMB); + + CheckAvailabilityOfNeighborsCABAC(currMB); + TRACE_STRING("mb_skip_flag"); + skip = readMB_skip_flagInfo_CABAC(currMB, &dP->de_cabac); + + currMB->mb_type = !skip; + currMB->skip_flag = skip; + + currMB->ei_flag = 0; + + // read MB AFF + if (currSlice->mb_aff_frame_flag) + { + check_bottom=read_bottom=read_top=0; + if ((mb_nr&0x01)==0) + { + check_bottom = currMB->skip_flag; + read_top = !check_bottom; + } + else + { + read_bottom = (topMB->skip_flag && (!currMB->skip_flag)); + } + + if (read_bottom || read_top) + { + TRACE_STRING("mb_field_decoding_flag"); + currMB->mb_field = readFieldModeInfo_CABAC(currMB, &dP->de_cabac); + } + if (check_bottom) + check_next_mb_and_get_field_mode_CABAC(currSlice, dP); + + CheckAvailabilityOfNeighborsCABAC(currMB); + } + + // read MB type + if (currMB->mb_type != 0 ) + { + TRACE_STRING("mb_type"); + currMB->mb_type = readMB_typeInfo_CABAC(currMB, &dP->de_cabac); + currMB->ei_flag = 0; + } + } + // VLC Non-Intra + else + { + if(p_Vid->cod_counter == -1) + { + TRACE_STRING("mb_skip_run"); + readSyntaxElement_UVLC(&currSE, dP); + p_Vid->cod_counter = currSE.value1; + } + if (p_Vid->cod_counter==0) + { + // read MB aff + if ((currSlice->mb_aff_frame_flag) && (((mb_nr&0x01)==0) || ((mb_nr&0x01) && prevMbSkipped))) + { + TRACE_STRING("mb_field_decoding_flag"); + currMB->mb_field = (Boolean) readSyntaxElement_FLC(dP->bitstream, 1); + } + + // read MB type + TRACE_STRING("mb_type"); + readSyntaxElement_UVLC(&currSE, dP); + if(currSlice->slice_type == P_SLICE || currSlice->slice_type == SP_SLICE) + ++(currSE.value1); + currMB->mb_type = currSE.value1; + currMB->ei_flag = 0; + p_Vid->cod_counter--; + currMB->skip_flag = 0; + } + else + { + p_Vid->cod_counter--; + currMB->mb_type = 0; + currMB->ei_flag = 0; + currMB->skip_flag = 1; + + // read field flag of bottom block + if(currSlice->mb_aff_frame_flag) + { + if(p_Vid->cod_counter == 0 && ((mb_nr&0x01) == 0)) + { + TRACE_STRING("mb_field_decoding_flag (of coded bottom mb)"); + currMB->mb_field = (Boolean) readSyntaxElement_FLC(dP->bitstream, 1); + dP->bitstream->frame_bitoffset--; + TRACE_DECBITS(1); + } + else if (p_Vid->cod_counter > 0 && ((mb_nr & 0x01) == 0)) + { + // check left macroblock pair first + if (mb_is_available(mb_nr - 2, currMB) && ((mb_nr % (p_Vid->PicWidthInMbs * 2))!=0)) + { + currMB->mb_field = p_Vid->mb_data[mb_nr-2].mb_field; + } + else + { + // check top macroblock pair + if (mb_is_available(mb_nr - 2*p_Vid->PicWidthInMbs, currMB)) + { + currMB->mb_field = p_Vid->mb_data[mb_nr-2*p_Vid->PicWidthInMbs].mb_field; + } + else + currMB->mb_field = FALSE; + } + } + } + } + } + + motion->mb_field[mb_nr] = (byte) currMB->mb_field; + + currMB->block_y_aff = ((currSlice->mb_aff_frame_flag) && (currMB->mb_field)) ? (mb_nr&0x01) ? (currMB->block_y - 4)>>1 : currMB->block_y >> 1 : currMB->block_y; + + p_Vid->siblock[currMB->mb_y][currMB->mb_x] = 0; + + currSlice->interpret_mb_mode(currMB); + + if(currSlice->mb_aff_frame_flag) + { + if(currMB->mb_field) + { + currSlice->num_ref_idx_l0_active <<=1; + currSlice->num_ref_idx_l1_active <<=1; + } + } + + //init NoMbPartLessThan8x8Flag + currMB->NoMbPartLessThan8x8Flag = (IS_DIRECT(currMB) && !(p_Vid->active_sps->direct_8x8_inference_flag))? FALSE: TRUE; + + //====== READ 8x8 SUB-PARTITION MODES (modes of 8x8 blocks) and Intra VBST block modes ====== + if (currMB->mb_type == P8x8) + { + dP = &(currSlice->partArr[partMap[SE_MBTYPE]]); + + if (p_Vid->active_pps->entropy_coding_mode_flag ==CAVLC) + { + currSE.mapping = linfo_ue; + for (i = 0; i < 4; ++i) + { + TRACE_STRING("sub_mb_type"); + readSyntaxElement_UVLC(&currSE, dP); + SetB8Mode (currMB, currSE.value1, i); + + //set NoMbPartLessThan8x8Flag for P8x8 mode + currMB->NoMbPartLessThan8x8Flag &= (currMB->b8mode[i]==0 && p_Vid->active_sps->direct_8x8_inference_flag) || + (currMB->b8mode[i]==4); + } + } + else + { + for (i = 0; i < 4; ++i) + { + int value = readB8_typeInfo_CABAC(currSlice, &dP->de_cabac); + SetB8Mode (currMB, value, i); + + //set NoMbPartLessThan8x8Flag for P8x8 mode + currMB->NoMbPartLessThan8x8Flag &= (currMB->b8mode[i]==0 && p_Vid->active_sps->direct_8x8_inference_flag) || + (currMB->b8mode[i]==4); + } + } + + //--- init macroblock data --- + init_macroblock (currMB); + currSlice->read_motion_info_from_NAL (currMB); + } + + //============= Transform Size Flag for INTRA MBs ============= + //------------------------------------------------------------- + //transform size flag for INTRA_4x4 and INTRA_8x8 modes + if (currMB->mb_type == I4MB && p_Vid->Transform8x8Mode) + { + dP = &(currSlice->partArr[partMap[SE_HEADER]]); + TRACE_STRING("transform_size_8x8_flag"); + + // read CAVLC transform_size_8x8_flag + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + currMB->luma_transform_size_8x8_flag = (Boolean) readSyntaxElement_FLC(dP->bitstream, 1); + } + else + { + currMB->luma_transform_size_8x8_flag = readMB_transform_size_flag_CABAC(currMB, &dP->de_cabac); + } + + if (currMB->luma_transform_size_8x8_flag) + { + currMB->mb_type = I8MB; + memset(&currMB->b8mode, I8MB, 4 * sizeof(char)); + memset(&currMB->b8pdir, -1, 4 * sizeof(char)); + } + } + else + { + currMB->luma_transform_size_8x8_flag = FALSE; + } + + if(p_Vid->active_pps->constrained_intra_pred_flag) + { + if( !IS_INTRA(currMB) ) + { + p_Vid->intra_block[mb_nr] = 0; + } + } + + //--- init macroblock data --- + if (currMB->mb_type != P8x8) + init_macroblock(currMB); + + if (IS_SKIP (currMB)) //keep last macroblock + { + skip_macroblock(currMB); + } + else if(currMB->mb_type != IPCM) + { + // intra prediction modes for a macroblock 4x4 ********************************************** + if (IS_INTRA(currMB)) + read_ipred_modes(currMB); + + // read inter frame vector data ********************************************************* + if (IS_INTERMV (currMB) && (currMB->mb_type != P8x8)) + { + currSlice->read_motion_info_from_NAL (currMB); + } + // read CBP and Coeffs *************************************************************** + currSlice->read_CBP_and_coeffs_from_NAL (currMB); + } + else + { + //read pcm_alignment_zero_bit and pcm_byte[i] + + // here dP is assigned with the same dP as SE_MBTYPE, because IPCM syntax is in the + // same category as MBTYPE + if ( currSlice->dp_mode && currSlice->dpB_NotPresent ) + { + concealIPCMcoeffs(currMB); + } + else + { + dP = &(currSlice->partArr[partMap[SE_LUM_DC_INTRA]]); + read_IPCM_coeffs_from_NAL(currSlice, dP); + } + } + + return; +} + +/*! +************************************************************************ +* \brief +* Get the syntax elements from the NAL +************************************************************************ +*/ +static void read_one_macroblock_b_slice(Macroblock *currMB) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + int i; + + SyntaxElement currSE; + int mb_nr = currMB->mbAddrX; + + DataPartition *dP; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + Macroblock *topMB = NULL; + int prevMbSkipped = 0; + int check_bottom, read_bottom, read_top; + StorablePicture *dec_picture = p_Vid->dec_picture; + PicMotionParams *motion = &dec_picture->motion; + + if (currSlice->mb_aff_frame_flag) + { + if (mb_nr&0x01) + { + topMB= &p_Vid->mb_data[mb_nr-1]; + prevMbSkipped = topMB->skip_flag; + } + else + prevMbSkipped = 0; + } + + currMB->mb_field = ((mb_nr&0x01) == 0)? FALSE : p_Vid->mb_data[mb_nr-1].mb_field; + + update_qp(currMB, p_Vid->qp); + + // read MB mode ***************************************************************** + dP = &(currSlice->partArr[partMap[SE_MBTYPE]]); + + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + currSE.mapping = linfo_ue; + + if (p_Vid->active_pps->entropy_coding_mode_flag == CABAC) + { + // read MB skip_flag + int skip; + if (currSlice->mb_aff_frame_flag && ((mb_nr&0x01) == 0||prevMbSkipped)) + field_flag_inference(currMB); + + CheckAvailabilityOfNeighborsCABAC(currMB); + TRACE_STRING("mb_skip_flag"); + skip = readMB_skip_flagInfo_CABAC(currMB, &dP->de_cabac); + + currMB->mb_type = !skip; + currMB->skip_flag = skip; + + currMB->cbp = !skip; + + currMB->ei_flag = 0; + + if (skip) + p_Vid->cod_counter=0; + + // read MB AFF + if (currSlice->mb_aff_frame_flag) + { + check_bottom=read_bottom=read_top=0; + if ((mb_nr&0x01)==0) + { + check_bottom = currMB->skip_flag; + read_top = !check_bottom; + } + else + { + read_bottom = (topMB->skip_flag && (!currMB->skip_flag)); + } + + if (read_bottom || read_top) + { + TRACE_STRING("mb_field_decoding_flag"); + currMB->mb_field = readFieldModeInfo_CABAC(currMB, &dP->de_cabac); + } + if (check_bottom) + check_next_mb_and_get_field_mode_CABAC(currSlice,dP); + + CheckAvailabilityOfNeighborsCABAC(currMB); + } + + // read MB type + if (currMB->mb_type != 0 ) + { + TRACE_STRING("mb_type"); + currMB->mb_type = readMB_typeInfo_CABAC(currMB, &dP->de_cabac); + currMB->ei_flag = 0; + } + } + // VLC Non-Intra + else + { + if(p_Vid->cod_counter == -1) + { + TRACE_STRING("mb_skip_run"); + readSyntaxElement_UVLC(&currSE, dP); + p_Vid->cod_counter = currSE.value1; + } + if (p_Vid->cod_counter==0) + { + // read MB aff + if ((currSlice->mb_aff_frame_flag) && (((mb_nr&0x01)==0) || ((mb_nr&0x01) && prevMbSkipped))) + { + TRACE_STRING("mb_field_decoding_flag"); + currMB->mb_field = (Boolean) readSyntaxElement_FLC(dP->bitstream, 1); + } + + // read MB type + TRACE_STRING("mb_type"); + readSyntaxElement_UVLC(&currSE, dP); + if(currSlice->slice_type == P_SLICE || currSlice->slice_type == SP_SLICE) + ++(currSE.value1); + currMB->mb_type = currSE.value1; + currMB->ei_flag = 0; + p_Vid->cod_counter--; + currMB->skip_flag = 0; + } + else + { + p_Vid->cod_counter--; + currMB->mb_type = 0; + currMB->ei_flag = 0; + currMB->skip_flag = 1; + + // read field flag of bottom block + if(currSlice->mb_aff_frame_flag) + { + if(p_Vid->cod_counter == 0 && ((mb_nr&0x01) == 0)) + { + TRACE_STRING("mb_field_decoding_flag (of coded bottom mb)"); + currMB->mb_field = (Boolean) readSyntaxElement_FLC(dP->bitstream, 1); + dP->bitstream->frame_bitoffset--; + TRACE_DECBITS(1); + } + else if (p_Vid->cod_counter > 0 && ((mb_nr & 0x01) == 0)) + { + // check left macroblock pair first + if (mb_is_available(mb_nr - 2, currMB) && ((mb_nr % (p_Vid->PicWidthInMbs * 2))!=0)) + { + currMB->mb_field = p_Vid->mb_data[mb_nr-2].mb_field; + } + else + { + // check top macroblock pair + if (mb_is_available(mb_nr - 2*p_Vid->PicWidthInMbs, currMB)) + { + currMB->mb_field = p_Vid->mb_data[mb_nr-2*p_Vid->PicWidthInMbs].mb_field; + } + else + currMB->mb_field = FALSE; + } + } + } + } + } + + motion->mb_field[mb_nr] = (byte) currMB->mb_field; + + currMB->block_y_aff = ((currSlice->mb_aff_frame_flag) && (currMB->mb_field)) ? (mb_nr&0x01) ? (currMB->block_y - 4)>>1 : currMB->block_y >> 1 : currMB->block_y; + + p_Vid->siblock[currMB->mb_y][currMB->mb_x] = 0; + + currSlice->interpret_mb_mode(currMB); + + if(currSlice->mb_aff_frame_flag) + { + if(currMB->mb_field) + { + currSlice->num_ref_idx_l0_active <<=1; + currSlice->num_ref_idx_l1_active <<=1; + } + } + + //init NoMbPartLessThan8x8Flag + currMB->NoMbPartLessThan8x8Flag = (IS_DIRECT(currMB) && !(p_Vid->active_sps->direct_8x8_inference_flag))? FALSE: TRUE; + + //====== READ 8x8 SUB-PARTITION MODES (modes of 8x8 blocks) and Intra VBST block modes ====== + if (currMB->mb_type == P8x8) + { + dP = &(currSlice->partArr[partMap[SE_MBTYPE]]); + + if (p_Vid->active_pps->entropy_coding_mode_flag ==CAVLC) + { + currSE.mapping = linfo_ue; + for (i = 0; i < 4; ++i) + { + TRACE_STRING("sub_mb_type"); + readSyntaxElement_UVLC(&currSE, dP); + SetB8Mode (currMB, currSE.value1, i); + + //set NoMbPartLessThan8x8Flag for P8x8 mode + currMB->NoMbPartLessThan8x8Flag &= (currMB->b8mode[i]==0 && p_Vid->active_sps->direct_8x8_inference_flag) || + (currMB->b8mode[i]==4); + } + } + else + { + for (i = 0; i < 4; ++i) + { + int value = readB8_typeInfo_CABAC(currSlice, &dP->de_cabac); + SetB8Mode (currMB, value, i); + + //set NoMbPartLessThan8x8Flag for P8x8 mode + currMB->NoMbPartLessThan8x8Flag &= (currMB->b8mode[i]==0 && p_Vid->active_sps->direct_8x8_inference_flag) || + (currMB->b8mode[i]==4); + } + } + + //--- init macroblock data --- + init_macroblock (currMB); + currSlice->read_motion_info_from_NAL (currMB); + } + + //============= Transform Size Flag for INTRA MBs ============= + //------------------------------------------------------------- + //transform size flag for INTRA_4x4 and INTRA_8x8 modes + if (currMB->mb_type == I4MB && p_Vid->Transform8x8Mode) + { + dP = &(currSlice->partArr[partMap[SE_HEADER]]); + TRACE_STRING("transform_size_8x8_flag"); + + // read CAVLC transform_size_8x8_flag + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + currMB->luma_transform_size_8x8_flag = (Boolean) readSyntaxElement_FLC(dP->bitstream, 1); + } + else + { + currMB->luma_transform_size_8x8_flag = readMB_transform_size_flag_CABAC(currMB, &dP->de_cabac); + } + + + if (currMB->luma_transform_size_8x8_flag) + { + currMB->mb_type = I8MB; + memset(&currMB->b8mode, I8MB, 4 * sizeof(char)); + memset(&currMB->b8pdir, -1, 4 * sizeof(char)); + } + } + else + { + currMB->luma_transform_size_8x8_flag = FALSE; + } + + if(p_Vid->active_pps->constrained_intra_pred_flag) // inter frame + { + if( !IS_INTRA(currMB) ) + { + p_Vid->intra_block[mb_nr] = 0; + } + } + + //--- init macroblock data --- + if (currMB->mb_type != P8x8) + init_macroblock(currMB); + + if (IS_DIRECT (currMB) && p_Vid->cod_counter >= 0) + { + currMB->cbp = 0; + reset_coeffs(currSlice); + + if (p_Vid->active_pps->entropy_coding_mode_flag ==CABAC) + p_Vid->cod_counter=-1; + } + else if (IS_SKIP (currMB)) //keep last macroblock + { + skip_macroblock(currMB); + } + else if(currMB->mb_type != IPCM) + { + // intra prediction modes for a macroblock 4x4 ********************************************** + if (IS_INTRA(currMB)) + read_ipred_modes(currMB); + + // read inter frame vector data ********************************************************* + if (IS_INTERMV (currMB) && (currMB->mb_type != P8x8)) + { + currSlice->read_motion_info_from_NAL (currMB); + } + // read CBP and Coeffs *************************************************************** + currSlice->read_CBP_and_coeffs_from_NAL (currMB); + } + else + { + //read pcm_alignment_zero_bit and pcm_byte[i] + + // here dP is assigned with the same dP as SE_MBTYPE, because IPCM syntax is in the + // same category as MBTYPE + if ( currSlice->dp_mode && currSlice->dpB_NotPresent ) + { + concealIPCMcoeffs(currMB); + } + else + { + dP = &(currSlice->partArr[partMap[SE_LUM_DC_INTRA]]); + read_IPCM_coeffs_from_NAL(currSlice, dP); + } + } + + return; +} + + +/*! +************************************************************************ +* \brief +* Initialize decoding engine after decoding an IPCM macroblock +* (for IPCM CABAC 28/11/2003) +* +* \author +* Dong Wang <Dong.Wang@bristol.ac.uk> +************************************************************************ +*/ +static void init_decoding_engine_IPCM(Slice *currSlice) +{ + Bitstream *currStream; + int ByteStartPosition; + int PartitionNumber; + int i; + + if(currSlice->dp_mode==PAR_DP_1) + PartitionNumber=1; + else if(currSlice->dp_mode==PAR_DP_3) + PartitionNumber=3; + else + { + printf("Partition Mode is not supported\n"); + exit(1); + } + + for(i=0;i<PartitionNumber;++i) + { + currStream = currSlice->partArr[i].bitstream; + ByteStartPosition = currStream->read_len; + + arideco_start_decoding (&currSlice->partArr[i].de_cabac, currStream->streamBuffer, ByteStartPosition, &currStream->read_len); + } +} + + + + +/*! +************************************************************************ +* \brief +* Read IPCM pcm_alignment_zero_bit and pcm_byte[i] from stream to currSlice->ipcm +* (for IPCM CABAC and IPCM CAVLC) +* +* \author +* Dong Wang <Dong.Wang@bristol.ac.uk> +************************************************************************ +*/ + +static void read_IPCM_coeffs_from_NAL(Slice *currSlice, struct datapartition *dP) +{ + VideoParameters *p_Vid = currSlice->p_Vid; + + StorablePicture *dec_picture = p_Vid->dec_picture; + int i,j; + + //For CABAC, we don't need to read bits to let stream byte aligned + // because we have variable for integer bytes position + if(p_Vid->active_pps->entropy_coding_mode_flag == CABAC) + { + readIPCM_CABAC(currSlice, dP); + init_decoding_engine_IPCM(currSlice); + } + else + { + //read bits to let stream byte aligned + + if(((dP->bitstream->frame_bitoffset) & 0x07) != 0) + { + TRACE_STRING("pcm_alignment_zero_bit"); + readSyntaxElement_FLC(dP->bitstream, (8 - ((dP->bitstream->frame_bitoffset) & 0x07))); + } + + //read luma and chroma IPCM coefficients + TRACE_STRING("pcm_sample_luma"); + + for(i=0;i<MB_BLOCK_SIZE;++i) + { + for(j=0;j<MB_BLOCK_SIZE;++j) + { + currSlice->ipcm[0][i][j] = readSyntaxElement_FLC(dP->bitstream, p_Vid->bitdepth_luma); + } + } + if ((dec_picture->chroma_format_idc != YUV400) && !IS_INDEPENDENT(p_Vid)) + { + TRACE_STRING("pcm_sample_chroma (u)"); + for(i=0;i<p_Vid->mb_cr_size_y;++i) + { + for(j=0;j<p_Vid->mb_cr_size_x;++j) + { + currSlice->ipcm[1][i][j] = readSyntaxElement_FLC(dP->bitstream, p_Vid->bitdepth_chroma); + } + } + TRACE_STRING("pcm_sample_chroma (v)"); + for(i=0;i<p_Vid->mb_cr_size_y;++i) + { + for(j=0;j<p_Vid->mb_cr_size_x;++j) + { + currSlice->ipcm[2][i][j] = readSyntaxElement_FLC(dP->bitstream, p_Vid->bitdepth_chroma); + } + } + } + } +} + + +/*! +************************************************************************ +* \brief +* If data partition B is lost, conceal PCM sample values with DC. +* +************************************************************************ +*/ + + +static void __forceinline read_ipred_iblock(VideoParameters *p_Vid, Macroblock *currMB, Slice *currSlice, DataPartition *dP, int b8) +{ + int i, j; + int mostProbableIntraPredMode; + int upIntraPredMode; + int leftIntraPredMode; + int bx, by, bi, bj; + SyntaxElement currSE; + int ts, ls; + PixelPos left_block, top_block; + int dec; + + for(j=0;j<2;j++) //loop subblocks + { + by = (b8&2) + j; + bj = currMB->block_y + by; + for(i=0;i<2;i++) + { + int pred_mode; + bx = ((b8&1)<<1) + i; + bi = currMB->block_x + bx; + + //get from stream + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + readSyntaxElement_Intra4x4PredictionMode(&currSE, dP->bitstream); + pred_mode = currSE.value1; + } + else + { + pred_mode = readIntraPredMode_CABAC(currSlice, &dP->de_cabac); + } + + p_Vid->getNeighbourXPLumaNB(currMB, (bx<<2) - 1, (by<<2), &left_block); + p_Vid->getNeighbourPXLumaNB(currMB, (bx<<2), (by<<2) - 1, &top_block ); + + //get from array and decode + + if (p_Vid->active_pps->constrained_intra_pred_flag) + { + left_block.available = left_block.available ? p_Vid->intra_block[left_block.mb_addr] : 0; + top_block.available = top_block.available ? p_Vid->intra_block[top_block.mb_addr] : 0; + } + + // !! KS: not sure if the following is still correct... + ts = ls = 0; // Check to see if the neighboring block is SI + if (currMB->mb_type == I4MB && currSlice->slice_type == SI_SLICE) // need support for MBINTLC1 + { + if (left_block.available) + if (p_Vid->siblock [left_block.mb_addr / p_Vid->PicWidthInMbs][left_block.mb_addr % p_Vid->PicWidthInMbs]) + ls=1; + + if (top_block.available) + if (p_Vid->siblock [top_block.mb_addr / p_Vid->PicWidthInMbs][top_block.mb_addr % p_Vid->PicWidthInMbs]) + ts=1; + } + + upIntraPredMode = (top_block.available &&(ts == 0)) ? p_Vid->ipredmode[top_block.pos_y>>2 ][top_block.pos_x>>2 ] : -1; + leftIntraPredMode = (left_block.available &&(ls == 0)) ? p_Vid->ipredmode[left_block.pos_y>>2][left_block.pos_x>>2] : -1; + + mostProbableIntraPredMode = (upIntraPredMode < 0 || leftIntraPredMode < 0) ? DC_PRED : upIntraPredMode < leftIntraPredMode ? upIntraPredMode : leftIntraPredMode; + + dec = (pred_mode == -1) ? mostProbableIntraPredMode : pred_mode + (pred_mode >= mostProbableIntraPredMode); + + + p_Vid->ipredmode[bj][bi] = dec; + } + } +} + +static void __forceinline read_ipred_i8mb(VideoParameters *p_Vid, Macroblock *currMB, Slice *currSlice, DataPartition *dP, int b8) +{ + int mostProbableIntraPredMode; + int upIntraPredMode; + int leftIntraPredMode; + int bx, by, bi, bj; + int pred_mode; + SyntaxElement currSE; + int ts, ls; + PixelPos left_block, top_block; + int dec; + + by = (b8&2); + bj = currMB->block_y + by; + + bx = ((b8&1)<<1); + bi = currMB->block_x + bx; + + //get from stream + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + readSyntaxElement_Intra4x4PredictionMode(&currSE, dP->bitstream); + pred_mode = currSE.value1; + } + else + { + pred_mode = readIntraPredMode_CABAC(currSlice, &dP->de_cabac); + } + + p_Vid->getNeighbourXPLumaNB(currMB, (bx<<2) - 1, (by<<2), &left_block); + p_Vid->getNeighbourPXLumaNB(currMB, (bx<<2), (by<<2) - 1, &top_block ); + + //get from array and decode + + if (p_Vid->active_pps->constrained_intra_pred_flag) + { + left_block.available = left_block.available ? p_Vid->intra_block[left_block.mb_addr] : 0; + top_block.available = top_block.available ? p_Vid->intra_block[top_block.mb_addr] : 0; + } + + // !! KS: not sure if the following is still correct... + ts = ls = 0; // Check to see if the neighboring block is SI + if (currMB->mb_type == I4MB && currSlice->slice_type == SI_SLICE) // need support for MBINTLC1 + { + if (left_block.available) + if (p_Vid->siblock [left_block.mb_addr / p_Vid->PicWidthInMbs][left_block.mb_addr % p_Vid->PicWidthInMbs]) + ls=1; + + if (top_block.available) + if (p_Vid->siblock [top_block.mb_addr / p_Vid->PicWidthInMbs][top_block.mb_addr % p_Vid->PicWidthInMbs]) + ts=1; + } + + upIntraPredMode = (top_block.available &&(ts == 0)) ? p_Vid->ipredmode[top_block.pos_y>>2 ][top_block.pos_x>>2 ] : -1; + leftIntraPredMode = (left_block.available &&(ls == 0)) ? p_Vid->ipredmode[left_block.pos_y>>2][left_block.pos_x>>2] : -1; + + mostProbableIntraPredMode = (upIntraPredMode < 0 || leftIntraPredMode < 0) ? DC_PRED : upIntraPredMode < leftIntraPredMode ? upIntraPredMode : leftIntraPredMode; + + dec = (pred_mode == -1) ? mostProbableIntraPredMode : pred_mode + (pred_mode >= mostProbableIntraPredMode); + + //set + p_Vid->ipredmode[bj][bi] = dec; + p_Vid->ipredmode[bj][bi+1] = dec; + p_Vid->ipredmode[bj+1][bi] = dec; + p_Vid->ipredmode[bj+1][bi+1] = dec; +} + +static void read_ipred_modes(Macroblock *currMB) +{ + int b8; + SyntaxElement currSE; + DataPartition *dP; + Slice *currSlice = currMB->p_Slice; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + VideoParameters *p_Vid = currMB->p_Vid; + + StorablePicture *dec_picture = p_Vid->dec_picture; + char IntraChromaPredModeFlag = IS_INTRA(currMB); + + dP = &(currSlice->partArr[partMap[SE_INTRAPREDMODE]]); + + for(b8 = 0; b8 < 4; ++b8) //loop 8x8 blocks + { + if (currMB->b8mode[b8]==IBLOCK) + { + IntraChromaPredModeFlag = 1; + read_ipred_iblock(p_Vid, currMB, currSlice, dP, b8); + } + else if (currMB->b8mode[b8]==I8MB) + { + IntraChromaPredModeFlag = 1; + read_ipred_i8mb(p_Vid, currMB, currSlice, dP, b8); + } + } + + if (IntraChromaPredModeFlag && (dec_picture->chroma_format_idc != YUV400) && (dec_picture->chroma_format_idc != YUV444)) + { + TRACE_STRING("intra_chroma_pred_mode"); + dP = &(currSlice->partArr[partMap[SE_INTRAPREDMODE]]); + + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + currSE.mapping = linfo_ue; + readSyntaxElement_UVLC(&currSE, dP); + currMB->c_ipred_mode = (char) currSE.value1; + } + else + { + currMB->c_ipred_mode = readCIPredMode_CABAC(currMB, &dP->de_cabac); + } + + + + if (currMB->c_ipred_mode < DC_PRED_8 || currMB->c_ipred_mode > PLANE_8) + { + error("illegal chroma intra pred mode!\n", 600); + } + } +} + + +/*! +************************************************************************ +* \brief +* Get current block spatial neighbors +************************************************************************ +*/ +void get_neighbors(Macroblock *currMB, // <-- current Macroblock + PixelPos *block, // <--> neighbor blocks + int mb_x, // <-- block x position + int mb_y, // <-- block y position + int blockshape_x // <-- block width + ) +{ + VideoParameters *p_Vid = currMB->p_Vid; + int i; + p_Vid->getNeighbourXPLumaNB(currMB, mb_x - 1, mb_y , &block[0]); // left + p_Vid->getNeighbourPXLumaNB(currMB, mb_x, mb_y - 1, &block[1]); // up + p_Vid->getNeighbourPXLuma(currMB, mb_x + blockshape_x, mb_y - 1, &block[2]); // upper right + p_Vid->getNeighbourLuma(currMB, mb_x - 1, mb_y - 1, &block[3]); // upper left + for (i = 0; i < 4; i++) + { + block[i].pos_x >>= 2; + block[i].pos_y >>= 2; + } + + if (mb_y > 0) + { + if (mb_x < 8) // first column of 8x8 blocks + { + if (mb_y == 8 ) + { + if (blockshape_x == MB_BLOCK_SIZE) + block[2].available = 0; + } + else if (mb_x+blockshape_x == 8) + { + block[2].available = 0; + } + } + else if (mb_x + blockshape_x == MB_BLOCK_SIZE) + { + block[2].available = 0; + } + } + + if (!block[2].available) + { + block[2] = block[3]; + } +} + +/* this version is for mb_x == 0, mb_y == 0 and blockshape_x == 16 */ +void get_neighbors0016(Macroblock *currMB, // <-- current Macroblock + PixelPos *block // <--> neighbor blocks + ) +{ + VideoParameters *p_Vid = currMB->p_Vid; + int i; + + p_Vid->getNeighbourLeftLuma(currMB, &block[0]); // left + p_Vid->getNeighbourPXLumaNB(currMB, 0, -1, &block[1]); // up + p_Vid->getNeighbourPXLuma(currMB, 16, -1, &block[2]); // upper right + p_Vid->getNeighbourLuma(currMB, -1, -1, &block[3]); // upper left + for (i = 0; i < 4; i++) + { + if (block[i].available) + { + block[i].pos_x >>= 2; + block[i].pos_y >>= 2; + } + } + + if (!block[2].available) + { + block[2] = block[3]; + } +} + +/*! +************************************************************************ +* \brief +* Read motion info +************************************************************************ +*/ +static void read_motion_info_from_NAL_p_slice(Macroblock *currMB) +{ + VideoParameters *p_Vid = currMB->p_Vid; + Slice *currSlice = currMB->p_Slice; + + int mb_nr = currMB->mbAddrX; + + DataPartition *dP = NULL; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + int partmode = ((currMB->mb_type == P8x8) ? 4 : currMB->mb_type); + int step_h0 = BLOCK_STEP [partmode][0]; + int step_v0 = BLOCK_STEP [partmode][1]; + h264_ref_t *pic_num; + + int j4; + StorablePicture *dec_picture = p_Vid->dec_picture; + PicMotionParams *motion = &dec_picture->motion; + + int list_offset = ((currSlice->mb_aff_frame_flag)&&(currMB->mb_field))? (mb_nr&0x01) ? 4 : 2 : 0; + + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + SyntaxElement currSE; + //===== READ REFERENCE PICTURE INDICES ===== + dP = &(currSlice->partArr[partMap[SE_REFFRAME]]); + // For LIST_0, if multiple ref. pictures, read LIST_0 reference picture indices for the MB *********** + prepareListforRefIdx (currMB, &currSE, currSlice->num_ref_idx_l0_active, (currMB->mb_type != P8x8) || (!p_Vid->allrefzero)); + readMBRefPictureIdx (&currSE, dP, currMB, &motion->motion[LIST_0][currMB->block_y], LIST_0, step_v0, step_h0); + + // For LIST_1, if multiple ref. pictures, read LIST_1 reference picture indices for the MB *********** + prepareListforRefIdx (currMB, &currSE, currSlice->num_ref_idx_l1_active, (currMB->mb_type != P8x8) || (!p_Vid->allrefzero)); + readMBRefPictureIdx (&currSE, dP, currMB, &motion->motion[LIST_1][currMB->block_y], LIST_1, step_v0, step_h0); + + //===== READ MOTION VECTORS ===== + dP = &(currSlice->partArr[partMap[SE_MVD]]); + + currSE.mapping = linfo_se; + readMBMotionVectors (&currSE, dP, currMB, LIST_0, step_h0, step_v0); + } + else + { + if (currMB->mb_type != P8x8 || !p_Vid->allrefzero) + { + //===== READ REFERENCE PICTURE INDICES ===== + dP = &(currSlice->partArr[partMap[SE_REFFRAME]]); + if (currSlice->num_ref_idx_l0_active > 1) + { + // For LIST_0, if multiple ref. pictures, read LIST_0 reference picture indices for the MB *********** + readMBRefPictureIdx_CABAC(dP, currMB, &motion->motion[LIST_0][currMB->block_y], LIST_0, step_v0, step_h0); + } + else + { + readMBRefPictureIdx_CABAC_NoReference(currMB, &motion->motion[LIST_0][currMB->block_y], LIST_0, step_v0, step_h0); + } + + if (currSlice->num_ref_idx_l1_active > 1) + { + // For LIST_1, if multiple ref. pictures, read LIST_1 reference picture indices for the MB *********** + readMBRefPictureIdx_CABAC(dP, currMB, &motion->motion[LIST_1][currMB->block_y], LIST_1, step_v0, step_h0); + } + else + { + readMBRefPictureIdx_CABAC_NoReference(currMB, &motion->motion[LIST_1][currMB->block_y], LIST_1, step_v0, step_h0); + } + } + else + { + readMBRefPictureIdx_CABAC_NoReference(currMB, &motion->motion[LIST_0][currMB->block_y], LIST_0, step_v0, step_h0); + readMBRefPictureIdx_CABAC_NoReference(currMB, &motion->motion[LIST_1][currMB->block_y], LIST_1, step_v0, step_h0); + } + //===== READ MOTION VECTORS ===== + dP = &(currSlice->partArr[partMap[SE_MVD]]); + + readMBMotionVectors_CABAC(dP, currMB, LIST_0, step_h0, step_v0); + + } + + // LIST_0 Motion vectors + + + // record reference picture Ids for deblocking decisions + pic_num = dec_picture->ref_pic_num[p_Vid->current_slice_nr][LIST_0 + list_offset]; + for(j4 = currMB->block_y; j4 < (currMB->block_y +4);++j4) + { + PicMotion *ref = &motion->motion[LIST_0][j4][currMB->block_x]; + ref[0].ref_pic_id = (ref[0].ref_idx >= 0)?pic_num[(short)ref[0].ref_idx]:UNDEFINED_REFERENCE; + ref[1].ref_pic_id = (ref[1].ref_idx >= 0)?pic_num[(short)ref[1].ref_idx]:UNDEFINED_REFERENCE; + ref[2].ref_pic_id = (ref[2].ref_idx >= 0)?pic_num[(short)ref[2].ref_idx]:UNDEFINED_REFERENCE; + ref[3].ref_pic_id = (ref[3].ref_idx >= 0)?pic_num[(short)ref[3].ref_idx]:UNDEFINED_REFERENCE; + } +} + +/*! +************************************************************************ +* \brief +* Read motion info +************************************************************************ +*/ +static void read_motion_info_from_NAL_b_slice (Macroblock *currMB) +{ + VideoParameters *p_Vid = currMB->p_Vid; + Slice *currSlice = currMB->p_Slice; + int i,j,k; + int mb_nr = currMB->mbAddrX; + DataPartition *dP = NULL; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + int partmode = ((currMB->mb_type == P8x8) ? 4 : currMB->mb_type); + int step_h0 = BLOCK_STEP [partmode][0]; + int step_v0 = BLOCK_STEP [partmode][1]; + + int i0, j0, j6; + + int j4, i4, ii; + StorablePicture *dec_picture = p_Vid->dec_picture; + PicMotionParams *motion = &dec_picture->motion; + MotionParams *colocated; + + int mv_scale = 0; + + int list_offset = ((currSlice->mb_aff_frame_flag)&&(currMB->mb_field))? (mb_nr&0x01) ? 4 : 2 : 0; + + + if ((currSlice->mb_aff_frame_flag) && (currMB->mb_field)) + { + if(mb_nr&0x01) + { + colocated = &currSlice->p_colocated->bottom; + } + else + { + colocated = &currSlice->p_colocated->top; + } + } + else + { + colocated = &currSlice->p_colocated->frame; + } + + if (currMB->mb_type == P8x8) + { + if (currSlice->direct_spatial_mv_pred_flag) + { + char l0_rFrame, l1_rFrame; + short pmvl0[2]={0,0}, pmvl1[2]={0,0}; + + prepare_direct_params(currMB, dec_picture, pmvl0, pmvl1, &l0_rFrame, &l1_rFrame); + + for (k = 0; k < 4; ++k) + { + if (currMB->b8mode[k] == 0) + { + i = currMB->block_x + 2 * (k & 0x01); + for(j = 2 * (k >> 1); j < 2 * (k >> 1)+2;++j) + { + j6 = currMB->block_y_aff + j; + j4 = currMB->block_y + j; + for(i4 = i; i4 < i + 2; ++i4) + { + if (l0_rFrame >= 0) + { + if (!l0_rFrame && ((!colocated->moving_block[j6][i4]) && (!p_Vid->listX[LIST_1 + list_offset][0]->is_long_term))) + { + motion->motion[LIST_0][j4][i4].mv[0] = 0; + motion->motion[LIST_0][j4][i4].mv[1] = 0; + motion->motion[LIST_0][j4][i4].ref_idx = 0; + } + else + { + motion->motion[LIST_0][j4][i4].mv[0] = pmvl0[0]; + motion->motion[LIST_0][j4][i4].mv[1] = pmvl0[1]; + motion->motion[LIST_0][j4][i4].ref_idx = l0_rFrame; + } + } + else + { + motion->motion[LIST_0][j4][i4].mv[0] = 0; + motion->motion[LIST_0][j4][i4].mv[1] = 0; + motion->motion[LIST_0][j4][i4].ref_idx = -1; + } + + if (l1_rFrame >= 0) + { + if (l1_rFrame==0 && ((!colocated->moving_block[j6][i4])&& (!p_Vid->listX[LIST_1 + list_offset][0]->is_long_term))) + { + motion->motion[LIST_1][j4][i4].mv[0] = 0; + motion->motion[LIST_1][j4][i4].mv[1] = 0; + motion->motion[LIST_1][j4][i4].ref_idx = 0; + } + else + { + motion->motion[LIST_1][j4][i4].mv[0] = pmvl1[0]; + motion->motion[LIST_1][j4][i4].mv[1] = pmvl1[1]; + motion->motion[LIST_1][j4][i4].ref_idx = l1_rFrame; + } + } + else + { + motion->motion[LIST_1][j4][i4].mv[0] = 0; + motion->motion[LIST_1][j4][i4].mv[1] = 0; + motion->motion[LIST_1][j4][i4].ref_idx = -1; + } + + if (l0_rFrame <0 && l1_rFrame <0) + { + motion->motion[LIST_0][j4][i4].ref_idx = 0; + motion->motion[LIST_1][j4][i4].ref_idx = 0; + } + } + } + } + } + } + else + { + for (k = 0; k < 4; ++k) // Scan all blocks + { + if (currMB->b8mode[k] == 0) + { + for(j0 = 2 * (k >> 1); j0 < 2 * (k >> 1) + 2; j0 += step_v0) + { + for(i0 = currMB->block_x + 2*(k & 0x01); i0 < currMB->block_x + 2 * (k & 0x01)+2; i0 += step_h0) + { + int refList = colocated->motion[LIST_0 ][currMB->block_y_aff + j0][i0].ref_idx== -1 ? LIST_1 : LIST_0; + int ref_idx = colocated->motion[refList][currMB->block_y_aff + j0][i0].ref_idx; + int mapped_idx = -1, iref; + + if (ref_idx == -1) + { + for (j4 = currMB->block_y + j0; j4 < currMB->block_y + j0 + step_v0; ++j4) + { + int h; + for (h=0;h<step_h0;h++) + { + PicMotion *m0 = &motion->motion[LIST_0][j4][i0+h]; + PicMotion *m1 = &motion->motion[LIST_1][j4][i0+h]; + m0->ref_idx = 0; + m1->ref_idx = 0; + memset(&m0->mv, 0, sizeof(MotionVector)); + memset(&m1->mv, 0, sizeof(MotionVector)); + } + } + } + else + { + for (iref = 0; iref < imin(currSlice->num_ref_idx_l0_active, p_Vid->listXsize[LIST_0 + list_offset]); ++iref) + { + int curr_mb_field = ((currSlice->mb_aff_frame_flag)&&(currMB->mb_field)); + + if(p_Vid->structure==0 && curr_mb_field==0) + { + // If the current MB is a frame MB and the colocated is from a field picture, + // then the colocated->ref_pic_id may have been generated from the wrong value of + // frame_poc if it references it's complementary field, so test both POC values + if(p_Vid->listX[0][iref]->top_poc * 2 == colocated->motion[refList][currMB->block_y_aff + j0][i0].ref_pic_id + || p_Vid->listX[0][iref]->bottom_poc * 2 == colocated->motion[refList][currMB->block_y_aff + j0][i0].ref_pic_id) + { + mapped_idx=iref; + break; + } + else //! invalid index. Default to zero even though this case should not happen + mapped_idx=INVALIDINDEX; + continue; + } + if (dec_picture->ref_pic_num[p_Vid->current_slice_nr][LIST_0 + list_offset][iref]==colocated->motion[refList][currMB->block_y_aff + j0][i0].ref_pic_id) + { + mapped_idx=iref; + break; + } + else //! invalid index. Default to zero even though this case should not happen + mapped_idx=INVALIDINDEX; + } + + if (INVALIDINDEX == mapped_idx) + { + error("temporal direct error: colocated block has ref that is unavailable",-1111); + } + + for (j = j0; j < j0 + step_v0; ++j) + { + j4 = currMB->block_y + j; + j6 = currMB->block_y_aff + j; + + for (i4 = i0; i4 < i0 + step_h0; ++i4) + { + mv_scale = currSlice->mvscale[LIST_0 + list_offset][mapped_idx]; + + motion->motion[LIST_0][j4][i4].ref_idx = (char) mapped_idx; + motion->motion[LIST_1][j4][i4].ref_idx = 0; + + if (mv_scale == 9999 || p_Vid->listX[LIST_0+list_offset][mapped_idx]->is_long_term) + { + for (ii=0; ii < 2; ++ii) + { + motion->motion[LIST_0][j4][i4].mv[ii] = colocated->motion[refList][j6][i4].mv[ii]; + motion->motion[LIST_1][j4][i4].mv[ii] = 0; + } + } + else + { + for (ii=0; ii < 2; ++ii) + { + motion->motion[LIST_0][j4][i4].mv[ii] = (short) ((mv_scale * colocated->motion[refList][j6][i4].mv[ii] + 128 ) >> 8); + motion->motion[LIST_1][j4][i4].mv[ii] = (short) (motion->motion[LIST_0][j4][i4].mv[ii] - colocated->motion[refList][j6][i4].mv[ii]); + } + } + } + } + } + } + } + } + } + } + } + + + + if (p_Vid->active_pps->entropy_coding_mode_flag == CAVLC) + { + SyntaxElement currSE; + //===== READ REFERENCE PICTURE INDICES ===== + dP = &(currSlice->partArr[partMap[SE_REFFRAME]]); + // For LIST_0, if multiple ref. pictures, read LIST_0 reference picture indices for the MB *********** + prepareListforRefIdx (currMB, &currSE, currSlice->num_ref_idx_l0_active, TRUE); + readMBRefPictureIdx (&currSE, dP, currMB, &motion->motion[LIST_0][currMB->block_y], LIST_0, step_v0, step_h0); + + // For LIST_1, if multiple ref. pictures, read LIST_1 reference picture indices for the MB *********** + prepareListforRefIdx (currMB, &currSE, currSlice->num_ref_idx_l1_active, TRUE); + readMBRefPictureIdx (&currSE, dP, currMB, &motion->motion[LIST_1][currMB->block_y], LIST_1, step_v0, step_h0); + + //===== READ MOTION VECTORS ===== + dP = &(currSlice->partArr[partMap[SE_MVD]]); + + currSE.mapping = linfo_se; + // LIST_0 Motion vectors + readMBMotionVectors (&currSE, dP, currMB, LIST_0, step_h0, step_v0); + // LIST_1 Motion vectors + readMBMotionVectors (&currSE, dP, currMB, LIST_1, step_h0, step_v0); + } + else + { + //===== READ REFERENCE PICTURE INDICES ===== + dP = &(currSlice->partArr[partMap[SE_REFFRAME]]); + if (currSlice->num_ref_idx_l0_active>1) + { + // For LIST_0, if multiple ref. pictures, read LIST_0 reference picture indices for the MB *********** + readMBRefPictureIdx_CABAC(dP, currMB, &motion->motion[LIST_0][currMB->block_y], LIST_0, step_v0, step_h0); + } + else + { + readMBRefPictureIdx_CABAC_NoReference(currMB, &motion->motion[LIST_0][currMB->block_y], LIST_0, step_v0, step_h0); + } + + if (currSlice->num_ref_idx_l1_active > 1) + { + // For LIST_1, if multiple ref. pictures, read LIST_1 reference picture indices for the MB *********** + readMBRefPictureIdx_CABAC(dP, currMB, &motion->motion[LIST_1][currMB->block_y], LIST_1, step_v0, step_h0); + } + else + { + readMBRefPictureIdx_CABAC_NoReference(currMB, &motion->motion[LIST_1][currMB->block_y], LIST_1, step_v0, step_h0); + } + + //===== READ MOTION VECTORS ===== + dP = &(currSlice->partArr[partMap[SE_MVD]]); + + // LIST_0 Motion vectors + readMBMotionVectors_CABAC(dP, currMB, LIST_0, step_h0, step_v0); + // LIST_1 Motion vectors + readMBMotionVectors_CABAC(dP, currMB, LIST_1, step_h0, step_v0); + } + + + + // record reference picture Ids for deblocking decisions + + for (k = LIST_0; k <= LIST_1; ++k) + { + const h264_ref_t *rec_pic_num = dec_picture->ref_pic_num[p_Vid->current_slice_nr][k+list_offset]; + PicMotion **list_motion = &motion->motion[k][currMB->block_y]; + for(j4 = 0; j4 < 4 ;++j4) + { + PicMotion *m = &list_motion[j4][currMB->block_x]; + m[0].ref_pic_id = (m[0].ref_idx>=0)?rec_pic_num[(short)m[0].ref_idx]:UNDEFINED_REFERENCE; + m[1].ref_pic_id = (m[1].ref_idx>=0)?rec_pic_num[(short)m[1].ref_idx]:UNDEFINED_REFERENCE; + m[2].ref_pic_id = (m[2].ref_idx>=0)?rec_pic_num[(short)m[2].ref_idx]:UNDEFINED_REFERENCE; + m[3].ref_pic_id = (m[3].ref_idx>=0)?rec_pic_num[(short)m[3].ref_idx]:UNDEFINED_REFERENCE; + } + } +} + +/*! +************************************************************************ +* \brief +* Get the Prediction from the Neighboring Blocks for Number of +* Nonzero Coefficients +* +* Luma Blocks +************************************************************************ +*/ +static int predict_nnz_cb(Macroblock *currMB, int i,int j) +{ + VideoParameters *p_Vid = currMB->p_Vid; + + PixelPos pix; + + int pred_nnz = 0; + int cnt = 0; + + // left block + p_Vid->getNeighbourLuma(currMB, i - 1, j, &pix); + + if (IS_INTRA(currMB) && pix.available && p_Vid->active_pps->constrained_intra_pred_flag && (p_Vid->currentSlice->dp_mode==PAR_DP_3)) + { + pix.available &= p_Vid->intra_block[pix.mb_addr]; + if (!pix.available) + ++cnt; + } + + if (pix.available) + { + pred_nnz = p_Vid->nz_coeff [pix.mb_addr ][1][pix.y>>2][pix.x>>2]; + ++cnt; + } + + // top block + p_Vid->getNeighbourLuma(currMB, i, j - 1, &pix); + + if (IS_INTRA(currMB) && pix.available && p_Vid->active_pps->constrained_intra_pred_flag && (p_Vid->currentSlice->dp_mode==PAR_DP_3)) + { + pix.available &= p_Vid->intra_block[pix.mb_addr]; + if (!pix.available) + ++cnt; + } + + if (pix.available) + { + pred_nnz += p_Vid->nz_coeff [pix.mb_addr ][1][pix.y>>2][pix.x>>2]; + ++cnt; + } + + if (cnt==2) + { + ++pred_nnz; + pred_nnz>>=1; + } + + return pred_nnz; +} + + +static int predict_nnz_cr(Macroblock *currMB, int i,int j) +{ + VideoParameters *p_Vid = currMB->p_Vid; + + PixelPos pix; + + int pred_nnz = 0; + int cnt = 0; + + // left block + p_Vid->getNeighbourLuma(currMB, i - 1, j, &pix); + + if (IS_INTRA(currMB) && pix.available && p_Vid->active_pps->constrained_intra_pred_flag && (p_Vid->currentSlice->dp_mode==PAR_DP_3)) + { + pix.available &= p_Vid->intra_block[pix.mb_addr]; + if (!pix.available) + ++cnt; + } + + if (pix.available) + { + pred_nnz = p_Vid->nz_coeff [pix.mb_addr ][2][pix.y>>2][pix.x>>2]; + ++cnt; + } + + // top block + p_Vid->getNeighbourLuma(currMB, i, j - 1, &pix); + + if (IS_INTRA(currMB) && pix.available && p_Vid->active_pps->constrained_intra_pred_flag && (p_Vid->currentSlice->dp_mode==PAR_DP_3)) + { + pix.available &= p_Vid->intra_block[pix.mb_addr]; + if (!pix.available) + ++cnt; + } + + if (pix.available) + { + pred_nnz += p_Vid->nz_coeff [pix.mb_addr ][2][pix.y>>2][pix.x>>2]; + ++cnt; + } + + if (cnt==2) + { + ++pred_nnz; + pred_nnz>>=1; + } + + return pred_nnz; +} + + +static int predict_nnz_luma(Macroblock *currMB, int i,int j) +{ + VideoParameters *p_Vid = currMB->p_Vid; + + PixelPos pix; + + int pred_nnz = 0; + int cnt = 0; + + // left block + p_Vid->getNeighbourXPLuma(currMB, i - 1, j, &pix); + + if (pix.available) + { + pred_nnz = p_Vid->nz_coeff [pix.mb_addr ][0][pix.y>>2][pix.x>>2]; + ++cnt; + } + + // top block + p_Vid->getNeighbourPXLuma(currMB, i, j - 1, &pix); + + if (pix.available) + { + pred_nnz += p_Vid->nz_coeff [pix.mb_addr ][0][pix.y>>2][pix.x>>2]; + ++cnt; + } + + if (cnt==2) + { + ++pred_nnz; + pred_nnz>>=1; + } + + return pred_nnz; +} + + +static int predict_nnz_luma_intra(Macroblock *currMB, int i,int j) +{ + VideoParameters *p_Vid = currMB->p_Vid; + + PixelPos pix; + + int pred_nnz = 0; + int cnt = 0; + + // left block + p_Vid->getNeighbourXPLuma(currMB, i - 1, j, &pix); + + if (pix.available && p_Vid->active_pps->constrained_intra_pred_flag && (p_Vid->currentSlice->dp_mode==PAR_DP_3)) + { + pix.available &= p_Vid->intra_block[pix.mb_addr]; + if (!pix.available) + ++cnt; + } + + if (pix.available) + { + pred_nnz = p_Vid->nz_coeff [pix.mb_addr ][0][pix.y>>2][pix.x>>2]; + ++cnt; + } + + // top block + p_Vid->getNeighbourPXLuma(currMB, i, j - 1, &pix); + + if (pix.available && p_Vid->active_pps->constrained_intra_pred_flag && (p_Vid->currentSlice->dp_mode==PAR_DP_3)) + { + pix.available &= p_Vid->intra_block[pix.mb_addr]; + if (!pix.available) + ++cnt; + } + + if (pix.available) + { + pred_nnz += p_Vid->nz_coeff [pix.mb_addr ][0][pix.y>>2][pix.x>>2]; + ++cnt; + } + + if (cnt==2) + { + ++pred_nnz; + pred_nnz>>=1; + } + + return pred_nnz; +} + + +/*! +************************************************************************ +* \brief +* Get the Prediction from the Neighboring Blocks for Number of +* Nonzero Coefficients +* +* Chroma Blocks +************************************************************************ +*/ +static int predict_nnz_chroma_inter(Macroblock *currMB, int i,int j) +{ + VideoParameters *p_Vid = currMB->p_Vid; + StorablePicture *dec_picture = p_Vid->dec_picture; + PixelPos pix; + + int pred_nnz = 0; + int cnt = 0; + + if (dec_picture->chroma_format_idc != YUV444) + { + //YUV420 and YUV422 + // left block + p_Vid->getNeighbour(currMB, ((i&0x01)<<2) - 1, j, p_Vid->mb_size[IS_CHROMA], &pix); + if (pix.available) + { + pred_nnz = p_Vid->nz_coeff [pix.mb_addr ][1][pix.y>>2][2 * (i>>1) + (pix.x>>2)]; + ++cnt; + } + + // top block + p_Vid->getNeighbour(currMB, ((i&0x01)<<2), j - 1, p_Vid->mb_size[IS_CHROMA], &pix); + if (pix.available) + { + pred_nnz += p_Vid->nz_coeff [pix.mb_addr ][1][pix.y>>2][2 * (i>>1) + (pix.x>>2)]; + ++cnt; + } + + if (cnt==2) + { + ++pred_nnz; + pred_nnz >>= 1; + } + } + + return pred_nnz; +} + + +static int predict_nnz_chroma_intra(Macroblock *currMB, int i,int j) +{ + VideoParameters *p_Vid = currMB->p_Vid; + StorablePicture *dec_picture = p_Vid->dec_picture; + PixelPos pix; + + int pred_nnz = 0; + int cnt = 0; + + if (dec_picture->chroma_format_idc != YUV444) + { + //YUV420 and YUV422 + // left block + p_Vid->getNeighbour(currMB, ((i&0x01)<<2) - 1, j, p_Vid->mb_size[IS_CHROMA], &pix); + + if (pix.available && p_Vid->active_pps->constrained_intra_pred_flag && (p_Vid->currentSlice->dp_mode==PAR_DP_3)) + { + pix.available &= p_Vid->intra_block[pix.mb_addr]; + if (!pix.available) + ++cnt; + } + + if (pix.available) + { + pred_nnz = p_Vid->nz_coeff [pix.mb_addr ][1][pix.y>>2][2 * (i>>1) + (pix.x>>2)]; + ++cnt; + } + + // top block + p_Vid->getNeighbour(currMB, ((i&0x01)<<2), j - 1, p_Vid->mb_size[IS_CHROMA], &pix); + + if (pix.available && p_Vid->active_pps->constrained_intra_pred_flag && (p_Vid->currentSlice->dp_mode==PAR_DP_3)) + { + pix.available &= p_Vid->intra_block[pix.mb_addr]; + if (!pix.available) + ++cnt; + } + + if (pix.available) + { + pred_nnz += p_Vid->nz_coeff [pix.mb_addr ][1][pix.y>>2][2 * (i>>1) + (pix.x>>2)]; + ++cnt; + } + + if (cnt==2) + { + ++pred_nnz; + pred_nnz >>= 1; + } + } + + return pred_nnz; +} + + +/*! +************************************************************************ +* \brief +* Reads coeff of an 4x4 block (CAVLC) +* +* \author +* Karl Lillevold <karll@real.com> +* contributions by James Au <james@ubvideo.com> +************************************************************************ +*/ +static void readCoeff4x4_CAVLC_Luma (Macroblock *currMB, + int i, int j, int levarr[16], int runarr[16], + int *number_coefficients) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + int mb_nr = currMB->mbAddrX; + SyntaxElement currSE; + DataPartition *dP; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + Bitstream *currStream; + + int k, code, vlcnum; + int numcoeff = 0, numtrailingones, numcoeff_vlc; + int level_two_or_higher; + int numones, totzeros, abslevel; + int zerosleft; + int nnz; + static const int incVlc[] = {0,3,6,12,24,48,32768}; // maximum vlc = 6 + + p_Vid->nz_coeff[mb_nr][0][j][i] = 0; + + if (IS_INTRA (currMB)) + { + dP = &(currSlice->partArr[partMap[SE_LUM_AC_INTRA]]); + nnz = predict_nnz_luma_intra(currMB, i<<2, j<<2); + } + else + { + dP = &(currSlice->partArr[partMap[SE_LUM_AC_INTER]]); + nnz = predict_nnz_luma(currMB, i<<2, j<<2); + } + + if (nnz < 2) + { + numcoeff_vlc = 0; + } + else if (nnz < 4) + { + numcoeff_vlc = 1; + } + else if (nnz < 8) + { + numcoeff_vlc = 2; + } + else // + { + numcoeff_vlc = 3; + } + + currStream = dP->bitstream; + readSyntaxElement_NumCoeffTrailingOnes(&currSE, currStream, numcoeff_vlc); + + numcoeff = currSE.value1; + numtrailingones = currSE.value2; + + p_Vid->nz_coeff[mb_nr][0][j][i] = (byte) numcoeff; + + memzero64(levarr); + memzero64(runarr); + + numones = numtrailingones; + *number_coefficients = numcoeff; + + if (numcoeff) + { + if (numtrailingones) + { + code = readSyntaxElement_FLC(currStream, numtrailingones); + + for (k=0;k<numtrailingones;k++) + { +#ifdef _M_IX86 + levarr[k+numcoeff-numtrailingones] = ((_bittest((const long *)&code, k)<<1) ^ 0xFFFFFFFF) + 2; +#else + levarr[k+numcoeff-numtrailingones] = (code>>k)&1 ? -1:1; +#endif + } + } + + // decode levels + level_two_or_higher = (numcoeff > 3 && numtrailingones == 3)? 0 : 1; + vlcnum = (numcoeff > 10 && numtrailingones < 3) ? 1 : 0; + + for (k = numcoeff - 1 - numtrailingones; k >= 0; k--) + { + int level; + if (vlcnum == 0) + level=readSyntaxElement_Level_VLC0(currStream); + else + level=readSyntaxElement_Level_VLCN(vlcnum, currStream); + + if (level_two_or_higher) + { + level += (level > 0) ? 1 : -1; + level_two_or_higher = 0; + } + + levarr[k] = level; + abslevel = iabs(levarr[k]); + if (abslevel == 1) + ++numones; + + // update VLC table + if (abslevel > incVlc[vlcnum]) + ++vlcnum; + + if (k == numcoeff - 1 - numtrailingones && abslevel >3) + vlcnum = 2; + } + + if (numcoeff < 16) + { + // decode total run + vlcnum = numcoeff - 1; + totzeros = readSyntaxElement_TotalZeros(currStream, vlcnum); + } + else + { + totzeros = 0; + } + + // decode run before each coefficient + zerosleft = totzeros; + i = numcoeff - 1; + + if (zerosleft > 0 && i > 0) + { + do + { + // select VLC for runbefore + vlcnum = imin(zerosleft - 1, RUNBEFORE_NUM_M1); + + runarr[i] = readSyntaxElement_Run(currStream, vlcnum); + + zerosleft -= runarr[i]; + i --; + } while (zerosleft != 0 && i != 0); + } + runarr[i] = zerosleft; + } // if numcoeff +} + + +static void readCoeff4x4_CAVLC_ChromaAC(Macroblock *currMB, + int i, int j, int levarr[16], int runarr[16], + int *number_coefficients) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + int mb_nr = currMB->mbAddrX; + SyntaxElement currSE; + DataPartition *dP; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + Bitstream *currStream; + + int k, code, vlcnum; + int numcoeff = 0, numtrailingones, numcoeff_vlc; + int level_two_or_higher; + int numones, totzeros, abslevel; + int zerosleft, ntr; + int nnz; + static const int incVlc[] = {0,3,6,12,24,48,32768}; // maximum vlc = 6 + + TRACE_PRINTF("ChrDC"); + p_Vid->nz_coeff[mb_nr][0][j][i] = 0; + + if (IS_INTRA (currMB)) + { + dP = &(currSlice->partArr[partMap[SE_CHR_AC_INTRA]]); + nnz = predict_nnz_chroma_intra(currMB, i, ((j-4)<<2)); + } + else + { + dP = &(currSlice->partArr[partMap[SE_CHR_AC_INTER]]); + nnz = predict_nnz_chroma_inter(currMB, i, ((j-4)<<2)); + } + currStream = dP->bitstream; + + + // luma or chroma AC + + if (nnz < 2) + { + numcoeff_vlc = 0; + } + else if (nnz < 4) + { + numcoeff_vlc = 1; + } + else if (nnz < 8) + { + numcoeff_vlc = 2; + } + else // + { + numcoeff_vlc = 3; + } + + readSyntaxElement_NumCoeffTrailingOnes(&currSE, currStream, numcoeff_vlc); + + numcoeff = currSE.value1; + numtrailingones = currSE.value2; + + + p_Vid->nz_coeff[mb_nr][0][j][i] = (byte) numcoeff; + + memzero64(levarr); + memzero64(runarr); + + numones = numtrailingones; + *number_coefficients = numcoeff; + + if (numcoeff) + { + if (numtrailingones) + { + code = readSyntaxElement_FLC (currStream, numtrailingones); + + ntr = numtrailingones; + for (k = numcoeff - 1; k > numcoeff - 1 - numtrailingones; k--) + { + ntr --; + levarr[k] = (code>>ntr)&1 ? -1 : 1; + } + } + + // decode levels + level_two_or_higher = (numcoeff > 3 && numtrailingones == 3)? 0 : 1; + vlcnum = (numcoeff > 10 && numtrailingones < 3) ? 1 : 0; + + for (k = numcoeff - 1 - numtrailingones; k >= 0; k--) + { + +#if TRACE + snprintf(currSE.tracestring, + TRACESTRING_SIZE, "%s lev (%d,%d) k=%d vlc=%d ", type, i, j, k, vlcnum); +#endif + + int level; + if (vlcnum == 0) + level=readSyntaxElement_Level_VLC0(currStream); + else + level=readSyntaxElement_Level_VLCN(vlcnum, currStream); + + if (level_two_or_higher) + { + level += (level > 0) ? 1 : -1; + level_two_or_higher = 0; + } + + levarr[k] = level; + abslevel = iabs(levarr[k]); + if (abslevel == 1) + ++numones; + + // update VLC table + if (abslevel > incVlc[vlcnum]) + ++vlcnum; + + if (k == numcoeff - 1 - numtrailingones && abslevel >3) + vlcnum = 2; + } + + if (numcoeff < 15) + { + // decode total run + vlcnum = numcoeff - 1; + totzeros = readSyntaxElement_TotalZeros(currStream, vlcnum); + } + else + { + totzeros = 0; + } + + // decode run before each coefficient + zerosleft = totzeros; + i = numcoeff - 1; + + if (zerosleft > 0 && i > 0) + { + do + { + // select VLC for runbefore + vlcnum = imin(zerosleft - 1, RUNBEFORE_NUM_M1); + + runarr[i] = readSyntaxElement_Run(currStream, vlcnum); + + zerosleft -= runarr[i]; + i --; + } while (zerosleft != 0 && i != 0); + } + runarr[i] = zerosleft; + } // if numcoeff +} + +static void readCoeff4x4_CAVLC_ChromaDC(Macroblock *currMB, int i, int j, int levarr[16], int runarr[16], int *number_coefficients) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + int mb_nr = currMB->mbAddrX; + SyntaxElement currSE; + DataPartition *dP; + Bitstream *currStream; + + int k, code, vlcnum; + int numcoeff = 0, numtrailingones; + int level_two_or_higher; + int numones, totzeros, abslevel; + int zerosleft, ntr; + int max_coeff_num; + static const int incVlc[] = {0,3,6,12,24,48,32768}; // maximum vlc = 6 + + max_coeff_num = p_Vid->num_cdc_coeff; + TRACE_PRINTF("ChrDC"); + p_Vid->nz_coeff[mb_nr][0][j][i] = 0; + if (IS_INTRA (currMB)) + dP = &(currSlice->partArr[assignSE2partition[currSlice->dp_mode][SE_CHR_DC_INTRA]]); + else + dP = &(currSlice->partArr[assignSE2partition[currSlice->dp_mode][SE_CHR_DC_INTER]]); + currStream = dP->bitstream; + + readSyntaxElement_NumCoeffTrailingOnesChromaDC(p_Vid, &currSE, currStream); + + numcoeff = currSE.value1; + numtrailingones = currSE.value2; + + memzero64(levarr); + memzero64(runarr); + + numones = numtrailingones; + *number_coefficients = numcoeff; + + if (numcoeff) + { + if (numtrailingones) + { + code = readSyntaxElement_FLC (currStream, numtrailingones); + + ntr = numtrailingones; + for (k = numcoeff - 1; k > numcoeff - 1 - numtrailingones; k--) + { + ntr --; + levarr[k] = (code>>ntr)&1 ? -1 : 1; + } + } + + // decode levels + level_two_or_higher = (numcoeff > 3 && numtrailingones == 3)? 0 : 1; + vlcnum = (numcoeff > 10 && numtrailingones < 3) ? 1 : 0; + + for (k = numcoeff - 1 - numtrailingones; k >= 0; k--) + { + int level; + if (vlcnum == 0) + level=readSyntaxElement_Level_VLC0(currStream); + else + level=readSyntaxElement_Level_VLCN(vlcnum, currStream); + + if (level_two_or_higher) + { + level += (level > 0) ? 1 : -1; + level_two_or_higher = 0; + } + + levarr[k] = level; + abslevel = iabs(levarr[k]); + if (abslevel == 1) + ++numones; + + // update VLC table + if (abslevel > incVlc[vlcnum]) + ++vlcnum; + + if (k == numcoeff - 1 - numtrailingones && abslevel >3) + vlcnum = 2; + } + + if (numcoeff < max_coeff_num) + { + // decode total run + vlcnum = numcoeff - 1; + totzeros = readSyntaxElement_TotalZerosChromaDC(p_Vid, currStream, vlcnum); + } + else + { + totzeros = 0; + } + + // decode run before each coefficient + zerosleft = totzeros; + i = numcoeff - 1; + + if (zerosleft > 0 && i > 0) + { + do + { + // select VLC for runbefore + vlcnum = imin(zerosleft - 1, RUNBEFORE_NUM_M1); + + runarr[i] = readSyntaxElement_Run(currStream, vlcnum); + + zerosleft -= runarr[i]; + i --; + } while (zerosleft != 0 && i != 0); + } + runarr[i] = zerosleft; + } // if numcoeff +} + +static void readCoeff4x4_CAVLC(Macroblock *currMB, int block_type, int i, int j, int levarr[16], int runarr[16], int *number_coefficients) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + int mb_nr = currMB->mbAddrX; + SyntaxElement currSE; + DataPartition *dP; + Bitstream *currStream; + + int k, code, vlcnum; + int numcoeff = 0, numtrailingones, numcoeff_vlc; + int level_two_or_higher; + int numones, totzeros, abslevel; + int zerosleft, ntr, dptype = 0; + int max_coeff_num, nnz; + static const int incVlc[] = {0,3,6,12,24,48,32768}; // maximum vlc = 6 + + switch (block_type) + { + case LUMA: + readCoeff4x4_CAVLC_Luma(currMB, i, j, levarr, runarr, number_coefficients); + return; + case LUMA_INTRA16x16DC: + max_coeff_num = 16; + TRACE_PRINTF("Lum16DC"); + dptype = SE_LUM_DC_INTRA; + p_Vid->nz_coeff[mb_nr][0][j][i] = 0; + break; + case LUMA_INTRA16x16AC: + max_coeff_num = 15; + TRACE_PRINTF("Lum16AC"); + dptype = SE_LUM_AC_INTRA; + p_Vid->nz_coeff[mb_nr][0][j][i] = 0; + break; + case CB: + max_coeff_num = 16; + TRACE_PRINTF("Luma_add1"); + dptype = (IS_INTRA (currMB)) ? SE_LUM_AC_INTRA : SE_LUM_AC_INTER; + p_Vid->nz_coeff[mb_nr][1][j][i] = 0; + break; + case CB_INTRA16x16DC: + max_coeff_num = 16; + TRACE_PRINTF("Luma_add1_16DC"); + dptype = SE_LUM_DC_INTRA; + p_Vid->nz_coeff[mb_nr][1][j][i] = 0; + break; + case CB_INTRA16x16AC: + max_coeff_num = 15; + TRACE_PRINTF("Luma_add1_16AC"); + dptype = SE_LUM_AC_INTRA; + p_Vid->nz_coeff[mb_nr][1][j][i] = 0; + break; + case CR: + max_coeff_num = 16; + TRACE_PRINTF("Luma_add2"); + dptype = (IS_INTRA (currMB)) ? SE_LUM_AC_INTRA : SE_LUM_AC_INTER; + p_Vid->nz_coeff[mb_nr][2][j][i] = 0; + break; + case CR_INTRA16x16DC: + max_coeff_num = 16; + TRACE_PRINTF("Luma_add2_16DC"); + dptype = SE_LUM_DC_INTRA; + p_Vid->nz_coeff[mb_nr][2][j][i] = 0; + break; + case CR_INTRA16x16AC: + max_coeff_num = 15; + TRACE_PRINTF("Luma_add1_16AC"); + dptype = SE_LUM_AC_INTRA; + p_Vid->nz_coeff[mb_nr][2][j][i] = 0; + break; + case CHROMA_DC: + readCoeff4x4_CAVLC_ChromaDC(currMB, i, j, levarr, runarr, number_coefficients); + return; + case CHROMA_AC: + readCoeff4x4_CAVLC_ChromaAC(currMB, i, j, levarr, runarr, number_coefficients); + return; + default: + error ("readCoeff4x4_CAVLC: invalid block type", 600); + p_Vid->nz_coeff[mb_nr][0][j][i] = 0; + break; + } + + dP = &(currSlice->partArr[assignSE2partition[currSlice->dp_mode][dptype]]); + currStream = dP->bitstream; + + // luma or chroma AC + if(block_type==LUMA_INTRA16x16DC || block_type==LUMA_INTRA16x16AC) + { + nnz = predict_nnz_luma_intra(currMB, i<<2, j<<2); + } + else if (block_type==CB || block_type==CB_INTRA16x16DC || block_type==CB_INTRA16x16AC) + { + nnz = predict_nnz_cb(currMB, i<<2, j<<2); + } + else + { + nnz = predict_nnz_cr(currMB, i<<2, j<<2); + } + + if (nnz < 2) + { + numcoeff_vlc = 0; + } + else if (nnz < 4) + { + numcoeff_vlc = 1; + } + else if (nnz < 8) + { + numcoeff_vlc = 2; + } + else // + { + numcoeff_vlc = 3; + } + + readSyntaxElement_NumCoeffTrailingOnes(&currSE, currStream, numcoeff_vlc); + + numcoeff = currSE.value1; + numtrailingones = currSE.value2; + + if(block_type==LUMA_INTRA16x16DC || block_type==LUMA_INTRA16x16AC) + p_Vid->nz_coeff[mb_nr][0][j][i] = (byte) numcoeff; + else if (block_type==CB || block_type==CB_INTRA16x16DC || block_type==CB_INTRA16x16AC) + p_Vid->nz_coeff[mb_nr][1][j][i] = (byte) numcoeff; + else + p_Vid->nz_coeff[mb_nr][2][j][i] = (byte) numcoeff; + + + memzero64(levarr); + memzero64(runarr); + + numones = numtrailingones; + *number_coefficients = numcoeff; + + if (numcoeff) + { + if (numtrailingones) + { + code = readSyntaxElement_FLC(currStream, numtrailingones); + + ntr = numtrailingones; + for (k = numcoeff - 1; k > numcoeff - 1 - numtrailingones; k--) + { + ntr --; + levarr[k] = (code>>ntr)&1 ? -1 : 1; + } + } + + // decode levels + level_two_or_higher = (numcoeff > 3 && numtrailingones == 3)? 0 : 1; + vlcnum = (numcoeff > 10 && numtrailingones < 3) ? 1 : 0; + + for (k = numcoeff - 1 - numtrailingones; k >= 0; k--) + { + int level; + if (vlcnum == 0) + level=readSyntaxElement_Level_VLC0(currStream); + else + level=readSyntaxElement_Level_VLCN(vlcnum, currStream); + + if (level_two_or_higher) + { + level += (level > 0) ? 1 : -1; + level_two_or_higher = 0; + } + + levarr[k] = level; + abslevel = iabs(levarr[k]); + if (abslevel == 1) + ++numones; + + // update VLC table + if (abslevel > incVlc[vlcnum]) + ++vlcnum; + + if (k == numcoeff - 1 - numtrailingones && abslevel >3) + vlcnum = 2; + } + + if (numcoeff < max_coeff_num) + { + // decode total run + vlcnum = numcoeff - 1; + totzeros = readSyntaxElement_TotalZeros(currStream, vlcnum); + } + else + { + totzeros = 0; + } + + // decode run before each coefficient + zerosleft = totzeros; + i = numcoeff - 1; + + if (zerosleft > 0 && i > 0) + { + do + { + // select VLC for runbefore + vlcnum = imin(zerosleft - 1, RUNBEFORE_NUM_M1); + + runarr[i] = readSyntaxElement_Run(currStream, vlcnum); + + zerosleft -= runarr[i]; + i --; + } while (zerosleft != 0 && i != 0); + } + runarr[i] = zerosleft; + } // if numcoeff +} + +/*! +************************************************************************ +* \brief +* Get coefficients (run/level) of 4x4 blocks in a SMB +* from the NAL (CABAC Mode) +************************************************************************ +*/ +static void readCompCoeff4x4SMB_I16MB_CABAC(Macroblock *currMB, int context, h264_short_block_t *blocks, int block_y, int block_x, int64 *cbp_blk) +{ + // start_scan == 1 + int i,j,k; + RunLevel rl; + VideoParameters *p_Vid = currMB->p_Vid; + Slice *currSlice = currMB->p_Slice; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + + const byte *pos_scan4x4 = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN_1D : FIELD_SCAN_1D; + const byte *pos_scan_4x4; + // make distinction between INTRA and INTER coded luminance coefficients + int type = (currMB->is_intra_block ? SE_LUM_AC_INTRA : SE_LUM_AC_INTER); + DecodingEnvironment *de_cabac = &currSlice->partArr[partMap[type]].de_cabac; + + for (j = 0; j < BLOCK_SIZE_8x8; j += BLOCK_SIZE) + { + currMB->subblock_y = block_y + j; // position for coeff_count ctx + + for (i = 0; i < BLOCK_SIZE_8x8; i += BLOCK_SIZE) + { + int16_t *block = (int16_t *)(*blocks++); + currMB->subblock_x = block_x + i; // position for coeff_count ctx + pos_scan_4x4 = &pos_scan4x4[1]; + for(k = 0; k < 16; k++) + { + rl = readRunLevel_CABAC(currMB, de_cabac, context); + + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + block[*pos_scan_4x4++] = rl.level; + } + else + break; + } + } + } +} + +#ifdef _M_IX86 +static void readCompCoeff4x4SMB_CABAC(Macroblock *currMB, int context, h264_short_block_t *blocks, int block_y, int block_x, int64_t *cbp_blk64) +#else +static void readCompCoeff4x4SMB_CABAC(Macroblock *currMB, int context, h264_short_block_t *blocks, int block_y, int block_x, int64_t *cbp_blk) +#endif +{ + int k; + RunLevel rl; + VideoParameters *p_Vid = currMB->p_Vid; + Slice *currSlice = currMB->p_Slice; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + const byte *pos_scan4x4 = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN_1D : FIELD_SCAN_1D; + const byte *pos_scan_4x4; + int16_t *block; +#ifdef _M_IX86 + int32_t *cbp_blk = (int32_t *)cbp_blk64; +#endif + //h264_short_block_t *blocks = &currSlice->cof4[pl][cof4_pos_to_subblock[block_y>>2][block_x>>2]]; + DecodingEnvironment *de_cabac_dc, *de_cabac_ac; + /* + * make distinction between INTRA and INTER coded + * luminance coefficients + */ + if (currMB->is_intra_block) + { + de_cabac_dc = &currSlice->partArr[partMap[SE_LUM_DC_INTRA]].de_cabac; + de_cabac_ac = &currSlice->partArr[partMap[SE_LUM_AC_INTRA]].de_cabac; + } + else + { + de_cabac_dc = &currSlice->partArr[partMap[SE_LUM_DC_INTER]].de_cabac; + de_cabac_ac = &currSlice->partArr[partMap[SE_LUM_AC_INTER]].de_cabac; + } +// for (j = block_y; j < (block_y+BLOCK_SIZE_8x8); j += 4) + + + block = (int16_t *)(*blocks++); + currMB->subblock_y = block_y; // position for coeff_count ctx + currMB->subblock_x = block_x; // position for coeff_count ctx + pos_scan_4x4 = pos_scan4x4; + rl = readRunLevel_CABAC(currMB, de_cabac_dc, context); + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + *cbp_blk |= 1 << (block_y + (block_x >> 2)) ; + block[*pos_scan_4x4++] = rl.level; + for(k = 0; k < 16; ++k) + { + rl = readRunLevel_CABAC(currMB, de_cabac_ac, context); + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + block[*pos_scan_4x4++] = rl.level; + } + else + break; + } + } + + block = (int16_t *)(*blocks++); + currMB->subblock_x += 4; // position for coeff_count ctx + pos_scan_4x4 = pos_scan4x4; + rl = readRunLevel_CABAC(currMB, de_cabac_dc, context); + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + *cbp_blk |= 2 << (block_y + (block_x >> 2)) ; + block[*pos_scan_4x4++] = rl.level; + for(k = 0; k < 16; ++k) + { + rl = readRunLevel_CABAC(currMB, de_cabac_ac, context); + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + block[*pos_scan_4x4++] = rl.level; + } + else + break; + } + } + /* ---- */ + block = (int16_t *)(*blocks++); + currMB->subblock_y += 4; // position for coeff_count ctx + currMB->subblock_x = block_x; // position for coeff_count ctx + pos_scan_4x4 = pos_scan4x4; + rl = readRunLevel_CABAC(currMB, de_cabac_dc, context); + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + *cbp_blk |= 16 << (block_y + (block_x >> 2)) ; + block[*pos_scan_4x4++] = rl.level; + for(k = 0; k < 16; ++k) + { + rl = readRunLevel_CABAC(currMB, de_cabac_ac, context); + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + block[*pos_scan_4x4++] = rl.level; + } + else + break; + } + } + + block = (int16_t *)(*blocks++); + currMB->subblock_x += 4; // position for coeff_count ctx + pos_scan_4x4 = pos_scan4x4; + rl = readRunLevel_CABAC(currMB, de_cabac_dc, context); + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + *cbp_blk |= 32 << (block_y + (block_x >> 2)) ; + block[*pos_scan_4x4++] = rl.level; + for(k = 0; k < 16; ++k) + { + rl = readRunLevel_CABAC(currMB, de_cabac_ac, context); + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + block[*pos_scan_4x4++] = rl.level; + } + else + break; + } + } + +} + +#if defined(_DEBUG) || defined(_M_IX64) +static void inv_level_coefficients(h264_short_block_t *blocks, const int (*InvLevelScale)[4], int qp_per) +{ + int j, b; + + for (b = 0;b<4;b++) + { + h264_short_block_row_t *block = blocks[b]; + for (j = 0; j < 4; ++j) + { + if (block[j][0]) block[j][0]= rshift_rnd_sf((block[j][0] * InvLevelScale[j][0]) << qp_per, 4); + if (block[j][1]) block[j][1]= rshift_rnd_sf((block[j][1] * InvLevelScale[j][1]) << qp_per, 4); + if (block[j][2]) block[j][2]= rshift_rnd_sf((block[j][2] * InvLevelScale[j][2]) << qp_per, 4); + if (block[j][3]) block[j][3]= rshift_rnd_sf((block[j][3] * InvLevelScale[j][3]) << qp_per, 4); + } + } +} +#else +void inv_level_coefficients(h264_short_block_t *blocks, const int (*InvLevelScale)[4], int qp_per); +#endif + +static void inv_level_coefficients_AC(h264_short_block_t *blocks, const int (*InvLevelScale)[4], int qp_per) +{ + int b; + + for (b = 0;b<4;b++) + { + h264_short_block_row_t *block = blocks[b]; + if (block[0][1]) block[0][1]= rshift_rnd_sf((block[0][1] * InvLevelScale[0][1]) << qp_per, 4); + if (block[0][2]) block[0][2]= rshift_rnd_sf((block[0][2] * InvLevelScale[0][2]) << qp_per, 4); + if (block[0][3]) block[0][3]= rshift_rnd_sf((block[0][3] * InvLevelScale[0][3]) << qp_per, 4); + + if (block[1][0]) block[1][0]= rshift_rnd_sf((block[1][0] * InvLevelScale[1][0]) << qp_per, 4); + if (block[1][1]) block[1][1]= rshift_rnd_sf((block[1][1] * InvLevelScale[1][1]) << qp_per, 4); + if (block[1][2]) block[1][2]= rshift_rnd_sf((block[1][2] * InvLevelScale[1][2]) << qp_per, 4); + if (block[1][3]) block[1][3]= rshift_rnd_sf((block[1][3] * InvLevelScale[1][3]) << qp_per, 4); + + if (block[2][0]) block[2][0]= rshift_rnd_sf((block[2][0] * InvLevelScale[2][0]) << qp_per, 4); + if (block[2][1]) block[2][1]= rshift_rnd_sf((block[2][1] * InvLevelScale[2][1]) << qp_per, 4); + if (block[2][2]) block[2][2]= rshift_rnd_sf((block[2][2] * InvLevelScale[2][2]) << qp_per, 4); + if (block[2][3]) block[2][3]= rshift_rnd_sf((block[2][3] * InvLevelScale[2][3]) << qp_per, 4); + + if (block[3][0]) block[3][0]= rshift_rnd_sf((block[3][0] * InvLevelScale[3][0]) << qp_per, 4); + if (block[3][1]) block[3][1]= rshift_rnd_sf((block[3][1] * InvLevelScale[3][1]) << qp_per, 4); + if (block[3][2]) block[3][2]= rshift_rnd_sf((block[3][2] * InvLevelScale[3][2]) << qp_per, 4); + if (block[3][3]) block[3][3]= rshift_rnd_sf((block[3][3] * InvLevelScale[3][3]) << qp_per, 4); + } +} + +/*! +************************************************************************ +* \brief +* Get coefficients (run/level) of all 4x4 blocks in a MB +* from the NAL (CABAC Mode) +************************************************************************ +*/ +static void readCompCoeff4x4MB_CABAC(Macroblock *currMB, ColorPlane pl, int intra, int (*InvLevelScale4x4)[4], int qp_per, int cbp) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + int start_scan = IS_I16MB (currMB)? 1 : 0; + int64 *cbp_blk = &currMB->cbp_blk[pl]; + int context; + h264_short_block_t *blocks = currSlice->cof4[pl]; + + currMB->is_intra_block = intra; + + if( pl == PLANE_Y || IS_INDEPENDENT(p_Vid) ) + context = (IS_I16MB(currMB) ? LUMA_16AC: LUMA_4x4); + else if (pl == PLANE_U) + context = (IS_I16MB(currMB) ? CB_16AC: CB_4x4); + else + context = (IS_I16MB(currMB) ? CR_16AC: CR_4x4); + if (start_scan == 0) + { + if (currMB->is_lossless == FALSE) + { + if (cbp & 1) + { + readCompCoeff4x4SMB_CABAC(currMB, context, &blocks[0], 0, 0, cbp_blk); + inv_level_coefficients(&blocks[0], InvLevelScale4x4, qp_per); + } + if (cbp & 2) + { + readCompCoeff4x4SMB_CABAC(currMB, context, &blocks[4], 0, 8, cbp_blk); + inv_level_coefficients(&blocks[4], InvLevelScale4x4, qp_per); + } + if (cbp & 4) + { + readCompCoeff4x4SMB_CABAC(currMB, context, &blocks[8], 8, 0, cbp_blk); + inv_level_coefficients(&blocks[8], InvLevelScale4x4, qp_per); + } + if (cbp & 8) + { + readCompCoeff4x4SMB_CABAC(currMB, context, &blocks[12], 8, 8, cbp_blk); + inv_level_coefficients(&blocks[12], InvLevelScale4x4, qp_per); + } + } + else + { + if (cbp & 1) + readCompCoeff4x4SMB_CABAC(currMB, context, &blocks[0], 0, 0, cbp_blk); + if (cbp & 2) + readCompCoeff4x4SMB_CABAC(currMB, context, &blocks[4], 0, 8, cbp_blk); + if (cbp & 4) + readCompCoeff4x4SMB_CABAC(currMB, context, &blocks[8], 8, 0, cbp_blk); + if (cbp & 8) + readCompCoeff4x4SMB_CABAC(currMB, context, &blocks[12], 8, 8, cbp_blk); + } + } + else + { + if (currMB->is_lossless == FALSE) + { + if (cbp & 1) // are there any coeff in current block at all + { + readCompCoeff4x4SMB_I16MB_CABAC(currMB, context, &blocks[0], 0, 0, cbp_blk); + inv_level_coefficients_AC(&blocks[0], InvLevelScale4x4, qp_per); + } + if (cbp & 2) // are there any coeff in current block at all + { + readCompCoeff4x4SMB_I16MB_CABAC(currMB, context, &blocks[4], 0, 8, cbp_blk); + inv_level_coefficients_AC(&blocks[4], InvLevelScale4x4, qp_per); + } + if (cbp & 4) // are there any coeff in current block at all + { + readCompCoeff4x4SMB_I16MB_CABAC(currMB, context, &blocks[8], 8, 0, cbp_blk); + inv_level_coefficients_AC(&blocks[8], InvLevelScale4x4, qp_per); + } + if (cbp & 8) // are there any coeff in current block at all + { + readCompCoeff4x4SMB_I16MB_CABAC(currMB, context, &blocks[12], 8, 8, cbp_blk); + inv_level_coefficients_AC(&blocks[12], InvLevelScale4x4, qp_per); + } + } + else + { + if (cbp & 1) + readCompCoeff4x4SMB_I16MB_CABAC(currMB, context, &blocks[0], 0, 0, cbp_blk); + if (cbp & 2) + readCompCoeff4x4SMB_I16MB_CABAC(currMB, context, &blocks[4], 0, 8, cbp_blk); + if (cbp & 4) + readCompCoeff4x4SMB_I16MB_CABAC(currMB, context, &blocks[8], 8, 0, cbp_blk); + if (cbp & 8) + readCompCoeff4x4SMB_I16MB_CABAC(currMB, context, &blocks[12], 8, 8, cbp_blk); + } + } +} + +/*! +************************************************************************ +* \brief +* Get coefficients (run/level) of one 8x8 block +* from the NAL (CABAC Mode) +************************************************************************ +*/ +static void readCompCoeff8x8_CABAC_Lossless(Macroblock *currMB, ColorPlane pl, int b8) +{ + if (currMB->cbp & (1<<b8)) // are there any coefficients in the current block + { + VideoParameters *p_Vid = currMB->p_Vid; + int transform_pl = IS_INDEPENDENT(p_Vid) ? p_Vid->colour_plane_id : pl; + int scan; + short *tcoeffs; + int k; + RunLevel rl; + int context; + DataPartition *dP; + Slice *currSlice = currMB->p_Slice; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + + int cbp_mask = (int64) 51 << (4 * b8 - 2 * (b8 & 0x01)); // corresponds to 110011, as if all four 4x4 blocks contain coeff, shifted to block position + int64 *cur_cbp = &currMB->cbp_blk[pl]; + + // select scan type + const byte *pos_scan8x8 = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN8x8_1D : FIELD_SCAN8x8_1D; + + int qp_per = p_Vid->qp_per_matrix[ currMB->qp_scaled[pl] ]; + int qp_rem = p_Vid->qp_rem_matrix[ currMB->qp_scaled[pl] ]; + + const int *InvLevelScale8x8 = IS_INTRA(currMB)? currSlice->InvLevelScale8x8_Intra[transform_pl][qp_rem] : currSlice->InvLevelScale8x8_Inter[transform_pl][qp_rem]; + + currMB->is_intra_block = IS_INTRA(currMB); + + // === set offset in current macroblock === + tcoeffs = (short *)(currSlice->mb_rres8[pl][b8]); + + currMB->subblock_x = (b8&0x01) << 3; // position for coeff_count ctx + currMB->subblock_y = (b8 >> 1) << 3; // position for coeff_count ctx + + if (pl==PLANE_Y || IS_INDEPENDENT(p_Vid)) + context = LUMA_8x8; + else if (pl==PLANE_U) + context = CB_8x8; + else + context = CR_8x8; + + for(k=0; (k < 65);++k) + { + //============ read ============= + /* + * make distinction between INTRA and INTER coded + * luminance coefficients + */ + + int type = ((currMB->is_intra_block == 1) + ? (k==0 ? SE_LUM_DC_INTRA : SE_LUM_AC_INTRA) + : (k==0 ? SE_LUM_DC_INTER : SE_LUM_AC_INTER)); + + dP = &(currSlice->partArr[partMap[type]]); + rl = readRunLevel_CABAC(currMB, &(dP->de_cabac), context); + + //============ decode ============= + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan8x8 += rl.run; + + scan = *pos_scan8x8++; + + *cur_cbp |= cbp_mask; + + tcoeffs[scan] = rl.level; + } + else + break; + } + } +} + + +static void readCompCoeff8x8_CABAC_Intra(Macroblock *currMB, ColorPlane pl, int b8) +{ + if (currMB->cbp & (1<<b8)) // are there any coefficients in the current block + { + VideoParameters *p_Vid = currMB->p_Vid; + int transform_pl = IS_INDEPENDENT(p_Vid) ? p_Vid->colour_plane_id : pl; + int scan; + short *tcoeffs; + RunLevel rl; + int k; + int context; + DecodingEnvironment *cabac; + Slice *currSlice = currMB->p_Slice; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + + int cbp_mask = (int64) 51 << (4 * b8 - 2 * (b8 & 0x01)); // corresponds to 110011, as if all four 4x4 blocks contain coeff, shifted to block position + int64 *cur_cbp = &currMB->cbp_blk[pl]; + + // select scan type + const byte *pos_scan8x8 = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN8x8_1D : FIELD_SCAN8x8_1D; + + int qp_per = p_Vid->qp_per_matrix[ currMB->qp_scaled[pl] ]; + int qp_rem = p_Vid->qp_rem_matrix[ currMB->qp_scaled[pl] ]; + + const int *InvLevelScale8x8 = currSlice->InvLevelScale8x8_Intra[transform_pl][qp_rem]; + + currMB->is_intra_block = 1; + + // === set offset in current macroblock === + tcoeffs = (short *)(currSlice->mb_rres8[pl][b8]); + + currMB->subblock_x = (b8&0x01) << 3; // position for coeff_count ctx + currMB->subblock_y = (b8 >> 1) << 3; // position for coeff_count ctx + + if (pl==PLANE_Y || IS_INDEPENDENT(p_Vid)) + context = LUMA_8x8; + else if (pl==PLANE_U) + context = CB_8x8; + else + context = CR_8x8; + + // Read DC + cabac = &(currSlice->partArr[partMap[SE_LUM_DC_INTRA]].de_cabac); + rl = readRunLevel_CABAC(currMB, cabac, context); + + //============ decode ============= + if (rl.level != 0) /* leave if level == 0 */ + { + *cur_cbp |= cbp_mask; + + pos_scan8x8 += rl.run; + + scan = *pos_scan8x8++; + + tcoeffs[scan] = rshift_rnd_sf((rl.level * InvLevelScale8x8[scan]) << qp_per, 6); // dequantization + + // AC coefficients + cabac = &(currSlice->partArr[partMap[SE_LUM_AC_INTRA]].de_cabac); + + k = 64; + do + { + rl = readRunLevel_CABAC(currMB, cabac, context); + + //============ decode ============= + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan8x8 += rl.run; + + scan = *pos_scan8x8++; + + tcoeffs[scan] = rshift_rnd_sf((rl.level * InvLevelScale8x8[scan]) << qp_per, 6); // dequantization + } + else + break; + } while (--k); + } + } + +} + + + +static void readCompCoeff8x8_CABAC_Inter(Macroblock *currMB, ColorPlane pl, int b8) +{ + if (currMB->cbp & (1<<b8)) // are there any coefficients in the current block + { + VideoParameters *p_Vid = currMB->p_Vid; + int transform_pl = IS_INDEPENDENT(p_Vid) ? p_Vid->colour_plane_id : pl; + int scan; + short *tcoeffs; + int k; + RunLevel rl; + int context; + DecodingEnvironment *cabac; + Slice *currSlice = currMB->p_Slice; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + + int cbp_mask = (int64) 51 << (4 * b8 - 2 * (b8 & 0x01)); // corresponds to 110011, as if all four 4x4 blocks contain coeff, shifted to block position + int64 *cur_cbp = &currMB->cbp_blk[pl]; + + // select scan type + const byte *pos_scan8x8 = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN8x8_1D : FIELD_SCAN8x8_1D; + + int qp_per = p_Vid->qp_per_matrix[ currMB->qp_scaled[pl] ]; + int qp_rem = p_Vid->qp_rem_matrix[ currMB->qp_scaled[pl] ]; + + const int *InvLevelScale8x8 = currSlice->InvLevelScale8x8_Inter[transform_pl][qp_rem]; + + currMB->is_intra_block = 0; + + // === set offset in current macroblock === + tcoeffs = (short *)(currSlice->mb_rres8[pl][b8]); + + currMB->subblock_x = (b8&0x01) << 3; // position for coeff_count ctx + currMB->subblock_y = (b8 >> 1) << 3; // position for coeff_count ctx + + if (pl==PLANE_Y || IS_INDEPENDENT(p_Vid)) + context = LUMA_8x8; + else if (pl==PLANE_U) + context = CB_8x8; + else + context = CR_8x8; + + // Read DC + cabac = &(currSlice->partArr[partMap[SE_LUM_DC_INTER]].de_cabac); + rl = readRunLevel_CABAC(currMB, cabac, context); + + //============ decode ============= + if (rl.level != 0) /* leave if level == 0 */ + { + *cur_cbp |= cbp_mask; + + pos_scan8x8 += rl.run; + + scan = *pos_scan8x8++; + + tcoeffs[scan] = rshift_rnd_sf((rl.level * InvLevelScale8x8[scan]) << qp_per, 6); // dequantization + + // AC coefficients + cabac = &(currSlice->partArr[partMap[SE_LUM_AC_INTER]].de_cabac); + + k=64; + do + { + rl = readRunLevel_CABAC(currMB, cabac, context); + + //============ decode ============= + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan8x8 += rl.run; + + scan = *pos_scan8x8++; + + tcoeffs[scan] = rshift_rnd_sf((rl.level * InvLevelScale8x8[scan]) << qp_per, 6); // dequantization + } + else + break; + } while (--k); + } + } + +} + + +/*! +************************************************************************ +* \brief +* Get coefficients (run/level) of 8x8 blocks in a MB +* from the NAL (CABAC Mode) +************************************************************************ +*/ +static void readCompCoeff8x8MB_CABAC(Macroblock *currMB, ColorPlane pl) +{ + //======= 8x8 transform size & CABAC ======== + if(currMB->is_lossless == FALSE) + { + if (IS_INTRA(currMB)) + { + readCompCoeff8x8_CABAC_Intra(currMB, pl, 0); + readCompCoeff8x8_CABAC_Intra(currMB, pl, 1); + readCompCoeff8x8_CABAC_Intra(currMB, pl, 2); + readCompCoeff8x8_CABAC_Intra(currMB, pl, 3); + } + else + { + readCompCoeff8x8_CABAC_Inter(currMB, pl, 0); + readCompCoeff8x8_CABAC_Inter(currMB, pl, 1); + readCompCoeff8x8_CABAC_Inter(currMB, pl, 2); + readCompCoeff8x8_CABAC_Inter(currMB, pl, 3); + } + } + else + { + readCompCoeff8x8_CABAC_Lossless(currMB, pl, 0); + readCompCoeff8x8_CABAC_Lossless(currMB, pl, 1); + readCompCoeff8x8_CABAC_Lossless(currMB, pl, 2); + readCompCoeff8x8_CABAC_Lossless(currMB, pl, 3); + } +} + +/*! +************************************************************************ +* \brief +* Get coefficients (run/level) of 4x4 blocks in a MB +* from the NAL (CABAC Mode) +************************************************************************ +*/ +static void readCompCoeff4x4MB_CAVLC (Macroblock *currMB, ColorPlane pl, int (*InvLevelScale4x4)[4], int qp_per, int cbp, h264_4x4_byte nzcoeff) +{ + int block_y, block_x, b8; + int i, j, k; + int i0, j0; + __declspec(align(32)) int levarr[16], runarr[16]; + int numcoeff; + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + const byte (*pos_scan4x4)[2] = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN : FIELD_SCAN; + const byte *pos_scan_4x4 = pos_scan4x4[0]; + int start_scan = IS_I16MB(currMB) ? 1 : 0; + int64 *cur_cbp = &currMB->cbp_blk[pl]; + int coef_ctr, cur_context; + + memzero64(levarr); + memzero64(runarr); + + if (IS_I16MB(currMB)) + { + if (pl == PLANE_Y) + cur_context = LUMA_INTRA16x16AC; + else if (pl == PLANE_U) + cur_context = CB_INTRA16x16AC; + else + cur_context = CR_INTRA16x16AC; + } + else + { + if (pl == PLANE_Y) + cur_context = LUMA; + else if (pl == PLANE_U) + cur_context = CB; + else + cur_context = CR; + } + + if (currMB->is_lossless == FALSE) + { + for (block_y = 0; block_y < 4; block_y += 2) /* all modes */ + { + for (block_x = 0; block_x < 4; block_x += 2) + { + b8 = (block_y + (block_x >> 1)); + + if (cbp & (1 << b8)) // test if the block contains any coefficients + { + for (j=block_y << 2; j < (block_y + 2) << 2; j += BLOCK_SIZE) + { + for (i=block_x << 2; i < (block_x + 2) << 2; i += BLOCK_SIZE) + { + readCoeff4x4_CAVLC(currMB, cur_context, i >> 2, j >> 2, levarr, runarr, &numcoeff); + pos_scan_4x4 = pos_scan4x4[start_scan]; + + for (k = 0; k < numcoeff; ++k) + { + if (levarr[k] != 0) + { + pos_scan_4x4 += (runarr[k] << 1); + + i0 = *pos_scan_4x4++; + j0 = *pos_scan_4x4++; + + // inverse quant for 4x4 transform only + *cur_cbp |= (int64) 1 << (j + (i >> 2)); + + currSlice->cof4[pl][cof4_pos_to_subblock[j>>2][i>>2]][j0][i0]= rshift_rnd_sf((levarr[k] * InvLevelScale4x4[j0][i0])<<qp_per, 4); + } + } + } + } + } + else + { + for (j=0; j < 2; j++) + { + for (i=0;i<2;i++) + { + nzcoeff[block_y+j][block_x+i]=0; + } + } + } + } + } + } + else + { + for (block_y=0; block_y < 4; block_y += 2) /* all modes */ + { + for (block_x=0; block_x < 4; block_x += 2) + { + b8 = 2*(block_y>>1) + (block_x>>1); + + if (cbp & (1<<b8)) /* are there any coeff in current block at all */ + { + for (j=block_y; j < block_y+2; ++j) + { + for (i=block_x; i < block_x+2; ++i) + { + readCoeff4x4_CAVLC(currMB, cur_context, i, j, levarr, runarr, &numcoeff); + + coef_ctr = start_scan - 1; + + for (k = 0; k < numcoeff; ++k) + { + if (levarr[k] != 0) + { + coef_ctr += runarr[k]+1; + + i0=pos_scan4x4[coef_ctr][0]; + j0=pos_scan4x4[coef_ctr][1]; + + *cur_cbp |= (int64) 1 << ((j<<2) + i); + currSlice->cof4[pl][cof4_pos_to_subblock[j>>2][i>>2]][j0][i0]= levarr[k]; + } + } + } + } + } + else + { + for (j=0; j < 2; j++) + { + for (i=0;i<2;i++) + { + nzcoeff[block_y+j][block_x+i]=0; + } + } + } + } + } + } +} + + +/*! +************************************************************************ +* \brief +* Get coefficients (run/level) of 4x4 blocks in a MB +* from the NAL (CABAC Mode) +************************************************************************ +*/ +static void readCompCoeff8x8MB_CAVLC (Macroblock *currMB, ColorPlane pl, const int *InvLevelScale8x8, int qp_per, int cbp, h264_4x4_byte nzcoeff) +{ + int block_y, block_x, b4, b8; + int i,j,k; + int scan; + __declspec(align(32)) int levarr[16] = {0}, runarr[16] = {0}; + int numcoeff; + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + const byte *pos_scan8x8 = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN8x8_1D : FIELD_SCAN8x8_1D; + int start_scan = IS_I16MB(currMB) ? 1 : 0; + int64 *cur_cbp = &currMB->cbp_blk[pl]; + int coef_ctr, cur_context; + short *coefficients; + + if (IS_I16MB(currMB)) + { + if (pl == PLANE_Y) + cur_context = LUMA_INTRA16x16AC; + else if (pl == PLANE_U) + cur_context = CB_INTRA16x16AC; + else + cur_context = CR_INTRA16x16AC; + } + else + { + if (pl == PLANE_Y) + cur_context = LUMA; + else if (pl == PLANE_U) + cur_context = CB; + else + cur_context = CR; + } + + if (currMB->is_lossless == FALSE) + { + for (block_y=0; block_y < 4; block_y += 2) /* all modes */ + { + for (block_x=0; block_x < 4; block_x += 2) + { + b8 = block_y + (block_x>>1); + coefficients =(short *)(currSlice->mb_rres8[pl][b8]); + if (cbp & (1<<b8)) /* are there any coeff in current block at all */ + { + for (j=block_y; j < block_y+2; ++j) + { + for (i=block_x; i < block_x+2; ++i) + { + readCoeff4x4_CAVLC(currMB, cur_context, i, j, levarr, runarr, &numcoeff); + + coef_ctr = start_scan - 1; + + for (k = 0; k < numcoeff; ++k) + { + if (levarr[k] != 0) + { + coef_ctr += runarr[k]+1; + + // do same as CABAC for deblocking: any coeff in the 8x8 marks all the 4x4s + //as containing coefficients + *cur_cbp |= 51 << ((block_y<<2) + block_x); + + b4 = (coef_ctr << 2) + 2*(j - block_y)+(i - block_x); + + scan = pos_scan8x8[b4]; + + coefficients[scan] = rshift_rnd_sf((levarr[k] * InvLevelScale8x8[scan])<<qp_per, 6); // dequantization + } + }//else (!currMB->luma_transform_size_8x8_flag) + } + } + } + else + { + for (j=block_y; j < block_y+2; ++j) + { + memset(&nzcoeff[j][block_x], 0, 2 * sizeof(byte)); + } + } + } + } + } + else // inverse quant for 8x8 transform + { + for (block_y=0; block_y < 4; block_y += 2) /* all modes */ + { + for (block_x=0; block_x < 4; block_x += 2) + { + b8 = 2*(block_y>>1) + (block_x>>1); + coefficients =(short *)(currSlice->mb_rres8[pl][b8]); + if (cbp & (1<<b8)) /* are there any coeff in current block at all */ + { + for (j=block_y; j < block_y+2; ++j) + { + for (i=block_x; i < block_x+2; ++i) + { + + readCoeff4x4_CAVLC(currMB, cur_context, i, j, levarr, runarr, &numcoeff); + + coef_ctr = start_scan - 1; + + for (k = 0; k < numcoeff; ++k) + { + if (levarr[k] != 0) + { + coef_ctr += runarr[k]+1; + + // do same as CABAC for deblocking: any coeff in the 8x8 marks all the 4x4s + //as containing coefficients + *cur_cbp |= 51 << ((block_y<<2) + block_x); + + b4 = 2*(j-block_y)+(i-block_x); + + scan=pos_scan8x8[coef_ctr*4+b4]; + + coefficients[scan] = levarr[k]; + } + } + } + } + } + else + { + for (j=block_y; j < block_y+2; ++j) + { + memset(&nzcoeff[j][block_x], 0, 2 * sizeof(byte)); + } + } + } + } + } +} + +/*! +************************************************************************ +* \brief +* Data partitioning: Check if neighboring macroblock is needed for +* CAVLC context decoding, and disable current MB if data partition +* is missing. +************************************************************************ +*/ +static void check_dp_neighbors (Macroblock *currMB) +{ + VideoParameters *p_Vid = currMB->p_Vid; + + if (IS_INTER (currMB) || (IS_INTRA (currMB) && !(p_Vid->active_pps->constrained_intra_pred_flag)) ) + { + PixelPos up, left; + + p_Vid->getNeighbourLeft(currMB, p_Vid->mb_size[1], &left); + p_Vid->getNeighbourUp(currMB, p_Vid->mb_size[1], &up); + + if (left.available) + { + currMB->dpl_flag |= p_Vid->mb_data[left.mb_addr].dpl_flag; + } + if (up.available) + { + currMB->dpl_flag |= p_Vid->mb_data[up.mb_addr].dpl_flag; + } + } +} + + +/*! +************************************************************************ +* \brief +* Get coded block pattern and coefficients (run/level) +* from the NAL +************************************************************************ +*/ +static void read_CBP_and_coeffs_from_NAL_CABAC(Macroblock *currMB) +{ + int i,j,k; + int cbp; + SyntaxElement currSE; + DataPartition *dP = NULL; + Slice *currSlice = currMB->p_Slice; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + int coef_ctr, i0, j0, b8; + int ll; + RunLevel rl; + + int qp_per, qp_rem; + VideoParameters *p_Vid = currMB->p_Vid; + int intra = IS_INTRA (currMB); + int smb = ((p_Vid->type==SP_SLICE) && !intra) || (p_Vid->type == SI_SLICE && currMB->mb_type == SI4MB); + + int uv; + int qp_per_uv[2]; + int qp_rem_uv[2]; + + + int temp[4]; + + int b4; + StorablePicture *dec_picture = p_Vid->dec_picture; + int yuv = dec_picture->chroma_format_idc - 1; + int m6[4]; + + int need_transform_size_flag; + + int (*InvLevelScale4x4)[4] = NULL; + + // select scan type + const byte (*pos_scan4x4)[2] = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN : FIELD_SCAN; + const byte *pos_scan4x4_1d = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN_1D : FIELD_SCAN_1D; + const byte *pos_scan4x4_dc = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN_DC : FIELD_SCAN_DC; + const byte *pos_scan_4x4; + + // QPI + //init constants for every chroma qp offset + if (dec_picture->chroma_format_idc != YUV400) + { + for (i=0; i<2; ++i) + { + qp_per_uv[i] = p_Vid->qp_per_matrix[ currMB->qp_scaled[i + 1] ]; + qp_rem_uv[i] = p_Vid->qp_rem_matrix[ currMB->qp_scaled[i + 1] ]; + } + } + + // read CBP if not new intra mode + if (!IS_I16MB (currMB)) + { + //===== C B P ===== + //--------------------- + int type = (currMB->mb_type == I4MB || currMB->mb_type == SI4MB || currMB->mb_type == I8MB) + ? SE_CBP_INTRA + : SE_CBP_INTER; + + dP = &(currSlice->partArr[partMap[type]]); + + currMB->cbp = cbp = readCBP_CABAC(currMB, &(dP->de_cabac)); + + TRACE_STRING("coded_block_pattern"); + + + //============= Transform size flag for INTER MBs ============= + //------------------------------------------------------------- + need_transform_size_flag = (((currMB->mb_type >= 1 && currMB->mb_type <= 3)|| + (IS_DIRECT(currMB) && p_Vid->active_sps->direct_8x8_inference_flag) || + (currMB->NoMbPartLessThan8x8Flag)) + && currMB->mb_type != I8MB && currMB->mb_type != I4MB + && (currMB->cbp&15) + && p_Vid->Transform8x8Mode); + + if (need_transform_size_flag) + { + dP = &(currSlice->partArr[partMap[SE_HEADER]]); + TRACE_STRING("transform_size_8x8_flag"); + + // read CAVLC transform_size_8x8_flag + currMB->luma_transform_size_8x8_flag = readMB_transform_size_flag_CABAC(currMB, &(dP->de_cabac)); + } + + //===== DQUANT ===== + //---------------------- + // Delta quant only if nonzero coeffs + if (cbp !=0) + { + read_delta_quant_CABAC(&currSE, dP, currMB, partMap, (!intra) ? SE_DELTA_QUANT_INTER : SE_DELTA_QUANT_INTRA); + + if (currSlice->dp_mode) + { + if (!intra && currSlice->dpC_NotPresent ) + currMB->dpl_flag = 1; + + if( intra && currSlice->dpB_NotPresent ) + { + currMB->ei_flag = 1; + currMB->dpl_flag = 1; + } + + // check for prediction from neighbours + check_dp_neighbors (currMB); + if (currMB->dpl_flag) + { + cbp = 0; + currMB->cbp = cbp; + } + } + } + } + else + { + cbp = currMB->cbp; + } + + if (IS_I16MB (currMB)) // read DC coeffs for new intra modes + { + read_delta_quant_CABAC(&currSE, dP, currMB, partMap, SE_DELTA_QUANT_INTRA); + + macroblock_set_dc_pred(p_Vid, currMB->block_x, currMB->block_y); + + if (currSlice->dp_mode) + { + if (currSlice->dpB_NotPresent) + { + currMB->ei_flag = 1; + currMB->dpl_flag = 1; + } + check_dp_neighbors (currMB); + if (currMB->dpl_flag) + { + currMB->cbp = cbp = 0; + } + } + + if (!currMB->dpl_flag) + { + pos_scan_4x4 = pos_scan4x4_dc; + + { + dP = &(currSlice->partArr[partMap[SE_LUM_DC_INTRA]]); + + currMB->is_intra_block = 1; + + for(k = 0; k < 17 ; k++) + { + rl = readRunLevel_CABAC(currMB, &(dP->de_cabac), LUMA_16DC); + + if (rl.level != 0) /* leave if level == 0 */ + { + pos_scan_4x4 += rl.run; + currSlice->cof4[0][*pos_scan_4x4++][0][0] = rl.level;// add new intra DC coeff + } + else + break; + } + + } + + if(currMB->is_lossless == FALSE) + itrans_2(currMB, (ColorPlane) p_Vid->colour_plane_id);// transform new intra DC + } + } + + update_qp(currMB, p_Vid->qp); + + qp_per = p_Vid->qp_per_matrix[ currMB->qp_scaled[p_Vid->colour_plane_id] ]; + qp_rem = p_Vid->qp_rem_matrix[ currMB->qp_scaled[p_Vid->colour_plane_id] ]; + + //init quant parameters for chroma + if (dec_picture->chroma_format_idc != YUV400) + { + for(i=0; i < 2; ++i) + { + qp_per_uv[i] = p_Vid->qp_per_matrix[ currMB->qp_scaled[i + 1] ]; + qp_rem_uv[i] = p_Vid->qp_rem_matrix[ currMB->qp_scaled[i + 1] ]; + } + } + + InvLevelScale4x4 = intra? currSlice->InvLevelScale4x4_Intra[p_Vid->colour_plane_id][qp_rem] : currSlice->InvLevelScale4x4_Inter[p_Vid->colour_plane_id][qp_rem]; + + // luma coefficients + { + //======= Other Modes & CABAC ======== + //------------------------------------ + if (cbp) + { + if(currMB->luma_transform_size_8x8_flag) + { + //======= 8x8 transform size & CABAC ======== + readCompCoeff8x8MB_CABAC (currMB, PLANE_Y); + } + else + { + readCompCoeff4x4MB_CABAC (currMB, PLANE_Y, intra, InvLevelScale4x4, qp_per, cbp); + } + } + } + + if ( p_Vid->active_sps->chroma_format_idc==YUV444 && !IS_INDEPENDENT(p_Vid) ) + { + for (uv = 0; uv < 2; ++uv ) + { + /*----------------------16x16DC Luma_Add----------------------*/ + if (IS_I16MB (currMB)) // read DC coeffs for new intra modes + { + macroblock_set_dc_pred(p_Vid, currMB->block_x, currMB->block_y); + + { + int context; + dP = &(currSlice->partArr[partMap[SE_LUM_DC_INTRA]]); + + if( IS_INDEPENDENT(p_Vid) ) + context = LUMA_16DC; + else + context = (uv==0) ? CB_16DC : CR_16DC; + + currMB->is_intra_block = 1; + + coef_ctr = -1; + + for(k=0;k<17;++k) + { + rl = readRunLevel_CABAC(currMB, &dP->de_cabac, context); + + if (rl.level != 0) // leave if level == 0 + { + coef_ctr += rl.run + 1; + currSlice->cof4[uv + 1][pos_scan4x4_1d[coef_ctr]][0][0] = rl.level; + } + else + break; + } //k loop + } // else CAVLC + + if(currMB->is_lossless == FALSE) + { + itrans_2(currMB, (ColorPlane) (uv + 1)); // transform new intra DC + } + } //IS_I16MB + + update_qp(currMB, p_Vid->qp); + + qp_per = p_Vid->qp_per_matrix[ (p_Vid->qp + p_Vid->bitdepth_luma_qp_scale) ]; + qp_rem = p_Vid->qp_rem_matrix[ (p_Vid->qp + p_Vid->bitdepth_luma_qp_scale) ]; + + //init constants for every chroma qp offset + qp_per_uv[uv] = p_Vid->qp_per_matrix[ (currMB->qpc[uv] + p_Vid->bitdepth_chroma_qp_scale) ]; + qp_rem_uv[uv] = p_Vid->qp_rem_matrix[ (currMB->qpc[uv] + p_Vid->bitdepth_chroma_qp_scale) ]; + + InvLevelScale4x4 = intra? currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv[uv]] : currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv[uv]]; + + { + if (cbp) + { + if(currMB->luma_transform_size_8x8_flag) + { + //======= 8x8 transform size & CABAC ======== + readCompCoeff8x8MB_CABAC(currMB, (ColorPlane) (PLANE_U + uv)); + } + else //4x4 + { + readCompCoeff4x4MB_CABAC(currMB, (ColorPlane) (PLANE_U + uv), intra, InvLevelScale4x4, qp_per_uv[uv], cbp); + } + } + } + } + } //444 + else if ((dec_picture->chroma_format_idc != YUV400) && (dec_picture->chroma_format_idc != YUV444)) + { + //========================== CHROMA DC ============================ + //----------------------------------------------------------------- + // chroma DC coeff + if(cbp>15) + { + if (dec_picture->chroma_format_idc == YUV420) + { + for (ll=0;ll<3;ll+=2) + { + uv = ll>>1; + + InvLevelScale4x4 = intra ? currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv[uv]] : currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv[uv]]; + //===================== CHROMA DC YUV420 ====================== + memzero16(&currSlice->cofu[0]); + coef_ctr=-1; + + { + int type = (intra ? SE_CHR_DC_INTRA : SE_CHR_DC_INTER); + + currMB->is_intra_block = intra; + currMB->is_v_block = ll; + + dP = &(currSlice->partArr[partMap[type]]); + + for(k = 0; k < (p_Vid->num_cdc_coeff + 1);++k) + { + rl = readRunLevel_CABAC(currMB, &(dP->de_cabac), CHROMA_DC); + + if (rl.level != 0) + { + currMB->cbp_blk[0] |= 0xf0000 << (ll<<1) ; + coef_ctr += rl.run + 1; + + // Bug: currSlice->cofu has only 4 entries, hence coef_ctr MUST be <4 (which is + // caught by the assert(). If it is bigger than 4, it starts patching the + // p_Vid->predmode pointer, which leads to bugs later on. + // + // This assert() should be left in the code, because it captures a very likely + // bug early when testing in error prone environments (or when testing NAL + // functionality). + assert (coef_ctr < p_Vid->num_cdc_coeff); + currSlice->cofu[coef_ctr&3]=rl.level; + } + else + break; + } + } + + if (smb || (currMB->is_lossless == TRUE)) // check to see if MB type is SPred or SIntra4x4 + { + currSlice->cof4[uv + 1][0][0][0] = currSlice->cofu[0]; + currSlice->cof4[uv + 1][1][0][0] = currSlice->cofu[1]; + currSlice->cof4[uv + 1][2][0][0] = currSlice->cofu[2]; + currSlice->cof4[uv + 1][3][0][0] = currSlice->cofu[3]; + } + else + { + ihadamard2x2(currSlice->cofu, temp); + + currSlice->cof4[uv + 1][0][0][0] = (((temp[0] * InvLevelScale4x4[0][0])<<qp_per_uv[uv])>>5); + currSlice->cof4[uv + 1][1][0][0] = (((temp[1] * InvLevelScale4x4[0][0])<<qp_per_uv[uv])>>5); + currSlice->cof4[uv + 1][2][0][0] = (((temp[2] * InvLevelScale4x4[0][0])<<qp_per_uv[uv])>>5); + currSlice->cof4[uv + 1][3][0][0] = (((temp[3] * InvLevelScale4x4[0][0])<<qp_per_uv[uv])>>5); + } + } + } + else if (dec_picture->chroma_format_idc == YUV422) + { + for (ll=0;ll<3;ll+=2) + { + int (*InvLevelScale4x4)[4] = NULL; + uv = ll>>1; + { + h264_short_block_t *imgcof = currSlice->cof4[uv + 1]; + int m3[2][4] = {{0,0,0,0},{0,0,0,0}}; + int m4[2][4] = {{0,0,0,0},{0,0,0,0}}; + int qp_per_uv_dc = p_Vid->qp_per_matrix[ (currMB->qpc[uv] + 3 + p_Vid->bitdepth_chroma_qp_scale) ]; //for YUV422 only + int qp_rem_uv_dc = p_Vid->qp_rem_matrix[ (currMB->qpc[uv] + 3 + p_Vid->bitdepth_chroma_qp_scale) ]; //for YUV422 only + if (intra) + InvLevelScale4x4 = currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv_dc]; + else + InvLevelScale4x4 = currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv_dc]; + + + //===================== CHROMA DC YUV422 ====================== + { + coef_ctr=-1; + for(k=0;k<9;++k) + { + int type = (intra ? SE_CHR_DC_INTRA : SE_CHR_DC_INTER); + currMB->is_intra_block = intra; + currMB->is_v_block = ll; + + dP = &(currSlice->partArr[partMap[type]]); + + rl = readRunLevel_CABAC(currMB, &dP->de_cabac, CHROMA_DC_2x4); + + if (rl.level != 0) + { + currMB->cbp_blk[0] |= ((int64)0xff0000) << (ll<<2) ; + coef_ctr += rl.run + 1; + assert (coef_ctr < p_Vid->num_cdc_coeff); + i0=SCAN_YUV422[coef_ctr][0]; + j0=SCAN_YUV422[coef_ctr][1]; + + m3[i0][j0]=rl.level; + } + else + break; + } + } + // inverse CHROMA DC YUV422 transform + // horizontal + if(currMB->is_lossless == FALSE) + { + m4[0][0] = m3[0][0] + m3[1][0]; + m4[0][1] = m3[0][1] + m3[1][1]; + m4[0][2] = m3[0][2] + m3[1][2]; + m4[0][3] = m3[0][3] + m3[1][3]; + + m4[1][0] = m3[0][0] - m3[1][0]; + m4[1][1] = m3[0][1] - m3[1][1]; + m4[1][2] = m3[0][2] - m3[1][2]; + m4[1][3] = m3[0][3] - m3[1][3]; + + for (i = 0; i < 2; ++i) + { + m6[0] = m4[i][0] + m4[i][2]; + m6[1] = m4[i][0] - m4[i][2]; + m6[2] = m4[i][1] - m4[i][3]; + m6[3] = m4[i][1] + m4[i][3]; + + imgcof[cof4_pos_to_subblock[0][i]][0][0] = m6[0] + m6[3]; + imgcof[cof4_pos_to_subblock[1][i]][0][0] = m6[1] + m6[2]; + imgcof[cof4_pos_to_subblock[2][i]][0][0] = m6[1] - m6[2]; + imgcof[cof4_pos_to_subblock[3][i]][0][0]= m6[0] - m6[3]; + }//for (i=0;i<2;++i) + } + else + { + for(j=0;j<4;++j) + { + for(i=0;i<2;++i) + { + currSlice->cof4[uv + 1][cof4_pos_to_subblock[j][i]][0][0] = m3[i][j]; + } + } + } + + for(j = 0;j < p_Vid->mb_cr_size_y; j += BLOCK_SIZE) + { + for(i=0;i < p_Vid->mb_cr_size_x;i+=BLOCK_SIZE) + { + imgcof[cof4_pos_to_subblock[j>>2][i>>2]][0][0] = rshift_rnd_sf((imgcof[cof4_pos_to_subblock[j>>2][i>>2]][0][0] * InvLevelScale4x4[0][0]) << qp_per_uv_dc, 6); + } + } + } + }//for (ll=0;ll<3;ll+=2) + }//else if (dec_picture->chroma_format_idc == YUV422) + } + + //========================== CHROMA AC ============================ + //----------------------------------------------------------------- + // chroma AC coeff, all zero fram start_scan + if (cbp<=31) + { + } + else + { + { + int type; + currMB->is_intra_block = intra; + type = (intra ? SE_CHR_AC_INTRA : SE_CHR_AC_INTER); + + dP = &(currSlice->partArr[partMap[type]]); + + + if(currMB->is_lossless == FALSE) + { + for (b8=0; b8 < p_Vid->num_blk8x8_uv; ++b8) + { + currMB->is_v_block = uv = (b8 > ((p_Vid->num_uv_blocks) - 1 )); + InvLevelScale4x4 = intra ? currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv[uv]] : currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv[uv]]; + + for (b4 = 0; b4 < 4; ++b4) + { + int *scale = &InvLevelScale4x4[0][0]; + i = cofuv_blk_x[yuv][b8][b4]; + j = cofuv_blk_y[yuv][b8][b4]; + + currMB->subblock_y = subblk_offset_y[yuv][b8][b4]; + currMB->subblock_x = subblk_offset_x[yuv][b8][b4]; + + pos_scan_4x4 = &pos_scan4x4_1d[1]; + for(k = 0; k < 16;++k) + { + rl = readRunLevel_CABAC(currMB, &(dP->de_cabac), CHROMA_AC); + + if (rl.level != 0) + { + byte position; + currMB->cbp_blk[0] |= ((int64)1) << cbp_blk_chroma[b8][b4]; + pos_scan_4x4 += rl.run; + position = *pos_scan_4x4++; + + ((int16_t *)currSlice->cof4[uv + 1][cof4_pos_to_subblock[j][i]])[position] = rshift_rnd_sf((rl.level * scale[position])<<qp_per_uv[uv], 4); + } + else + break; + } //for(k=0;(k<16)&&(level!=0);++k) + } + } + } + else + { + for (b8=0; b8 < p_Vid->num_blk8x8_uv; ++b8) + { + currMB->is_v_block = uv = (b8 > ((p_Vid->num_uv_blocks) - 1 )); + + for (b4=0; b4 < 4; ++b4) + { + i = cofuv_blk_x[yuv][b8][b4]; + j = cofuv_blk_y[yuv][b8][b4]; + + pos_scan_4x4 = &pos_scan4x4_1d[1]; + + currMB->subblock_y = subblk_offset_y[yuv][b8][b4]; + currMB->subblock_x = subblk_offset_x[yuv][b8][b4]; + + for(k=0;k<16;++k) + { + rl = readRunLevel_CABAC(currMB, &dP->de_cabac, CHROMA_AC); + + if (rl.level != 0) + { + currMB->cbp_blk[0] |= ((int64)1) << cbp_blk_chroma[b8][b4]; + pos_scan_4x4 += rl.run; + + ((int16_t *)currSlice->cof4[uv + 1][cof4_pos_to_subblock[j][i]])[*pos_scan_4x4++] = rl.level; + } + else + break; + } + } + } + } //for (b4=0; b4 < 4; b4++) + } //for (b8=0; b8 < p_Vid->num_blk8x8_uv; b8++) + } //if (dec_picture->chroma_format_idc != YUV400) + } +} + +/*! +************************************************************************ +* \brief +* Get coded block pattern and coefficients (run/level) +* from the NAL +************************************************************************ +*/ +static void read_CBP_and_coeffs_from_NAL_CAVLC(Macroblock *currMB) +{ + int i,j,k; + int level; + int mb_nr = currMB->mbAddrX; + int cbp; + SyntaxElement currSE; + DataPartition *dP = NULL; + Slice *currSlice = currMB->p_Slice; + const byte *partMap = assignSE2partition[currSlice->dp_mode]; + int coef_ctr, i0, j0, b8; + int ll; + __declspec(align(32)) int levarr[16], runarr[16]; + int numcoeff; + + int qp_per, qp_rem; + VideoParameters *p_Vid = currMB->p_Vid; + int smb = ((p_Vid->type==SP_SLICE) && IS_INTER (currMB)) || (p_Vid->type == SI_SLICE && currMB->mb_type == SI4MB); + + int uv; + int qp_per_uv[2]; + int qp_rem_uv[2]; + + int intra = IS_INTRA (currMB); + int temp[4]; + + int b4; + StorablePicture *dec_picture = p_Vid->dec_picture; + int yuv = dec_picture->chroma_format_idc - 1; + int m6[4]; + + int need_transform_size_flag; + + int (*InvLevelScale4x4)[4] = NULL; + const int *InvLevelScale8x8 = NULL; + // select scan type + const byte (*pos_scan4x4)[2] = ((p_Vid->structure == FRAME) && (!currMB->mb_field)) ? SNGL_SCAN : FIELD_SCAN; + const byte *pos_scan_4x4 = pos_scan4x4[0]; + + // QPI + //init constants for every chroma qp offset + if (dec_picture->chroma_format_idc != YUV400) + { + for (i=0; i<2; ++i) + { + qp_per_uv[i] = p_Vid->qp_per_matrix[ currMB->qp_scaled[i + 1] ]; + qp_rem_uv[i] = p_Vid->qp_rem_matrix[ currMB->qp_scaled[i + 1] ]; + } + } + + // read CBP if not new intra mode + if (!IS_I16MB (currMB)) + { + //===== C B P ===== + //--------------------- + int type = (currMB->mb_type == I4MB || currMB->mb_type == SI4MB || currMB->mb_type == I8MB) + ? SE_CBP_INTRA + : SE_CBP_INTER; + + dP = &(currSlice->partArr[partMap[type]]); + + currSE.mapping = (currMB->mb_type == I4MB || currMB->mb_type == SI4MB || currMB->mb_type == I8MB) + ? currSlice->linfo_cbp_intra + : currSlice->linfo_cbp_inter; + + TRACE_STRING("coded_block_pattern"); + readSyntaxElement_UVLC(&currSE, dP); + currMB->cbp = cbp = currSE.value1; + + + //============= Transform size flag for INTER MBs ============= + //------------------------------------------------------------- + need_transform_size_flag = (((currMB->mb_type >= 1 && currMB->mb_type <= 3)|| + (IS_DIRECT(currMB) && p_Vid->active_sps->direct_8x8_inference_flag) || + (currMB->NoMbPartLessThan8x8Flag)) + && currMB->mb_type != I8MB && currMB->mb_type != I4MB + && (currMB->cbp&15) + && p_Vid->Transform8x8Mode); + + if (need_transform_size_flag) + { + dP = &(currSlice->partArr[partMap[SE_HEADER]]); + TRACE_STRING("transform_size_8x8_flag"); + + // read CAVLC transform_size_8x8_flag + currMB->luma_transform_size_8x8_flag = (Boolean) readSyntaxElement_FLC(dP->bitstream, 1); + } + + //===== DQUANT ===== + //---------------------- + // Delta quant only if nonzero coeffs + if (cbp !=0) + { + read_delta_quant_CAVLC(&currSE, dP, currMB, partMap, (IS_INTER (currMB)) ? SE_DELTA_QUANT_INTER : SE_DELTA_QUANT_INTRA); + + if (currSlice->dp_mode) + { + if (IS_INTER (currMB) && currSlice->dpC_NotPresent ) + currMB->dpl_flag = 1; + + if( intra && currSlice->dpB_NotPresent ) + { + currMB->ei_flag = 1; + currMB->dpl_flag = 1; + } + + // check for prediction from neighbours + check_dp_neighbors (currMB); + if (currMB->dpl_flag) + { + cbp = 0; + currMB->cbp = cbp; + } + } + } + } + else + { + cbp = currMB->cbp; + } + + if (IS_I16MB (currMB)) // read DC coeffs for new intra modes + { + read_delta_quant_CAVLC(&currSE, dP, currMB, partMap, SE_DELTA_QUANT_INTRA); + + macroblock_set_dc_pred(p_Vid, currMB->block_x, currMB->block_y); + + if (currSlice->dp_mode) + { + if (currSlice->dpB_NotPresent) + { + currMB->ei_flag = 1; + currMB->dpl_flag = 1; + } + check_dp_neighbors (currMB); + if (currMB->dpl_flag) + { + currMB->cbp = cbp = 0; + } + } + + if (!currMB->dpl_flag) + { + pos_scan_4x4 = pos_scan4x4[0]; + + readCoeff4x4_CAVLC(currMB, LUMA_INTRA16x16DC, 0, 0, levarr, runarr, &numcoeff); + + for(k = 0; k < numcoeff; ++k) + { + if (levarr[k] != 0) // leave if level == 0 + { + pos_scan_4x4 += 2 * runarr[k]; + + i0 = (*pos_scan_4x4++); + j0 = (*pos_scan_4x4++); + + currSlice->cof4[0][cof4_pos_to_subblock[j0][i0]][0][0] = levarr[k];// add new intra DC coeff + } + } + + + if(currMB->is_lossless == FALSE) + itrans_2(currMB, (ColorPlane) p_Vid->colour_plane_id);// transform new intra DC + } + } + + update_qp(currMB, p_Vid->qp); + + qp_per = p_Vid->qp_per_matrix[ currMB->qp_scaled[p_Vid->colour_plane_id] ]; + qp_rem = p_Vid->qp_rem_matrix[ currMB->qp_scaled[p_Vid->colour_plane_id] ]; + + //init quant parameters for chroma + if (dec_picture->chroma_format_idc != YUV400) + { + for(i=0; i < 2; ++i) + { + qp_per_uv[i] = p_Vid->qp_per_matrix[ currMB->qp_scaled[i + 1] ]; + qp_rem_uv[i] = p_Vid->qp_rem_matrix[ currMB->qp_scaled[i + 1] ]; + } + } + + InvLevelScale4x4 = intra? currSlice->InvLevelScale4x4_Intra[p_Vid->colour_plane_id][qp_rem] : currSlice->InvLevelScale4x4_Inter[p_Vid->colour_plane_id][qp_rem]; + InvLevelScale8x8 = intra? currSlice->InvLevelScale8x8_Intra[p_Vid->colour_plane_id][qp_rem] : currSlice->InvLevelScale8x8_Inter[p_Vid->colour_plane_id][qp_rem]; + + // luma coefficients + if (cbp) + { + if (!currMB->luma_transform_size_8x8_flag) // 4x4 transform + { + readCompCoeff4x4MB_CAVLC(currMB, PLANE_Y, InvLevelScale4x4, qp_per, cbp, p_Vid->nz_coeff[mb_nr][PLANE_Y]); + } + else // 8x8 transform + { + readCompCoeff8x8MB_CAVLC(currMB, PLANE_Y, InvLevelScale8x8, qp_per, cbp, p_Vid->nz_coeff[mb_nr][PLANE_Y]); + } + } + else + { + memset(&p_Vid->nz_coeff[mb_nr][0][0][0], 0, BLOCK_SIZE * BLOCK_SIZE * sizeof(byte)); + } + + if ( p_Vid->active_sps->chroma_format_idc==YUV444 && !IS_INDEPENDENT(p_Vid) ) + { + for (uv = 0; uv < 2; ++uv ) + { + /*----------------------16x16DC Luma_Add----------------------*/ + if (IS_I16MB (currMB)) // read DC coeffs for new intra modes + { + macroblock_set_dc_pred(p_Vid, currMB->block_x, currMB->block_y); + + if (uv == 0) + readCoeff4x4_CAVLC(currMB, CB_INTRA16x16DC, 0, 0, levarr, runarr, &numcoeff); + else + readCoeff4x4_CAVLC(currMB, CR_INTRA16x16DC, 0, 0, levarr, runarr, &numcoeff); + + coef_ctr=-1; + level = 1; // just to get inside the loop + + for(k = 0; k < numcoeff; ++k) + { + if (levarr[k] != 0) // leave if level == 0 + { + coef_ctr += runarr[k] + 1; + + i0 = pos_scan4x4[coef_ctr][0]; + j0 = pos_scan4x4[coef_ctr][1]; + currSlice->cof4[uv + 1][cof4_pos_to_subblock[j0][i0]][0][0] = levarr[k];// add new intra DC coeff + } //if leavarr[k] + } //k loop + + if(currMB->is_lossless == FALSE) + { + itrans_2(currMB, (ColorPlane) (uv + 1)); // transform new intra DC + } + } //IS_I16MB + + update_qp(currMB, p_Vid->qp); + + qp_per = p_Vid->qp_per_matrix[ (p_Vid->qp + p_Vid->bitdepth_luma_qp_scale) ]; + qp_rem = p_Vid->qp_rem_matrix[ (p_Vid->qp + p_Vid->bitdepth_luma_qp_scale) ]; + + //init constants for every chroma qp offset + qp_per_uv[uv] = p_Vid->qp_per_matrix[ (currMB->qpc[uv] + p_Vid->bitdepth_chroma_qp_scale) ]; + qp_rem_uv[uv] = p_Vid->qp_rem_matrix[ (currMB->qpc[uv] + p_Vid->bitdepth_chroma_qp_scale) ]; + + InvLevelScale4x4 = intra? currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv[uv]] : currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv[uv]]; + InvLevelScale8x8 = intra? currSlice->InvLevelScale8x8_Intra[uv + 1][qp_rem_uv[uv]] : currSlice->InvLevelScale8x8_Inter[uv + 1][qp_rem_uv[uv]]; + + if (!currMB->luma_transform_size_8x8_flag) // 4x4 transform + { + readCompCoeff4x4MB_CAVLC(currMB, (ColorPlane) (PLANE_U + uv), InvLevelScale4x4, qp_per_uv[uv], cbp, p_Vid->nz_coeff[mb_nr][PLANE_U + uv]); + } + else // 8x8 transform + { + readCompCoeff8x8MB_CAVLC(currMB, (ColorPlane) (PLANE_U + uv), InvLevelScale8x8, qp_per_uv[uv], cbp, p_Vid->nz_coeff[mb_nr][PLANE_U + uv]); + } + } + } //444 + else if ((dec_picture->chroma_format_idc != YUV400) && (dec_picture->chroma_format_idc != YUV444)) + { + //========================== CHROMA DC ============================ + //----------------------------------------------------------------- + // chroma DC coeff + if(cbp>15) + { + if (dec_picture->chroma_format_idc == YUV420) + { + for (ll=0;ll<3;ll+=2) + { + uv = ll>>1; + + InvLevelScale4x4 = intra ? currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv[uv]] : currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv[uv]]; + //===================== CHROMA DC YUV420 ====================== + memset(&currSlice->cofu[0], 0, 4 *sizeof(int)); + coef_ctr=-1; + + readCoeff4x4_CAVLC(currMB, CHROMA_DC, 0, 0, levarr, runarr, &numcoeff); + + for(k = 0; k < numcoeff; ++k) + { + if (levarr[k] != 0) + { + currMB->cbp_blk[0] |= 0xf0000 << (ll<<1) ; + coef_ctr += runarr[k] + 1; + currSlice->cofu[coef_ctr]=levarr[k]; + } + } + + if (smb || (currMB->is_lossless == TRUE)) // check to see if MB type is SPred or SIntra4x4 + { + currSlice->cof4[uv + 1][0][0][0] = currSlice->cofu[0]; + currSlice->cof4[uv + 1][1][0][0] = currSlice->cofu[1]; + currSlice->cof4[uv + 1][2][0][0] = currSlice->cofu[2]; + currSlice->cof4[uv + 1][3][0][0] = currSlice->cofu[3]; + } + else + { + ihadamard2x2(currSlice->cofu, temp); + + currSlice->cof4[uv + 1][0][0][0] = (((temp[0] * InvLevelScale4x4[0][0])<<qp_per_uv[uv])>>5); + currSlice->cof4[uv + 1][1][0][0] = (((temp[1] * InvLevelScale4x4[0][0])<<qp_per_uv[uv])>>5); + currSlice->cof4[uv + 1][2][0][0] = (((temp[2] * InvLevelScale4x4[0][0])<<qp_per_uv[uv])>>5); + currSlice->cof4[uv + 1][3][0][0] = (((temp[3] * InvLevelScale4x4[0][0])<<qp_per_uv[uv])>>5); + } + } + } + else if (dec_picture->chroma_format_idc == YUV422) + { + for (ll=0;ll<3;ll+=2) + { + int (*InvLevelScale4x4)[4] = NULL; + uv = ll>>1; + { + h264_short_block_t *imgcof = currSlice->cof4[uv + 1]; + int m3[2][4] = {{0,0,0,0},{0,0,0,0}}; + int m4[2][4] = {{0,0,0,0},{0,0,0,0}}; + int qp_per_uv_dc = p_Vid->qp_per_matrix[ (currMB->qpc[uv] + 3 + p_Vid->bitdepth_chroma_qp_scale) ]; //for YUV422 only + int qp_rem_uv_dc = p_Vid->qp_rem_matrix[ (currMB->qpc[uv] + 3 + p_Vid->bitdepth_chroma_qp_scale) ]; //for YUV422 only + if (intra) + InvLevelScale4x4 = currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv_dc]; + else + InvLevelScale4x4 = currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv_dc]; + + + //===================== CHROMA DC YUV422 ====================== + readCoeff4x4_CAVLC(currMB, CHROMA_DC, 0, 0, levarr, runarr, &numcoeff); + coef_ctr=-1; + level=1; + for(k = 0; k < numcoeff; ++k) + { + if (levarr[k] != 0) + { + currMB->cbp_blk[0] |= ((int64)0xff0000) << (ll<<2); + coef_ctr += runarr[k]+1; + i0 = SCAN_YUV422[coef_ctr][0]; + j0 = SCAN_YUV422[coef_ctr][1]; + + m3[i0][j0]=levarr[k]; + } + } + + // inverse CHROMA DC YUV422 transform + // horizontal + if(currMB->is_lossless == FALSE) + { + m4[0][0] = m3[0][0] + m3[1][0]; + m4[0][1] = m3[0][1] + m3[1][1]; + m4[0][2] = m3[0][2] + m3[1][2]; + m4[0][3] = m3[0][3] + m3[1][3]; + + m4[1][0] = m3[0][0] - m3[1][0]; + m4[1][1] = m3[0][1] - m3[1][1]; + m4[1][2] = m3[0][2] - m3[1][2]; + m4[1][3] = m3[0][3] - m3[1][3]; + + for (i = 0; i < 2; ++i) + { + m6[0] = m4[i][0] + m4[i][2]; + m6[1] = m4[i][0] - m4[i][2]; + m6[2] = m4[i][1] - m4[i][3]; + m6[3] = m4[i][1] + m4[i][3]; + + imgcof[cof4_pos_to_subblock[0][i]][0][0] = m6[0] + m6[3]; + imgcof[cof4_pos_to_subblock[1][i]][0][0] = m6[1] + m6[2]; + imgcof[cof4_pos_to_subblock[2][i]][0][0] = m6[1] - m6[2]; + imgcof[cof4_pos_to_subblock[3][i]][0][0] = m6[0] - m6[3]; + }//for (i=0;i<2;++i) + } + else + { + currSlice->cof4[uv + 1][0][0][0] = m3[0][0]; + currSlice->cof4[uv + 1][1][0][0] = m3[1][0]; + currSlice->cof4[uv + 1][2][0][0] = m3[0][1]; + currSlice->cof4[uv + 1][3][0][0] = m3[1][1]; + currSlice->cof4[uv + 1][8][0][0] = m3[0][2]; + currSlice->cof4[uv + 1][9][0][0] = m3[1][2]; + currSlice->cof4[uv + 1][10][0][0] = m3[0][3]; + currSlice->cof4[uv + 1][11][0][0] = m3[1][3]; + } + + for(j = 0;j < 16; j += BLOCK_SIZE) + { + for(i=0;i < 8;i+=BLOCK_SIZE) + { + imgcof[cof4_pos_to_subblock[j>>2][i>>2]][0][0] = rshift_rnd_sf((imgcof[cof4_pos_to_subblock[j>>2][i>>2]][0][0] * InvLevelScale4x4[0][0]) << qp_per_uv_dc, 6); + } + } + } + }//for (ll=0;ll<3;ll+=2) + }//else if (dec_picture->chroma_format_idc == YUV422) + } + + //========================== CHROMA AC ============================ + //----------------------------------------------------------------- + // chroma AC coeff, all zero fram start_scan + if (cbp<=31) + { + memset(&p_Vid->nz_coeff [mb_nr ][1][0][0], 0, 2 * BLOCK_SIZE * BLOCK_SIZE * sizeof(byte)); + } + else + { + if(currMB->is_lossless == FALSE) + { + for (b8=0; b8 < p_Vid->num_blk8x8_uv; ++b8) + { + currMB->is_v_block = uv = (b8 > ((p_Vid->num_uv_blocks) - 1 )); + InvLevelScale4x4 = intra ? currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv[uv]] : currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv[uv]]; + + for (b4=0; b4 < 4; ++b4) + { + i = cofuv_blk_x[yuv][b8][b4]; + j = cofuv_blk_y[yuv][b8][b4]; + + readCoeff4x4_CAVLC(currMB, CHROMA_AC, i + 2*uv, j + 4, levarr, runarr, &numcoeff); + coef_ctr = 0; + + for(k = 0; k < numcoeff;++k) + { + if (levarr[k] != 0) + { + currMB->cbp_blk[0] |= ((int64)1) << cbp_blk_chroma[b8][b4]; + coef_ctr += runarr[k] + 1; + + i0=pos_scan4x4[coef_ctr][0]; + j0=pos_scan4x4[coef_ctr][1]; + + currSlice->cof4[uv + 1][cof4_pos_to_subblock[j][i]][j0][i0] = rshift_rnd_sf((levarr[k] * InvLevelScale4x4[j0][i0])<<qp_per_uv[uv], 4); + } + } + } + } + } + else + { + int type; + currMB->is_intra_block = IS_INTRA(currMB); + type = (currMB->is_intra_block ? SE_CHR_AC_INTRA : SE_CHR_AC_INTER); + + dP = &(currSlice->partArr[partMap[type]]); + currSE.mapping = linfo_levrun_inter; + + if(currMB->is_lossless == FALSE) + { + for (b8=0; b8 < p_Vid->num_blk8x8_uv; ++b8) + { + currMB->is_v_block = uv = (b8 > ((p_Vid->num_uv_blocks) - 1 )); + InvLevelScale4x4 = intra ? currSlice->InvLevelScale4x4_Intra[uv + 1][qp_rem_uv[uv]] : currSlice->InvLevelScale4x4_Inter[uv + 1][qp_rem_uv[uv]]; + + for (b4 = 0; b4 < 4; ++b4) + { + i = cofuv_blk_x[yuv][b8][b4]; + j = cofuv_blk_y[yuv][b8][b4]; + + currMB->subblock_y = subblk_offset_y[yuv][b8][b4]; + currMB->subblock_x = subblk_offset_x[yuv][b8][b4]; + + pos_scan_4x4 = pos_scan4x4[1]; + + for(k = 0; k < 16;k++) + { + readSyntaxElement_UVLC(&currSE, dP); + level = currSE.value1; + + if (level != 0) + { + currMB->cbp_blk[0] |= ((int64)1) << cbp_blk_chroma[b8][b4]; + pos_scan_4x4 += (currSE.value2 << 1); + + i0 = *pos_scan_4x4++; + j0 = *pos_scan_4x4++; + + currSlice->cof4[uv + 1][cof4_pos_to_subblock[j][i]][j0][i0] = rshift_rnd_sf((level * InvLevelScale4x4[j0][i0])<<qp_per_uv[uv], 4); + } + else + break; + } //for(k=0;(k<16)&&(level!=0);++k) + } + } + } + else + { + for (b8=0; b8 < p_Vid->num_blk8x8_uv; ++b8) + { + currMB->is_v_block = uv = (b8 > ((p_Vid->num_uv_blocks) - 1 )); + + for (b4=0; b4 < 4; ++b4) + { + i = cofuv_blk_x[yuv][b8][b4]; + j = cofuv_blk_y[yuv][b8][b4]; + + pos_scan_4x4 = pos_scan4x4[1]; + + currMB->subblock_y = subblk_offset_y[yuv][b8][b4]; + currMB->subblock_x = subblk_offset_x[yuv][b8][b4]; + + for(k=0;k<16;++k) + { + readSyntaxElement_UVLC(&currSE, dP); + level = currSE.value1; + + if (level != 0) + { + currMB->cbp_blk[0] |= ((int64)1) << cbp_blk_chroma[b8][b4]; + pos_scan_4x4 += (currSE.value2 << 1); + + i0 = *pos_scan_4x4++; + j0 = *pos_scan_4x4++; + + currSlice->cof4[uv + 1][cof4_pos_to_subblock[j][i]][j0][i0] = level; + } + else + break; + } + } + } + } //for (b4=0; b4 < 4; b4++) + } //for (b8=0; b8 < p_Vid->num_blk8x8_uv; b8++) + } //if (dec_picture->chroma_format_idc != YUV400) + } +} + + +/*! +************************************************************************ +* \brief +* decode one color component in an I slice +************************************************************************ +*/ + +static int decode_one_component_i_slice(Macroblock *currMB, ColorPlane curr_plane, VideoImage *image, StorablePicture *dec_picture) +{ + //For residual DPCM + currMB->ipmode_DPCM = NO_INTRA_PMODE; + if(currMB->mb_type == IPCM) + mb_pred_ipcm(currMB); + else if (IS_I16MB (currMB)) // get prediction for INTRA_MB_16x16 + mb_pred_intra16x16(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == I4MB) + mb_pred_intra4x4(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == I8MB) + mb_pred_intra8x8(currMB, curr_plane, image, dec_picture); + + return 1; +} + +/*! +************************************************************************ +* \brief +* decode one color component for a p slice +************************************************************************ +*/ +static int decode_one_component_p_slice(Macroblock *currMB, ColorPlane curr_plane, VideoImage *image, StorablePicture *dec_picture) +{ + //For residual DPCM + currMB->ipmode_DPCM = NO_INTRA_PMODE; + if(currMB->mb_type == IPCM) + mb_pred_ipcm(currMB); + else if (IS_I16MB (currMB)) // get prediction for INTRA_MB_16x16 + mb_pred_intra16x16(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == I4MB) + mb_pred_intra4x4(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == I8MB) + mb_pred_intra8x8(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == PSKIP) + mb_pred_skip(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P16x16) + mb_pred_p_inter16x16(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P16x8) + mb_pred_p_inter16x8(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P8x16) + mb_pred_p_inter8x16(currMB, curr_plane, image, dec_picture); + else + mb_pred_p_inter8x8(currMB, curr_plane, image, dec_picture); + + return 1; +} + + +/*! +************************************************************************ +* \brief +* decode one color component for a sp slice +************************************************************************ +*/ +static int decode_one_component_sp_slice(Macroblock *currMB, ColorPlane curr_plane, VideoImage *image, StorablePicture *dec_picture) +{ + //For residual DPCM + currMB->ipmode_DPCM = NO_INTRA_PMODE; + + if(currMB->mb_type == IPCM) + mb_pred_ipcm(currMB); + else if (IS_I16MB (currMB)) // get prediction for INTRA_MB_16x16 + mb_pred_intra16x16(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == I4MB) + mb_pred_intra4x4(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == I8MB) + mb_pred_intra8x8(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == PSKIP) + mb_pred_sp_skip(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P16x16) + mb_pred_p_inter16x16(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P16x8) + mb_pred_p_inter16x8(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P8x16) + mb_pred_p_inter8x16(currMB, curr_plane, image, dec_picture); + else + mb_pred_p_inter8x8(currMB, curr_plane, image, dec_picture); + + return 1; +} + +static void set_chroma_vector(Macroblock *currMB, int *list_offset) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + + if (!currSlice->mb_aff_frame_flag) + { + if(p_Vid->structure == TOP_FIELD) + { + int k,l; + for (l = LIST_0; l <= (LIST_1); l++) + { + for(k = 0; k < p_Vid->listXsize[l]; k++) + { + if(p_Vid->structure != p_Vid->listX[l][k]->structure) + p_Vid->listX[l][k]->chroma_vector_adjustment = -2; + else + p_Vid->listX[l][k]->chroma_vector_adjustment= 0; + } + } + } + else if(p_Vid->structure == BOTTOM_FIELD) + { + int k,l; + for (l = LIST_0; l <= (LIST_1); l++) + { + for(k = 0; k < p_Vid->listXsize[l]; k++) + { + if (p_Vid->structure != p_Vid->listX[l][k]->structure) + p_Vid->listX[l][k]->chroma_vector_adjustment = 2; + else + p_Vid->listX[l][k]->chroma_vector_adjustment= 0; + } + } + } + else + { + int k,l; + for (l = LIST_0; l <= (LIST_1); l++) + { + for(k = 0; k < p_Vid->listXsize[l]; k++) + { + p_Vid->listX[l][k]->chroma_vector_adjustment= 0; + } + } + } + } + else + { + int mb_nr = (currMB->mbAddrX & 0x01); + int k,l; + + ////////////////////////// + // find out the correct list offsets + if (currMB->mb_field) + { + *list_offset = mb_nr ? 4 : 2; + + for (l = LIST_0 + *list_offset; l <= (LIST_1 + *list_offset); l++) + { + for(k = 0; k < p_Vid->listXsize[l]; k++) + { + if(mb_nr == 0 && p_Vid->listX[l][k]->structure == BOTTOM_FIELD) + p_Vid->listX[l][k]->chroma_vector_adjustment = -2; + else if(mb_nr == 1 && p_Vid->listX[l][k]->structure == TOP_FIELD) + p_Vid->listX[l][k]->chroma_vector_adjustment = 2; + else + p_Vid->listX[l][k]->chroma_vector_adjustment= 0; + } + } + } + else + { + for (l = LIST_0; l <= (LIST_1); l++) + { + for(k = 0; k < p_Vid->listXsize[l]; k++) + { + p_Vid->listX[l][k]->chroma_vector_adjustment= 0; + } + } + } + } + + p_Vid->max_mb_vmv_r = (p_Vid->structure != FRAME || (currSlice->mb_aff_frame_flag && currMB->mb_field)) ? p_Vid->max_vmv_r >> 1 : p_Vid->max_vmv_r; +} + + +static void mb_pred_b_dspatial(Macroblock *currMB, ColorPlane curr_plane, VideoImage *image, StorablePicture *dec_picture) +{ + char l0_rFrame = -1, l1_rFrame = -1; + PicMotionParams *motion = &dec_picture->motion; + MotionVector pmvl0={0,0}, pmvl1={0,0}; + int k; + int block8x8; + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + int curr_mb_field = ((currSlice->mb_aff_frame_flag)&&(currMB->mb_field)); + + MotionParams *colocated = &currSlice->p_colocated->frame; + int list_offset = 0; + int pred_dir = 0; + + Boolean has_zero_partitions = FALSE; + h264_ref_t *ref_pic_num_l0, *ref_pic_num_l1; + + set_chroma_vector(currMB, &list_offset); + + if (currMB->mb_field) + { + if(currMB->mbAddrX & 0x01) + { + colocated = &currSlice->p_colocated->bottom; + } + else + { + colocated = &currSlice->p_colocated->top; + } + } + + prepare_direct_params(currMB, dec_picture, pmvl0, pmvl1, &l0_rFrame, &l1_rFrame); + + ref_pic_num_l0 = dec_picture->ref_pic_num[p_Vid->current_slice_nr][LIST_0 + list_offset]; + ref_pic_num_l1 = dec_picture->ref_pic_num[p_Vid->current_slice_nr][LIST_1 + list_offset]; + + if (p_Vid->active_sps->direct_8x8_inference_flag) + { + if (l0_rFrame >=0 && l1_rFrame >=0) + { + PicMotion **motion0 = &motion->motion[LIST_0][currMB->block_y]; + PicMotion **motion1 = &motion->motion[LIST_1][currMB->block_y]; + int block_x = currMB->block_x; + has_zero_partitions = TRUE; + pred_dir = 2; + if (p_Vid->listX[LIST_1 + list_offset][0]->is_long_term) + { // long term + //--- + memcpy(motion0[0][block_x + 0].mv, pmvl0, sizeof(MotionVector)); + motion0[0][block_x + 0].ref_idx = l0_rFrame; + memcpy(motion1[0][block_x + 0].mv, pmvl1, sizeof(MotionVector)); + motion1[0][block_x + 0].ref_idx = l1_rFrame; + motion0[0][block_x + 0].ref_pic_id = ref_pic_num_l0[(short)motion0[0][block_x + 0].ref_idx]; + motion1[0][block_x + 0].ref_pic_id = ref_pic_num_l1[(short)motion1[0][block_x + 0].ref_idx]; + memcpy(motion0[0][block_x + 1].mv, pmvl0, sizeof(MotionVector)); + motion0[0][block_x + 1].ref_idx = l0_rFrame; + memcpy(motion1[0][block_x + 1].mv, pmvl1, sizeof(MotionVector)); + motion1[0][block_x + 1].ref_idx = l1_rFrame; + motion0[0][block_x + 1].ref_pic_id = ref_pic_num_l0[(short)motion0[0][block_x + 1].ref_idx]; + motion1[0][block_x + 1].ref_pic_id = ref_pic_num_l1[(short)motion1[0][block_x + 1].ref_idx]; + memcpy(motion0[1][block_x + 0].mv, pmvl0, sizeof(MotionVector)); + motion0[1][block_x + 0].ref_idx = l0_rFrame; + memcpy(motion1[1][block_x + 0].mv, pmvl1, sizeof(MotionVector)); + motion1[1][block_x + 0].ref_idx = l1_rFrame; + motion0[1][block_x + 0].ref_pic_id = ref_pic_num_l0[(short)motion0[1][block_x + 0].ref_idx]; + motion1[1][block_x + 0].ref_pic_id = ref_pic_num_l1[(short)motion1[1][block_x + 0].ref_idx]; + memcpy(motion0[1][block_x + 1].mv, pmvl0, sizeof(MotionVector)); + motion0[1][block_x + 1].ref_idx = l0_rFrame; + memcpy(motion1[1][block_x + 1].mv, pmvl1, sizeof(MotionVector)); + motion1[1][block_x + 1].ref_idx = l1_rFrame; + motion0[1][block_x + 1].ref_pic_id = ref_pic_num_l0[(short)motion0[1][block_x + 1].ref_idx]; + motion1[1][block_x + 1].ref_pic_id = ref_pic_num_l1[(short)motion1[1][block_x + 1].ref_idx]; + perform_mc8x8(currMB, curr_plane, dec_picture, pred_dir, 0, 0, list_offset, curr_mb_field); + //--- + memcpy(motion0[0][block_x + 2].mv, pmvl0, sizeof(MotionVector)); + motion0[0][block_x + 2].ref_idx = l0_rFrame; + memcpy(motion1[0][block_x + 2].mv, pmvl1, sizeof(MotionVector)); + motion1[0][block_x + 2].ref_idx = l1_rFrame; + motion0[0][block_x + 2].ref_pic_id = ref_pic_num_l0[(short)motion0[0][block_x + 2].ref_idx]; + motion1[0][block_x + 2].ref_pic_id = ref_pic_num_l1[(short)motion1[0][block_x + 2].ref_idx]; + memcpy(motion0[0][block_x + 3].mv, pmvl0, sizeof(MotionVector)); + motion0[0][block_x + 3].ref_idx = l0_rFrame; + memcpy(motion1[0][block_x + 3].mv, pmvl1, sizeof(MotionVector)); + motion1[0][block_x + 3].ref_idx = l1_rFrame; + motion0[0][block_x + 3].ref_pic_id = ref_pic_num_l0[(short)motion0[0][block_x + 3].ref_idx]; + motion1[0][block_x + 3].ref_pic_id = ref_pic_num_l1[(short)motion1[0][block_x + 3].ref_idx]; + memcpy(motion0[1][block_x + 2].mv, pmvl0, sizeof(MotionVector)); + motion0[1][block_x + 2].ref_idx = l0_rFrame; + memcpy(motion1[1][block_x + 2].mv, pmvl1, sizeof(MotionVector)); + motion1[1][block_x + 2].ref_idx = l1_rFrame; + motion0[1][block_x + 2].ref_pic_id = ref_pic_num_l0[(short)motion0[1][block_x + 2].ref_idx]; + motion1[1][block_x + 2].ref_pic_id = ref_pic_num_l1[(short)motion1[1][block_x + 2].ref_idx]; + memcpy(motion0[1][block_x + 3].mv, pmvl0, sizeof(MotionVector)); + motion0[1][block_x + 3].ref_idx = l0_rFrame; + memcpy(motion1[1][block_x + 3].mv, pmvl1, sizeof(MotionVector)); + motion1[1][block_x + 3].ref_idx = l1_rFrame; + motion0[1][block_x + 3].ref_pic_id = ref_pic_num_l0[(short)motion0[1][block_x + 3].ref_idx]; + motion1[1][block_x + 3].ref_pic_id = ref_pic_num_l1[(short)motion1[1][block_x + 3].ref_idx]; + perform_mc8x8(currMB, curr_plane, dec_picture, pred_dir, 2, 0, list_offset, curr_mb_field); + //--- + memcpy(motion0[2][block_x + 0].mv, pmvl0, sizeof(MotionVector)); + motion0[2][block_x + 0].ref_idx = l0_rFrame; + memcpy(motion1[2][block_x + 0].mv, pmvl1, sizeof(MotionVector)); + motion1[2][block_x + 0].ref_idx = l1_rFrame; + motion0[2][block_x + 0].ref_pic_id = ref_pic_num_l0[(short)motion0[2][block_x + 0].ref_idx]; + motion1[2][block_x + 0].ref_pic_id = ref_pic_num_l1[(short)motion1[2][block_x + 0].ref_idx]; + memcpy(motion0[2][block_x + 1].mv, pmvl0, sizeof(MotionVector)); + motion0[2][block_x + 1].ref_idx = l0_rFrame; + memcpy(motion1[2][block_x + 1].mv, pmvl1, sizeof(MotionVector)); + motion1[2][block_x + 1].ref_idx = l1_rFrame; + motion0[2][block_x + 1].ref_pic_id = ref_pic_num_l0[(short)motion0[2][block_x + 1].ref_idx]; + motion1[2][block_x + 1].ref_pic_id = ref_pic_num_l1[(short)motion1[2][block_x + 1].ref_idx]; + memcpy(motion0[3][block_x + 0].mv, pmvl0, sizeof(MotionVector)); + motion0[3][block_x + 0].ref_idx = l0_rFrame; + memcpy(motion1[3][block_x + 0].mv, pmvl1, sizeof(MotionVector)); + motion1[3][block_x + 0].ref_idx = l1_rFrame; + motion0[3][block_x + 0].ref_pic_id = ref_pic_num_l0[(short)motion0[3][block_x + 0].ref_idx]; + motion1[3][block_x + 0].ref_pic_id = ref_pic_num_l1[(short)motion1[3][block_x + 0].ref_idx]; + memcpy(motion0[3][block_x + 1].mv, pmvl0, sizeof(MotionVector)); + motion0[3][block_x + 1].ref_idx = l0_rFrame; + memcpy(motion1[3][block_x + 1].mv, pmvl1, sizeof(MotionVector)); + motion1[3][block_x + 1].ref_idx = l1_rFrame; + motion0[3][block_x + 1].ref_pic_id = ref_pic_num_l0[(short)motion0[3][block_x + 1].ref_idx]; + motion1[3][block_x + 1].ref_pic_id = ref_pic_num_l1[(short)motion1[3][block_x + 1].ref_idx]; + perform_mc8x8(currMB, curr_plane, dec_picture, pred_dir, 0, 2, list_offset, curr_mb_field); + //--- + memcpy(motion0[2][block_x + 2].mv, pmvl0, sizeof(MotionVector)); + motion0[2][block_x + 2].ref_idx = l0_rFrame; + memcpy(motion1[2][block_x + 2].mv, pmvl1, sizeof(MotionVector)); + motion1[2][block_x + 2].ref_idx = l1_rFrame; + motion0[2][block_x + 2].ref_pic_id = ref_pic_num_l0[(short)motion0[2][block_x + 2].ref_idx]; + motion1[2][block_x + 2].ref_pic_id = ref_pic_num_l1[(short)motion1[2][block_x + 2].ref_idx]; + memcpy(motion0[2][block_x + 3].mv, pmvl0, sizeof(MotionVector)); + motion0[2][block_x + 3].ref_idx = l0_rFrame; + memcpy(motion1[2][block_x + 3].mv, pmvl1, sizeof(MotionVector)); + motion1[2][block_x + 3].ref_idx = l1_rFrame; + motion0[2][block_x + 3].ref_pic_id = ref_pic_num_l0[(short)motion0[2][block_x + 3].ref_idx]; + motion1[2][block_x + 3].ref_pic_id = ref_pic_num_l1[(short)motion1[2][block_x + 3].ref_idx]; + memcpy(motion0[3][block_x + 2].mv, pmvl0, sizeof(MotionVector)); + motion0[3][block_x + 2].ref_idx = l0_rFrame; + memcpy(motion1[3][block_x + 2].mv, pmvl1, sizeof(MotionVector)); + motion1[3][block_x + 2].ref_idx = l1_rFrame; + motion0[3][block_x + 2].ref_pic_id = ref_pic_num_l0[(short)motion0[3][block_x + 2].ref_idx]; + motion1[3][block_x + 2].ref_pic_id = ref_pic_num_l1[(short)motion1[3][block_x + 2].ref_idx]; + memcpy(motion0[3][block_x + 3].mv, pmvl0, sizeof(MotionVector)); + motion0[3][block_x + 3].ref_idx = l0_rFrame; + memcpy(motion1[3][block_x + 3].mv, pmvl1, sizeof(MotionVector)); + motion1[3][block_x + 3].ref_idx = l1_rFrame; + motion0[3][block_x + 3].ref_pic_id = ref_pic_num_l0[(short)motion0[3][block_x + 3].ref_idx]; + motion1[3][block_x + 3].ref_pic_id = ref_pic_num_l1[(short)motion1[3][block_x + 3].ref_idx]; + perform_mc8x8(currMB, curr_plane, dec_picture, pred_dir, 2, 2, list_offset, curr_mb_field); + } + else + { // not long term + const byte **colocated_moving_block = &colocated->moving_block[currMB->block_y_aff]; + for (block8x8 = 0; block8x8 < 4; block8x8++) + { + int k_start = (block8x8 << 2); + for (k = k_start; k < k_start + BLOCK_MULTIPLE; k ++) + { + int i = (decode_block_scan[k] & 3); + int j = ((decode_block_scan[k] >> 2) & 3); + int i4 = currMB->block_x + i; + + //===== DIRECT PREDICTION ===== + if (!l0_rFrame && !colocated_moving_block[j][i4]) + { + motion0[j][i4].mv[0] = 0; + motion0[j][i4].mv[1] = 0; + motion0[j][i4].ref_idx = 0; + } + else + { + motion0[j][i4].mv[0] = pmvl0[0]; + motion0[j][i4].mv[1] = pmvl0[1]; + motion0[j][i4].ref_idx = l0_rFrame; + } + + if (l1_rFrame == 0 && !colocated_moving_block[j][i4]) + { + motion1[j][i4].mv[0] = 0; + motion1[j][i4].mv[1] = 0; + motion1[j][i4].ref_idx = 0; + } + else + { + motion1[j][i4].mv[0] = pmvl1[0]; + motion1[j][i4].mv[1] = pmvl1[1]; + motion1[j][i4].ref_idx = l1_rFrame; + } + + motion0[j][i4].ref_pic_id = ref_pic_num_l0[(short)motion0[j][i4].ref_idx]; + motion1[j][i4].ref_pic_id = ref_pic_num_l1[(short)motion1[j][i4].ref_idx]; + } + + perform_mc8x8(currMB, curr_plane, dec_picture, pred_dir, (decode_block_scan[k_start] & 3), ((decode_block_scan[k_start] >> 2) & 3), list_offset, curr_mb_field); + } + } + } + else + { + for (block8x8 = 0; block8x8 < 4; block8x8++) + { + int k_start = (block8x8 << 2); + for (k = k_start; k < k_start + BLOCK_MULTIPLE; k ++) + { + int i = (decode_block_scan[k] & 3); + int j = ((decode_block_scan[k] >> 2) & 3); + int i4 = currMB->block_x + i; + int j4 = currMB->block_y + j; + int j6 = currMB->block_y_aff + j; + + //printf("%d %d\n", i, j); + + //===== DIRECT PREDICTION ===== + + if (l0_rFrame >=0) + { + if (!l0_rFrame && ((!colocated->moving_block[j6][i4]) && (!p_Vid->listX[LIST_1 + list_offset][0]->is_long_term))) + { + has_zero_partitions = TRUE; + motion->motion[LIST_0][j4][i4].mv[0] = 0; + motion->motion[LIST_0][j4][i4].mv[1] = 0; + motion->motion[LIST_0][j4][i4].ref_idx = 0; + } + else + { + has_zero_partitions = TRUE; + motion->motion[LIST_0][j4][i4].mv[0] = pmvl0[0]; + motion->motion[LIST_0][j4][i4].mv[1] = pmvl0[1]; + motion->motion[LIST_0][j4][i4].ref_idx = l0_rFrame; + } + } + else + { + motion->motion[LIST_0][j4][i4].mv[0] = 0; + motion->motion[LIST_0][j4][i4].mv[1] = 0; + motion->motion[LIST_0][j4][i4].ref_idx = -1; + } + + if (l1_rFrame >=0) + { + if (l1_rFrame == 0 && ((!colocated->moving_block[j6][i4]) && (!p_Vid->listX[LIST_1 + list_offset][0]->is_long_term))) + { + has_zero_partitions = TRUE; + motion->motion[LIST_1][j4][i4].mv[0] = 0; + motion->motion[LIST_1][j4][i4].mv[1] = 0; + motion->motion[LIST_1][j4][i4].ref_idx = 0; + } + else + { + has_zero_partitions = TRUE; + motion->motion[LIST_1][j4][i4].mv[0] = pmvl1[0]; + motion->motion[LIST_1][j4][i4].mv[1] = pmvl1[1]; + motion->motion[LIST_1][j4][i4].ref_idx = l1_rFrame; + } + } + else + { + motion->motion[LIST_1][j4][i4].mv[0] = 0; + motion->motion[LIST_1][j4][i4].mv[1] = 0; + motion->motion[LIST_1][j4][i4].ref_idx = -1; + } + + if (l1_rFrame == -1) + pred_dir = 0; + else if (l0_rFrame == -1) + pred_dir = 1; + else + pred_dir = 2; + + if (l0_rFrame < 0 && l1_rFrame < 0) + { + motion->motion[LIST_0][j4][i4].ref_idx = 0; + motion->motion[LIST_1][j4][i4].ref_idx = 0; + pred_dir = 2; + } + + motion->motion[LIST_0][j4][i4].ref_pic_id = ref_pic_num_l0[(short)motion->motion[LIST_0][j4][i4].ref_idx]; + motion->motion[LIST_1][j4][i4].ref_pic_id = ref_pic_num_l1[(short)motion->motion[LIST_1][j4][i4].ref_idx]; + } + + if (has_zero_partitions == TRUE) + { + int i = (decode_block_scan[k_start] & 3); + int j = ((decode_block_scan[k_start] >> 2) & 3); + + perform_mc8x8(currMB, curr_plane, dec_picture, pred_dir, i, j, list_offset, curr_mb_field); + } + } + } + } + else + { + for (block8x8 = 0; block8x8 < 4; block8x8++) + { + int k_start = (block8x8 << 2); + int k_end = k_start + BLOCK_MULTIPLE; + + for (k = k_start; k < k_end; k ++) + { + int i = (decode_block_scan[k] & 3); + int j = ((decode_block_scan[k] >> 2) & 3); + int i4 = currMB->block_x + i; + int j4 = currMB->block_y + j; + int j6 = currMB->block_y_aff + j; + + //===== DIRECT PREDICTION ===== + + if (l0_rFrame >=0) + { + if (!l0_rFrame && ((!colocated->moving_block[j6][i4]) && (!p_Vid->listX[LIST_1 + list_offset][0]->is_long_term))) + { + has_zero_partitions = TRUE; + motion->motion[LIST_0][j4][i4].mv[0] = 0; + motion->motion[LIST_0][j4][i4].mv[1] = 0; + motion->motion[LIST_0][j4][i4].ref_idx = 0; + } + else + { + has_zero_partitions = TRUE; + motion->motion[LIST_0][j4][i4].mv[0] = pmvl0[0]; + motion->motion[LIST_0][j4][i4].mv[1] = pmvl0[1]; + motion->motion[LIST_0][j4][i4].ref_idx = l0_rFrame; + } + } + else + { + motion->motion[LIST_0][j4][i4].mv[0] = 0; + motion->motion[LIST_0][j4][i4].mv[1] = 0; + motion->motion[LIST_0][j4][i4].ref_idx = -1; + } + + if (l1_rFrame >=0) + { + if (l1_rFrame == 0 && ((!colocated->moving_block[j6][i4]) && (!p_Vid->listX[LIST_1 + list_offset][0]->is_long_term))) + { + has_zero_partitions = TRUE; + motion->motion[LIST_1][j4][i4].mv[0] = 0; + motion->motion[LIST_1][j4][i4].mv[1] = 0; + motion->motion[LIST_1][j4][i4].ref_idx = 0; + } + else + { + has_zero_partitions = TRUE; + motion->motion[LIST_1][j4][i4].mv[0] = pmvl1[0]; + motion->motion[LIST_1][j4][i4].mv[1] = pmvl1[1]; + motion->motion[LIST_1][j4][i4].ref_idx = l1_rFrame; + } + } + else + { + motion->motion[LIST_1][j4][i4].mv[0] = 0; + motion->motion[LIST_1][j4][i4].mv[1] = 0; + motion->motion[LIST_1][j4][i4].ref_idx = -1; + } + + if (l0_rFrame < 0 && l1_rFrame < 0) + { + motion->motion[LIST_0][j4][i4].ref_idx = 0; + motion->motion[LIST_1][j4][i4].ref_idx = 0; + } + + if (l1_rFrame == -1) + { + if (l0_rFrame == -1) + pred_dir = 2; + else + pred_dir = 0; + } + else if (l0_rFrame == -1) + { + pred_dir = 1; + } + else + pred_dir = 2; + + motion->motion[LIST_0][j4][i4].ref_pic_id = ref_pic_num_l0[(short)motion->motion[LIST_0][j4][i4].ref_idx]; + motion->motion[LIST_1][j4][i4].ref_pic_id = ref_pic_num_l1[(short)motion->motion[LIST_1][j4][i4].ref_idx]; + } + + if (has_zero_partitions == TRUE) + { + for (k = k_start; k < k_end; k ++) + { + int i = (decode_block_scan[k] & 3); + int j = ((decode_block_scan[k] >> 2) & 3); + + perform_mc(currMB, curr_plane, dec_picture, pred_dir, i, j, list_offset, BLOCK_SIZE, BLOCK_SIZE, curr_mb_field); + } + } + } + } + + if (has_zero_partitions == FALSE) + { + perform_mc16x16(currMB, curr_plane, dec_picture, pred_dir, list_offset, curr_mb_field); + } + + if (currMB->cbp == 0) + { + opt_copy_image_data_16x16_stride(image, currMB->pix_x, currMB->pix_y, currSlice->mb_pred[curr_plane]); + + if (dec_picture->chroma_format_idc == YUV420) + { + copy_image_data_8x8_stride(dec_picture->imgUV[0], currMB->pix_c_x, currMB->pix_c_y, currSlice->mb_pred[1]); + copy_image_data_8x8_stride(dec_picture->imgUV[1], currMB->pix_c_x, currMB->pix_c_y, currSlice->mb_pred[2]); + } + else if (dec_picture->chroma_format_idc == YUV422) + { + copy_image_data_stride(dec_picture->imgUV[0], currMB->pix_c_x, currMB->pix_c_y, currSlice->mb_pred[1], 8, 16); + copy_image_data_stride(dec_picture->imgUV[1], currMB->pix_c_x, currMB->pix_c_y, currSlice->mb_pred[2], 8, 16); + } + } + else + iTransform(currMB, curr_plane, 0); +} + + + +/*! +************************************************************************ +* \brief +* decode one color component for a b slice +************************************************************************ +*/ + +static int decode_one_component_b_slice(Macroblock *currMB, ColorPlane curr_plane, VideoImage *image, StorablePicture *dec_picture) +{ + //For residual DPCM + currMB->ipmode_DPCM = NO_INTRA_PMODE; + + if(currMB->mb_type == IPCM) + mb_pred_ipcm(currMB); + else if (IS_I16MB (currMB)) // get prediction for INTRA_MB_16x16 + mb_pred_intra16x16(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == I4MB) + mb_pred_intra4x4(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == I8MB) + mb_pred_intra8x8(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P16x16) + mb_pred_p_inter16x16(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P16x8) + mb_pred_p_inter16x8(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == P8x16) + mb_pred_p_inter8x16(currMB, curr_plane, image, dec_picture); + else if (currMB->mb_type == BSKIP_DIRECT) + { + if (currMB->p_Slice->direct_spatial_mv_pred_flag == 0) + mb_pred_b_dtemporal (currMB, curr_plane, image, dec_picture); + else + mb_pred_b_dspatial (currMB, curr_plane, image, dec_picture); + } + else + mb_pred_b_inter8x8 (currMB, curr_plane, image, dec_picture); + + return 1; +} + +/*! +************************************************************************ +* \brief +* decode one macroblock +************************************************************************ +*/ + +int decode_one_macroblock(Macroblock *currMB, StorablePicture *dec_picture) +{ + Slice *currSlice = currMB->p_Slice; + VideoParameters *p_Vid = currMB->p_Vid; + + // luma decoding ************************************************** + currSlice->decode_one_component(currMB, PLANE_Y, dec_picture->imgY, dec_picture); + + if ((p_Vid->active_sps->chroma_format_idc==YUV444)&&(!IS_INDEPENDENT(p_Vid))) + { + currSlice->decode_one_component(currMB, PLANE_U, dec_picture->imgUV[0], dec_picture); + currSlice->decode_one_component(currMB, PLANE_V, dec_picture->imgUV[1], dec_picture); + } + return 0; +} + + +/*! +************************************************************************ +* \brief +* change target plane +* for 4:4:4 Independent mode +************************************************************************ +*/ +void change_plane_JV( VideoParameters *p_Vid, int nplane ) +{ + Slice *currSlice = p_Vid->currentSlice; + p_Vid->colour_plane_id = nplane; + p_Vid->mb_data = p_Vid->mb_data_JV[nplane]; + p_Vid->dec_picture = p_Vid->dec_picture_JV[nplane]; + currSlice->p_colocated = currSlice->Co_located_JV[nplane]; +} + +/*! +************************************************************************ +* \brief +* make frame picture from each plane data +* for 4:4:4 Independent mode +************************************************************************ +*/ +void make_frame_picture_JV(VideoParameters *p_Vid) +{ + int uv, line; + int nsize; + int nplane; + p_Vid->dec_picture = p_Vid->dec_picture_JV[0]; + + // Copy Storable Params + for( nplane=0; nplane<MAX_PLANE; nplane++ ) + { + copy_storable_param_JV( p_Vid, &p_Vid->dec_picture->JVmotion[nplane], &p_Vid->dec_picture_JV[nplane]->motion ); + } + + // This could be done with pointers and seems not necessary + for( uv=0; uv<2; uv++ ) + { + for( line=0; line<p_Vid->height; line++ ) + { + nsize = sizeof(imgpel) * p_Vid->width; + memcpy( p_Vid->dec_picture->imgUV[uv]->img[line], p_Vid->dec_picture_JV[uv+1]->imgY->img[line], nsize ); + } + free_storable_picture(p_Vid, p_Vid->dec_picture_JV[uv+1]); + } +} + + |