在开始研究这部分代码之前,重新回顾一下理论部分。
众所周知,H.264及其之前的编码标准中,VCL层的核心结构称作“宏块”(MacroBlock, MB),大小为16×16像素。一个宏块里面包含着一个16×16分辨率的亮度采样矩阵和两个8×8分辨率的色度采样矩阵。相应的,在HEVC中,编码所采用的块结构为树形编码单元(Coding Tree Unit, CTU),每个CTU的大小由编码器决定,并且通常要大于宏块的16×16大小。比CTU更小的单位称为树形编码块(Coding Tree Block, CTB),一个CTU由一个亮度信号CTB及其相应的色度CTB,以及其他一些语法元素构成。一个正方形的亮度CTB的边长(以像素为单位)可能取16、32或者64个像素,CTB越大则压缩效率越高。HEVC标准支持将一个CTB按照四叉树的方法分割为多个更小的块结构。
采用了四叉树分割的方法后,这个树结构保存了亮度和色度编码单元(Coding Unit, CU)的位置和大小。这个四叉树结构的根与当前的这个CTU对应,也就是说,一个亮度CU最大可能的大小就是亮度CTB的大小。通常,一个CU的组成包括一个亮度编码块(Coding Block, CB),一个色度CB以及其他相应的语法元素。一个CTB可能包含一个CU,也可能被分割成多个CU,每一个CU进一步分割成预测单元(Prediction Unit, PU)和树结构的变换单元(Transform Unit, TU)。
判断采用帧内预测还是帧间预测在CU层完成。PU的分割结构就以CU为根,根据基本的预测模式判定,亮度和色度CB被进一步分割,由亮度和色度预测块(Prediction Block, PB)中获取预测值。每一个PB的大小可能由64×64到4×4不等。预测的残差信号由TU进行编码。同PU类似,TU树形结构的根节点也是CU,一个亮度CB的残差信号可能由一个完整的变换块(Transform Block, TB)表示,也可能树形分割成多个子TB。对4×4、8×8、16×16和32×32的正方形TB块,HEVC依然采用整数变换;当TB大小为4×4,且采用帧内编码的残差信号则采用了一种类离散正弦变换的方法。
标准文档的7.3.8.4节给出了Coding quadtree的语法结构:
该结构中的第一个语法元素split_cu_flag[x0][y0]表明这个Coding quadtree是否继续四等分,下标x0和y0表示当前拟作为cu的像素块左上角像素相对于该帧左上角的坐标。从该结构的定义来看,Coding quadtree采用了递归的结构,只要split_cu_flag[x0][y0]为1,则这个Coding quadtree就会继续分割下去,直到split_cu_flag[x0][y0]为0时,这个Coding quadtree进一步处理为一个coding unit。
回到代码中。实现解析Coding quadtree的函数由Void TDecCu::xDecodeCU( TComDataCU* pcCU, UInt uiAbsPartIdx, UInt uiDepth, UInt& ruiIsLast)实现:
Void TDecCu::xDecodeCU( TComDataCU* pcCU, UInt uiAbsPartIdx, UInt uiDepth, UInt& ruiIsLast)
{
TComPic* pcPic = pcCU->getPic();
UInt uiCurNumParts = pcPic->getNumPartInCU() >> (uiDepth<<1);
UInt uiQNumParts = uiCurNumParts>>2;
Bool bBoundary = false;
UInt uiLPelX = pcCU->getCUPelX() + g_auiRasterToPelX[ g_auiZscanToRaster[uiAbsPartIdx] ];
UInt uiRPelX = uiLPelX + (g_uiMaxCUWidth>>uiDepth) - 1;
UInt uiTPelY = pcCU->getCUPelY() + g_auiRasterToPelY[ g_auiZscanToRaster[uiAbsPartIdx] ];
UInt uiBPelY = uiTPelY + (g_uiMaxCUHeight>>uiDepth) - 1;
TComSlice * pcSlice = pcCU->getPic()->getSlice(pcCU->getPic()->getCurrSliceIdx());
Bool bStartInCU = pcCU->getSCUAddr()+uiAbsPartIdx+uiCurNumParts>pcSlice->getSliceSegmentCurStartCUAddr()&&pcCU->getSCUAddr()+uiAbsPartIdx<pcSlice->getSliceSegmentCurStartCUAddr();
if((!bStartInCU) && ( uiRPelX < pcSlice->getSPS()->getPicWidthInLumaSamples() ) && ( uiBPelY < pcSlice->getSPS()->getPicHeightInLumaSamples() ) )
{
m_pcEntropyDecoder->decodeSplitFlag( pcCU, uiAbsPartIdx, uiDepth );
}
else
{
bBoundary = true;
}
if( ( ( uiDepth < pcCU->getDepth( uiAbsPartIdx ) ) && ( uiDepth < g_uiMaxCUDepth - g_uiAddCUDepth ) ) || bBoundary )
{
UInt uiIdx = uiAbsPartIdx;
if( (g_uiMaxCUWidth>>uiDepth) == pcCU->getSlice()->getPPS()->getMinCuDQPSize() && pcCU->getSlice()->getPPS()->getUseDQP())
{
setdQPFlag(true);
pcCU->setQPSubParts( pcCU->getRefQP(uiAbsPartIdx), uiAbsPartIdx, uiDepth ); // set QP to default QP
}
for ( UInt uiPartUnitIdx = 0; uiPartUnitIdx < 4; uiPartUnitIdx++ )
{
uiLPelX = pcCU->getCUPelX() + g_auiRasterToPelX[ g_auiZscanToRaster[uiIdx] ];
uiTPelY = pcCU->getCUPelY() + g_auiRasterToPelY[ g_auiZscanToRaster[uiIdx] ];
Bool bSubInSlice = pcCU->getSCUAddr()+uiIdx+uiQNumParts>pcSlice->getSliceSegmentCurStartCUAddr();
if ( bSubInSlice )
{
if ( !ruiIsLast && ( uiLPelX < pcCU->getSlice()->getSPS()->getPicWidthInLumaSamples() ) && ( uiTPelY < pcCU->getSlice()->getSPS()->getPicHeightInLumaSamples() ) )
{
xDecodeCU( pcCU, uiIdx, uiDepth+1, ruiIsLast );
}
else
{
pcCU->setOutsideCUPart( uiIdx, uiDepth+1 );
}
}
uiIdx += uiQNumParts;
}
if( (g_uiMaxCUWidth>>uiDepth) == pcCU->getSlice()->getPPS()->getMinCuDQPSize() && pcCU->getSlice()->getPPS()->getUseDQP())
{
if ( getdQPFlag() )
{
UInt uiQPSrcPartIdx;
if ( pcPic->getCU( pcCU->getAddr() )->getSliceSegmentStartCU(uiAbsPartIdx) != pcSlice->getSliceSegmentCurStartCUAddr() )
{
uiQPSrcPartIdx = pcSlice->getSliceSegmentCurStartCUAddr() % pcPic->getNumPartInCU();
}
else
{
uiQPSrcPartIdx = uiAbsPartIdx;
}
pcCU->setQPSubParts( pcCU->getRefQP( uiQPSrcPartIdx ), uiAbsPartIdx, uiDepth ); // set QP to default QP
}
}
return;
}
if( (g_uiMaxCUWidth>>uiDepth) >= pcCU->getSlice()->getPPS()->getMinCuDQPSize() && pcCU->getSlice()->getPPS()->getUseDQP())
{
setdQPFlag(true);
pcCU->setQPSubParts( pcCU->getRefQP(uiAbsPartIdx), uiAbsPartIdx, uiDepth ); // set QP to default QP
}
if (pcCU->getSlice()->getPPS()->getTransquantBypassEnableFlag())
{
m_pcEntropyDecoder->decodeCUTransquantBypassFlag( pcCU, uiAbsPartIdx, uiDepth );
}
// decode CU mode and the partition size
if( !pcCU->getSlice()->isIntra())
{
m_pcEntropyDecoder->decodeSkipFlag( pcCU, uiAbsPartIdx, uiDepth );
}
if( pcCU->isSkipped(uiAbsPartIdx) )
{
m_ppcCU[uiDepth]->copyInterPredInfoFrom( pcCU, uiAbsPartIdx, REF_PIC_LIST_0 );
m_ppcCU[uiDepth]->copyInterPredInfoFrom( pcCU, uiAbsPartIdx, REF_PIC_LIST_1 );
TComMvField cMvFieldNeighbours[MRG_MAX_NUM_CANDS << 1]; // double length for mv of both lists
UChar uhInterDirNeighbours[MRG_MAX_NUM_CANDS];
Int numValidMergeCand = 0;
for( UInt ui = 0; ui < m_ppcCU[uiDepth]->getSlice()->getMaxNumMergeCand(); ++ui )
{
uhInterDirNeighbours[ui] = 0;
}
m_pcEntropyDecoder->decodeMergeIndex( pcCU, 0, uiAbsPartIdx, uiDepth );
UInt uiMergeIndex = pcCU->getMergeIndex(uiAbsPartIdx);
m_ppcCU[uiDepth]->getInterMergeCandidates( 0, 0, cMvFieldNeighbours, uhInterDirNeighbours, numValidMergeCand, uiMergeIndex );
pcCU->setInterDirSubParts( uhInterDirNeighbours[uiMergeIndex], uiAbsPartIdx, 0, uiDepth );
TComMv cTmpMv( 0, 0 );
for ( UInt uiRefListIdx = 0; uiRefListIdx < 2; uiRefListIdx++ )
{
if ( pcCU->getSlice()->getNumRefIdx( RefPicList( uiRefListIdx ) ) > 0 )
{
pcCU->setMVPIdxSubParts( 0, RefPicList( uiRefListIdx ), uiAbsPartIdx, 0, uiDepth);
pcCU->setMVPNumSubParts( 0, RefPicList( uiRefListIdx ), uiAbsPartIdx, 0, uiDepth);
pcCU->getCUMvField( RefPicList( uiRefListIdx ) )->setAllMvd( cTmpMv, SIZE_2Nx2N, uiAbsPartIdx, uiDepth );
pcCU->getCUMvField( RefPicList( uiRefListIdx ) )->setAllMvField( cMvFieldNeighbours[ 2*uiMergeIndex + uiRefListIdx ], SIZE_2Nx2N, uiAbsPartIdx, uiDepth );
}
}
xFinishDecodeCU( pcCU, uiAbsPartIdx, uiDepth, ruiIsLast );
return;
}
m_pcEntropyDecoder->decodePredMode( pcCU, uiAbsPartIdx, uiDepth );
m_pcEntropyDecoder->decodePartSize( pcCU, uiAbsPartIdx, uiDepth );
if (pcCU->isIntra( uiAbsPartIdx ) && pcCU->getPartitionSize( uiAbsPartIdx ) == SIZE_2Nx2N )
{
m_pcEntropyDecoder->decodeIPCMInfo( pcCU, uiAbsPartIdx, uiDepth );
if(pcCU->getIPCMFlag(uiAbsPartIdx))
{
xFinishDecodeCU( pcCU, uiAbsPartIdx, uiDepth, ruiIsLast );
return;
}
}
UInt uiCurrWidth = pcCU->getWidth ( uiAbsPartIdx );
UInt uiCurrHeight = pcCU->getHeight( uiAbsPartIdx );
// prediction mode ( Intra : direction mode, Inter : Mv, reference idx )
m_pcEntropyDecoder->decodePredInfo( pcCU, uiAbsPartIdx, uiDepth, m_ppcCU[uiDepth]);
// Coefficient decoding
Bool bCodeDQP = getdQPFlag();
m_pcEntropyDecoder->decodeCoeff( pcCU, uiAbsPartIdx, uiDepth, uiCurrWidth, uiCurrHeight, bCodeDQP );
setdQPFlag( bCodeDQP );
xFinishDecodeCU( pcCU, uiAbsPartIdx, uiDepth, ruiIsLast );
}
TDecEntropy::decodeSplitFlag ( TComDataCU* pcCU, UInt uiAbsPartIdx, UInt uiDepth )函数调用m_pcEntropyDecoderIf->parseSplitFlag( pcCU, uiAbsPartIdx, uiDepth )来解析 split_cu_flag[x0][y0]的值。在这个过程中,由于规定了最大的CUDepth为4,所以只进行了4次分割便返回。其后,将处理coding block数据。