解析完成条带头之后下一步的工作是解析条带数据slice_segment_data。slice_segment_data数据主要由一个个的Coding_Tree_Unit(CTU)组成。每一个CTU的结构如下所示:
coding_tree_unit( ) { xCtb = ( CtbAddrInRs % PicWidthInCtbsY ) << CtbLog2SizeY yCtb = ( CtbAddrInRs / PicWidthInCtbsY ) << CtbLog2SizeY if( slice_sao_luma_flag | | slice_sao_chroma_flag ) sao( xCtb >> CtbLog2SizeY, yCtb >> CtbLog2SizeY ) coding_quadtree( xCtb, yCtb, CtbLog2SizeY, 0 ) }
可以看出,每一个CTU的coding_quadtree部分之前是语法结构sao。那么现在来研究一下如何从码流中解码出sao,这里着重讨论cabac而非sao的意义。
对sao的解析部分在TDecSlice::decompressSlice()中。在真正开始解码之前,TDecSlice::decompressSlice()调用了m_pcEntropyDecoderIf->resetEntropy(p)函数进行熵解码器的一些初始化操作,如为不同语法元素进行initBuffer。在最后,调用了m_pcTDecBinIf->start()函数。该函数读出了码流中的前两个字节组成一个UInt16的数字赋给m_uiValue。
TDecBinCABAC::start() { assert( m_pcTComBitstream->getNumBitsUntilByteAligned() == 0 ); m_uiRange = 510; m_bitsNeeded = -8; m_uiValue = (m_pcTComBitstream->readByte() << 8); m_uiValue |= m_pcTComBitstream->readByte(); }
以下是TDecSlice::decompressSlice()中sao的解析部分:
if ( pcSlice->getSPS()->getUseSAO() && (pcSlice->getSaoEnabledFlag()||pcSlice->getSaoEnabledFlagChroma()) )
{
SAOParam *saoParam = rpcPic->getPicSym()->getSaoParam();
saoParam->bSaoFlag[0] = pcSlice->getSaoEnabledFlag();
if (iCUAddr == iStartCUAddr)
{
saoParam->bSaoFlag[1] = pcSlice->getSaoEnabledFlagChroma();
}
Int numCuInWidth = saoParam->numCuInWidth;
Int cuAddrInSlice = iCUAddr - rpcPic->getPicSym()->getCUOrderMap(pcSlice->getSliceCurStartCUAddr()/rpcPic->getNumPartInCU());
Int cuAddrUpInSlice = cuAddrInSlice - numCuInWidth;
Int rx = iCUAddr % numCuInWidth;
Int ry = iCUAddr / numCuInWidth;
Int allowMergeLeft = 1;
Int allowMergeUp = 1;
if (rx!=0)
{
if (rpcPic->getPicSym()->getTileIdxMap(iCUAddr-1) != rpcPic->getPicSym()->getTileIdxMap(iCUAddr))
{
allowMergeLeft = 0;
}
}
if (ry!=0)
{
if (rpcPic->getPicSym()->getTileIdxMap(iCUAddr-numCuInWidth) != rpcPic->getPicSym()->getTileIdxMap(iCUAddr))
{
allowMergeUp = 0;
}
}
pcSbacDecoder->parseSaoOneLcuInterleaving(rx, ry, saoParam,pcCU, cuAddrInSlice, cuAddrUpInSlice, allowMergeLeft, allowMergeUp);
}
else if ( pcSlice->getSPS()->getUseSAO() )
{
Int addr = pcCU->getAddr();
SAOParam *saoParam = rpcPic->getPicSym()->getSaoParam();
for (Int cIdx=0; cIdx<3; cIdx++)
{
SaoLcuParam *saoLcuParam = &(saoParam->saoLcuParam[cIdx][addr]);
if ( ((cIdx == 0) && !pcSlice->getSaoEnabledFlag()) || ((cIdx == 1 || cIdx == 2) && !pcSlice->getSaoEnabledFlagChroma()))
{
saoLcuParam->mergeUpFlag = 0;
saoLcuParam->mergeLeftFlag = 0;
saoLcuParam->subTypeIdx = 0;
saoLcuParam->typeIdx = -1;
saoLcuParam->offset[0] = 0;
saoLcuParam->offset[1] = 0;
saoLcuParam->offset[2] = 0;
saoLcuParam->offset[3] = 0;
}
}
}
Void TDecSbac::parseSaoOneLcuInterleaving(Int rx, Int ry, SAOParam* pSaoParam, TComDataCU* pcCU, Int iCUAddrInSlice, Int iCUAddrUpInSlice, Int allowMergeLeft, Int allowMergeUp) { Int iAddr = pcCU->getAddr(); UInt uiSymbol; for (Int iCompIdx=0; iCompIdx<3; iCompIdx++) { pSaoParam->saoLcuParam[iCompIdx][iAddr].mergeUpFlag = 0; pSaoParam->saoLcuParam[iCompIdx][iAddr].mergeLeftFlag = 0; pSaoParam->saoLcuParam[iCompIdx][iAddr].subTypeIdx = 0; pSaoParam->saoLcuParam[iCompIdx][iAddr].typeIdx = -1; pSaoParam->saoLcuParam[iCompIdx][iAddr].offset[0] = 0; pSaoParam->saoLcuParam[iCompIdx][iAddr].offset[1] = 0; pSaoParam->saoLcuParam[iCompIdx][iAddr].offset[2] = 0; pSaoParam->saoLcuParam[iCompIdx][iAddr].offset[3] = 0; } if (pSaoParam->bSaoFlag[0] || pSaoParam->bSaoFlag[1] ) { if (rx>0 && iCUAddrInSlice!=0 && allowMergeLeft) { parseSaoMerge(uiSymbol); pSaoParam->saoLcuParam[0][iAddr].mergeLeftFlag = (Bool)uiSymbol; } if (pSaoParam->saoLcuParam[0][iAddr].mergeLeftFlag==0) { if ((ry > 0) && (iCUAddrUpInSlice>=0) && allowMergeUp) { parseSaoMerge(uiSymbol); pSaoParam->saoLcuParam[0][iAddr].mergeUpFlag = (Bool)uiSymbol; } } } for (Int iCompIdx=0; iCompIdx<3; iCompIdx++) { if ((iCompIdx == 0 && pSaoParam->bSaoFlag[0]) || (iCompIdx > 0 && pSaoParam->bSaoFlag[1]) ) { if (rx>0 && iCUAddrInSlice!=0 && allowMergeLeft) { pSaoParam->saoLcuParam[iCompIdx][iAddr].mergeLeftFlag = pSaoParam->saoLcuParam[0][iAddr].mergeLeftFlag; } else { pSaoParam->saoLcuParam[iCompIdx][iAddr].mergeLeftFlag = 0; } if (pSaoParam->saoLcuParam[iCompIdx][iAddr].mergeLeftFlag==0) { if ((ry > 0) && (iCUAddrUpInSlice>=0) && allowMergeUp) { pSaoParam->saoLcuParam[iCompIdx][iAddr].mergeUpFlag = pSaoParam->saoLcuParam[0][iAddr].mergeUpFlag; } else { pSaoParam->saoLcuParam[iCompIdx][iAddr].mergeUpFlag = 0; } if (!pSaoParam->saoLcuParam[iCompIdx][iAddr].mergeUpFlag) { pSaoParam->saoLcuParam[2][iAddr].typeIdx = pSaoParam->saoLcuParam[1][iAddr].typeIdx; parseSaoOffset(&(pSaoParam->saoLcuParam[iCompIdx][iAddr]), iCompIdx); } else { copySaoOneLcuParam(&pSaoParam->saoLcuParam[iCompIdx][iAddr], &pSaoParam->saoLcuParam[iCompIdx][iAddr-pSaoParam->numCuInWidth]); } } else { copySaoOneLcuParam(&pSaoParam->saoLcuParam[iCompIdx][iAddr], &pSaoParam->saoLcuParam[iCompIdx][iAddr-1]); } } else { pSaoParam->saoLcuParam[iCompIdx][iAddr].typeIdx = -1; pSaoParam->saoLcuParam[iCompIdx][iAddr].subTypeIdx = 0; } } }
Void TDecSbac::parseSaoOffset(SaoLcuParam* psSaoLcuParam, UInt compIdx) { UInt uiSymbol; static Int iTypeLength[MAX_NUM_SAO_TYPE] = { SAO_EO_LEN, SAO_EO_LEN, SAO_EO_LEN, SAO_EO_LEN, SAO_BO_LEN }; if (compIdx==2) { uiSymbol = (UInt)( psSaoLcuParam->typeIdx + 1); } else { parseSaoTypeIdx(uiSymbol); } psSaoLcuParam->typeIdx = (Int)uiSymbol - 1; if (uiSymbol) { psSaoLcuParam->length = iTypeLength[psSaoLcuParam->typeIdx]; Int bitDepth = compIdx ? g_bitDepthC : g_bitDepthY; Int offsetTh = 1 << min(bitDepth - 5,5); if( psSaoLcuParam->typeIdx == SAO_BO ) { for(Int i=0; i< psSaoLcuParam->length; i++) { parseSaoMaxUvlc(uiSymbol, offsetTh -1 ); psSaoLcuParam->offset[i] = uiSymbol; } for(Int i=0; i< psSaoLcuParam->length; i++) { if (psSaoLcuParam->offset[i] != 0) { m_pcTDecBinIf->decodeBinEP ( uiSymbol); if (uiSymbol) { psSaoLcuParam->offset[i] = -psSaoLcuParam->offset[i] ; } } } parseSaoUflc(5, uiSymbol ); psSaoLcuParam->subTypeIdx = uiSymbol; } else if( psSaoLcuParam->typeIdx < 4 ) { parseSaoMaxUvlc(uiSymbol, offsetTh -1 ); psSaoLcuParam->offset[0] = uiSymbol; parseSaoMaxUvlc(uiSymbol, offsetTh -1 ); psSaoLcuParam->offset[1] = uiSymbol; parseSaoMaxUvlc(uiSymbol, offsetTh -1 ); psSaoLcuParam->offset[2] = -(Int)uiSymbol; parseSaoMaxUvlc(uiSymbol, offsetTh -1 ); psSaoLcuParam->offset[3] = -(Int)uiSymbol; if (compIdx != 2) { parseSaoUflc(2, uiSymbol ); psSaoLcuParam->subTypeIdx = uiSymbol; psSaoLcuParam->typeIdx += psSaoLcuParam->subTypeIdx; } } } else { psSaoLcuParam->length = 0; } }
Void TDecSbac::parseSaoTypeIdx (UInt& ruiVal) { UInt uiCode; m_pcTDecBinIf->decodeBin( uiCode, m_cSaoTypeIdxSCModel.get( 0, 0, 0 ) ); if (uiCode == 0) { ruiVal = 0; } else { m_pcTDecBinIf->decodeBinEP( uiCode ); if (uiCode == 0) { ruiVal = 5; } else { ruiVal = 1; } } }
从parseSaoOneLcuInterleaving函数中可以看出,parseSaoOffset将会循环调用3次。在第二次调用中,我们的demo程序显示,parseSaoTypeIdx中uiCode返回值为1,因此,下面继续调用了decodeBinEP函数:
Void TDecBinCABAC::decodeBinEP( UInt& ruiBin ) { m_uiValue += m_uiValue; if ( ++m_bitsNeeded >= 0 ) { m_bitsNeeded = -8; m_uiValue += m_pcTComBitstream->readByte(); } ruiBin = 0; UInt scaledRange = m_uiRange << 7; if ( m_uiValue >= scaledRange ) { ruiBin = 1; m_uiValue -= scaledRange; } }
Void TDecSbac::parseSaoMaxUvlc ( UInt& val, UInt maxSymbol ) { if (maxSymbol == 0) { val = 0; return; } UInt code; Int i; m_pcTDecBinIf->decodeBinEP( code );//① if ( code == 0 ) { val = 0; return; } i=1; while (1) { m_pcTDecBinIf->decodeBinEP( code );//② if ( code == 0 ) { break; } i++; if (i == maxSymbol) { break; } } val = i; }
接下来,对第2~4个offset值,将各调用一次decodeBinEP,为1则取其负值。
调用parseSaoUflc(5, uiSymbol ),该函数调用了decodeBinsEP,该函数可以认为一次处理多位。实现如下:
Void TDecBinCABAC::decodeBinsEP( UInt& ruiBin, Int numBins ) { UInt bins = 0; while ( numBins > 8 ) { m_uiValue = ( m_uiValue << 8 ) + ( m_pcTComBitstream->readByte() << ( 8 + m_bitsNeeded ) ); UInt scaledRange = m_uiRange << 15; for ( Int i = 0; i < 8; i++ ) { bins += bins; scaledRange >>= 1; if ( m_uiValue >= scaledRange ) { bins++; m_uiValue -= scaledRange; } } numBins -= 8; } m_bitsNeeded += numBins; m_uiValue <<= numBins; if ( m_bitsNeeded >= 0 ) { m_uiValue += m_pcTComBitstream->readByte() << m_bitsNeeded; m_bitsNeeded -= 8; } UInt scaledRange = m_uiRange << ( numBins + 7 ); for ( Int i = 0; i < numBins; i++ ) { bins += bins; scaledRange >>= 1; if ( m_uiValue >= scaledRange ) { bins++; m_uiValue -= scaledRange; } } ruiBin = bins; }
自此,parseSaoOffset的任务便已完成。而类似的工作将循环三次以完成pcSbacDecoder->parseSaoOneLcuInterleaving的功能。
PS:跟踪了这么久的代码,但是现在的问题依然是知其然不知其所以然……看来接下来需要在标准文档和其他一些资料上面下些功夫了。