shithub: openh264

ref: a15ad8cc80773b251f88798e364668cc175c0738
dir: /codec/encoder/core/src/encoder.cpp/

View raw version
/*!
 * \copy
 *     Copyright (c)  2009-2013, Cisco Systems
 *     All rights reserved.
 *
 *     Redistribution and use in source and binary forms, with or without
 *     modification, are permitted provided that the following conditions
 *     are met:
 *
 *        * Redistributions of source code must retain the above copyright
 *          notice, this list of conditions and the following disclaimer.
 *
 *        * Redistributions in binary form must reproduce the above copyright
 *          notice, this list of conditions and the following disclaimer in
 *          the documentation and/or other materials provided with the
 *          distribution.
 *
 *     THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 *     "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 *     LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 *     FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
 *     COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
 *     INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
 *     BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 *     LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 *     CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 *     LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
 *     ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 *     POSSIBILITY OF SUCH DAMAGE.
 *
 *
 * \file	encoder.c
 *
 * \brief	core encoder
 *
 * \date	5/14/2009 Created
 *
 *************************************************************************************
 */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <assert.h>
#include "encoder.h"
#include "extern.h"
#include "cpu.h"
#include "cpu_core.h"
#include "utils.h"

#include "encode_mb_aux.h"
#include "decode_mb_aux.h"
#include "get_intra_predictor.h"
#include "svc_encode_mb.h"

#include "deblocking.h"
#include "expand_pic.h"

#include "mc.h"
#include "sample.h"

#include "svc_encode_slice.h"
#include "svc_base_layer_md.h"
#include "svc_mode_decision.h"
#include "set_mb_syn_cavlc.h"
#include "crt_util_safe_x.h"	// Safe CRT routines like utils for cross_platforms
#include "codec_def.h"
#ifdef MT_ENABLED
#include "slice_multi_threading.h"
#endif//MT_ENABLED

//  global   function  pointers  definition
namespace WelsSVCEnc {
/* Motion compensation */


/*!
 * \brief	initialize source picture body
 * \param	pSrc		SSourcePicture*
 * \param	csp		internal csp format
 * \param	iWidth	widht of picture in pixels
 * \param	iHeight	iHeight of picture in pixels
 * \return	successful - 0; otherwise none 0 for failed
 */
int32_t InitPic( const void *kpSrc, const int32_t kiColorspace, const int32_t kiWidth, const int32_t kiHeight )
{
	SSourcePicture *pSrcPic = (SSourcePicture *)kpSrc;

	if ( NULL == pSrcPic || kiWidth == 0 || kiHeight == 0 )
		return 1;

	pSrcPic->iColorFormat	= kiColorspace;
	pSrcPic->iPicWidth		= kiWidth;
	pSrcPic->iPicHeight		= kiHeight;
	
	switch( kiColorspace & (~videoFormatVFlip) ) {
	case videoFormatI420:
	case videoFormatYV12:
		pSrcPic->pData[0]	= NULL;
		pSrcPic->pData[1]	= NULL;
		pSrcPic->pData[2]	= NULL;
		pSrcPic->pData[3]	= NULL;
		pSrcPic->iStride[0]	= kiWidth;
		pSrcPic->iStride[2]	= pSrcPic->iStride[1] = kiWidth >> 1;
		pSrcPic->iStride[3]	= 0;
		break;	
	case videoFormatYUY2:
	case videoFormatYVYU:
	case videoFormatUYVY:
		pSrcPic->pData[0]	= NULL;
		pSrcPic->pData[1]	= NULL;
		pSrcPic->pData[2]	= NULL;
		pSrcPic->pData[3]	= NULL;		
		pSrcPic->iStride[0]	= CALC_BI_STRIDE(kiWidth,  16);
		pSrcPic->iStride[3]	= pSrcPic->iStride[2] = pSrcPic->iStride[1] = 0;		
		break;
	case videoFormatRGB:
	case videoFormatBGR:
		pSrcPic->pData[0]	= NULL;
		pSrcPic->pData[1]	= NULL;
		pSrcPic->pData[2]	= NULL;
		pSrcPic->pData[3]	= NULL;		
		pSrcPic->iStride[0]	= CALC_BI_STRIDE(kiWidth, 24);
		pSrcPic->iStride[3]	= pSrcPic->iStride[2] = pSrcPic->iStride[1] = 0;
		if( kiColorspace & videoFormatVFlip )
			pSrcPic->iColorFormat = kiColorspace & (~videoFormatVFlip);
		else 
			pSrcPic->iColorFormat = kiColorspace | videoFormatVFlip;
		break;
	case videoFormatBGRA:
	case videoFormatRGBA:
	case videoFormatARGB:
	case videoFormatABGR:
		pSrcPic->pData[0]	= NULL;
		pSrcPic->pData[1]	= NULL;
		pSrcPic->pData[2]	= NULL;
		pSrcPic->pData[3]	= NULL;		
		pSrcPic->iStride[0]	= kiWidth << 2;
		pSrcPic->iStride[3]	= pSrcPic->iStride[2] = pSrcPic->iStride[1] = 0;	
		if( kiColorspace & videoFormatVFlip )
			pSrcPic->iColorFormat = kiColorspace & (~videoFormatVFlip);
		else 
			pSrcPic->iColorFormat = kiColorspace | videoFormatVFlip;
		break;
	default:
		return 2;	// any else?
	}

	return 0;
}


void WelsInitBGDFunc( SWelsFuncPtrList *pFuncList, const bool_t kbEnableBackgroundDetection )
{
	if ( kbEnableBackgroundDetection )
	{
		 pFuncList->pfInterMdBackgroundDecision = (PInterMdBackgroundDecisionFunc)WelsMdInterJudgeBGDPskip;
		 pFuncList->pfInterMdBackgroundInfoUpdate = (PInterMdBackgroundInfoUpdateFunc)WelsMdInterUpdateBGDInfo;
	}
	else
	{
		 pFuncList->pfInterMdBackgroundDecision = (PInterMdBackgroundDecisionFunc)WelsMdInterJudgeBGDPskipFalse;
		 pFuncList->pfInterMdBackgroundInfoUpdate = (PInterMdBackgroundInfoUpdateFunc)WelsMdInterUpdateBGDInfoNULL;
	}
}

/*!
 * \brief	initialize function pointers that potentially used in Wels encoding
 * \param	pEncCtx		sWelsEncCtx*
 * \return	successful - 0; otherwise none 0 for failed
 */
int32_t InitFunctionPointers( SWelsFuncPtrList *pFuncList, SWelsSvcCodingParam *pParam, uint32_t uiCpuFlag )
{	
	int32_t iReturn = 0;

	/* Functionality utilization of CPU instructions dependency */
	pFuncList->pfSetMemZeroSize8	= WelsSetMemZero_c;		// confirmed_safe_unsafe_usage
	pFuncList->pfSetMemZeroSize64Aligned16	= WelsSetMemZero_c;	// confirmed_safe_unsafe_usage
	pFuncList->pfSetMemZeroSize64	= WelsSetMemZero_c;	// confirmed_safe_unsafe_usage
#if defined(X86_ASM)
	if ( uiCpuFlag & WELS_CPU_MMXEXT )
	{		
		pFuncList->pfSetMemZeroSize8	= WelsSetMemZeroSize8_mmx;		// confirmed_safe_unsafe_usage
		pFuncList->pfSetMemZeroSize64Aligned16	= WelsSetMemZeroSize64_mmx;	// confirmed_safe_unsafe_usage
		pFuncList->pfSetMemZeroSize64	= WelsSetMemZeroSize64_mmx;	// confirmed_safe_unsafe_usage
	}
	if ( uiCpuFlag & WELS_CPU_SSE2 )
	{
		pFuncList->pfSetMemZeroSize64Aligned16	= WelsSetMemZeroAligned64_sse2;	// confirmed_safe_unsafe_usage
	}
#endif//X86_ASM

	InitExpandPictureFunc( pFuncList, uiCpuFlag );

	/* Intra_Prediction_fn*/	
	WelsInitFillingPredFuncs( uiCpuFlag );
	WelsInitIntraPredFuncs( pFuncList, uiCpuFlag );

	/* sad, satd, average */
	WelsInitSampleSadFunc(pFuncList, uiCpuFlag);

	//
	WelsInitBGDFunc(pFuncList, pParam->bEnableBackgroundDetection );
	// for pfGetVarianceFromIntraVaa function ptr adaptive by CPU features, 6/7/2010
	InitIntraAnalysisVaaInfo( pFuncList, uiCpuFlag );
	
	/* Motion compensation */
	/*init pixel average function*/
	/*get one column or row pixel when refinement*/
	WelsInitMcFuncs(pFuncList, uiCpuFlag);
	InitCoeffFunc( uiCpuFlag );

	WelsInitEncodingFuncs( pFuncList, uiCpuFlag );
	WelsInitReconstructionFuncs( pFuncList, uiCpuFlag );

	DeblockingInit( &pFuncList->pfDeblocking, uiCpuFlag );
	WelsBlockFuncInit( &pFuncList->pfSetNZCZero, uiCpuFlag );

	InitFillNeighborCacheInterFunc ( pFuncList, pParam->bEnableBackgroundDetection );

	return iReturn;
}

/*!
 * \brief	initialize frame coding	
 */
void InitFrameCoding( sWelsEncCtx *pEncCtx, const EFrameType keFrameType )
{
	// for bitstream writing
	pEncCtx->iPosBsBuffer		= 0;	// reset bs pBuffer position
	pEncCtx->pOut->iNalIndex		= 0;	// reset NAL index
	
	InitBits( &pEncCtx->pOut->sBsWrite, pEncCtx->pOut->pBsBuffer, pEncCtx->pOut->uiSize );

	if ( keFrameType == WELS_FRAME_TYPE_P )
	{
		if ( pEncCtx->pSvcParam->uiIntraPeriod )
		{
			++pEncCtx->iFrameIndex;
		}
		
		++pEncCtx->uiFrameIdxRc;

		if ( pEncCtx->iPOC < ( 1 << pEncCtx->pSps->iLog2MaxPocLsb ) - 2 ) // if iPOC type is no 0, this need be modification
			pEncCtx->iPOC			+= 2;	// for POC type 0
		else
			pEncCtx->iPOC = 0;
		
		if ( pEncCtx->eLastNalPriority != 0 )
		{
			if ( pEncCtx->iFrameNum < (1 << pEncCtx->pSps->uiLog2MaxFrameNum) - 1  )
				++ pEncCtx->iFrameNum;
			else
				pEncCtx->iFrameNum	= 0;	// if iFrameNum overflow
		}
		pEncCtx->eNalType		= NAL_UNIT_CODED_SLICE;
		pEncCtx->eSliceType	= P_SLICE;
		pEncCtx->eNalPriority	= NRI_PRI_HIGH;
	}
	else if ( keFrameType == WELS_FRAME_TYPE_IDR )
	{
		pEncCtx->iFrameNum		= 0;
		pEncCtx->iPOC			= 0;
		pEncCtx->bEncCurFrmAsIdrFlag = false;
		if ( pEncCtx->pSvcParam->uiIntraPeriod )
		{
			pEncCtx->iFrameIndex = 0;
		}		
		pEncCtx->uiFrameIdxRc = 0;

		pEncCtx->eNalType		= NAL_UNIT_CODED_SLICE_IDR;
		pEncCtx->eSliceType	= I_SLICE;
		pEncCtx->eNalPriority	= NRI_PRI_HIGHEST;

		pEncCtx->iCodingIndex	= 0;

		// reset_ref_list

		// rc_init_gop		
	}
	else if ( keFrameType == WELS_FRAME_TYPE_I )
	{
		if ( pEncCtx->iPOC < ( 1 << pEncCtx->pSps->iLog2MaxPocLsb ) - 2 ) // if iPOC type is no 0, this need be modification
			pEncCtx->iPOC			+= 2;	// for POC type 0
		else
			pEncCtx->iPOC = 0;
		
		if ( pEncCtx->eLastNalPriority != 0 )
		{
			if ( pEncCtx->iFrameNum < (1 << pEncCtx->pSps->uiLog2MaxFrameNum) - 1  )
				++ pEncCtx->iFrameNum;
			else
				pEncCtx->iFrameNum	= 0;	// if iFrameNum overflow
		}

		pEncCtx->eNalType		= NAL_UNIT_CODED_SLICE;
		pEncCtx->eSliceType	= I_SLICE;
		pEncCtx->eNalPriority	= NRI_PRI_HIGHEST;

		// rc_init_gop
	}
	else	// B pictures are not supported now, any else?
	{
		assert( 0 );
	}

#if defined(STAT_OUTPUT)
	memset( &pEncCtx->sPerInfo, 0, sizeof(SStatSliceInfo) );
#endif//FRAME_INFO_OUTPUT

#if defined(MT_ENABLED) && defined(PACKING_ONE_SLICE_PER_LAYER)
	if ( pEncCtx->pSvcParam->iMultipleThreadIdc > 1 )
		reset_env_mt( pEncCtx );
#endif
}

EFrameType DecideFrameType( sWelsEncCtx *pEncCtx, const int8_t kiSpatialNum )
{	
	SWelsSvcCodingParam *pSvcParam	= pEncCtx->pSvcParam;
	EFrameType iFrameType = WELS_FRAME_TYPE_AUTO;
	bool_t bSceneChangeFlag = false;
	
	// perform scene change detection	
	if ( (!pSvcParam->bEnableSceneChangeDetect) || pEncCtx->pVaa->bIdrPeriodFlag || 
		(kiSpatialNum < pSvcParam->iNumDependencyLayer) || (pEncCtx->uiFrameIdxRc < (VGOP_SIZE << 1)) ) // avoid too frequent I frame coding, rc control 
	{
		bSceneChangeFlag = false;
	}
	else
	{
		bSceneChangeFlag = pEncCtx->pVaa->bSceneChangeFlag;
	}

	//scene_changed_flag: RC enable && iSpatialNum == pSvcParam->iNumDependencyLayer 
	//bIdrPeriodFlag: RC disable || iSpatialNum != pSvcParam->iNumDependencyLayer
	//pEncCtx->bEncCurFrmAsIdrFlag: 1. first frame should be IDR; 2. idr pause; 3. idr request
	iFrameType = ( pEncCtx->pVaa->bIdrPeriodFlag || bSceneChangeFlag || pEncCtx->bEncCurFrmAsIdrFlag ) ? WELS_FRAME_TYPE_IDR : WELS_FRAME_TYPE_P;

	if (  WELS_FRAME_TYPE_P == iFrameType && pEncCtx->iSkipFrameFlag > 0 ) // for frame skip, 1/5/2010
	{
		-- pEncCtx->iSkipFrameFlag;
		iFrameType = WELS_FRAME_TYPE_SKIP;
	}
	else if ( WELS_FRAME_TYPE_IDR == iFrameType )
	{
		pEncCtx->iCodingIndex = 0;
	}

	return iFrameType;
}

/*!
 * \brief	Dump reconstruction for dependency layer
 */

extern "C" void DumpDependencyRec( SPicture *pCurPicture, const str_t *kpFileName, const int8_t kiDid )
{
	FILE *pDumpRecFile											= NULL;	
	static bool_t bDependencyRecFlag[MAX_DEPENDENCY_LAYER]	= {0};
	int32_t iWrittenSize											= 0;

	if ( NULL == pCurPicture || NULL == kpFileName || kiDid >= MAX_DEPENDENCY_LAYER )
		return;
	
	if ( bDependencyRecFlag[kiDid] )
	{
		if ( STRNLEN(kpFileName, MAX_FNAME_LEN) > 0 )	// confirmed_safe_unsafe_usage
#if defined(__GNUC__) || (defined(WIN32) && defined(_MSC_VER) && (_MSC_VER<1500))
			pDumpRecFile	= FOPEN( kpFileName, "ab" );
#elif defined(WIN32) && defined(_MSC_VER) && (_MSC_VER>=1500)	// vs2008
			FOPEN(&pDumpRecFile, kpFileName, "ab");
#endif//__GNUC__..
		else
		{
			str_t sDependencyRecFileName[16] = {0};			
#if defined(WIN32) && defined(_MSC_VER) && (_MSC_VER>=1500)	// vs2008
			SNPRINTF( sDependencyRecFileName, 16, 16, "rec%d.yuv", kiDid );	// confirmed_safe_unsafe_usage
			FOPEN( &pDumpRecFile, sDependencyRecFileName, "ab" );
#else
			SNPRINTF( sDependencyRecFileName, 16, "rec%d.yuv", kiDid );	// confirmed_safe_unsafe_usage
			pDumpRecFile	= FOPEN( sDependencyRecFileName, "ab" );
#endif//WIN32..
		}
		if ( NULL != pDumpRecFile)
			fseek( pDumpRecFile, 0, SEEK_END );
	}
	else
	{
		if ( STRNLEN(kpFileName, MAX_FNAME_LEN) > 0 )	// confirmed_safe_unsafe_usage
		{
#if defined(WIN32) && defined(_MSC_VER) && (_MSC_VER>=1500)	// vs2008
			FOPEN(&pDumpRecFile, kpFileName, "wb");
#else
			pDumpRecFile	= FOPEN( kpFileName, "wb" );
#endif//WIN32..
		}
		else
		{
			str_t sDependencyRecFileName[16] = {0};
#if defined(WIN32) && defined(_MSC_VER) && (_MSC_VER>=1500)	// vs2008
			SNPRINTF( sDependencyRecFileName, 16, 16, "rec%d.yuv", kiDid );	// confirmed_safe_unsafe_usage
			FOPEN(&pDumpRecFile, sDependencyRecFileName, "wb");
#else
			SNPRINTF( sDependencyRecFileName, 16, "rec%d.yuv", kiDid );	// confirmed_safe_unsafe_usage
			pDumpRecFile	= FOPEN( sDependencyRecFileName, "wb");
#endif//WIN32..
		}
		bDependencyRecFlag[kiDid]	= true;
	}

	if ( NULL != pDumpRecFile )
	{
		int32_t i = 0;
		int32_t j = 0;
		const int32_t kiStrideY	= pCurPicture->iLineSize[0];		
		const int32_t kiLumaWidth	= pCurPicture->iWidthInPixel;
		const int32_t kiLumaHeight	= pCurPicture->iHeightInPixel;
		const int32_t kiChromaWidth	= kiLumaWidth >> 1;
		const int32_t kiChromaHeight	= kiLumaHeight >> 1;		
		
		for( j = 0; j < kiLumaHeight; ++ j)
		{
			iWrittenSize = fwrite( &pCurPicture->pData[0][j*kiStrideY], 1, kiLumaWidth, pDumpRecFile );
			assert( iWrittenSize == kiLumaWidth );
			if ( iWrittenSize < kiLumaWidth )
			{
				assert( 0 );	// make no sense for us if writing failed
				fclose(pDumpRecFile);
				return;
			}
		}
		for( i = 1; i < I420_PLANES; ++ i)
		{
			const int32_t kiStrideUV = pCurPicture->iLineSize[i];			
			for ( j = 0; j < kiChromaHeight; ++ j)
			{
				iWrittenSize = fwrite( &pCurPicture->pData[i][j*kiStrideUV], 1, kiChromaWidth, pDumpRecFile );
				assert(iWrittenSize == kiChromaWidth );
				if ( iWrittenSize < kiChromaWidth )
				{
					assert( 0 );	// make no sense for us if writing failed
					fclose(pDumpRecFile);
					return;
				}
			}
		}
		fclose(pDumpRecFile);
		pDumpRecFile = NULL;
	}
}

/*!
 * \brief	Dump the reconstruction pictures
 */

void DumpRecFrame( SPicture *pCurPicture, const str_t *kpFileName )
{
	FILE *pDumpRecFile				= NULL;	
	static bool_t bRecFlag	= false;
	int32_t iWrittenSize			= 0;

	if ( NULL == pCurPicture || NULL == kpFileName )
		return;
	
	if ( bRecFlag )
	{
		if ( STRNLEN(kpFileName, MAX_FNAME_LEN) > 0 )	// confirmed_safe_unsafe_usage
		{
#if defined(WIN32) && defined(_MSC_VER) && (_MSC_VER>=1500)	// vs2008
			FOPEN(&pDumpRecFile, kpFileName, "ab");
#else
			pDumpRecFile	= FOPEN( kpFileName, "ab" );
#endif//WIN32
		}
		else
		{
#if defined(WIN32) && defined(_MSC_VER) && (_MSC_VER>=1500)	// vs2008
			FOPEN(&pDumpRecFile, "rec.yuv", "ab");
#else
			pDumpRecFile	= FOPEN( "rec.yuv", "ab" );
#endif//WIN32
		}
		if ( NULL != pDumpRecFile)
			fseek( pDumpRecFile, 0, SEEK_END );
	}
	else
	{
		if ( STRNLEN(kpFileName, MAX_FNAME_LEN) > 0 )	// confirmed_safe_unsafe_usage
		{
#if defined(WIN32) && defined(_MSC_VER) && (_MSC_VER>=1500)	// vs2008
			FOPEN(&pDumpRecFile, kpFileName, "wb");
#else
			pDumpRecFile	= FOPEN( kpFileName, "wb" );
#endif//WIN32
		}
		else
		{
#if defined(WIN32) && defined(_MSC_VER) && (_MSC_VER>=1500)	// vs2008
			FOPEN(&pDumpRecFile, "rec.yuv", "wb");
#else
			pDumpRecFile	= FOPEN( "rec.yuv", "wb");
#endif//WIN32..
		}
		bRecFlag	= true;
	}

	if ( NULL != pDumpRecFile )
	{
		int32_t i = 0;
		int32_t j = 0;
		const int32_t kiStrideY	= pCurPicture->iLineSize[0];		
		const int32_t kiLumaWidth	= pCurPicture->iWidthInPixel;
		const int32_t kiLumaHeight	= pCurPicture->iHeightInPixel;
		const int32_t kiChromaWidth	= kiLumaWidth >> 1;
		const int32_t kiChromaHeight	= kiLumaHeight >> 1;		
		
		for( j = 0; j < kiLumaHeight; ++ j)
		{
			iWrittenSize = fwrite( &pCurPicture->pData[0][j*kiStrideY], 1, kiLumaWidth, pDumpRecFile );
			assert( iWrittenSize == kiLumaWidth );
			if ( iWrittenSize < kiLumaWidth )
			{
				assert( 0 );	// make no sense for us if writing failed
				fclose(pDumpRecFile);
				return;
			}
		}
		for( i = 1; i < I420_PLANES; ++ i)
		{
			const int32_t kiStrideUV = pCurPicture->iLineSize[i];			
			for ( j = 0; j < kiChromaHeight; ++ j)
			{
				iWrittenSize = fwrite( &pCurPicture->pData[i][j*kiStrideUV], 1, kiChromaWidth, pDumpRecFile );
				assert(iWrittenSize == kiChromaWidth );
				if ( iWrittenSize < kiChromaWidth )
				{
					assert( 0 );	// make no sense for us if writing failed
					fclose(pDumpRecFile);
					return;
				}
			}
		}
		fclose(pDumpRecFile);
		pDumpRecFile = NULL;
	}
}



/***********************************************************************************/
void WelsSetMemZero_c(void *pDst, int32_t iSize)	// confirmed_safe_unsafe_usage
{
	memset(pDst, 0, iSize);
}
}