ref: bc3c63c4319949a9da0257d4a195de43987a5db5
dir: /codec/encoder/core/src/svc_motion_estimate.cpp/
/*! * \copy * Copyright (c) 2009-2013, Cisco Systems * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * * * Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * * Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in * the documentation and/or other materials provided with the * distribution. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE * COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. * * * \file svc motion estimate.c * * \brief Interfaces introduced in svc mb motion estimation * * \date 08/11/2009 Created * ************************************************************************************* */ #include <stdlib.h> #include <stdio.h> #include <string.h> #include "svc_motion_estimate.h" #include "svc_enc_golomb.h" #include "macros.h" #include "sample.h" #include "array_stack_align.h" #include "cpu_core.h" // WELS_CPU_SSE41 namespace WelsSVCEnc { /*! * \brief BL mb motion estimate search * * \param enc Wels encoder context * \param pMe Wels me information * * \return NONE */ void WelsMotionEstimateSearchSatd (SWelsFuncPtrList *pFuncList, void* pLplayer, void* pLpme, void* pLpslice) { SDqLayer* pCurDqLayer = (SDqLayer *)pLplayer; SWelsME* pMe = (SWelsME *)pLpme; SSlice* pSlice = (SSlice *)pLpslice; int32_t iStrideEnc = pCurDqLayer->iEncStride[0]; int32_t iStrideRef = pCurDqLayer->pRefPic->iLineSize[0]; // Step 1: Initial point prediction WelsMotionEstimateInitialPoint ( pFuncList, pMe, pSlice, iStrideEnc, iStrideRef ); pMe->uSadPredISatd.uiSatd = pFuncList->sSampleDealingFuncs.pfSampleSatd[pMe->uiPixel]( pMe->pEncMb, iStrideEnc, pMe->pRefMb, iStrideRef ); pMe->uiSatdCost = pMe->uSadPredISatd.uiSatd + COST_MVD(pMe->pMvdCost, pMe->sMv.iMvX - pMe->sMvp.iMvX, pMe->sMv.iMvY - pMe->sMvp.iMvY); } void WelsMotionEstimateSearchSad (SWelsFuncPtrList *pFuncList, void* pLplayer, void* pLpme, void* pLpslice) { SDqLayer* pCurDqLayer = (SDqLayer *)pLplayer; SWelsME* pMe = (SWelsME *)pLpme; SSlice* slice = (SSlice *)pLpslice; int32_t iStrideEnc = pCurDqLayer->iEncStride[0]; int32_t iStrideRef = pCurDqLayer->pRefPic->iLineSize[0]; // Step 1: Initial point prediction WelsMotionEstimateInitialPoint ( pFuncList, pMe, slice, iStrideEnc, iStrideRef ); } /*! * \brief EL mb motion estimate initial point testing * * \param pix_pFuncList SSampleDealingFunc * \param pMe Wels me information * \param mv_range search range in motion estimate * \param point the best match point in motion estimation * * \return NONE */ void WelsMotionEstimateInitialPoint(SWelsFuncPtrList *pFuncList, SWelsME * pMe, SSlice *pSlice, int32_t iStrideEnc, int32_t iStrideRef ) { PSampleSadSatdCostFunc pSad = pFuncList->sSampleDealingFuncs.pfSampleSad[pMe->uiPixel]; const uint16_t *kpMvdCost = pMe->pMvdCost; uint8_t* const kpEncMb = pMe->pEncMb; int16_t iMvc0, iMvc1; int32_t iSadCost; int32_t iBestSadCost; uint8_t *pRefMb; uint8_t *pFref2; uint32_t i; const uint32_t kuiMvcNum = pSlice->uiMvcNum; const SMVUnitXY *kpMvcList = &pSlice->sMvc[0]; const SMVUnitXY ksMvMin = pSlice->sMvMin; const SMVUnitXY ksMvMax = pSlice->sMvMax; const SMVUnitXY ksMvp = pMe->sMvp; SMVUnitXY sMv; // Step 1: Initial point prediction // init with sMvp sMv.iMvX = WELS_CLIP3( (2 + ksMvp.iMvX) >> 2, ksMvMin.iMvX, ksMvMax.iMvX ); sMv.iMvY = WELS_CLIP3( (2 + ksMvp.iMvY) >> 2, ksMvMin.iMvY, ksMvMax.iMvY ); pRefMb = &pMe->pRefMb[sMv.iMvY * iStrideRef + sMv.iMvX]; iBestSadCost = pSad( kpEncMb, iStrideEnc, pRefMb, iStrideRef ); iBestSadCost += COST_MVD(kpMvdCost, ((sMv.iMvX)<<2) - ksMvp.iMvX, ((sMv.iMvY)<<2) - ksMvp.iMvY); for (i = 0; i < kuiMvcNum; i++) { //clipping here is essential since some pOut-of-range MVC may happen here (i.e., refer to baseMV) iMvc0 = WELS_CLIP3( ( 2 + kpMvcList[i].iMvX ) >> 2, ksMvMin.iMvX, ksMvMax.iMvX ); iMvc1 = WELS_CLIP3( ( 2 + kpMvcList[i].iMvY ) >> 2, ksMvMin.iMvY, ksMvMax.iMvY ); if( ((iMvc0-sMv.iMvX) || (iMvc1-sMv.iMvY)) ) { pFref2 = &pMe->pRefMb[iMvc1*iStrideRef+iMvc0]; iSadCost = pSad( kpEncMb, iStrideEnc, pFref2, iStrideRef ) + COST_MVD(kpMvdCost, (iMvc0<<2) - ksMvp.iMvX, (iMvc1<<2) - ksMvp.iMvY); if( iSadCost < iBestSadCost ) { sMv.iMvX = iMvc0; sMv.iMvY = iMvc1; pRefMb = pFref2; iBestSadCost = iSadCost; } } } pMe->sMv = sMv; pMe->uiSadCost = iBestSadCost; if ( iBestSadCost < pMe->uSadPredISatd.uiSadPred ) { // Step 2: Initial early Stop /* -> qpel mv */ pMe->sMv.iMvX <<= 2; pMe->sMv.iMvY <<= 2; /* -> pRef */ pMe->pRefMb = pRefMb; /* compute the real cost */ pMe->uiSatdCost = iBestSadCost; } else { // Step 3: Fast search pattern WelsMotionEstimateIterativeSearch ( pFuncList, pMe, iStrideEnc, iStrideRef, pRefMb ); } } bool_t WelsMeSadCostSelect( int32_t *iSadCost, const uint16_t *kpMvdCost, int32_t *pBestCost, const int32_t kiDx, const int32_t kiDy, int32_t *pIx, int32_t *pIy) { int32_t iTempSadCost[4]; int32_t iInputSadCost=*pBestCost; iTempSadCost[0] = iSadCost[0]+COST_MVD(kpMvdCost, kiDx, kiDy - 4); iTempSadCost[1] = iSadCost[1]+COST_MVD(kpMvdCost, kiDx, kiDy + 4); iTempSadCost[2] = iSadCost[2]+COST_MVD(kpMvdCost, kiDx - 4, kiDy); iTempSadCost[3] = iSadCost[3]+COST_MVD(kpMvdCost, kiDx + 4, kiDy); if (iTempSadCost[0]<*pBestCost) { *pBestCost = iTempSadCost[0]; *pIx = 0; *pIy = 1; } if (iTempSadCost[1]<*pBestCost) { *pBestCost = iTempSadCost[1]; *pIx = 0; *pIy = -1; } if (iTempSadCost[2]<*pBestCost) { *pBestCost = iTempSadCost[2]; *pIx = 1; *pIy = 0; } if (iTempSadCost[3]<*pBestCost) { *pBestCost = iTempSadCost[3]; *pIx = -1; *pIy = 0; } return (*pBestCost==iInputSadCost); } void WelsMotionEstimateIterativeSearch( SWelsFuncPtrList *pFuncList, SWelsME *pMe, const int32_t kiStrideEnc, const int32_t kiStrideRef, uint8_t *pFref ) { PSample4SadCostFunc pSad = pFuncList->sSampleDealingFuncs.pfSample4Sad[pMe->uiPixel]; uint8_t* const kpEncMb = pMe->pEncMb; const uint16_t *kpMvdCost = pMe->pMvdCost; int32_t iMvDx = ((pMe->sMv.iMvX)<<2) - pMe->sMvp.iMvX; int32_t iMvDy = ((pMe->sMv.iMvY)<<2) - pMe->sMvp.iMvY; uint8_t *pRefMb = pFref; int32_t iBestCost = (pMe->uiSadCost); int32_t iTimeThreshold = ITERATIVE_TIMES; ENFORCE_STACK_ALIGN_1D(int32_t, iSadCosts, 4, 16) while(iTimeThreshold--) { pSad( kpEncMb,kiStrideEnc,pRefMb,kiStrideRef,&iSadCosts[0] ); int32_t iX,iY; const bool_t kbIsBestCostWorse = WelsMeSadCostSelect( iSadCosts, kpMvdCost, &iBestCost,iMvDx, iMvDy,&iX,&iY ); if (kbIsBestCostWorse) break; iMvDx -= iX<<2 ; iMvDy -= iY<<2 ; pRefMb -= (iX+iY*kiStrideRef); } /* -> qpel mv */ pMe->sMv.iMvX = (iMvDx + pMe->sMvp.iMvX) & 0xFFFC; pMe->sMv.iMvY = (iMvDy + pMe->sMvp.iMvY) & 0xFFFC; pMe->uiSatdCost = pMe->uiSadCost = (iBestCost); pMe->pRefMb = pRefMb; } } // namespace WelsSVCEnc