ref: 3d25c25aeafcf7c186ff449201ef7c061db00192
dir: /codec/processing/src/vaacalc/vaacalculation.cpp/
/*! * \copy * Copyright (c) 2013, Cisco Systems * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * * * Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * * Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in * the documentation and/or other materials provided with the * distribution. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE * COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. * */ #include "vaacalculation.h" #include "cpu.h" WELSVP_NAMESPACE_BEGIN /////////////////////////////////////////////////////////////////////////////////////////////////////////////// CVAACalculation::CVAACalculation (int32_t iCpuFlag) { m_iCPUFlag = iCpuFlag; m_eMethod = METHOD_VAA_STATISTICS; WelsMemset (&m_sCalcParam, 0, sizeof (m_sCalcParam)); WelsMemset (&m_sVaaFuncs, 0, sizeof (m_sVaaFuncs)); InitVaaFuncs (m_sVaaFuncs, m_iCPUFlag); } CVAACalculation::~CVAACalculation() { } void CVAACalculation::InitVaaFuncs (SVaaFuncs& sVaaFuncs, int32_t iCpuFlag) { sVaaFuncs.pfVAACalcSad = VAACalcSad_c; sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_c; sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_c; sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_c; sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_c; #ifdef X86_ASM if ((iCpuFlag & WELS_CPU_SSE2) == WELS_CPU_SSE2) { sVaaFuncs.pfVAACalcSad = VAACalcSad_sse2; sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_sse2; sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_sse2; sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_sse2; sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_sse2; } #ifdef HAVE_AVX2 if (iCpuFlag & WELS_CPU_AVX2) { sVaaFuncs.pfVAACalcSad = VAACalcSad_avx2; sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_avx2; sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_avx2; sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_avx2; sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_avx2; } #endif #endif//X86_ASM #ifdef HAVE_NEON if ((iCpuFlag & WELS_CPU_NEON) == WELS_CPU_NEON) { sVaaFuncs.pfVAACalcSad = VAACalcSad_neon; sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_neon; sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_neon; sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_neon; sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_neon; } #endif//HAVE_NEON #ifdef HAVE_NEON_AARCH64 if ((iCpuFlag & WELS_CPU_NEON) == WELS_CPU_NEON) { sVaaFuncs.pfVAACalcSad = VAACalcSad_AArch64_neon; sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_AArch64_neon; sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_AArch64_neon; sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_AArch64_neon; sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_AArch64_neon; } #endif//HAVE_NEON_AARCH64 } EResult CVAACalculation::Process (int32_t iType, SPixMap* pSrcPixMap, SPixMap* pRefPixMap) { uint8_t* pCurData = (uint8_t*)pSrcPixMap->pPixel[0]; uint8_t* pRefData = (uint8_t*)pRefPixMap->pPixel[0]; int32_t iPicWidth = pSrcPixMap->sRect.iRectWidth; int32_t iPicHeight = pSrcPixMap->sRect.iRectHeight; int32_t iPicStride = pSrcPixMap->iStride[0]; SVAACalcResult* pResult = m_sCalcParam.pCalcResult; if (pCurData == NULL || pRefData == NULL) { return RET_INVALIDPARAM; } pResult->pCurY = pCurData; pResult->pRefY = pRefData; if (m_sCalcParam.iCalcBgd) { if (m_sCalcParam.iCalcSsd) { m_sVaaFuncs.pfVAACalcSadSsdBgd (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, (int32_t*)pResult->pSad8x8, pResult->pSum16x16, pResult->pSumOfSquare16x16, pResult->pSsd16x16, (int32_t*)pResult->pSumOfDiff8x8, (uint8_t*)pResult->pMad8x8); } else { m_sVaaFuncs.pfVAACalcSadBgd (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, (int32_t*) (pResult->pSad8x8), (int32_t*) (pResult->pSumOfDiff8x8), (uint8_t*)pResult->pMad8x8); } } else { if (m_sCalcParam.iCalcSsd) { m_sVaaFuncs.pfVAACalcSadSsd (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, (int32_t*)pResult->pSad8x8, pResult->pSum16x16, pResult->pSumOfSquare16x16, pResult->pSsd16x16); } else { if (m_sCalcParam.iCalcVar) { m_sVaaFuncs.pfVAACalcSadVar (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, (int32_t*)pResult->pSad8x8, pResult->pSum16x16, pResult->pSumOfSquare16x16); } else { m_sVaaFuncs.pfVAACalcSad (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, (int32_t*)pResult->pSad8x8); } } } return RET_SUCCESS; } EResult CVAACalculation::Set (int32_t iType, void* pParam) { if (pParam == NULL || ((SVAACalcParam*)pParam)->pCalcResult == NULL) { return RET_INVALIDPARAM; } m_sCalcParam = * (SVAACalcParam*)pParam; return RET_SUCCESS; } WELSVP_NAMESPACE_END