| /*! |
| * \copy |
| * Copyright (c) 2013, Cisco Systems |
| * All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * |
| * * Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * |
| * * Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in |
| * the documentation and/or other materials provided with the |
| * distribution. |
| * |
| * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS |
| * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE |
| * COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, |
| * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, |
| * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |
| * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER |
| * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT |
| * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN |
| * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
| * POSSIBILITY OF SUCH DAMAGE. |
| * |
| */ |
| |
| #include "vaacalculation.h" |
| #include "cpu.h" |
| |
| WELSVP_NAMESPACE_BEGIN |
| |
| |
| /////////////////////////////////////////////////////////////////////////////////////////////////////////////// |
| |
| CVAACalculation::CVAACalculation (int32_t iCpuFlag) { |
| m_iCPUFlag = iCpuFlag; |
| m_eMethod = METHOD_VAA_STATISTICS; |
| |
| WelsMemset (&m_sCalcParam, 0, sizeof (m_sCalcParam)); |
| WelsMemset (&m_sVaaFuncs, 0, sizeof (m_sVaaFuncs)); |
| InitVaaFuncs (m_sVaaFuncs, m_iCPUFlag); |
| } |
| |
| CVAACalculation::~CVAACalculation() { |
| } |
| |
| void CVAACalculation::InitVaaFuncs (SVaaFuncs& sVaaFuncs, int32_t iCpuFlag) { |
| sVaaFuncs.pfVAACalcSad = VAACalcSad_c; |
| sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_c; |
| sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_c; |
| sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_c; |
| sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_c; |
| #ifdef X86_ASM |
| if ((iCpuFlag & WELS_CPU_SSE2) == WELS_CPU_SSE2) { |
| sVaaFuncs.pfVAACalcSad = VAACalcSad_sse2; |
| sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_sse2; |
| sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_sse2; |
| sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_sse2; |
| sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_sse2; |
| } |
| #endif//X86_ASM |
| #ifdef HAVE_NEON |
| if ((iCpuFlag & WELS_CPU_NEON) == WELS_CPU_NEON) { |
| sVaaFuncs.pfVAACalcSad = VAACalcSad_neon; |
| sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_neon; |
| sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_neon; |
| sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_neon; |
| sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_neon; |
| } |
| #endif//HAVE_NEON |
| |
| #ifdef HAVE_NEON_AARCH64 |
| if ((iCpuFlag & WELS_CPU_NEON) == WELS_CPU_NEON) { |
| sVaaFuncs.pfVAACalcSad = VAACalcSad_AArch64_neon; |
| sVaaFuncs.pfVAACalcSadBgd = VAACalcSadBgd_AArch64_neon; |
| sVaaFuncs.pfVAACalcSadSsd = VAACalcSadSsd_AArch64_neon; |
| sVaaFuncs.pfVAACalcSadSsdBgd = VAACalcSadSsdBgd_AArch64_neon; |
| sVaaFuncs.pfVAACalcSadVar = VAACalcSadVar_AArch64_neon; |
| } |
| #endif//HAVE_NEON_AARCH64 |
| } |
| |
| EResult CVAACalculation::Process (int32_t iType, SPixMap* pSrcPixMap, SPixMap* pRefPixMap) { |
| uint8_t* pCurData = (uint8_t*)pSrcPixMap->pPixel[0]; |
| uint8_t* pRefData = (uint8_t*)pRefPixMap->pPixel[0]; |
| int32_t iPicWidth = pSrcPixMap->sRect.iRectWidth; |
| int32_t iPicHeight = pSrcPixMap->sRect.iRectHeight; |
| int32_t iPicStride = pSrcPixMap->iStride[0]; |
| |
| SVAACalcResult* pResult = m_sCalcParam.pCalcResult; |
| |
| if (pCurData == NULL || pRefData == NULL) { |
| return RET_INVALIDPARAM; |
| } |
| |
| pResult->pCurY = pCurData; |
| pResult->pRefY = pRefData; |
| if (m_sCalcParam.iCalcBgd) { |
| if (m_sCalcParam.iCalcSsd) { |
| m_sVaaFuncs.pfVAACalcSadSsdBgd (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, |
| (int32_t*)pResult->pSad8x8, pResult->pSum16x16, pResult->pSumOfSquare16x16, pResult->pSsd16x16, |
| (int32_t*)pResult->pSumOfDiff8x8, (uint8_t*)pResult->pMad8x8); |
| } else { |
| m_sVaaFuncs.pfVAACalcSadBgd (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, |
| (int32_t*) (pResult->pSad8x8), (int32_t*) (pResult->pSumOfDiff8x8), (uint8_t*)pResult->pMad8x8); |
| } |
| } else { |
| if (m_sCalcParam.iCalcSsd) { |
| m_sVaaFuncs.pfVAACalcSadSsd (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, |
| (int32_t*)pResult->pSad8x8, pResult->pSum16x16, pResult->pSumOfSquare16x16, pResult->pSsd16x16); |
| } else { |
| if (m_sCalcParam.iCalcVar) { |
| m_sVaaFuncs.pfVAACalcSadVar (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, |
| (int32_t*)pResult->pSad8x8, pResult->pSum16x16, pResult->pSumOfSquare16x16); |
| } else { |
| m_sVaaFuncs.pfVAACalcSad (pCurData, pRefData, iPicWidth, iPicHeight, iPicStride, &pResult->iFrameSad, |
| (int32_t*)pResult->pSad8x8); |
| } |
| } |
| } |
| |
| return RET_SUCCESS; |
| } |
| |
| EResult CVAACalculation::Set (int32_t iType, void* pParam) { |
| if (pParam == NULL || ((SVAACalcParam*)pParam)->pCalcResult == NULL) { |
| return RET_INVALIDPARAM; |
| } |
| |
| m_sCalcParam = * (SVAACalcParam*)pParam; |
| |
| return RET_SUCCESS; |
| } |
| |
| |
| WELSVP_NAMESPACE_END |