shithub: openh264

ref: b4e1c41bcac77e7b60d80c7ad5ea21196e2fce9f
dir: /processing/src/downsample/downsample.cpp/

View raw version
/*!
 * \copy
 *     Copyright (c)  2013, Cisco Systems
 *     All rights reserved.
 *
 *     Redistribution and use in source and binary forms, with or without
 *     modification, are permitted provided that the following conditions
 *     are met:
 *
 *        * Redistributions of source code must retain the above copyright
 *          notice, this list of conditions and the following disclaimer.
 *
 *        * Redistributions in binary form must reproduce the above copyright
 *          notice, this list of conditions and the following disclaimer in
 *          the documentation and/or other materials provided with the
 *          distribution.
 *
 *     THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 *     "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 *     LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 *     FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
 *     COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
 *     INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
 *     BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 *     LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 *     CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 *     LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
 *     ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 *     POSSIBILITY OF SUCH DAMAGE.
 *
 */

#include "downsample.h"
#include "../common/cpu.h"

WELSVP_NAMESPACE_BEGIN


///////////////////////////////////////////////////////////////////////////////////////////////////////////////

CDownsampling::CDownsampling(int32_t iCpuFlag)
{
	m_iCPUFlag = iCpuFlag;
	m_eMethod   = METHOD_DOWNSAMPLE;
	WelsMemset(&m_pfDownsample, 0, sizeof(m_pfDownsample));
	InitDownsampleFuncs(m_pfDownsample, m_iCPUFlag);
}

CDownsampling::~CDownsampling()
{	
}

void CDownsampling::InitDownsampleFuncs(SDownsampleFuncs &sDownsampleFunc,  int32_t iCpuFlag)
{
	sDownsampleFunc.pfHalfAverage[0] = DyadicBilinearDownsampler_c;
	sDownsampleFunc.pfHalfAverage[1] = DyadicBilinearDownsampler_c;
	sDownsampleFunc.pfHalfAverage[2] = DyadicBilinearDownsampler_c;
	sDownsampleFunc.pfHalfAverage[3] = DyadicBilinearDownsampler_c;
	sDownsampleFunc.pfGeneralRatioChroma = GeneralBilinearAccurateDownsampler_c;
	sDownsampleFunc.pfGeneralRatioLuma	 = GeneralBilinearFastDownsampler_c;
#if defined(X86_ASM)
	if ( iCpuFlag & WELS_CPU_SSE )
	{
		sDownsampleFunc.pfHalfAverage[0]	= DyadicBilinearDownsamplerWidthx32_sse;
		sDownsampleFunc.pfHalfAverage[1]	= DyadicBilinearDownsamplerWidthx16_sse;
		sDownsampleFunc.pfHalfAverage[2]	= DyadicBilinearDownsamplerWidthx8_sse;
	}
	if ( iCpuFlag & WELS_CPU_SSE2 )
	{
		sDownsampleFunc.pfGeneralRatioChroma = GeneralBilinearAccurateDownsamplerWrap_sse2;
		sDownsampleFunc.pfGeneralRatioLuma   = GeneralBilinearFastDownsamplerWrap_sse2;
	}
	if ( iCpuFlag & WELS_CPU_SSSE3 )
	{
		sDownsampleFunc.pfHalfAverage[0]	= DyadicBilinearDownsamplerWidthx32_ssse3;
		sDownsampleFunc.pfHalfAverage[1]	= DyadicBilinearDownsamplerWidthx16_ssse3;
	}
	if ( iCpuFlag & WELS_CPU_SSE41 )
	{
		sDownsampleFunc.pfHalfAverage[0]	= DyadicBilinearDownsamplerWidthx32_sse4;
		sDownsampleFunc.pfHalfAverage[1]	= DyadicBilinearDownsamplerWidthx16_sse4;
	}
#endif//X86_ASM
	
}

EResult CDownsampling::Process(int32_t iType, SPixMap *pSrcPixMap, SPixMap *pDstPixMap)
{
	int32_t iSrcWidthY = pSrcPixMap->sRect.iRectWidth;
	int32_t iSrcHeightY = pSrcPixMap->sRect.iRectHeight;
	int32_t iDstWidthY = pDstPixMap->sRect.iRectWidth;
	int32_t iDstHeightY = pDstPixMap->sRect.iRectHeight;

	int32_t iSrcWidthUV = iSrcWidthY >> 1;
	int32_t iSrcHeightUV = iSrcHeightY >> 1;
	int32_t iDstWidthUV = iDstWidthY >> 1;
	int32_t iDstHeightUV = iDstHeightY >> 1;

	if (iSrcWidthY <= iDstWidthY || iSrcHeightY <= iDstHeightY)
	{
		return RET_INVALIDPARAM;
	}

	if ((iSrcWidthY >>1) == iDstWidthY && (iSrcHeightY >> 1) == iDstHeightY)
	{
		// use half average functions
		uint8_t iAlignIndex = 3;

		iAlignIndex = GetAlignedIndex(iSrcWidthY);
		m_pfDownsample.pfHalfAverage[iAlignIndex]((uint8_t*)pDstPixMap->pPixel[0], pDstPixMap->iStride[0], (uint8_t*)pSrcPixMap->pPixel[0], pSrcPixMap->iStride[0], iSrcWidthY, iSrcHeightY);

		iAlignIndex = GetAlignedIndex(iSrcWidthUV);
		m_pfDownsample.pfHalfAverage[iAlignIndex]((uint8_t*)pDstPixMap->pPixel[1], pDstPixMap->iStride[1], (uint8_t*)pSrcPixMap->pPixel[1], pSrcPixMap->iStride[1], iSrcWidthUV, iSrcHeightUV);
		m_pfDownsample.pfHalfAverage[iAlignIndex]((uint8_t*)pDstPixMap->pPixel[2], pDstPixMap->iStride[2], (uint8_t*)pSrcPixMap->pPixel[2], pSrcPixMap->iStride[2], iSrcWidthUV, iSrcHeightUV);
	}
	else 
	{
		m_pfDownsample.pfGeneralRatioLuma((uint8_t*)pDstPixMap->pPixel[0], pDstPixMap->iStride[0], iDstWidthY, iDstHeightY, 
			(uint8_t*)pSrcPixMap->pPixel[0], pSrcPixMap->iStride[0], iSrcWidthY, iSrcHeightY);

		m_pfDownsample.pfGeneralRatioChroma((uint8_t*)pDstPixMap->pPixel[1], pDstPixMap->iStride[1], iDstWidthUV, iDstHeightUV,
			(uint8_t*)pSrcPixMap->pPixel[1], pSrcPixMap->iStride[1], iSrcWidthUV, iSrcHeightUV);

		m_pfDownsample.pfGeneralRatioChroma((uint8_t*)pDstPixMap->pPixel[2], pDstPixMap->iStride[2], iDstWidthUV, iDstHeightUV,
			(uint8_t*)pSrcPixMap->pPixel[2], pSrcPixMap->iStride[2], iSrcWidthUV, iSrcHeightUV);
	}
	return RET_SUCCESS;
}

int32_t CDownsampling::GetAlignedIndex( const int32_t kiSrcWidth )
{
	int32_t iAlignIndex = 3;
	if ( (kiSrcWidth & 0x1f) == 0 )	// x32	
		iAlignIndex	= 0;
	else if ( (kiSrcWidth & 0x0f) == 0 )	// x16
		iAlignIndex	= 1;
	else if ( (kiSrcWidth & 0x07) == 0 )	// x8
		iAlignIndex	= 2;
	else
		iAlignIndex	= 3;
	return iAlignIndex;
}


WELSVP_NAMESPACE_END