ref: d657db3bf49b42561161ef60d6e3e182e517a5ab
dir: /CoreAAC/CoreAAC.cpp/
/* * CoreAAC - AAC DirectShow Decoder Filter * * Modification to decode AAC without ADTS and multichannel support * (c) 2003 [email protected] * * Under section 8 of the GNU General Public License, the copyright * holders of CoreAAC explicitly forbid distribution in the following * countries: * - Japan * - United States of America * * * AAC DirectShow Decoder Filter * Copyright (C) 2003 Robert Cioch * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. * */ #include <windows.h> #include <streams.h> #include <initguid.h> #include <olectl.h> #include <transfrm.h> #include <mmreg.h> #include <ks.h> #include <ksmedia.h> #include <stdio.h> #include "AACProfilesName.h" #include "ICoreAAC.h" #include "CoreAACGUID.h" #include "CoreAACInfoProp.h" #include "CoreAACAboutProp.h" #include "CoreAAC.h" // ============================================================================ // Registration setup stuff AMOVIESETUP_MEDIATYPE sudInputType[] = { { &MEDIATYPE_Audio, &MEDIASUBTYPE_AAC } }; AMOVIESETUP_MEDIATYPE sudOutputType[] = { { &MEDIATYPE_Audio, &MEDIASUBTYPE_PCM } }; AMOVIESETUP_PIN sudPins[] = { { L"Input", FALSE, // bRendered FALSE, // bOutput FALSE, // bZero FALSE, // bMany &CLSID_NULL, // clsConnectsToFilter NULL, // ConnectsToPin NUMELMS(sudInputType), // Number of media types sudInputType }, { L"Output", FALSE, // bRendered TRUE, // bOutput FALSE, // bZero FALSE, // bMany &CLSID_NULL, // clsConnectsToFilter NULL, // ConnectsToPin NUMELMS(sudOutputType), // Number of media types sudOutputType } }; AMOVIESETUP_FILTER sudDecoder = { &CLSID_DECODER, L"CoreAAC Audio Decoder", MERIT_PREFERRED, NUMELMS(sudPins), sudPins }; // ============================================================================ // COM Global table of objects in this dll CFactoryTemplate g_Templates[] = { { L"CoreAAC Audio Decoder", &CLSID_DECODER, CCoreAACDecoder::CreateInstance, NULL, &sudDecoder }, { L"CoreAAC Audio Decoder Info", &CLSID_CoreAACInfoProp, CCoreAACInfoProp::CreateInstance, NULL, NULL}, { L"CoreAAC Audio Decoder About", &CLSID_CoreAACAboutProp, CCoreAACAboutProp::CreateInstance, NULL, NULL}, }; // Count of objects listed in g_cTemplates int g_cTemplates = sizeof(g_Templates) / sizeof(g_Templates[0]); // ============================================================================ STDAPI DllRegisterServer() { return AMovieDllRegisterServer2(TRUE); } // ---------------------------------------------------------------------------- STDAPI DllUnregisterServer() { return AMovieDllRegisterServer2(FALSE); } // ---------------------------------------------------------------------------- // The streams.h DLL entrypoint. extern "C" BOOL WINAPI DllEntryPoint(HINSTANCE, ULONG, LPVOID); // The entrypoint required by the MSVC runtimes. This is used instead // of DllEntryPoint directly to ensure global C++ classes get initialised. BOOL WINAPI DllMain(HANDLE hDllHandle, DWORD dwReason, LPVOID lpreserved) { return DllEntryPoint(reinterpret_cast<HINSTANCE>(hDllHandle), dwReason, lpreserved); } // ---------------------------------------------------------------------------- CUnknown *WINAPI CCoreAACDecoder::CreateInstance(LPUNKNOWN punk, HRESULT *phr) { CCoreAACDecoder *pNewObject = new CCoreAACDecoder(punk, phr); if (!pNewObject) *phr = E_OUTOFMEMORY; return pNewObject; } // ---------------------------------------------------------------------------- void SaveInt(char* keyname, int value) { HKEY hKey; DWORD dwDisp; if (ERROR_SUCCESS == RegCreateKeyEx(HKEY_CURRENT_USER, "Software\\CoreAAC", 0, "REG_SZ", REG_OPTION_NON_VOLATILE, KEY_WRITE, NULL, &hKey, &dwDisp)) { DWORD dwSize = sizeof(DWORD); RegSetValueEx(hKey, keyname, 0, REG_DWORD, (CONST BYTE*)&value, dwSize); RegCloseKey(hKey); } } int LoadInt(char* keyname, int default_value) { HKEY hKey; int result = default_value; if (ERROR_SUCCESS == RegOpenKeyEx(HKEY_CURRENT_USER, "Software\\CoreAAC", 0, KEY_READ, &hKey)) { DWORD dwTmp = 0; DWORD dwcbData = sizeof(DWORD); if(RegQueryValueEx(hKey, keyname, NULL, NULL, (LPBYTE) &dwTmp, &dwcbData) == ERROR_SUCCESS) { result = dwTmp; } RegCloseKey(hKey); } return result; } // ---------------------------------------------------------------------------- CCoreAACDecoder::CCoreAACDecoder(LPUNKNOWN lpunk, HRESULT *phr) : CTransformFilter(NAME("CoreAAC Audio Decoder"), lpunk, CLSID_DECODER), m_decHandle(NULL), m_decoderSpecificLen(0), m_decoderSpecific(NULL), m_Channels(0), m_SamplesPerSec(0), m_BitsPerSample(0), m_Bitrate(0), m_brCalcFrames(0), m_brBytesConsumed(0), m_DecodedFrames(0), m_OutputBuffLen(0), m_DownMatrix(false) { NOTE("CCoreAACDecoder::CCoreAACDecoder"); m_ProfileName[0] = '\0'; m_DownMatrix = LoadInt("DownMatrix", TRUE) ? true : false; } // ---------------------------------------------------------------------------- CCoreAACDecoder::~CCoreAACDecoder() { NOTE("CCoreAACDecoder::~CCoreAACDecoder"); SaveInt("DownMatrix",m_DownMatrix); if(m_decHandle) { faacDecClose(m_decHandle); m_decHandle = NULL; } if(m_decoderSpecific) { delete m_decoderSpecific; m_decoderSpecific = NULL; } } // ---------------------------------------------------------------------------- STDMETHODIMP CCoreAACDecoder::NonDelegatingQueryInterface(REFIID riid, void **ppv) { if(riid == IID_ICoreAACDec) return GetInterface((ICoreAACDec *)this, ppv); else if (riid == IID_ISpecifyPropertyPages) return GetInterface((ISpecifyPropertyPages *)this, ppv); else return CTransformFilter::NonDelegatingQueryInterface(riid, ppv); } // ---------------------------------------------------------------------------- // property pages STDMETHODIMP CCoreAACDecoder::GetPages(CAUUID *pPages) { pPages->cElems = 2; pPages->pElems = (GUID *)CoTaskMemAlloc(pPages->cElems * sizeof(GUID)); if (!pPages->pElems) return E_OUTOFMEMORY; pPages->pElems[0] = CLSID_CoreAACInfoProp; pPages->pElems[1] = CLSID_CoreAACAboutProp; return S_OK; } // ============================================================================ // accept only aac audio wrapped in waveformat HRESULT CCoreAACDecoder::CheckInputType(const CMediaType *mtIn) { if (*mtIn->Type() != MEDIATYPE_Audio || *mtIn->Subtype() != MEDIASUBTYPE_AAC) return VFW_E_TYPE_NOT_ACCEPTED; if (*mtIn->FormatType() != FORMAT_WaveFormatEx) return VFW_E_TYPE_NOT_ACCEPTED; WAVEFORMATEX *wfex = (WAVEFORMATEX *)mtIn->Format(); if (wfex->wFormatTag != WAVE_FORMAT_AAC) return VFW_E_TYPE_NOT_ACCEPTED; if(wfex->cbSize < 2) return VFW_E_TYPE_NOT_ACCEPTED; m_decoderSpecificLen = wfex->cbSize; if(m_decoderSpecific) { delete m_decoderSpecific; m_decoderSpecific = NULL; } m_decoderSpecific = new unsigned char[m_decoderSpecificLen]; // Keep decoderSpecific initialization data (appended to the WAVEFORMATEX struct) memcpy(m_decoderSpecific,(char*)wfex+sizeof(WAVEFORMATEX), m_decoderSpecificLen); return S_OK; } // ============================================================================ // propose proper waveformat HRESULT CCoreAACDecoder::GetMediaType(int iPosition, CMediaType *mtOut) { if (!m_pInput->IsConnected()) { return E_UNEXPECTED; } if (iPosition < 0) { return E_INVALIDARG; } if (iPosition > 0) { return VFW_S_NO_MORE_ITEMS; } // Some drivers don't like WAVEFORMATEXTENSIBLE when channels are <= 2 so // we fall back to a classic WAVEFORMATEX struct in this case WAVEFORMATEXTENSIBLE wfex; ZeroMemory(&wfex, sizeof(WAVEFORMATEXTENSIBLE)); wfex.SubFormat = KSDATAFORMAT_SUBTYPE_PCM; wfex.Format.wFormatTag = (m_Channels <= 2) ? WAVE_FORMAT_PCM : WAVE_FORMAT_EXTENSIBLE; wfex.Format.cbSize = (m_Channels <= 2) ? 0 : sizeof(WAVEFORMATEXTENSIBLE) - sizeof(WAVEFORMATEX); wfex.Format.nChannels = (unsigned short)m_Channels; wfex.Format.nSamplesPerSec = (unsigned short)m_SamplesPerSec; wfex.Format.wBitsPerSample = m_BitsPerSample; wfex.Format.nBlockAlign = (unsigned short)((wfex.Format.nChannels * wfex.Format.wBitsPerSample) / 8); wfex.Format.nAvgBytesPerSec = wfex.Format.nSamplesPerSec * wfex.Format.nBlockAlign; switch(m_Channels) { case 1: wfex.dwChannelMask = KSAUDIO_SPEAKER_MONO; break; case 2: wfex.dwChannelMask = KSAUDIO_SPEAKER_STEREO; break; case 3: wfex.dwChannelMask = KSAUDIO_SPEAKER_STEREO | SPEAKER_FRONT_CENTER; break; case 4: //wfex.dwChannelMask = KSAUDIO_SPEAKER_QUAD; wfex.dwChannelMask = (SPEAKER_FRONT_LEFT | SPEAKER_FRONT_RIGHT | SPEAKER_FRONT_CENTER | SPEAKER_BACK_CENTER); break; case 5: wfex.dwChannelMask = KSAUDIO_SPEAKER_QUAD | SPEAKER_FRONT_CENTER; break; case 6: wfex.dwChannelMask = KSAUDIO_SPEAKER_5POINT1; break; default: wfex.dwChannelMask = KSAUDIO_SPEAKER_DIRECTOUT; // XXX : or SPEAKER_ALL ?? break; } wfex.Samples.wValidBitsPerSample = wfex.Format.wBitsPerSample; mtOut->SetType(&MEDIATYPE_Audio); mtOut->SetSubtype(&MEDIASUBTYPE_PCM); mtOut->SetFormatType(&FORMAT_WaveFormatEx); mtOut->SetFormat( (BYTE*) &wfex, sizeof(WAVEFORMATEX)+wfex.Format.cbSize); mtOut->SetTemporalCompression(FALSE); return S_OK; } // ---------------------------------------------------------------------------- HRESULT CCoreAACDecoder::CheckTransform(const CMediaType *mtIn, const CMediaType *mtOut) { if (*mtOut->Type() != MEDIATYPE_Audio || *mtOut->Subtype() != MEDIASUBTYPE_PCM || *mtOut->FormatType() != FORMAT_WaveFormatEx) { return VFW_E_TYPE_NOT_ACCEPTED; } return S_OK; } // ---------------------------------------------------------------------------- // 960 for LD or else 1024 (expanded to 2048 for HE-AAC) #define MAXFRAMELEN 2048 HRESULT CCoreAACDecoder::DecideBufferSize(IMemAllocator *pAllocator, ALLOCATOR_PROPERTIES *pProperties) { pProperties->cBuffers = 8; m_OutputBuffLen = m_Channels * MAXFRAMELEN * sizeof(short); pProperties->cbBuffer = m_OutputBuffLen; NOTE1("CCoreAACDecoder::DecideBufferSize %d", pProperties->cbBuffer); ALLOCATOR_PROPERTIES Actual; HRESULT hr = pAllocator->SetProperties(pProperties, &Actual); if(FAILED(hr)) return hr; if (Actual.cbBuffer < pProperties->cbBuffer || Actual.cBuffers < pProperties->cBuffers) return E_INVALIDARG; return S_OK; } // ---------------------------------------------------------------------------- HRESULT CCoreAACDecoder::CompleteConnect(PIN_DIRECTION direction, IPin *pReceivePin) { HRESULT hr = CTransformFilter::CompleteConnect(direction, pReceivePin); if(direction == PINDIR_INPUT) { if(m_decHandle) { faacDecClose(m_decHandle); m_decHandle = NULL; } m_decHandle = faacDecOpen(); faacDecConfigurationPtr config; config = faacDecGetCurrentConfiguration(m_decHandle); config->downMatrix = m_DownMatrix; faacDecSetConfiguration(m_decHandle, config); // Initialize the decoder unsigned long SamplesPerSec = 0; unsigned char Channels = 0; if(faacDecInit2(m_decHandle, m_decoderSpecific, m_decoderSpecificLen, &SamplesPerSec, &Channels) < 0) { return E_FAIL; } if(m_DownMatrix) { Channels = 2; // TODO : check with mono } mp4AudioSpecificConfig info; AudioSpecificConfig(m_decoderSpecific,m_decoderSpecificLen,&info); wsprintf(m_ProfileName,"%s%s", ObjectTypesNameTable[info.objectTypeIndex], #if 0 info.sbr_present_flag ? #else false ? #endif "+SBR" : "" ); m_Channels = Channels; m_SamplesPerSec = SamplesPerSec; m_BitsPerSample = 16; // we always decode to the default 16 bits (we could add 24,32,float) m_brCalcFrames = 0; m_brBytesConsumed = 0; m_DecodedFrames = 0; } return hr; } // ---------------------------------------------------------------------------- HRESULT CCoreAACDecoder::StartStreaming(void) { m_brCalcFrames = 0; m_brBytesConsumed = 0; m_DecodedFrames = 0; return CTransformFilter::StartStreaming(); } // ---------------------------------------------------------------------------- HRESULT CCoreAACDecoder::Transform(IMediaSample *pIn, IMediaSample *pOut) { if (m_State == State_Stopped) { pOut->SetActualDataLength(0); return S_OK; } if(pIn->IsPreroll() == S_OK) { return S_FALSE; } // Decode the sample data DWORD ActualDstLength; BYTE *pSrc, *pDst; DWORD SrcLength = pIn->GetActualDataLength(); DWORD DstLength = pOut->GetSize(); HRESULT hr; hr = pIn->GetPointer(&pSrc); if(hr != S_OK) return hr; hr = pOut->GetPointer(&pDst); if(hr != S_OK) return hr; if(!pSrc || !pDst || (DstLength < m_OutputBuffLen)) return S_FALSE; // Decode data // (use our buffer calculated len, as the Waveout renderer seems to report wrongly a bigger size) if(!Decode(pSrc, SrcLength, pDst, m_OutputBuffLen, &ActualDstLength)) return S_FALSE; NOTE3("Transform: %u->%u (%u)\n", SrcLength, ActualDstLength, m_OutputBuffLen); // Copy the actual data length pOut->SetActualDataLength(ActualDstLength); return S_OK; } // ---------------------------------------------------------------------------- // AAC order : C, L, R, L", R", LFE // DShow order : L, R, C, LFE, L", R" const int MAXCHANNELS = 6; const int chmap[MAXCHANNELS][MAXCHANNELS+1] = { // first column tell us if we need to remap { 0, }, // mono { 0, }, // l, r { 1, 1, 2, 0, }, // c ,l, r -> l, r, c { 1, 1, 2, 0, 3, }, // c, l, r, bc -> l, r, c, bc { 1, 1, 2, 0, 3, 4, }, // c, l, r, bl, br -> l, r, c, bl, br { 1, 1, 2, 0, 5, 3, 4 } // c, l, r, bl, br, lfe -> l, r, c, lfe, bl, br }; // ---------------------------------------------------------------------------- bool CCoreAACDecoder::Decode(BYTE *pSrc, DWORD SrcLength, BYTE *pDst, DWORD DstLength, DWORD *ActualDstLength) { faacDecFrameInfo frameInfo; short *outsamples = (short *)faacDecDecode(m_decHandle, &frameInfo, pSrc, DstLength); if (frameInfo.error) { NOTE2("CCoreAACDecoder::Decode Error %d [%s]\n", frameInfo.error, faacDecGetErrorMessage(frameInfo.error)); return false; } m_brCalcFrames++; m_DecodedFrames++; m_brBytesConsumed += SrcLength; if(m_brCalcFrames == 43) { m_Bitrate = (int)((m_brBytesConsumed * 8) / (m_DecodedFrames / 43.07)); m_brCalcFrames = 0; } if (!frameInfo.error && outsamples) { int channelidx = frameInfo.channels-1; if(chmap[channelidx][0]) { // dshow remapping short *dstBuffer = (short*)pDst; for(unsigned int i = 0; i < frameInfo.samples; i += frameInfo.channels, outsamples += frameInfo.channels) { for(unsigned int j=1; j <= frameInfo.channels; j++) { *dstBuffer++ = outsamples[chmap[channelidx][j]]; } } } else { memcpy(pDst, outsamples, frameInfo.samples * sizeof(short)); } } else return false; *ActualDstLength = frameInfo.samples * sizeof(short); return true; } // ============================================================================ // ICoreAAC // ============================================================================ STDMETHODIMP CCoreAACDecoder::get_ProfileName(char** name) { CheckPointer(name,E_POINTER); *name = m_ProfileName; return S_OK; } STDMETHODIMP CCoreAACDecoder::get_SampleRate(int* sample_rate) { CheckPointer(sample_rate,E_POINTER); *sample_rate = m_SamplesPerSec; return S_OK; } STDMETHODIMP CCoreAACDecoder::get_Channels(int *channels) { CheckPointer(channels,E_POINTER); *channels = m_Channels; return S_OK; } STDMETHODIMP CCoreAACDecoder::get_BitsPerSample(int *bits_per_sample) { CheckPointer(bits_per_sample,E_POINTER); *bits_per_sample = m_BitsPerSample; return S_OK; } STDMETHODIMP CCoreAACDecoder::get_Bitrate(int *bitrate) { CheckPointer(bitrate,E_POINTER); *bitrate = m_Bitrate; return S_OK; } STDMETHODIMP CCoreAACDecoder::get_FramesDecoded(unsigned int *frames_decoded) { CheckPointer(frames_decoded,E_POINTER); *frames_decoded = m_DecodedFrames; return S_OK; } STDMETHODIMP CCoreAACDecoder::get_DownMatrix(bool *down_matrix) { CheckPointer(down_matrix,E_POINTER); *down_matrix = m_DownMatrix; return S_OK; } STDMETHODIMP CCoreAACDecoder::set_DownMatrix(bool down_matrix) { m_DownMatrix = down_matrix; return S_OK; } // ============================================================================