Source code of Windows XP (NT5)
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

1822 lines
58 KiB

/*******************************************************************************
* VoiceDataObj.cpp *
*------------------*
* Description:
* This module is the main implementation file for the CVoiceDataObj class.
*-------------------------------------------------------------------------------
* Created By: EDC Date: 05/06/99
* Copyright (C) 1999 Microsoft Corporation
* All Rights Reserved
*
*******************************************************************************/
//--- Additional includes
#include "stdafx.h"
#include "VoiceDataObj.h"
/*****************************************************************************
* CVoiceDataObj::FinalConstruct *
*-------------------------------*
* Description:
* Constructor
********************************************************************* EDC ***/
HRESULT CVoiceDataObj::FinalConstruct()
{
    //--- Nothing is mapped yet: clear both file-mapping handles and both views
    m_hVoiceDef  = NULL;
    m_pVoiceDef  = NULL;
    m_hVoiceData = NULL;
    m_pVoiceData = NULL;

    //--- Create the driver voice with this object as its controlling unknown.
    //    The driver voice itself is initialized later.
    HRESULT hrCreate = m_cpunkDrvVoice.CoCreateInstance( CLSID_MSTTSEngine,
                                                         GetControllingUnknown() );
    return hrCreate;
} /* CVoiceDataObj::FinalConstruct */
/*****************************************************************************
* CVoiceDataObj::FinalRelease *
*-----------------------------*
* Description:
* destructor
********************************************************************* EDC ***/
void CVoiceDataObj::FinalRelease()
{
SPDBG_FUNC( "CVoiceDataObj::FinalRelease" );
if( m_pVoiceDef )
{
::UnmapViewOfFile( (void*)m_pVoiceDef );
}
if( m_pVoiceData )
{
::UnmapViewOfFile( (void*)m_pVoiceData );
}
if( m_hVoiceDef ) ::CloseHandle( m_hVoiceDef );
if( m_hVoiceData ) ::CloseHandle( m_hVoiceData );
} /* CVoiceDataObj::FinalRelease */
/*****************************************************************************
* CVoiceDataObj::MapFile *
*------------------------*
* Description:
* Helper function used by SetObjectToken to map file. This function
* assumes that m_cpToken has been initialized.+++
********************************************************************* RAL ***/
HRESULT CVoiceDataObj::MapFile( const WCHAR * pszTokenVal,  // Value that contains file path
                                HANDLE * phMapping,         // Pointer to file mapping handle
                                void ** ppvData )           // Pointer to the data
{
    //--------------------------------------------------------------------
    // Reads the file path stored under 'pszTokenVal' in m_cpToken, opens
    // that file read-only, creates a named read-only file mapping for it
    // and maps a view of the whole file.
    //
    // On success *phMapping and *ppvData receive the mapping handle and
    // the view address. On any failure after the token lookup both are
    // NULL and a failing HRESULT is returned. If the token lookup itself
    // fails, the outputs are left untouched.
    //--------------------------------------------------------------------
    HRESULT hr = S_OK;
    CSpDynamicString dstrFilePath;

    hr = m_cpToken->GetStringValue( pszTokenVal, &dstrFilePath );
    if ( SUCCEEDED( hr ) )
    {
        // The Win32 error is captured right at the call that failed, so a
        // later CloseHandle cannot disturb the value that gets reported.
        DWORD dwError = ERROR_SUCCESS;

        *phMapping = NULL;
        *ppvData = NULL;

        HANDLE hFile;
#ifndef _WIN32_WCE
        hFile = g_Unicode.CreateFile(
                    dstrFilePath,
                    GENERIC_READ,
                    FILE_SHARE_READ,
                    NULL,
                    OPEN_EXISTING,
                    FILE_ATTRIBUTE_NORMAL,
                    NULL );
#else //_WIN32_WCE
        hFile = g_Unicode.CreateFileForMapping(
                    dstrFilePath,
                    GENERIC_READ,
                    FILE_SHARE_READ,
                    NULL,
                    OPEN_EXISTING,
                    FILE_ATTRIBUTE_NORMAL,
                    NULL );
#endif //_WIN32_WCE

        if (hFile == INVALID_HANDLE_VALUE)
        {
            dwError = ::GetLastError();
        }
        else
        {
            //-------------------------------------
            // Make a unique map name from path
            //-------------------------------------
            long i;
            for( i = 0; i < _MAX_PATH-1; i++ )
            {
                if( dstrFilePath[i] == 0 )
                {
                    // End of string
                    break;
                }
                if( dstrFilePath[i] == '\\' )
                {
                    //-------------------------------------
                    // Change backslash to underscore
                    //-------------------------------------
                    dstrFilePath[i] = '_';
                }
            }

            *phMapping = g_Unicode.CreateFileMapping( hFile, NULL, PAGE_READONLY, 0, 0, dstrFilePath );
            if (*phMapping == NULL)
            {
                dwError = ::GetLastError();
            }

            // The file handle is closed here whether or not the mapping
            // was created; only the mapping handle is handed to the caller.
            ::CloseHandle( hFile );
        }

        if (*phMapping)
        {
            *ppvData = ::MapViewOfFile( *phMapping, FILE_MAP_READ, 0, 0, 0 );
            if (*ppvData == NULL)
            {
                dwError = ::GetLastError();
                ::CloseHandle(*phMapping);
                *phMapping = NULL;
            }
        }

        if (*ppvData == NULL)
        {
            hr = HRESULT_FROM_WIN32( dwError );
            if (hr == E_HANDLE)
            {
                // Report an invalid-handle failure as "file not found"
                hr &= 0xFFFFF000;
                hr |= ERROR_FILE_NOT_FOUND;
            }
            if (SUCCEEDED(hr))
            {
                // Nothing was mapped, so never report success even if the
                // recorded Win32 error happened to be ERROR_SUCCESS.
                hr = E_FAIL;
            }
        }
    }
    return hr;
} /* CVoiceDataObj::MapFile */
/*****************************************************************************
* CVoiceDataObj::SetObjectToken *
*-------------------------------*
* Description:
* This function performs the majority of the initialization of the voice.
* Once the object token has been provided, the filenames are read from the
* token key and the files are mapped.+++
********************************************************************* RAL ***/
STDMETHODIMP CVoiceDataObj::SetObjectToken(ISpObjectToken * pToken)
{
    //--------------------------------------------------------------------
    // Stores the object token, maps the "VoiceDef" and "VoiceData" files
    // named in it, sets up the voice data pointers and finally hands this
    // object to the driver voice through IMSTTSEngineInit::VoiceInit.
    // Each step runs only if the previous one succeeded; the first
    // failing HRESULT is returned.
    //--------------------------------------------------------------------
    SPDBG_FUNC( "CVoiceDataObj::SetObjectToken" );
    HRESULT hr = SpGenericSetObjectToken(pToken, m_cpToken);

    //--- Map the voice definition and voice data files
    if ( SUCCEEDED( hr ) )
    {
        hr = MapFile( L"VoiceDef", &m_hVoiceDef, (void **)&m_pVoiceDef );
    }
    if ( SUCCEEDED( hr ) )
    {
        hr = MapFile( L"VoiceData", &m_hVoiceData, (void **)&m_pVoiceData );
    }

    //--- Init voice data pointers
    if (SUCCEEDED(hr))
    {
        hr = InitVoiceData();
    }

    //--- Initialize the driver voice
    if( SUCCEEDED( hr ))
    {
        CComQIPtr<IMSTTSEngineInit> cpInit( m_cpunkDrvVoice );
        SPDBG_ASSERT( cpInit );
        if( !cpInit )
        {
            // The assert compiles away in release builds; fail cleanly
            // instead of calling through a NULL interface pointer.
            hr = E_NOINTERFACE;
        }
        else
        {
            hr = cpInit->VoiceInit( this );
        }
    }
    return hr;
} /* CVoiceDataObj::SetObjectToken */
/*****************************************************************************
* CVoiceDataObj::GetVoiceInfo *
*-----------------------------*
* Description:
* This method is used to retrieve the voice file data description.+++
********************************************************************* EDC ***/
STDMETHODIMP CVoiceDataObj::GetVoiceInfo( MSVOICEINFO* pVoiceInfo )
{
    SPDBG_FUNC( "CVoiceDataObj::GetVoiceInfo" );

    //--- Reject a bad output pointer or a missing voice definition
    if( SP_IS_BAD_WRITE_PTR( pVoiceInfo ) || !m_pVoiceDef )
    {
        return E_INVALIDARG;
    }

    //--- No token means the object was never set up
    if( !m_cpToken )
    {
        return SPERR_UNINITIALIZED;
    }

    //--- Values cached from the inventory block
    pVoiceInfo->pWindow      = m_pWindow;
    pVoiceInfo->FFTSize      = m_FFTSize;
    pVoiceInfo->LPCOrder     = m_cOrder;

    //--- Values copied straight from the voice definition
    pVoiceInfo->ProsodyGain  = m_pVoiceDef->ProsodyGain;
    pVoiceInfo->eReverbType  = m_pVoiceDef->ReverbType;
    pVoiceInfo->Pitch        = m_pVoiceDef->Pitch;
    pVoiceInfo->Rate         = m_pVoiceDef->Rate;
    pVoiceInfo->LangID       = m_pVoiceDef->LangID;
    pVoiceInfo->SampleRate   = m_pVoiceDef->SampleRate;
    pVoiceInfo->VibratoFreq  = m_pVoiceDef->VibratoFreq;
    pVoiceInfo->VibratoDepth = m_pVoiceDef->VibratoDepth;
    pVoiceInfo->NumOfTaps    = m_pVoiceDef->NumOfTaps;

    //--- Wave format. Assumes voices are ALWAYS 16-bit mono
    //    (probably valid for now) ***
    pVoiceInfo->WaveFormatEx.wFormatTag      = WAVE_FORMAT_PCM;
    pVoiceInfo->WaveFormatEx.nSamplesPerSec  = pVoiceInfo->SampleRate;
    pVoiceInfo->WaveFormatEx.wBitsPerSample  = 16;  // ***
    pVoiceInfo->WaveFormatEx.nChannels       = 1;   // ***
    pVoiceInfo->WaveFormatEx.nBlockAlign     =
        (unsigned short)(pVoiceInfo->WaveFormatEx.nChannels * sizeof(short));   // ***
    pVoiceInfo->WaveFormatEx.nAvgBytesPerSec =
        pVoiceInfo->WaveFormatEx.nSamplesPerSec * pVoiceInfo->WaveFormatEx.nBlockAlign;
    pVoiceInfo->WaveFormatEx.cbSize          = 0;

    //--- All MAXTAPS tap coefficients are copied
    long tap;
    for( tap = 0; tap < MAXTAPS; tap++ )
    {
        pVoiceInfo->TapCoefficients[tap] = m_pVoiceDef->TapCoefficients[tap];
    }

    return S_OK;
} /* CVoiceDataObj::GetVoiceInfo */
/*****************************************************************************
* CVoiceDataObj::GetUnitData *
*----------------------------*
* Description:
* Retrieves and uncompresses audio data from the unit inventory. +++
*
********************************************************************* EDC ***/
STDMETHODIMP CVoiceDataObj::GetUnitData( ULONG unitID, MSUNITDATA* pUnitData )
{
    SPDBG_FUNC( "CVoiceDataObj::GetUnit" );

    //--- Check args
    if( SP_IS_BAD_WRITE_PTR( pUnitData ) )
    {
        return E_INVALIDARG;
    }
    if( unitID > m_NumOfUnits )
    {
        // ID is out of range!
        return E_INVALIDARG;
    }

    //--- The object must have been given its token
    if( !m_cpToken )
    {
        return SPERR_UNINITIALIZED;
    }

    //--- Only the LPC compressed inventory can be decoded
    if( m_CompressionType != COMPRESS_LPC )
    {
        // Unsupported compression type
        return E_FAIL;
    }

    //--- Retrieve data from compressed inventory
    return DecompressUnit( unitID, pUnitData );
} /* CVoiceDataObj::GetUnit */
/*****************************************************************************
* CVoiceDataObj::AlloToUnit *
*---------------------------*
* Description:
* Converts FE allo code to BE unit phon code.+++
*
********************************************************************* EDC ***/
STDMETHODIMP CVoiceDataObj::AlloToUnit( short allo, long attributes, long* pUnitID )
{
    //--------------------------------------------------------------------
    // Looks up the unit code for allophone 'allo' in m_AlloToUnitTbl.
    // The table holds two entries per allophone; the entries used for
    // stressed allophones (ALLO_IS_STRESSED set in 'attributes') start
    // (m_NumOfAllos * 2) entries after those for unstressed ones.
    //
    // Returns E_INVALIDARG for a bad output pointer or an out-of-range
    // allophone, SPERR_UNINITIALIZED if no token has been set, else S_OK
    // with the code written to *pUnitID.
    //--------------------------------------------------------------------
    SPDBG_FUNC( "CVoiceDataObj::AlloToUnit" );
    HRESULT hr = S_OK;

    //--- Check args
    if( SP_IS_BAD_WRITE_PTR( pUnitID ) )
    {
        // *pUnitID is written, so it must be validated for writing
        hr = E_INVALIDARG;
    }
    else if( !m_cpToken )
    {
        // The table pointer and count are only set up by InitVoiceData,
        // which runs from SetObjectToken
        hr = SPERR_UNINITIALIZED;
    }
    else if( (allo < 0) || (allo >= m_NumOfAllos) )
    {
        // A negative code would index in front of the table
        hr = E_INVALIDARG;
    }
    else
    {
        long index = (long)allo << 1;       // 2 entries per phon
        const char* pb;

        if( attributes & ALLO_IS_STRESSED )
        {
            //--- 2nd half
            pb = (const char*) &m_AlloToUnitTbl[index + (m_NumOfAllos << 1)];
        }
        else
        {
            pb = (const char*) &m_AlloToUnitTbl[index];
        }

        // Copy byte-wise to avoid misaligned data accesses in 64bit.
        short unit;
        memcpy( &unit, pb, sizeof(unit) );
        *pUnitID = (long) unit;
    }
    return hr;
} /* CVoiceDataObj::AlloToUnit */
/*****************************************************************************
* CVoiceDataObj::GetUnitIDs *
*---------------------------*
* Description:
* Gets the inventory triphone (in context) unit code.+++
*
********************************************************************* EDC ***/
STDMETHODIMP CVoiceDataObj::GetUnitIDs( UNIT_CVT* pUnits, ULONG cUnits )
{
    //--------------------------------------------------------------------
    // For each of the 'cUnits' entries in 'pUnits', uses the entry's
    // PhonID/flags together with those of its neighbours to fill in
    // UnitID, SenoneID, szUnitName, Dur, Amp and AmpRatio.
    // The phon before the first entry and after the last entry is taken
    // to be silence (m_Sil_Index).
    //
    // Returns E_INVALIDARG for a bad 'pUnits' pointer, SPERR_UNINITIALIZED
    // if no token has been set, otherwise S_OK.
    //--------------------------------------------------------------------
    SPDBG_FUNC( "CVoiceDataObj::GetUnitIDs" );
    ULONG i;
    ULONG curID, prevID, nextID;
    ULONG curF, prevF, nextF;
    char cPos;
    ULONG senoneID;
    UNALIGNED UNIT_STATS *pStats;
    HRESULT hr = S_OK;

    //--- Check args
    if( (SP_IS_BAD_READ_PTR( pUnits)) ||
        (SP_IS_BAD_WRITE_PTR( pUnits)) )
    {
        hr = E_INVALIDARG;
    }
    else
    {
        if (!m_cpToken)
        {
            hr = SPERR_UNINITIALIZED;
        }
        else
        {
            for( i = 0; i < cUnits; i++ )
            {
                //---------------------------
                // CURRENT phon
                //---------------------------
                curID = pUnits[i].PhonID;
                curF = pUnits[i].flags;

                //---------------------------
                // PREVIOUS phon
                //---------------------------
                if( i == 0 )
                {
                    prevID = m_Sil_Index;
                    prevF = 0;
                }
                else
                {
                    prevID = pUnits[i-1].PhonID;
                    prevF = pUnits[i-1].flags;
                }

                //---------------------------
                // NEXT phon
                //---------------------------
                if( i >= cUnits -1 )
                {
                    nextID = m_Sil_Index;
                    nextF = 0;
                }
                else
                {
                    nextID = pUnits[i+1].PhonID;
                    nextF = pUnits[i+1].flags;
                }

                if( curID == m_Sil_Index )
                {
                    //----------------------
                    // SILENCE phon
                    //----------------------
                    pUnits[i].UnitID = 0;
                    pUnits[i].SenoneID = 0;
                    pUnits[i].szUnitName[0] = 0;
                    pUnits[i].Dur = SIL_DURATION;
                    pUnits[i].Amp = 0;
                    pUnits[i].AmpRatio = 1.0f;
                }
                else
                {
                    //--------------------------------------------------
                    // Position code passed to the triphone lookup:
                    //   's' - both cur and next are word start
                    //   'b' - cur is word start, next is not
                    //   'e' - next is word start, cur is not
                    //   0   - neither
                    //--------------------------------------------------
                    cPos = '\0';
                    if( curF & WORD_START_FLAG )
                    {
                        if( nextF & WORD_START_FLAG )
                        {
                            cPos = 's';
                        }
                        else
                        {
                            cPos = 'b';
                        }
                    }
                    else if( nextF & WORD_START_FLAG )
                    {
                        cPos = 'e';
                    }

                    HRESULT hrt;
                    hrt = GetTriphoneID( m_pForest,
                                         curID,
                                         prevID,
                                         nextID,
                                         cPos,
                                         m_pd,
                                         &senoneID);
                    if( FAILED(hrt) )
                    {
                        //------------------------------------------------
                        // Instead of failing, I'll be robust and ignore
                        // the error. Force triphone to something that's
                        // valid.
                        //------------------------------------------------
                        senoneID = 0;
                    }
                    pUnits[i].UnitID = (m_pForest->gsOffset[curID] -
                                        m_First_Context_Phone) + (senoneID + 1);
                    pUnits[i].SenoneID = senoneID;

                    //-----------------------------
                    // Get phon name strings
                    //-----------------------------
                    // Bounded copy so an over-long name cannot run past
                    // the end of szUnitName; always NUL terminated.
                    // NOTE(review): relies on szUnitName being a char
                    // array member of UNIT_CVT - confirm against header.
                    char *pName;
                    pName = PhonFromID( m_pd, pUnits[i].PhonID );
                    if( pName )
                    {
                        strncpy( &pUnits[i].szUnitName[0], pName,
                                 sizeof(pUnits[i].szUnitName) - 1 );
                        pUnits[i].szUnitName[sizeof(pUnits[i].szUnitName) - 1] = 0;
                    }
                    else
                    {
                        pUnits[i].szUnitName[0] = 0;
                    }

                    //-----------------------------
                    // Get unit stats
                    //-----------------------------
                    // m_SenoneBlock[curID] is a byte offset, relative to
                    // the start of the block, of this phon's stats array.
                    pStats = (UNALIGNED UNIT_STATS*)(m_SenoneBlock[curID] + (char*)m_SenoneBlock);
                    pStats = &pStats[senoneID];
                    pUnits[i].Dur = pStats->dur / 1000.0f;      // ms -> sec
                    pUnits[i].Amp = pStats->amp;
                    pUnits[i].AmpRatio = (float)sqrt(pStats->ampRatio);

                    //----------------------------------------------------------
                    // Looks like the "SENONE" table durations are
                    // incorrect (not even close!).
                    // Calc the real duration from inv epochs
                    // TODO: Make new table in voice data block
                    // (If the call below is ever re-enabled, stop the loop
                    //  when it fails.)
                    //----------------------------------------------------------
                    //hr = GetUnitDur( pUnits[i].UnitID, &pUnits[i].Dur );
                }
            }
        }
    }
    return hr;
} /* CVoiceDataObj::GetUnitIDs */
/*****************************************************************************
* GetDataBlock *
*--------------*
* Description:
* Return ptr and length of specified voice data block. +++
*
********************************************************************** MC ***/
HRESULT CVoiceDataObj::GetDataBlock( VOICEDATATYPE type, char **ppvOut, ULONG *pdwSize )
{
    SPDBG_FUNC( "CVoiceDataObj::GetDataBlock" );

    //--- Without mapped voice data there is no table to consult
    if( m_pVoiceData == NULL )
    {
        return E_INVALIDARG;
    }

    //--- The table starts at 'PhonOffset' and holds one offset/length
    //    pair of longs per block type
    long *pTable = (long*)&m_pVoiceData->PhonOffset;
    long *pEntry = pTable + ((long)type * 2);

    *ppvOut  = ((char*)m_pVoiceData) + pEntry[0];   // Offset -> abs address
    *pdwSize = pEntry[1];                           // Block length

    return S_OK;
} /* CVoiceDataObj::GetDataBlock */
/*****************************************************************************
* InitVoiceData *
*---------------*
* Description:
* Create pointers to voice data blocks from m_pVoiceData offsets.+++
*
********************************************************************** MC ***/
HRESULT CVoiceDataObj::InitVoiceData()
{
    SPDBG_FUNC( "CVoiceDataObj::InitVoiceData" );
    char *pBlock;
    ULONG cbBlock;

    //------------------------------------------
    // Check data type and version
    //------------------------------------------
    const bool fIsVoiceFile = (m_pVoiceData != NULL)
                           && (m_pVoiceData->Type == MS_DATA_TYPE)
                           && (m_pVoiceData->Version == HEADER_VERSION);
    if( !fIsVoiceFile )
    {
        // Not a voice file!
        return E_FAIL;
    }

    //--- PHONs
    HRESULT hr = GetDataBlock( MSVD_PHONE, &pBlock, &cbBlock );
    m_pd = (PHON_DICT*)pBlock;

    //--- TREE
    if( SUCCEEDED(hr) )
    {
        hr = GetDataBlock( MSVD_TREEIMAGE, &pBlock, &cbBlock );
        m_pForest = (TRIPHONE_TREE*)pBlock;
    }

    //--- SENONE
    if( SUCCEEDED(hr) )
    {
        hr = GetDataBlock( MSVD_SENONE, &pBlock, &cbBlock );
        m_SenoneBlock = (long*)pBlock;
    }

    //--- ALLOID (the allophone count is the block length divided by 8)
    if( SUCCEEDED(hr) )
    {
        hr = GetDataBlock( MSVD_ALLOID, &pBlock, &cbBlock );
        m_AlloToUnitTbl = (short*)pBlock;
        m_NumOfAllos = cbBlock / 8;
    }

    if( SUCCEEDED(hr) )
    {
        m_First_Context_Phone = m_pd->numCiPhones;
        m_Sil_Index = PhonToID( m_pd, "SIL" );

        //-----------------------------------------------------
        // Init voice data INVENTORY parameters
        //-----------------------------------------------------
        hr = GetDataBlock( MSVD_INVENTORY, &pBlock, &cbBlock );
        if( SUCCEEDED(hr) )
        {
            m_pInv = (INVENTORY*)pBlock;
            char *pInvBase = (char*)m_pInv;

            //--- Inventory-relative offsets become absolute pointers
            m_pUnit   = (long*)(pInvBase + m_pInv->UnitsOffset);
            m_pTrig   = (float*)(pInvBase + m_pInv->TrigOffset);
            m_pWindow = (float*)(pInvBase + m_pInv->WindowOffset);
            m_pGauss  = (float*)(pInvBase + m_pInv->pGaussOffset);

            //--- Scalar parameters
            m_CompressionType = m_pVoiceDef->CompressionType;
            m_SampleRate      = (float)m_pInv->SampleRate;
            m_FFTSize         = m_pInv->FFTSize;
            m_cOrder          = m_pInv->cOrder;
            m_NumOfUnits      = m_pInv->cNumUnits;
            m_GaussID         = 0;
        }
    }

    return hr;
} /* CVoiceDataObj::InitVoiceData */
/*****************************************************************************
* CVoiceDataObj::DecompressUnit *
*-------------------------------*
* Description:
* Decompress acoustic unit.+++
*
* INPUT:
* UnitID - unit number (1 - 3333 typ)
*
* OUTPUT:
* Fills pSynth if success
*
********************************************************************** MC ***/
HRESULT CVoiceDataObj::DecompressUnit( ULONG UnitID, MSUNITDATA* pSynth )
{
    //--------------------------------------------------------------------
    // Decodes inventory unit 'UnitID' into *pSynth.
    //
    // The unit's stored stream is read in this order:
    //   1. epoch count (a long)
    //   2. RLE compressed epoch lengths
    //   3. one LSP codebook index per LPC book, for every epoch
    //   4. one residual gain (float) per epoch
    //   5. per VOICED epoch, one index per residual (or delta) book
    //
    // pSynth->pEpoch, pLPC and pRes are allocated here with new[].
    // pSynth->pGain is NOT allocated: it points into the inventory data.
    // On failure the three allocations are released and set to NULL.
    //
    // 'UnitID' is not range checked here.
    //--------------------------------------------------------------------
    SPDBG_FUNC( "CVoiceDataObj::DecompressUnit" );
    long i, j, k, cNumEpochs, cBytes, cOrder = 0, VectDim;
    long frameSize, cNumBins, startBin;
    char *pCurStor;
    unsigned char index;
    float pLSP[MAX_LPCORDER], pFFT[MAX_FFTSIZE], pRes[MAX_FFTSIZE], Gain;
    float *pCurLSP, *pCurLPC, *pMean, *pCurRes;
    HRESULT hr = S_OK;

    memset( pSynth, 0, sizeof(MSUNITDATA) );

    //-----------------------------------------
    // Pointer to unit data from inventory
    //-----------------------------------------
    pCurStor = (char*)((char*)m_pInv + m_pUnit[UnitID] );      // Rel to abs

    //---------------------------------
    // Get epoch count - 'cNumEpochs'
    //---------------------------------
    cBytes = sizeof(long);
    memcpy( &cNumEpochs, pCurStor, cBytes );
    pSynth->cNumEpochs = cNumEpochs;
    pCurStor += cBytes;

    //---------------------------------
    // Get epoch lengths - 'pEpoch'
    //---------------------------------
    pSynth->pEpoch = new float[cNumEpochs];
    if( pSynth->pEpoch == NULL )
    {
        hr = E_OUTOFMEMORY;
    }

    if( SUCCEEDED(hr) )
    {
        cBytes = DecompressEpoch( (signed char *) pCurStor, cNumEpochs, pSynth->pEpoch );
        pCurStor += cBytes;

        //+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-
        //
        // Uncompress LPC coefficients...
        //
        //+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-
        cOrder = m_pInv->cOrder;
        pSynth->cOrder = cOrder;
        pSynth->pLPC = new float[cNumEpochs * (1 + cOrder)];
        if( pSynth->pLPC == NULL )
        {
            hr = E_OUTOFMEMORY;
        }
    }

    if( SUCCEEDED(hr) )
    {
        pCurLPC = pSynth->pLPC;
        //---------------------------------
        // ... for each epoch
        //---------------------------------
        for( i = 0; i < cNumEpochs; i++, pCurLPC += (1 + cOrder) )
        {
            //-------------------------------------
            // Decode quantized LSP's...
            //-------------------------------------
            pCurLSP = pLSP;
            for( k = 0; k < m_pInv->cNumLPCBooks; k++ )
            {
                VectDim = m_pInv->LPCBook[k].cCodeDim;
                memcpy( &index, pCurStor, sizeof(char));
                pCurStor += sizeof(char);
                pMean = ((float*)((char*)m_pInv + m_pInv->LPCBook[k].pData)) + (index * VectDim);
                for( j = 0; j < VectDim; j++ )
                    pCurLSP[j] = pMean[j];
                pCurLSP += VectDim;
            }
            //--------------------------------------------------
            // ...then convert to predictor coefficients
            // (LSP's quantize better than PC's)
            //--------------------------------------------------
            LSPtoPC( pLSP, pCurLPC, cOrder, i );
        }

        //---------------------------------------
        // Get pointer to residual gains
        //---------------------------------------
        cBytes = cNumEpochs * sizeof(float);
        pSynth->pGain = (float*) pCurStor;
        pCurStor += cBytes;

        //+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-
        //
        // Uncompress residual waveform
        //
        //+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-
        //--------------------------------------------
        // First, figure out the buffer length...
        //--------------------------------------------
        pSynth->cNumSamples = 0;
        for( j = 0; j < cNumEpochs; j++ )
        {
            pSynth->cNumSamples += (long) ABS(pSynth->pEpoch[j]);
        }
        //--------------------------------------------
        // ...get buffer memory...
        //--------------------------------------------
        pSynth->pRes = new float[pSynth->cNumSamples];
        if( pSynth->pRes == NULL )
        {
            hr = E_OUTOFMEMORY;
        }
    }

    if( SUCCEEDED(hr) )
    {
        //--------------------------------------------
        // ...and fill with uncompressed residual
        //--------------------------------------------
        pCurRes = pSynth->pRes;
        for( i = 0; i < (long)pSynth->cNumEpochs; i++ )
        {
            //-------------------------------------
            // Get epoch length
            //-------------------------------------
            frameSize = (long)(ABS(pSynth->pEpoch[i]));

            // restore whisper
            //if( (pSynth->pEpoch[i] > 0) && !(m_fModifiers & BACKEND_BITFLAG_WHISPER) )
            if( pSynth->pEpoch[i] > 0 )
            {
                //-----------------------------------------------
                // VOICED epoch
                //-----------------------------------------------
                if( (m_pInv->cNumDresBooks == 0) || (i == 0) || (pSynth->pEpoch[i - 1] < 0) )
                {
                    //--------------------------------------
                    // Do static quantization
                    //--------------------------------------
                    for( j = 0; j < m_pInv->FFTSize; j++ )
                    {
                        pFFT[j] = 0.0f;
                    }
                    startBin = 1;
                    for( k = 0; k < m_pInv->cNumResBooks; k++ )
                    {
                        VectDim = m_pInv->ResBook[k].cCodeDim;
                        cNumBins = VectDim / 2;
                        memcpy( &index, pCurStor, sizeof(char) );
                        pCurStor += sizeof(char);
                        //------------------------------------------
                        // Uncompress spectrum using 'pResBook'
                        //------------------------------------------
                        pMean = ((float*)((char*)m_pInv + m_pInv->ResBook[k].pData)) + (index * VectDim);
                        PutSpectralBand( pFFT, pMean, startBin, cNumBins, m_pInv->FFTSize );
                        startBin += cNumBins;
                    }
                }
                else
                {
                    //--------------------------------------
                    // Do delta quantization
                    // (adds to the spectrum left in 'pFFT'
                    //  by the previous voiced epoch)
                    //--------------------------------------
                    startBin = 1;
                    for( k = 0; k < m_pInv->cNumDresBooks; k++ )
                    {
                        VectDim = m_pInv->DresBook[k].cCodeDim;
                        cNumBins = VectDim / 2;
                        memcpy( &index, pCurStor, sizeof(char));
                        pCurStor += sizeof(char);
                        //------------------------------------------
                        // Uncompress spectrum using 'pDresBook'
                        //------------------------------------------
                        pMean = ((float*)((char*)m_pInv + m_pInv->DresBook[k].pData)) + (index * VectDim);
                        AddSpectralBand( pFFT, pMean, startBin, cNumBins, m_pInv->FFTSize );
                        startBin += cNumBins;
                    }
                }

                //--------------------------------------------------------
                // Convert quantized FFT back to time residual
                //--------------------------------------------------------
                memcpy( pRes, pFFT, m_pInv->FFTSize * sizeof(float) );     // preserve original for delta residual
                InverseFFT( pRes, m_pInv->FFTSize, m_pInv->FFTOrder, m_pTrig );
                GainDeNormalize( pRes, (long)m_pInv->FFTSize, ((UNALIGNED float*)pSynth->pGain)[i] );
                SetEpochLen( pCurRes, frameSize, pRes, m_pInv->FFTSize );
            }
            else
            {
                //-----------------------------------------------
                // UNVOICED epoch
                // NOTE: Assumes 'm_pGauss' is 1 sec
                //-----------------------------------------------
                Gain = 0.02f * ((UNALIGNED float*)pSynth->pGain)[i];
                if( m_GaussID + frameSize >= m_pInv->SampleRate)
                {
                    // Wrap back to the start of the noise table
                    m_GaussID = 0;
                }
                //----------------------------------------------------------
                // Generate gaussian random noise for unvoiced sounds
                //----------------------------------------------------------
                for( j = 0; j < frameSize; j++ )
                {
                    pCurRes[j] = Gain * m_pGauss[j + m_GaussID];
                }
                m_GaussID += frameSize;
            }

            // restore whisper
            /*if( (pSynth->pEpoch[i] > 0) && m_fModifiers & BACKEND_BITFLAG_WHISPER)
            {
                pSynth->pEpoch[i] = - pSynth->pEpoch[i];
            }*/
            pCurRes += frameSize;
        }
    }

    if( FAILED(hr) )
    {
        //----------------------------------
        // Cleanup allocated memory.
        // All three buffers come from new[],
        // so they must go back via delete[].
        //----------------------------------
        if( pSynth->pEpoch )
        {
            delete[] pSynth->pEpoch;
            pSynth->pEpoch = NULL;
        }
        if( pSynth->pRes )
        {
            delete[] pSynth->pRes;
            pSynth->pRes = NULL;
        }
        if( pSynth->pLPC )
        {
            delete[] pSynth->pLPC;
            pSynth->pLPC = NULL;
        }
    }
    return hr;
} /* CVoiceDataObj::DecompressUnit */
/*****************************************************************************
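* CVoiceDataObj::GetUnitDur *
*---------------------------*
* Description:
* Computes the duration of an acoustic unit by summing the absolute
* lengths of its decompressed epochs. +++
*
* INPUT:
* UnitID - unit number (1 - 3333 typ)
*
* OUTPUT:
* Fills pDur with the summed epoch lengths divided by 22050
*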
********************************************************************** MC ***/
HRESULT CVoiceDataObj::GetUnitDur( ULONG UnitID, float* pDur )
{
    //--------------------------------------------------------------------
    // Sums the absolute epoch lengths of inventory unit 'UnitID' and
    // writes the total divided by 22050 to *pDur.
    //
    // *pDur is always written; it is 0 when the unit ID is out of range
    // (E_INVALIDARG) or the epoch buffer cannot be allocated
    // (E_OUTOFMEMORY).
    //
    // NOTE(review): the divisor is a fixed 22050 rather than the
    // inventory's own sample rate - confirm this is intended.
    //--------------------------------------------------------------------
    SPDBG_FUNC( "CVoiceDataObj::GetUnitDur" );
    char *pCurStor;
    float *pEpoch = NULL;
    long cBytes, cNumEpochs, i;
    float totalDur;
    HRESULT hr = S_OK;

    totalDur = 0;

    if( UnitID > m_NumOfUnits )
    {
        //--------------------------
        // ID is out of range!
        //--------------------------
        hr = E_INVALIDARG;
    }

    if( SUCCEEDED(hr) )
    {
        //-----------------------------------------
        // Pointer to unit data from inventory
        //-----------------------------------------
        pCurStor = (char*)((char*)m_pInv + m_pUnit[UnitID] );      // Rel to abs

        //---------------------------------
        // Get epoch count - 'cNumEpochs'
        //---------------------------------
        cBytes = sizeof(long);
        memcpy( &cNumEpochs, pCurStor, cBytes );
        pCurStor += cBytes;

        //---------------------------------
        // Get epoch lengths - 'pEpoch'
        //---------------------------------
        pEpoch = new float[cNumEpochs];
        if( pEpoch == NULL )
        {
            hr = E_OUTOFMEMORY;
        }

        if( SUCCEEDED(hr) )
        {
            cBytes = DecompressEpoch( (signed char *) pCurStor, cNumEpochs, pEpoch );
            for( i = 0; i < cNumEpochs; i++)
            {
                totalDur += ABS(pEpoch[i]);
            }
        }
    }
    *pDur = totalDur / 22050;

    //----------------------------------
    // Cleanup allocated memory.
    // 'pEpoch' comes from new[], so it
    // must be released with delete[].
    //----------------------------------
    if( pEpoch )
    {
        delete[] pEpoch;
    }
    return hr;
} /* CVoiceDataObj::GetUnitDur */
/*****************************************************************************
* CVoiceDataObj::DecompressEpoch *
*--------------------------------*
* Description:
* Decompress epoch len stream from RLE. Fills 'pEpoch' with lengths.
* Returns number of 'rgbyte' src bytes consumed.
*
********************************************************************** MC ***/
long CVoiceDataObj::DecompressEpoch( signed char *rgbyte, long cNumEpochs, float *pEpoch )
{
    SPDBG_FUNC( "CVoiceDataObj::DecompressEpoch" );
    long srcPos = 0;
    long epoch;

    for( epoch = 0; epoch < cNumEpochs; ++epoch, ++srcPos )
    {
        const signed char first = rgbyte[srcPos];
        float length = (float)first;

        //------------------------------------------------------------
        // A byte at either limit (127 for VOICED, -128 for UNVOICED)
        // means the length continues: keep adding the following bytes
        // until one that is not at that same limit has been added.
        // Any other byte is the complete length by itself.
        //------------------------------------------------------------
        if( (first == 127) || (first == -128) )
        {
            while( rgbyte[srcPos] == first )
            {
                length += rgbyte[++srcPos];
            }
        }

        pEpoch[epoch] = length;
    }

    //--- Number of source bytes consumed
    return srcPos;
} /* CVoiceDataObj::DecompressEpoch */
/*****************************************************************************
* LSPCompare *
*------------*
* Description:
* QSORT callback
*
********************************************************************** MC ***/
static int __cdecl LSPCompare( const void *a, const void *b )
{
    SPDBG_FUNC( "LSPCompare" );

    //--- Both arguments point at floats
    const float lhs = *((PFLOAT) a);
    const float rhs = *((PFLOAT) b);

    if( lhs > rhs )
    {
        return 1;
    }
    if( lhs == rhs )
    {
        return 0;
    }
    return -1;
} /* LSPCompare */
/*****************************************************************************
* CVoiceDataObj::OrderLSP *
*-------------------------*
* Description:
* This routine reorders the LSP frequencies so that they are monotonic
*
********************************************************************** MC ***/
long CVoiceDataObj::OrderLSP( PFLOAT pLSPFrame, INT cOrder )
{
    SPDBG_FUNC( "CVoiceDataObj::OrderLSP" );

    //--- Note whether the frame was already in non-decreasing order
    long fWasOrdered = true;
    long n;
    for( n = 1; n < cOrder; n++ )
    {
        if( pLSPFrame[n] < pLSPFrame[n - 1] )
        {
            fWasOrdered = false;
        }
    }

    //--- The frame is sorted in place either way
    qsort( (void *) pLSPFrame, (size_t) cOrder, (size_t) sizeof (float), LSPCompare );

    return fWasOrdered;
} /* CVoiceDataObj::OrderLSP */
/*****************************************************************************
* CVoiceDataObj::LSPtoPC *
*------------------------*
* Description:
* Converts line spectral frequencies to LPC predictor coefficients.
*
********************************************************************** MC ***/
void CVoiceDataObj::LSPtoPC( float *pLSP, float *pLPC, long cOrder, long /*frame*/ )
{
//----------------------------------------------------------------------
// Converts the 'cOrder' values in 'pLSP' into predictor coefficients.
//
// pLSP   - in/out: LSP values; re-sorted in place when they are not
//          strictly increasing
// pLPC   - out: receives cOrder + 1 values, pLPC[0] always being 1.0
// cOrder - number of LSP values
// The fourth parameter is unnamed and unused.
//
// NOTE(review): the work arrays below are sized by MAXNO and 'cOrder'
// is not checked against it here - confirm callers keep cOrder <= MAXNO.
//----------------------------------------------------------------------
SPDBG_FUNC( "CVoiceDataObj::LSPtoPC" );
long i, j, k, noh;
double freq[MAXNO], p[MAXNO / 2], q[MAXNO / 2];
double a[MAXNO / 2 + 1], a1[MAXNO / 2 + 1], a2[MAXNO / 2 + 1];
double b[MAXNO / 2 + 1], b1[MAXNO / 2 + 1], b2[MAXNO / 2 + 1];
double pi, xx, xf;
//----------------------------------
// Check for non-monotonic LSPs
//----------------------------------
for( i = 1; i < cOrder; i++ )
{
if( pLSP[i] <= pLSP[i - 1] )
{
//-----------------------------
// Reorder LSPs
// (one sort fixes the whole
// frame, so stop scanning)
//-----------------------------
OrderLSP( pLSP, cOrder );
break;
}
}
//--------------------------
// Initialization
//--------------------------
// NOTE(review): the local is named 'pi' but is loaded from KTWOPI,
// whose value is defined outside this file - confirm the scaling
// expected of the LSP values.
pi = KTWOPI;
// noh = number of second-order sections in each of the two chains
noh = cOrder / 2;
for( j = 0; j < cOrder; j++ )
{
freq[j] = pLSP[j];
}
// Clear the outputs and the two delay elements of every section
for( i = 0; i < noh + 1; i++ )
{
a[i] = 0.0f;
a1[i] = 0.0f;
a2[i] = 0.0f;
b[i] = 0.0f;
b1[i] = 0.0f;
b2[i] = 0.0f;
}
//-------------------------------------
// LSP filter parameters
// (even-indexed values feed the 'a'
// chain, odd-indexed the 'b' chain)
//-------------------------------------
for( i = 0; i < noh; i++ )
{
p[i] = - 2.0 * cos( pi * freq[2 * i] );
q[i] = - 2.0 * cos( pi * freq[2 * i + 1] );
}
//-------------------------------------
// Impulse response of analysis filter
//-------------------------------------
xf = 0.0f;
for( k = 0; k < cOrder + 1; k++ )
{
// Input sample: 1 at k == 0, 0 afterwards (unit impulse)
xx = 0.0f;
if( k == 0 )
{
xx = 1.0f;
}
// 'xf' holds the previous input sample
a[0] = xx + xf;
b[0] = xx - xf;
xf = xx;
// Run both chains one step; a1/a2 and b1/b2 are each section's
// previous two inputs and are updated after use
for( i = 0; i < noh; i++ )
{
a[i + 1] = a[i] + p[i] * a1[i] + a2[i];
b[i + 1] = b[i] + q[i] * b1[i] + b2[i];
a2[i] = a1[i];
a1[i] = a[i];
b2[i] = b1[i];
b1[i] = b[i];
}
// The k == 0 output is skipped; outputs 1..cOrder land in pLPC[0..cOrder-1]
if( k != 0)
{
pLPC[k - 1] = (float) (- 0.5 * (a[noh] + b[noh]));
}
}
//-------------------------------------------------------
// Convert to predictor coefficient array configuration
// (negate and shift up by one slot; walking from the top
// down keeps unread values from being overwritten)
//-------------------------------------------------------
for( i = cOrder - 1; i >= 0; i-- )
{
pLPC[i + 1] = - pLPC[i];
}
pLPC[0] = 1.0f;
} /* CVoiceDataObj::LSPtoPC */
/*****************************************************************************
* CVoiceDataObj::PutSpectralBand *
*--------------------------------*
* Description:
* This routine copies the frequency band specified by StartBin as
* its initial FFT bin, and containing cNumBins.
*
********************************************************************** MC ***/
void CVoiceDataObj::PutSpectralBand( float *pFFT, float *pBand, long StartBin,
                                     long cNumBins, long FFTSize )
{
    SPDBG_FUNC( "CVoiceDataObj::PutSpectralBand" );
    long n;

    //--- First cNumBins band values go to pFFT[StartBin] onwards
    float *pLow = pFFT + StartBin;
    for( n = 0; n < cNumBins; n++ )
    {
        pLow[n] = pBand[n];
    }

    //--- Remaining cNumBins band values go to
    //    pFFT[FFTSize - (StartBin - 1 + cNumBins)] onwards
    float *pHigh = pFFT + (FFTSize - (StartBin - 1 + cNumBins));
    float *pUpperSrc = pBand + cNumBins;
    for( n = 0; n < cNumBins; n++ )
    {
        pHigh[n] = pUpperSrc[n];
    }
} /* CVoiceDataObj::PutSpectralBand */
/*****************************************************************************
* CVoiceDataObj::AddSpectralBand *
*--------------------------------*
* Description:
* This routine adds the frequency band specified by StartBin as
* its initial FFT bin, and containing cNumBins, to the existing band.
*
********************************************************************** MC ***/
void CVoiceDataObj::AddSpectralBand( float *pFFT, float *pBand, long StartBin,
                                     long cNumBins, long FFTSize )
{
    SPDBG_FUNC( "CVoiceDataObj::AddSpectralBand" );
    long n;

    //--- First cNumBins band values are added at pFFT[StartBin] onwards
    float *pLow = pFFT + StartBin;
    for( n = 0; n < cNumBins; n++ )
    {
        pLow[n] += pBand[n];
    }

    //--- Remaining cNumBins band values are added at
    //    pFFT[FFTSize - (StartBin - 1 + cNumBins)] onwards
    float *pHigh = pFFT + (FFTSize - (StartBin - 1 + cNumBins));
    float *pUpperSrc = pBand + cNumBins;
    for( n = 0; n < cNumBins; n++ )
    {
        pHigh[n] += pUpperSrc[n];
    }
} /* CVoiceDataObj::AddSpectralBand */
/*****************************************************************************
* CVoiceDataObj::InverseFFT *
*---------------------------*
* Description:
* This subroutine computes a split-radix IFFT for real data
* It is a C version of the FORTRAN program in "Real-Valued
* Fast Fourier Transform Algorithms" by H. Sorensen et al.
* in Trans. on ASSP, June 1987, pp. 849-863. It uses half
* of the operations than its counterpart for complex data.
* *
* Length is n = 2^(fftOrder). Decimation in frequency. Result is
* in place. It uses table look-up for the trigonometric functions.
*
* Input order: *
* (Re[0], Re[1], ... Re[n/2], Im[n/2 - 1]...Im[1])
* Output order:
* (x[0], x[1], ... x[n - 1])
* The output transform exhibit hermitian symmetry (i.e. real
* part of transform is even while imaginary part is odd).
* Hence Im[0] = Im[n/2] = 0; and n memory locations suffice.
*
********************************************************************** MC ***/
void CVoiceDataObj::InverseFFT( float *pDest, long fftSize, long fftOrder, float *sinePtr )
{
SPDBG_FUNC( "CVoiceDataObj::InverseFFT" );
//--- In-place inverse FFT over pDest[0 .. fftSize - 1].
//    pDest    - packed spectrum on entry (layout given in the function
//               header); overwritten with the result.
//    fftSize  - number of floats in pDest.
//    fftOrder - controls the stage count: the butterfly loop below runs
//               fftOrder - 1 times. The header states fftSize = 2^fftOrder;
//               this is not checked here.
//    sinePtr  - trig lookup table; cosine values are read from the same
//               table starting fftSize / 2 entries in.
//    NOTE(review): the table must be long enough for index
//    fftSize / 2 + 3 * ia used below -- confirm against the code that
//    builds it.
long n1, n2, n4, n8, i0, i1, i2, i3, i4, i5, i6, i7, i8;
long is, id, i, j, k, ie, ia, ia3;
float xt, t1, t2, t3, t4, t5, *cosPtr, r1, cc1, cc3, ss1, ss3;
cosPtr = sinePtr + (fftSize / 2);
//---------------------------------
// L shaped butterflies
//---------------------------------
//--- n2 is halved at the top of every stage, so the first stage works
//    with n2 == fftSize. ie is the table stride and doubles per stage.
n2 = 2 * fftSize;
ie = 1;
for( k = 1; k < fftOrder; k++ )
{
is = 0;
id = n2;
n2 = n2 / 2;
n4 = n2 / 4;
n8 = n4 / 2;
ie *= 2;
//--- Butterflies that need no table lookup. 'is' is the start offset
//    and 'id' the spacing of the blocks handled by the inner for loop;
//    both are advanced at the bottom of each while pass.
while( is < fftSize - 1 )
{
for( i = is; i < fftSize; i += id )
{
i1 = i;
i2 = i1 + n4;
i3 = i2 + n4;
i4 = i3 + n4;
t1 = pDest[i1] - pDest[i3];
pDest[i1] = pDest[i1] + pDest[i3];
pDest[i2] = 2 * pDest[i2];
pDest[i3] = t1 - 2 * pDest[i4];
pDest[i4] = t1 + 2 * pDest[i4];
if( n4 > 1 )
{
//--- Same four positions shifted by n8.
//    K2 is defined outside this function -- presumably 1/sqrt(2)
//    as in the referenced algorithm; confirm.
i1 = i1 + n8;
i2 = i2 + n8;
i3 = i3 + n8;
i4 = i4 + n8;
t1 = K2 * (pDest[i2] - pDest[i1]);
t2 = K2 * (pDest[i4] + pDest[i3]);
pDest[i1] = pDest[i1] + pDest[i2];
pDest[i2] = pDest[i4] - pDest[i3];
pDest[i3] = - 2 * (t1 + t2);
pDest[i4] = 2 * (t1 - t2);
}
}
is = 2 * id - n2;
id = 4 * id;
}
//--- Remaining butterflies of this stage, one pass per j in [1, n8).
//    Each pass looks up cos/sin at table index ia (= j * ie) and at
//    3 * ia.
ia = 0;
for( j = 1; j < n8; j++ )
{
ia += ie;
ia3 = 3 * ia;
cc1 = cosPtr[ia];
ss1 = sinePtr[ia];
cc3 = cosPtr[ia3];
ss3 = sinePtr[ia3];
is = 0;
id = 2 * n2;
while( is < fftSize - 1 )
{
for( i = is; i < fftSize; i += id )
{
//--- i1..i4 step forward from i + j, i5..i8 step forward from
//    i + n4 - j, each in increments of n4.
i1 = i + j;
i2 = i1 + n4;
i3 = i2 + n4;
i4 = i3 + n4;
i5 = i + n4 - j;
i6 = i5 + n4;
i7 = i6 + n4;
i8 = i7 + n4;
t1 = pDest[i1] - pDest[i6];
pDest[i1] = pDest[i1] + pDest[i6];
t2 = pDest[i5] - pDest[i2];
pDest[i5] = pDest[i2] + pDest[i5];
t3 = pDest[i8] + pDest[i3];
pDest[i6] = pDest[i8] - pDest[i3];
t4 = pDest[i4] + pDest[i7];
pDest[i2] = pDest[i4] - pDest[i7];
t5 = t1 - t4;
t1 = t1 + t4;
t4 = t2 - t3;
t2 = t2 + t3;
pDest[i3] = t5 * cc1 + t4 * ss1;
pDest[i7] = - t4 * cc1 + t5 * ss1;
pDest[i4] = t1 * cc3 - t2 * ss3;
pDest[i8] = t2 * cc3 + t1 * ss3;
}
is = 2 * id - n2;
id = 4 * id;
}
}
}
//---------------------------------
// length two butterflies
//---------------------------------
//--- Sum/difference of adjacent pairs (i0, i0 + 1), visited with the
//    same is/id stepping scheme as above.
is = 0;
id = 4;
while( is < fftSize - 1 )
{
for( i0 = is; i0 < fftSize; i0 += id )
{
i1 = i0 + 1;
r1 = pDest[i0];
pDest[i0] = r1 + pDest[i1];
pDest[i1] = r1 - pDest[i1];
}
is = 2 * (id - 1);
id = 4 * id;
}
//---------------------------------
// digit reverse counter
//---------------------------------
//--- j is maintained as the bit-reversed counterpart of i; elements
//    are swapped only when i < j so each pair is exchanged once.
j = 0;
n1 = fftSize - 1;
for( i = 0; i < n1; i++ )
{
if( i < j )
{
xt = pDest[j];
pDest[j] = pDest[i];
pDest[i] = xt;
}
//--- Advance j: clear leading set bits from the top, then set the
//    first clear one.
k = fftSize / 2;
while( k <= j )
{
j -= k;
k /= 2;
}
j += k;
}
//--- Final scaling: every sample is divided by fftSize.
for( i = 0; i < fftSize; i++ )
{
pDest[i] /= fftSize;
}
} /* CVoiceDataObj::InverseFFT */
/*****************************************************************************
* CVoiceDataObj::SetEpochLen *
*----------------------*
* Description:
* Copy residual epoch to 'OutSize' length from 'pInRes' to 'pOutRes'
*
********************************************************************** MC ***/
void CVoiceDataObj::SetEpochLen( float *pOutRes, long OutSize, float *pInRes,
                                 long InSize )
{
    SPDBG_FUNC( "CVoiceDataObj::SetEpochLen" );
    long j, curFrame;

    //--- Resize a residual epoch from InSize to OutSize samples.
    //    pOutRes - destination, OutSize floats, fully overwritten
    //    pInRes  - source epoch, InSize floats, read only
    //
    //    curFrame is the number of samples taken from EACH end of the
    //    input: at most half the input, and never more than the output
    //    can hold.
    curFrame = MIN(InSize / 2, OutSize);
    if( curFrame < 0 )
    {
        //--- Negative sizes would make the zero-fill loop below start
        //    before pOutRes[0]; treat them as "nothing to copy".
        curFrame = 0;
    }

    //-------------------------------
    // Copy head of SRC to head of DEST
    //-------------------------------
    for( j = 0; j < curFrame; j++ )
    {
        pOutRes[j] = pInRes[j];
    }

    //-------------------------------
    // Zero the rest of DEST
    //-------------------------------
    for( j = curFrame; j < OutSize; j++ )
    {
        pOutRes[j] = 0.0f;
    }

    //-------------------------------
    // Add the last curFrame samples of SRC onto the last curFrame
    // samples of DEST. When DEST is shorter than the two halves
    // together, head and tail overlap and are mixed.
    //-------------------------------
    for( j = OutSize - curFrame; j < OutSize; j++ )
    {
        pOutRes[j] += pInRes[InSize - OutSize + j];
    }
} /* CVoiceDataObj::SetEpochLen */
/*****************************************************************************
* CVoiceDataObj::GainDeNormalize *
*--------------------------------*
* Description:
* Scale residual to given gain.
*
********************************************************************** MC ***/
void CVoiceDataObj::GainDeNormalize( float *pRes, long FFTSize, float Gain )
{
    SPDBG_FUNC( "CVoiceDataObj::GainDeNormalize" );

    //--- Multiply each of the first FFTSize samples of pRes by Gain,
    //    in place.
    long iSample = 0;
    while( iSample < FFTSize )
    {
        pRes[iSample] = pRes[iSample] * Gain;
        ++iSample;
    }
} /* CVoiceDataObj::GainDeNormalize */
/*****************************************************************************
* CVoiceDataObj::PhonHashLookup *
*-------------------------------*
* Description:
* Lookup 'sym' in 'ht' and place its associated value in
* *val. If sym is not found place its key in *val.
* RETURN
* Return 0 indicating we found the 'sym' in the table.
* Return -1 'sym' is not in ht.
*
********************************************************************** MC ***/
long CVoiceDataObj::PhonHashLookup(
    PHON_DICT *pPD,     // the hash table
    char *sym,          // The symbol to look up
    long *val )         // Phon ID
{
    SPDBG_FUNC( "CVoiceDataObj::PhonHashLookup" );
    char            *cp;
    unsigned long   key;
    unsigned long   cProbes;
    long            i;
    HASH_TABLE      *ht;
    char            *pStr;
    HASH_ENTRY      *pHE;

    ht  = &pPD->phonHash;
    pHE = (HASH_ENTRY*)((char*)pPD + ht->entryArrayOffs);   // Offset to Abs address

    //--------------------------------------------------------
    // Hash the symbol: each character is shifted left by a
    // count that cycles 15, 14, ... 0, 15, ... and summed.
    // The loop tests the terminator BEFORE consuming a
    // character, so an empty string hashes to 0 without
    // reading past its terminator. Non-empty strings produce
    // the same key as before.
    //--------------------------------------------------------
    key = 0;
    i   = -1;
    for( cp = sym; *cp; )
    {
        key += *cp++ << (0xF & i--);
    }

    if( ht->size == 0 )
    {
        //------------------------------
        // Empty table: nothing can match
        // (and key % 0 must be avoided)
        //------------------------------
        *val = 0;
        return -1;
    }

    //--------------------------------------------------------
    // Linear probing, wrapping at the table size. At most
    // ht->size slots are examined so a completely full table
    // cannot spin forever on a missing symbol.
    //--------------------------------------------------------
    for( cProbes = 0; cProbes < (unsigned long) ht->size; cProbes++ )
    {
        key %= ht->size;
        if( pHE[key].obj == 0 )
        {
            //------------------------------
            // Not in hash table!
            //------------------------------
            *val = (long) key;
            return -1;
        }
        //-------------------------------
        // Offset to Abs address
        //-------------------------------
        pStr = (char*)((char*)pPD + pHE[key].obj);
        if( strcmp(pStr, sym) == 0 )
        {
            *val = pHE[key].val;
            return 0;
        }
        key++;
    }

    //------------------------------
    // Every slot occupied, no match
    //------------------------------
    key %= ht->size;
    *val = (long) key;
    return -1;
} /* CVoiceDataObj::PhonHashLookup */
/*****************************************************************************
* CVoiceDataObj::PhonToID *
*-------------------------*
* Description:
* Return ID from phoneme string.
*
********************************************************************** MC ***/
long CVoiceDataObj::PhonToID( PHON_DICT *pd, char *phone_str )
{
    SPDBG_FUNC( "CVoiceDataObj::PhonToID" );
    long idFound;

    //--- PhonHashLookup returns non-zero when the string is not in the
    //    dictionary; report that to the caller as NO_PHON.
    if( PhonHashLookup( pd, phone_str, &idFound ) != 0 )
    {
        return NO_PHON;
    }
    return idFound;
} /* CVoiceDataObj::PhonToID */
/*****************************************************************************
* CVoiceDataObj::PhonFromID *
*---------------------------*
* Description:
* Return string from phoneme ID
*
********************************************************************** MC ***/
char *CVoiceDataObj::PhonFromID( PHON_DICT *pd, long phone_id )
{
    SPDBG_FUNC( "CVoiceDataObj::PhonFromID" );

    //--- Everything in the dictionary is stored as a byte offset from
    //    the start of the PHON_DICT itself: 'phones_list' locates an
    //    array of longs, and entry [phone_id] of that array locates the
    //    phoneme's string. phone_id is not range-checked here.
    char *pDictBase    = (char*) pd;
    long *pNameOffsets = (long*)( pDictBase + pd->phones_list );
    return pDictBase + pNameOffsets[phone_id];
} /* CVoiceDataObj::PhonFromID */
//--- A tree node is a leaf when its 'yes' link is negative
#define CNODE_ISA_LEAF(n) ((n)->yes < 0)
//--- Error codes; no use is visible next to these definitions --
//    check the rest of the file before relying on them
#define BADTREE_ERROR (-1)
#define PARAM_ERROR (-2)
//--- Terminator of the unsigned short product list scanned by AnswerQ
#define END_OF_PROD 65535
//--- Word-position flags. GetTriphoneID maps 'b', 'e', 's' and '\0' to
//    BEGIN, END, SINGLE and WWT respectively; AnswerQ tests them against
//    word 0 of each product.
#define WB_BEGIN 1
#define WB_END 2
#define WB_SINGLE 4
#define WB_WWT 8
//--- Bit offset added to a phone ID by GET_BIT -- presumably it skips the
//    four WB_* flag bits above; confirm against the data format
#define POS_TYPE 4
//--- For phone 'p', compute the 32-bit word index (i) and the single-bit
//    mask (b) of bit number p + POS_TYPE + feat->nstateq.
//    Used for the left context in GetTriphoneID.
#define GET_BIT(p,feat,i,b) \
{ \
(i) = ( (p)+POS_TYPE+(feat)->nstateq ) / 32; \
(b) = 1 << ( ((p)+POS_TYPE+(feat)->nstateq ) % 32); \
}
//--- Same as GET_BIT with the word index advanced by feat->nint32perq.
//    Used for the right context in GetTriphoneID.
#define GET_RBIT(p,feat,i,b) \
{ \
GET_BIT(p,feat,i,b); \
(i) += (feat)->nint32perq; \
}
//--- Same as GET_BIT with the word index advanced by
//    2 * feat->nint32perq -- presumably the center context; no use is
//    visible next to these definitions
#define GET_CBIT(p,feat,i,b) \
{ \
GET_BIT(p,feat,i,b); \
(i) += 2 * (feat)->nint32perq; \
}
/*****************************************************************************
* AnswerQ *
*---------*
* Description:
* Tree node test.
*
********************************************************************** MC ***/
static _inline long AnswerQ( unsigned short *prod, long *uniq_prod,
                             long li, long bitpos, long ri, long rbitpos,
                             long pos, long nint32perProd)
{
    UNALIGNED long  *pBits;
    long            iProd;

    //--- 'prod' is a list of product indices ended by END_OF_PROD. Each
    //    index selects a run of nint32perProd longs inside uniq_prod.
    //    The question is answered "yes" as soon as one product has all
    //    the 'pos' bits set in word 0, the left-context bit set in word
    //    'li' and the right-context bit set in word 'ri'.
    for( iProd = 0; prod[iProd] != END_OF_PROD; iProd++ )
    {
        pBits = uniq_prod + prod[iProd] * nint32perProd;
        if( (pBits[0] & pos) != pos )
        {
            continue;
        }
        if( !(pBits[li] & bitpos) )
        {
            continue;
        }
        if( !(pBits[ri] & rbitpos) )
        {
            continue;
        }
        return true;
    }

    //--- No product matched
    return false;
} /* AnswerQ */
/*****************************************************************************
* CVoiceDataObj::GetTriphoneID *
*------------------------------*
* Description:
* Retrieve triphone ID from phoneme context.
* Store result into 'pResult'
*
********************************************************************** MC ***/
HRESULT CVoiceDataObj::GetTriphoneID( TRIPHONE_TREE *forest,
                                      long phon,        // target phon
                                      long leftPhon,    // left context
                                      long rightPhon,   // right context
                                      long pos,         // word position: 'b', 'e', 's' or '\0'
                                      PHON_DICT *pd,
                                      ULONG *pResult)
{
    SPDBG_FUNC( "CVoiceDataObj::GetTriphoneID" );
    HRESULT         hr = S_OK;
    long            triphoneID = 0;
    TREE_ELEM       *pTree = NULL;
    C_NODE          *pNode, *pRoot;
    FEATURE         *pFeat;
    long            *pProdBits, *pNameOffs;
    char            *pszLeft, *pszRight;
    unsigned short  *pProdList;
    long            iLeftWord, leftMask, iRightWord, rightMask, cWordsPerProd;

    //--------------------------------------------------------
    // All three phones must lie in [0, numCiPhones), and the
    // target phone's tree must actually contain nodes.
    //--------------------------------------------------------
    if( !( (phon      >= 0) && (phon      < pd->numCiPhones) &&
           (leftPhon  >= 0) && (leftPhon  < pd->numCiPhones) &&
           (rightPhon >= 0) && (rightPhon < pd->numCiPhones) ) )
    {
        //--- Phon out of range!
        hr = E_INVALIDARG;
    }
    else
    {
        pTree = &forest->tree[phon];
        if( pTree->nnodes == 0 )
        {
            //--- No CD triphones in tree!
            hr = E_INVALIDARG;
        }
    }

    //--------------------------------------------------------
    // Translate the word-position character to its WB_ flag
    //--------------------------------------------------------
    if( SUCCEEDED(hr) )
    {
        switch( pos )
        {
        case 'b':
        case 'B':
            pos = WB_BEGIN;
            break;
        case 'e':
        case 'E':
            pos = WB_END;
            break;
        case 's':
        case 'S':
            pos = WB_SINGLE;
            break;
        case '\0':
            pos = WB_WWT;
            break;
        default:
            //--- Unknown word position
            hr = E_INVALIDARG;
            break;
        }
    }

    if( SUCCEEDED(hr) )
    {
        //----------------------------------------------------
        // Normalize the contexts. Phone names are stored as
        // offsets from the start of the dictionary. A name
        // starting with '+' or "SIL" (any case) is replaced by
        // the forest's silence phone.
        //----------------------------------------------------
        pNameOffs = (long*)((char*)pd + pd->phones_list);

        pszLeft = (char*)pd + pNameOffs[leftPhon];
        if( (pszLeft[0] == '+') || (_strnicmp( pszLeft, "SIL", 3 ) == 0) )
        {
            leftPhon = forest->silPhoneId;
        }

        pszRight = (char*)pd + pNameOffs[rightPhon];
        if( (pszRight[0] == '+') || (_strnicmp( pszRight, "SIL", 3 ) == 0) )
        {
            rightPhon = forest->silPhoneId;
        }
        else if( (forest->nonSilCxt >= 0) &&
                 ((pos == WB_END) || (pos == WB_SINGLE)) )
        {
            //--- At a word end, a non-silence right context is replaced
            //    by the forest's nonSilCxt value when one is set (>= 0)
            rightPhon = forest->nonSilCxt;
        }

        //----------------------------------------------------
        // Word index / bit mask of each context in a product
        //----------------------------------------------------
        pFeat = &forest->feat;
        GET_BIT( leftPhon, pFeat, iLeftWord, leftMask );
        GET_RBIT( rightPhon, pFeat, iRightWord, rightMask );

        //----------------------------------------------------
        // Walk the tree from its root to a leaf. All links in
        // the forest are byte offsets from 'forest' itself.
        //----------------------------------------------------
        pProdBits     = (long*)((char*)forest + forest->uniq_prod_Offset);
        pRoot         = (C_NODE*)((char*)forest + pTree->nodes);
        cWordsPerProd = forest->nint32perProd;

        for( pNode = pRoot; !CNODE_ISA_LEAF(pNode); )
        {
            pProdList = (unsigned short*)((char*)forest + pNode->prod);
            pNode = AnswerQ( pProdList, pProdBits, iLeftWord, leftMask,
                             iRightWord, rightMask, pos, cWordsPerProd )
                        ? &pRoot[pNode->yes]
                        : &pRoot[pNode->no];
        }

        //--- A leaf keeps the triphone ID in its 'no' field
        triphoneID = (ULONG) pNode->no;
    }

    //--- Zero is stored when any check above failed
    *pResult = triphoneID;
    return hr;
} /* CVoiceDataObj::GetTriphoneID */
/*****************************************************************************
* FIR_Filter *
*------------*
* Description:
* FIR filter. For an input x[n] it does an FIR filter with
* output y[n]. Result is in place. pHistory contains the last
* cNumTaps values.
*
* y[n] = pFilter[0] * x[n] + pFilter[1] * x[n - 1]
* + ... + pFilter[cNumTaps - 1] * x[n - (cNumTaps - 1)]
*
********************************************************************** MC ***/
void CVoiceDataObj::FIR_Filter( float *pVector, long cNumSamples, float *pFilter,
                                float *pHistory, long cNumTaps )
{
    SPDBG_FUNC( "CVoiceDataObj::FIR_Filter" );
    long    iSample, iTap;
    float   acc;

    //--- Filters pVector in place. pHistory is the delay line: slot j
    //    holds the input from j samples ago and is carried across calls.
    iSample = 0;
    while( iSample < cNumSamples )
    {
        //--- Newest input enters at the head of the delay line
        pHistory[0] = pVector[iSample];
        acc = pHistory[0] * pFilter[0];

        //--- Walk from the oldest tap toward the newest: use each slot,
        //    then overwrite it with its younger neighbour so the line
        //    is already shifted for the next sample.
        iTap = cNumTaps;
        while( --iTap > 0 )
        {
            acc += pHistory[iTap] * pFilter[iTap];
            pHistory[iTap] = pHistory[iTap - 1];
        }

        pVector[iSample] = acc;
        ++iSample;
    }
} /* CVoiceDataObj::FIR_Filter */
/*****************************************************************************
* IIR_Filter *
*------------*
* Description:
* IIR filter. For an input x[n] it does an IIR filter with
* output y[n]. Result is in place. pHistory contains the last
* cNumTaps values.
*
* y[n] = pFilter[0] * x[n] + pFilter[1] * y[n - 1]
* + ... + pFilter[cNumTaps - 1] * y[n - (cNumTaps - 1)]
*
********************************************************************** MC ***/
void CVoiceDataObj::IIR_Filter( float *pVector, long cNumSamples, float *pFilter,
                                float *pHistory, long cNumTaps )
{
    SPDBG_FUNC( "CVoiceDataObj::IIR_Filter" );
    long    iSample, iTap;
    float   acc;

    //--- Filters pVector in place. pHistory keeps previous OUTPUTS and
    //    is carried across calls: on entry to each sample, slot 0 holds
    //    the most recent output.
    for( iSample = 0; iSample < cNumSamples; ++iSample )
    {
        acc = pVector[iSample] * pFilter[0];

        //--- Shift first, then use: after the shift slot j holds the
        //    output from j samples ago.
        iTap = cNumTaps;
        while( --iTap > 0 )
        {
            pHistory[iTap] = pHistory[iTap - 1];
            acc += pHistory[iTap] * pFilter[iTap];
        }

        //--- Emit the result and remember it as the newest output
        pVector[iSample] = acc;
        pHistory[0] = acc;
    }
} /* CVoiceDataObj::IIR_Filter */