diff options
author | John Glover <glover.john@gmail.com> | 2010-11-04 14:50:08 +0000 |
---|---|---|
committer | John Glover <glover.john@gmail.com> | 2010-11-04 14:50:08 +0000 |
commit | c741f6ce7bb43b115d08e190b93e0ce090ae3475 (patch) | |
tree | 9ad817d457a0b5595a4de802b069f149745295ac /sms/sms.h | |
parent | 82ae0ec4aa684dbe6285b265bc6a07c6f555d90d (diff) | |
download | simpl-c741f6ce7bb43b115d08e190b93e0ce090ae3475.tar.gz simpl-c741f6ce7bb43b115d08e190b93e0ce090ae3475.tar.bz2 simpl-c741f6ce7bb43b115d08e190b93e0ce090ae3475.zip |
Fixed a couple of SMSPeakDetection bugs and updated the unit tests
Diffstat (limited to 'sms/sms.h')
-rw-r--r-- | sms/sms.h | 559 |
1 files changed, 279 insertions, 280 deletions
@@ -59,26 +59,26 @@ */ typedef struct { - int iSmsMagic; /*!< identification constant */ - int iHeadBSize; /*!< size in bytes of header */ - int nFrames; /*!< number of data frames */ - int iFrameBSize; /*!< size in bytes of each data frame */ - int iSamplingRate; /*!< samplerate of analysis signal (necessary to recreate residual spectrum */ - int iFormat; /*!< type of data format \see SMS_Format */ - int nTracks; /*!< number of sinusoidal tracks per frame */ - int iFrameRate; /*!< rate in Hz of data frames */ - int iStochasticType; /*!< type stochastic representation */ - int nStochasticCoeff; /*!< number of stochastic coefficients per frame */ - int iEnvType; /*!< type of envelope representation */ - int nEnvCoeff; /*!< number of cepstral coefficents per frame */ - int iMaxFreq; /*!< maximum frequency of peaks (also corresponds to the last bin of the specEnv */ -/* sfloat fAmplitude; /\*!< average amplitude of represented sound. *\/ */ -/* sfloat fFrequency; /\*!< average fundamental frequency *\/ */ -/* int iBegSteadyState; /\*!< record number of begining of steady state. *\/ */ -/* int iEndSteadyState; /\*!< record number of end of steady state. *\/ */ - sfloat fResidualPerc; /*!< percentage of the residual to original */ - int nTextCharacters; /*!< number of text characters */ - char *pChTextCharacters; /*!< Text string relating to the sound */ + int iSmsMagic; /*!< identification constant */ + int iHeadBSize; /*!< size in bytes of header */ + int nFrames; /*!< number of data frames */ + int iFrameBSize; /*!< size in bytes of each data frame */ + int iSamplingRate; /*!< samplerate of analysis signal (necessary to recreate residual spectrum */ + int iFormat; /*!< type of data format \see SMS_Format */ + int nTracks; /*!< number of sinusoidal tracks per frame */ + int iFrameRate; /*!< rate in Hz of data frames */ + int iStochasticType; /*!< type stochastic representation */ + int nStochasticCoeff; /*!< number of stochastic coefficients per frame */ + int iEnvType; /*!< type of envelope representation */ + int nEnvCoeff; /*!< number of cepstral coefficents per frame */ + int iMaxFreq; /*!< maximum frequency of peaks (also corresponds to the last bin of the specEnv */ + /* sfloat fAmplitude; /\*!< average amplitude of represented sound. *\/ */ + /* sfloat fFrequency; /\*!< average fundamental frequency *\/ */ + /* int iBegSteadyState; /\*!< record number of begining of steady state. *\/ */ + /* int iEndSteadyState; /\*!< record number of end of steady state. *\/ */ + sfloat fResidualPerc; /*!< percentage of the residual to original */ + int nTextCharacters; /*!< number of text characters */ + char *pChTextCharacters; /*!< Text string relating to the sound */ } SMS_Header; /*! \struct SMS_Data @@ -95,16 +95,16 @@ typedef struct */ typedef struct { - sfloat *pSmsData; /*!< pointer to all SMS data */ - int sizeData; /*!< size of all the data */ - sfloat *pFSinFreq; /*!< frequency of sinusoids */ - sfloat *pFSinAmp; /*!< magnitude of sinusoids (stored in dB) */ - sfloat *pFSinPha; /*!< phase of sinusoids */ - int nTracks; /*!< number of sinusoidal tracks in frame */ - sfloat *pFStocGain; /*!< gain of stochastic component */ - int nCoeff; /*!< number of filter coefficients */ - sfloat *pFStocCoeff; /*!< filter coefficients for stochastic component */ - sfloat *pResPhase; /*!< residual phase spectrum */ + sfloat *pSmsData; /*!< pointer to all SMS data */ + int sizeData; /*!< size of all the data */ + sfloat *pFSinFreq; /*!< frequency of sinusoids */ + sfloat *pFSinAmp; /*!< magnitude of sinusoids (stored in dB) */ + sfloat *pFSinPha; /*!< phase of sinusoids */ + int nTracks; /*!< number of sinusoidal tracks in frame */ + sfloat *pFStocGain; /*!< gain of stochastic component */ + int nCoeff; /*!< number of filter coefficients */ + sfloat *pFStocCoeff; /*!< filter coefficients for stochastic component */ + sfloat *pResPhase; /*!< residual phase spectrum */ int nEnvCoeff; /*!< number of spectral envelope coefficients */ sfloat *pSpecEnv; } SMS_Data; @@ -120,10 +120,10 @@ typedef struct */ typedef struct { - sfloat *pFBuffer; /*!< buffer for sound data*/ - int sizeBuffer; /*!< size of buffer */ - int iMarker; /*!< sample marker relating to sound source */ - int iFirstGood; /*!< first sample in buffer that is a good one */ + sfloat *pFBuffer; /*!< buffer for sound data*/ + int sizeBuffer; /*!< size of buffer */ + int iMarker; /*!< sample marker relating to sound source */ + int iFirstGood; /*!< first sample in buffer that is a good one */ } SMS_SndBuffer; /*! \struct SMS_Peak @@ -133,17 +133,17 @@ typedef struct /* information attached to a spectral peak */ typedef struct { - sfloat fFreq; /*!< frequency of peak */ - sfloat fMag; /*!< magnitude of peak */ - sfloat fPhase; /*!< phase of peak */ + sfloat fFreq; /*!< frequency of peak */ + sfloat fMag; /*!< magnitude of peak */ + sfloat fPhase; /*!< phase of peak */ } SMS_Peak; /* a collection of spectral peaks */ typedef struct { - SMS_Peak *pSpectralPeaks; - int nPeaks; - int nPeaksFound; + SMS_Peak *pSpectralPeaks; + int nPeaks; + int nPeaksFound; } SMS_SpectralPeaks; /*! \struct SMS_AnalFrame @@ -154,35 +154,35 @@ typedef struct */ typedef struct { - int iFrameSample; /*!< sample number of the middle of the frame */ - int iFrameSize; /*!< number of samples used in the frame */ - int iFrameNum; /*!< frame number */ - SMS_Peak *pSpectralPeaks; /*!< spectral peaks found in frame */ - int nPeaks; /*!< number of peaks found */ - sfloat fFundamental; /*!< fundamental frequency in frame */ - SMS_Data deterministic; /*!< deterministic data */ - int iStatus; /*!< status of frame enumerated by SMS_FRAME_STATUS - \see SMS_FRAME_STATUS */ + int iFrameSample; /*!< sample number of the middle of the frame */ + int iFrameSize; /*!< number of samples used in the frame */ + int iFrameNum; /*!< frame number */ + SMS_Peak *pSpectralPeaks; /*!< spectral peaks found in frame */ + int nPeaks; /*!< number of peaks found */ + sfloat fFundamental; /*!< fundamental frequency in frame */ + SMS_Data deterministic; /*!< deterministic data */ + int iStatus; /*!< status of frame enumerated by SMS_FRAME_STATUS + \see SMS_FRAME_STATUS */ } SMS_AnalFrame; /*! \struct SMS_PeakParams * \brief structure with useful information for peak detection and continuation * */ -typedef struct -{ - sfloat fLowestFreq; /*!< the first bin to look for a peak */ - sfloat fHighestFreq; /*!< the last bin to look for a peak */ - sfloat fMinPeakMag; /*!< mininum magnitude to consider as a peak */ - int iSamplingRate; /*!< sampling rate of analysis signal */ - int iMaxPeaks; /*!< maximum number of spectral peaks to look for */ - int nPeaksFound; /*!< the number of peaks found in each analysis */ - sfloat fHighestFundamental;/*!< highest fundamental frequency in Hz */ - int iRefHarmonic; /*!< reference harmonic to use in the fundamental detection */ - sfloat fMinRefHarmMag; /*!< minimum magnitude in dB for reference peak */ - sfloat fRefHarmMagDiffFromMax; /*!< maximum magnitude difference from reference peak to highest peak */ - int iSoundType; /*!< type of sound to be analyzed \see SMS_SOUND_TYPE */ -} SMS_PeakParams; +//typedef struct +//{ +// sfloat fLowestFreq; [>!< the first bin to look for a peak <] +// sfloat fHighestFreq; [>!< the last bin to look for a peak <] +// sfloat fMinPeakMag; [>!< mininum magnitude to consider as a peak <] +// int iSamplingRate; [>!< sampling rate of analysis signal <] +// int iMaxPeaks; [>!< maximum number of spectral peaks to look for <] +// int nPeaksFound; [>!< the number of peaks found in each analysis <] +// sfloat fHighestFundamental;[>!< highest fundamental frequency in Hz <] +// int iRefHarmonic; [>!< reference harmonic to use in the fundamental detection <] +// sfloat fMinRefHarmMag; [>!< minimum magnitude in dB for reference peak <] +// sfloat fRefHarmMagDiffFromMax; [>!< maximum magnitude difference from reference peak to highest peak <] +// int iSoundType; [>!< type of sound to be analyzed \see SMS_SOUND_TYPE <] +//} SMS_PeakParams; /*! \struct SMS_SEnvParams; * \brief structure information and data for spectral enveloping @@ -190,12 +190,12 @@ typedef struct */ typedef struct { - int iType; /*!< envelope type \see SMS_SpecEnvType */ - int iOrder; /*!< ceptrum order */ - int iMaxFreq; /*!< maximum frequency covered by the envelope */ - sfloat fLambda; /*!< regularization factor */ - int nCoeff; /*!< number of coefficients (bins) in the envelope */ - int iAnchor; /*!< whether to make anchor points at DC / Nyquist or not */ + int iType; /*!< envelope type \see SMS_SpecEnvType */ + int iOrder; /*!< ceptrum order */ + int iMaxFreq; /*!< maximum frequency covered by the envelope */ + sfloat fLambda; /*!< regularization factor */ + int nCoeff; /*!< number of coefficients (bins) in the envelope */ + int iAnchor; /*!< whether to make anchor points at DC / Nyquist or not */ } SMS_SEnvParams; @@ -216,54 +216,56 @@ typedef struct */ typedef struct { - int iDebugMode; /*!< debug codes enumerated by SMS_DBG \see SMS_DBG */ - int iFormat; /*!< analysis format code defined by SMS_Format \see SMS_Format */ - int iSoundType; /*!< type of sound to be analyzed \see SMS_SOUND_TYPE */ - int iStochasticType; /*!< type of stochastic model defined by SMS_StocSynthType \see SMS_StocSynthType */ - int iFrameRate; /*!< rate in Hz of data frames */ - int nStochasticCoeff; /*!< number of stochastic coefficients per frame */ - sfloat fLowestFundamental; /*!< lowest fundamental frequency in Hz */ - sfloat fHighestFundamental;/*!< highest fundamental frequency in Hz */ - sfloat fDefaultFundamental;/*!< default fundamental in Hz */ - sfloat fPeakContToGuide; /*!< contribution of previous peak to current guide (between 0 and 1) */ - sfloat fFundContToGuide; /*!< contribution of current fundamental to current guide (between 0 and 1) */ - sfloat fFreqDeviation; /*!< maximum deviation from peak to peak */ - int iSamplingRate; /*! sampling rate of sound to be analyzed */ - int iDefaultSizeWindow; /*!< default size of analysis window in samples */ - int windowSize; /*!< the current window size */ - int sizeHop; /*!< hop size of analysis window in samples */ - sfloat fSizeWindow; /*!< size of analysis window in number of periods */ - int nTracks; /*!< number of sinusoidal tracks in frame */ - int nGuides; /*!< number of guides used for peak detection and continuation \see SMS_Guide */ - int iCleanTracks; /*!< whether or not to clean sinusoidal tracks */ - //int iEnvelope; /*!< whether or not to compute spectral envelope */ - sfloat fMinRefHarmMag; /*!< minimum magnitude in dB for reference peak */ - sfloat fRefHarmMagDiffFromMax; /*!< maximum magnitude difference from reference peak to highest peak */ - int iRefHarmonic; /*!< reference harmonic to use in the fundamental detection */ - int iMinTrackLength; /*!< minimum length in samples of a given track */ - int iMaxSleepingTime; /*!< maximum sleeping time for a track */ - sfloat fHighestFreq; /*!< highest frequency to be searched */ - sfloat fMinPeakMag; /*!< minimum magnitude in dB for a good peak */ - int iAnalysisDirection; /*!< analysis direction, direct or reverse */ - int iSizeSound; /*!< total size of sound to be analyzed in samples */ - int nFrames; /*!< total number of frames that will be analyzed */ - int iWindowType; /*!< type of FFT analysis window \see SMS_WINDOWS */ - int iMaxDelayFrames; /*!< maximum number of frames to delay before peak continuation */ - int minGoodFrames; /*!< minimum number of stable frames for backward search */ - sfloat maxDeviation; /*!< maximum deviation allowed */ - int analDelay; /*! number of frames in the past to be looked in possible re-analyze */ - sfloat fResidualAccumPerc; /*!< accumalitive residual percentage */ - int sizeNextRead; /*!< size of samples to read from sound file next analysis */ - sfloat preEmphasisLastValue; - int resetGuides; - int resetGuideStates; - SMS_PeakParams peakParams; /*!< structure with parameters for spectral peaks */ - SMS_Data prevFrame; /*!< the previous analysis frame */ - SMS_SEnvParams specEnvParams; /*!< all data for spectral enveloping */ - SMS_SndBuffer soundBuffer; /*!< signal to be analyzed */ - SMS_SndBuffer synthBuffer; /*!< resynthesized signal used to create the residual */ - SMS_AnalFrame *pFrames; /*!< an array of frames that have already been analyzed */ - SMS_AnalFrame **ppFrames; /*!< pointers to the frames analyzed (it is circular-shifted once the array is full */ + int iDebugMode; /*!< debug codes enumerated by SMS_DBG \see SMS_DBG */ + int iFormat; /*!< analysis format code defined by SMS_Format \see SMS_Format */ + int iSoundType; /*!< type of sound to be analyzed \see SMS_SOUND_TYPE */ + int iStochasticType; /*!< type of stochastic model defined by SMS_StocSynthType \see SMS_StocSynthType */ + int iFrameRate; /*!< rate in Hz of data frames */ + int nStochasticCoeff; /*!< number of stochastic coefficients per frame */ + sfloat fLowestFundamental; /*!< lowest fundamental frequency in Hz */ + sfloat fHighestFundamental;/*!< highest fundamental frequency in Hz */ + sfloat fDefaultFundamental;/*!< default fundamental in Hz */ + sfloat fPeakContToGuide; /*!< contribution of previous peak to current guide (between 0 and 1) */ + sfloat fFundContToGuide; /*!< contribution of current fundamental to current guide (between 0 and 1) */ + sfloat fFreqDeviation; /*!< maximum deviation from peak to peak */ + int iSamplingRate; /*! sampling rate of sound to be analyzed */ + int iDefaultSizeWindow; /*!< default size of analysis window in samples */ + int windowSize; /*!< the current window size */ + int sizeHop; /*!< hop size of analysis window in samples */ + sfloat fSizeWindow; /*!< size of analysis window in number of periods */ + int nTracks; /*!< number of sinusoidal tracks in frame */ + int maxPeaks; /*!< maximum number of peaks in a frame */ + int nGuides; /*!< number of guides used for peak detection and continuation \see SMS_Guide */ + int iCleanTracks; /*!< whether or not to clean sinusoidal tracks */ + //int iEnvelope; /*!< whether or not to compute spectral envelope */ + sfloat fMinRefHarmMag; /*!< minimum magnitude in dB for reference peak */ + sfloat fRefHarmMagDiffFromMax; /*!< maximum magnitude difference from reference peak to highest peak */ + int iRefHarmonic; /*!< reference harmonic to use in the fundamental detection */ + int iMinTrackLength; /*!< minimum length in samples of a given track */ + int iMaxSleepingTime; /*!< maximum sleeping time for a track */ + sfloat fLowestFreq; /*!< lowest frequency to be searched */ + sfloat fHighestFreq; /*!< highest frequency to be searched */ + sfloat fMinPeakMag; /*!< minimum magnitude in dB for a good peak */ + int iAnalysisDirection; /*!< analysis direction, direct or reverse */ + int iSizeSound; /*!< total size of sound to be analyzed in samples */ + int nFrames; /*!< total number of frames that will be analyzed */ + int iWindowType; /*!< type of FFT analysis window \see SMS_WINDOWS */ + int iMaxDelayFrames; /*!< maximum number of frames to delay before peak continuation */ + int minGoodFrames; /*!< minimum number of stable frames for backward search */ + sfloat maxDeviation; /*!< maximum deviation allowed */ + int analDelay; /*! number of frames in the past to be looked in possible re-analyze */ + sfloat fResidualAccumPerc; /*!< accumalitive residual percentage */ + int sizeNextRead; /*!< size of samples to read from sound file next analysis */ + sfloat preEmphasisLastValue; + int resetGuides; + int resetGuideStates; + //SMS_PeakParams peakParams; [>!< structure with parameters for spectral peaks <] + SMS_Data prevFrame; /*!< the previous analysis frame */ + SMS_SEnvParams specEnvParams; /*!< all data for spectral enveloping */ + SMS_SndBuffer soundBuffer; /*!< signal to be analyzed */ + SMS_SndBuffer synthBuffer; /*!< resynthesized signal used to create the residual */ + SMS_AnalFrame *pFrames; /*!< an array of frames that have already been analyzed */ + SMS_AnalFrame **ppFrames; /*!< pointers to the frames analyzed (it is circular-shifted once the array is full */ } SMS_AnalParams; /*! \struct SMS_ModifyParams @@ -272,20 +274,20 @@ typedef struct */ typedef struct { - int ready; /*!< a flag to know if the struct has been initialized) */ - int maxFreq; /*!< maximum frequency component */ - int doResGain; /*!< whether or not to scale residual gain */ - sfloat resGain; /*!< residual scale factor */ - int doTranspose; /*!< whether or not to transpose */ - sfloat transpose; /*!< transposition factor */ - int doSinEnv; /*!< whether or not to apply a new spectral envelope to the sin component */ - sfloat sinEnvInterp; /*!< value between 0 (use frame's env) and 1 (use *env). Interpolates inbetween values*/ - int sizeSinEnv; /*!< size of the envelope pointed to by env */ - sfloat *sinEnv; /*!< sinusoidal spectral envelope */ - int doResEnv; /*!< whether or not to apply a new spectral envelope to the residual component */ - sfloat resEnvInterp; /*!< value between 0 (use frame's env) and 1 (use *env). Interpolates inbetween values*/ - int sizeResEnv; /*!< size of the envelope pointed to by resEnv */ - sfloat *resEnv; /*!< residual spectral envelope */ + int ready; /*!< a flag to know if the struct has been initialized) */ + int maxFreq; /*!< maximum frequency component */ + int doResGain; /*!< whether or not to scale residual gain */ + sfloat resGain; /*!< residual scale factor */ + int doTranspose; /*!< whether or not to transpose */ + sfloat transpose; /*!< transposition factor */ + int doSinEnv; /*!< whether or not to apply a new spectral envelope to the sin component */ + sfloat sinEnvInterp; /*!< value between 0 (use frame's env) and 1 (use *env). Interpolates inbetween values*/ + int sizeSinEnv; /*!< size of the envelope pointed to by env */ + sfloat *sinEnv; /*!< sinusoidal spectral envelope */ + int doResEnv; /*!< whether or not to apply a new spectral envelope to the residual component */ + sfloat resEnvInterp; /*!< value between 0 (use frame's env) and 1 (use *env). Interpolates inbetween values*/ + int sizeResEnv; /*!< size of the envelope pointed to by resEnv */ + sfloat *resEnv; /*!< residual spectral envelope */ } SMS_ModifyParams; /*! \struct SMS_SynthParams @@ -298,24 +300,24 @@ typedef struct */ typedef struct { - int iStochasticType; /*!< type of stochastic model defined by SMS_StocSynthType \see SMS_StocSynthType */ - int iSynthesisType; /*!< type of synthesis to perform \see SMS_SynthType */ - int iDetSynthType; /*!< method for synthesizing deterministic component \see SMS_DetSynthType */ - int iOriginalSRate; /*!< samplerate of the sound model source (for stochastic synthesis approximation) */ - int iSamplingRate; /*!< synthesis samplerate */ - int sizeHop; /*!< number of samples to synthesis for each frame */ - int origSizeHop; /*!< original number of samples used to create each analysis frame */ - int nTracks; - int nStochasticCoeff; - sfloat deemphasisLastValue; - sfloat *pFDetWindow; /*!< array to hold the window used for deterministic synthesis \see SMS_WIN_IFFT */ - sfloat *pFStocWindow; /*!< array to hold the window used for stochastic synthesis (Hanning) */ - sfloat *pSynthBuff; /*!< an array for keeping samples during overlap-add (2x sizeHop) */ - sfloat *pMagBuff; /*!< an array for keeping magnitude spectrum for stochastic synthesis */ - sfloat *pPhaseBuff; /*!< an array for keeping phase spectrum for stochastic synthesis */ - sfloat *pSpectra; /*!< array for in-place FFT transform */ - SMS_Data prevFrame; /*!< previous data frame, for interpolation between frames */ - SMS_ModifyParams modParams; /*!< modification parameters */ + int iStochasticType; /*!< type of stochastic model defined by SMS_StocSynthType \see SMS_StocSynthType */ + int iSynthesisType; /*!< type of synthesis to perform \see SMS_SynthType */ + int iDetSynthType; /*!< method for synthesizing deterministic component \see SMS_DetSynthType */ + int iOriginalSRate; /*!< samplerate of the sound model source (for stochastic synthesis approximation) */ + int iSamplingRate; /*!< synthesis samplerate */ + int sizeHop; /*!< number of samples to synthesis for each frame */ + int origSizeHop; /*!< original number of samples used to create each analysis frame */ + int nTracks; + int nStochasticCoeff; + sfloat deemphasisLastValue; + sfloat *pFDetWindow; /*!< array to hold the window used for deterministic synthesis \see SMS_WIN_IFFT */ + sfloat *pFStocWindow; /*!< array to hold the window used for stochastic synthesis (Hanning) */ + sfloat *pSynthBuff; /*!< an array for keeping samples during overlap-add (2x sizeHop) */ + sfloat *pMagBuff; /*!< an array for keeping magnitude spectrum for stochastic synthesis */ + sfloat *pPhaseBuff; /*!< an array for keeping phase spectrum for stochastic synthesis */ + sfloat *pSpectra; /*!< array for in-place FFT transform */ + SMS_Data prevFrame; /*!< previous data frame, for interpolation between frames */ + SMS_ModifyParams modParams; /*!< modification parameters */ } SMS_SynthParams; /*! \struct SMS_HarmCandidate @@ -327,11 +329,11 @@ typedef struct */ typedef struct { - sfloat fFreq; /*!< frequency of harmonic */ - sfloat fMag; /*!< magnitude of harmonic */ - sfloat fMagPerc; /*!< percentage of magnitude */ - sfloat fFreqDev; /*!< deviation from perfect harmonic */ - sfloat fHarmRatio; /*!< percentage of harmonics found */ + sfloat fFreq; /*!< frequency of harmonic */ + sfloat fMag; /*!< magnitude of harmonic */ + sfloat fMagPerc; /*!< percentage of magnitude */ + sfloat fFreqDev; /*!< deviation from perfect harmonic */ + sfloat fHarmRatio; /*!< percentage of harmonics found */ } SMS_HarmCandidate; /*! \struct SMS_ContCandidate @@ -342,9 +344,9 @@ typedef struct */ typedef struct { - sfloat fFreqDev; /*!< frequency deviation from guide */ - sfloat fMagDev; /*!< magnitude deviation from guide */ - int iPeak; /*!< peak number (organized according to frequency)*/ + sfloat fFreqDev; /*!< frequency deviation from guide */ + sfloat fMagDev; /*!< magnitude deviation from guide */ + int iPeak; /*!< peak number (organized according to frequency)*/ } SMS_ContCandidate; /*! \struct SMS_Guide @@ -357,10 +359,10 @@ typedef struct */ typedef struct { - sfloat fFreq; /*!< frequency of guide */ - sfloat fMag; /*!< magnitude of guide */ - int iStatus; /*!< status of guide: DEAD, SLEEPING, ACTIVE */ - int iPeakChosen; /*!< peak number chosen by the guide */ + sfloat fFreq; /*!< frequency of guide */ + sfloat fMag; /*!< magnitude of guide */ + int iStatus; /*!< status of guide: DEAD, SLEEPING, ACTIVE */ + int iPeakChosen; /*!< peak number chosen by the guide */ } SMS_Guide; /*! \brief analysis format @@ -373,10 +375,10 @@ typedef struct */ enum SMS_Format { - SMS_FORMAT_H, /*!< 0, format harmonic */ - SMS_FORMAT_IH, /*!< 1, format inharmonic */ - SMS_FORMAT_HP, /*!< 2, format harmonic with phase */ - SMS_FORMAT_IHP /*!< 3, format inharmonic with phase */ + SMS_FORMAT_H, /*!< 0, format harmonic */ + SMS_FORMAT_IH, /*!< 1, format inharmonic */ + SMS_FORMAT_HP, /*!< 2, format harmonic with phase */ + SMS_FORMAT_IHP /*!< 3, format inharmonic with phase */ }; /*! \brief synthesis types @@ -388,9 +390,9 @@ enum SMS_Format */ enum SMS_SynthType { - SMS_STYPE_ALL, /*!< both components combined */ - SMS_STYPE_DET, /*!< deterministic component alone */ - SMS_STYPE_STOC /*!< stochastic component alone */ + SMS_STYPE_ALL, /*!< both components combined */ + SMS_STYPE_DET, /*!< deterministic component alone */ + SMS_STYPE_STOC /*!< stochastic component alone */ }; /*! \brief synthesis method for deterministic component @@ -404,8 +406,8 @@ enum SMS_SynthType */ enum SMS_DetSynthType { - SMS_DET_IFFT, /*!< Inverse Fast Fourier Transform (IFFT) */ - SMS_DET_SIN /*!< Sinusoidal Table Lookup (SIN) */ + SMS_DET_IFFT, /*!< Inverse Fast Fourier Transform (IFFT) */ + SMS_DET_SIN /*!< Sinusoidal Table Lookup (SIN) */ }; /*! \brief synthesis method for stochastic component @@ -431,9 +433,9 @@ enum SMS_DetSynthType */ enum SMS_StocSynthType { - SMS_STOC_NONE, /*!< 0, no stochastistic component */ - SMS_STOC_APPROX, /*!< 1, Inverse FFT, magnitude approximation and generated phases */ - SMS_STOC_IFFT /*!< 2, inverse FFT, interpolated spectrum (not used) */ + SMS_STOC_NONE, /*!< 0, no stochastistic component */ + SMS_STOC_APPROX, /*!< 1, Inverse FFT, magnitude approximation and generated phases */ + SMS_STOC_IFFT /*!< 2, inverse FFT, interpolated spectrum (not used) */ }; /*! \brief synthesis method for deterministic component @@ -447,9 +449,9 @@ enum SMS_StocSynthType */ enum SMS_SpecEnvType { - SMS_ENV_NONE, /*!< none */ - SMS_ENV_CEP, /*!< cepstral coefficients */ - SMS_ENV_FBINS /*!< frequency bins */ + SMS_ENV_NONE, /*!< none */ + SMS_ENV_CEP, /*!< cepstral coefficients */ + SMS_ENV_FBINS /*!< frequency bins */ }; @@ -457,13 +459,13 @@ enum SMS_SpecEnvType /* \todo remove me */ enum SMS_ERRORS { - SMS_OK, /*!< 0, no error*/ - SMS_NOPEN, /*!< 1, couldn't open file */ - SMS_NSMS , /*!< 2, not a SMS file */ - SMS_MALLOC, /*!< 3, couldn't allocate memory */ - SMS_RDERR, /*!< 4, read error */ - SMS_WRERR, /*!< 5, write error */ - SMS_SNDERR /*!< 7, sound IO error */ + SMS_OK, /*!< 0, no error*/ + SMS_NOPEN, /*!< 1, couldn't open file */ + SMS_NSMS , /*!< 2, not a SMS file */ + SMS_MALLOC, /*!< 3, couldn't allocate memory */ + SMS_RDERR, /*!< 4, read error */ + SMS_WRERR, /*!< 5, write error */ + SMS_SNDERR /*!< 7, sound IO error */ }; /*! \brief debug modes @@ -472,21 +474,21 @@ enum SMS_ERRORS */ enum SMS_DBG { - SMS_DBG_NONE, /*!< 0, no debugging */ - SMS_DBG_DET, /*!< 1, not yet implemented \todo make this show main information to look at for discovering the correct deterministic parameters*/ - SMS_DBG_PEAK_DET, /*!< 2, peak detection function */ - SMS_DBG_HARM_DET, /*!< 3, harmonic detection function */ - SMS_DBG_PEAK_CONT, /*!< 4, peak continuation function */ - SMS_DBG_CLEAN_TRAJ, /*!< 5, clean tracks function */ - SMS_DBG_SINE_SYNTH, /*!< 6, sine synthesis function */ - SMS_DBG_STOC_ANAL, /*!< 7, stochastic analysis function */ - SMS_DBG_STOC_SYNTH, /*!< 8, stochastic synthesis function */ - SMS_DBG_SMS_ANAL, /*!< 9, top level analysis function */ - SMS_DBG_ALL, /*!< 10, everything */ - SMS_DBG_RESIDUAL, /*!< 11, write residual to file */ - SMS_DBG_SYNC, /*!< 12, write original, synthesis and residual - to a text file */ - }; + SMS_DBG_NONE, /*!< 0, no debugging */ + SMS_DBG_DET, /*!< 1, not yet implemented \todo make this show main information to look at for discovering the correct deterministic parameters*/ + SMS_DBG_PEAK_DET, /*!< 2, peak detection function */ + SMS_DBG_HARM_DET, /*!< 3, harmonic detection function */ + SMS_DBG_PEAK_CONT, /*!< 4, peak continuation function */ + SMS_DBG_CLEAN_TRAJ, /*!< 5, clean tracks function */ + SMS_DBG_SINE_SYNTH, /*!< 6, sine synthesis function */ + SMS_DBG_STOC_ANAL, /*!< 7, stochastic analysis function */ + SMS_DBG_STOC_SYNTH, /*!< 8, stochastic synthesis function */ + SMS_DBG_SMS_ANAL, /*!< 9, top level analysis function */ + SMS_DBG_ALL, /*!< 10, everything */ + SMS_DBG_RESIDUAL, /*!< 11, write residual to file */ + SMS_DBG_SYNC, /*!< 12, write original, synthesis and residual + to a text file */ +}; #define SMS_MAX_WINDOW 8190 /*!< \brief maximum size for analysis window */ @@ -496,8 +498,8 @@ enum SMS_DBG */ enum SMS_SOUND_TYPE { - SMS_SOUND_TYPE_MELODY, /*!< 0, sound composed of several notes */ - SMS_SOUND_TYPE_NOTE /*!< 1, sound composed of a single note */ + SMS_SOUND_TYPE_MELODY, /*!< 0, sound composed of several notes */ + SMS_SOUND_TYPE_NOTE /*!< 1, sound composed of a single note */ }; /* \brief direction of analysis @@ -508,22 +510,22 @@ enum SMS_SOUND_TYPE */ enum SMS_DIRECTION { - SMS_DIR_FWD, /*!< analysis from left to right */ - SMS_DIR_REV /*!< analysis from right to left */ + SMS_DIR_FWD, /*!< analysis from left to right */ + SMS_DIR_REV /*!< analysis from right to left */ }; /* \brief window selection - */ +*/ enum SMS_WINDOWS { - SMS_WIN_HAMMING, /*!< 0: hamming */ - SMS_WIN_BH_62, /*!< 1: blackman-harris, 62dB cutoff */ - SMS_WIN_BH_70, /*!< 2: blackman-harris, 70dB cutoff */ - SMS_WIN_BH_74, /*!< 3: blackman-harris, 74dB cutoff */ - SMS_WIN_BH_92, /*!< 4: blackman-harris, 92dB cutoff */ - SMS_WIN_HANNING, /*!< 5: hanning */ - SMS_WIN_IFFT /*!< 6: window for deterministic synthesis based on the Inverse-FFT algorithm. - This is a combination of an inverse Blackman-Harris 92dB and a triangular window. */ + SMS_WIN_HAMMING, /*!< 0: hamming */ + SMS_WIN_BH_62, /*!< 1: blackman-harris, 62dB cutoff */ + SMS_WIN_BH_70, /*!< 2: blackman-harris, 70dB cutoff */ + SMS_WIN_BH_74, /*!< 3: blackman-harris, 74dB cutoff */ + SMS_WIN_BH_92, /*!< 4: blackman-harris, 92dB cutoff */ + SMS_WIN_HANNING, /*!< 5: hanning */ + SMS_WIN_IFFT /*!< 6: window for deterministic synthesis based on the Inverse-FFT algorithm. + This is a combination of an inverse Blackman-Harris 92dB and a triangular window. */ }; /*! @@ -531,17 +533,17 @@ enum SMS_WINDOWS */ enum SMS_FRAME_STATUS { - SMS_FRAME_EMPTY, - SMS_FRAME_READY, - SMS_FRAME_PEAKS_FOUND, - SMS_FRAME_FUND_FOUND, - SMS_FRAME_TRAJ_FOUND, - SMS_FRAME_CLEANED, - SMS_FRAME_RECOMPUTED, - SMS_FRAME_DETER_SYNTH, - SMS_FRAME_STOC_COMPUTED, - SMS_FRAME_DONE, - SMS_FRAME_END + SMS_FRAME_EMPTY, + SMS_FRAME_READY, + SMS_FRAME_PEAKS_FOUND, + SMS_FRAME_FUND_FOUND, + SMS_FRAME_TRAJ_FOUND, + SMS_FRAME_CLEANED, + SMS_FRAME_RECOMPUTED, + SMS_FRAME_DETER_SYNTH, + SMS_FRAME_STOC_COMPUTED, + SMS_FRAME_DONE, + SMS_FRAME_END }; @@ -575,38 +577,38 @@ void sms_arrayScalarTempered( int sizeArray, sfloat *pArray); #ifndef MAX /*! \brief returns the maximum of a and b */ -#define MAX(a,b) ((a) > (b) ? (a) : (b)) +#define MAX(a,b) ((a) > (b) ? (a) : (b)) #endif #ifndef MIN /*! \brief returns the minimum of a and b */ -#define MIN(a,b) ((a) < (b) ? (a) : (b)) +#define MIN(a,b) ((a) < (b) ? (a) : (b)) #endif /*! \} */ /* function declarations */ void sms_setPeaks(SMS_AnalParams *pAnalParams, int numamps, sfloat* amps, - int numfreqs, sfloat* freqs, int numphases, sfloat* phases); + int numfreqs, sfloat* freqs, int numphases, sfloat* phases); int sms_findPeaks(int sizeWaveform, sfloat *pWaveform, SMS_AnalParams *pAnalParams, SMS_SpectralPeaks *pSpectralPeaks); int sms_findPartials(SMS_Data *pSmsFrame, SMS_AnalParams *pAnalParams); int sms_findResidual(int sizeSynthesis, sfloat* pSynthesis, - int sizeOriginal, sfloat* pOriginal, - int sizeResidual, sfloat* pResidual, - SMS_AnalParams *analParams); + int sizeOriginal, sfloat* pOriginal, + int sizeResidual, sfloat* pResidual, + SMS_AnalParams *analParams); int sms_analyze(int sizeWaveform, sfloat *pWaveform, SMS_Data *pSmsData, SMS_AnalParams *pAnalParams); void sms_analyzeFrame(int iCurrentFrame, SMS_AnalParams *pAnalParams, sfloat fRefFundamental); -int sms_init( void ); +int sms_init(void); -void sms_free( void ); +void sms_free(void); -int sms_initAnalysis ( SMS_AnalParams *pAnalParams); +int sms_initAnalysis(SMS_AnalParams *pAnalParams); -void sms_initAnalParams (SMS_AnalParams *pAnalParams); +void sms_initAnalParams(SMS_AnalParams *pAnalParams); void sms_changeHopSize(int hopSize, SMS_AnalParams *pAnalParams); @@ -614,57 +616,54 @@ void sms_initSynthParams(SMS_SynthParams *synthParams); int sms_initSynth(SMS_SynthParams *pSynthParams); -int sms_changeSynthHop( SMS_SynthParams *pSynthParams, int sizeHop); +int sms_changeSynthHop(SMS_SynthParams *pSynthParams, int sizeHop); -void sms_freeAnalysis (SMS_AnalParams *pAnalParams); +void sms_freeAnalysis(SMS_AnalParams *pAnalParams); -void sms_freeSynth( SMS_SynthParams *pSynthParams ); +void sms_freeSynth(SMS_SynthParams *pSynthParams ); -void sms_fillSoundBuffer (int sizeWaveform, sfloat *pWaveform, SMS_AnalParams *pAnalParams); +void sms_fillSoundBuffer(int sizeWaveform, sfloat *pWaveform, SMS_AnalParams *pAnalParams); -void sms_windowCentered (int sizeWindow, sfloat *pWaveform, sfloat *pWindow, int sizeFft, sfloat *pFftBuffer); +void sms_windowCentered(int sizeWindow, sfloat *pWaveform, sfloat *pWindow, int sizeFft, sfloat *pFftBuffer); -void sms_getWindow (int sizeWindow, sfloat *pWindow, int iWindowType); +void sms_getWindow(int sizeWindow, sfloat *pWindow, int iWindowType); -void sms_scaleWindow (int sizeWindow, sfloat *pWindow); +void sms_scaleWindow(int sizeWindow, sfloat *pWindow); -int sms_spectrum (int sizeWindow, sfloat *pWaveform, sfloat *pWindow, int sizeMag, - sfloat *pMag, sfloat *pPhase); +int sms_spectrum(int sizeWindow, sfloat *pWaveform, sfloat *pWindow, int sizeMag, + sfloat *pMag, sfloat *pPhase); -int sms_invSpectrum (int sizeWaveform, sfloat *pWaveform, sfloat *pWindow , - int sizeMag, sfloat *pMag, sfloat *pPhase); +int sms_invSpectrum(int sizeWaveform, sfloat *pWaveform, sfloat *pWindow , + int sizeMag, sfloat *pMag, sfloat *pPhase); /* \todo remove this once invSpectrum is completely implemented */ -int sms_invQuickSpectrumW (sfloat *pFMagSpectrum, sfloat *pFPhaseSpectrum, - int sizeFft, sfloat *pFWaveform, int sizeWave, - sfloat *pFWindow); +int sms_invQuickSpectrumW(sfloat *pFMagSpectrum, sfloat *pFPhaseSpectrum, + int sizeFft, sfloat *pFWaveform, int sizeWave, + sfloat *pFWindow); -int sms_spectralApprox (sfloat *pSpec1, int sizeSpec1, int sizeSpec1Used, - sfloat *pSpec2, int sizeSpec2, int nCoefficients); +int sms_spectralApprox(sfloat *pSpec1, int sizeSpec1, int sizeSpec1Used, + sfloat *pSpec2, int sizeSpec2, int nCoefficients); -int sms_spectrumMag (int sizeWindow, sfloat *pWaveform, sfloat *pWindow, - int sizeMag, sfloat *pMag); - -void sms_dCepstrum( int sizeCepstrum, sfloat *pCepstrum, int sizeFreq, sfloat *pFreq, sfloat *pMag, - sfloat fLambda, int iSamplingRate); +int sms_spectrumMag(int sizeWindow, sfloat *pWaveform, sfloat *pWindow, + int sizeMag, sfloat *pMag); -void sms_dCepstrumEnvelope (int sizeCepstrum, sfloat *pCepstrum, int sizeEnv, sfloat *pEnv); +void sms_dCepstrum(int sizeCepstrum, sfloat *pCepstrum, int sizeFreq, sfloat *pFreq, sfloat *pMag, + sfloat fLambda, int iSamplingRate); -void sms_spectralEnvelope ( SMS_Data *pSmsData, SMS_SEnvParams *pSpecEnvParams); +void sms_dCepstrumEnvelope(int sizeCepstrum, sfloat *pCepstrum, int sizeEnv, sfloat *pEnv); -int sms_sizeNextWindow (int iCurrentFrame, SMS_AnalParams *pAnalParams); +void sms_spectralEnvelope(SMS_Data *pSmsData, SMS_SEnvParams *pSpecEnvParams); -sfloat sms_fundDeviation (SMS_AnalParams *pAnalParams, int iCurrentFrame); +int sms_sizeNextWindow(int iCurrentFrame, SMS_AnalParams *pAnalParams); -int sms_detectPeaks (int sizeSpec, sfloat *pFMag, sfloat *pPhase, - SMS_Peak *pSpectralPeaks, SMS_PeakParams *pPeakParams); +sfloat sms_fundDeviation(SMS_AnalParams *pAnalParams, int iCurrentFrame); -//void sms_harmDetection (SMS_AnalFrame *pFrame, sfloat fRefFundamental, -// SMS_PeakParams *pPeakParams); +int sms_detectPeaks(int sizeSpec, sfloat *pFMag, sfloat *pPhase, + SMS_Peak *pSpectralPeaks, SMS_AnalParams *pAnalParams); sfloat sms_harmDetection(int numPeaks, SMS_Peak* spectralPeaks, sfloat refFundamental, - sfloat refHarmonic, sfloat lowestFreq, sfloat highestFreq, - int soundType, sfloat minRefHarmMag, sfloat refHarmMagDiffFromMax); + sfloat refHarmonic, sfloat lowestFreq, sfloat highestFreq, + int soundType, sfloat minRefHarmMag, sfloat refHarmMagDiffFromMax); int sms_peakContinuation (int iFrame, SMS_AnalParams *pAnalParams); @@ -675,8 +674,8 @@ sfloat sms_deEmphasis(sfloat fInput, SMS_SynthParams *pSynthParams); void sms_cleanTracks (int iCurrentFrame, SMS_AnalParams *pAnalParams); void sms_scaleDet (sfloat *pSynthBuffer, sfloat *pOriginalBuffer, - sfloat *pSinAmp, SMS_AnalParams *pAnalParams, int nTracks); - + sfloat *pSinAmp, SMS_AnalParams *pAnalParams, int nTracks); + int sms_prepSine (int nTableSize); int sms_prepSinc (int nTableSize); @@ -686,38 +685,38 @@ void sms_clearSine( void ); void sms_clearSinc( void ); void sms_synthesize (SMS_Data *pSmsFrame, sfloat*pSynthesis, - SMS_SynthParams *pSynthParams); - + SMS_SynthParams *pSynthParams); + void sms_sineSynthFrame (SMS_Data *pSmsFrame, sfloat *pBuffer, - int sizeBuffer, SMS_Data *pLastFrame, - int iSamplingRate); + int sizeBuffer, SMS_Data *pLastFrame, + int iSamplingRate); void sms_initHeader (SMS_Header *pSmsHeader); int sms_getHeader (char *pChFileName, SMS_Header **ppSmsHeader, - FILE **ppInputFile); + FILE **ppInputFile); void sms_fillHeader (SMS_Header *pSmsHeader, SMS_AnalParams *pAnalParams, - char *pProgramString); + char *pProgramString); int sms_writeHeader (char *pFileName, SMS_Header *pSmsHeader, - FILE **ppOutSmsFile); + FILE **ppOutSmsFile); int sms_writeFile (FILE *pSmsFile, SMS_Header *pSmsHeader); int sms_initFrame (int iCurrentFrame, SMS_AnalParams *pAnalParams, - int sizeWindow); - + int sizeWindow); + int sms_allocFrame (SMS_Data *pSmsFrame, int nTracks, int nCoeff, - int iPhase, int stochType, int nEnvCoeff); + int iPhase, int stochType, int nEnvCoeff); int sms_allocFrameH (SMS_Header *pSmsHeader, SMS_Data *pSmsFrame); int sms_getFrame (FILE *pInputFile, SMS_Header *pSmsHeader, int iFrame, - SMS_Data *pSmsFrame); + SMS_Data *pSmsFrame); int sms_writeFrame (FILE *pSmsFile, SMS_Header *pSmsHeader, - SMS_Data *pSmsFrame); + SMS_Data *pSmsFrame); void sms_freeFrame (SMS_Data *pSmsFrame); @@ -732,10 +731,10 @@ int sms_residual (int sizeWindow, sfloat *pSynthesis, sfloat *pOriginal, sfloat void sms_filterHighPass ( int sizeResidual, sfloat *pResidual, int iSamplingRate); int sms_stocAnalysis ( int sizeWindow, sfloat *pResidual, sfloat *pWindow, - SMS_Data *pSmsFrame); + SMS_Data *pSmsFrame); void sms_interpolateFrames (SMS_Data *pSmsFrame1, SMS_Data *pSmsFrame2, - SMS_Data *pSmsFrameOut, sfloat fInterpFactor); + SMS_Data *pSmsFrameOut, sfloat fInterpFactor); void sms_fft(int sizeFft, sfloat *pArray); @@ -761,7 +760,7 @@ void sms_modify(SMS_Data *frame, SMS_ModifyParams *params); int sms_createDebugFile (SMS_AnalParams *pAnalParams); void sms_writeDebugData (sfloat *pBuffer1, sfloat *pBuffer2, - sfloat *pBuffer3, int sizeBuffer); + sfloat *pBuffer3, int sizeBuffer); void sms_writeDebugFile ( void ); |