summary | refs | log | tree | commit | diff
path: root/sms/sms.h
diff options
context:
space:
mode:
author John Glover <glover.john@gmail.com> 2010-11-04 14:50:08 +0000
committer John Glover <glover.john@gmail.com> 2010-11-04 14:50:08 +0000
commit c741f6ce7bb43b115d08e190b93e0ce090ae3475 (patch)
tree 9ad817d457a0b5595a4de802b069f149745295ac /sms/sms.h
parent 82ae0ec4aa684dbe6285b265bc6a07c6f555d90d (diff)
download simpl-c741f6ce7bb43b115d08e190b93e0ce090ae3475.tar.gz
simpl-c741f6ce7bb43b115d08e190b93e0ce090ae3475.tar.bz2
simpl-c741f6ce7bb43b115d08e190b93e0ce090ae3475.zip
Fixed a couple of SMSPeakDetection bugs and updated the unit tests
Diffstat (limited to 'sms/sms.h')
-rw-r--r-- sms/sms.h 559
1 files changed, 279 insertions, 280 deletions
diff --git a/sms/sms.h b/sms/sms.h
index 265ee29..bedc7d3 100644
--- a/sms/sms.h
+++ b/sms/sms.h
@@ -59,26 +59,26 @@
*/
typedef struct
{
- int iSmsMagic; /*!< identification constant */
- int iHeadBSize; /*!< size in bytes of header */
- int nFrames; /*!< number of data frames */
- int iFrameBSize; /*!< size in bytes of each data frame */
- int iSamplingRate; /*!< samplerate of analysis signal (necessary to recreate residual spectrum */
- int iFormat; /*!< type of data format \see SMS_Format */
- int nTracks; /*!< number of sinusoidal tracks per frame */
- int iFrameRate; /*!< rate in Hz of data frames */
- int iStochasticType; /*!< type stochastic representation */
- int nStochasticCoeff; /*!< number of stochastic coefficients per frame */
- int iEnvType; /*!< type of envelope representation */
- int nEnvCoeff; /*!< number of cepstral coefficents per frame */
- int iMaxFreq; /*!< maximum frequency of peaks (also corresponds to the last bin of the specEnv */
-/* sfloat fAmplitude; /\*!< average amplitude of represented sound. *\/ */
-/* sfloat fFrequency; /\*!< average fundamental frequency *\/ */
-/* int iBegSteadyState; /\*!< record number of begining of steady state. *\/ */
-/* int iEndSteadyState; /\*!< record number of end of steady state. *\/ */
- sfloat fResidualPerc; /*!< percentage of the residual to original */
- int nTextCharacters; /*!< number of text characters */
- char *pChTextCharacters; /*!< Text string relating to the sound */
+ int iSmsMagic; /*!< identification constant */
+ int iHeadBSize; /*!< size in bytes of header */
+ int nFrames; /*!< number of data frames */
+ int iFrameBSize; /*!< size in bytes of each data frame */
+ int iSamplingRate; /*!< samplerate of analysis signal (necessary to recreate residual spectrum */
+ int iFormat; /*!< type of data format \see SMS_Format */
+ int nTracks; /*!< number of sinusoidal tracks per frame */
+ int iFrameRate; /*!< rate in Hz of data frames */
+ int iStochasticType; /*!< type stochastic representation */
+ int nStochasticCoeff; /*!< number of stochastic coefficients per frame */
+ int iEnvType; /*!< type of envelope representation */
+ int nEnvCoeff; /*!< number of cepstral coefficents per frame */
+ int iMaxFreq; /*!< maximum frequency of peaks (also corresponds to the last bin of the specEnv */
+ /* sfloat fAmplitude; /\*!< average amplitude of represented sound. *\/ */
+ /* sfloat fFrequency; /\*!< average fundamental frequency *\/ */
+ /* int iBegSteadyState; /\*!< record number of begining of steady state. *\/ */
+ /* int iEndSteadyState; /\*!< record number of end of steady state. *\/ */
+ sfloat fResidualPerc; /*!< percentage of the residual to original */
+ int nTextCharacters; /*!< number of text characters */
+ char *pChTextCharacters; /*!< Text string relating to the sound */
} SMS_Header;
/*! \struct SMS_Data
@@ -95,16 +95,16 @@ typedef struct
*/
typedef struct
{
- sfloat *pSmsData; /*!< pointer to all SMS data */
- int sizeData; /*!< size of all the data */
- sfloat *pFSinFreq; /*!< frequency of sinusoids */
- sfloat *pFSinAmp; /*!< magnitude of sinusoids (stored in dB) */
- sfloat *pFSinPha; /*!< phase of sinusoids */
- int nTracks; /*!< number of sinusoidal tracks in frame */
- sfloat *pFStocGain; /*!< gain of stochastic component */
- int nCoeff; /*!< number of filter coefficients */
- sfloat *pFStocCoeff; /*!< filter coefficients for stochastic component */
- sfloat *pResPhase; /*!< residual phase spectrum */
+ sfloat *pSmsData; /*!< pointer to all SMS data */
+ int sizeData; /*!< size of all the data */
+ sfloat *pFSinFreq; /*!< frequency of sinusoids */
+ sfloat *pFSinAmp; /*!< magnitude of sinusoids (stored in dB) */
+ sfloat *pFSinPha; /*!< phase of sinusoids */
+ int nTracks; /*!< number of sinusoidal tracks in frame */
+ sfloat *pFStocGain; /*!< gain of stochastic component */
+ int nCoeff; /*!< number of filter coefficients */
+ sfloat *pFStocCoeff; /*!< filter coefficients for stochastic component */
+ sfloat *pResPhase; /*!< residual phase spectrum */
int nEnvCoeff; /*!< number of spectral envelope coefficients */
sfloat *pSpecEnv;
} SMS_Data;
@@ -120,10 +120,10 @@ typedef struct
*/
typedef struct
{
- sfloat *pFBuffer; /*!< buffer for sound data*/
- int sizeBuffer; /*!< size of buffer */
- int iMarker; /*!< sample marker relating to sound source */
- int iFirstGood; /*!< first sample in buffer that is a good one */
+ sfloat *pFBuffer; /*!< buffer for sound data*/
+ int sizeBuffer; /*!< size of buffer */
+ int iMarker; /*!< sample marker relating to sound source */
+ int iFirstGood; /*!< first sample in buffer that is a good one */
} SMS_SndBuffer;
/*! \struct SMS_Peak
@@ -133,17 +133,17 @@ typedef struct
/* information attached to a spectral peak */
typedef struct
{
- sfloat fFreq; /*!< frequency of peak */
- sfloat fMag; /*!< magnitude of peak */
- sfloat fPhase; /*!< phase of peak */
+ sfloat fFreq; /*!< frequency of peak */
+ sfloat fMag; /*!< magnitude of peak */
+ sfloat fPhase; /*!< phase of peak */
} SMS_Peak;
/* a collection of spectral peaks */
typedef struct
{
- SMS_Peak *pSpectralPeaks;
- int nPeaks;
- int nPeaksFound;
+ SMS_Peak *pSpectralPeaks;
+ int nPeaks;
+ int nPeaksFound;
} SMS_SpectralPeaks;
/*! \struct SMS_AnalFrame
@@ -154,35 +154,35 @@ typedef struct
*/
typedef struct
{
- int iFrameSample; /*!< sample number of the middle of the frame */
- int iFrameSize; /*!< number of samples used in the frame */
- int iFrameNum; /*!< frame number */
- SMS_Peak *pSpectralPeaks; /*!< spectral peaks found in frame */
- int nPeaks; /*!< number of peaks found */
- sfloat fFundamental; /*!< fundamental frequency in frame */
- SMS_Data deterministic; /*!< deterministic data */
- int iStatus; /*!< status of frame enumerated by SMS_FRAME_STATUS
- \see SMS_FRAME_STATUS */
+ int iFrameSample; /*!< sample number of the middle of the frame */
+ int iFrameSize; /*!< number of samples used in the frame */
+ int iFrameNum; /*!< frame number */
+ SMS_Peak *pSpectralPeaks; /*!< spectral peaks found in frame */
+ int nPeaks; /*!< number of peaks found */
+ sfloat fFundamental; /*!< fundamental frequency in frame */
+ SMS_Data deterministic; /*!< deterministic data */
+ int iStatus; /*!< status of frame enumerated by SMS_FRAME_STATUS
+ \see SMS_FRAME_STATUS */
} SMS_AnalFrame;
/*! \struct SMS_PeakParams
* \brief structure with useful information for peak detection and continuation
*
*/
-typedef struct
-{
- sfloat fLowestFreq; /*!< the first bin to look for a peak */
- sfloat fHighestFreq; /*!< the last bin to look for a peak */
- sfloat fMinPeakMag; /*!< mininum magnitude to consider as a peak */
- int iSamplingRate; /*!< sampling rate of analysis signal */
- int iMaxPeaks; /*!< maximum number of spectral peaks to look for */
- int nPeaksFound; /*!< the number of peaks found in each analysis */
- sfloat fHighestFundamental;/*!< highest fundamental frequency in Hz */
- int iRefHarmonic; /*!< reference harmonic to use in the fundamental detection */
- sfloat fMinRefHarmMag; /*!< minimum magnitude in dB for reference peak */
- sfloat fRefHarmMagDiffFromMax; /*!< maximum magnitude difference from reference peak to highest peak */
- int iSoundType; /*!< type of sound to be analyzed \see SMS_SOUND_TYPE */
-} SMS_PeakParams;
+//typedef struct
+//{
+// sfloat fLowestFreq; [>!< the first bin to look for a peak <]
+// sfloat fHighestFreq; [>!< the last bin to look for a peak <]
+// sfloat fMinPeakMag; [>!< mininum magnitude to consider as a peak <]
+// int iSamplingRate; [>!< sampling rate of analysis signal <]
+// int iMaxPeaks; [>!< maximum number of spectral peaks to look for <]
+// int nPeaksFound; [>!< the number of peaks found in each analysis <]
+// sfloat fHighestFundamental;[>!< highest fundamental frequency in Hz <]
+// int iRefHarmonic; [>!< reference harmonic to use in the fundamental detection <]
+// sfloat fMinRefHarmMag; [>!< minimum magnitude in dB for reference peak <]
+// sfloat fRefHarmMagDiffFromMax; [>!< maximum magnitude difference from reference peak to highest peak <]
+// int iSoundType; [>!< type of sound to be analyzed \see SMS_SOUND_TYPE <]
+//} SMS_PeakParams;
/*! \struct SMS_SEnvParams;
* \brief structure information and data for spectral enveloping
@@ -190,12 +190,12 @@ typedef struct
*/
typedef struct
{
- int iType; /*!< envelope type \see SMS_SpecEnvType */
- int iOrder; /*!< ceptrum order */
- int iMaxFreq; /*!< maximum frequency covered by the envelope */
- sfloat fLambda; /*!< regularization factor */
- int nCoeff; /*!< number of coefficients (bins) in the envelope */
- int iAnchor; /*!< whether to make anchor points at DC / Nyquist or not */
+ int iType; /*!< envelope type \see SMS_SpecEnvType */
+ int iOrder; /*!< ceptrum order */
+ int iMaxFreq; /*!< maximum frequency covered by the envelope */
+ sfloat fLambda; /*!< regularization factor */
+ int nCoeff; /*!< number of coefficients (bins) in the envelope */
+ int iAnchor; /*!< whether to make anchor points at DC / Nyquist or not */
} SMS_SEnvParams;
@@ -216,54 +216,56 @@ typedef struct
*/
typedef struct
{
- int iDebugMode; /*!< debug codes enumerated by SMS_DBG \see SMS_DBG */
- int iFormat; /*!< analysis format code defined by SMS_Format \see SMS_Format */
- int iSoundType; /*!< type of sound to be analyzed \see SMS_SOUND_TYPE */
- int iStochasticType; /*!< type of stochastic model defined by SMS_StocSynthType \see SMS_StocSynthType */
- int iFrameRate; /*!< rate in Hz of data frames */
- int nStochasticCoeff; /*!< number of stochastic coefficients per frame */
- sfloat fLowestFundamental; /*!< lowest fundamental frequency in Hz */
- sfloat fHighestFundamental;/*!< highest fundamental frequency in Hz */
- sfloat fDefaultFundamental;/*!< default fundamental in Hz */
- sfloat fPeakContToGuide; /*!< contribution of previous peak to current guide (between 0 and 1) */
- sfloat fFundContToGuide; /*!< contribution of current fundamental to current guide (between 0 and 1) */
- sfloat fFreqDeviation; /*!< maximum deviation from peak to peak */
- int iSamplingRate; /*! sampling rate of sound to be analyzed */
- int iDefaultSizeWindow; /*!< default size of analysis window in samples */
- int windowSize; /*!< the current window size */
- int sizeHop; /*!< hop size of analysis window in samples */
- sfloat fSizeWindow; /*!< size of analysis window in number of periods */
- int nTracks; /*!< number of sinusoidal tracks in frame */
- int nGuides; /*!< number of guides used for peak detection and continuation \see SMS_Guide */
- int iCleanTracks; /*!< whether or not to clean sinusoidal tracks */
- //int iEnvelope; /*!< whether or not to compute spectral envelope */
- sfloat fMinRefHarmMag; /*!< minimum magnitude in dB for reference peak */
- sfloat fRefHarmMagDiffFromMax; /*!< maximum magnitude difference from reference peak to highest peak */
- int iRefHarmonic; /*!< reference harmonic to use in the fundamental detection */
- int iMinTrackLength; /*!< minimum length in samples of a given track */
- int iMaxSleepingTime; /*!< maximum sleeping time for a track */
- sfloat fHighestFreq; /*!< highest frequency to be searched */
- sfloat fMinPeakMag; /*!< minimum magnitude in dB for a good peak */
- int iAnalysisDirection; /*!< analysis direction, direct or reverse */
- int iSizeSound; /*!< total size of sound to be analyzed in samples */
- int nFrames; /*!< total number of frames that will be analyzed */
- int iWindowType; /*!< type of FFT analysis window \see SMS_WINDOWS */
- int iMaxDelayFrames; /*!< maximum number of frames to delay before peak continuation */
- int minGoodFrames; /*!< minimum number of stable frames for backward search */
- sfloat maxDeviation; /*!< maximum deviation allowed */
- int analDelay; /*! number of frames in the past to be looked in possible re-analyze */
- sfloat fResidualAccumPerc; /*!< accumalitive residual percentage */
- int sizeNextRead; /*!< size of samples to read from sound file next analysis */
- sfloat preEmphasisLastValue;
- int resetGuides;
- int resetGuideStates;
- SMS_PeakParams peakParams; /*!< structure with parameters for spectral peaks */
- SMS_Data prevFrame; /*!< the previous analysis frame */
- SMS_SEnvParams specEnvParams; /*!< all data for spectral enveloping */
- SMS_SndBuffer soundBuffer; /*!< signal to be analyzed */
- SMS_SndBuffer synthBuffer; /*!< resynthesized signal used to create the residual */
- SMS_AnalFrame *pFrames; /*!< an array of frames that have already been analyzed */
- SMS_AnalFrame **ppFrames; /*!< pointers to the frames analyzed (it is circular-shifted once the array is full */
+ int iDebugMode; /*!< debug codes enumerated by SMS_DBG \see SMS_DBG */
+ int iFormat; /*!< analysis format code defined by SMS_Format \see SMS_Format */
+ int iSoundType; /*!< type of sound to be analyzed \see SMS_SOUND_TYPE */
+ int iStochasticType; /*!< type of stochastic model defined by SMS_StocSynthType \see SMS_StocSynthType */
+ int iFrameRate; /*!< rate in Hz of data frames */
+ int nStochasticCoeff; /*!< number of stochastic coefficients per frame */
+ sfloat fLowestFundamental; /*!< lowest fundamental frequency in Hz */
+ sfloat fHighestFundamental;/*!< highest fundamental frequency in Hz */
+ sfloat fDefaultFundamental;/*!< default fundamental in Hz */
+ sfloat fPeakContToGuide; /*!< contribution of previous peak to current guide (between 0 and 1) */
+ sfloat fFundContToGuide; /*!< contribution of current fundamental to current guide (between 0 and 1) */
+ sfloat fFreqDeviation; /*!< maximum deviation from peak to peak */
+ int iSamplingRate; /*! sampling rate of sound to be analyzed */
+ int iDefaultSizeWindow; /*!< default size of analysis window in samples */
+ int windowSize; /*!< the current window size */
+ int sizeHop; /*!< hop size of analysis window in samples */
+ sfloat fSizeWindow; /*!< size of analysis window in number of periods */
+ int nTracks; /*!< number of sinusoidal tracks in frame */
+ int maxPeaks; /*!< maximum number of peaks in a frame */
+ int nGuides; /*!< number of guides used for peak detection and continuation \see SMS_Guide */
+ int iCleanTracks; /*!< whether or not to clean sinusoidal tracks */
+ //int iEnvelope; /*!< whether or not to compute spectral envelope */
+ sfloat fMinRefHarmMag; /*!< minimum magnitude in dB for reference peak */
+ sfloat fRefHarmMagDiffFromMax; /*!< maximum magnitude difference from reference peak to highest peak */
+ int iRefHarmonic; /*!< reference harmonic to use in the fundamental detection */
+ int iMinTrackLength; /*!< minimum length in samples of a given track */
+ int iMaxSleepingTime; /*!< maximum sleeping time for a track */
+ sfloat fLowestFreq; /*!< lowest frequency to be searched */
+ sfloat fHighestFreq; /*!< highest frequency to be searched */
+ sfloat fMinPeakMag; /*!< minimum magnitude in dB for a good peak */
+ int iAnalysisDirection; /*!< analysis direction, direct or reverse */
+ int iSizeSound; /*!< total size of sound to be analyzed in samples */
+ int nFrames; /*!< total number of frames that will be analyzed */
+ int iWindowType; /*!< type of FFT analysis window \see SMS_WINDOWS */
+ int iMaxDelayFrames; /*!< maximum number of frames to delay before peak continuation */
+ int minGoodFrames; /*!< minimum number of stable frames for backward search */
+ sfloat maxDeviation; /*!< maximum deviation allowed */
+ int analDelay; /*! number of frames in the past to be looked in possible re-analyze */
+ sfloat fResidualAccumPerc; /*!< accumalitive residual percentage */
+ int sizeNextRead; /*!< size of samples to read from sound file next analysis */
+ sfloat preEmphasisLastValue;
+ int resetGuides;
+ int resetGuideStates;
+ //SMS_PeakParams peakParams; [>!< structure with parameters for spectral peaks <]
+ SMS_Data prevFrame; /*!< the previous analysis frame */
+ SMS_SEnvParams specEnvParams; /*!< all data for spectral enveloping */
+ SMS_SndBuffer soundBuffer; /*!< signal to be analyzed */
+ SMS_SndBuffer synthBuffer; /*!< resynthesized signal used to create the residual */
+ SMS_AnalFrame *pFrames; /*!< an array of frames that have already been analyzed */
+ SMS_AnalFrame **ppFrames; /*!< pointers to the frames analyzed (it is circular-shifted once the array is full */
} SMS_AnalParams;
/*! \struct SMS_ModifyParams
@@ -272,20 +274,20 @@ typedef struct
*/
typedef struct
{
- int ready; /*!< a flag to know if the struct has been initialized) */
- int maxFreq; /*!< maximum frequency component */
- int doResGain; /*!< whether or not to scale residual gain */
- sfloat resGain; /*!< residual scale factor */
- int doTranspose; /*!< whether or not to transpose */
- sfloat transpose; /*!< transposition factor */
- int doSinEnv; /*!< whether or not to apply a new spectral envelope to the sin component */
- sfloat sinEnvInterp; /*!< value between 0 (use frame's env) and 1 (use *env). Interpolates inbetween values*/
- int sizeSinEnv; /*!< size of the envelope pointed to by env */
- sfloat *sinEnv; /*!< sinusoidal spectral envelope */
- int doResEnv; /*!< whether or not to apply a new spectral envelope to the residual component */
- sfloat resEnvInterp; /*!< value between 0 (use frame's env) and 1 (use *env). Interpolates inbetween values*/
- int sizeResEnv; /*!< size of the envelope pointed to by resEnv */
- sfloat *resEnv; /*!< residual spectral envelope */
+ int ready; /*!< a flag to know if the struct has been initialized) */
+ int maxFreq; /*!< maximum frequency component */
+ int doResGain; /*!< whether or not to scale residual gain */
+ sfloat resGain; /*!< residual scale factor */
+ int doTranspose; /*!< whether or not to transpose */
+ sfloat transpose; /*!< transposition factor */
+ int doSinEnv; /*!< whether or not to apply a new spectral envelope to the sin component */
+ sfloat sinEnvInterp; /*!< value between 0 (use frame's env) and 1 (use *env). Interpolates inbetween values*/
+ int sizeSinEnv; /*!< size of the envelope pointed to by env */
+ sfloat *sinEnv; /*!< sinusoidal spectral envelope */
+ int doResEnv; /*!< whether or not to apply a new spectral envelope to the residual component */
+ sfloat resEnvInterp; /*!< value between 0 (use frame's env) and 1 (use *env). Interpolates inbetween values*/
+ int sizeResEnv; /*!< size of the envelope pointed to by resEnv */
+ sfloat *resEnv; /*!< residual spectral envelope */
} SMS_ModifyParams;
/*! \struct SMS_SynthParams
@@ -298,24 +300,24 @@ typedef struct
*/
typedef struct
{
- int iStochasticType; /*!< type of stochastic model defined by SMS_StocSynthType \see SMS_StocSynthType */
- int iSynthesisType; /*!< type of synthesis to perform \see SMS_SynthType */
- int iDetSynthType; /*!< method for synthesizing deterministic component \see SMS_DetSynthType */
- int iOriginalSRate; /*!< samplerate of the sound model source (for stochastic synthesis approximation) */
- int iSamplingRate; /*!< synthesis samplerate */
- int sizeHop; /*!< number of samples to synthesis for each frame */
- int origSizeHop; /*!< original number of samples used to create each analysis frame */
- int nTracks;
- int nStochasticCoeff;
- sfloat deemphasisLastValue;
- sfloat *pFDetWindow; /*!< array to hold the window used for deterministic synthesis \see SMS_WIN_IFFT */
- sfloat *pFStocWindow; /*!< array to hold the window used for stochastic synthesis (Hanning) */
- sfloat *pSynthBuff; /*!< an array for keeping samples during overlap-add (2x sizeHop) */
- sfloat *pMagBuff; /*!< an array for keeping magnitude spectrum for stochastic synthesis */
- sfloat *pPhaseBuff; /*!< an array for keeping phase spectrum for stochastic synthesis */
- sfloat *pSpectra; /*!< array for in-place FFT transform */
- SMS_Data prevFrame; /*!< previous data frame, for interpolation between frames */
- SMS_ModifyParams modParams; /*!< modification parameters */
+ int iStochasticType; /*!< type of stochastic model defined by SMS_StocSynthType \see SMS_StocSynthType */
+ int iSynthesisType; /*!< type of synthesis to perform \see SMS_SynthType */
+ int iDetSynthType; /*!< method for synthesizing deterministic component \see SMS_DetSynthType */
+ int iOriginalSRate; /*!< samplerate of the sound model source (for stochastic synthesis approximation) */
+ int iSamplingRate; /*!< synthesis samplerate */
+ int sizeHop; /*!< number of samples to synthesis for each frame */
+ int origSizeHop; /*!< original number of samples used to create each analysis frame */
+ int nTracks;
+ int nStochasticCoeff;
+ sfloat deemphasisLastValue;
+ sfloat *pFDetWindow; /*!< array to hold the window used for deterministic synthesis \see SMS_WIN_IFFT */
+ sfloat *pFStocWindow; /*!< array to hold the window used for stochastic synthesis (Hanning) */
+ sfloat *pSynthBuff; /*!< an array for keeping samples during overlap-add (2x sizeHop) */
+ sfloat *pMagBuff; /*!< an array for keeping magnitude spectrum for stochastic synthesis */
+ sfloat *pPhaseBuff; /*!< an array for keeping phase spectrum for stochastic synthesis */
+ sfloat *pSpectra; /*!< array for in-place FFT transform */
+ SMS_Data prevFrame; /*!< previous data frame, for interpolation between frames */
+ SMS_ModifyParams modParams; /*!< modification parameters */
} SMS_SynthParams;
/*! \struct SMS_HarmCandidate
@@ -327,11 +329,11 @@ typedef struct
*/
typedef struct
{
- sfloat fFreq; /*!< frequency of harmonic */
- sfloat fMag; /*!< magnitude of harmonic */
- sfloat fMagPerc; /*!< percentage of magnitude */
- sfloat fFreqDev; /*!< deviation from perfect harmonic */
- sfloat fHarmRatio; /*!< percentage of harmonics found */
+ sfloat fFreq; /*!< frequency of harmonic */
+ sfloat fMag; /*!< magnitude of harmonic */
+ sfloat fMagPerc; /*!< percentage of magnitude */
+ sfloat fFreqDev; /*!< deviation from perfect harmonic */
+ sfloat fHarmRatio; /*!< percentage of harmonics found */
} SMS_HarmCandidate;
/*! \struct SMS_ContCandidate
@@ -342,9 +344,9 @@ typedef struct
*/
typedef struct
{
- sfloat fFreqDev; /*!< frequency deviation from guide */
- sfloat fMagDev; /*!< magnitude deviation from guide */
- int iPeak; /*!< peak number (organized according to frequency)*/
+ sfloat fFreqDev; /*!< frequency deviation from guide */
+ sfloat fMagDev; /*!< magnitude deviation from guide */
+ int iPeak; /*!< peak number (organized according to frequency)*/
} SMS_ContCandidate;
/*! \struct SMS_Guide
@@ -357,10 +359,10 @@ typedef struct
*/
typedef struct
{
- sfloat fFreq; /*!< frequency of guide */
- sfloat fMag; /*!< magnitude of guide */
- int iStatus; /*!< status of guide: DEAD, SLEEPING, ACTIVE */
- int iPeakChosen; /*!< peak number chosen by the guide */
+ sfloat fFreq; /*!< frequency of guide */
+ sfloat fMag; /*!< magnitude of guide */
+ int iStatus; /*!< status of guide: DEAD, SLEEPING, ACTIVE */
+ int iPeakChosen; /*!< peak number chosen by the guide */
} SMS_Guide;
/*! \brief analysis format
@@ -373,10 +375,10 @@ typedef struct
*/
enum SMS_Format
{
- SMS_FORMAT_H, /*!< 0, format harmonic */
- SMS_FORMAT_IH, /*!< 1, format inharmonic */
- SMS_FORMAT_HP, /*!< 2, format harmonic with phase */
- SMS_FORMAT_IHP /*!< 3, format inharmonic with phase */
+ SMS_FORMAT_H, /*!< 0, format harmonic */
+ SMS_FORMAT_IH, /*!< 1, format inharmonic */
+ SMS_FORMAT_HP, /*!< 2, format harmonic with phase */
+ SMS_FORMAT_IHP /*!< 3, format inharmonic with phase */
};
/*! \brief synthesis types
@@ -388,9 +390,9 @@ enum SMS_Format
*/
enum SMS_SynthType
{
- SMS_STYPE_ALL, /*!< both components combined */
- SMS_STYPE_DET, /*!< deterministic component alone */
- SMS_STYPE_STOC /*!< stochastic component alone */
+ SMS_STYPE_ALL, /*!< both components combined */
+ SMS_STYPE_DET, /*!< deterministic component alone */
+ SMS_STYPE_STOC /*!< stochastic component alone */
};
/*! \brief synthesis method for deterministic component
@@ -404,8 +406,8 @@ enum SMS_SynthType
*/
enum SMS_DetSynthType
{
- SMS_DET_IFFT, /*!< Inverse Fast Fourier Transform (IFFT) */
- SMS_DET_SIN /*!< Sinusoidal Table Lookup (SIN) */
+ SMS_DET_IFFT, /*!< Inverse Fast Fourier Transform (IFFT) */
+ SMS_DET_SIN /*!< Sinusoidal Table Lookup (SIN) */
};
/*! \brief synthesis method for stochastic component
@@ -431,9 +433,9 @@ enum SMS_DetSynthType
*/
enum SMS_StocSynthType
{
- SMS_STOC_NONE, /*!< 0, no stochastistic component */
- SMS_STOC_APPROX, /*!< 1, Inverse FFT, magnitude approximation and generated phases */
- SMS_STOC_IFFT /*!< 2, inverse FFT, interpolated spectrum (not used) */
+ SMS_STOC_NONE, /*!< 0, no stochastistic component */
+ SMS_STOC_APPROX, /*!< 1, Inverse FFT, magnitude approximation and generated phases */
+ SMS_STOC_IFFT /*!< 2, inverse FFT, interpolated spectrum (not used) */
};
/*! \brief synthesis method for deterministic component
@@ -447,9 +449,9 @@ enum SMS_StocSynthType
*/
enum SMS_SpecEnvType
{
- SMS_ENV_NONE, /*!< none */
- SMS_ENV_CEP, /*!< cepstral coefficients */
- SMS_ENV_FBINS /*!< frequency bins */
+ SMS_ENV_NONE, /*!< none */
+ SMS_ENV_CEP, /*!< cepstral coefficients */
+ SMS_ENV_FBINS /*!< frequency bins */
};
@@ -457,13 +459,13 @@ enum SMS_SpecEnvType
/* \todo remove me */
enum SMS_ERRORS
{
- SMS_OK, /*!< 0, no error*/
- SMS_NOPEN, /*!< 1, couldn't open file */
- SMS_NSMS , /*!< 2, not a SMS file */
- SMS_MALLOC, /*!< 3, couldn't allocate memory */
- SMS_RDERR, /*!< 4, read error */
- SMS_WRERR, /*!< 5, write error */
- SMS_SNDERR /*!< 7, sound IO error */
+ SMS_OK, /*!< 0, no error*/
+ SMS_NOPEN, /*!< 1, couldn't open file */
+ SMS_NSMS , /*!< 2, not a SMS file */
+ SMS_MALLOC, /*!< 3, couldn't allocate memory */
+ SMS_RDERR, /*!< 4, read error */
+ SMS_WRERR, /*!< 5, write error */
+ SMS_SNDERR /*!< 7, sound IO error */
};
/*! \brief debug modes
@@ -472,21 +474,21 @@ enum SMS_ERRORS
*/
enum SMS_DBG
{
- SMS_DBG_NONE, /*!< 0, no debugging */
- SMS_DBG_DET, /*!< 1, not yet implemented \todo make this show main information to look at for discovering the correct deterministic parameters*/
- SMS_DBG_PEAK_DET, /*!< 2, peak detection function */
- SMS_DBG_HARM_DET, /*!< 3, harmonic detection function */
- SMS_DBG_PEAK_CONT, /*!< 4, peak continuation function */
- SMS_DBG_CLEAN_TRAJ, /*!< 5, clean tracks function */
- SMS_DBG_SINE_SYNTH, /*!< 6, sine synthesis function */
- SMS_DBG_STOC_ANAL, /*!< 7, stochastic analysis function */
- SMS_DBG_STOC_SYNTH, /*!< 8, stochastic synthesis function */
- SMS_DBG_SMS_ANAL, /*!< 9, top level analysis function */
- SMS_DBG_ALL, /*!< 10, everything */
- SMS_DBG_RESIDUAL, /*!< 11, write residual to file */
- SMS_DBG_SYNC, /*!< 12, write original, synthesis and residual
- to a text file */
- };
+ SMS_DBG_NONE, /*!< 0, no debugging */
+ SMS_DBG_DET, /*!< 1, not yet implemented \todo make this show main information to look at for discovering the correct deterministic parameters*/
+ SMS_DBG_PEAK_DET, /*!< 2, peak detection function */
+ SMS_DBG_HARM_DET, /*!< 3, harmonic detection function */
+ SMS_DBG_PEAK_CONT, /*!< 4, peak continuation function */
+ SMS_DBG_CLEAN_TRAJ, /*!< 5, clean tracks function */
+ SMS_DBG_SINE_SYNTH, /*!< 6, sine synthesis function */
+ SMS_DBG_STOC_ANAL, /*!< 7, stochastic analysis function */
+ SMS_DBG_STOC_SYNTH, /*!< 8, stochastic synthesis function */
+ SMS_DBG_SMS_ANAL, /*!< 9, top level analysis function */
+ SMS_DBG_ALL, /*!< 10, everything */
+ SMS_DBG_RESIDUAL, /*!< 11, write residual to file */
+ SMS_DBG_SYNC, /*!< 12, write original, synthesis and residual
+ to a text file */
+};
#define SMS_MAX_WINDOW 8190 /*!< \brief maximum size for analysis window */
@@ -496,8 +498,8 @@ enum SMS_DBG
*/
enum SMS_SOUND_TYPE
{
- SMS_SOUND_TYPE_MELODY, /*!< 0, sound composed of several notes */
- SMS_SOUND_TYPE_NOTE /*!< 1, sound composed of a single note */
+ SMS_SOUND_TYPE_MELODY, /*!< 0, sound composed of several notes */
+ SMS_SOUND_TYPE_NOTE /*!< 1, sound composed of a single note */
};
/* \brief direction of analysis
@@ -508,22 +510,22 @@ enum SMS_SOUND_TYPE
*/
enum SMS_DIRECTION
{
- SMS_DIR_FWD, /*!< analysis from left to right */
- SMS_DIR_REV /*!< analysis from right to left */
+ SMS_DIR_FWD, /*!< analysis from left to right */
+ SMS_DIR_REV /*!< analysis from right to left */
};
/* \brief window selection
- */
+*/
enum SMS_WINDOWS
{
- SMS_WIN_HAMMING, /*!< 0: hamming */
- SMS_WIN_BH_62, /*!< 1: blackman-harris, 62dB cutoff */
- SMS_WIN_BH_70, /*!< 2: blackman-harris, 70dB cutoff */
- SMS_WIN_BH_74, /*!< 3: blackman-harris, 74dB cutoff */
- SMS_WIN_BH_92, /*!< 4: blackman-harris, 92dB cutoff */
- SMS_WIN_HANNING, /*!< 5: hanning */
- SMS_WIN_IFFT /*!< 6: window for deterministic synthesis based on the Inverse-FFT algorithm.
- This is a combination of an inverse Blackman-Harris 92dB and a triangular window. */
+ SMS_WIN_HAMMING, /*!< 0: hamming */
+ SMS_WIN_BH_62, /*!< 1: blackman-harris, 62dB cutoff */
+ SMS_WIN_BH_70, /*!< 2: blackman-harris, 70dB cutoff */
+ SMS_WIN_BH_74, /*!< 3: blackman-harris, 74dB cutoff */
+ SMS_WIN_BH_92, /*!< 4: blackman-harris, 92dB cutoff */
+ SMS_WIN_HANNING, /*!< 5: hanning */
+ SMS_WIN_IFFT /*!< 6: window for deterministic synthesis based on the Inverse-FFT algorithm.
+ This is a combination of an inverse Blackman-Harris 92dB and a triangular window. */
};
/*!
@@ -531,17 +533,17 @@ enum SMS_WINDOWS
*/
enum SMS_FRAME_STATUS
{
- SMS_FRAME_EMPTY,
- SMS_FRAME_READY,
- SMS_FRAME_PEAKS_FOUND,
- SMS_FRAME_FUND_FOUND,
- SMS_FRAME_TRAJ_FOUND,
- SMS_FRAME_CLEANED,
- SMS_FRAME_RECOMPUTED,
- SMS_FRAME_DETER_SYNTH,
- SMS_FRAME_STOC_COMPUTED,
- SMS_FRAME_DONE,
- SMS_FRAME_END
+ SMS_FRAME_EMPTY,
+ SMS_FRAME_READY,
+ SMS_FRAME_PEAKS_FOUND,
+ SMS_FRAME_FUND_FOUND,
+ SMS_FRAME_TRAJ_FOUND,
+ SMS_FRAME_CLEANED,
+ SMS_FRAME_RECOMPUTED,
+ SMS_FRAME_DETER_SYNTH,
+ SMS_FRAME_STOC_COMPUTED,
+ SMS_FRAME_DONE,
+ SMS_FRAME_END
};
@@ -575,38 +577,38 @@ void sms_arrayScalarTempered( int sizeArray, sfloat *pArray);
#ifndef MAX
/*! \brief returns the maximum of a and b */
-#define MAX(a,b) ((a) > (b) ? (a) : (b))
+#define MAX(a,b) ((a) > (b) ? (a) : (b))
#endif
#ifndef MIN
/*! \brief returns the minimum of a and b */
-#define MIN(a,b) ((a) < (b) ? (a) : (b))
+#define MIN(a,b) ((a) < (b) ? (a) : (b))
#endif
/*! \} */
/* function declarations */
void sms_setPeaks(SMS_AnalParams *pAnalParams, int numamps, sfloat* amps,
- int numfreqs, sfloat* freqs, int numphases, sfloat* phases);
+ int numfreqs, sfloat* freqs, int numphases, sfloat* phases);
int sms_findPeaks(int sizeWaveform, sfloat *pWaveform, SMS_AnalParams *pAnalParams, SMS_SpectralPeaks *pSpectralPeaks);
int sms_findPartials(SMS_Data *pSmsFrame, SMS_AnalParams *pAnalParams);
int sms_findResidual(int sizeSynthesis, sfloat* pSynthesis,
- int sizeOriginal, sfloat* pOriginal,
- int sizeResidual, sfloat* pResidual,
- SMS_AnalParams *analParams);
+ int sizeOriginal, sfloat* pOriginal,
+ int sizeResidual, sfloat* pResidual,
+ SMS_AnalParams *analParams);
int sms_analyze(int sizeWaveform, sfloat *pWaveform, SMS_Data *pSmsData, SMS_AnalParams *pAnalParams);
void sms_analyzeFrame(int iCurrentFrame, SMS_AnalParams *pAnalParams, sfloat fRefFundamental);
-int sms_init( void );
+int sms_init(void);
-void sms_free( void );
+void sms_free(void);
-int sms_initAnalysis ( SMS_AnalParams *pAnalParams);
+int sms_initAnalysis(SMS_AnalParams *pAnalParams);
-void sms_initAnalParams (SMS_AnalParams *pAnalParams);
+void sms_initAnalParams(SMS_AnalParams *pAnalParams);
void sms_changeHopSize(int hopSize, SMS_AnalParams *pAnalParams);
@@ -614,57 +616,54 @@ void sms_initSynthParams(SMS_SynthParams *synthParams);
int sms_initSynth(SMS_SynthParams *pSynthParams);
-int sms_changeSynthHop( SMS_SynthParams *pSynthParams, int sizeHop);
+int sms_changeSynthHop(SMS_SynthParams *pSynthParams, int sizeHop);
-void sms_freeAnalysis (SMS_AnalParams *pAnalParams);
+void sms_freeAnalysis(SMS_AnalParams *pAnalParams);
-void sms_freeSynth( SMS_SynthParams *pSynthParams );
+void sms_freeSynth(SMS_SynthParams *pSynthParams );
-void sms_fillSoundBuffer (int sizeWaveform, sfloat *pWaveform, SMS_AnalParams *pAnalParams);
+void sms_fillSoundBuffer(int sizeWaveform, sfloat *pWaveform, SMS_AnalParams *pAnalParams);
-void sms_windowCentered (int sizeWindow, sfloat *pWaveform, sfloat *pWindow, int sizeFft, sfloat *pFftBuffer);
+void sms_windowCentered(int sizeWindow, sfloat *pWaveform, sfloat *pWindow, int sizeFft, sfloat *pFftBuffer);
-void sms_getWindow (int sizeWindow, sfloat *pWindow, int iWindowType);
+void sms_getWindow(int sizeWindow, sfloat *pWindow, int iWindowType);
-void sms_scaleWindow (int sizeWindow, sfloat *pWindow);
+void sms_scaleWindow(int sizeWindow, sfloat *pWindow);
-int sms_spectrum (int sizeWindow, sfloat *pWaveform, sfloat *pWindow, int sizeMag,
- sfloat *pMag, sfloat *pPhase);
+int sms_spectrum(int sizeWindow, sfloat *pWaveform, sfloat *pWindow, int sizeMag,
+ sfloat *pMag, sfloat *pPhase);
-int sms_invSpectrum (int sizeWaveform, sfloat *pWaveform, sfloat *pWindow ,
- int sizeMag, sfloat *pMag, sfloat *pPhase);
+int sms_invSpectrum(int sizeWaveform, sfloat *pWaveform, sfloat *pWindow ,
+ int sizeMag, sfloat *pMag, sfloat *pPhase);
/* \todo remove this once invSpectrum is completely implemented */
-int sms_invQuickSpectrumW (sfloat *pFMagSpectrum, sfloat *pFPhaseSpectrum,
- int sizeFft, sfloat *pFWaveform, int sizeWave,
- sfloat *pFWindow);
+int sms_invQuickSpectrumW(sfloat *pFMagSpectrum, sfloat *pFPhaseSpectrum,
+ int sizeFft, sfloat *pFWaveform, int sizeWave,
+ sfloat *pFWindow);
-int sms_spectralApprox (sfloat *pSpec1, int sizeSpec1, int sizeSpec1Used,
- sfloat *pSpec2, int sizeSpec2, int nCoefficients);
+int sms_spectralApprox(sfloat *pSpec1, int sizeSpec1, int sizeSpec1Used,
+ sfloat *pSpec2, int sizeSpec2, int nCoefficients);
-int sms_spectrumMag (int sizeWindow, sfloat *pWaveform, sfloat *pWindow,
- int sizeMag, sfloat *pMag);
-
-void sms_dCepstrum( int sizeCepstrum, sfloat *pCepstrum, int sizeFreq, sfloat *pFreq, sfloat *pMag,
- sfloat fLambda, int iSamplingRate);
+int sms_spectrumMag(int sizeWindow, sfloat *pWaveform, sfloat *pWindow,
+ int sizeMag, sfloat *pMag);
-void sms_dCepstrumEnvelope (int sizeCepstrum, sfloat *pCepstrum, int sizeEnv, sfloat *pEnv);
+void sms_dCepstrum(int sizeCepstrum, sfloat *pCepstrum, int sizeFreq, sfloat *pFreq, sfloat *pMag,
+ sfloat fLambda, int iSamplingRate);
-void sms_spectralEnvelope ( SMS_Data *pSmsData, SMS_SEnvParams *pSpecEnvParams);
+void sms_dCepstrumEnvelope(int sizeCepstrum, sfloat *pCepstrum, int sizeEnv, sfloat *pEnv);
-int sms_sizeNextWindow (int iCurrentFrame, SMS_AnalParams *pAnalParams);
+void sms_spectralEnvelope(SMS_Data *pSmsData, SMS_SEnvParams *pSpecEnvParams);
-sfloat sms_fundDeviation (SMS_AnalParams *pAnalParams, int iCurrentFrame);
+int sms_sizeNextWindow(int iCurrentFrame, SMS_AnalParams *pAnalParams);
-int sms_detectPeaks (int sizeSpec, sfloat *pFMag, sfloat *pPhase,
- SMS_Peak *pSpectralPeaks, SMS_PeakParams *pPeakParams);
+sfloat sms_fundDeviation(SMS_AnalParams *pAnalParams, int iCurrentFrame);
-//void sms_harmDetection (SMS_AnalFrame *pFrame, sfloat fRefFundamental,
-// SMS_PeakParams *pPeakParams);
+int sms_detectPeaks(int sizeSpec, sfloat *pFMag, sfloat *pPhase,
+ SMS_Peak *pSpectralPeaks, SMS_AnalParams *pAnalParams);
sfloat sms_harmDetection(int numPeaks, SMS_Peak* spectralPeaks, sfloat refFundamental,
- sfloat refHarmonic, sfloat lowestFreq, sfloat highestFreq,
- int soundType, sfloat minRefHarmMag, sfloat refHarmMagDiffFromMax);
+ sfloat refHarmonic, sfloat lowestFreq, sfloat highestFreq,
+ int soundType, sfloat minRefHarmMag, sfloat refHarmMagDiffFromMax);
int sms_peakContinuation (int iFrame, SMS_AnalParams *pAnalParams);
@@ -675,8 +674,8 @@ sfloat sms_deEmphasis(sfloat fInput, SMS_SynthParams *pSynthParams);
void sms_cleanTracks (int iCurrentFrame, SMS_AnalParams *pAnalParams);
void sms_scaleDet (sfloat *pSynthBuffer, sfloat *pOriginalBuffer,
- sfloat *pSinAmp, SMS_AnalParams *pAnalParams, int nTracks);
-
+ sfloat *pSinAmp, SMS_AnalParams *pAnalParams, int nTracks);
+
int sms_prepSine (int nTableSize);
int sms_prepSinc (int nTableSize);
@@ -686,38 +685,38 @@ void sms_clearSine( void );
void sms_clearSinc( void );
void sms_synthesize (SMS_Data *pSmsFrame, sfloat*pSynthesis,
- SMS_SynthParams *pSynthParams);
-
+ SMS_SynthParams *pSynthParams);
+
void sms_sineSynthFrame (SMS_Data *pSmsFrame, sfloat *pBuffer,
- int sizeBuffer, SMS_Data *pLastFrame,
- int iSamplingRate);
+ int sizeBuffer, SMS_Data *pLastFrame,
+ int iSamplingRate);
void sms_initHeader (SMS_Header *pSmsHeader);
int sms_getHeader (char *pChFileName, SMS_Header **ppSmsHeader,
- FILE **ppInputFile);
+ FILE **ppInputFile);
void sms_fillHeader (SMS_Header *pSmsHeader, SMS_AnalParams *pAnalParams,
- char *pProgramString);
+ char *pProgramString);
int sms_writeHeader (char *pFileName, SMS_Header *pSmsHeader,
- FILE **ppOutSmsFile);
+ FILE **ppOutSmsFile);
int sms_writeFile (FILE *pSmsFile, SMS_Header *pSmsHeader);
int sms_initFrame (int iCurrentFrame, SMS_AnalParams *pAnalParams,
- int sizeWindow);
-
+ int sizeWindow);
+
int sms_allocFrame (SMS_Data *pSmsFrame, int nTracks, int nCoeff,
- int iPhase, int stochType, int nEnvCoeff);
+ int iPhase, int stochType, int nEnvCoeff);
int sms_allocFrameH (SMS_Header *pSmsHeader, SMS_Data *pSmsFrame);
int sms_getFrame (FILE *pInputFile, SMS_Header *pSmsHeader, int iFrame,
- SMS_Data *pSmsFrame);
+ SMS_Data *pSmsFrame);
int sms_writeFrame (FILE *pSmsFile, SMS_Header *pSmsHeader,
- SMS_Data *pSmsFrame);
+ SMS_Data *pSmsFrame);
void sms_freeFrame (SMS_Data *pSmsFrame);
@@ -732,10 +731,10 @@ int sms_residual (int sizeWindow, sfloat *pSynthesis, sfloat *pOriginal, sfloat
void sms_filterHighPass ( int sizeResidual, sfloat *pResidual, int iSamplingRate);
int sms_stocAnalysis ( int sizeWindow, sfloat *pResidual, sfloat *pWindow,
- SMS_Data *pSmsFrame);
+ SMS_Data *pSmsFrame);
void sms_interpolateFrames (SMS_Data *pSmsFrame1, SMS_Data *pSmsFrame2,
- SMS_Data *pSmsFrameOut, sfloat fInterpFactor);
+ SMS_Data *pSmsFrameOut, sfloat fInterpFactor);
void sms_fft(int sizeFft, sfloat *pArray);
@@ -761,7 +760,7 @@ void sms_modify(SMS_Data *frame, SMS_ModifyParams *params);
int sms_createDebugFile (SMS_AnalParams *pAnalParams);
void sms_writeDebugData (sfloat *pBuffer1, sfloat *pBuffer2,
- sfloat *pBuffer3, int sizeBuffer);
+ sfloat *pBuffer3, int sizeBuffer);
void sms_writeDebugFile ( void );