diff options
author | John Glover <glover.john@gmail.com> | 2010-12-24 12:37:39 +0000 |
---|---|---|
committer | John Glover <glover.john@gmail.com> | 2010-12-24 12:37:39 +0000 |
commit | 0aaf61396643d7884b792b6d1a053c7dae7390b2 (patch) | |
tree | 6e7fafe7ecf7a318cdbcc0129f3f6b0dc39fec77 | |
parent | c0d481904d7a12065f5a29b631326924dc674c99 (diff) | |
download | simpl-0aaf61396643d7884b792b6d1a053c7dae7390b2.tar.gz simpl-0aaf61396643d7884b792b6d1a053c7dae7390b2.tar.bz2 simpl-0aaf61396643d7884b792b6d1a053c7dae7390b2.zip |
Updated MQ and SndObj peak detection and partial tracking to simpl 0.2
-rw-r--r-- | mq.py | 2 | ||||
-rw-r--r-- | sndobj.py | 46 | ||||
-rw-r--r-- | sndobj/SinAnal.cpp | 230 |
3 files changed, 144 insertions, 134 deletions
@@ -144,7 +144,7 @@ class MQPeakDetection(simpl.PeakDetection): self._max_peaks peaks.""" self._current_peaks = [] # fft of frame - f = np.fft.rfft(frame * self._window) + f = np.fft.rfft(frame.audio * self._window) spectrum = abs(f) # find all peaks in the spectrum prev_mag = np.abs(spectrum[0]) @@ -75,8 +75,8 @@ class SndObjPeakDetection(simpl.PeakDetection): def find_peaks_in_frame(self, frame): "Find and return all spectral peaks in a given frame of audio" - current_peaks = [] - self._input.PushIn(frame) + peaks = [] + self._input.PushIn(frame.audio) self._input.DoProcess() self._ifgram.DoProcess() num_peaks_found = self._analysis.FindPeaks() @@ -86,24 +86,24 @@ class SndObjPeakDetection(simpl.PeakDetection): p.amplitude = self._analysis.Output(i*3) p.frequency = self._analysis.Output((i*3)+1) p.phase = self._analysis.Output((i*3)+2) - if not current_peaks: - current_peaks.append(p) + if not peaks: + peaks.append(p) else: - if np.abs(p.frequency - current_peaks[-1].frequency) > self._min_peak_separation: - current_peaks.append(p) + if np.abs(p.frequency - peaks[-1].frequency) > self._min_peak_separation: + peaks.append(p) else: - if p.amplitude > current_peaks[-1].amplitude: - current_peaks.remove(current_peaks[-1]) - current_peaks.append(p) - return current_peaks + if p.amplitude > peaks[-1].amplitude: + peaks.remove(peaks[-1]) + peaks.append(p) + return peaks class SndObjPartialTracking(simpl.PartialTracking): "Partial tracking using the algorithm from the Sound Object Library" def __init__(self): simpl.PartialTracking.__init__(self) - self._threshold = 0.003 # todo: property - self._num_bins = 1025 # todo: property + self._threshold = 0.003 # TODO: make this a property + self._num_bins = 1025 # TODO: make this a property self._analysis = simplsndobj.SinAnal(simplsndobj.SndObj(), self._num_bins, self._threshold, self.max_partials) @@ -111,16 +111,16 @@ class SndObjPartialTracking(simpl.PartialTracking): self._analysis.Set("max tracks", num_partials) self._max_partials = num_partials - def update_partials(self, frame, frame_number): + def update_partials(self, frame): "Streamable (real-time) partial-tracking." - frame_partials = [] + partials = [] # load Peak amplitudes, frequencies and phases into arrays - num_peaks = len(frame) + num_peaks = len(frame.peaks) amps = simpl.zeros(num_peaks) freqs = simpl.zeros(num_peaks) phases = simpl.zeros(num_peaks) for i in range(num_peaks): - peak = frame[i] + peak = frame.peaks[i] amps[i] = peak.amplitude freqs[i] = peak.frequency phases[i] = peak.phase @@ -135,18 +135,8 @@ class SndObjPartialTracking(simpl.PartialTracking): peak.amplitude = self._analysis.Output(i*3) peak.frequency = self._analysis.Output((i*3)+1) peak.phase = self._analysis.Output((i*3)+2) - id = self._analysis.GetTrackID(i) - # if this is a continuing partial, create a peak and append it - if id >= 0 and id <= len(self.partials) - 1: - self.partials[id].add_peak(peak) - # if not, make a new partial - else: - partial = simpl.Partial() - partial.starting_frame = frame_number - partial.add_peak(peak) - self.partials.append(partial) - frame_partials.append(peak) - return frame_partials + partials.append(peak) + return partials class SimplSndObjAnalysisWrapper(simplsndobj.SinAnal): diff --git a/sndobj/SinAnal.cpp b/sndobj/SinAnal.cpp index 510d2db..e5c19c7 100644 --- a/sndobj/SinAnal.cpp +++ b/sndobj/SinAnal.cpp @@ -57,14 +57,14 @@ SinAnal::SinAnal(SndObj* input, double threshold, int maxtracks, m_numpeaks = 0; m_numbins = ((FFT *)m_input)->GetFFTSize()/2 + 1; - m_bndx = new double*[minpoints+2]; - m_pkmags = new double*[minpoints+2]; - m_adthresh = new double*[minpoints+2]; - m_tstart = new unsigned int*[minpoints+2]; - m_lastpk = new unsigned int*[minpoints+2]; - m_trkid = new unsigned int*[minpoints+2]; + m_bndx = new double*[m_minpoints+2]; + m_pkmags = new double*[m_minpoints+2]; + m_adthresh = new double*[m_minpoints+2]; + m_tstart = new unsigned int*[m_minpoints+2]; + m_lastpk = new unsigned int*[m_minpoints+2]; + m_trkid = new unsigned int*[m_minpoints+2]; int i; - for(i = 0; i < minpoints+2; i++){ + for(i = 0; i < m_minpoints+2; i++){ m_bndx[i] = new double[m_maxtracks]; memset(m_bndx[i], 0, sizeof(double) * m_maxtracks); m_pkmags[i] = new double[m_maxtracks]; @@ -129,20 +129,20 @@ SinAnal::SinAnal(SndObj* input, int numbins, double threshold, int maxtracks, m_numpeaks = 0; m_numbins = numbins; - m_bndx = new double*[minpoints+2]; - m_pkmags = new double*[minpoints+2]; - m_adthresh = new double*[minpoints+2]; - m_tstart = new unsigned int*[minpoints+2]; - m_lastpk = new unsigned int*[minpoints+2]; - m_trkid = new unsigned int*[minpoints+2]; + m_bndx = new double*[m_minpoints+2]; + m_pkmags = new double*[m_minpoints+2]; + m_adthresh = new double*[m_minpoints+2]; + m_tstart = new unsigned int*[m_minpoints+2]; + m_lastpk = new unsigned int*[m_minpoints+2]; + m_trkid = new unsigned int*[m_minpoints+2]; int i; - for(i=0; i<minpoints+2; i++){ + for(i = 0; i < m_minpoints+2; i++){ m_bndx[i] = new double[m_maxtracks]; memset(m_bndx[i], 0, sizeof(double) * m_maxtracks); m_pkmags[i] = new double[m_maxtracks]; memset(m_pkmags[i], 0, sizeof(double) * m_maxtracks); m_adthresh[i] = new double[m_maxtracks]; - memset(m_pkmags[i], 0, sizeof(double) * m_maxtracks); + memset(m_adthresh[i], 0, sizeof(double) * m_maxtracks); m_tstart[i] = new unsigned int[m_maxtracks]; memset(m_tstart[i], 0, sizeof(unsigned int) * m_maxtracks); m_lastpk[i] = new unsigned int[m_maxtracks]; @@ -189,62 +189,91 @@ SinAnal::SinAnal(SndObj* input, int numbins, double threshold, int maxtracks, } SinAnal::~SinAnal(){ - delete[] m_phases; - delete[] m_freqs; - delete[] m_mags; - delete[] m_binmax; - delete[] m_magmax; - delete[] m_diffs; - delete[] m_maxix; - delete[] m_bndx; - delete[] m_pkmags; - delete[] m_adthresh; - delete[] m_tstart; - delete[] m_lastpk; - delete[] m_trkid; - delete[] m_trndx; - delete[] m_contflag; - delete[] m_bins; + if(m_numbins){ + int i; + for(i = 0; i < m_minpoints+2; i++){ + delete [] m_bndx[i]; + delete [] m_pkmags[i]; + delete [] m_adthresh[i]; + delete [] m_tstart[i]; + delete [] m_lastpk[i]; + delete [] m_trkid[i]; + } + } + + if(m_bndx) delete[] m_bndx; + if(m_pkmags) delete[] m_pkmags; + if(m_adthresh) delete[] m_adthresh; + if(m_tstart) delete[] m_tstart; + if(m_lastpk) delete[] m_lastpk; + if(m_trkid) delete[] m_trkid; + if(m_bins) delete[] m_bins; + if(m_trndx) delete[] m_trndx; + if(m_contflag) delete[] m_contflag; + + if(m_phases) delete[] m_phases; + if(m_freqs) delete[] m_freqs; + if(m_mags) delete[] m_mags; + if(m_binmax) delete[] m_binmax; + if(m_magmax) delete[] m_magmax; + if(m_diffs) delete[] m_diffs; + if(m_maxix) delete[] m_maxix; } void SinAnal::SetMaxTracks(int maxtracks){ + if(m_numbins){ + int i; + for(i = 0; i < m_minpoints+2; i++){ + delete [] m_bndx[i]; + delete [] m_pkmags[i]; + delete [] m_adthresh[i]; + delete [] m_tstart[i]; + delete [] m_lastpk[i]; + delete [] m_trkid[i]; + } + } + + if(m_bndx) delete[] m_bndx; + if(m_pkmags) delete[] m_pkmags; + if(m_adthresh) delete[] m_adthresh; + if(m_tstart) delete[] m_tstart; + if(m_lastpk) delete[] m_lastpk; + if(m_trkid) delete[] m_trkid; + if(m_bins) delete[] m_bins; + if(m_trndx) delete[] m_trndx; + if(m_contflag) delete[] m_contflag; + m_maxtracks = maxtracks; - - if(m_numbins){ - delete[] m_bndx; - delete[] m_pkmags; - delete[] m_adthresh; - delete[] m_trndx; - delete[] m_contflag; - delete[] m_bins; - } - - m_contflag = new bool[m_maxtracks]; m_bins = new double[m_maxtracks]; + memset(m_bins, 0, sizeof(double) * m_maxtracks); m_trndx = new int[m_maxtracks]; - m_prev = m_minpoints+1; m_cur = 0; - m_bndx = new double*[2]; - m_pkmags = new double*[2]; - m_adthresh = new double*[2]; - m_tstart = new unsigned int*[2]; - m_lastpk = new unsigned int*[2]; - m_trkid = new unsigned int*[2]; + memset(m_trndx, 0, sizeof(int) * m_maxtracks); + m_contflag = new bool[m_maxtracks]; + memset(m_contflag, 0, sizeof(bool) * m_maxtracks); + + m_prev = 1; + m_cur = 0; + m_bndx = new double*[m_minpoints+2]; + m_pkmags = new double*[m_minpoints+2]; + m_adthresh = new double*[m_minpoints+2]; + m_tstart = new unsigned int*[m_minpoints+2]; + m_lastpk = new unsigned int*[m_minpoints+2]; + m_trkid = new unsigned int*[m_minpoints+2]; int i; - for(i=0; i<m_minpoints+2; i++){ + for(i = 0; i < m_minpoints+2; i++){ m_bndx[i] = new double[m_maxtracks]; - memset(m_bndx[i],0,sizeof(double)*m_maxtracks); + memset(m_bndx[i], 0, sizeof(double) * m_maxtracks); m_pkmags[i] = new double[m_maxtracks]; - memset(m_pkmags[i],0,sizeof(double)*m_maxtracks); + memset(m_pkmags[i], 0, sizeof(double) * m_maxtracks); m_adthresh[i] = new double[m_maxtracks]; - memset(m_pkmags[i],0,sizeof(double)*m_maxtracks); + memset(m_adthresh[i], 0, sizeof(double) * m_maxtracks); m_tstart[i] = new unsigned int[m_maxtracks]; - memset(m_tstart[i],0,sizeof(unsigned int)*m_maxtracks); + memset(m_tstart[i], 0, sizeof(unsigned int) * m_maxtracks); m_lastpk[i] = new unsigned int[m_maxtracks]; - memset(m_lastpk[i],0,sizeof(unsigned int)*m_maxtracks); + memset(m_lastpk[i], 0, sizeof(unsigned int) * m_maxtracks); m_trkid[i] = new unsigned int[m_maxtracks]; - memset(m_trkid[i],0,sizeof(unsigned int)*m_maxtracks); - + memset(m_trkid[i], 0, sizeof(unsigned int) * m_maxtracks); } for(i = 0; i < m_maxtracks; i++) m_pkmags[m_prev][i] = m_bndx[m_prev][i] = m_adthresh[m_prev][i] = 0.f; @@ -252,7 +281,6 @@ SinAnal::SetMaxTracks(int maxtracks){ SetVectorSize(m_maxtracks*3); } - void SinAnal::SetIFGram(SndObj* input){ if(m_input){ @@ -282,8 +310,6 @@ SinAnal::SetIFGram(SndObj* input){ m_freqs[m_numbins-1] = m_sr/2; } - - int SinAnal::Set(char* mess, double value){ switch(FindMsg(mess)){ @@ -473,36 +499,35 @@ SinAnal::PartialTracking(){ for(i=0; i < m_numbins; i++) if(m_diffs[i] < m_diffs[bestix]) bestix = i; - // if difference smaller than 1 bin - double tempf = F - m_binmax[bestix]; - tempf = (tempf < 0 ? -tempf : tempf); - if(tempf < 1.){ - // if amp jump is too great (check) - if(m_adthresh[m_prev][j] < - (dbstep = 20*log10(m_magmax[bestix]/m_pkmags[m_prev][j]))){ - // mark for discontinuation; - m_contflag[j] = false; - } - else { - m_bndx[m_prev][j] = m_binmax[bestix]; - m_pkmags[m_prev][j] = m_magmax[bestix]; - // track index keeps track history - // so we know which ones continue - m_contflag[j] = true; - m_binmax[bestix] = m_magmax[bestix] = 0.f; - m_lastpk[m_prev][j] = m_timecount; - foundcont = 1; - count++; - - // update the adaptive mag threshold - double tmp1 = dbstep*1.5f; - double tmp2 = m_adthresh[m_prev][j] - - (m_adthresh[m_prev][j] - 1.5f)*0.048770575f; - m_adthresh[m_prev][j] = (tmp1 > tmp2 ? tmp1 : tmp2); - } // else - } // if difference - // if check - } + // if difference smaller than 1 bin + double tempf = F - m_binmax[bestix]; + tempf = (tempf < 0 ? -tempf : tempf); + if(tempf < 1.){ + // if amp jump is too great (check) + if(m_adthresh[m_prev][j] < + (dbstep = 20*log10(m_magmax[bestix]/m_pkmags[m_prev][j]))){ + // mark for discontinuation; + m_contflag[j] = false; + } + else{ + m_bndx[m_prev][j] = m_binmax[bestix]; + m_pkmags[m_prev][j] = m_magmax[bestix]; + // track index keeps track history + // so we know which ones continue + m_contflag[j] = true; + m_binmax[bestix] = m_magmax[bestix] = 0.f; + m_lastpk[m_prev][j] = m_timecount; + foundcont = 1; + count++; + + // update the adaptive mag threshold + double tmp1 = dbstep*1.5f; + double tmp2 = m_adthresh[m_prev][j] - + (m_adthresh[m_prev][j] - 1.5f)*0.048770575f; + m_adthresh[m_prev][j] = (tmp1 > tmp2 ? tmp1 : tmp2); + } // else + } // if difference + } // if check // if we did not find a continuation // we'll check if the magnitudes around it are below @@ -511,17 +536,14 @@ SinAnal::PartialTracking(){ // old if(!foundcont){ if((exp(m_mags[int(m_bndx[m_prev][j]+0.5)]) < 0.2*m_pkmags[m_prev][j]) - || ((m_timecount - m_lastpk[m_prev][j]) > (unsigned int) m_maxgap)) - { + || ((m_timecount - m_lastpk[m_prev][j]) > (unsigned int) m_maxgap)){ m_contflag[j] = false; - - } else { + } + else{ m_contflag[j] = true; count++; } - } - } // for loop // compress the arrays @@ -544,9 +566,9 @@ SinAnal::PartialTracking(){ // create new tracks for all new peaks for(j=0; j< m_numbins && count < m_maxtracks; j++){ if(m_magmax[j] > m_startupThresh){ - m_bndx[m_cur][count] = m_binmax[j]; - m_pkmags[m_cur][count] = m_magmax[j]; - m_adthresh[m_cur][count] = 400.f; + m_bndx[m_cur][count] = m_binmax[j]; + m_pkmags[m_cur][count] = m_magmax[j]; + m_adthresh[m_cur][count] = 400.f; // track ID is a positive number in the // range of 0 - maxtracks*3 - 1 // it is given when the track starts @@ -567,16 +589,15 @@ SinAnal::PartialTracking(){ // count is the number of continuing tracks + new tracks // now we check for tracks that have been there for more // than minpoints hop periods and output them - m_tracks = 0; for(i=0; i < count; i++){ int curpos = m_timecount-m_minpoints; if(curpos >= 0 && m_tstart[m_cur][i] <= (unsigned int)curpos){ int tpoint = m_cur-m_minpoints; - - if(tpoint < 0) { + if(tpoint < 0){ tpoint += m_minpoints+2; } + m_bins[i] = m_bndx[tpoint][i]; m_mags[i] = m_pkmags[tpoint][i]; m_trndx[i] = m_trkid[tpoint][i]; @@ -586,9 +607,8 @@ SinAnal::PartialTracking(){ // end track-selecting // current arrays become previous - //int tmp = m_prev; - m_prev = m_cur; - m_cur = (m_cur < m_minpoints+1 ? m_cur+1 : 0); + m_prev = m_cur; + m_cur = (m_cur < m_minpoints+1 ? m_cur+1 : 0); m_timecount++; // Output |