diff options
Diffstat (limited to 'tests')
-rw-r--r-- | tests/testsms.py | 612 | ||||
-rw-r--r-- | tests/testsndobj.py | 389 |
2 files changed, 1001 insertions, 0 deletions
diff --git a/tests/testsms.py b/tests/testsms.py new file mode 100644 index 0000000..7c1c0b3 --- /dev/null +++ b/tests/testsms.py @@ -0,0 +1,612 @@ +# Copyright (c) 2009 John Glover, National University of Ireland, Maynooth +# +# This program is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation; either version 2 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with this program; if not, write to the Free Software +# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + +import unittest +from simpl import pysms as simplsms +import simpl +import pysms +from scipy.io.wavfile import read +import numpy as np + +FLOAT_PRECISION = 3 # number of decimal places to check for accuracy +input_file = 'audio/flute.wav' +audio_in_data = read(input_file) +audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 +sampling_rate = audio_in_data[0] +frame_size = 2048 +hop_size = 256 +num_frames = 5 +max_peaks = 10 +max_partials = 3 +num_samples = frame_size + ((num_frames - 1) * hop_size) +audio_in = audio_in[0:num_samples] + +def print_partials(partials): + for partial in partials: + print [p.frequency for p in partial.peaks], ":", partial.starting_frame + +class TestSimplSMS(unittest.TestCase): + + def test_size_next_read(self): + """test_size_next_read + Make sure pysms PeakDetection is calculating + the correct value for the size of the next frame.""" + pysms.sms_init() + sms_header = pysms.SMS_Header() + analysis_params = pysms.SMS_AnalParams() + snd_header = pysms.SMS_SndHeader() + # Try to open the input file to fill snd_header + if(pysms.sms_openSF(input_file, snd_header)): + raise NameError("error opening sound file: " + pysms.sms_errorString()) + analysis_params.iSamplingRate = sampling_rate + analysis_params.iFrameRate = sampling_rate / hop_size + analysis_params.iWindowType = pysms.SMS_WIN_HAMMING + analysis_params.fDefaultFundamental = 100 + analysis_params.fHighestFreq = 20000 + analysis_params.peakParams.iMaxPeaks = max_peaks + analysis_params.iMaxDelayFrames = num_frames + 1 + analysis_params.analDelay = 0 + analysis_params.minGoodFrames = 1 + pysms.sms_initAnalysis(analysis_params, snd_header) + sms_header.nStochasticCoeff = 128 + pysms.sms_fillHeader(sms_header, analysis_params, "pysms") + + sample_offset = 0 + pysms_size_new_data = 0 + current_frame = 0 + sms_next_read_sizes = [] + + while current_frame < num_frames: + sms_next_read_sizes.append(analysis_params.sizeNextRead) + sample_offset += pysms_size_new_data + if((sample_offset + analysis_params.sizeNextRead) < num_samples): + pysms_size_new_data = analysis_params.sizeNextRead + else: + pysms_size_new_data = num_samples - sample_offset + frame = audio_in[sample_offset:sample_offset + pysms_size_new_data] + analysis_data = pysms.SMS_Data() + pysms.sms_allocFrameH(sms_header, analysis_data) + status = pysms.sms_analyze(frame, analysis_data, analysis_params) + # as the no. of frames of delay is > num_frames, sms_analyze should + # never get around to performing partial tracking, and so the return + # value should be 0 + self.assertEquals(status, 0) + current_frame += 1 + + pysms.sms_freeAnalysis(analysis_params) + pysms.sms_closeSF() + pysms.sms_free() + + pd = simpl.SMSPeakDetection() + pd.hop_size = hop_size + current_frame = 0 + sample_offset = 0 + size_new_data = 0 + + while current_frame < num_frames: + self.assertEquals(sms_next_read_sizes[current_frame], pd.frame_size) + sample_offset += size_new_data + size_new_data = pd.frame_size + pd.find_peaks_in_frame(audio_in[sample_offset:sample_offset + size_new_data]) + pd.frame_size = pd._analysis_params.sizeNextRead + current_frame += 1 + + def test_peak_detection(self): + """test_peak_detection + Compare pysms Peaks with SMS peaks. Exact peak + information cannot be retrieved using libsms. Basic peak detection + is performed by sms_detectPeaks, but this is called multiple times + with different frame sizes by sms_analyze. This peak data cannot + be returned from sms_analyze without modifying it, so here + we compare the peaks to a slightly modified version of sms_analyze + from pysms. The peak values should be the same as those found by + the pysms find_peaks function. Analyses have to be performed + separately due to libsms implementation issues.""" + pysms.sms_init() + sms_header = pysms.SMS_Header() + analysis_params = pysms.SMS_AnalParams() + analysis_params.iSamplingRate = sampling_rate + analysis_params.iFrameRate = sampling_rate / hop_size + sms_header.nStochasticCoeff = 128 + analysis_params.fDefaultFundamental = 100 + analysis_params.fHighestFreq = 20000 + analysis_params.iMaxDelayFrames = num_frames + 1 + analysis_params.analDelay = 0 + analysis_params.minGoodFrames = 1 + analysis_params.iFormat = pysms.SMS_FORMAT_HP + analysis_params.nTracks = max_peaks + analysis_params.iWindowType = pysms.SMS_WIN_HAMMING + simplsms.sms_initAnalysis(analysis_params) + analysis_params.peakParams.iMaxPeaks = max_peaks + pysms.sms_fillHeader(sms_header, analysis_params, "pysms") + + sample_offset = 0 + size_new_data = 0 + current_frame = 0 + sms_peaks = [] + + while current_frame < num_frames: + sample_offset += size_new_data + if((sample_offset + analysis_params.sizeNextRead) < num_samples): + size_new_data = analysis_params.sizeNextRead + else: + size_new_data = num_samples - sample_offset + frame = audio_in[sample_offset:sample_offset + size_new_data] + analysis_data = pysms.SMS_Data() + pysms.sms_allocFrameH(sms_header, analysis_data) + status = pysms.sms_analyze(frame, analysis_data, analysis_params) + # as the no. of frames of delay is > num_frames, sms_analyze should + # never get around to performing partial tracking, and so the return + # value should be 0 + self.assertEquals(status, 0) + num_peaks = analysis_data.nTracks + frame_peaks = [] + pysms_freqs = simpl.zeros(num_peaks) + pysms_amps = simpl.zeros(num_peaks) + pysms_phases = simpl.zeros(num_peaks) + analysis_data.getSinFreq(pysms_freqs) + analysis_data.getSinAmp(pysms_amps) + analysis_data.getSinPhase(pysms_phases) + for i in range(num_peaks): + p = simpl.Peak() + p.amplitude = pysms_amps[i] + p.frequency = pysms_freqs[i] + p.phase = pysms_phases[i] + frame_peaks.append(p) + sms_peaks.append(frame_peaks) + current_frame += 1 + + pysms.sms_freeAnalysis(analysis_params) + pysms.sms_free() + + pd = simpl.SMSPeakDetection() + pd.hop_size = hop_size + pd.max_peaks = max_peaks + current_frame = 0 + sample_offset = 0 + size_new_data = 0 + pysms_peaks = [] + + while current_frame < num_frames: + sample_offset += size_new_data + size_new_data = pd.frame_size + pysms_peaks.append( + pd.find_peaks_in_frame(audio_in[sample_offset:sample_offset + size_new_data])) + pd.frame_size = pd._analysis_params.sizeNextRead + current_frame += 1 + + # make sure we have the same number of frames + self.assertEquals(len(sms_peaks), len(pysms_peaks)) + + for frame_number in range(len(sms_peaks)): + sms_frame = sms_peaks[frame_number] + pysms_frame = pysms_peaks[frame_number] + # make sure we have the same number of peaks in each frame + self.assertEquals(len(sms_frame), len(pysms_frame)) + # check peak values + for peak_number in range(len(sms_frame)): + sms_peak = sms_frame[peak_number] + pysms_peak = pysms_frame[peak_number] + self.assertAlmostEquals(sms_peak.amplitude, pysms_peak.amplitude, + places=FLOAT_PRECISION) + self.assertAlmostEquals(sms_peak.frequency, pysms_peak.frequency, + places=FLOAT_PRECISION) + self.assertAlmostEquals(sms_peak.phase, pysms_peak.phase, + places=FLOAT_PRECISION) + + def test_partial_tracking(self): + """test_partial_tracking + Compare pysms Partials with SMS partials.""" + pysms.sms_init() + sms_header = pysms.SMS_Header() + snd_header = pysms.SMS_SndHeader() + # Try to open the input file to fill snd_header + if(pysms.sms_openSF(input_file, snd_header)): + raise NameError("error opening sound file: " + pysms.sms_errorString()) + analysis_params = pysms.SMS_AnalParams() + analysis_params.iSamplingRate = sampling_rate + analysis_params.iFrameRate = sampling_rate / hop_size + sms_header.nStochasticCoeff = 128 + analysis_params.fDefaultFundamental = 100 + analysis_params.fHighestFreq = 20000 + analysis_params.iMaxDelayFrames = 3 + analysis_params.analDelay = 0 + analysis_params.minGoodFrames = 1 + analysis_params.iFormat = pysms.SMS_FORMAT_HP + analysis_params.nTracks = max_partials + analysis_params.nGuides = max_partials + analysis_params.iWindowType = pysms.SMS_WIN_HAMMING + pysms.sms_initAnalysis(analysis_params, snd_header) + analysis_params.nFrames = num_samples / hop_size + analysis_params.iSizeSound = num_samples + analysis_params.peakParams.iMaxPeaks = max_peaks + analysis_params.iStochasticType = pysms.SMS_STOC_NONE + pysms.sms_fillHeader(sms_header, analysis_params, "pysms") + + sample_offset = 0 + size_new_data = 0 + current_frame = 0 + sms_partials = [] + live_partials = [None for i in range(max_partials)] + do_analysis = True + + while do_analysis and (current_frame < num_frames): + sample_offset += size_new_data + if((sample_offset + analysis_params.sizeNextRead) < num_samples): + size_new_data = analysis_params.sizeNextRead + else: + size_new_data = num_samples - sample_offset + frame = audio_in[sample_offset:sample_offset + size_new_data] + analysis_data = pysms.SMS_Data() + pysms.sms_allocFrameH(sms_header, analysis_data) + status = pysms.sms_analyze(frame, analysis_data, analysis_params) + + if status == 1: + num_partials = analysis_data.nTracks + pysms_freqs = simpl.zeros(num_partials) + pysms_amps = simpl.zeros(num_partials) + pysms_phases = simpl.zeros(num_partials) + analysis_data.getSinFreq(pysms_freqs) + analysis_data.getSinAmp(pysms_amps) + analysis_data.getSinPhase(pysms_phases) + # make partial objects + for i in range(num_partials): + # for each partial, if the mag is > 0, this partial is alive + if pysms_amps[i] > 0: + # create a peak object + p = simpl.Peak() + p.amplitude = pysms_amps[i] + p.frequency = pysms_freqs[i] + p.phase = pysms_phases[i] + # add this peak to the appropriate partial + if not live_partials[i]: + live_partials[i] = simpl.Partial() + live_partials[i].starting_frame = current_frame + sms_partials.append(live_partials[i]) + live_partials[i].add_peak(p) + # if the mag is 0 and this partial was alive, kill it + else: + if live_partials[i]: + live_partials[i] = None + elif status == -1: + do_analysis = False + current_frame += 1 + + pysms.sms_freeAnalysis(analysis_params) + pysms.sms_closeSF() + pysms.sms_free() + + pd = simpl.SMSPeakDetection() + pd.max_peaks = max_peaks + pd.hop_size = hop_size + peaks = pd.find_peaks(audio_in) + pt = simpl.SMSPartialTracking() + pt.max_partials = max_partials + partials = pt.find_partials(peaks[0:num_frames]) + + # make sure both have the same number of partials + self.assertEquals(len(sms_partials), len(partials)) + + # make sure each partial is the same + for i in range(len(sms_partials)): + self.assertEquals(sms_partials[i].get_length(), partials[i].get_length()) + for peak_number in range(sms_partials[i].get_length()): + self.assertAlmostEquals(sms_partials[i].peaks[peak_number].amplitude, + partials[i].peaks[peak_number].amplitude, + places = FLOAT_PRECISION) + self.assertAlmostEquals(sms_partials[i].peaks[peak_number].frequency, + partials[i].peaks[peak_number].frequency, + places = FLOAT_PRECISION) + self.assertAlmostEquals(sms_partials[i].peaks[peak_number].phase, + partials[i].peaks[peak_number].phase, + places = FLOAT_PRECISION) + + def test_interpolate_frames(self): + """test_interpolate_frames + Make sure that pysms.sms_interpolateFrames returns the expected values + with interpolation factors of 0 and 1.""" + pysms.sms_init() + sms_header = pysms.SMS_Header() + snd_header = pysms.SMS_SndHeader() + # Try to open the input file to fill snd_header + if(pysms.sms_openSF(input_file, snd_header)): + raise NameError("error opening sound file: " + pysms.sms_errorString()) + analysis_params = pysms.SMS_AnalParams() + analysis_params.iSamplingRate = 44100 + analysis_params.iFrameRate = sampling_rate / hop_size + sms_header.nStochasticCoeff = 128 + analysis_params.fDefaultFundamental = 100 + analysis_params.fHighestFreq = 20000 + analysis_params.iMaxDelayFrames = 3 + analysis_params.analDelay = 0 + analysis_params.minGoodFrames = 1 + analysis_params.iFormat = pysms.SMS_FORMAT_HP + analysis_params.nTracks = max_partials + analysis_params.nGuides = max_partials + analysis_params.iWindowType = pysms.SMS_WIN_HAMMING + pysms.sms_initAnalysis(analysis_params, snd_header) + analysis_params.nFrames = num_samples / hop_size + analysis_params.iSizeSound = num_samples + analysis_params.peakParams.iMaxPeaks = max_peaks + analysis_params.iStochasticType = pysms.SMS_STOC_NONE + pysms.sms_fillHeader(sms_header, analysis_params, "pysms") + interp_frame = pysms.SMS_Data() + pysms.sms_allocFrame(interp_frame, sms_header.nTracks, sms_header.nStochasticCoeff, 1, sms_header.iStochasticType, 0) + + sample_offset = 0 + size_new_data = 0 + current_frame = 0 + sms_header.nFrames = num_frames + analysis_frames = [] + do_analysis = True + + while do_analysis and (current_frame < num_frames): + sample_offset += size_new_data + if((sample_offset + analysis_params.sizeNextRead) < num_samples): + size_new_data = analysis_params.sizeNextRead + else: + size_new_data = num_samples - sample_offset + frame = audio_in[sample_offset:sample_offset + size_new_data] + analysis_data = pysms.SMS_Data() + pysms.sms_allocFrameH(sms_header, analysis_data) + status = pysms.sms_analyze(frame, analysis_data, analysis_params) + + if status == 1: + analysis_frames.append(analysis_data) + # test interpolateFrames on the last two analysis frames + if current_frame == num_frames - 1: + left_frame = analysis_frames[-2] + right_frame = analysis_frames[-1] + pysms.sms_interpolateFrames(left_frame, right_frame, interp_frame, 0) + # make sure that interp_frame == left_frame + # interpolateFrames doesn't interpolate phases so ignore + left_amps = simpl.zeros(max_partials) + left_freqs = simpl.zeros(max_partials) + left_frame.getSinAmp(left_amps) + left_frame.getSinFreq(left_freqs) + right_amps = simpl.zeros(max_partials) + right_freqs = simpl.zeros(max_partials) + right_frame.getSinAmp(right_amps) + right_frame.getSinFreq(right_freqs) + interp_amps = simpl.zeros(max_partials) + interp_freqs = simpl.zeros(max_partials) + interp_frame.getSinAmp(interp_amps) + interp_frame.getSinFreq(interp_freqs) + for i in range(max_partials): + self.assertAlmostEquals(left_amps[i], interp_amps[i], + places = FLOAT_PRECISION) + if left_freqs[i] != 0: + self.assertAlmostEquals(left_freqs[i], interp_freqs[i], + places = FLOAT_PRECISION) + else: + self.assertAlmostEquals(right_freqs[i], interp_freqs[i], + places = FLOAT_PRECISION) + pysms.sms_interpolateFrames(left_frame, right_frame, interp_frame, 1) + interp_amps = simpl.zeros(max_partials) + interp_freqs = simpl.zeros(max_partials) + interp_frame.getSinAmp(interp_amps) + interp_frame.getSinFreq(interp_freqs) + for i in range(max_partials): + self.assertAlmostEquals(right_amps[i], interp_amps[i], + places = FLOAT_PRECISION) + if right_freqs[i] != 0: + self.assertAlmostEquals(right_freqs[i], interp_freqs[i], + places = FLOAT_PRECISION) + else: + self.assertAlmostEquals(left_freqs[i], interp_freqs[i], + places = FLOAT_PRECISION) + elif status == -1: + raise Exception("AnalysisStoppedEarly") + current_frame += 1 + + pysms.sms_freeAnalysis(analysis_params) + pysms.sms_closeSF() + + def test_harmonic_synthesis(self): + """test_harmonic_synthesis + Compare pysms synthesised harmonic component with SMS synthesised + harmonic component.""" + pysms.sms_init() + sms_header = pysms.SMS_Header() + snd_header = pysms.SMS_SndHeader() + # Try to open the input file to fill snd_header + if(pysms.sms_openSF(input_file, snd_header)): + raise NameError("error opening sound file: " + pysms.sms_errorString()) + analysis_params = pysms.SMS_AnalParams() + analysis_params.iSamplingRate = 44100 + analysis_params.iFrameRate = sampling_rate / hop_size + sms_header.nStochasticCoeff = 128 + analysis_params.fDefaultFundamental = 100 + analysis_params.fHighestFreq = 20000 + analysis_params.iMaxDelayFrames = 3 + analysis_params.analDelay = 0 + analysis_params.minGoodFrames = 1 + analysis_params.iFormat = pysms.SMS_FORMAT_HP + analysis_params.nTracks = max_partials + analysis_params.nGuides = max_partials + analysis_params.iWindowType = pysms.SMS_WIN_HAMMING + pysms.sms_initAnalysis(analysis_params, snd_header) + analysis_params.nFrames = num_samples / hop_size + analysis_params.iSizeSound = num_samples + analysis_params.peakParams.iMaxPeaks = max_peaks + analysis_params.iStochasticType = pysms.SMS_STOC_NONE + pysms.sms_fillHeader(sms_header, analysis_params, "pysms") + + sample_offset = 0 + size_new_data = 0 + current_frame = 0 + sms_header.nFrames = num_frames + analysis_frames = [] + do_analysis = True + + while do_analysis and (current_frame < num_frames): + sample_offset += size_new_data + if((sample_offset + analysis_params.sizeNextRead) < num_samples): + size_new_data = analysis_params.sizeNextRead + else: + size_new_data = num_samples - sample_offset + frame = audio_in[sample_offset:sample_offset + size_new_data] + analysis_data = pysms.SMS_Data() + pysms.sms_allocFrameH(sms_header, analysis_data) + status = pysms.sms_analyze(frame, analysis_data, analysis_params) + analysis_frames.append(analysis_data) + if status == -1: + do_analysis = False + current_frame += 1 + + pysms.sms_freeAnalysis(analysis_params) + pysms.sms_closeSF() + + interp_frame = pysms.SMS_Data() + synth_params = pysms.SMS_SynthParams() + synth_params.iSynthesisType = pysms.SMS_STYPE_DET + synth_params.iDetSynthType = pysms.SMS_DET_SIN + synth_params.sizeHop = hop_size + synth_params.iSamplingRate = 0 + + pysms.sms_initSynth(sms_header, synth_params) + pysms.sms_allocFrame(interp_frame, sms_header.nTracks, sms_header.nStochasticCoeff, 1, sms_header.iStochasticType, sms_header.nEnvCoeff) + + synth_samples = pysms.zeros(synth_params.sizeHop) + num_synth_samples = 0 + target_synth_samples = len(analysis_frames) * hop_size + pysms_audio = pysms.array([]) + current_frame = 0 + + while num_synth_samples < target_synth_samples: + pysms.sms_synthesize(analysis_frames[current_frame], synth_samples, synth_params) + pysms_audio = np.hstack((pysms_audio, synth_samples)) + num_synth_samples += synth_params.sizeHop + current_frame += 1 + + pysms.sms_freeSynth(synth_params) + pysms.sms_free() + + pd = simpl.SMSPeakDetection() + pd.max_peaks = max_peaks + pd.hop_size = hop_size + pt = simpl.SMSPartialTracking() + pt.max_partials = max_partials + peaks = pd.find_peaks(audio_in) + partials = pt.find_partials(peaks[0:num_frames]) + synth = simpl.SMSSynthesis() + synth.hop_size = hop_size + synth.stochastic_type = pysms.SMS_STOC_NONE + synth.synthesis_type = pysms.SMS_STYPE_DET + synth.max_partials = max_partials + simpl_audio = synth.synth(partials) + + self.assertEquals(pysms_audio.size, simpl_audio.size) + for i in range(simpl_audio.size): + self.assertAlmostEquals(pysms_audio[i], simpl_audio[i], + places = FLOAT_PRECISION) + + def test_residual_synthesis(self): + """test_residual_synthesis + Compare pysms residual signal with SMS residual""" + pysms.sms_init() + sms_header = pysms.SMS_Header() + snd_header = pysms.SMS_SndHeader() + # Try to open the input file to fill snd_header + if(pysms.sms_openSF(input_file, snd_header)): + raise NameError("error opening sound file: " + pysms.sms_errorString()) + analysis_params = pysms.SMS_AnalParams() + analysis_params.iSamplingRate = 44100 + analysis_params.iFrameRate = sampling_rate / hop_size + sms_header.nStochasticCoeff = 128 + analysis_params.fDefaultFundamental = 100 + analysis_params.fHighestFreq = 20000 + analysis_params.iMaxDelayFrames = 3 + analysis_params.analDelay = 0 + analysis_params.minGoodFrames = 1 + analysis_params.iFormat = pysms.SMS_FORMAT_HP + analysis_params.nTracks = max_partials + analysis_params.nGuides = max_partials + analysis_params.iWindowType = pysms.SMS_WIN_HAMMING + pysms.sms_initAnalysis(analysis_params, snd_header) + analysis_params.nFrames = num_samples / hop_size + analysis_params.iSizeSound = num_samples + analysis_params.peakParams.iMaxPeaks = max_peaks + analysis_params.iStochasticType = pysms.SMS_STOC_APPROX + pysms.sms_fillHeader(sms_header, analysis_params, "pysms") + + sample_offset = 0 + size_new_data = 0 + current_frame = 0 + sms_header.nFrames = num_frames + analysis_frames = [] + do_analysis = True + + while do_analysis and (current_frame < num_frames-1): + sample_offset += size_new_data + if((sample_offset + analysis_params.sizeNextRead) < num_samples): + size_new_data = analysis_params.sizeNextRead + else: + size_new_data = num_samples - sample_offset + frame = audio_in[sample_offset:sample_offset + size_new_data] + analysis_data = pysms.SMS_Data() + pysms.sms_allocFrameH(sms_header, analysis_data) + status = pysms.sms_analyze(frame, analysis_data, analysis_params) + analysis_frames.append(analysis_data) + if status == -1: + do_analysis = False + current_frame += 1 + + pysms.sms_freeAnalysis(analysis_params) + pysms.sms_closeSF() + pysms.sms_free() + + pd = simpl.SMSPeakDetection() + pd.max_peaks = max_peaks + pd.hop_size = hop_size + pt = simpl.SMSPartialTracking() + pt.max_partials = max_partials + peaks = pd.find_peaks(audio_in) + partials = pt.find_partials(peaks[0:num_frames]) + synth = simpl.SMSSynthesis() + synth.hop_size = hop_size + synth.stochastic_type = pysms.SMS_STOC_NONE + synth.synthesis_type = pysms.SMS_STYPE_DET + synth.max_partials = max_partials + simpl_harmonic = synth.synth(partials) + res = simpl.SMSResidual() + res.num_coefficients = 128 + res.type = simpl.SMSResidual.TIME_DOMAIN + residual = res.find_residual(simpl_harmonic, audio_in[0:simpl_harmonic.size]) +# print_partials(partials) +# print simpl_harmonic.size +# for i in range(residual.size): +# print residual[i] +# for i in range(simpl_harmonic.size): +# print simpl_harmonic[i] +# from pylab import plot, show +# plot(simpl_harmonic) +# plot(residual) +# plot(audio_in[0:simpl_harmonic.size]) +# show() +# from scipy.io.wavfile import write +# write("res.wav", 44100, residual) +# res.synth(simpl_harmonic, audio_in) + +if __name__ == '__main__': + suite = unittest.TestSuite() + suite.addTest(TestSimplSMS('test_size_next_read')) + suite.addTest(TestSimplSMS('test_peak_detection')) + suite.addTest(TestSimplSMS('test_partial_tracking')) + suite.addTest(TestSimplSMS('test_interpolate_frames')) + suite.addTest(TestSimplSMS('test_harmonic_synthesis')) + suite.addTest(TestSimplSMS('test_residual_synthesis')) + unittest.TextTestRunner().run(suite)
\ No newline at end of file diff --git a/tests/testsndobj.py b/tests/testsndobj.py new file mode 100644 index 0000000..7ef0a85 --- /dev/null +++ b/tests/testsndobj.py @@ -0,0 +1,389 @@ +# Copyright (c) 2009 John Glover, National University of Ireland, Maynooth +# +# This program is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation; either version 2 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with this program; if not, write to the Free Software +# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + +import unittest +import sndobj +import simpl +from simpl import pysndobj +from scipy.io.wavfile import read +import numpy as np + +FLOAT_PRECISION = 2 # number of decimal places to check for accuracy + +class TestSimplSndObj(unittest.TestCase): + def setUp(self): + self.input_file = 'audio/flute.wav' + + def test_sndobj_numpy(self): + "Test reading and writing numpy data in SndObjs" + frame_size = 2048 + hop_size = 2048 + num_frames = 4 + num_samples = frame_size + (num_frames * hop_size) + + audio_in_data = read(self.input_file) + audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 + audio_in = audio_in[0:num_samples] + frame = np.zeros(frame_size, dtype=np.float32) + frame_out = np.zeros(hop_size, dtype=np.float32) + audio_out = np.array([]) + + input = pysndobj.SndObj() + input.SetVectorSize(frame_size) + + i = 0 + while (i + frame_size) <= num_samples: + frame = audio_in[i:i+frame_size] + input.PushIn(frame) + input.PopOut(frame_out) + audio_out = np.hstack((audio_out, frame_out)) + i += hop_size + + self.assertEqual(audio_in.size, audio_out.size) + for i in range(audio_out.size): + self.assertEqual(audio_in[i], audio_out[i]) + + def test_hammingtable(self): + "Compare sndobj.HammingTable with simplsndobj.HammingTable" + frame_size = 2048 + window1 = sndobj.HammingTable(frame_size, 0.5) + window2 = pysndobj.HammingTable(frame_size, 0.5) + for i in range(frame_size): + self.assertEqual(window1.Lookup(i), window2.Lookup(i)) + + def test_ifgram(self): + "Compare sndobj.IFGram with simplsndobj.IFGram" + frame_size = 2048 + hop_size = 512 + num_frames = 4 + num_samples = frame_size + ((num_frames - 1) * hop_size) + + audio_in_data = read(self.input_file) + audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 + audio_in = audio_in[0:num_samples] + frame = np.zeros(frame_size, dtype=np.float32) + + sndobj_input = sndobj.SndObj() + simpl_input = pysndobj.SndObj() + sndobj_input.SetVectorSize(frame_size) + simpl_input.SetVectorSize(frame_size) + sndobj_window = sndobj.HammingTable(frame_size, 0.5) + simpl_window = pysndobj.HammingTable(frame_size, 0.5) + sndobj_ifgram = sndobj.IFGram(sndobj_window, sndobj_input, 1, frame_size, hop_size) + simpl_ifgram = pysndobj.IFGram(simpl_window, simpl_input, 1, frame_size, hop_size) + + i = 0 + while (i + frame_size) <= num_samples: + frame = audio_in[i:i+frame_size] + sndobj_input.PushIn(frame) + simpl_input.PushIn(frame) + sndobj_ifgram.DoProcess() + simpl_ifgram.DoProcess() + for j in range(frame_size): + self.assertAlmostEquals(sndobj_ifgram.Output(j), simpl_ifgram.Output(j), + places = FLOAT_PRECISION) + i += hop_size + + def test_sinanal(self): + "Compare sndobj.SinAnal with simplsndobj.SinAnal" + frame_size = 2048 + hop_size = 512 + max_tracks = 20 + num_frames = 4 + num_samples = frame_size + ((num_frames - 1) * hop_size) + + audio_in_data = read(self.input_file) + audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 + audio_in = audio_in[0:num_samples] + frame = np.zeros(frame_size, dtype=np.float32) + + sndobj_input = sndobj.SndObj() + simpl_input = pysndobj.SndObj() + sndobj_input.SetVectorSize(frame_size) + simpl_input.SetVectorSize(frame_size) + sndobj_window = sndobj.HammingTable(frame_size, 0.5) + simpl_window = pysndobj.HammingTable(frame_size, 0.5) + sndobj_ifgram = sndobj.IFGram(sndobj_window, sndobj_input, 1, frame_size, hop_size) + simpl_ifgram = pysndobj.IFGram(simpl_window, simpl_input, 1, frame_size, hop_size) + sndobj_sinmod = sndobj.SinAnal(sndobj_ifgram, 0.003, max_tracks, 1, 3) + simpl_sinmod = pysndobj.SinAnal(simpl_ifgram, 0.003, max_tracks, 1, 3) + + i = 0 + while (i + frame_size) <= num_samples: + frame = audio_in[i:i+frame_size] + sndobj_input.PushIn(frame) + simpl_input.PushIn(frame) + sndobj_ifgram.DoProcess() + simpl_ifgram.DoProcess() + sndobj_sinmod.DoProcess() + simpl_sinmod.DoProcess() + for j in range(max_tracks * 3): + self.assertAlmostEquals(sndobj_sinmod.Output(j), simpl_sinmod.Output(j), + places = FLOAT_PRECISION) + i += hop_size + + def test_adsyn_doprocess(self): + "Compare sndobj.AdSyn with simplsndobj.AdSyn" + frame_size = 2048 + hop_size = 512 + max_tracks = 20 + num_frames = 4 + num_samples = frame_size + ((num_frames - 1) * hop_size) + + audio_in_data = read(self.input_file) + audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 + audio_in = audio_in[0:num_samples] + frame = np.zeros(frame_size, dtype=np.float32) + sndobj_frame_out = np.zeros(hop_size, dtype=np.float32) + simpl_frame_out = np.zeros(hop_size, dtype=np.float32) + sndobj_audio_out = np.array([]) + simpl_audio_out = np.array([]) + + sndobj_input = sndobj.SndObj() + simpl_input = pysndobj.SndObj() + sndobj_input.SetVectorSize(frame_size) + simpl_input.SetVectorSize(frame_size) + sndobj_window = sndobj.HammingTable(frame_size, 0.5) + simpl_window = pysndobj.HammingTable(frame_size, 0.5) + sndobj_ifgram = sndobj.IFGram(sndobj_window, sndobj_input, 1, frame_size, hop_size) + simpl_ifgram = pysndobj.IFGram(simpl_window, simpl_input, 1, frame_size, hop_size) + sndobj_sinmod = sndobj.SinAnal(sndobj_ifgram, 0.003, max_tracks, 1, 3) + simpl_sinmod = pysndobj.SinAnal(simpl_ifgram, 0.003, max_tracks, 1, 3) + sndobj_table = sndobj.HarmTable(10000, 1, 1, 0.25) + simpl_table = pysndobj.HarmTable(10000, 1, 1, 0.25) + sndobj_synth = sndobj.AdSyn(sndobj_sinmod, max_tracks, sndobj_table, 1, 1, hop_size) + simpl_synth = pysndobj.AdSyn(simpl_sinmod, max_tracks, simpl_table, 1, 1, hop_size) + + i = 0 + while (i + frame_size) <= num_samples: + frame = audio_in[i:i+frame_size] + sndobj_input.PushIn(frame) + simpl_input.PushIn(frame) + sndobj_ifgram.DoProcess() + simpl_ifgram.DoProcess() + sndobj_sinmod.DoProcess() + simpl_sinmod.DoProcess() + sndobj_synth.DoProcess() + simpl_synth.DoProcess() + sndobj_synth.PopOut(sndobj_frame_out) + simpl_synth.PopOut(simpl_frame_out) + sndobj_audio_out = np.hstack((sndobj_audio_out, sndobj_frame_out)) + simpl_audio_out = np.hstack((simpl_audio_out, simpl_frame_out)) + i += hop_size + + self.assertEqual(sndobj_audio_out.size, simpl_audio_out.size) + for i in range(sndobj_audio_out.size): + self.assertAlmostEquals(sndobj_audio_out[i], simpl_audio_out[i], + places = FLOAT_PRECISION) + + def test_sinsyn_doprocess(self): + "Compare sndobj.SinSyn with pysndobj.SinSyn" + frame_size = 2048 + hop_size = 512 + max_tracks = 20 + num_frames = 4 + num_samples = frame_size + ((num_frames - 1) * hop_size) + + audio_in_data = read(self.input_file) + audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 + audio_in = audio_in[0:num_samples] + frame = np.zeros(frame_size, dtype=np.float32) + sndobj_frame_out = np.zeros(hop_size, dtype=np.float32) + simpl_frame_out = np.zeros(hop_size, dtype=np.float32) + sndobj_audio_out = np.array([]) + simpl_audio_out = np.array([]) + + sndobj_input = sndobj.SndObj() + simpl_input = pysndobj.SndObj() + sndobj_input.SetVectorSize(frame_size) + simpl_input.SetVectorSize(frame_size) + sndobj_window = sndobj.HammingTable(frame_size, 0.5) + simpl_window = pysndobj.HammingTable(frame_size, 0.5) + sndobj_ifgram = sndobj.IFGram(sndobj_window, sndobj_input, 1, frame_size, hop_size) + simpl_ifgram = pysndobj.IFGram(simpl_window, simpl_input, 1, frame_size, hop_size) + sndobj_sinmod = sndobj.SinAnal(sndobj_ifgram, 0.003, max_tracks, 1, 3) + simpl_sinmod = pysndobj.SinAnal(simpl_ifgram, 0.003, max_tracks, 1, 3) + sndobj_table = sndobj.HarmTable(10000, 1, 1, 0.25) + simpl_table = pysndobj.HarmTable(10000, 1, 1, 0.25) + sndobj_synth = sndobj.SinSyn(sndobj_sinmod, max_tracks, sndobj_table, 1, hop_size) + simpl_synth = pysndobj.SinSyn(simpl_sinmod, max_tracks, simpl_table, 1, hop_size) + + i = 0 + while (i + frame_size) <= num_samples: + frame = audio_in[i:i+frame_size] + sndobj_input.PushIn(frame) + simpl_input.PushIn(frame) + sndobj_ifgram.DoProcess() + simpl_ifgram.DoProcess() + sndobj_sinmod.DoProcess() + simpl_sinmod.DoProcess() + sndobj_synth.DoProcess() + simpl_synth.DoProcess() + sndobj_synth.PopOut(sndobj_frame_out) + simpl_synth.PopOut(simpl_frame_out) + sndobj_audio_out = np.hstack((sndobj_audio_out, sndobj_frame_out)) + simpl_audio_out = np.hstack((simpl_audio_out, simpl_frame_out)) + i += hop_size + + self.assertEqual(sndobj_audio_out.size, simpl_audio_out.size) + for i in range(sndobj_audio_out.size): + self.assertAlmostEquals(sndobj_audio_out[i], simpl_audio_out[i], + places = FLOAT_PRECISION) + + def test_peak_detection(self): + "Compare pysndobj Peaks with SndObj peaks" + frame_size = 2048 + hop_size = 512 + num_frames = 4 + max_peaks = 20 + max_tracks = 20 + num_samples = frame_size + ((num_frames - 1) * hop_size) + + audio_in_data = read(self.input_file) + audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 + audio_in = audio_in[0:num_samples] + frame = np.zeros(frame_size, dtype=np.float32) + + sndobj_input = sndobj.SndObj() + sndobj_input.SetVectorSize(frame_size) + sndobj_window = sndobj.HammingTable(frame_size, 0.5) + sndobj_ifgram = sndobj.IFGram(sndobj_window, sndobj_input, 1, frame_size, hop_size) + simpl_sinmod = pysndobj.SinAnal(sndobj_ifgram, 0.003, max_tracks, 1, 3) + + pd = simpl.SndObjPeakDetection() + pd.max_peaks = max_peaks + + i = 0 + while (i + frame_size) <= num_samples: + frame = audio_in[i:i+frame_size] + sndobj_input.PushIn(frame) + sndobj_ifgram.DoProcess() + num_peaks_found = simpl_sinmod.FindPeaks() + + frame = audio_in[i:i+frame_size] + peaks = pd.find_peaks(frame) + self.assertEquals(len(peaks), 1) + peaks = peaks[0] + + self.assertEquals(num_peaks_found, len(peaks)) + for j in range(num_peaks_found): + self.assertAlmostEquals(peaks[j].amplitude, simpl_sinmod.Output(j*3), + places=FLOAT_PRECISION) + self.assertAlmostEquals(peaks[j].frequency, simpl_sinmod.Output((j*3)+1), + places=FLOAT_PRECISION) + self.assertAlmostEquals(peaks[j].phase, simpl_sinmod.Output((j*3)+2), + places=FLOAT_PRECISION) + i += hop_size + + def test_partial_tracking(self): + "Compare pysndobj Partials with SndObj tracks" + frame_size = 2048 + hop_size = 512 + num_frames = 4 + max_tracks = 20 + max_peaks = 20 + num_samples = frame_size + ((num_frames - 1) * hop_size) + + audio_in_data = read(self.input_file) + audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 + audio_in = audio_in[0:num_samples] + frame = np.zeros(frame_size, dtype=np.float32) + + sndobj_input = sndobj.SndObj() + sndobj_input.SetVectorSize(frame_size) + sndobj_window = sndobj.HammingTable(frame_size, 0.5) + sndobj_ifgram = sndobj.IFGram(sndobj_window, sndobj_input, 1, frame_size, hop_size) + sndobj_sinmod = pysndobj.SinAnal(sndobj_ifgram, 0.003, max_tracks, 1, 3) + + pd = simpl.SndObjPeakDetection() + pd.max_peaks = max_peaks + pt = simpl.SndObjPartialTracking() + pt.max_partials = max_tracks + + i = 0 + while (i + frame_size) <= num_samples: + frame = audio_in[i:i+frame_size] + sndobj_input.PushIn(frame) + sndobj_ifgram.DoProcess() + sndobj_sinmod.DoProcess() + + frame = audio_in[i:i+frame_size] + peaks = pd.find_peaks(frame)[0] + partials = pt.update_partials(peaks, i/hop_size) + + num_sndobj_partials = sndobj_sinmod.GetTracks() + num_simpl_partials = len(partials) + self.assertEquals(num_sndobj_partials, num_simpl_partials) + + for j in range(num_simpl_partials): + self.assertAlmostEquals(partials[j].amplitude, sndobj_sinmod.Output(j*3), + places=FLOAT_PRECISION) + self.assertAlmostEquals(partials[j].frequency, sndobj_sinmod.Output((j*3)+1), + places=FLOAT_PRECISION) + self.assertAlmostEquals(partials[j].phase, sndobj_sinmod.Output((j*3)+2), + places=FLOAT_PRECISION) + i += hop_size + + def test_synthesis(self): + "Compare pysndobj synthesised audio with SndObj synthesised audio" + frame_size = 2048 + hop_size = 512 + num_frames = 4 + max_tracks = 20 + max_peaks = 20 + num_samples = frame_size + ((num_frames - 1) * hop_size) + + audio_in_data = read(self.input_file) + audio_in = np.asarray(audio_in_data[1], np.float32) / 32768.0 + audio_in = audio_in[0:num_samples] + frame = np.zeros(frame_size, dtype=np.float32) + sndobj_frame_out = np.zeros(hop_size, dtype=np.float32) + sndobj_audio_out = np.array([]) + + sndobj_input = sndobj.SndObj() + sndobj_input.SetVectorSize(frame_size) + sndobj_window = sndobj.HammingTable(frame_size, 0.5) + sndobj_ifgram = sndobj.IFGram(sndobj_window, sndobj_input, 1, frame_size, hop_size) + sndobj_sinmod = pysndobj.SinAnal(sndobj_ifgram, 0.003, max_tracks, 1, 3) + sndobj_table = sndobj.HarmTable(10000, 1, 1, 0.25) + sndobj_synth = sndobj.AdSyn(sndobj_sinmod, max_tracks, sndobj_table, 1, 1, hop_size) + + i = 0 + while (i + frame_size) <= num_samples: + frame = audio_in[i:i+frame_size] + sndobj_input.PushIn(frame) + sndobj_ifgram.DoProcess() + sndobj_sinmod.DoProcess() + sndobj_synth.DoProcess() + sndobj_synth.PopOut(sndobj_frame_out) + sndobj_audio_out = np.hstack((sndobj_audio_out, sndobj_frame_out)) + i += hop_size + + pd = simpl.SndObjPeakDetection() + pd.max_peaks = max_peaks + pt = simpl.SndObjPartialTracking() + pt.max_partials = max_tracks + peaks = pd.find_peaks(audio_in) + partials = pt.find_partials(peaks) + synth = simpl.SndObjSynthesis() + simpl_audio_out = synth.synth(partials) + self.assertEquals(sndobj_audio_out.size, simpl_audio_out.size) + for i in range(simpl_audio_out.size): + self.assertAlmostEquals(sndobj_audio_out[i], simpl_audio_out[i], + places = FLOAT_PRECISION) + +if __name__ == '__main__': + unittest.main()
\ No newline at end of file |