summaryrefslogtreecommitdiff
path: root/tests
diff options
context:
space:
mode:
Diffstat (limited to 'tests')
-rw-r--r--tests/Makefile19
-rw-r--r--tests/create_libsms_test_data.py345
-rw-r--r--tests/debug.py29
-rw-r--r--tests/signals.py16
-rw-r--r--tests/simpl.supp19
-rw-r--r--tests/test_base.cpp370
-rw-r--r--tests/test_base.py70
-rw-r--r--tests/test_lp.py22
-rw-r--r--tests/test_partial_tracking.py108
-rw-r--r--tests/test_peak_detection.py104
-rw-r--r--tests/test_peakdetection.py24
-rw-r--r--tests/test_residual.py95
-rw-r--r--tests/test_sms.py1266
-rw-r--r--tests/test_sms_old.py126
-rw-r--r--tests/test_sndobj.py19
-rw-r--r--tests/test_synthesis.py126
16 files changed, 1261 insertions, 1497 deletions
diff --git a/tests/Makefile b/tests/Makefile
new file mode 100644
index 0000000..c5374f3
--- /dev/null
+++ b/tests/Makefile
@@ -0,0 +1,19 @@
+CC=g++
+CFLAGS=-Wall -c -g
+
+all: testbase
+
+testbase: testbase.o base.o exceptions.o
+ $(CC) testbase.o base.o exceptions.o -o testbase -lcppunit
+
+testbase.o: testbase.cpp
+ $(CC) $(CFLAGS) testbase.cpp
+
+base.o: ../src/simpl/base.cpp
+ $(CC) $(CFLAGS) ../src/simpl/base.cpp
+
+exceptions.o: ../src/simpl/exceptions.cpp
+ $(CC) $(CFLAGS) ../src/simpl/exceptions.cpp
+
+clean:
+ rm -rf *.o testbase
diff --git a/tests/create_libsms_test_data.py b/tests/create_libsms_test_data.py
new file mode 100644
index 0000000..05b8cee
--- /dev/null
+++ b/tests/create_libsms_test_data.py
@@ -0,0 +1,345 @@
+import os
+import json
+import numpy as np
+import scipy.io.wavfile as wav
+import pysms
+import simpl
+
+float_precision = 5
+frame_size = 512
+hop_size = 512
+max_peaks = 10
+max_partials = 10
+num_frames = 30
+num_samples = num_frames * hop_size
+audio_path = os.path.join(
+ os.path.dirname(__file__), 'audio/flute.wav'
+)
+
+audio, sampling_rate = simpl.read_wav(audio_path)
+
+
+def _pysms_analysis_params(sampling_rate):
+ analysis_params = pysms.SMS_AnalParams()
+ pysms.sms_initAnalParams(analysis_params)
+ analysis_params.iSamplingRate = sampling_rate
+ analysis_params.iFrameRate = sampling_rate / hop_size
+ analysis_params.iWindowType = pysms.SMS_WIN_HAMMING
+ analysis_params.fHighestFreq = 20000
+ analysis_params.iFormat = pysms.SMS_FORMAT_HP
+ analysis_params.nTracks = max_peaks
+ analysis_params.peakParams.iMaxPeaks = max_peaks
+ analysis_params.nGuides = max_peaks
+ analysis_params.iMaxDelayFrames = 4
+ analysis_params.analDelay = 0
+ analysis_params.minGoodFrames = 1
+ analysis_params.iCleanTracks = 0
+ analysis_params.iStochasticType = pysms.SMS_STOC_NONE
+ analysis_params.preEmphasis = 0
+ return analysis_params
+
+
+def _pysms_synthesis_params(sampling_rate):
+ synth_params = pysms.SMS_SynthParams()
+ pysms.sms_initSynthParams(synth_params)
+ synth_params.iSamplingRate = sampling_rate
+ synth_params.iSynthesisType = pysms.SMS_STYPE_DET
+ synth_params.iStochasticType = pysms.SMS_STOC_NONE
+ synth_params.sizeHop = hop_size
+ synth_params.nTracks = max_partials
+ synth_params.deEmphasis = 0
+ return synth_params
+
+
+def _size_next_read():
+ pysms.sms_init()
+ snd_header = pysms.SMS_SndHeader()
+
+ # Try to open the input file to fill snd_header
+ if(pysms.sms_openSF(audio_path, snd_header)):
+ raise NameError(
+ "error opening sound file: " + pysms.sms_errorString()
+ )
+
+ analysis_params = _pysms_analysis_params(sampling_rate)
+ analysis_params.iMaxDelayFrames = num_frames + 1
+ if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
+ raise Exception("Error allocating memory for analysis_params")
+ analysis_params.nFrames = num_frames
+ sms_header = pysms.SMS_Header()
+ pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
+
+ sample_offset = 0
+ pysms_size_new_data = 0
+ current_frame = 0
+ next_read_sizes = []
+
+ while current_frame < num_frames:
+ next_read_sizes.append(analysis_params.sizeNextRead)
+ sample_offset += pysms_size_new_data
+ pysms_size_new_data = analysis_params.sizeNextRead
+
+ # convert frame to floats for libsms
+ frame = audio[sample_offset:sample_offset + pysms_size_new_data]
+ frame = np.array(frame, dtype=np.float32)
+ if len(frame) < pysms_size_new_data:
+ frame = np.hstack((
+ frame, np.zeros(pysms_size_new_data - len(frame),
+ dtype=np.float32)
+ ))
+
+ analysis_data = pysms.SMS_Data()
+ pysms.sms_allocFrameH(sms_header, analysis_data)
+ status = pysms.sms_analyze(frame, analysis_data, analysis_params)
+ # as the no. of frames of delay is > num_frames, sms_analyze should
+ # never get around to performing partial tracking, and so the
+ # return value should be 0
+ assert status == 0
+ pysms.sms_freeFrame(analysis_data)
+ current_frame += 1
+
+ pysms.sms_freeAnalysis(analysis_params)
+ pysms.sms_closeSF()
+ pysms.sms_free()
+
+ return next_read_sizes
+
+
+def _partial_tracking():
+ pysms.sms_init()
+ snd_header = pysms.SMS_SndHeader()
+
+ if(pysms.sms_openSF(audio_path, snd_header)):
+ raise NameError(pysms.sms_errorString())
+
+ analysis_params = _pysms_analysis_params(sampling_rate)
+ if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
+ raise Exception("Error allocating memory for analysis_params")
+ analysis_params.iSizeSound = num_samples
+ analysis_params.nFrames = num_frames
+ sms_header = pysms.SMS_Header()
+ pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
+
+ sample_offset = 0
+ size_new_data = 0
+ current_frame = 0
+ sms_frames = []
+ do_analysis = True
+
+ while do_analysis and (current_frame < num_frames):
+ sample_offset += size_new_data
+ size_new_data = analysis_params.sizeNextRead
+
+ frame_audio = audio[sample_offset:sample_offset + size_new_data]
+ frame_audio = np.array(frame_audio, dtype=np.float32)
+ if len(frame_audio) < size_new_data:
+ frame_audio = np.hstack((
+ frame_audio, np.zeros(size_new_data - len(frame_audio),
+ dtype=np.float32)
+ ))
+
+ analysis_data = pysms.SMS_Data()
+ pysms.sms_allocFrameH(sms_header, analysis_data)
+ num_partials = analysis_data.nTracks
+ status = pysms.sms_analyze(frame_audio, analysis_data,
+ analysis_params)
+
+ sms_freqs = np.zeros(num_partials, dtype=np.float32)
+ sms_amps = np.zeros(num_partials, dtype=np.float32)
+ sms_phases = np.zeros(num_partials, dtype=np.float32)
+
+ frame = {'status': status}
+ frame['partials'] = []
+
+ if status == 1:
+ analysis_data.getSinFreq(sms_freqs)
+ analysis_data.getSinAmp(sms_amps)
+ analysis_data.getSinPhase(sms_phases)
+ current_frame += 1
+
+ if status == -1:
+ do_analysis = False
+
+ for i in range(num_partials):
+ frame['partials'].append({
+ 'n': i,
+ 'amplitude': float(sms_amps[i]),
+ 'frequency': float(sms_freqs[i]),
+ 'phase': float(sms_phases[i])
+ })
+
+ sms_frames.append(frame)
+ pysms.sms_freeFrame(analysis_data)
+
+ pysms.sms_freeAnalysis(analysis_params)
+ pysms.sms_closeSF()
+ pysms.sms_free()
+
+ return sms_frames
+
+
+def _harmonic_synthesis(det_synth_type):
+ pysms.sms_init()
+ snd_header = pysms.SMS_SndHeader()
+
+ if(pysms.sms_openSF(audio_path, snd_header)):
+ raise NameError(pysms.sms_errorString())
+
+ analysis_params = _pysms_analysis_params(sampling_rate)
+ if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
+ raise Exception("Error allocating memory for analysis_params")
+ analysis_params.iSizeSound = num_samples
+ analysis_params.nFrames = num_frames
+ sms_header = pysms.SMS_Header()
+ pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
+
+ sample_offset = 0
+ size_new_data = 0
+ current_frame = 0
+ analysis_frames = []
+ do_analysis = True
+
+ while do_analysis and (current_frame < num_frames):
+ sample_offset += size_new_data
+ size_new_data = analysis_params.sizeNextRead
+
+ frame_audio = audio[sample_offset:sample_offset + size_new_data]
+ frame_audio = np.array(frame_audio, dtype=np.float32)
+ if len(frame_audio) < size_new_data:
+ frame_audio = np.hstack((
+ frame_audio, np.zeros(size_new_data - len(frame_audio),
+ dtype=np.float32)
+ ))
+
+ analysis_data = pysms.SMS_Data()
+ pysms.sms_allocFrameH(sms_header, analysis_data)
+ status = pysms.sms_analyze(frame_audio, analysis_data,
+ analysis_params)
+
+ analysis_frames.append(analysis_data)
+ current_frame += 1
+
+ if status == -1:
+ do_analysis = False
+
+ synth_params = _pysms_synthesis_params(sampling_rate)
+ if det_synth_type == 'ifft':
+ synth_params.iDetSynthType = pysms.SMS_DET_IFFT
+ elif det_synth_type == 'sin':
+ synth_params.iDetSynthType = pysms.SMS_DET_SIN
+ else:
+ raise Exception("Invalid deterministic synthesis type")
+
+ pysms.sms_initSynth(sms_header, synth_params)
+
+ synth_frame = np.zeros(synth_params.sizeHop, dtype=np.float32)
+ synth_audio = np.array([], dtype=np.float32)
+
+ for i in range(len(analysis_frames)):
+ pysms.sms_synthesize(analysis_frames[i], synth_frame, synth_params)
+ synth_audio = np.hstack((synth_audio, synth_frame))
+
+ synth_audio = np.asarray(synth_audio * 32768, np.int16)
+
+ for frame in analysis_frames:
+ pysms.sms_freeFrame(frame)
+ pysms.sms_freeAnalysis(analysis_params)
+ pysms.sms_closeSF()
+ pysms.sms_freeSynth(synth_params)
+ pysms.sms_free()
+
+ return synth_audio
+
+
+def _residual_synthesis():
+ pysms.sms_init()
+ snd_header = pysms.SMS_SndHeader()
+
+ if(pysms.sms_openSF(audio_path, snd_header)):
+ raise NameError(pysms.sms_errorString())
+
+ analysis_params = _pysms_analysis_params(sampling_rate)
+ analysis_params.nStochasticCoeff = 128
+ analysis_params.iStochasticType = pysms.SMS_STOC_APPROX
+ if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
+ raise Exception("Error allocating memory for analysis_params")
+ analysis_params.iSizeSound = num_samples
+ analysis_params.nFrames = num_frames
+ sms_header = pysms.SMS_Header()
+ pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
+
+ sample_offset = 0
+ size_new_data = 0
+ current_frame = 0
+ analysis_frames = []
+ do_analysis = True
+
+ while do_analysis and (current_frame < num_frames):
+ sample_offset += size_new_data
+ size_new_data = analysis_params.sizeNextRead
+
+ frame_audio = audio[sample_offset:sample_offset + size_new_data]
+ frame_audio = np.array(frame_audio, dtype=np.float32)
+ if len(frame_audio) < size_new_data:
+ frame_audio = np.hstack((
+ frame_audio, np.zeros(size_new_data - len(frame_audio),
+ dtype=np.float32)
+ ))
+
+ analysis_data = pysms.SMS_Data()
+ pysms.sms_allocFrameH(sms_header, analysis_data)
+ status = pysms.sms_analyze(frame_audio, analysis_data,
+ analysis_params)
+
+ analysis_frames.append(analysis_data)
+ current_frame += 1
+
+ if status == -1:
+ do_analysis = False
+
+ sms_header.nFrames = len(analysis_frames)
+ synth_params = _pysms_synthesis_params(sampling_rate)
+ synth_params.iStochasticType = pysms.SMS_STOC_APPROX
+ synth_params.iSynthesisType = pysms.SMS_STYPE_STOC
+ pysms.sms_initSynth(sms_header, synth_params)
+
+ synth_frame = np.zeros(synth_params.sizeHop, dtype=np.float32)
+ synth_audio = np.array([], dtype=np.float32)
+
+ for i in range(len(analysis_frames)):
+ pysms.sms_synthesize(analysis_frames[i], synth_frame, synth_params)
+ synth_audio = np.hstack((synth_audio, synth_frame))
+
+ synth_audio = np.asarray(synth_audio * 32768, np.int16)
+
+ for frame in analysis_frames:
+ pysms.sms_freeFrame(frame)
+ pysms.sms_freeAnalysis(analysis_params)
+ pysms.sms_closeSF()
+ pysms.sms_freeSynth(synth_params)
+ pysms.sms_free()
+
+ return synth_audio
+
+
+if __name__ == '__main__':
+ size_next_read = _size_next_read()
+ partial_tracking = _partial_tracking()
+ harmonic_synthesis_ifft = _harmonic_synthesis('ifft')
+ harmonic_synthesis_sin = _harmonic_synthesis('sin')
+ residual_synthesis = _residual_synthesis()
+
+ test_data = {'size_next_read': size_next_read,
+ 'peak_detection': partial_tracking,
+ 'partial_tracking': partial_tracking}
+
+ test_data = json.dumps(test_data)
+ with open('libsms_test_data.json', 'w') as f:
+ f.write(test_data)
+
+ wav.write('libsms_harmonic_synthesis_ifft.wav', sampling_rate,
+ harmonic_synthesis_ifft)
+ wav.write('libsms_harmonic_synthesis_sin.wav', sampling_rate,
+ harmonic_synthesis_sin)
+ wav.write('libsms_residual_synthesis.wav', sampling_rate,
+ residual_synthesis)
diff --git a/tests/debug.py b/tests/debug.py
deleted file mode 100644
index 084df72..0000000
--- a/tests/debug.py
+++ /dev/null
@@ -1,29 +0,0 @@
-# Copyright (c) 2010 John Glover, National University of Ireland, Maynooth
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
-
-def print_peaks(frames):
- for n, f in enumerate(frames):
- for p in f:
- print str(n) + ":", p.frequency
-
-def print_partials(partials):
- for partial_num, partial in enumerate(partials):
- print partial_num,
- print "(" + str(partial.starting_frame) + " to",
- print str(partial.starting_frame + len(partial.peaks)) + "):",
- for peak_number, peak in enumerate(partial.peaks):
- print peak.frequency,
- print
diff --git a/tests/signals.py b/tests/signals.py
index 5b04c03..8083f94 100644
--- a/tests/signals.py
+++ b/tests/signals.py
@@ -1,19 +1,3 @@
-# Copyright (c) 2010 John Glover, National University of Ireland, Maynooth
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
-
import simpl
import numpy as np
diff --git a/tests/simpl.supp b/tests/simpl.supp
new file mode 100644
index 0000000..8f8239e
--- /dev/null
+++ b/tests/simpl.supp
@@ -0,0 +1,19 @@
+# Valgrind suppression file for Simpl
+
+# On Mac OS X 10.6 Snow Leopard, throwing std::exceptions gives a memory leak
+{
+ simpl.exceptions
+ Memcheck:Leak
+ fun:malloc
+ fun:__cxa_get_globals
+ fun:__cxa_allocate_exception
+ fun:_ZN5Simpl4Peak7is_freeESs
+ fun:_ZN5Simpl8TestPeak29test_is_free_invalid_argumentEv
+ fun:_ZN7CppUnit10TestCallerIN5Simpl8TestPeakEE7runTestEv
+ fun:_ZNK7CppUnit21TestCaseMethodFunctorclEv
+ fun:_ZN7CppUnit16DefaultProtector7protectERKNS_7FunctorERKNS_16ProtectorContextE
+ fun:_ZNK7CppUnit14ProtectorChain14ProtectFunctorclEv
+ fun:_ZN7CppUnit14ProtectorChain7protectERKNS_7FunctorERKNS_16ProtectorContextE
+ fun:_ZN7CppUnit10TestResult7protectERKNS_7FunctorEPNS_4TestERKSs
+ fun:_ZN7CppUnit8TestCase3runEPNS_10TestResultE
+}
diff --git a/tests/test_base.cpp b/tests/test_base.cpp
new file mode 100644
index 0000000..a37024f
--- /dev/null
+++ b/tests/test_base.cpp
@@ -0,0 +1,370 @@
+#include <iostream>
+#include <cppunit/ui/text/TextTestRunner.h>
+#include <cppunit/TestResult.h>
+#include <cppunit/TestResultCollector.h>
+#include <cppunit/extensions/HelperMacros.h>
+#include <cppunit/BriefTestProgressListener.h>
+#include <cppunit/extensions/TestFactoryRegistry.h>
+
+#include "../src/simpl/base.h"
+#include "../src/simpl/exceptions.h"
+
+namespace Simpl
+{
+
+// ---------------------------------------------------------------------------
+// TestPeak
+// ---------------------------------------------------------------------------
+class TestPeak : public CPPUNIT_NS::TestCase
+{
+ CPPUNIT_TEST_SUITE(TestPeak);
+ CPPUNIT_TEST(test_constructor);
+ CPPUNIT_TEST(test_is_start_of_partial);
+ CPPUNIT_TEST(test_is_free);
+ CPPUNIT_TEST(test_is_free_invalid_argument);
+ CPPUNIT_TEST_SUITE_END();
+
+protected:
+ static const double PRECISION = 0.001;
+ Peak* peak;
+
+ void test_constructor()
+ {
+ CPPUNIT_ASSERT_DOUBLES_EQUAL(peak->amplitude, 0.0, PRECISION);
+ CPPUNIT_ASSERT_DOUBLES_EQUAL(peak->frequency, 0.0, PRECISION);
+ CPPUNIT_ASSERT_DOUBLES_EQUAL(peak->phase, 0.0, PRECISION);
+ CPPUNIT_ASSERT(peak->next_peak == NULL);
+ CPPUNIT_ASSERT(peak->previous_peak == NULL);
+ CPPUNIT_ASSERT(peak->partial_id == 0);
+ CPPUNIT_ASSERT(peak->partial_position == 0);
+ CPPUNIT_ASSERT(peak->frame_number == 0);
+ }
+
+ void test_is_start_of_partial()
+ {
+ CPPUNIT_ASSERT(peak->is_start_of_partial());
+ Peak* tmp = new Peak();
+ peak->previous_peak = tmp;
+ CPPUNIT_ASSERT(!peak->is_start_of_partial());
+ peak->previous_peak = NULL;
+ delete tmp;
+ }
+
+ void test_is_free()
+ {
+ peak->amplitude = 0.0;
+ CPPUNIT_ASSERT(!peak->is_free());
+ peak->amplitude = 1.0;
+ CPPUNIT_ASSERT(peak->is_free());
+
+ Peak* tmp = new Peak();
+
+ peak->next_peak = tmp;
+ CPPUNIT_ASSERT(!peak->is_free());
+ CPPUNIT_ASSERT(!peak->is_free("forwards"));
+ CPPUNIT_ASSERT(peak->is_free("backwards"));
+ peak->next_peak = NULL;
+
+ peak->previous_peak = tmp;
+ CPPUNIT_ASSERT(peak->is_free());
+ CPPUNIT_ASSERT(peak->is_free("forwards"));
+ CPPUNIT_ASSERT(!peak->is_free("backwards"));
+ peak->previous_peak = NULL;
+
+ delete tmp;
+ }
+
+ void test_is_free_invalid_argument()
+ {
+ peak->amplitude = 1.0;
+ CPPUNIT_ASSERT_THROW(peak->is_free("random_text"), InvalidArgument);
+ peak->amplitude = 0.0;
+ }
+
+public:
+ void setUp()
+ {
+ peak = new Peak();
+ }
+
+ void tearDown()
+ {
+ delete peak;
+ }
+};
+
+// ---------------------------------------------------------------------------
+// TestFrame
+// ---------------------------------------------------------------------------
+class TestFrame : public CPPUNIT_NS::TestCase
+{
+ CPPUNIT_TEST_SUITE(TestFrame);
+ CPPUNIT_TEST(test_constructor);
+ CPPUNIT_TEST(test_size);
+ CPPUNIT_TEST(test_max_peaks);
+ CPPUNIT_TEST(test_max_partials);
+ CPPUNIT_TEST(test_add_peak);
+ CPPUNIT_TEST(test_add_peaks);
+ CPPUNIT_TEST(test_peak_clear);
+ CPPUNIT_TEST(test_peak_iteration);
+ CPPUNIT_TEST_SUITE_END();
+
+protected:
+ static const double PRECISION = 0.001;
+ Frame* frame;
+
+ void test_constructor()
+ {
+ CPPUNIT_ASSERT(frame->size() == 512);
+ CPPUNIT_ASSERT(frame->max_peaks() == 100);
+ CPPUNIT_ASSERT(frame->num_peaks() == 0);
+ CPPUNIT_ASSERT(frame->max_partials() == 100);
+ CPPUNIT_ASSERT(frame->num_partials() == 0);
+ }
+
+ void test_size()
+ {
+ frame->size(1024);
+ CPPUNIT_ASSERT(frame->size() == 1024);
+ frame->size(512);
+ }
+
+ void test_max_peaks()
+ {
+ frame->max_peaks(200);
+ CPPUNIT_ASSERT(frame->max_peaks() == 200);
+ CPPUNIT_ASSERT(frame->num_peaks() == 0);
+ frame->max_peaks(100);
+ }
+
+ void test_max_partials()
+ {
+ frame->max_partials(200);
+ CPPUNIT_ASSERT(frame->max_partials() == 200);
+ CPPUNIT_ASSERT(frame->num_partials() == 0);
+ frame->max_partials(100);
+ }
+
+ void test_add_peak()
+ {
+ Peak p = Peak();
+ p.amplitude = 1.5;
+ frame->add_peak(p);
+ CPPUNIT_ASSERT(frame->max_peaks() == 100);
+ CPPUNIT_ASSERT(frame->num_peaks() == 1);
+ CPPUNIT_ASSERT_DOUBLES_EQUAL(1.5, frame->peak(0).amplitude, PRECISION);
+ frame->clear_peaks();
+ }
+
+ void test_add_peaks()
+ {
+ Peaks* peaks = new Peaks();
+
+ Peak p1 = Peak();
+ p1.amplitude = 1.0;
+ peaks->push_back(p1);
+
+ Peak p2 = Peak();
+ p2.amplitude = 2.0;
+ peaks->push_back(p2);
+
+ frame->add_peaks(peaks);
+ CPPUNIT_ASSERT(frame->num_peaks() == 2);
+
+ frame->clear_peaks();
+ delete peaks;
+ }
+
+ void test_peak_clear()
+ {
+ Peak p = Peak();
+ p.amplitude = 1.5;
+ frame->add_peak(p);
+ CPPUNIT_ASSERT(frame->num_peaks() == 1);
+ frame->clear_peaks();
+ CPPUNIT_ASSERT(frame->num_peaks() == 0);
+ }
+
+ void test_peak_iteration()
+ {
+ Peak p1 = Peak();
+ p1.amplitude = 1.0;
+ frame->add_peak(p1);
+
+ Peak p2 = Peak();
+ p2.amplitude = 2.0;
+ frame->add_peak(p2);
+
+ CPPUNIT_ASSERT(frame->num_peaks() == 2);
+
+ int peak_num = 0;
+ for(Peaks::iterator i = frame->peaks_begin(); i != frame->peaks_end(); i++)
+ {
+ if(peak_num == 0)
+ {
+ CPPUNIT_ASSERT_DOUBLES_EQUAL(1.0, i->amplitude, PRECISION);
+ }
+ else if(peak_num == 1)
+ {
+ CPPUNIT_ASSERT_DOUBLES_EQUAL(2.0, i->amplitude, PRECISION);
+ }
+ peak_num += 1;
+ }
+ frame->clear_peaks();
+ }
+
+public:
+ void setUp()
+ {
+ frame = new Frame();
+ }
+
+ void tearDown()
+ {
+ delete frame;
+ }
+};
+
+// ---------------------------------------------------------------------------
+// TestPeakDetection
+// ---------------------------------------------------------------------------
+class TestPeakDetection : public CPPUNIT_NS::TestCase
+{
+ CPPUNIT_TEST_SUITE(TestPeakDetection);
+ CPPUNIT_TEST(test_constructor);
+ CPPUNIT_TEST(test_frame_size);
+ CPPUNIT_TEST(test_static_frame_size);
+ CPPUNIT_TEST(test_next_frame_size);
+ CPPUNIT_TEST(test_hop_size);
+ CPPUNIT_TEST(test_max_peaks);
+ CPPUNIT_TEST(test_window_type);
+ CPPUNIT_TEST(test_window_size);
+ CPPUNIT_TEST(test_min_peak_separation);
+ CPPUNIT_TEST(test_find_peaks_in_frame);
+ CPPUNIT_TEST(test_find_peaks);
+ CPPUNIT_TEST_SUITE_END();
+
+protected:
+ static const double PRECISION = 0.001;
+ PeakDetection* pd;
+
+ void test_constructor()
+ {
+ CPPUNIT_ASSERT(pd->sampling_rate() == 44100);
+ CPPUNIT_ASSERT(pd->frame_size() == 2048);
+ CPPUNIT_ASSERT(pd->static_frame_size());
+ CPPUNIT_ASSERT(pd->hop_size() == 512);
+ CPPUNIT_ASSERT(pd->max_peaks() == 100);
+ CPPUNIT_ASSERT(pd->window_type() == "hamming");
+ CPPUNIT_ASSERT(pd->window_size() == 2048);
+ CPPUNIT_ASSERT_DOUBLES_EQUAL(1.0, pd->min_peak_separation(), 0.00001);
+ CPPUNIT_ASSERT(pd->frames()->size() == 0);
+ }
+
+ void test_sampling_rate()
+ {
+ pd->sampling_rate(96000);
+ CPPUNIT_ASSERT(pd->sampling_rate() == 96000);
+ pd->sampling_rate(44100);
+ }
+
+ void test_frame_size()
+ {
+ pd->frame_size(1024);
+ CPPUNIT_ASSERT(pd->frame_size() == 1024);
+ pd->frame_size(2048);
+ }
+
+ void test_static_frame_size()
+ {
+ pd->static_frame_size(false);
+ CPPUNIT_ASSERT(!pd->static_frame_size());
+ pd->static_frame_size(true);
+ }
+
+ void test_next_frame_size()
+ {
+ CPPUNIT_ASSERT(pd->next_frame_size() == pd->frame_size());
+ }
+
+ void test_hop_size()
+ {
+ pd->hop_size(128);
+ CPPUNIT_ASSERT(pd->hop_size() == 128);
+ pd->hop_size(512);
+ }
+
+ void test_max_peaks()
+ {
+ pd->max_peaks(20);
+ CPPUNIT_ASSERT(pd->max_peaks() == 20);
+ pd->max_peaks(100);
+ }
+
+ void test_window_type()
+ {
+ pd->window_type("hanning");
+ CPPUNIT_ASSERT(pd->window_type() == "hanning");
+ pd->window_type("hamming");
+ }
+
+ void test_window_size()
+ {
+ pd->window_size(2048);
+ CPPUNIT_ASSERT(pd->window_size() == 2048);
+ pd->window_size(2048);
+ }
+
+ void test_min_peak_separation()
+ {
+ pd->min_peak_separation(0.5);
+ CPPUNIT_ASSERT_DOUBLES_EQUAL(0.5, pd->min_peak_separation(), 0.00001);
+ pd->min_peak_separation(1.0);
+ }
+
+ void test_find_peaks_in_frame()
+ {
+ Frame* f = new Frame();
+ Peaks* p = pd->find_peaks_in_frame(*f);
+ CPPUNIT_ASSERT(p->size() == 0);
+ delete p;
+ delete f;
+ }
+
+ void test_find_peaks()
+ {
+ const samples audio = samples(1024);
+ pd->frame_size(256);
+ pd->hop_size(256);
+ Frames* frames = pd->find_peaks(audio);
+ CPPUNIT_ASSERT(frames->size() == 4);
+ for(Frames::iterator i = frames->begin(); i != frames->end(); i++)
+ {
+ CPPUNIT_ASSERT(i->num_peaks() == 0);
+ }
+ }
+
+public:
+ void setUp()
+ {
+ pd = new PeakDetection();
+ }
+
+ void tearDown()
+ {
+ delete pd;
+ }
+};
+
+} // end of namespace Simpl
+
+CPPUNIT_TEST_SUITE_REGISTRATION(Simpl::TestPeak);
+CPPUNIT_TEST_SUITE_REGISTRATION(Simpl::TestFrame);
+CPPUNIT_TEST_SUITE_REGISTRATION(Simpl::TestPeakDetection);
+
+int main(int arg, char **argv)
+{
+ CppUnit::TextTestRunner runner;
+ runner.addTest(CppUnit::TestFactoryRegistry::getRegistry().makeTest());
+ return runner.run("", false);
+}
diff --git a/tests/test_base.py b/tests/test_base.py
new file mode 100644
index 0000000..9d3173a
--- /dev/null
+++ b/tests/test_base.py
@@ -0,0 +1,70 @@
+import os
+import numpy as np
+from nose.tools import assert_almost_equals
+import simpl.base as base
+
+float_precision = 5
+frame_size = 512
+hop_size = 512
+audio_path = os.path.join(
+ os.path.dirname(__file__), 'audio/flute.wav'
+)
+
+
+class TestFrame(object):
+ def test_buffers(self):
+ N = 256
+ f = base.Frame(N)
+ assert f.size == N
+
+ a = np.random.rand(N)
+ f.audio = a
+ assert np.all(f.audio == a)
+
+ a = np.random.rand(N)
+ f.synth = a
+ assert np.all(f.synth == a)
+
+ a = np.random.rand(N)
+ f.residual = a
+ assert np.all(f.residual == a)
+
+ a = np.random.rand(N)
+ f.synth_residual = a
+ assert np.all(f.synth_residual == a)
+
+ def test_peaks(self):
+ p = base.Peak()
+ p.amplitude = 0.5
+ p.frequency = 220.0
+ p.phase = 0.0
+
+ f = base.Frame()
+ assert f.num_peaks == 0
+ assert f.max_peaks > 0
+ f.add_peak(p)
+
+ assert f.num_peaks == 1
+ assert_almost_equals(f.peak(0).amplitude, p.amplitude,
+ float_precision)
+ assert_almost_equals(f.peaks[0].amplitude, p.amplitude,
+ float_precision)
+
+ f.clear()
+ assert f.num_peaks == 0
+
+ def test_partials(self):
+ N = 256
+ f = base.Frame(N)
+ f.max_partials = 10
+
+ p = base.Peak()
+ p.amplitude = 0.5
+ p.frequency = 220.0
+ p.phase = 0.0
+
+ f.partial(0, p)
+ assert_almost_equals(f.partial(0).amplitude, p.amplitude,
+ float_precision)
+ assert_almost_equals(f.partial(0).frequency, p.frequency,
+ float_precision)
diff --git a/tests/test_lp.py b/tests/test_lp.py
index 8d80ba2..4537f46 100644
--- a/tests/test_lp.py
+++ b/tests/test_lp.py
@@ -1,28 +1,12 @@
-# Copyright (c) 2010 John Glover, National University of Ireland, Maynooth
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
-
from simpl import lp
import numpy as np
-class TestLP(object):
+class TestLP(object):
def test_predict(self):
"""test_predict"""
- coefs = np.array([1,2,3,4,5])
+ coefs = np.array([1, 2, 3, 4, 5])
test_signal = np.ones(5)
predictions = lp.predict(test_signal, coefs, 2)
assert predictions[0] == -sum(coefs)
- assert predictions[1] == -sum(coefs[1:])-predictions[0]
+ assert predictions[1] == -sum(coefs[1:]) - predictions[0]
diff --git a/tests/test_partial_tracking.py b/tests/test_partial_tracking.py
new file mode 100644
index 0000000..32f2653
--- /dev/null
+++ b/tests/test_partial_tracking.py
@@ -0,0 +1,108 @@
+import os
+import json
+from nose.tools import assert_almost_equals
+import simpl
+import simpl.peak_detection as peak_detection
+import simpl.partial_tracking as partial_tracking
+
+PeakDetection = peak_detection.PeakDetection
+SMSPeakDetection = peak_detection.SMSPeakDetection
+PartialTracking = partial_tracking.PartialTracking
+SMSPartialTracking = partial_tracking.SMSPartialTracking
+
+float_precision = 2
+frame_size = 512
+hop_size = 512
+max_peaks = 10
+max_partials = 10
+num_frames = 30
+num_samples = num_frames * hop_size
+audio_path = os.path.join(
+ os.path.dirname(__file__), 'audio/flute.wav'
+)
+libsms_test_data_path = os.path.join(
+ os.path.dirname(__file__), 'libsms_test_data.json'
+)
+
+
+def _load_libsms_test_data():
+ test_data = None
+ with open(libsms_test_data_path, 'r') as f:
+ test_data = json.loads(f.read())
+ return test_data
+
+
+class TestPartialTracking(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = simpl.read_wav(audio_path)[0]
+ cls.audio = cls.audio[0:num_samples]
+
+ def test_basic(self):
+ pd = PeakDetection()
+ pd.hop_size = hop_size
+ frames = pd.find_peaks(self.audio)
+
+ pt = PartialTracking()
+ frames = pt.find_partials(frames)
+
+ print 'frames: %d (expected: %d)' %\
+ (len(frames), len(self.audio) / hop_size)
+ assert len(frames) == len(self.audio) / hop_size
+
+ assert len(frames[0].partials) == 0
+ assert frames[0].max_partials == 100
+
+
+class TestSMSPartialTracking(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = simpl.read_wav(audio_path)[0]
+ cls.audio = cls.audio[0:num_samples]
+ cls.test_data = _load_libsms_test_data()
+
+ def test_basic(self):
+ pd = SMSPeakDetection()
+ pd.hop_size = hop_size
+ pd.max_peaks = max_peaks
+ pd.static_frame_size = True
+ frames = pd.find_peaks(self.audio)
+
+ pt = SMSPartialTracking()
+ pt.max_partials = max_partials
+ frames = pt.find_partials(frames)
+
+ print 'frames: %d (expected: %d)' %\
+ (len(frames), len(self.audio) / hop_size)
+ assert len(frames) == len(self.audio) / hop_size
+
+ assert frames[0].num_partials == max_partials
+ assert frames[0].max_partials == max_partials
+
+ def test_partial_tracking(self):
+ pd = SMSPeakDetection()
+ pd.max_peaks = max_peaks
+ pd.hop_size = hop_size
+ peaks = pd.find_peaks(self.audio)
+ pt = SMSPartialTracking()
+ pt.max_partials = max_partials
+ frames = pt.find_partials(peaks)
+
+ sms_frames = self.test_data['partial_tracking']
+ sms_frames = sms_frames[0:len(sms_frames) - 3]
+
+ assert len(sms_frames) == len(frames)
+
+ for i in range(len(frames)):
+ assert len(frames[i].partials) == len(sms_frames[i]['partials'])
+
+ for p in range(len(frames[i].partials)):
+ assert_almost_equals(frames[i].partials[p].amplitude,
+ sms_frames[i]['partials'][p]['amplitude'],
+ float_precision)
+ assert_almost_equals(frames[i].partials[p].frequency,
+ sms_frames[i]['partials'][p]['frequency'],
+ float_precision)
+ assert_almost_equals(frames[i].partials[p].phase,
+ sms_frames[i]['partials'][p]['phase'],
+ float_precision)
diff --git a/tests/test_peak_detection.py b/tests/test_peak_detection.py
new file mode 100644
index 0000000..f339818
--- /dev/null
+++ b/tests/test_peak_detection.py
@@ -0,0 +1,104 @@
+import os
+import json
+import simpl
+import simpl.peak_detection as peak_detection
+
+PeakDetection = peak_detection.PeakDetection
+SMSPeakDetection = peak_detection.SMSPeakDetection
+
+float_precision = 5
+frame_size = 512
+hop_size = 512
+max_peaks = 10
+max_partials = 10
+num_frames = 30
+num_samples = num_frames * hop_size
+audio_path = os.path.join(
+ os.path.dirname(__file__), 'audio/flute.wav'
+)
+test_data_path = os.path.join(
+ os.path.dirname(__file__), 'libsms_test_data.json'
+)
+
+
+def _load_libsms_test_data():
+ test_data = None
+ with open(test_data_path, 'r') as f:
+ test_data = json.loads(f.read())
+ return test_data
+
+
+class TestPeakDetection(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = simpl.read_wav(audio_path)[0]
+
+ def test_basic(self):
+ pd = PeakDetection()
+ pd.max_peaks = max_peaks
+ pd.find_peaks(self.audio)
+
+ assert len(pd.frames) == len(self.audio) / hop_size
+ assert len(pd.frames[0].peaks) == 0
+ assert pd.frames[0].max_peaks == max_peaks
+
+
+class TestSMSPeakDetection(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = simpl.read_wav(audio_path)[0]
+ cls.test_data = _load_libsms_test_data()
+
+ def test_basic(self):
+ pd = SMSPeakDetection()
+ pd.hop_size = hop_size
+ pd.static_frame_size = True
+ pd.find_peaks(self.audio)
+
+ assert len(pd.frames) == len(self.audio) / hop_size
+ assert len(pd.frames[0].peaks)
+
+ def test_size_next_read(self):
+ """
+ Make sure SMSPeakDetection is calculating the correct value for the
+ size of the next frame.
+ """
+ audio, sampling_rate = simpl.read_wav(audio_path)
+
+ pd = SMSPeakDetection()
+ pd.hop_size = hop_size
+ pd.max_peaks = max_peaks
+ current_frame = 0
+ sample_offset = 0
+
+ next_read_sizes = self.test_data['size_next_read']
+
+ while current_frame < num_frames:
+ pd.frame_size = pd.next_frame_size()
+ assert next_read_sizes[current_frame] == pd.frame_size,\
+ (next_read_sizes[current_frame], pd.frame_size)
+ frame = simpl.Frame()
+ frame.size = pd.frame_size
+ frame.audio = audio[sample_offset:sample_offset + pd.frame_size]
+ pd.find_peaks_in_frame(frame)
+ sample_offset += pd.frame_size
+ current_frame += 1
+
+ def test_peak_detection(self):
+ audio, sampling_rate = simpl.read_wav(audio_path)
+
+ pd = SMSPeakDetection()
+ pd.max_peaks = max_peaks
+ pd.hop_size = hop_size
+ frames = pd.find_peaks(audio[0:num_samples])
+
+ sms_frames = self.test_data['peak_detection']
+ sms_frames = [f for f in sms_frames if f['status'] != 0]
+
+ print 'frames: %d (expected: %d)' % (len(frames), len(sms_frames))
+ assert len(sms_frames) == len(frames)
+
+ for frame in frames:
+ assert frame.num_peaks <= max_peaks, frame.num_peaks
+ max_amp = max([p.amplitude for p in frame.peaks])
+ assert max_amp
diff --git a/tests/test_peakdetection.py b/tests/test_peakdetection.py
deleted file mode 100644
index 1257f02..0000000
--- a/tests/test_peakdetection.py
+++ /dev/null
@@ -1,24 +0,0 @@
-# Copyright (c) 2009 John Glover, National University of Ireland, Maynooth
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
-
-import simpl
-import numpy as np
-from scipy.io.wavfile import read
-
-class TestPeakDetection(object):
- frame_size = 2048
- hop_size = 512
- max_peaks = 10
diff --git a/tests/test_residual.py b/tests/test_residual.py
new file mode 100644
index 0000000..006c77a
--- /dev/null
+++ b/tests/test_residual.py
@@ -0,0 +1,95 @@
+import os
+import numpy as np
+from nose.tools import assert_almost_equals
+import simpl
+import simpl.peak_detection as peak_detection
+import simpl.partial_tracking as partial_tracking
+import simpl.synthesis as synthesis
+import simpl.residual as residual
+
+float_precision = 2
+frame_size = 512
+hop_size = 512
+max_peaks = 10
+max_partials = 10
+num_frames = 30
+num_samples = num_frames * hop_size
+audio_path = os.path.join(
+ os.path.dirname(__file__), 'audio/flute.wav'
+)
+libsms_residual_synthesis_path = os.path.join(
+ os.path.dirname(__file__), 'libsms_residual_synthesis.wav'
+)
+
+PeakDetection = peak_detection.PeakDetection
+SMSPeakDetection = peak_detection.SMSPeakDetection
+PartialTracking = partial_tracking.PartialTracking
+SMSPartialTracking = partial_tracking.SMSPartialTracking
+Synthesis = synthesis.Synthesis
+SMSSynthesis = synthesis.SMSSynthesis
+Residual = residual.Residual
+SMSResidual = residual.SMSResidual
+
+
+class TestResidual(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = simpl.read_wav(audio_path)[0]
+
+ def test_basic(self):
+ pd = PeakDetection()
+ frames = pd.find_peaks(self.audio)
+
+ pt = PartialTracking()
+ frames = pt.find_partials(frames)
+
+ synth = Synthesis()
+ synth_audio = synth.synth(frames)
+
+ res = Residual()
+ residual_audio = res.find_residual(synth_audio, self.audio)
+ assert len(residual_audio)
+
+
+class TestSMSResidual(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = simpl.read_wav(audio_path)[0]
+ cls.audio = cls.audio[0:num_samples]
+
+ def test_basic(self):
+ pd = SMSPeakDetection()
+ pd.hop_size = hop_size
+ frames = pd.find_peaks(self.audio)
+
+ pt = SMSPartialTracking()
+ pt.max_partials = max_partials
+ frames = pt.find_partials(frames)
+
+ synth = SMSSynthesis()
+ synth.hop_size = hop_size
+ synth_audio = synth.synth(frames)
+
+ res = SMSResidual()
+ residual_audio = res.find_residual(synth_audio, self.audio)
+ assert len(residual_audio)
+
+ def test_residual_synthesis(self):
+ res = SMSResidual()
+ res.hop_size = hop_size
+ simpl_residual = res.synth(self.audio)
+
+ sms_residual, sampling_rate = simpl.read_wav(
+ libsms_residual_synthesis_path
+ )
+
+ assert len(simpl_residual) == len(sms_residual)
+
+ import matplotlib.pyplot as plt
+ plt.plot(simpl_residual)
+ plt.plot(sms_residual)
+ plt.show()
+
+ for i in range(len(simpl_residual)):
+ assert_almost_equals(simpl_residual[i], sms_residual[i],
+ float_precision)
diff --git a/tests/test_sms.py b/tests/test_sms.py
deleted file mode 100644
index ca51f3f..0000000
--- a/tests/test_sms.py
+++ /dev/null
@@ -1,1266 +0,0 @@
-# Copyright (c) 2009 John Glover, National University of Ireland, Maynooth
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
-
-import simpl
-from simpl import simplsms
-import pysms
-import numpy as np
-from scipy.io.wavfile import read
-from nose.tools import assert_almost_equals
-
-class TestSimplSMS(object):
- FLOAT_PRECISION = 2 # number of decimal places to check for accuracy
- input_file = 'audio/flute.wav'
- hop_size = 512
- num_frames = 50
- num_samples = num_frames * hop_size
- max_peaks = 10
- max_partials = 10
-
- def get_audio(self):
- audio_data = read(self.input_file)
- audio = simpl.asarray(audio_data[1]) / 32768.0
- sampling_rate = audio_data[0]
- return audio[0:self.num_samples], sampling_rate
-
- def pysms_analysis_params(self, sampling_rate):
- analysis_params = pysms.SMS_AnalParams()
- pysms.sms_initAnalParams(analysis_params)
- analysis_params.iSamplingRate = sampling_rate
- analysis_params.iFrameRate = sampling_rate / self.hop_size
- analysis_params.iWindowType = pysms.SMS_WIN_HAMMING
- analysis_params.fDefaultFundamental = 100
- analysis_params.fHighestFreq = 20000
- analysis_params.iFormat = pysms.SMS_FORMAT_HP
- analysis_params.nTracks = self.max_peaks
- analysis_params.peakParams.iMaxPeaks = self.max_peaks
- analysis_params.nGuides = self.max_peaks
- analysis_params.iMaxDelayFrames = 4
- analysis_params.analDelay = 0
- analysis_params.minGoodFrames = 1
- analysis_params.iCleanTracks = 0
- analysis_params.iStochasticType = pysms.SMS_STOC_NONE
- analysis_params.preEmphasis = 0
- return analysis_params
-
- def simplsms_analysis_params(self, sampling_rate):
- analysis_params = simplsms.SMS_AnalParams()
- simplsms.sms_initAnalParams(analysis_params)
- analysis_params.iSamplingRate = sampling_rate
- analysis_params.iFrameRate = sampling_rate / self.hop_size
- analysis_params.iWindowType = simplsms.SMS_WIN_HAMMING
- analysis_params.fDefaultFundamental = 100
- analysis_params.fHighestFreq = 20000
- analysis_params.iFormat = simplsms.SMS_FORMAT_HP
- analysis_params.nTracks = self.max_peaks
- analysis_params.maxPeaks = self.max_peaks
- analysis_params.nGuides = self.max_peaks
- analysis_params.iMaxDelayFrames = 4
- analysis_params.analDelay = 0
- analysis_params.minGoodFrames = 1
- analysis_params.iCleanTracks = 0
- analysis_params.iStochasticType = simplsms.SMS_STOC_NONE
- analysis_params.preEmphasis = 0
- return analysis_params
-
- def pysms_synthesis_params(self, sampling_rate):
- synth_params = pysms.SMS_SynthParams()
- pysms.sms_initSynthParams(synth_params)
- synth_params.iSamplingRate = sampling_rate
- synth_params.iSynthesisType = pysms.SMS_STYPE_DET
- synth_params.iStochasticType = pysms.SMS_STOC_NONE
- synth_params.sizeHop = self.hop_size
- synth_params.nTracks = self.max_peaks
- synth_params.deEmphasis = 0
- return synth_params
-
- def test_size_next_read(self):
- """test_size_next_read
- Make sure pysms PeakDetection is calculating
- the correct value for the size of the next frame."""
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- analysis_params.iMaxDelayFrames = self.num_frames + 1
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.nFrames = self.num_frames
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- sample_offset = 0
- pysms_size_new_data = 0
- current_frame = 0
- sms_next_read_sizes = []
-
- while current_frame < self.num_frames:
- sms_next_read_sizes.append(analysis_params.sizeNextRead)
- sample_offset += pysms_size_new_data
- pysms_size_new_data = analysis_params.sizeNextRead
- # convert frame to floats for libsms
- frame = audio[sample_offset:sample_offset + pysms_size_new_data]
- frame = np.array(frame, dtype=np.float32)
- if len(frame) < pysms_size_new_data:
- frame = np.hstack((frame, np.zeros(pysms_size_new_data - len(frame),
- dtype=np.float32)))
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- status = pysms.sms_analyze(frame, analysis_data, analysis_params)
- # as the no. of frames of delay is > num_frames, sms_analyze should
- # never get around to performing partial tracking, and so the return
- # value should be 0
- assert status == 0
- pysms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_free()
-
- pd = simpl.SMSPeakDetection()
- pd.hop_size = self.hop_size
- pd.max_peaks = self.max_peaks
- current_frame = 0
- sample_offset = 0
-
- while current_frame < self.num_frames:
- pd.frame_size = pd.get_next_frame_size()
- #print current_frame, sms_next_read_sizes[current_frame], pd.frame_size
- assert sms_next_read_sizes[current_frame] == pd.frame_size
- frame = simpl.Frame()
- frame.size = pd.frame_size
- frame.audio = audio[sample_offset:sample_offset + pd.frame_size]
- pd.find_peaks_in_frame(frame)
- sample_offset += pd.frame_size
- current_frame += 1
-
- def test_sms_analyze(self):
- """test_sms_analyze
- Make sure that the simplsms.sms_analyze function does the same thing
- as the sms_analyze function from libsms."""
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.nFrames = self.num_frames
- analysis_params.iSizeSound = self.num_samples
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- sms_frames = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- # convert frame to floats for libsms
- frame = simpl.Frame()
- frame.size = size_new_data
- frame.audio = np.array(audio[sample_offset:sample_offset + size_new_data],
- dtype=np.float32)
- if len(frame.audio) < size_new_data:
- frame.audio = np.hstack((frame.audio, np.zeros(size_new_data - len(frame.audio),
- dtype=np.float32)))
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- status = pysms.sms_analyze(frame.audio, analysis_data, analysis_params)
- num_partials = analysis_data.nTracks
- peaks = []
-
- if status == 1:
- sms_amps = np.zeros(num_partials, dtype=np.float32)
- sms_freqs = np.zeros(num_partials, dtype=np.float32)
- sms_phases = np.zeros(num_partials, dtype=np.float32)
- analysis_data.getSinFreq(sms_freqs)
- analysis_data.getSinAmp(sms_amps)
- analysis_data.getSinPhase(sms_phases)
- for i in range(num_partials):
- p = simpl.Peak()
- p.amplitude = sms_amps[i]
- p.frequency = sms_freqs[i]
- p.phase = sms_phases[i]
- peaks.append(p)
- else:
- for i in range(num_partials):
- p = simpl.Peak()
- p.amplitude = 0.0
- p.frequency = 0.0
- p.phase = 0.0
- peaks.append(p)
-
- if status == -1:
- do_analysis = False
-
- frame.partials = peaks
- sms_frames.append(frame)
- pysms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_free()
-
- audio, sampling_rate = self.get_audio()
- simplsms.sms_init()
- simpl_analysis_params = self.simplsms_analysis_params(sampling_rate)
- if simplsms.sms_initAnalysis(simpl_analysis_params) != 0:
- raise Exception("Error allocating memory for analysis_params")
- simpl_analysis_params.nFrames = self.num_frames
- simpl_analysis_params.iSizeSound = self.num_samples
- simpl_sms_header = simplsms.SMS_Header()
- simplsms.sms_fillHeader(simpl_sms_header, simpl_analysis_params, "simplsms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- simplsms_frames = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = simpl_analysis_params.sizeNextRead
- frame = simpl.Frame()
- frame.size = size_new_data
- frame.audio = audio[sample_offset:sample_offset + size_new_data]
- if len(frame.audio) < size_new_data:
- frame.audio = np.hstack((frame.audio, simpl.zeros(size_new_data - len(frame.audio))))
- analysis_data = simplsms.SMS_Data()
- simplsms.sms_allocFrameH(simpl_sms_header, analysis_data)
- status = simplsms.sms_analyze(frame.audio, analysis_data, simpl_analysis_params)
- num_partials = analysis_data.nTracks
- peaks = []
-
- if status == 1:
- freqs = simpl.zeros(num_partials)
- amps = simpl.zeros(num_partials)
- phases = simpl.zeros(num_partials)
- analysis_data.getSinAmp(amps)
- analysis_data.getSinFreq(freqs)
- analysis_data.getSinPhase(phases)
- for i in range(num_partials):
- p = simpl.Peak()
- p.amplitude = amps[i]
- p.frequency = freqs[i]
- p.phase = phases[i]
- peaks.append(p)
- else:
- for i in range(num_partials):
- p = simpl.Peak()
- p.amplitude = 0.0
- p.frequency = 0.0
- p.phase = 0.0
- peaks.append(p)
-
- if status == -1:
- do_analysis = False
-
- frame.partials = peaks
- simplsms_frames.append(frame)
- simplsms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- simplsms.sms_freeAnalysis(simpl_analysis_params)
- simplsms.sms_free()
-
- # make sure both have the same number of partials
- assert len(sms_frames) == len(simplsms_frames)
-
- # make sure each partial is the same
- for i in range(len(sms_frames)):
- assert len(sms_frames[i].partials) == len(simplsms_frames[i].partials)
- for p in range(len(sms_frames[i].partials)):
- assert_almost_equals(sms_frames[i].partials[p].amplitude,
- simplsms_frames[i].partials[p].amplitude,
- self.FLOAT_PRECISION)
- assert_almost_equals(sms_frames[i].partials[p].frequency,
- simplsms_frames[i].partials[p].frequency,
- self.FLOAT_PRECISION)
- assert_almost_equals(sms_frames[i].partials[p].phase,
- simplsms_frames[i].partials[p].phase,
- self.FLOAT_PRECISION)
-
- def test_multi_sms_peak_detection(self):
- """test_multi_sms_peak_detection
- Test that running the same peak detection process twice in a row
- produces the same results each time. This makes sure that results
- are independent, and also helps to highlight any memory errors."""
- audio, sampling_rate = self.get_audio()
- simplsms.sms_init()
- analysis_params = self.simplsms_analysis_params(sampling_rate)
- analysis_params.iMaxDelayFrames = self.num_frames + 1
- if simplsms.sms_initAnalysis(analysis_params) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.nFrames = self.num_frames
- sms_header = simplsms.SMS_Header()
- simplsms.sms_fillHeader(sms_header, analysis_params, "simplsms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- peaks1 = []
-
- while current_frame < self.num_frames:
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- frame = audio[sample_offset:sample_offset + size_new_data]
- analysis_data = simplsms.SMS_Data()
- simplsms.sms_allocFrameH(sms_header, analysis_data)
- status = simplsms.sms_analyze(frame, analysis_data, analysis_params)
- # as the no. of frames of delay is > num_frames, sms_analyze should
- # never get around to performing partial tracking, and so the return
- # value should be 0
- assert status == 0
- num_peaks = analysis_data.nTracks
- frame_peaks = []
- simplsms_freqs = simpl.zeros(num_peaks)
- simplsms_amps = simpl.zeros(num_peaks)
- simplsms_phases = simpl.zeros(num_peaks)
- analysis_data.getSinFreq(simplsms_freqs)
- analysis_data.getSinAmp(simplsms_amps)
- analysis_data.getSinPhase(simplsms_phases)
- for i in range(num_peaks):
- if simplsms_amps[i]:
- p = simpl.Peak()
- # convert amplitude back to linear
- p.amplitude = 10**(simplsms_amps[i]/20.0)
- p.frequency = simplsms_freqs[i]
- p.phase = simplsms_phases[i]
- frame_peaks.append(p)
- peaks1.append(frame_peaks)
- pysms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- simplsms.sms_freeAnalysis(analysis_params)
- simplsms.sms_free()
-
- # Second run
- audio, sampling_rate = self.get_audio()
- simplsms.sms_init()
- analysis_params = self.simplsms_analysis_params(sampling_rate)
- analysis_params.iMaxDelayFrames = self.num_frames + 1
- if simplsms.sms_initAnalysis(analysis_params) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.nFrames = self.num_frames
- sms_header = simplsms.SMS_Header()
- simplsms.sms_fillHeader(sms_header, analysis_params, "simplsms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- peaks2 = []
-
- while current_frame < self.num_frames:
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- frame = audio[sample_offset:sample_offset + size_new_data]
- analysis_data = simplsms.SMS_Data()
- simplsms.sms_allocFrameH(sms_header, analysis_data)
- status = simplsms.sms_analyze(frame, analysis_data, analysis_params)
- # as the no. of frames of delay is > num_frames, sms_analyze should
- # never get around to performing partial tracking, and so the return
- # value should be 0
- assert status == 0
- num_peaks = analysis_data.nTracks
- frame_peaks = []
- simplsms_freqs = simpl.zeros(num_peaks)
- simplsms_amps = simpl.zeros(num_peaks)
- simplsms_phases = simpl.zeros(num_peaks)
- analysis_data.getSinFreq(simplsms_freqs)
- analysis_data.getSinAmp(simplsms_amps)
- analysis_data.getSinPhase(simplsms_phases)
- for i in range(num_peaks):
- if simplsms_amps[i]:
- p = simpl.Peak()
- # convert amplitude back to linear
- p.amplitude = 10**(simplsms_amps[i]/20.0)
- p.frequency = simplsms_freqs[i]
- p.phase = simplsms_phases[i]
- frame_peaks.append(p)
- peaks2.append(frame_peaks)
- pysms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- simplsms.sms_freeAnalysis(analysis_params)
- simplsms.sms_free()
-
- # make sure we have the same number of frames in each run
- assert len(peaks1) == len(peaks2)
- for f in range(len(peaks1)):
- # in each frame, make sure that we have the same number of peaks
- assert len(peaks1[f]) == len(peaks2[f])
- # make sure that each peak has the same value
- for p in range(len(peaks1[f])):
- assert_almost_equals(peaks1[f][p].frequency,
- peaks2[f][p].frequency,
- self.FLOAT_PRECISION)
- assert_almost_equals(peaks1[f][p].amplitude,
- peaks2[f][p].amplitude,
- self.FLOAT_PRECISION)
- assert_almost_equals(peaks1[f][p].phase,
- peaks2[f][p].phase,
- self.FLOAT_PRECISION)
-
- def test_multi_simpl_peak_detection(self):
- """test_multi_simpl_peak_detection
- Test that running the simpl peak detection process twice in a row
- produces the same results each time. This makes sure that results
- are independent, and also helps to highlight any memory errors."""
- audio, sampling_rate = self.get_audio()
- pd = simpl.SMSPeakDetection()
- pd.max_peaks = self.max_peaks
- pd.hop_size = self.hop_size
- frames1 = pd.find_peaks(audio)[0:self.num_frames]
- del pd
- # second run
- audio, sampling_rate = self.get_audio()
- pd = simpl.SMSPeakDetection()
- pd.max_peaks = self.max_peaks
- pd.hop_size = self.hop_size
- frames2 = pd.find_peaks(audio)[0:self.num_frames]
-
- # make sure we have the same number of frames in each run
- assert len(frames1) == len(frames2)
- for f in range(len(frames1)):
- # in each frame, make sure that we have the same number of peaks
- assert len(frames1[f].peaks) == len(frames2[f].peaks)
- # make sure that each peak has the same value
- for p in range(len(frames1[f].peaks)):
- assert_almost_equals(frames1[f].peaks[p].frequency,
- frames2[f].peaks[p].frequency,
- self.FLOAT_PRECISION)
- assert_almost_equals(frames1[f].peaks[p].amplitude,
- frames2[f].peaks[p].amplitude,
- self.FLOAT_PRECISION)
- assert_almost_equals(frames1[f].peaks[p].phase,
- frames2[f].peaks[p].phase,
- self.FLOAT_PRECISION)
-
- def test_peak_detection(self):
- """test_peak_detection
- Compare simplsms Peaks with SMS peaks. Exact peak
- information cannot be retrieved using libsms. Basic peak detection
- is performed by sms_detectPeaks, but this is called multiple times
- with different frame sizes by sms_analyze. This peak data cannot
- be returned from sms_analyze without modifying it, so here
- we compare the peaks to a slightly modified version of sms_analyze
- from simplsms. The peak values should be the same as those found by
- the simplsms find_peaks function. Analyses have to be performed
- separately due to libsms implementation issues."""
- audio, sampling_rate = self.get_audio()
- simplsms.sms_init()
- analysis_params = self.simplsms_analysis_params(sampling_rate)
- analysis_params.iMaxDelayFrames = self.num_frames + 1
- if simplsms.sms_initAnalysis(analysis_params) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.nFrames = self.num_frames
- sms_header = simplsms.SMS_Header()
- simplsms.sms_fillHeader(sms_header, analysis_params, "simplsms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- sms_peaks = []
-
- while current_frame < self.num_frames:
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- frame = audio[sample_offset:sample_offset + size_new_data]
- if len(frame) < size_new_data:
- frame = np.hstack((frame, simpl.zeros(size_new_data - len(frame))))
- analysis_data = simplsms.SMS_Data()
- simplsms.sms_allocFrameH(sms_header, analysis_data)
- status = simplsms.sms_analyze(frame, analysis_data, analysis_params)
- # as the no. of frames of delay is > num_frames, sms_analyze should
- # never get around to performing partial tracking, and so the return
- # value should be 0
- assert status == 0
- num_peaks = analysis_data.nTracks
- frame_peaks = []
- simplsms_freqs = simpl.zeros(num_peaks)
- simplsms_amps = simpl.zeros(num_peaks)
- simplsms_phases = simpl.zeros(num_peaks)
- analysis_data.getSinFreq(simplsms_freqs)
- analysis_data.getSinAmp(simplsms_amps)
- analysis_data.getSinPhase(simplsms_phases)
- for i in range(num_peaks):
- if simplsms_amps[i]:
- p = simpl.Peak()
- # convert amplitude back to linear
- p.amplitude = simplsms_amps[i]
- p.frequency = simplsms_freqs[i]
- p.phase = simplsms_phases[i]
- frame_peaks.append(p)
- sms_peaks.append(frame_peaks)
- pysms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- simplsms.sms_freeAnalysis(analysis_params)
- simplsms.sms_free()
-
- # get simpl peaks
- pd = simpl.SMSPeakDetection()
- pd.hop_size = self.hop_size
- pd.max_peaks = self.max_peaks
- current_frame = 0
- sample_offset = 0
- simpl_peaks = []
-
- while current_frame < self.num_frames:
- pd.frame_size = pd.get_next_frame_size()
- frame = simpl.Frame()
- frame.size = pd.frame_size
- frame.audio = audio[sample_offset:sample_offset + pd.frame_size]
- if len(frame.audio) < pd.frame_size:
- frame.audio = np.hstack((frame.audio, simpl.zeros(pd.frame_size - len(frame.audio))))
- simpl_peaks.append(pd.find_peaks_in_frame(frame))
- sample_offset += pd.frame_size
- current_frame += 1
-
- # make sure we have the same number of frames
- assert len(sms_peaks) == len(simpl_peaks)
-
- # compare data for each frame
- for frame_number in range(len(sms_peaks)):
- sms_frame = sms_peaks[frame_number]
- simpl_frame = simpl_peaks[frame_number]
- # make sure we have the same number of peaks in each frame
- assert len(sms_frame) == len(simpl_frame)
- # check peak values
- for peak_number in range(len(sms_frame)):
- sms_peak = sms_frame[peak_number]
- simpl_peak = simpl_frame[peak_number]
- assert_almost_equals(sms_peak.amplitude, simpl_peak.amplitude,
- self.FLOAT_PRECISION)
- assert_almost_equals(sms_peak.frequency, simpl_peak.frequency,
- self.FLOAT_PRECISION)
- assert_almost_equals(sms_peak.phase, simpl_peak.phase,
- self.FLOAT_PRECISION)
-
- def test_multi_pysms_analyze(self):
- """test_multi_pysms_analyze
- Test that running the pysms sms_analyze function twice in a row
- produces the same results each time. This makes sure that results
- are independent, and also helps to highlight any memory errors."""
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.iSizeSound = self.num_samples
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- freqs1 = []
- amps1 = []
- phases1 = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- # convert frame to floats for libsms
- frame = audio[sample_offset:sample_offset + size_new_data]
- frame = np.array(frame, dtype=np.float32)
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- status = pysms.sms_analyze(frame, analysis_data, analysis_params)
- if status == 1:
- num_partials = analysis_data.nTracks
- freqs = np.zeros(num_partials, dtype=np.float32)
- amps = np.zeros(num_partials, dtype=np.float32)
- phases = np.zeros(num_partials, dtype=np.float32)
- analysis_data.getSinFreq(freqs)
- analysis_data.getSinAmp(amps)
- analysis_data.getSinPhase(phases)
- amps1.append(amps)
- freqs1.append(freqs)
- phases1.append(phases)
- elif status == -1:
- do_analysis = False
- pysms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_free()
-
- # second run
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.iSizeSound = self.num_samples
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- freqs2 = []
- amps2 = []
- phases2 = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- # convert frame to floats for libsms
- frame = audio[sample_offset:sample_offset + size_new_data]
- frame = np.array(frame, dtype=np.float32)
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- status = pysms.sms_analyze(frame, analysis_data, analysis_params)
- if status == 1:
- num_partials = analysis_data.nTracks
- freqs = np.zeros(num_partials, dtype=np.float32)
- amps = np.zeros(num_partials, dtype=np.float32)
- phases = np.zeros(num_partials, dtype=np.float32)
- analysis_data.getSinFreq(freqs)
- analysis_data.getSinAmp(amps)
- analysis_data.getSinPhase(phases)
- amps2.append(amps)
- freqs2.append(freqs)
- phases2.append(phases)
- elif status == -1:
- do_analysis = False
- pysms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_free()
-
- # make sure we have the same number of results in each run
- assert len(freqs1) == len(freqs2)
- assert len(amps1) == len(amps2)
- assert len(phases1) == len(phases2)
-
- for r in range(len(freqs1)):
- # in each result, make sure that we have the same number amps, freqs and phases
- assert len(freqs1[r]) == len(freqs2[r])
- assert len(amps1[r]) == len(amps2[r])
- assert len(phases1[r]) == len(phases2[r])
- # make sure that each partial has the same value
- for p in range(len(freqs1[r])):
- assert_almost_equals(freqs1[r][p], freqs2[r][p], self.FLOAT_PRECISION)
- assert_almost_equals(amps1[r][p], amps2[r][p], self.FLOAT_PRECISION)
- assert_almost_equals(phases1[r][p], phases2[r][p], self.FLOAT_PRECISION)
-
- def test_multi_simpl_partial_tracking(self):
- """test_multi_simpl_partial_tracking
- Test that running the simpl peak detection process twice in a row
- produces the same results each time. This makes sure that results
- are independent, and also helps to highlight any memory errors."""
- audio, sampling_rate = self.get_audio()
- pd = simpl.SMSPeakDetection()
- pd.max_peaks = self.max_peaks
- pd.hop_size = self.hop_size
- peaks = pd.find_peaks(audio)[0:self.num_frames]
- pt = simpl.SMSPartialTracking()
- pt.max_partials = self.max_peaks
- frames1 = pt.find_partials(peaks)
- del pd
- del pt
- # second run
- audio, sampling_rate = self.get_audio()
- pd = simpl.SMSPeakDetection()
- pd.max_peaks = self.max_peaks
- pd.hop_size = self.hop_size
- peaks = pd.find_peaks(audio)[0:self.num_frames]
- pt = simpl.SMSPartialTracking()
- pt.max_partials = self.max_peaks
- frames2 = pt.find_partials(peaks)
-
- # make sure we have the same number of partials in each run
- assert len(frames1) == len(frames2)
- for i in range(len(frames1)):
- # make sure each partial is the same length
- assert len(frames1[i].partials) == len(frames2[i].partials)
- # make sure that the peaks in each partial have the same values
- for p in range(len(frames1[i].partials)):
- assert_almost_equals(frames1[i].partials[p].frequency,
- frames2[i].partials[p].frequency,
- self.FLOAT_PRECISION)
- assert_almost_equals(frames1[i].partials[p].amplitude,
- frames2[i].partials[p].amplitude,
- self.FLOAT_PRECISION)
- assert_almost_equals(frames1[i].partials[p].phase,
- frames2[i].partials[p].phase,
- self.FLOAT_PRECISION)
-
- def test_partial_tracking(self):
- """test_partial_tracking
- Compare pysms Partials with SMS partials."""
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.iSizeSound = self.num_samples
- analysis_params.nFrames = self.num_frames
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- sms_frames = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- # convert frame to floats for libsms
- frame = simpl.Frame()
- frame.size = size_new_data
- frame.audio = np.array(audio[sample_offset:sample_offset + size_new_data],
- dtype=np.float32)
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- num_partials = analysis_data.nTracks
- peaks = []
- status = pysms.sms_analyze(frame.audio, analysis_data, analysis_params)
-
- if status == 1:
- sms_freqs = np.zeros(num_partials, dtype=np.float32)
- sms_amps = np.zeros(num_partials, dtype=np.float32)
- sms_phases = np.zeros(num_partials, dtype=np.float32)
- analysis_data.getSinFreq(sms_freqs)
- analysis_data.getSinAmp(sms_amps)
- analysis_data.getSinPhase(sms_phases)
- for i in range(num_partials):
- p = simpl.Peak()
- p.amplitude = sms_amps[i]
- p.frequency = sms_freqs[i]
- p.phase = sms_phases[i]
- peaks.append(p)
- frame.partials = peaks
- sms_frames.append(frame)
- current_frame += 1
-
- if status == -1:
- do_analysis = False
-
- pysms.sms_freeFrame(analysis_data)
-
- # first frame is blank
- sms_frames = sms_frames[1:]
-
- # free sms memory
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_free()
-
- pd = simpl.SMSPeakDetection()
- pd.max_peaks = self.max_peaks
- pd.hop_size = self.hop_size
- peaks = pd.find_peaks(audio)
- pt = simpl.SMSPartialTracking()
- pt.max_partials = self.max_partials
- simpl_frames = pt.find_partials(peaks)
-
- # make sure both have the same number of partials
- assert len(sms_frames) == len(simpl_frames)
-
- # make sure each partial is the same
- for i in range(len(sms_frames)):
- assert len(sms_frames[i].partials) == len(simpl_frames[i].partials)
- for p in range(len(sms_frames[i].partials)):
- assert_almost_equals(sms_frames[i].partials[p].amplitude,
- simpl_frames[i].partials[p].amplitude,
- self.FLOAT_PRECISION)
- assert_almost_equals(sms_frames[i].partials[p].frequency,
- simpl_frames[i].partials[p].frequency,
- self.FLOAT_PRECISION)
- assert_almost_equals(sms_frames[i].partials[p].phase,
- simpl_frames[i].partials[p].phase,
- self.FLOAT_PRECISION)
-
- def test_sms_interpolate_frames(self):
- """test_sms_interpolate_frames
- Make sure that sms_interpolateFrames returns the expected values
- with interpolation factors of 0 and 1."""
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- analysis_params.nFrames = self.num_frames
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.iSizeSound = self.num_samples
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- interp_frame = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, interp_frame)
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- analysis_frames = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- frame = audio[sample_offset:sample_offset + size_new_data]
- # convert frame to floats for libsms
- frame = np.array(frame, dtype=np.float32)
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- status = pysms.sms_analyze(frame, analysis_data, analysis_params)
-
- if status == 1:
- analysis_frames.append(analysis_data)
- # test interpolateFrames on the last two analysis frames
- if current_frame == self.num_frames - 1:
- left_frame = analysis_frames[-2]
- right_frame = analysis_frames[-1]
- pysms.sms_interpolateFrames(left_frame, right_frame, interp_frame, 0)
- # make sure that interp_frame == left_frame
- # interpolateFrames doesn't interpolate phases so ignore
- left_amps = np.zeros(self.max_partials, dtype=np.float32)
- left_freqs = np.zeros(self.max_partials, dtype=np.float32)
- left_frame.getSinAmp(left_amps)
- left_frame.getSinFreq(left_freqs)
- right_amps = np.zeros(self.max_partials, dtype=np.float32)
- right_freqs = np.zeros(self.max_partials, dtype=np.float32)
- right_frame.getSinAmp(right_amps)
- right_frame.getSinFreq(right_freqs)
- interp_amps = np.zeros(self.max_partials, dtype=np.float32)
- interp_freqs = np.zeros(self.max_partials, dtype=np.float32)
- interp_frame.getSinAmp(interp_amps)
- interp_frame.getSinFreq(interp_freqs)
- for i in range(self.max_partials):
- assert_almost_equals(left_amps[i], interp_amps[i],
- self.FLOAT_PRECISION)
- if left_freqs[i] != 0:
- assert_almost_equals(left_freqs[i], interp_freqs[i],
- self.FLOAT_PRECISION)
- else:
- assert_almost_equals(right_freqs[i], interp_freqs[i],
- self.FLOAT_PRECISION)
- pysms.sms_interpolateFrames(left_frame, right_frame, interp_frame, 1)
- interp_amps = np.zeros(self.max_partials, dtype=np.float32)
- interp_freqs = np.zeros(self.max_partials, dtype=np.float32)
- interp_frame.getSinAmp(interp_amps)
- interp_frame.getSinFreq(interp_freqs)
- for i in range(self.max_partials):
- assert_almost_equals(right_amps[i], interp_amps[i],
- self.FLOAT_PRECISION)
- if right_freqs[i] != 0:
- assert_almost_equals(right_freqs[i], interp_freqs[i],
- self.FLOAT_PRECISION)
- else:
- assert_almost_equals(left_freqs[i], interp_freqs[i],
- self.FLOAT_PRECISION)
- elif status == -1:
- raise Exception("AnalysisStoppedEarly")
- else:
- pysms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- for frame in analysis_frames:
- pysms.sms_freeFrame(frame)
- pysms.sms_freeFrame(interp_frame)
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_free()
-
- def test_simplsms_interpolate_frames(self):
- """test_simplsms_interpolate_frames
- Make sure that sms_interpolateFrames returns the expected values
- with interpolation factors of 0 and 1."""
- audio, sampling_rate = self.get_audio()
- simplsms.sms_init()
- analysis_params = self.simplsms_analysis_params(sampling_rate)
- analysis_params.nFrames = self.num_frames
- if simplsms.sms_initAnalysis(analysis_params) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.iSizeSound = self.num_samples
- sms_header = simplsms.SMS_Header()
- simplsms.sms_fillHeader(sms_header, analysis_params, "simplsms")
-
- interp_frame = simplsms.SMS_Data()
- simplsms.sms_allocFrameH(sms_header, interp_frame)
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- analysis_frames = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- frame = audio[sample_offset:sample_offset + size_new_data]
- analysis_data = simplsms.SMS_Data()
- simplsms.sms_allocFrameH(sms_header, analysis_data)
- status = simplsms.sms_analyze(frame, analysis_data, analysis_params)
-
- if status == 1:
- analysis_frames.append(analysis_data)
- # test interpolateFrames on the last two analysis frames
- if current_frame == self.num_frames - 1:
- left_frame = analysis_frames[-2]
- right_frame = analysis_frames[-1]
- simplsms.sms_interpolateFrames(left_frame, right_frame, interp_frame, 0)
- # make sure that interp_frame == left_frame
- # interpolateFrames doesn't interpolate phases so ignore
- left_amps = simpl.zeros(self.max_partials)
- left_freqs = simpl.zeros(self.max_partials)
- left_frame.getSinAmp(left_amps)
- left_frame.getSinFreq(left_freqs)
- right_amps = simpl.zeros(self.max_partials)
- right_freqs = simpl.zeros(self.max_partials)
- right_frame.getSinAmp(right_amps)
- right_frame.getSinFreq(right_freqs)
- interp_amps = simpl.zeros(self.max_partials)
- interp_freqs = simpl.zeros(self.max_partials)
- interp_frame.getSinAmp(interp_amps)
- interp_frame.getSinFreq(interp_freqs)
- for i in range(self.max_partials):
- assert_almost_equals(left_amps[i], interp_amps[i],
- self.FLOAT_PRECISION)
- if left_freqs[i] != 0:
- assert_almost_equals(left_freqs[i], interp_freqs[i],
- self.FLOAT_PRECISION)
- else:
- assert_almost_equals(right_freqs[i], interp_freqs[i],
- self.FLOAT_PRECISION)
- simplsms.sms_interpolateFrames(left_frame, right_frame, interp_frame, 1)
- interp_amps = simpl.zeros(self.max_partials)
- interp_freqs = simpl.zeros(self.max_partials)
- interp_frame.getSinAmp(interp_amps)
- interp_frame.getSinFreq(interp_freqs)
- for i in range(self.max_partials):
- assert_almost_equals(right_amps[i], interp_amps[i],
- self.FLOAT_PRECISION)
- if right_freqs[i] != 0:
- assert_almost_equals(right_freqs[i], interp_freqs[i],
- self.FLOAT_PRECISION)
- else:
- assert_almost_equals(left_freqs[i], interp_freqs[i],
- self.FLOAT_PRECISION)
- elif status == -1:
- raise Exception("AnalysisStoppedEarly")
- else:
- simplsms.sms_freeFrame(analysis_data)
- current_frame += 1
-
- for frame in analysis_frames:
- simplsms.sms_freeFrame(frame)
- simplsms.sms_freeFrame(interp_frame)
- simplsms.sms_freeAnalysis(analysis_params)
- simplsms.sms_free()
-
- def test_harmonic_synthesis(self):
- """test_harmonic_synthesis
- Compare pysms synthesised harmonic component with SMS synthesised
- harmonic component."""
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- analysis_params.nFrames = self.num_frames
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.iSizeSound = self.num_samples
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- analysis_frames = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- frame = audio[sample_offset:sample_offset + size_new_data]
- # convert frame to floats for libsms
- frame = np.array(frame, dtype=np.float32)
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- status = pysms.sms_analyze(frame, analysis_data, analysis_params)
- if status == 1:
- analysis_frames.append(analysis_data)
- current_frame += 1
- elif status == 0:
- pysms.sms_freeFrame(analysis_data)
- elif status == -1:
- do_analysis = False
- pysms.sms_freeFrame(analysis_data)
-
- # remove the first frame, it's blank
- blank_frame = analysis_frames[0]
- analysis_frames = analysis_frames[1:]
- pysms.sms_freeFrame(blank_frame)
-
- synth_params = self.pysms_synthesis_params(sampling_rate)
- pysms.sms_initSynth(sms_header, synth_params)
-
- synth_samples = np.zeros(synth_params.sizeHop, dtype=np.float32)
- sms_audio = np.array([], dtype=np.float32)
- current_frame = 0
-
- while current_frame < len(analysis_frames):
- pysms.sms_synthesize(analysis_frames[current_frame], synth_samples, synth_params)
- sms_audio = np.hstack((sms_audio, synth_samples))
- current_frame += 1
-
- for frame in analysis_frames:
- pysms.sms_freeFrame(frame)
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_freeSynth(synth_params)
- pysms.sms_free()
-
- pd = simpl.SMSPeakDetection()
- pd.max_peaks = self.max_peaks
- pd.hop_size = self.hop_size
- peaks = pd.find_peaks(audio)
- pt = simpl.SMSPartialTracking()
- pt.max_partials = self.max_partials
- partials = pt.find_partials(peaks)
- synth = simpl.SMSSynthesis()
- synth.hop_size = self.hop_size
- synth.max_partials = self.max_partials
- synth.det_synthesis_type = simplsms.SMS_DET_IFFT
- simpl_audio = synth.synth(partials)
-
- assert len(sms_audio) == len(simpl_audio)
- for i in range(simpl_audio.size):
- assert_almost_equals(sms_audio[i], simpl_audio[i], self.FLOAT_PRECISION)
-
- def test_harmonic_synthesis_sin(self):
- """test_harmonic_synthesis_sin
- Compare pysms synthesised harmonic component with SMS synthesised
- harmonic component."""
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.iSizeSound = self.num_samples
- analysis_params.nFrames = self.num_frames
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- analysis_frames = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- frame = audio[sample_offset:sample_offset + size_new_data]
- # convert frame to floats for libsms
- frame = np.array(frame, dtype=np.float32)
- if len(frame) < size_new_data:
- frame = np.hstack((frame, np.zeros(size_new_data - len(frame),
- dtype=np.float32)))
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- status = pysms.sms_analyze(frame, analysis_data, analysis_params)
- if status == 1:
- analysis_frames.append(analysis_data)
- current_frame += 1
- elif status == 0:
- pysms.sms_freeFrame(analysis_data)
- elif status == -1:
- do_analysis = False
- pysms.sms_freeFrame(analysis_data)
-
- # remove the first frame, it's blank
- blank_frame = analysis_frames[0]
- analysis_frames = analysis_frames[1:]
- pysms.sms_freeFrame(blank_frame)
-
- synth_params = self.pysms_synthesis_params(sampling_rate)
- synth_params.iDetSynthType = pysms.SMS_DET_SIN
- pysms.sms_initSynth(sms_header, synth_params)
-
- synth_samples = np.zeros(synth_params.sizeHop, dtype=np.float32)
- sms_audio = np.array([], dtype=np.float32)
- current_frame = 0
-
- while current_frame < len(analysis_frames):
- pysms.sms_synthesize(analysis_frames[current_frame], synth_samples, synth_params)
- sms_audio = np.hstack((sms_audio, synth_samples))
- current_frame += 1
-
- for frame in analysis_frames:
- pysms.sms_freeFrame(frame)
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_freeSynth(synth_params)
- pysms.sms_free()
-
- pd = simpl.SMSPeakDetection()
- pd.max_peaks = self.max_peaks
- pd.hop_size = self.hop_size
- peaks = pd.find_peaks(audio)
- pt = simpl.SMSPartialTracking()
- pt.max_partials = self.max_partials
- partials = pt.find_partials(peaks)
- synth = simpl.SMSSynthesis()
- synth.hop_size = self.hop_size
- synth.max_partials = self.max_partials
- synth.det_synthesis_type = simplsms.SMS_DET_SIN
- simpl_audio = synth.synth(partials)
-
- assert len(sms_audio) == len(simpl_audio)
- for i in range(simpl_audio.size):
- assert_almost_equals(sms_audio[i], simpl_audio[i], self.FLOAT_PRECISION)
-
- def test_residual_synthesis(self):
- """test_residual_synthesis
- Compare pysms residual signal with SMS residual"""
-
- # -------------------------------------------
- # This test is not finished yet. Skip for now
- from nose.plugins.skip import SkipTest
- raise SkipTest
- # -------------------------------------------
-
- audio, sampling_rate = self.get_audio()
- pysms.sms_init()
- snd_header = pysms.SMS_SndHeader()
- # Try to open the input file to fill snd_header
- if(pysms.sms_openSF(self.input_file, snd_header)):
- raise NameError("error opening sound file: " + pysms.sms_errorString())
- analysis_params = self.pysms_analysis_params(sampling_rate)
- analysis_params.nFrames = self.num_frames
- analysis_params.nStochasticCoeff = 128
- analysis_params.iStochasticType = pysms.SMS_STOC_APPROX
- if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
- raise Exception("Error allocating memory for analysis_params")
- analysis_params.iSizeSound = self.num_samples
- sms_header = pysms.SMS_Header()
- pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
-
- sample_offset = 0
- size_new_data = 0
- current_frame = 0
- analysis_frames = []
- do_analysis = True
-
- while do_analysis and (current_frame < self.num_frames):
- sample_offset += size_new_data
- size_new_data = analysis_params.sizeNextRead
- # convert frame to floats for libsms
- frame = audio[sample_offset:sample_offset + size_new_data]
- frame = np.array(frame, dtype=np.float32)
- analysis_data = pysms.SMS_Data()
- pysms.sms_allocFrameH(sms_header, analysis_data)
- status = pysms.sms_analyze(frame, analysis_data, analysis_params)
- analysis_frames.append(analysis_data)
- if status == -1:
- do_analysis = False
- current_frame += 1
-
- sms_header.nFrames = len(analysis_frames)
- synth_params = self.pysms_synthesis_params(sampling_rate)
- synth_params.iStochasticType = pysms.SMS_STOC_APPROX
- synth_params.iSynthesisType = pysms.SMS_STYPE_STOC
- pysms.sms_initSynth(sms_header, synth_params)
- synth_samples = np.zeros(synth_params.sizeHop, dtype=np.float32)
- sms_residual = np.array([], dtype=np.float32)
- current_frame = 0
-
- while current_frame < len(analysis_frames):
- pysms.sms_synthesize(analysis_frames[current_frame], synth_samples, synth_params)
- sms_residual = np.hstack((sms_residual, synth_samples))
- current_frame += 1
-
- for frame in analysis_frames:
- pysms.sms_freeFrame(frame)
- pysms.sms_freeAnalysis(analysis_params)
- pysms.sms_closeSF()
- pysms.sms_freeSynth(synth_params)
- pysms.sms_free()
-
- pd = simpl.SMSPeakDetection()
- pd.max_peaks = self.max_peaks
- pd.hop_size = self.hop_size
- peaks = pd.find_peaks(audio)[0:self.num_frames]
- pt = simpl.SMSPartialTracking()
- pt.max_partials = self.max_partials
- partials = pt.find_partials(peaks)
- synth = simpl.SMSSynthesis()
- synth.hop_size = self.hop_size
- synth.max_partials = self.max_partials
- simpl_harmonic = synth.synth(partials)
- res = simpl.SMSResidual()
- simpl_residual = res.synth(simpl_harmonic, audio[0:simpl_harmonic.size])
-
- assert len(simpl_residual) == len(sms_residual)
- for i in range(len(simpl_residual)):
- assert_almost_equals(simpl_residual[i], sms_residual[i],
- self.FLOAT_PRECISION)
-
-
-if __name__ == "__main__":
- # run individual tests programatically
- # useful for debugging, particularly with GDB
- import nose
- argv = [__file__,
- "--nocapture",
- #__file__ + ":TestSimplSMS.test_residual_synthesis"]
- __file__ + ":TestSimplSMS.test_harmonic_synthesis_sin"]
- nose.run(argv=argv)
diff --git a/tests/test_sms_old.py b/tests/test_sms_old.py
deleted file mode 100644
index 7ed8724..0000000
--- a/tests/test_sms_old.py
+++ /dev/null
@@ -1,126 +0,0 @@
-# Copyright (c) 2009 John Glover, National University of Ireland, Maynooth
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 59 Temple Place, Suite 330, Boston, M 02111-1307 USA
-
-import unittest
-from pysms import SMS_Header, SMS_Data, SMS_SndHeader, SMS_AnalParams, \
- sms_openSF, sms_errorString, sms_getSound, \
- sms_fillHeader, sms_init, sms_initAnalysis, sms_allocFrameH, \
- sms_freeFrame, sms_freeAnalysis, sms_free
-from scipy import zeros, sin, pi, asarray, int16
-from scipy.io.wavfile import read, write
-import os
-import random
-from pylab import plot, show
-
-TEST_AUDIO_FILE = "Tests.wav"
-
-# Create a test audio file (1 second of a sine wave at 220 Hz)
-test_audio = zeros(44100)
-for sample_number in range(test_audio.size):
- test_audio[sample_number] = sin(2 * pi * 220 * sample_number / 44100.0)
-# convert to int values
-test_audio *= 32767
-test_audio = asarray(test_audio, int16)
-
-def create_test_audio_file():
- "Create a test audio file in the current directory"
- write(TEST_AUDIO_FILE, 44100, test_audio)
-
-def delete_test_audio_file():
- "Delete the test audio file created by the function create_test_audio_file"
- os.remove(TEST_AUDIO_FILE)
-
-class TestSoundIO(unittest.TestCase):
- def setUp(self):
- self.snd_header = SMS_SndHeader()
-
- def test_sms_openSF_file_exists(self):
- "sms_openSF returns True when trying to open an existing file"
- create_test_audio_file()
- self.assert_(sms_openSF(TEST_AUDIO_FILE, self.snd_header) == 0)
- delete_test_audio_file()
-
- def test_sms_openSF_file_missing(self):
- "sms_openSF returns False when trying to open a file that doesn't exist"
- file_path = ""
- max_file_names = 1000
- count = 0
- class MaxFilesReached(Exception): pass
- # create a path to a non-existent file
- while True:
- file_path = str(random.randint(0, max_file_names)) + ".wav"
- if not os.path.isfile(file_path):
- break
- if count > max_file_names:
- raise MaxFilesReached
- count += 1
- # call sms_openSF, should return an error
- self.assertRaises(IndexError, sms_openSF, file_path, self.snd_header)
-
- def test_sms_getSound(self):
- "sms_getSound"
- create_test_audio_file()
- self.assert_(sms_openSF(TEST_AUDIO_FILE, self.snd_header) == 0)
- frame_size = 512
- frame = zeros(frame_size).astype('float32')
- self.assert_(sms_getSound(self.snd_header, frame, 0) == 0)
- # test that values read in are the same as those written (allowing for some rounding errors)
- class SampleMismatch(Exception): pass
- for sample_number in range(frame_size):
- if abs((test_audio[sample_number] / 32768.0) - frame[sample_number] > 0.000001):
- raise SampleMismatch
- delete_test_audio_file()
-
-class TestInit(unittest.TestCase):
- def setUp(self):
- self.snd_header = SMS_SndHeader()
- self.sms_header = SMS_Header()
- self.data = SMS_Data()
- self.analysis_params = SMS_AnalParams()
-
- def tearDown(self):
- sms_freeFrame(self.data)
-
- def test_sms_fillHeader(self):
- "sms_fillHeader copies data from an SMS_AnalParams to an SMS_Header"
- data_fields = ["nFrames", "iFormat", "iFrameRate", "iStochasticType", \
- "nTracks", "iSamplingRate", "nStochasticCoeff"]
- sms_fillHeader(self.sms_header, self.analysis_params, "")
- for field in data_fields:
- self.assert_(eval("self.sms_header."+field) == eval("self.analysis_params."+field))
-
- def test_sms_init(self):
- "sms_init"
- self.assert_(sms_init() == 0)
-
- def test_sms_initAnalysis(self):
- "sms_initAnalysis"
- create_test_audio_file()
- if(sms_openSF(TEST_AUDIO_FILE, self.snd_header)):
- raise NameError("error opening sound file: " + sms_errorString())
- self.assert_(sms_initAnalysis(self.analysis_params, self.snd_header) == 0)
- delete_test_audio_file()
-
- def test_sms_allocFrameH(self):
- "sms_allocFrameH"
- create_test_audio_file()
- if(sms_openSF(TEST_AUDIO_FILE, self.snd_header)):
- raise NameError("error opening sound file: " + sms_errorString())
- self.assert_(sms_allocFrameH(self.sms_header, self.data) == 0)
- delete_test_audio_file()
-
-if __name__ == '__main__':
- unittest.main()
diff --git a/tests/test_sndobj.py b/tests/test_sndobj.py
index 527a9d7..2a27930 100644
--- a/tests/test_sndobj.py
+++ b/tests/test_sndobj.py
@@ -1,19 +1,3 @@
-# Copyright (c) 2009 John Glover, National University of Ireland, Maynooth
-#
-# This program is free software; you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation; either version 2 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program; if not, write to the Free Software
-# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
-
import unittest
import sndobj
import simpl
@@ -21,7 +5,8 @@ from simpl import pysndobj
from scipy.io.wavfile import read
import numpy as np
-FLOAT_PRECISION = 2 # number of decimal places to check for accuracy
+FLOAT_PRECISION = 2 # number of decimal places to check for accuracy
+
class TestSimplSndObj(unittest.TestCase):
def setUp(self):
diff --git a/tests/test_synthesis.py b/tests/test_synthesis.py
new file mode 100644
index 0000000..2e620ea
--- /dev/null
+++ b/tests/test_synthesis.py
@@ -0,0 +1,126 @@
+import os
+from nose.tools import assert_almost_equals
+import simpl
+import simpl.peak_detection as peak_detection
+import simpl.partial_tracking as partial_tracking
+import simpl.synthesis as synthesis
+
+float_precision = 2
+frame_size = 512
+hop_size = 512
+max_peaks = 10
+max_partials = 10
+num_frames = 30
+num_samples = num_frames * hop_size
+audio_path = os.path.join(
+ os.path.dirname(__file__), 'audio/flute.wav'
+)
+libsms_harmonic_synthesis_ifft_path = os.path.join(
+ os.path.dirname(__file__), 'libsms_harmonic_synthesis_ifft.wav'
+)
+libsms_harmonic_synthesis_sin_path = os.path.join(
+ os.path.dirname(__file__), 'libsms_harmonic_synthesis_sin.wav'
+)
+
+PeakDetection = peak_detection.PeakDetection
+SMSPeakDetection = peak_detection.SMSPeakDetection
+PartialTracking = partial_tracking.PartialTracking
+SMSPartialTracking = partial_tracking.SMSPartialTracking
+Synthesis = synthesis.Synthesis
+SMSSynthesis = synthesis.SMSSynthesis
+
+
+class TestSynthesis(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = simpl.read_wav(audio_path)[0]
+ cls.audio = cls.audio[0:num_samples]
+
+ def test_basic(self):
+ pd = PeakDetection()
+ pd.hop_size = hop_size
+ frames = pd.find_peaks(self.audio)
+
+ pt = PartialTracking()
+ pt.max_partials = max_partials
+ frames = pt.find_partials(frames)
+
+ s = Synthesis()
+ s.hop_size = hop_size
+ synth_audio = s.synth(frames)
+
+ assert len(synth_audio) == len(self.audio)
+
+
+class TestSMSSynthesis(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = simpl.read_wav(audio_path)[0]
+ cls.audio = cls.audio[0:num_samples]
+
+ def test_basic(self):
+ pd = SMSPeakDetection()
+ pd.hop_size = hop_size
+ frames = pd.find_peaks(self.audio)
+
+ pt = SMSPartialTracking()
+ pt.max_partials = max_partials
+ frames = pt.find_partials(frames)
+
+ s = SMSSynthesis()
+ s.hop_size = hop_size
+ synth_audio = s.synth(frames)
+
+ assert len(synth_audio) == len(self.audio)
+
+ def test_harmonic_synthesis_ifft(self):
+ pd = SMSPeakDetection()
+ pd.hop_size = hop_size
+ frames = pd.find_peaks(self.audio)
+
+ pt = SMSPartialTracking()
+ pt.max_partials = max_partials
+ frames = pt.find_partials(frames)
+
+ synth = SMSSynthesis()
+ synth.hop_size = hop_size
+ synth.max_partials = max_partials
+ synth.det_synthesis_type = SMSSynthesis.SMS_DET_IFFT
+ synth_audio = synth.synth(frames)
+
+ assert len(synth_audio) == len(self.audio)
+
+ sms_audio, sampling_rate = simpl.read_wav(
+ libsms_harmonic_synthesis_ifft_path
+ )
+
+ assert len(synth_audio) == len(sms_audio)
+
+ for i in range(len(synth_audio)):
+ assert_almost_equals(synth_audio[i], sms_audio[i], float_precision)
+
+ def test_harmonic_synthesis_sin(self):
+ pd = SMSPeakDetection()
+ pd.hop_size = hop_size
+ frames = pd.find_peaks(self.audio)
+
+ pt = SMSPartialTracking()
+ pt.max_partials = max_partials
+ frames = pt.find_partials(frames)
+
+ synth = SMSSynthesis()
+ synth.hop_size = hop_size
+ synth.max_partials = max_partials
+ synth.det_synthesis_type = SMSSynthesis.SMS_DET_SIN
+ synth_audio = synth.synth(frames)
+
+ assert len(synth_audio) == len(self.audio)
+
+ sms_audio, sampling_rate = simpl.read_wav(
+ libsms_harmonic_synthesis_sin_path
+ )
+
+ assert len(synth_audio) == len(sms_audio)
+
+ for i in range(len(synth_audio)):
+ assert_almost_equals(synth_audio[i], sms_audio[i], float_precision)