summaryrefslogtreecommitdiff
path: root/tests
diff options
context:
space:
mode:
authorJohn Glover <j@johnglover.net>2012-06-30 19:04:02 +0100
committerJohn Glover <j@johnglover.net>2012-06-30 19:04:02 +0100
commitb2e6565c4f94134948cb2d38c27b8c062191ce4a (patch)
tree9e8f849a149723389c033d5005fe082e659687f6 /tests
parent1ef9783c3faed6a18e8cc2fba34f48b50bedd08a (diff)
downloadsimpl-b2e6565c4f94134948cb2d38c27b8c062191ce4a.tar.gz
simpl-b2e6565c4f94134948cb2d38c27b8c062191ce4a.tar.bz2
simpl-b2e6565c4f94134948cb2d38c27b8c062191ce4a.zip
[sms] Add C++ implementation of SMSPeakDetection.
Diffstat (limited to 'tests')
-rw-r--r--tests/test_peak_detection.py106
1 files changed, 105 insertions, 1 deletions
diff --git a/tests/test_peak_detection.py b/tests/test_peak_detection.py
index b24b701..6d623b6 100644
--- a/tests/test_peak_detection.py
+++ b/tests/test_peak_detection.py
@@ -1,12 +1,20 @@
import os
import numpy as np
from nose.tools import assert_almost_equals
+import pysms
import simpl
import simpl.peak_detection as peak_detection
+PeakDetection = peak_detection.PeakDetection
+SMSPeakDetection = peak_detection.SMSPeakDetection
+
float_precision = 5
frame_size = 512
hop_size = 512
+max_peaks = 10
+max_partials = 10
+num_frames = 30
+num_samples = num_frames * hop_size
audio_path = os.path.join(
os.path.dirname(__file__), 'audio/flute.wav'
)
@@ -18,8 +26,104 @@ class TestPeakDetection(object):
cls.audio = simpl.read_wav(audio_path)[0]
def test_peak_detection(self):
- pd = peak_detection.PeakDetection()
+ pd = PeakDetection()
pd.find_peaks(self.audio)
assert len(pd.frames) == len(self.audio) / hop_size
assert len(pd.frames[0].peaks) == 0
+
+
+class TestSMSPeakDetection(object):
+ def _pysms_analysis_params(self, sampling_rate):
+ analysis_params = pysms.SMS_AnalParams()
+ pysms.sms_initAnalParams(analysis_params)
+ analysis_params.iSamplingRate = sampling_rate
+ analysis_params.iFrameRate = sampling_rate / hop_size
+ analysis_params.iWindowType = pysms.SMS_WIN_HAMMING
+ analysis_params.fDefaultFundamental = 100
+ analysis_params.fHighestFreq = 20000
+ analysis_params.iFormat = pysms.SMS_FORMAT_HP
+ analysis_params.nTracks = max_peaks
+ analysis_params.peakParams.iMaxPeaks = max_peaks
+ analysis_params.nGuides = max_peaks
+ analysis_params.iMaxDelayFrames = 4
+ analysis_params.analDelay = 0
+ analysis_params.minGoodFrames = 1
+ analysis_params.iCleanTracks = 0
+ analysis_params.iStochasticType = pysms.SMS_STOC_NONE
+ analysis_params.preEmphasis = 0
+ return analysis_params
+
+ def test_size_next_read(self):
+ """
+ test_size_next_read
+ Make sure PeakDetection is calculating the correct value for the
+ size of the next frame.
+ """
+ audio, sampling_rate = simpl.read_wav(audio_path)
+ pysms.sms_init()
+ snd_header = pysms.SMS_SndHeader()
+
+ # Try to open the input file to fill snd_header
+ if(pysms.sms_openSF(audio_path, snd_header)):
+ raise NameError(
+ "error opening sound file: " + pysms.sms_errorString()
+ )
+
+ analysis_params = self._pysms_analysis_params(sampling_rate)
+ analysis_params.iMaxDelayFrames = num_frames + 1
+ if pysms.sms_initAnalysis(analysis_params, snd_header) != 0:
+ raise Exception("Error allocating memory for analysis_params")
+ analysis_params.nFrames = num_frames
+ sms_header = pysms.SMS_Header()
+ pysms.sms_fillHeader(sms_header, analysis_params, "pysms")
+
+ sample_offset = 0
+ pysms_size_new_data = 0
+ current_frame = 0
+ sms_next_read_sizes = []
+
+ while current_frame < num_frames:
+ sms_next_read_sizes.append(analysis_params.sizeNextRead)
+ sample_offset += pysms_size_new_data
+ pysms_size_new_data = analysis_params.sizeNextRead
+
+ # convert frame to floats for libsms
+ frame = audio[sample_offset:sample_offset + pysms_size_new_data]
+ frame = np.array(frame, dtype=np.float32)
+ if len(frame) < pysms_size_new_data:
+ frame = np.hstack((
+ frame, np.zeros(pysms_size_new_data - len(frame),
+ dtype=np.float32)
+ ))
+
+ analysis_data = pysms.SMS_Data()
+ pysms.sms_allocFrameH(sms_header, analysis_data)
+ status = pysms.sms_analyze(frame, analysis_data, analysis_params)
+ # as the no. of frames of delay is > num_frames, sms_analyze should
+ # never get around to performing partial tracking, and so the
+ # return value should be 0
+ assert status == 0
+ pysms.sms_freeFrame(analysis_data)
+ current_frame += 1
+
+ pysms.sms_freeAnalysis(analysis_params)
+ pysms.sms_closeSF()
+ pysms.sms_free()
+
+ pd = SMSPeakDetection()
+ pd.hop_size = hop_size
+ pd.max_peaks = max_peaks
+ current_frame = 0
+ sample_offset = 0
+
+ while current_frame < num_frames:
+ pd.frame_size = pd.next_frame_size()
+ assert sms_next_read_sizes[current_frame] == pd.frame_size,\
+ (sms_next_read_sizes[current_frame], pd.frame_size)
+ frame = simpl.Frame()
+ frame.size = pd.frame_size
+ frame.audio = audio[sample_offset:sample_offset + pd.frame_size]
+ pd.find_peaks_in_frame(frame)
+ sample_offset += pd.frame_size
+ current_frame += 1