summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorJohn Glover <j@johnglover.net>2012-06-28 19:02:34 +0100
committerJohn Glover <j@johnglover.net>2012-06-28 19:02:34 +0100
commit48e299eacc65b5df1b3305f7123eccf30c69d834 (patch)
tree1b4631c78a1bae04016d6d62892ce6ad128ce518
parent974a493e6c6e2563de08952cb16792e691396afa (diff)
downloadsimpl-48e299eacc65b5df1b3305f7123eccf30c69d834.tar.gz
simpl-48e299eacc65b5df1b3305f7123eccf30c69d834.tar.bz2
simpl-48e299eacc65b5df1b3305f7123eccf30c69d834.zip
[base] Add C++ implementation of Synthesis and Residual.
-rw-r--r--simpl/base.pyx128
-rw-r--r--src/simpl/base.cpp113
-rw-r--r--src/simpl/base.h71
-rw-r--r--tests/test_base.py83
4 files changed, 368 insertions, 27 deletions
diff --git a/simpl/base.pyx b/simpl/base.pyx
index bb34e14..b126be1 100644
--- a/simpl/base.pyx
+++ b/simpl/base.pyx
@@ -92,6 +92,38 @@ cdef extern from "../src/simpl/base.h" namespace "simpl":
vector[c_Peak*] update_partials(c_Frame* frame)
vector[c_Frame*] find_partials(vector[c_Frame*] frames)
+ cdef cppclass c_Synthesis "simpl::Synthesis":
+ c_Synthesis()
+ int frame_size()
+ void frame_size(int new_frame_size)
+ int next_frame_size()
+ int hop_size()
+ void hop_size(int new_hop_size)
+ int sampling_rate()
+ void sampling_rate(int new_sampling_rate)
+ int max_partials()
+ void max_partials(int new_max_partials)
+ void synth_frame(c_Frame* frame)
+ vector[c_Frame*] synth(vector[c_Frame*] frames)
+
+ cdef cppclass c_Residual "simpl::Residual":
+ c_Synthesis()
+ int frame_size()
+ void frame_size(int new_frame_size)
+ int next_frame_size()
+ int hop_size()
+ void hop_size(int new_hop_size)
+ int sampling_rate()
+ void sampling_rate(int new_sampling_rate)
+ void residual_frame(int synth_size, double* synth,
+ int original_size, double* original,
+ int residual_size, double* residual)
+ void find_residual(int synth_size, double* synth,
+ int original_size, double* original,
+ int residual_size, double* residual)
+ void synth_frame(c_Frame* frame)
+ vector[c_Frame*] synth(vector[c_Frame*] frames)
+
cdef class Peak:
cdef c_Peak* thisptr
@@ -355,3 +387,99 @@ cdef class PartialTracking:
f.set_frame(output_frames[i])
partial_frames.append(f)
return partial_frames
+
+
+cdef class Synthesis:
+ cdef c_Synthesis* thisptr
+
+ def __cinit__(self): self.thisptr = new c_Synthesis()
+ def __dealloc__(self): del self.thisptr
+
+ property sampling_rate:
+ def __get__(self): return self.thisptr.sampling_rate()
+ def __set__(self, int i): self.thisptr.sampling_rate(i)
+
+ property frame_size:
+ def __get__(self): return self.thisptr.frame_size()
+ def __set__(self, int i): self.thisptr.frame_size(i)
+
+ property hop_size:
+ def __get__(self): return self.thisptr.hop_size()
+ def __set__(self, int i): self.thisptr.hop_size(i)
+
+ property max_partials:
+ def __get__(self): return self.thisptr.max_partials()
+ def __set__(self, int i): self.thisptr.max_partials(i)
+
+ def synth_frame(self, Frame frame not None):
+ self.thisptr.synth_frame(frame.thisptr)
+ return frame.audio
+
+ def synth(self, frames):
+ cdef vector[c_Frame*] c_frames
+ for frame in frames:
+ c_frames.push_back((<Frame>frame).thisptr)
+ cdef vector[c_Frame*] output_frames = self.thisptr.synth(c_frames)
+ cdef np.ndarray[dtype_t, ndim=1] output = np.zeros(
+ output_frames.size() * self.thisptr.hop_size()
+ )
+ cdef np.npy_intp shape[1]
+ shape[0] = <np.npy_intp> self.thisptr.hop_size()
+ for i in range(output_frames.size()):
+ frame_audio = np.PyArray_SimpleNewFromData(1, shape, np.NPY_DOUBLE, output_frames[i].synth())
+ output[i * self.thisptr.hop_size():(i + 1) * self.thisptr.hop_size()] = frame_audio
+ return output
+
+
+cdef class Residual:
+ cdef c_Residual* thisptr
+
+ def __cinit__(self): self.thisptr = new c_Residual()
+ def __dealloc__(self): del self.thisptr
+
+ property sampling_rate:
+ def __get__(self): return self.thisptr.sampling_rate()
+ def __set__(self, int i): self.thisptr.sampling_rate(i)
+
+ property frame_size:
+ def __get__(self): return self.thisptr.frame_size()
+ def __set__(self, int i): self.thisptr.frame_size(i)
+
+ property hop_size:
+ def __get__(self): return self.thisptr.hop_size()
+ def __set__(self, int i): self.thisptr.hop_size(i)
+
+ def residual_frame(self, np.ndarray[dtype_t, ndim=1] synth,
+ np.ndarray[dtype_t, ndim=1] original):
+ cdef np.ndarray[dtype_t, ndim=1] residual = np.zeros(len(synth))
+ self.thisptr.residual_frame(len(synth), <double*> synth.data,
+ len(original), <double*> original.data,
+ len(residual), <double*> residual.data)
+ return residual
+
+ def find_residual(self, np.ndarray[dtype_t, ndim=1] synth,
+ np.ndarray[dtype_t, ndim=1] original):
+ cdef np.ndarray[dtype_t, ndim=1] residual = np.zeros(len(synth))
+ self.thisptr.find_residual(len(synth), <double*> synth.data,
+ len(original), <double*> original.data,
+ len(residual), <double*> residual.data)
+ return residual
+
+ def synth_frame(self, Frame frame not None):
+ self.thisptr.synth_frame(frame.thisptr)
+ return frame.audio
+
+ def synth(self, frames):
+ cdef vector[c_Frame*] c_frames
+ for frame in frames:
+ c_frames.push_back((<Frame>frame).thisptr)
+ cdef vector[c_Frame*] output_frames = self.thisptr.synth(c_frames)
+ cdef np.ndarray[dtype_t, ndim=1] output = np.zeros(
+ output_frames.size() * self.thisptr.hop_size()
+ )
+ cdef np.npy_intp shape[1]
+ shape[0] = <np.npy_intp> self.thisptr.hop_size()
+ for i in range(output_frames.size()):
+ frame_audio = np.PyArray_SimpleNewFromData(1, shape, np.NPY_DOUBLE, output_frames[i].synth())
+ output[i * self.thisptr.hop_size():(i + 1) * self.thisptr.hop_size()] = frame_audio
+ return output
diff --git a/src/simpl/base.cpp b/src/simpl/base.cpp
index 9c70403..9d5f7ad 100644
--- a/src/simpl/base.cpp
+++ b/src/simpl/base.cpp
@@ -428,3 +428,116 @@ Frames PartialTracking::find_partials(Frames frames) {
_frames = frames;
return _frames;
}
+
+
+// ---------------------------------------------------------------------------
+// Synthesis
+// ---------------------------------------------------------------------------
+Synthesis::Synthesis() {
+ _frame_size = 512;
+ _hop_size = 512;
+ _max_partials = 100;
+ _sampling_rate = 44100;
+}
+
+int Synthesis::frame_size() {
+ return _frame_size;
+}
+
+void Synthesis::frame_size(int new_frame_size) {
+ _frame_size = new_frame_size;
+}
+
+int Synthesis::hop_size() {
+ return _hop_size;
+}
+
+void Synthesis::hop_size(int new_hop_size) {
+ _hop_size = new_hop_size;
+}
+
+int Synthesis::max_partials() {
+ return _max_partials;
+}
+
+void Synthesis::max_partials(int new_max_partials) {
+ _max_partials = new_max_partials;
+}
+
+int Synthesis::sampling_rate() {
+ return _sampling_rate;
+}
+
+void Synthesis::sampling_rate(int new_sampling_rate) {
+ _sampling_rate = new_sampling_rate;
+}
+
+void Synthesis::synth_frame(Frame* frame) {
+}
+
+Frames Synthesis::synth(Frames frames) {
+ for(int i = 0; i < frames.size(); i++) {
+ synth_frame(frames[i]);
+ }
+ return frames;
+}
+
+
+// ---------------------------------------------------------------------------
+// Residual
+// ---------------------------------------------------------------------------
+Residual::Residual() {
+ _frame_size = 512;
+ _hop_size = 512;
+ _sampling_rate = 44100;
+}
+
+int Residual::frame_size() {
+ return _frame_size;
+}
+
+void Residual::frame_size(int new_frame_size) {
+ _frame_size = new_frame_size;
+}
+
+int Residual::hop_size() {
+ return _hop_size;
+}
+
+void Residual::hop_size(int new_hop_size) {
+ _hop_size = new_hop_size;
+}
+
+int Residual::sampling_rate() {
+ return _sampling_rate;
+}
+
+void Residual::sampling_rate(int new_sampling_rate) {
+ _sampling_rate = new_sampling_rate;
+}
+
+void Residual::residual_frame(int synth_size, sample* synth,
+ int original_size, sample* original,
+ int residual_size, sample* residual) {
+}
+
+void Residual::find_residual(int synth_size, sample* synth,
+ int original_size, sample* original,
+ int residual_size, sample* residual) {
+ for(int i = 0; i < synth_size; i += _hop_size) {
+ residual_frame(_hop_size, &synth[i],
+ _hop_size, &original[i],
+ _hop_size, &residual[i]);
+ }
+}
+
+void Residual::synth_frame(Frame* frame) {
+}
+
+// Calculate and return a synthesised residual signal
+Frames Residual::synth(Frames frames) {
+ for(int i = 0; i < frames.size(); i++) {
+ synth_frame(frames[i]);
+ }
+ return frames;
+}
diff --git a/src/simpl/base.h b/src/simpl/base.h
index 385e2a9..bdb0d96 100644
--- a/src/simpl/base.h
+++ b/src/simpl/base.h
@@ -7,7 +7,7 @@
using namespace std;
-namespace simpl
+namespace simpl
{
typedef double sample;
@@ -68,10 +68,10 @@ typedef std::vector<Partial*> Partials;
// ---------------------------------------------------------------------------
// Frame
-//
+//
// Represents a frame of audio information.
-// This can be: - raw audio samples
-// - an unordered list of sinusoidal peaks
+// This can be: - raw audio samples
+// - an unordered list of sinusoidal peaks
// - an ordered list of partials
// - synthesised audio samples
// - residual samples
@@ -129,7 +129,7 @@ typedef std::vector<Frame*> Frames;
// ---------------------------------------------------------------------------
// PeakDetection
-//
+//
// Detect spectral peaks
// ---------------------------------------------------------------------------
@@ -214,6 +214,67 @@ class PartialTracking {
virtual Frames find_partials(Frames frames);
};
+
+// ---------------------------------------------------------------------------
+// Synthesis
+//
+// Synthesise audio from spectral analysis data
+// ---------------------------------------------------------------------------
+
+class Synthesis {
+ private:
+ int _frame_size;
+ int _hop_size;
+ int _max_partials;
+ int _sampling_rate;
+
+ public:
+ Synthesis();
+ int frame_size();
+ void frame_size(int new_frame_size);
+ int hop_size();
+ void hop_size(int new_hop_size);
+ int max_partials();
+ void max_partials(int new_max_partials);
+ int sampling_rate();
+ void sampling_rate(int new_sampling_rate);
+
+ virtual void synth_frame(Frame* frame);
+ virtual Frames synth(Frames frames);
+};
+
+// ---------------------------------------------------------------------------
+// Residual
+//
+// Calculate a residual signal
+// ---------------------------------------------------------------------------
+
+class Residual {
+ private:
+ int _frame_size;
+ int _hop_size;
+ int _sampling_rate;
+
+ public:
+ Residual();
+ int frame_size();
+ void frame_size(int new_frame_size);
+ int hop_size();
+ void hop_size(int new_hop_size);
+ int sampling_rate();
+ void sampling_rate(int new_sampling_rate);
+
+ virtual void residual_frame(int synth_size, sample* synth,
+ int original_size, sample* original,
+ int residual_size, sample* residual);
+ virtual void find_residual(int synth_size, sample* synth,
+ int original_size, sample* original,
+ int residual_size, sample* residual);
+
+ virtual void synth_frame(Frame* frame);
+ virtual Frames synth(Frames frames);
+};
+
} // end of namespace Simpl
#endif
diff --git a/tests/test_base.py b/tests/test_base.py
index 738d530..ce4297e 100644
--- a/tests/test_base.py
+++ b/tests/test_base.py
@@ -4,6 +4,13 @@ import scipy.io.wavfile as wavfile
from nose.tools import assert_almost_equals
import simpl.base as base
+float_precision = 5
+frame_size = 512
+hop_size = 512
+audio_path = os.path.join(
+ os.path.dirname(__file__), 'audio/flute.wav'
+)
+
class TestFrame(object):
def test_buffers(self):
@@ -39,8 +46,10 @@ class TestFrame(object):
f.add_peak(p)
assert f.num_peaks == 1
- assert f.peak(0).amplitude == p.amplitude
- assert f.peaks[0].amplitude == p.amplitude
+ assert_almost_equals(f.peak(0).amplitude, p.amplitude,
+ float_precision)
+ assert_almost_equals(f.peaks[0].amplitude, p.amplitude,
+ float_precision)
f.clear()
assert f.num_peaks == 0
@@ -56,21 +65,16 @@ class TestFrame(object):
p.phase = 0.0
f.partial(0, p)
- assert f.partial(0).amplitude == p.amplitude
- assert f.partial(0).frequency == p.frequency
+ assert_almost_equals(f.partial(0).amplitude, p.amplitude,
+ float_precision)
+ assert_almost_equals(f.partial(0).frequency, p.frequency,
+ float_precision)
class TestPeakDetection(object):
- float_precision = 5
- frame_size = 512
- hop_size = 512
- audio_path = os.path.join(
- os.path.dirname(__file__), 'audio/flute.wav'
- )
-
@classmethod
def setup_class(cls):
- cls.audio = wavfile.read(cls.audio_path)[1]
+ cls.audio = wavfile.read(audio_path)[1]
cls.audio = np.asarray(cls.audio, dtype=np.double)
cls.audio /= np.max(cls.audio)
@@ -78,21 +82,14 @@ class TestPeakDetection(object):
pd = base.PeakDetection()
pd.find_peaks(self.audio)
- assert len(pd.frames) == len(self.audio) / self.hop_size
+ assert len(pd.frames) == len(self.audio) / hop_size
assert len(pd.frames[0].peaks) == 0
class TestPartialTracking(object):
- float_precision = 5
- frame_size = 512
- hop_size = 512
- audio_path = os.path.join(
- os.path.dirname(__file__), 'audio/flute.wav'
- )
-
@classmethod
def setup_class(cls):
- cls.audio = wavfile.read(cls.audio_path)[1]
+ cls.audio = wavfile.read(audio_path)[1]
cls.audio = np.asarray(cls.audio, dtype=np.double)
cls.audio /= np.max(cls.audio)
@@ -103,5 +100,47 @@ class TestPartialTracking(object):
pt = base.PartialTracking()
frames = pt.find_partials(frames)
- assert len(frames) == len(self.audio) / self.hop_size
+ assert len(frames) == len(self.audio) / hop_size
assert len(frames[0].partials) == 100
+
+
+class TestSynthesis(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = wavfile.read(audio_path)[1]
+ cls.audio = np.asarray(cls.audio, dtype=np.double)
+ cls.audio /= np.max(cls.audio)
+
+ def test_synthesis(self):
+ pd = base.PeakDetection()
+ frames = pd.find_peaks(self.audio)
+
+ pt = base.PartialTracking()
+ frames = pt.find_partials(frames)
+
+ s = base.Synthesis()
+ synth_audio = s.synth(frames)
+
+ assert len(synth_audio)
+
+
+class TestResidual(object):
+ @classmethod
+ def setup_class(cls):
+ cls.audio = wavfile.read(audio_path)[1]
+ cls.audio = np.asarray(cls.audio, dtype=np.double)
+ cls.audio /= np.max(cls.audio)
+
+ def test_synthesis(self):
+ pd = base.PeakDetection()
+ frames = pd.find_peaks(self.audio)
+
+ pt = base.PartialTracking()
+ frames = pt.find_partials(frames)
+
+ s = base.Synthesis()
+ synth_audio = s.synth(frames)
+
+ r = base.Residual()
+ residual_audio = r.find_residual(synth_audio, self.audio)
+ assert len(residual_audio)