Chris@34
|
1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
|
Chris@34
|
2
|
Chris@34
|
/*
    Silvet

    A Vamp plugin for note transcription.
    Centre for Digital Music, Queen Mary University of London.

    This program is free software; you can redistribute it and/or
    modify it under the terms of the GNU General Public License as
    published by the Free Software Foundation; either version 2 of the
    License, or (at your option) any later version.  See the file
    COPYING included with this distribution for more information.
*/
|
Chris@34
|
15
|
Chris@34
|
16 #ifndef SILVET_EM_H
|
Chris@34
|
17 #define SILVET_EM_H
|
Chris@34
|
18
|
Chris@34
|
19 #include <vector>
|
Chris@34
|
20
|
Chris@161
|
21 class InstrumentPack;
|
Chris@161
|
22
|
Chris@34
|
23 class EM
|
Chris@34
|
24 {
|
Chris@34
|
25 public:
|
Chris@161
|
26 EM(const InstrumentPack *pack, bool useShifts); // pack must outlive me
|
Chris@34
|
27 ~EM();
|
Chris@34
|
28
|
Chris@183
|
29 void setPitchSparsity(float sparsity) { m_pitchSparsity = sparsity; }
|
Chris@213
|
30 void setSourceSparsity(float sparsity) { m_sourceSparsity = sparsity; }
|
Chris@183
|
31
|
Chris@125
|
32 int getBinCount() const { return m_binCount; }
|
Chris@125
|
33 int getNoteCount() const { return m_noteCount; }
|
Chris@91
|
34 int getSourceCount() const { return m_sourceCount; }
|
Chris@166
|
35 int getShiftCount() const { return m_shiftCount; }
|
Chris@34
|
36
|
Chris@125
|
37 /**
|
Chris@125
|
38 * Carry out one iteration using the given column as input. The
|
Chris@125
|
39 * column must have getBinCount() values.
|
Chris@125
|
40 */
|
Chris@92
|
41 void iterate(const double *column);
|
Chris@91
|
42
|
Chris@125
|
43 /**
|
Chris@125
|
44 * Return the estimated distribution after the current iteration.
|
Chris@125
|
45 * Like the input, this will have getBinCount() values.
|
Chris@125
|
46 */
|
Chris@151
|
47 const float *getEstimate() const {
|
Chris@38
|
48 return m_estimate;
|
Chris@38
|
49 }
|
Chris@125
|
50
|
Chris@125
|
51 /**
|
Chris@125
|
52 * Return the pitch distribution for the current estimate. The
|
Chris@125
|
53 * returned array has getNoteCount() values.
|
Chris@125
|
54 */
|
Chris@151
|
55 const float *getPitchDistribution() const {
|
Chris@38
|
56 return m_pitches;
|
Chris@38
|
57 }
|
Chris@125
|
58
|
Chris@125
|
59 /**
|
Chris@125
|
60 * Return the source distribution for the current estimate. The
|
Chris@125
|
61 * returned pointer refers to getSourceCount() arrays of
|
Chris@125
|
62 * getNoteCount() values.
|
Chris@125
|
63 */
|
Chris@151
|
64 const float *const *getSources() const {
|
Chris@38
|
65 return m_sources;
|
Chris@38
|
66 }
|
Chris@166
|
67
|
Chris@166
|
68 /**
|
Chris@166
|
69 * Return the shift distribution for the current estimate. The
|
Chris@166
|
70 * returned pointer refers to getShiftCount() arrays of
|
Chris@166
|
71 * getNoteCount() values.
|
Chris@166
|
72 */
|
Chris@166
|
73 const float *const *getShifts() const {
|
Chris@166
|
74 return m_shifts;
|
Chris@166
|
75 }
|
Chris@38
|
76
|
Chris@34
|
77 private:
|
Chris@161
|
78 const InstrumentPack *m_pack;
|
Chris@161
|
79
|
Chris@151
|
80 float *m_pitches;
|
Chris@151
|
81 float **m_shifts;
|
Chris@151
|
82 float **m_sources;
|
Chris@55
|
83
|
Chris@151
|
84 float *m_updatePitches;
|
Chris@151
|
85 float **m_updateShifts;
|
Chris@151
|
86 float **m_updateSources;
|
Chris@34
|
87
|
Chris@151
|
88 float *m_estimate;
|
Chris@151
|
89 float *m_q;
|
Chris@55
|
90
|
Chris@83
|
91 const int m_noteCount;
|
Chris@83
|
92 const int m_shiftCount; // 1 + 2 * max template shift
|
Chris@83
|
93 const int m_binCount;
|
Chris@91
|
94 const int m_sourceCount;
|
Chris@55
|
95
|
Chris@183
|
96 float m_pitchSparsity;
|
Chris@183
|
97 float m_shiftSparsity;
|
Chris@183
|
98 float m_sourceSparsity;
|
Chris@36
|
99
|
Chris@151
|
100 void normaliseColumn(float *column, int size);
|
Chris@151
|
101 void normaliseGrid(float **grid, int size1, int size2);
|
Chris@35
|
102
|
Chris@151
|
103 void expectation(const float *column); // size is m_binCount
|
Chris@151
|
104 void maximisation(const float *column); // size is m_binCount
|
Chris@36
|
105
|
Chris@151
|
106 const float *templateFor(int instrument, int note, int shift);
|
Chris@45
|
107 void rangeFor(int instrument, int &minPitch, int &maxPitch);
|
Chris@45
|
108 bool inRange(int instrument, int pitch);
|
Chris@34
|
109 };
|
Chris@34
|
110
|
Chris@34
|
111 #endif
|