tomwalters@32
|
1 #!/usr/bin/env python
|
tomwalters@32
|
2 # encoding: utf-8
|
tomwalters@32
|
3 #
|
tomwalters@32
|
4 # AIM-C: A C++ implementation of the Auditory Image Model
|
tomwalters@32
|
5 # http://www.acousticscale.org/AIMC
|
tomwalters@32
|
6 #
|
tomwalters@32
|
7 # This program is free software: you can redistribute it and/or modify
|
tomwalters@32
|
8 # it under the terms of the GNU General Public License as published by
|
tomwalters@32
|
9 # the Free Software Foundation, either version 3 of the License, or
|
tomwalters@32
|
10 # (at your option) any later version.
|
tomwalters@32
|
11 #
|
tomwalters@32
|
12 # This program is distributed in the hope that it will be useful,
|
tomwalters@32
|
13 # but WITHOUT ANY WARRANTY; without even the implied warranty of
|
tomwalters@32
|
14 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
tomwalters@32
|
15 # GNU General Public License for more details.
|
tomwalters@32
|
16 #
|
tomwalters@32
|
17 # You should have received a copy of the GNU General Public License
|
tomwalters@32
|
18 # along with this program. If not, see <http://www.gnu.org/licenses/>.
|
tomwalters@32
|
19 """
|
tomwalters@32
|
20 Profiles_test.py
|
tomwalters@32
|
21
|
tomwalters@32
|
22 Created by Thomas Walters on 2010-02-22.
|
tomwalters@32
|
23 Copyright 2010 Thomas Walters <tom@acousticscale.org>
|
tomwalters@32
|
24 Test the AIM-C model from filterbank to SSI profiles
|
tomwalters@32
|
25 """
|
tomwalters@32
|
26
|
tomwalters@32
|
27 import aimc
|
tomwalters@32
|
28 from scipy.io import wavfile
|
tomwalters@32
|
29 from scipy import io
|
tomwalters@32
|
30 import scipy
|
tomwalters@32
|
31 import pylab
|
tomwalters@32
|
32 from itertools import izip, chain, repeat
|
tomwalters@32
|
33
|
tomwalters@32
|
def grouper(n, iterable, padvalue=None):
    """Lazily split *iterable* into consecutive tuples of length *n*.

    The last tuple is filled up with *padvalue* when the input length is not
    a multiple of *n*; an empty input yields nothing.

    grouper(3, 'abcdefg', 'x') --> ('a','b','c'), ('d','e','f'), ('g','x','x')

    Args:
        n: number of items per group.
        iterable: source of items; it is consumed once, lazily.
        padvalue: filler used to complete the final group.

    Returns:
        A lazy iterator of n-tuples.
    """
    # itertools.izip only exists on Python 2; on Python 3 the builtin zip is
    # already lazy, so either one preserves the iterator return type.
    try:
        from itertools import izip as lazy_zip
    except ImportError:
        lazy_zip = zip
    # At most n-1 pad items are ever needed to complete the last group. When
    # the input length is an exact multiple of n the pads cannot fill a whole
    # tuple, so zip stops and no all-padding group is produced.
    padded = chain(iterable, repeat(padvalue, n - 1))
    # The same iterator object is passed n times, so each output tuple pulls
    # n consecutive items from it.
    return lazy_zip(*[padded] * n)
|
tomwalters@32
|
37
|
tomwalters@32
|
def BankToArray(out_bank):
    """Copy every sample of a signal bank into a 2-D float array.

    Args:
        out_bank: object exposing ``channel_count()``, ``buffer_length()``
            and ``sample(channel, index)``.

    Returns:
        An array of shape ``(channel_count, buffer_length)`` in which element
        ``[ch, i]`` holds ``out_bank.sample(ch, i)``.
    """
    # Imported locally: scipy.zeros is only a deprecated re-export of
    # numpy.zeros, so allocate through numpy directly.
    import numpy

    channel_count = out_bank.channel_count()
    out_buffer_length = out_bank.buffer_length()
    out = numpy.zeros((channel_count, out_buffer_length))
    # The bank is read one sample at a time through its accessor.
    for ch in range(channel_count):
        for i in range(out_buffer_length):
            out[ch, i] = out_bank.sample(ch, i)
    return out
|
tomwalters@32
|
46
|
tomwalters@32
|
def StrobesToList(bank):
    """Collect the strobes of every channel of *bank* into nested lists.

    Args:
        bank: object exposing ``channel_count()``, ``strobe_count(channel)``
            and ``strobe(channel, index)``.

    Returns:
        A list with one entry per channel; entry ``ch`` is the list of
        ``bank.strobe(ch, i)`` for ``i`` in ``range(bank.strobe_count(ch))``.
    """
    channel_count = bank.channel_count()
    strobes = []
    for ch in range(channel_count):
        strobes.append([bank.strobe(ch, i)
                        for i in range(bank.strobe_count(ch))])
    # The list was previously built and then dropped, so callers always
    # received None; return it.
    return strobes
|
tomwalters@32
|
55
|
tomwalters@32
|
def main():
    """Run one recording through the AIM-C module chain and save the outputs.

    Reads a hard-coded WAV file, feeds it to the module graph in fixed-size
    frames, converts selected module output banks to arrays after every
    frame, and writes everything to ``src/Scripts/profile_out.mat``.

    Module graph, as wired below:
        gammatone -> HCL -> local-max -> SAI -> SSI -> 5 slices -> gaussians
        gammatone -> HCL (smoothed NAP) -> slice -> scaler
    """
    # Imported locally: scipy.zeros is only a deprecated re-export of
    # numpy.zeros, so allocate through numpy directly.
    import numpy

    wave_path = "/Users/Tom/Documents/Work/PhD/HTK-AIM/Sounds/"
    file_name = "ii/ii172.5p112.5s100.0t+000itd"
    wave_suffix = ".wav"
    frame_period_ms = 10

    wave_filename = wave_path + file_name + wave_suffix

    (sample_rate, input_wave) = wavfile.read(wave_filename)
    # Number of samples in one frame of frame_period_ms milliseconds.
    buffer_length = int(frame_period_ms * sample_rate / 1000)

    input_sig = aimc.SignalBank()
    input_sig.Initialize(1, buffer_length, sample_rate)
    parameters = aimc.Parameters()
    parameters.SetFloat("sai.frame_period_ms", 10.0)
    # NOTE(review): 480 equals buffer_length only for a 48 kHz input with a
    # 10 ms frame -- confirm whether this should follow buffer_length.
    parameters.SetInt("input.buffersize", 480)

    # The single ``parameters`` object is mutated between constructions, so
    # the order of the statements below is significant and must be kept.
    mod_gt = aimc.ModuleGammatone(parameters)
    mod_hl = aimc.ModuleHCL(parameters)
    mod_strobes = aimc.ModuleLocalMax(parameters)
    mod_sai = aimc.ModuleSAI(parameters)
    parameters.SetBool("ssi.pitch_cutoff", True)
    parameters.SetBool("ssi.weight_by_cutoff", False)
    parameters.SetBool("ssi.weight_by_scaling", True)
    parameters.SetBool("ssi.log_cycles_axis", True)
    mod_ssi = aimc.ModuleSSI(parameters)

    parameters.SetFloat("nap.lowpass_cutoff", 100.0)
    mod_nap_smooth = aimc.ModuleHCL(parameters)
    mod_scaler = aimc.ModuleScaler(parameters)

    # Four slices restricted to an index range, then one with "slice.all".
    parameters.SetBool("slice.all", False)
    slices = []
    for lower_index, upper_index in [(77, 150), (210, 240),
                                     (280, 304), (328, 352)]:
        parameters.SetInt("slice.lower_index", lower_index)
        parameters.SetInt("slice.upper_index", upper_index)
        slices.append(aimc.ModuleSlice(parameters))

    parameters.SetBool("slice.all", True)
    slices.append(aimc.ModuleSlice(parameters))

    nap_profile = aimc.ModuleSlice(parameters)

    # One gaussians module per slice.
    features = [aimc.ModuleGaussians(parameters) for _ in slices]

    # Wire the graph (same order of AddTarget calls as before).
    mod_gt.AddTarget(mod_hl)
    mod_gt.AddTarget(mod_nap_smooth)
    mod_nap_smooth.AddTarget(nap_profile)
    nap_profile.AddTarget(mod_scaler)
    mod_hl.AddTarget(mod_strobes)
    mod_strobes.AddTarget(mod_sai)
    mod_sai.AddTarget(mod_ssi)
    for slice_module in slices:
        mod_ssi.AddTarget(slice_module)
    for slice_module, feature_module in zip(slices, features):
        slice_module.AddTarget(feature_module)

    mod_gt.Initialize(input_sig)

    # Scale samples by 2**15 - 1.
    # NOTE(review): presumably the input is 16-bit PCM -- confirm.
    full_scale = float(pow(2, 15) - 1)
    scaled_wave = [float(sample / full_scale) for sample in input_wave]

    # Frames of buffer_length samples; the final frame is zero-padded.
    wave_chunks = grouper(buffer_length, scaled_wave, 0)

    out_smooth_nap_profile = []
    out_ssis = []
    out_slices = [[] for _ in slices]
    out_feats = [[] for _ in features]
    for chunk in wave_chunks:
        for i, sample in enumerate(chunk):
            input_sig.set_sample(0, i, float(sample))
        mod_gt.Process(input_sig)

        out_smooth_nap_profile.append(BankToArray(mod_scaler.GetOutputBank()))
        out_ssis.append(BankToArray(mod_ssi.GetOutputBank()))
        for slice_module, frames in zip(slices, out_slices):
            frames.append(BankToArray(slice_module.GetOutputBank()))
        for feature_module, frames in zip(features, out_feats):
            frames.append(BankToArray(feature_module.GetOutputBank()))

    # Centre frequency of every gammatone output channel.
    out_bank = mod_gt.GetOutputBank()
    channel_count = out_bank.channel_count()
    cfs = numpy.zeros(channel_count)
    for ch in range(channel_count):
        cfs[ch] = out_bank.centre_frequency(ch)

    # bmm, nap and sais are not collected; they are written as empty lists so
    # the .mat file keeps the same set of variable names.
    outmat = dict(bmm=[], nap=[], sais=[],
                  ssis=out_ssis,
                  slice1=out_slices[0], slice2=out_slices[1],
                  slice3=out_slices[2], slice4=out_slices[3],
                  slice5=out_slices[4],
                  feat1=out_feats[0], feat2=out_feats[1],
                  feat3=out_feats[2], feat4=out_feats[3],
                  feat5=out_feats[4],
                  nap_smooth=out_smooth_nap_profile, centre_freqs=cfs)
    io.savemat("src/Scripts/profile_out.mat", outmat, oned_as='column')
|
tomwalters@32
|
210
|
tomwalters@32
|
211
|
tomwalters@32
|
# Run the profile test only when this file is executed as a script.
if "__main__" == __name__:
    main()
|