tomwalters@305
|
1 #!/usr/bin/env python
|
tomwalters@305
|
2 # encoding: utf-8
|
tomwalters@305
|
3 #
|
tomwalters@305
|
4 # AIM-C: A C++ implementation of the Auditory Image Model
|
tomwalters@305
|
5 # http://www.acousticscale.org/AIMC
|
tomwalters@305
|
6 #
|
tomwalters@318
|
7 # Licensed under the Apache License, Version 2.0 (the "License");
|
tomwalters@318
|
8 # you may not use this file except in compliance with the License.
|
tomwalters@318
|
9 # You may obtain a copy of the License at
|
tomwalters@305
|
10 #
|
tomwalters@318
|
11 # http://www.apache.org/licenses/LICENSE-2.0
|
tomwalters@305
|
12 #
|
tomwalters@318
|
13 # Unless required by applicable law or agreed to in writing, software
|
tomwalters@318
|
14 # distributed under the License is distributed on an "AS IS" BASIS,
|
tomwalters@318
|
15 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
tomwalters@318
|
16 # See the License for the specific language governing permissions and
|
tomwalters@318
|
17 # limitations under the License.
|
tomwalters@305
|
18 """
|
tomwalters@305
|
19 Profiles_test.py
|
tomwalters@305
|
20
|
tomwalters@305
|
21 Created by Thomas Walters on 2010-02-22.
|
tomwalters@305
|
22 Copyright 2010 Thomas Walters <tom@acousticscale.org>
|
tomwalters@305
|
23 Test the AIM-C model from filterbank to SSI profiles
|
tomwalters@305
|
24 """
|
tomwalters@305
|
25
|
tomwalters@305
|
26 import aimc
|
tomwalters@305
|
27 from scipy.io import wavfile
|
tomwalters@305
|
28 from scipy import io
|
tomwalters@305
|
29 import scipy
|
tomwalters@305
|
30 import pylab
|
tomwalters@305
|
31 from itertools import izip, chain, repeat
|
tomwalters@305
|
32
|
tomwalters@305
|
def grouper(n, iterable, padvalue=None):
    """Lazily split ``iterable`` into consecutive ``n``-tuples.

    grouper(3, 'abcdefg', 'x') --> ('a','b','c'), ('d','e','f'), ('g','x','x')

    Args:
        n: number of items in each emitted tuple.
        iterable: source of items; it is consumed lazily.
        padvalue: filler used to complete the last tuple when the number of
            items is not a multiple of ``n``.

    Returns:
        An iterator of ``n``-tuples.  An empty ``iterable`` yields nothing.
    """
    from itertools import chain, repeat
    # itertools.izip only exists on Python 2; on Python 3 the built-in zip
    # is already lazy, so fall back to it instead of failing on import.
    try:
        from itertools import izip as lazy_zip
    except ImportError:
        lazy_zip = zip

    # Appending n-1 pad values guarantees the final partial group can be
    # completed, while never producing a group made only of padding.
    padded = chain(iterable, repeat(padvalue, n - 1))
    # The same iterator object repeated n times makes zip pull n consecutive
    # items for every tuple it emits.
    return lazy_zip(*[padded] * n)
|
tomwalters@305
|
36
|
tomwalters@305
|
def BankToArray(out_bank):
    """Copy every sample of a signal bank into a 2-D float array.

    Args:
        out_bank: object exposing ``channel_count()``, ``buffer_length()``
            and ``sample(channel, index)``.  Callers in this file pass the
            result of a module's ``GetOutputBank()``.

    Returns:
        Array of shape ``(channel_count, buffer_length)`` whose element
        ``[ch, i]`` is ``out_bank.sample(ch, i)``.
    """
    # scipy.zeros is only a deprecated re-export of numpy.zeros (deprecated
    # since SciPy 1.4), so call NumPy directly.
    import numpy

    channel_count = out_bank.channel_count()
    out_buffer_length = out_bank.buffer_length()
    out = numpy.zeros((channel_count, out_buffer_length))
    for ch in range(channel_count):
        for i in range(out_buffer_length):
            out[ch, i] = out_bank.sample(ch, i)
    return out
|
tomwalters@305
|
45
|
tomwalters@305
|
def StrobesToList(bank):
    """Collect the strobes of every channel of ``bank`` into nested lists.

    Args:
        bank: object exposing ``channel_count()``, ``strobe_count(channel)``
            and ``strobe(channel, index)``.

    Returns:
        A list with one entry per channel; entry ``ch`` is the list of
        ``bank.strobe(ch, i)`` for ``i`` in ``range(bank.strobe_count(ch))``.
    """
    # The original built this list but never returned it, so callers always
    # received None.
    return [
        [bank.strobe(ch, i) for i in range(bank.strobe_count(ch))]
        for ch in range(bank.channel_count())
    ]
|
tomwalters@305
|
54
|
tomwalters@305
|
def main():
    """Run one wave file through the AIM-C module tree and save the outputs.

    Reads a hard-coded .wav file, feeds it chunk by chunk into a tree of
    aimc modules rooted at a gammatone filterbank, collects the per-chunk
    output banks of the scaler, SSI, slice and Gaussian-feature modules, and
    writes them together with the filterbank centre frequencies to
    "src/Scripts/profile_out.mat".
    """
    # Local import: the file only imports scipy, whose ``scipy.zeros`` alias
    # of numpy.zeros is deprecated (since SciPy 1.4).
    import numpy

    wave_path = "/Users/Tom/Documents/Work/PhD/HTK-AIM/Sounds/"
    file_name = "ii/ii172.5p112.5s100.0t+000itd"
    wave_suffix = ".wav"
    frame_period_ms = 10

    wave_filename = wave_path + file_name + wave_suffix

    (sample_rate, input_wave) = wavfile.read(wave_filename)
    # Number of samples fed to the module tree per Process() call.
    buffer_length = int(frame_period_ms * sample_rate / 1000)

    input_sig = aimc.SignalBank()
    input_sig.Initialize(1, buffer_length, sample_rate)
    parameters = aimc.Parameters()
    parameters.SetFloat("sai.frame_period_ms", 10.0)
    # NOTE(review): 480 equals buffer_length only for a 48 kHz input with a
    # 10 ms frame -- confirm whether this should track buffer_length.
    parameters.SetInt("input.buffersize", 480)

    # The same Parameters object is mutated between constructions, so the
    # order of the Set*/constructor calls below is kept exactly as written.
    mod_gt = aimc.ModuleGammatone(parameters)
    mod_hl = aimc.ModuleHCL(parameters)
    mod_strobes = aimc.ModuleLocalMax(parameters)
    mod_sai = aimc.ModuleSAI(parameters)
    parameters.SetBool("ssi.pitch_cutoff", True)
    parameters.SetBool("ssi.weight_by_cutoff", False)
    parameters.SetBool("ssi.weight_by_scaling", True)
    parameters.SetBool("ssi.log_cycles_axis", True)
    mod_ssi = aimc.ModuleSSI(parameters)

    parameters.SetFloat("nap.lowpass_cutoff", 100.0)
    mod_nap_smooth = aimc.ModuleHCL(parameters)
    mod_scaler = aimc.ModuleScaler(parameters)

    # Four slices restricted to explicit index ranges, then a fifth slice
    # created with "slice.all" enabled.
    parameters.SetBool("slice.all", False)
    slices = []
    for lower_index, upper_index in ((77, 150), (210, 240),
                                     (280, 304), (328, 352)):
        parameters.SetInt("slice.lower_index", lower_index)
        parameters.SetInt("slice.upper_index", upper_index)
        slices.append(aimc.ModuleSlice(parameters))

    parameters.SetBool("slice.all", True)
    slices.append(aimc.ModuleSlice(parameters))

    nap_profile = aimc.ModuleSlice(parameters)

    # One Gaussian-feature module per slice.
    features = [aimc.ModuleGaussians(parameters) for _ in slices]

    # Wire the module tree: the gammatone feeds both the HCL -> strobes ->
    # SAI -> SSI -> slices -> features chain and the smoothed-NAP branch.
    mod_gt.AddTarget(mod_hl)
    mod_gt.AddTarget(mod_nap_smooth)
    mod_nap_smooth.AddTarget(nap_profile)
    nap_profile.AddTarget(mod_scaler)
    mod_hl.AddTarget(mod_strobes)
    mod_strobes.AddTarget(mod_sai)
    mod_sai.AddTarget(mod_ssi)
    for slice_module in slices:
        mod_ssi.AddTarget(slice_module)
    for slice_module, feature_module in zip(slices, features):
        slice_module.AddTarget(feature_module)

    mod_gt.Initialize(input_sig)

    # Scale the samples by the largest positive 16-bit value.
    full_scale = float(pow(2, 15) - 1)
    scaled_wave = [float(sample / full_scale) for sample in input_wave]

    # Fixed-size chunks; the last one is zero-padded.
    wave_chunks = grouper(buffer_length, scaled_wave, 0)

    # BMM, NAP and SAI frames are not collected; the lists stay empty so the
    # corresponding keys still exist in the saved .mat file.  To record
    # them, append BankToArray(<module>.GetOutputBank()) inside the loop.
    out_bmm = []
    out_nap = []
    out_sais = []
    out_smooth_nap_profile = []
    out_ssis = []
    out_slices = [[] for _ in slices]
    out_feats = [[] for _ in features]

    for chunk in wave_chunks:
        for i, sample in enumerate(chunk):
            input_sig.set_sample(0, i, float(sample))
        mod_gt.Process(input_sig)

        out_smooth_nap_profile.append(BankToArray(mod_scaler.GetOutputBank()))
        out_ssis.append(BankToArray(mod_ssi.GetOutputBank()))
        for frames, slice_module in zip(out_slices, slices):
            frames.append(BankToArray(slice_module.GetOutputBank()))
        for frames, feature_module in zip(out_feats, features):
            frames.append(BankToArray(feature_module.GetOutputBank()))

    out_bank = mod_gt.GetOutputBank()
    channel_count = out_bank.channel_count()
    cfs = numpy.array(
        [out_bank.centre_frequency(ch) for ch in range(channel_count)],
        dtype=float)

    outmat = dict(bmm=out_bmm, nap=out_nap, sais=out_sais, ssis=out_ssis)
    for index, frames in enumerate(out_slices, 1):
        outmat["slice%d" % index] = frames
    for index, frames in enumerate(out_feats, 1):
        outmat["feat%d" % index] = frames
    outmat["nap_smooth"] = out_smooth_nap_profile
    outmat["centre_freqs"] = cfs
    io.savemat("src/Scripts/profile_out.mat", outmat, oned_as='column')
|
tomwalters@305
|
209
|
tomwalters@305
|
210
|
tomwalters@305
|
# Run the profile extraction only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()
|