#!/usr/bin/env python
# encoding: utf-8
#
# AIM-C: A C++ implementation of the Auditory Image Model
# http://www.acousticscale.org/AIMC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Profiles_test.py

Created by Thomas Walters on 2010-02-22.
Copyright 2010 Thomas Walters
Test the AIM-C model from filterbank to SSI profiles
"""

from itertools import chain, repeat

try:
    from itertools import izip
except ImportError:
    # Python 3 has no itertools.izip; the built-in zip is already lazy.
    izip = zip

import numpy
import pylab
import scipy
from scipy import io
from scipy.io import wavfile

import aimc


def grouper(n, iterable, padvalue=None):
    """Yield successive n-tuples from iterable, padding the last one.

    grouper(3, 'abcdefg', 'x') --> ('a','b','c'), ('d','e','f'), ('g','x','x')

    At most n-1 pad values are appended, so an input whose length is an
    exact multiple of n does not produce an extra tuple made only of padding.
    """
    # The same iterator object is repeated n times, so each output tuple
    # pulls n consecutive items from it.
    return izip(*[chain(iterable, repeat(padvalue, n - 1))] * n)


def BankToArray(out_bank):
    """Copy every sample of out_bank into a new 2-D array.

    out_bank must provide channel_count(), buffer_length() and
    sample(channel, index).  The returned array has shape
    (channel_count, buffer_length).
    """
    channel_count = out_bank.channel_count()
    out_buffer_length = out_bank.buffer_length()
    out = numpy.zeros((channel_count, out_buffer_length))
    for ch in range(channel_count):
        for i in range(out_buffer_length):
            out[ch, i] = out_bank.sample(ch, i)
    return out


def StrobesToList(bank):
    """Return the strobes of bank as one list per channel.

    bank must provide channel_count(), strobe_count(channel) and
    strobe(channel, index).  Element ch of the result holds the values
    strobe(ch, 0) .. strobe(ch, strobe_count(ch) - 1).
    """
    strobes = []
    for ch in range(bank.channel_count()):
        strobes.append(
            [bank.strobe(ch, i) for i in range(bank.strobe_count(ch))])
    # The list was previously built and then dropped, so callers got None.
    return strobes


def main():
    """Run one wave file through the AIM-C module chain and save the results.

    Reads a hard-coded wave file, feeds it frame by frame into the module
    tree rooted at the gammatone module, collects the output banks of
    selected modules after every frame and writes them, together with the
    gammatone centre frequencies, to src/Scripts/profile_out.mat.
    """
    wave_path = "/Users/Tom/Documents/Work/PhD/HTK-AIM/Sounds/"
    #features_path = "/Users/Tom/Documents/Work/PhD/HTK-AIM/work08-jess-original-rec_rubber/features/"

    file_name = "ii/ii172.5p112.5s100.0t+000itd"

    wave_suffix = ".wav"
    features_suffix = ".mat"

    frame_period_ms = 10

    wave_filename = wave_path + file_name + wave_suffix
    #features_filename = features_path + file_name + features_suffix

    (sample_rate, input_wave) = wavfile.read(wave_filename)
    # Number of samples in one frame of frame_period_ms milliseconds.
    buffer_length = int(frame_period_ms * sample_rate / 1000)

    #pylab.plot(input_wave)
    #pylab.show()

    input_sig = aimc.SignalBank()
    input_sig.Initialize(1, buffer_length, sample_rate)

    # A single Parameters object is shared and mutated between module
    # constructions below; presumably each module reads its settings when it
    # is constructed, so the order of these statements is kept as-is.
    parameters = aimc.Parameters()
    parameters.SetFloat("sai.frame_period_ms", 10.0)
    # NOTE(review): 480 is hard-coded and independent of buffer_length
    # computed above -- confirm the two are meant to agree.
    parameters.SetInt("input.buffersize", 480)

    mod_gt = aimc.ModuleGammatone(parameters)
    mod_hl = aimc.ModuleHCL(parameters)
    mod_strobes = aimc.ModuleLocalMax(parameters)
    mod_sai = aimc.ModuleSAI(parameters)
    parameters.SetBool("ssi.pitch_cutoff", True)
    parameters.SetBool("ssi.weight_by_cutoff", False)
    parameters.SetBool("ssi.weight_by_scaling", True)
    parameters.SetBool("ssi.log_cycles_axis", True)
    mod_ssi = aimc.ModuleSSI(parameters)

    # Second HCL module, constructed after the lowpass cutoff is set.
    parameters.SetFloat("nap.lowpass_cutoff", 100.0)
    mod_nap_smooth = aimc.ModuleHCL(parameters)
    mod_scaler = aimc.ModuleScaler(parameters)

    # Four slice modules restricted to index ranges, then one over everything.
    parameters.SetBool("slice.all", False)
    parameters.SetInt("slice.lower_index", 77)
    parameters.SetInt("slice.upper_index", 150)
    slice_1 = aimc.ModuleSlice(parameters)

    parameters.SetInt("slice.lower_index", 210)
    parameters.SetInt("slice.upper_index", 240)
    slice_2 = aimc.ModuleSlice(parameters)

    parameters.SetInt("slice.lower_index", 280)
    parameters.SetInt("slice.upper_index", 304)
    slice_3 = aimc.ModuleSlice(parameters)

    parameters.SetInt("slice.lower_index", 328)
    parameters.SetInt("slice.upper_index", 352)
    slice_4 = aimc.ModuleSlice(parameters)

    parameters.SetBool("slice.all", True)
    slice_5 = aimc.ModuleSlice(parameters)

    nap_profile = aimc.ModuleSlice(parameters)

    features_1 = aimc.ModuleGaussians(parameters)
    features_2 = aimc.ModuleGaussians(parameters)
    features_3 = aimc.ModuleGaussians(parameters)
    features_4 = aimc.ModuleGaussians(parameters)
    features_5 = aimc.ModuleGaussians(parameters)

    # Wire up the module tree.  The gammatone module feeds two branches:
    #   gt -> nap_smooth -> nap_profile -> scaler
    #   gt -> hl -> strobes -> sai -> ssi -> slice_N -> features_N
    mod_gt.AddTarget(mod_hl)
    mod_gt.AddTarget(mod_nap_smooth)
    mod_nap_smooth.AddTarget(nap_profile)
    nap_profile.AddTarget(mod_scaler)
    mod_hl.AddTarget(mod_strobes)
    mod_strobes.AddTarget(mod_sai)
    mod_sai.AddTarget(mod_ssi)
    mod_ssi.AddTarget(slice_1)
    mod_ssi.AddTarget(slice_2)
    mod_ssi.AddTarget(slice_3)
    mod_ssi.AddTarget(slice_4)
    mod_ssi.AddTarget(slice_5)

    slice_1.AddTarget(features_1)
    slice_2.AddTarget(features_2)
    slice_3.AddTarget(features_3)
    slice_4.AddTarget(features_4)
    slice_5.AddTarget(features_5)

    mod_gt.Initialize(input_sig)

    # Scale by 2**15 - 1; presumably the wave file holds 16-bit PCM
    # samples -- TODO confirm.
    full_scale = float(pow(2, 15) - 1)
    scaled_wave = [float(sample / full_scale) for sample in input_wave]

    # Frames of buffer_length samples; the last frame is zero-padded.
    wave_chunks = grouper(buffer_length, scaled_wave, 0)

    # out_bmm, out_nap, out_strobes and out_sais stay empty while the
    # corresponding append lines in the loop are commented out.
    out_bmm = []
    out_nap = []
    out_smooth_nap_profile = []
    out_strobes = []
    out_sais = []
    out_ssis = []
    out_slice_1 = []
    out_slice_2 = []
    out_slice_3 = []
    out_slice_4 = []
    out_slice_5 = []
    out_feat_1 = []
    out_feat_2 = []
    out_feat_3 = []
    out_feat_4 = []
    out_feat_5 = []
    for chunk in wave_chunks:
        for i, sample in enumerate(chunk):
            input_sig.set_sample(0, i, float(sample))
        mod_gt.Process(input_sig)

        #out_bmm.append(BankToArray(mod_gt.GetOutputBank()))
        #out_nap.append(BankToArray(mod_hl.GetOutputBank()))
        out_smooth_nap_profile.append(BankToArray(mod_scaler.GetOutputBank()))
        #out_strobes.append(BankToArray(mod_strobes.GetOutputBank()))
        #out_sais.append(BankToArray(mod_sai.GetOutputBank()))
        out_ssis.append(BankToArray(mod_ssi.GetOutputBank()))
        out_slice_1.append(BankToArray(slice_1.GetOutputBank()))
        out_slice_2.append(BankToArray(slice_2.GetOutputBank()))
        out_slice_3.append(BankToArray(slice_3.GetOutputBank()))
        out_slice_4.append(BankToArray(slice_4.GetOutputBank()))
        out_slice_5.append(BankToArray(slice_5.GetOutputBank()))
        out_feat_1.append(BankToArray(features_1.GetOutputBank()))
        out_feat_2.append(BankToArray(features_2.GetOutputBank()))
        out_feat_3.append(BankToArray(features_3.GetOutputBank()))
        out_feat_4.append(BankToArray(features_4.GetOutputBank()))
        out_feat_5.append(BankToArray(features_5.GetOutputBank()))

    # Centre frequency of every gammatone output channel.
    out_bank = mod_gt.GetOutputBank()
    channel_count = out_bank.channel_count()
    cfs = numpy.zeros(channel_count)
    for ch in range(channel_count):
        cfs[ch] = out_bank.centre_frequency(ch)

    outmat = dict(bmm=out_bmm, nap=out_nap, sais=out_sais,
                  ssis=out_ssis, slice1=out_slice_1, slice2=out_slice_2,
                  slice3=out_slice_3, slice4=out_slice_4, slice5=out_slice_5,
                  feat1=out_feat_1, feat2=out_feat_2, feat3=out_feat_3,
                  feat4=out_feat_4, feat5=out_feat_5,
                  nap_smooth=out_smooth_nap_profile, centre_freqs=cfs)
    io.savemat("src/Scripts/profile_out.mat", outmat, oned_as='column')


if __name__ == '__main__':
    main()