tomwalters@305: #!/usr/bin/env python
tomwalters@305: # encoding: utf-8
tomwalters@305: #
tomwalters@305: # AIM-C: A C++ implementation of the Auditory Image Model
tomwalters@305: # http://www.acousticscale.org/AIMC
tomwalters@305: #
tomwalters@305: # This program is free software: you can redistribute it and/or modify
tomwalters@305: # it under the terms of the GNU General Public License as published by
tomwalters@305: # the Free Software Foundation, either version 3 of the License, or
tomwalters@305: # (at your option) any later version.
tomwalters@305: #
tomwalters@305: # This program is distributed in the hope that it will be useful,
tomwalters@305: # but WITHOUT ANY WARRANTY; without even the implied warranty of
tomwalters@305: # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
tomwalters@305: # GNU General Public License for more details.
tomwalters@305: #
tomwalters@305: # You should have received a copy of the GNU General Public License
tomwalters@305: # along with this program. If not, see <http://www.gnu.org/licenses/>.
tomwalters@305: """
tomwalters@305: Profiles_test.py
tomwalters@305:
tomwalters@305: Created by Thomas Walters on 2010-02-22.
tomwalters@305: Copyright 2010 Thomas Walters
tomwalters@305: Test the AIM-C model from filterbank to SSI profiles
tomwalters@305: """
tomwalters@305:
from itertools import chain, islice, repeat
try:
    from itertools import izip
except ImportError:  # Python 3 has no izip; the built-in zip is already lazy.
    izip = zip

import numpy
import pylab
import scipy
from scipy import io
from scipy.io import wavfile

import aimc
tomwalters@305:
def grouper(n, iterable, padvalue=None):
    """Yield successive n-item tuples from iterable, padding the last one.

    grouper(3, 'abcdefg', 'x') --> ('a','b','c'), ('d','e','f'), ('g','x','x')

    Implemented as a generator on top of chain/repeat/islice so that it does
    not depend on itertools.izip, which only exists in Python 2.

    Args:
      n: number of items per group; values below 1 produce no groups.
      iterable: source of items; it is consumed lazily, one group at a time.
      padvalue: filler used to complete a final, partially filled group.

    Yields:
      Tuples of exactly n items, in input order.
    """
    if n < 1:
        return
    # n - 1 pad items are enough to complete a partial final group, and too
    # few to ever form a group that consists of padding only.
    padded = chain(iterable, repeat(padvalue, n - 1))
    while True:
        group = tuple(islice(padded, n))
        if len(group) < n:
            # Only left-over padding (or nothing) remains: stop here.
            return
        yield group
tomwalters@305:
def BankToArray(out_bank):
    """Copy every sample of a signal bank into a 2-D array.

    Args:
      out_bank: object providing channel_count(), buffer_length() and
        sample(channel, index), e.g. what a module's GetOutputBank() returns.

    Returns:
      A float array of shape (channel_count, buffer_length) whose element
      [ch, i] is out_bank.sample(ch, i).
    """
    channel_count = out_bank.channel_count()
    out_buffer_length = out_bank.buffer_length()
    # numpy.zeros is used directly: scipy.zeros was only a deprecated
    # re-export of the same NumPy function.
    out = numpy.zeros((channel_count, out_buffer_length))
    for ch in range(channel_count):
        for i in range(out_buffer_length):
            out[ch, i] = out_bank.sample(ch, i)
    return out
tomwalters@305:
def StrobesToList(bank):
    """Collect the strobes of every channel of a bank into nested lists.

    Args:
      bank: object providing channel_count(), strobe_count(channel) and
        strobe(channel, index).

    Returns:
      A list with one entry per channel; entry ch is the list
      [bank.strobe(ch, 0), ..., bank.strobe(ch, strobe_count(ch) - 1)].
      (The list used to be built and then dropped, so callers got None.)
    """
    return [[bank.strobe(ch, i) for i in range(bank.strobe_count(ch))]
            for ch in range(bank.channel_count())]
tomwalters@305:
def main():
    """Run one wave file through an AIM-C module chain and save the outputs.

    The hard-coded .wav file is read, scaled by 1 / (2**15 - 1) and fed to
    the chain in frames of frame_period_ms milliseconds. Two branches hang
    off the ModuleGammatone instance:

      * ModuleHCL -> ModuleLocalMax -> ModuleSAI -> ModuleSSI, whose output
        goes to five ModuleSlice instances, each followed by a
        ModuleGaussians instance;
      * a second ModuleHCL (created after "nap.lowpass_cutoff" is set)
        -> ModuleSlice -> ModuleScaler.

    After every frame the output banks of the scaler, the SSI module, the
    five slices and the five feature modules are converted with BankToArray
    and accumulated. Everything is finally written, together with the
    centre frequencies reported by the gammatone output bank, to
    "src/Scripts/profile_out.mat".
    """
    wave_path = "/Users/Tom/Documents/Work/PhD/HTK-AIM/Sounds/"
    file_name = "ii/ii172.5p112.5s100.0t+000itd"
    wave_suffix = ".wav"
    frame_period_ms = 10

    wave_filename = wave_path + file_name + wave_suffix

    (sample_rate, input_wave) = wavfile.read(wave_filename)
    buffer_length = int(frame_period_ms * sample_rate / 1000)

    input_sig = aimc.SignalBank()
    input_sig.Initialize(1, buffer_length, sample_rate)
    parameters = aimc.Parameters()
    parameters.SetFloat("sai.frame_period_ms", 10.0)
    # NOTE(review): 480 is hard-coded while buffer_length is derived from the
    # file's sample rate -- confirm the two are meant to agree.
    parameters.SetInt("input.buffersize", 480)

    # The same Parameters object is handed to every module, so each Set*
    # call below is placed before the construction of the module it targets.
    mod_gt = aimc.ModuleGammatone(parameters)
    mod_hl = aimc.ModuleHCL(parameters)
    mod_strobes = aimc.ModuleLocalMax(parameters)
    mod_sai = aimc.ModuleSAI(parameters)
    parameters.SetBool("ssi.pitch_cutoff", True)
    parameters.SetBool("ssi.weight_by_cutoff", False)
    parameters.SetBool("ssi.weight_by_scaling", True)
    parameters.SetBool("ssi.log_cycles_axis", True)
    mod_ssi = aimc.ModuleSSI(parameters)

    parameters.SetFloat("nap.lowpass_cutoff", 100.0)
    mod_nap_smooth = aimc.ModuleHCL(parameters)
    mod_scaler = aimc.ModuleScaler(parameters)

    # Slices 1-4 use explicit index ranges; slice 5 is built with
    # "slice.all" switched on.
    parameters.SetBool("slice.all", False)
    slices = []
    for lower, upper in ((77, 150), (210, 240), (280, 304), (328, 352)):
        parameters.SetInt("slice.lower_index", lower)
        parameters.SetInt("slice.upper_index", upper)
        slices.append(aimc.ModuleSlice(parameters))
    parameters.SetBool("slice.all", True)
    slices.append(aimc.ModuleSlice(parameters))

    nap_profile = aimc.ModuleSlice(parameters)

    # One ModuleGaussians per slice.
    features = [aimc.ModuleGaussians(parameters) for _ in slices]

    # Wire the module graph.
    mod_gt.AddTarget(mod_hl)
    mod_gt.AddTarget(mod_nap_smooth)
    mod_nap_smooth.AddTarget(nap_profile)
    nap_profile.AddTarget(mod_scaler)
    mod_hl.AddTarget(mod_strobes)
    mod_strobes.AddTarget(mod_sai)
    mod_sai.AddTarget(mod_ssi)
    for slice_module in slices:
        mod_ssi.AddTarget(slice_module)
    for slice_module, feature_module in zip(slices, features):
        slice_module.AddTarget(feature_module)

    mod_gt.Initialize(input_sig)

    # Scale the samples by 1 / (2**15 - 1).
    full_scale = float(pow(2, 15) - 1)
    scaled_wave = [float(sample / full_scale) for sample in input_wave]

    out_smooth_nap_profile = []
    out_ssis = []
    out_slices = [[] for _ in slices]
    out_feats = [[] for _ in features]
    # grouper pads the final, partially filled frame with zeros.
    for chunk in grouper(buffer_length, scaled_wave, 0):
        for i, sample in enumerate(chunk):
            input_sig.set_sample(0, i, float(sample))
        mod_gt.Process(input_sig)

        out_smooth_nap_profile.append(BankToArray(mod_scaler.GetOutputBank()))
        out_ssis.append(BankToArray(mod_ssi.GetOutputBank()))
        for frames, slice_module in zip(out_slices, slices):
            frames.append(BankToArray(slice_module.GetOutputBank()))
        for frames, feature_module in zip(out_feats, features):
            frames.append(BankToArray(feature_module.GetOutputBank()))

    out_bank = mod_gt.GetOutputBank()
    cfs = numpy.array([out_bank.centre_frequency(ch)
                       for ch in range(out_bank.channel_count())],
                      dtype=float)

    # "bmm", "nap" and "sais" are not collected and are saved as empty
    # lists. To record them, append
    # BankToArray(<module>.GetOutputBank()) for mod_gt, mod_hl or mod_sai
    # inside the frame loop above.
    outmat = dict(bmm=[], nap=[], sais=[], ssis=out_ssis,
                  nap_smooth=out_smooth_nap_profile, centre_freqs=cfs)
    # Adds the keys slice1..slice5 and feat1..feat5.
    for index, (slice_frames, feat_frames) in enumerate(
            zip(out_slices, out_feats), 1):
        outmat["slice%d" % index] = slice_frames
        outmat["feat%d" % index] = feat_frames
    io.savemat("src/Scripts/profile_out.mat", outmat, oned_as='column')
tomwalters@305:
tomwalters@305:
# Script entry point: run the profile extraction only when this file is
# executed directly, not when it is imported.
if __name__ == "__main__":
    main()