Mercurial > hg > aimc
changeset 314:f8aa25bd6085
-New experimental system with pre-noised signals.
author | tomwalters |
---|---|
date | Thu, 04 Mar 2010 11:01:39 +0000 |
parents | 1705e25d5a59 |
children | 90488d48b267 |
files | trunk/SConstruct trunk/scripts/gen_features.sh trunk/src/Main/AIMCopy_SSI_Features_v3.cc |
diffstat | 3 files changed, 314 insertions(+), 4 deletions(-) [+] |
line wrap: on
line diff
--- a/trunk/SConstruct Mon Mar 01 19:22:15 2010 +0000 +++ b/trunk/SConstruct Thu Mar 04 11:01:39 2010 +0000 @@ -51,7 +51,7 @@ 'Modules/Output/FileOutputHTK.cc'] # File which contains main() -sources = common_sources + ['Main/AIMCopy_SSI_Features_v2.cc'] +sources = common_sources + ['Main/AIMCopy_SSI_Features_v3.cc'] # Test sources test_sources = ['Modules/Profile/ModuleSlice_unittest.cc']
--- a/trunk/scripts/gen_features.sh Mon Mar 01 19:22:15 2010 +0000 +++ b/trunk/scripts/gen_features.sh Thu Mar 04 11:01:39 2010 +0000 @@ -7,12 +7,13 @@ # Source directory for all the sound files #SOUND_SOURCE="/Users/Tom/Documents/Work/PhD/HTk-AIM/Sounds/" -SOUND_SOURCE="/media/sounds-database/cnbh-sounds/" +#SOUND_SOURCE="/media/sounds-database/cnbh-sounds/" +SOUND_SOURCE="/mnt/sounds/snr_+0dB/" # Location of the AIMCopy binary if not in the path AIMCOPY_PREFIX="../aimc-read-only/build/posix-release/" -MACHINE_CORES=1 +MACHINE_CORES=8 # Names of various internal files and directories. # Rename here if you don't like them for some reason. @@ -163,7 +164,6 @@ input.buffersize=480 sai.frame_period_ms=10.0 slice.normalize=true -ssi.pitch_cutoff=true ssi.weight_by_cutoff=false ssi.weight_by_scaling=true ssi.log_cycles_axis=true
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/trunk/src/Main/AIMCopy_SSI_Features_v3.cc Thu Mar 04 11:01:39 2010 +0000 @@ -0,0 +1,310 @@ +// Copyright 2008-2010, Thomas Walters +// +// AIM-C: A C++ implementation of the Auditory Image Model +// http://www.acousticscale.org/AIMC +// +// This program is free software: you can redistribute it and/or modify +// it under the terms of the GNU General Public License as published by +// the Free Software Foundation, either version 3 of the License, or +// (at your option) any later version. +// +// This program is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// GNU General Public License for more details. +// +// You should have received a copy of the GNU General Public License +// along with this program. If not, see <http://www.gnu.org/licenses/>. + +/*! + * \file AIMCopy.cpp + * \brief AIM-C replacement for HTK's HCopy + * + * The following subset of the command-line flags + * should be implemented from HCopy: + * -A Print command line arguments off + * -C cf Set config file to cf default + * (should be able to take multiple config files) + * -S f Set script file to f none + * //! \todo -T N Set trace flags to N 0 + * -V Print version information off + * -D of Write configuration data to of none + * + * \author Thomas Walters <tom@acousticscale.org> + * \date created 2008/05/08 + * \version \$Id$ + */ + +#include <fstream> +#include <iostream> +#include <string> +#include <utility> +#include <vector> + +#include <stdlib.h> +#include <time.h> + +#include "Modules/Input/ModuleFileInput.h" +#include "Modules/BMM/ModuleGammatone.h" +#include "Modules/BMM/ModulePZFC.h" +#include "Modules/NAP/ModuleHCL.h" +#include "Modules/Strobes/ModuleParabola.h" +#include "Modules/Strobes/ModuleLocalMax.h" +#include "Modules/SAI/ModuleSAI.h" +#include "Modules/SSI/ModuleSSI.h" +#include "Modules/SNR/ModuleNoise.h" +#include "Modules/Profile/ModuleSlice.h" +#include "Modules/Profile/ModuleScaler.h" +#include "Modules/Features/ModuleGaussians.h" +#include "Modules/Output/FileOutputHTK.h" +#include "Support/Common.h" +#include "Support/FileList.h" +#include "Support/Parameters.h" + +using std::ofstream; +using std::pair; +using std::vector; +using std::string; +int main(int argc, char* argv[]) { + string sound_file; + string data_file; + string config_file; + string script_file; + bool write_data = false; + bool print_version = false; + + string version_string( + " AIM-C AIMCopy\n" + " (c) 2006-2010, Thomas Walters and Willem van Engen\n" + " http://www.acoustiscale.org/AIMC/\n" + "\n"); + + if (argc < 2) { + printf("%s", version_string.c_str()); + printf("AIMCopy is intended as a drop-in replacement for HTK's HCopy\n"); + printf("command. It is used for making features from audio files for\n"); + printf("use with HTK.\n"); + printf("Usage: \n"); + printf(" -A Print command line arguments off\n"); + printf(" -C cf Set config file to cf none\n"); + printf(" -S f Set script file to f none\n"); + printf(" -V Print version information off\n"); + printf(" -D g Write configuration data to g none\n"); + return -1; + } + + // Parse command-line arguments + for (int i = 1; i < argc; i++) { + if (strcmp(argv[i],"-A") == 0) { + for (int j = 0; j < argc; j++) + printf("%s ",argv[j]); + printf("\n"); + fflush(stdout); + continue; + } + if (strcmp(argv[i],"-C") == 0) { + if (++i >= argc) { + aimc::LOG_ERROR(_T("Configuration file name expected after -C")); + return(-1); + } + config_file = argv[i]; + continue; + } + if (strcmp(argv[i],"-S") == 0) { + if (++i >= argc) { + aimc::LOG_ERROR(_T("Script file name expected after -S")); + return(-1); + } + script_file = argv[i]; + continue; + } + if (strcmp(argv[i],"-D") == 0) { + if (++i >= argc) { + aimc::LOG_ERROR(_T("Data file name expected after -D")); + return(-1); + } + data_file = argv[i]; + write_data = true; + continue; + } + if (strcmp(argv[i],"-V") == 0) { + print_version = true; + continue; + } + aimc::LOG_ERROR(_T("Unrecognized command-line argument: %s"), argv[i]); + } + + if (print_version) + printf("%s", version_string.c_str()); + + aimc::Parameters params; + + if (!params.Load(config_file.c_str())) { + aimc::LOG_ERROR(_T("Couldn't load parameters from file %s"), + config_file.c_str()); + return -1; + } + + vector<pair<string, string> > file_list = aimc::FileList::Load(script_file); + if (file_list.size() == 0) { + aimc::LOG_ERROR("No data read from file %s", script_file.c_str()); + return -1; + } + + // Set up AIM-C processor here + aimc::ModuleFileInput input(¶ms); + //aimc::ModuleNoise noise_maker(¶ms); + aimc::ModuleGammatone bmm(¶ms); + aimc::ModuleHCL nap(¶ms); + aimc::ModuleLocalMax strobes(¶ms); + aimc::ModuleSAI sai(¶ms); + params.SetBool("ssi.pitch_cutoff", false); + aimc::ModuleSSI ssi_no_cutoff(¶ms); + + params.SetBool("ssi.pitch_cutoff", true); + params.SetFloat("ssi.pitch_search_start_ms", 4.6f); + aimc::ModuleSSI ssi_cutoff(¶ms); + + params.SetBool("slice.all", false); + params.SetInt("slice.lower_index", 77); + params.SetInt("slice.upper_index", 150); + aimc::ModuleSlice slice_ssi_slice_1_no_cutoff(¶ms); + aimc::ModuleSlice slice_ssi_slice_1_cutoff(¶ms); + + params.SetBool("slice.all", true); + aimc::ModuleSlice slice_ssi_all_no_cutoff(¶ms); + aimc::ModuleSlice slice_ssi_all_cutoff(¶ms); + + params.SetFloat("nap.lowpass_cutoff", 100.0); + aimc::ModuleHCL smooth_nap(¶ms); + params.SetBool("slice.all", true); + aimc::ModuleSlice nap_profile(¶ms); + aimc::ModuleScaler nap_scaler(¶ms); + + aimc::ModuleGaussians nap_features(¶ms); + aimc::ModuleGaussians features_ssi_slice1_no_cutoff(¶ms); + aimc::ModuleGaussians features_ssi_slice1_cutoff(¶ms); + aimc::ModuleGaussians features_ssi_all_no_cutoff(¶ms); + aimc::ModuleGaussians features_ssi_all_cutoff(¶ms); + + aimc::FileOutputHTK nap_out(¶ms); + aimc::FileOutputHTK output_ssi_slice1_no_cutoff(¶ms); + aimc::FileOutputHTK output_ssi_slice1_cutoff(¶ms); + aimc::FileOutputHTK output_ssi_all_no_cutoff(¶ms); + aimc::FileOutputHTK output_ssi_all_cutoff(¶ms); + + input.AddTarget(&bmm); + //noise_maker.AddTarget(&bmm); + bmm.AddTarget(&nap); + bmm.AddTarget(&smooth_nap); + smooth_nap.AddTarget(&nap_profile); + nap_profile.AddTarget(&nap_scaler); + nap_scaler.AddTarget(&nap_features); + nap_features.AddTarget(&nap_out); + + nap.AddTarget(&strobes); + strobes.AddTarget(&sai); + sai.AddTarget(&ssi_no_cutoff); + sai.AddTarget(&ssi_cutoff); + + ssi_no_cutoff.AddTarget(&output_ssi_slice1_no_cutoff); + ssi_no_cutoff.AddTarget(&output_ssi_all_no_cutoff); + ssi_cutoff.AddTarget(&output_ssi_slice1_cutoff); + ssi_cutoff.AddTarget(&output_ssi_all_cutoff); + + slice_ssi_slice_1_no_cutoff.AddTarget(&features_ssi_slice1_no_cutoff); + slice_ssi_all_no_cutoff.AddTarget(&features_ssi_all_no_cutoff); + slice_ssi_slice_1_cutoff.AddTarget(&features_ssi_slice1_cutoff); + slice_ssi_all_cutoff.AddTarget(&features_ssi_all_cutoff); + + + features_ssi_slice1_no_cutoff.AddTarget(&output_ssi_slice1_no_cutoff); + features_ssi_all_no_cutoff.AddTarget(&output_ssi_all_no_cutoff); + features_ssi_slice1_cutoff.AddTarget(&output_ssi_slice1_cutoff); + features_ssi_all_cutoff.AddTarget(&output_ssi_all_cutoff); + + + if (write_data) { + ofstream outfile(data_file.c_str()); + if (outfile.fail()) { + aimc::LOG_ERROR("Couldn't open data file %s for writing", + data_file.c_str()); + return -1; + } + time_t rawtime; + struct tm * timeinfo; + time(&rawtime); + timeinfo = localtime(&rawtime); + + + outfile << "# AIM-C AIMCopy\n"; + outfile << "# Run on: " << asctime(timeinfo); + char * descr = getenv("USER"); + if (descr) { + outfile << "# By user: " << descr <<"\n"; + } + outfile << "#Module chain: "; + outfile << "#input"; + outfile << "# noise_maker"; + outfile << "# gt"; + outfile << "# nap"; + outfile << "# slice"; + outfile << "# scaler"; + outfile << "# features"; + outfile << "# output"; + outfile << "# local_max"; + outfile << "# sai_weighted"; + outfile << "# ssi"; + outfile << "# slice"; + outfile << "# features"; + outfile << "# output"; + outfile << "# slice"; + outfile << "# features"; + outfile << "# output"; + outfile << "# slice"; + outfile << "# features"; + outfile << "# output"; + outfile << "# slice"; + outfile << "# features"; + outfile << "# output"; + outfile << "# slice"; + outfile << "# features"; + outfile << "# output"; + outfile << "# "; + outfile << "# Module versions:\n"; + outfile << "# " << input.id() << " : " << input.version() << "\n"; + outfile << "# " << bmm.id() << " : " << bmm.version() << "\n"; + outfile << "# " << nap.id() << " : " << nap.version() << "\n"; + outfile << "# " << strobes.id() << " : " << strobes.version() << "\n"; + outfile << "# " << sai.id() << " : " << sai.version() << "\n"; + outfile << "#\n"; + outfile << "# Parameters:\n"; + outfile << params.WriteString(); + outfile.close(); + } + + for (unsigned int i = 0; i < file_list.size(); ++i) { + // aimc::LOG_INFO(_T("In: %s"), file_list[i].first.c_str()); + aimc::LOG_INFO(_T("Out: %s"), file_list[i].second.c_str()); + + string filename = file_list[i].second + ".slice_1_no_cutoff"; + output_ssi_slice1_no_cutoff.OpenFile(filename.c_str(), 10.0f); + filename = file_list[i].second + ".ssi_profile_no_cutoff"; + output_ssi_all_no_cutoff.OpenFile(filename.c_str(), 10.0f); + filename = file_list[i].second + ".slice_1_cutoff"; + output_ssi_slice1_cutoff.OpenFile(filename.c_str(), 10.0f); + filename = file_list[i].second + ".ssi_profile_cutoff"; + output_ssi_all_cutoff.OpenFile(filename.c_str(), 10.0f); + filename = file_list[i].second + ".smooth_nap_profile"; + nap_out.OpenFile(filename.c_str(), 10.0f); + + if (input.LoadFile(file_list[i].first.c_str())) { + input.Process(); + } else { + printf("LoadFile failed for file %s\n", file_list[i].first.c_str()); + } + input.Reset(); + } + + return 0; +}