tomwalters@32: // Copyright 2008-2010, Thomas Walters tomwalters@32: // tomwalters@32: // AIM-C: A C++ implementation of the Auditory Image Model tomwalters@32: // http://www.acousticscale.org/AIMC tomwalters@32: // tomwalters@45: // Licensed under the Apache License, Version 2.0 (the "License"); tomwalters@45: // you may not use this file except in compliance with the License. tomwalters@45: // You may obtain a copy of the License at tomwalters@32: // tomwalters@45: // http://www.apache.org/licenses/LICENSE-2.0 tomwalters@32: // tomwalters@45: // Unless required by applicable law or agreed to in writing, software tomwalters@45: // distributed under the License is distributed on an "AS IS" BASIS, tomwalters@45: // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. tomwalters@45: // See the License for the specific language governing permissions and tomwalters@45: // limitations under the License. tomwalters@32: tomwalters@32: /*! tomwalters@32: * \file AIMCopy.cpp tomwalters@32: * \brief AIM-C replacement for HTK's HCopy tomwalters@32: * tomwalters@32: * The following subset of the command-line flags tomwalters@32: * should be implemented from HCopy: tomwalters@32: * -A Print command line arguments off tomwalters@32: * -C cf Set config file to cf default tomwalters@32: * (should be able to take multiple config files) tomwalters@32: * -S f Set script file to f none tomwalters@32: * //! \todo -T N Set trace flags to N 0 tomwalters@32: * -V Print version information off tomwalters@32: * -D of Write configuration data to of none tomwalters@32: * tomwalters@32: * \author Thomas Walters tomwalters@32: * \date created 2008/05/08 tomwalters@32: * \version \$Id$ tomwalters@32: */ tomwalters@32: tomwalters@32: #include tomwalters@32: #include tomwalters@32: #include tomwalters@32: #include tomwalters@32: #include tomwalters@32: tomwalters@32: #include tomwalters@32: #include tomwalters@32: tomwalters@32: #include "Modules/Input/ModuleFileInput.h" tomwalters@32: #include "Modules/BMM/ModuleGammatone.h" tomwalters@32: #include "Modules/BMM/ModulePZFC.h" tomwalters@32: #include "Modules/NAP/ModuleHCL.h" tomwalters@32: #include "Modules/Strobes/ModuleParabola.h" tomwalters@33: #include "Modules/Strobes/ModuleLocalMax.h" tomwalters@32: #include "Modules/SAI/ModuleSAI.h" tomwalters@32: #include "Modules/SSI/ModuleSSI.h" tomwalters@32: #include "Modules/SNR/ModuleNoise.h" tomwalters@32: #include "Modules/Profile/ModuleSlice.h" tomwalters@32: #include "Modules/Profile/ModuleScaler.h" tomwalters@32: #include "Modules/Features/ModuleGaussians.h" tomwalters@32: #include "Modules/Output/FileOutputHTK.h" tomwalters@32: #include "Support/Common.h" tomwalters@32: #include "Support/FileList.h" tomwalters@32: #include "Support/Parameters.h" tomwalters@32: tomwalters@32: using std::ofstream; tomwalters@32: using std::pair; tomwalters@32: using std::vector; tomwalters@32: using std::string; tomwalters@32: int main(int argc, char* argv[]) { tomwalters@32: string sound_file; tomwalters@32: string data_file; tomwalters@32: string config_file; tomwalters@32: string script_file; tomwalters@32: bool write_data = false; tomwalters@32: bool print_version = false; tomwalters@32: tomwalters@32: string version_string( tomwalters@32: " AIM-C AIMCopy\n" tomwalters@32: " (c) 2006-2010, Thomas Walters and Willem van Engen\n" tomwalters@32: " http://www.acoustiscale.org/AIMC/\n" tomwalters@32: "\n"); tomwalters@32: tomwalters@32: if (argc < 2) { tomwalters@32: printf("%s", version_string.c_str()); tomwalters@32: printf("AIMCopy is intended as a drop-in replacement for HTK's HCopy\n"); tomwalters@32: printf("command. It is used for making features from audio files for\n"); tomwalters@32: printf("use with HTK.\n"); tomwalters@32: printf("Usage: \n"); tomwalters@32: printf(" -A Print command line arguments off\n"); tomwalters@32: printf(" -C cf Set config file to cf none\n"); tomwalters@32: printf(" -S f Set script file to f none\n"); tomwalters@32: printf(" -V Print version information off\n"); tomwalters@32: printf(" -D g Write configuration data to g none\n"); tomwalters@32: return -1; tomwalters@32: } tomwalters@32: tomwalters@32: // Parse command-line arguments tomwalters@32: for (int i = 1; i < argc; i++) { tomwalters@32: if (strcmp(argv[i],"-A") == 0) { tomwalters@32: for (int j = 0; j < argc; j++) tomwalters@32: printf("%s ",argv[j]); tomwalters@32: printf("\n"); tomwalters@32: fflush(stdout); tomwalters@32: continue; tomwalters@32: } tomwalters@32: if (strcmp(argv[i],"-C") == 0) { tomwalters@32: if (++i >= argc) { tomwalters@32: aimc::LOG_ERROR(_T("Configuration file name expected after -C")); tomwalters@32: return(-1); tomwalters@32: } tomwalters@32: config_file = argv[i]; tomwalters@32: continue; tomwalters@32: } tomwalters@32: if (strcmp(argv[i],"-S") == 0) { tomwalters@32: if (++i >= argc) { tomwalters@32: aimc::LOG_ERROR(_T("Script file name expected after -S")); tomwalters@32: return(-1); tomwalters@32: } tomwalters@32: script_file = argv[i]; tomwalters@32: continue; tomwalters@32: } tomwalters@32: if (strcmp(argv[i],"-D") == 0) { tomwalters@32: if (++i >= argc) { tomwalters@32: aimc::LOG_ERROR(_T("Data file name expected after -D")); tomwalters@32: return(-1); tomwalters@32: } tomwalters@32: data_file = argv[i]; tomwalters@32: write_data = true; tomwalters@32: continue; tomwalters@32: } tomwalters@32: if (strcmp(argv[i],"-V") == 0) { tomwalters@32: print_version = true; tomwalters@32: continue; tomwalters@32: } tomwalters@32: aimc::LOG_ERROR(_T("Unrecognized command-line argument: %s"), argv[i]); tomwalters@32: } tomwalters@32: tomwalters@32: if (print_version) tomwalters@32: printf("%s", version_string.c_str()); tomwalters@32: tomwalters@32: aimc::Parameters params; tomwalters@32: tomwalters@32: if (!params.Load(config_file.c_str())) { tomwalters@32: aimc::LOG_ERROR(_T("Couldn't load parameters from file %s"), tomwalters@32: config_file.c_str()); tomwalters@32: return -1; tomwalters@32: } tomwalters@32: tomwalters@32: vector > file_list = aimc::FileList::Load(script_file); tomwalters@32: if (file_list.size() == 0) { tomwalters@32: aimc::LOG_ERROR("No data read from file %s", script_file.c_str()); tomwalters@32: return -1; tomwalters@32: } tomwalters@32: tomwalters@32: // Set up AIM-C processor here tomwalters@32: aimc::ModuleFileInput input(¶ms); tomwalters@33: aimc::ModuleNoise noise_maker(¶ms); tomwalters@32: aimc::ModuleGammatone bmm(¶ms); tomwalters@32: aimc::ModuleHCL nap(¶ms); tomwalters@33: aimc::ModuleLocalMax strobes(¶ms); tomwalters@32: aimc::ModuleSAI sai(¶ms); tomwalters@32: aimc::ModuleSSI ssi(¶ms); tomwalters@32: tomwalters@32: params.SetBool("slice.all", false); tomwalters@33: params.SetInt("slice.lower_index", 77); tomwalters@33: params.SetInt("slice.upper_index", 150); tomwalters@32: aimc::ModuleSlice slice_1(¶ms); tomwalters@32: tomwalters@33: params.SetInt("slice.lower_index", 210); tomwalters@33: params.SetInt("slice.upper_index", 240); tomwalters@32: aimc::ModuleSlice slice_2(¶ms); tomwalters@32: tomwalters@33: params.SetInt("slice.lower_index", 280); tomwalters@33: params.SetInt("slice.upper_index", 304); tomwalters@32: aimc::ModuleSlice slice_3(¶ms); tomwalters@32: tomwalters@33: params.SetInt("slice.lower_index", 328); tomwalters@33: params.SetInt("slice.upper_index", 352); tomwalters@32: aimc::ModuleSlice slice_4(¶ms); tomwalters@32: tomwalters@32: params.SetBool("slice.all", true); tomwalters@32: aimc::ModuleSlice slice_5(¶ms); tomwalters@32: tomwalters@33: params.SetFloat("nap.lowpass_cutoff", 100.0); tomwalters@33: aimc::ModuleHCL smooth_nap(¶ms); tomwalters@33: params.SetBool("slice.all", true); tomwalters@33: aimc::ModuleSlice nap_profile(¶ms); tomwalters@33: aimc::ModuleScaler nap_scaler(¶ms); tomwalters@33: aimc::ModuleGaussians nap_features(¶ms); tomwalters@33: aimc::FileOutputHTK nap_out(¶ms); tomwalters@33: tomwalters@32: aimc::ModuleGaussians features_1(¶ms); tomwalters@32: aimc::ModuleGaussians features_2(¶ms); tomwalters@32: aimc::ModuleGaussians features_3(¶ms); tomwalters@32: aimc::ModuleGaussians features_4(¶ms); tomwalters@32: aimc::ModuleGaussians features_5(¶ms); tomwalters@32: tomwalters@32: aimc::FileOutputHTK output_1(¶ms); tomwalters@32: aimc::FileOutputHTK output_2(¶ms); tomwalters@32: aimc::FileOutputHTK output_3(¶ms); tomwalters@32: aimc::FileOutputHTK output_4(¶ms); tomwalters@32: aimc::FileOutputHTK output_5(¶ms); tomwalters@32: tomwalters@33: input.AddTarget(&noise_maker); tomwalters@33: noise_maker.AddTarget(&bmm); tomwalters@32: bmm.AddTarget(&nap); tomwalters@33: bmm.AddTarget(&smooth_nap); tomwalters@33: smooth_nap.AddTarget(&nap_profile); tomwalters@33: nap_profile.AddTarget(&nap_scaler); tomwalters@33: nap_scaler.AddTarget(&nap_features); tomwalters@33: nap_features.AddTarget(&nap_out); tomwalters@32: nap.AddTarget(&strobes); tomwalters@32: strobes.AddTarget(&sai); tomwalters@32: sai.AddTarget(&ssi); tomwalters@32: tomwalters@32: ssi.AddTarget(&slice_1); tomwalters@32: ssi.AddTarget(&slice_2); tomwalters@32: ssi.AddTarget(&slice_3); tomwalters@32: ssi.AddTarget(&slice_4); tomwalters@32: ssi.AddTarget(&slice_5); tomwalters@32: tomwalters@32: slice_1.AddTarget(&features_1); tomwalters@32: slice_2.AddTarget(&features_2); tomwalters@32: slice_3.AddTarget(&features_3); tomwalters@32: slice_4.AddTarget(&features_4); tomwalters@32: slice_5.AddTarget(&features_5); tomwalters@32: tomwalters@32: features_1.AddTarget(&output_1); tomwalters@32: features_2.AddTarget(&output_2); tomwalters@32: features_3.AddTarget(&output_3); tomwalters@32: features_4.AddTarget(&output_4); tomwalters@32: features_5.AddTarget(&output_5); tomwalters@32: tomwalters@32: if (write_data) { tomwalters@32: ofstream outfile(data_file.c_str()); tomwalters@32: if (outfile.fail()) { tomwalters@32: aimc::LOG_ERROR("Couldn't open data file %s for writing", tomwalters@32: data_file.c_str()); tomwalters@32: return -1; tomwalters@32: } tomwalters@32: time_t rawtime; tomwalters@32: struct tm * timeinfo; tomwalters@32: time(&rawtime); tomwalters@32: timeinfo = localtime(&rawtime); tomwalters@32: tomwalters@32: tomwalters@32: outfile << "# AIM-C AIMCopy\n"; tomwalters@32: outfile << "# Run on: " << asctime(timeinfo); tomwalters@32: char * descr = getenv("USER"); tomwalters@32: if (descr) { tomwalters@32: outfile << "# By user: " << descr <<"\n"; tomwalters@32: } tomwalters@33: outfile << "#Module chain: "; tomwalters@33: outfile << "#input"; tomwalters@33: outfile << "# noise_maker"; tomwalters@32: outfile << "# gt"; tomwalters@33: outfile << "# nap"; tomwalters@33: outfile << "# slice"; tomwalters@33: outfile << "# scaler"; tomwalters@33: outfile << "# features"; tomwalters@33: outfile << "# output"; tomwalters@33: outfile << "# local_max"; tomwalters@33: outfile << "# sai_weighted"; tomwalters@33: outfile << "# ssi"; tomwalters@33: outfile << "# slice"; tomwalters@33: outfile << "# features"; tomwalters@33: outfile << "# output"; tomwalters@33: outfile << "# slice"; tomwalters@33: outfile << "# features"; tomwalters@33: outfile << "# output"; tomwalters@33: outfile << "# slice"; tomwalters@33: outfile << "# features"; tomwalters@33: outfile << "# output"; tomwalters@33: outfile << "# slice"; tomwalters@33: outfile << "# features"; tomwalters@33: outfile << "# output"; tomwalters@33: outfile << "# slice"; tomwalters@33: outfile << "# features"; tomwalters@33: outfile << "# output"; tomwalters@32: outfile << "# "; tomwalters@32: outfile << "# Module versions:\n"; tomwalters@32: outfile << "# " << input.id() << " : " << input.version() << "\n"; tomwalters@32: outfile << "# " << bmm.id() << " : " << bmm.version() << "\n"; tomwalters@32: outfile << "# " << nap.id() << " : " << nap.version() << "\n"; tomwalters@32: outfile << "# " << strobes.id() << " : " << strobes.version() << "\n"; tomwalters@32: outfile << "# " << sai.id() << " : " << sai.version() << "\n"; tomwalters@32: outfile << "# " << slice_1.id() << " : " << slice_1.version() << "\n"; tomwalters@32: // outfile << "# " << profile.id() << " : " << profile.version() << "\n"; tomwalters@32: // outfile << "# " << scaler.id() << " : " << scaler.version() << "\n"; tomwalters@32: outfile << "# " << features_1.id() << " : " << features_1.version() << "\n"; tomwalters@32: outfile << "# " << output_1.id() << " : " << output_1.version() << "\n"; tomwalters@32: outfile << "#\n"; tomwalters@32: outfile << "# Parameters:\n"; tomwalters@32: outfile << params.WriteString(); tomwalters@32: outfile.close(); tomwalters@32: } tomwalters@32: tomwalters@32: for (unsigned int i = 0; i < file_list.size(); ++i) { tomwalters@33: // aimc::LOG_INFO(_T("In: %s"), file_list[i].first.c_str()); tomwalters@32: aimc::LOG_INFO(_T("Out: %s"), file_list[i].second.c_str()); tomwalters@32: tomwalters@33: string filename = file_list[i].second + ".slice_1"; tomwalters@32: output_1.OpenFile(filename.c_str(), 10.0f); tomwalters@33: filename = file_list[i].second + ".slice_2"; tomwalters@32: output_2.OpenFile(filename.c_str(), 10.0f); tomwalters@33: filename = file_list[i].second + ".slice_3"; tomwalters@32: output_3.OpenFile(filename.c_str(), 10.0f); tomwalters@33: filename = file_list[i].second + ".slice_4"; tomwalters@32: output_4.OpenFile(filename.c_str(), 10.0f); tomwalters@33: filename = file_list[i].second + ".ssi_profile"; tomwalters@32: output_5.OpenFile(filename.c_str(), 10.0f); tomwalters@33: filename = file_list[i].second + ".smooth_nap_profile"; tomwalters@33: nap_out.OpenFile(filename.c_str(), 10.0f); tomwalters@32: tomwalters@32: if (input.LoadFile(file_list[i].first.c_str())) { tomwalters@32: input.Process(); tomwalters@32: } else { tomwalters@32: printf("LoadFile failed for file %s\n", file_list[i].first.c_str()); tomwalters@32: } tomwalters@32: input.Reset(); tomwalters@32: } tomwalters@32: tomwalters@32: return 0; tomwalters@32: }