tomwalters@305: // Copyright 2008-2010, Thomas Walters tomwalters@305: // tomwalters@305: // AIM-C: A C++ implementation of the Auditory Image Model tomwalters@305: // http://www.acousticscale.org/AIMC tomwalters@305: // tomwalters@318: // Licensed under the Apache License, Version 2.0 (the "License"); tomwalters@318: // you may not use this file except in compliance with the License. tomwalters@318: // You may obtain a copy of the License at tomwalters@305: // tomwalters@318: // http://www.apache.org/licenses/LICENSE-2.0 tomwalters@305: // tomwalters@318: // Unless required by applicable law or agreed to in writing, software tomwalters@318: // distributed under the License is distributed on an "AS IS" BASIS, tomwalters@318: // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. tomwalters@318: // See the License for the specific language governing permissions and tomwalters@318: // limitations under the License. tomwalters@305: tomwalters@305: /*! tomwalters@305: * \file AIMCopy.cpp tomwalters@305: * \brief AIM-C replacement for HTK's HCopy tomwalters@305: * tomwalters@305: * The following subset of the command-line flags tomwalters@305: * should be implemented from HCopy: tomwalters@305: * -A Print command line arguments off tomwalters@305: * -C cf Set config file to cf default tomwalters@305: * (should be able to take multiple config files) tomwalters@305: * -S f Set script file to f none tomwalters@305: * //! \todo -T N Set trace flags to N 0 tomwalters@305: * -V Print version information off tomwalters@305: * -D of Write configuration data to of none tomwalters@305: * tomwalters@305: * \author Thomas Walters tomwalters@305: * \date created 2008/05/08 tomwalters@305: * \version \$Id$ tomwalters@305: */ tomwalters@305: tomwalters@305: #include tomwalters@305: #include tomwalters@305: #include tomwalters@305: #include tomwalters@305: #include tomwalters@305: tomwalters@305: #include tomwalters@305: #include tomwalters@305: tomwalters@305: #include "Modules/Input/ModuleFileInput.h" tomwalters@305: #include "Modules/BMM/ModuleGammatone.h" tomwalters@305: #include "Modules/BMM/ModulePZFC.h" tomwalters@305: #include "Modules/NAP/ModuleHCL.h" tomwalters@305: #include "Modules/Strobes/ModuleParabola.h" tomwalters@306: #include "Modules/Strobes/ModuleLocalMax.h" tomwalters@305: #include "Modules/SAI/ModuleSAI.h" tomwalters@305: #include "Modules/SSI/ModuleSSI.h" tomwalters@305: #include "Modules/SNR/ModuleNoise.h" tomwalters@305: #include "Modules/Profile/ModuleSlice.h" tomwalters@305: #include "Modules/Profile/ModuleScaler.h" tomwalters@305: #include "Modules/Features/ModuleGaussians.h" tomwalters@305: #include "Modules/Output/FileOutputHTK.h" tomwalters@305: #include "Support/Common.h" tomwalters@305: #include "Support/FileList.h" tomwalters@305: #include "Support/Parameters.h" tomwalters@305: tomwalters@305: using std::ofstream; tomwalters@305: using std::pair; tomwalters@305: using std::vector; tomwalters@305: using std::string; tomwalters@305: int main(int argc, char* argv[]) { tomwalters@305: string sound_file; tomwalters@305: string data_file; tomwalters@305: string config_file; tomwalters@305: string script_file; tomwalters@305: bool write_data = false; tomwalters@305: bool print_version = false; tomwalters@305: tomwalters@305: string version_string( tomwalters@305: " AIM-C AIMCopy\n" tomwalters@305: " (c) 2006-2010, Thomas Walters and Willem van Engen\n" tomwalters@305: " http://www.acoustiscale.org/AIMC/\n" tomwalters@305: "\n"); tomwalters@305: tomwalters@305: if (argc < 2) { tomwalters@305: printf("%s", version_string.c_str()); tomwalters@305: printf("AIMCopy is intended as a drop-in replacement for HTK's HCopy\n"); tomwalters@305: printf("command. It is used for making features from audio files for\n"); tomwalters@305: printf("use with HTK.\n"); tomwalters@305: printf("Usage: \n"); tomwalters@305: printf(" -A Print command line arguments off\n"); tomwalters@305: printf(" -C cf Set config file to cf none\n"); tomwalters@305: printf(" -S f Set script file to f none\n"); tomwalters@305: printf(" -V Print version information off\n"); tomwalters@305: printf(" -D g Write configuration data to g none\n"); tomwalters@305: return -1; tomwalters@305: } tomwalters@305: tomwalters@305: // Parse command-line arguments tomwalters@305: for (int i = 1; i < argc; i++) { tomwalters@305: if (strcmp(argv[i],"-A") == 0) { tomwalters@305: for (int j = 0; j < argc; j++) tomwalters@305: printf("%s ",argv[j]); tomwalters@305: printf("\n"); tomwalters@305: fflush(stdout); tomwalters@305: continue; tomwalters@305: } tomwalters@305: if (strcmp(argv[i],"-C") == 0) { tomwalters@305: if (++i >= argc) { tomwalters@305: aimc::LOG_ERROR(_T("Configuration file name expected after -C")); tomwalters@305: return(-1); tomwalters@305: } tomwalters@305: config_file = argv[i]; tomwalters@305: continue; tomwalters@305: } tomwalters@305: if (strcmp(argv[i],"-S") == 0) { tomwalters@305: if (++i >= argc) { tomwalters@305: aimc::LOG_ERROR(_T("Script file name expected after -S")); tomwalters@305: return(-1); tomwalters@305: } tomwalters@305: script_file = argv[i]; tomwalters@305: continue; tomwalters@305: } tomwalters@305: if (strcmp(argv[i],"-D") == 0) { tomwalters@305: if (++i >= argc) { tomwalters@305: aimc::LOG_ERROR(_T("Data file name expected after -D")); tomwalters@305: return(-1); tomwalters@305: } tomwalters@305: data_file = argv[i]; tomwalters@305: write_data = true; tomwalters@305: continue; tomwalters@305: } tomwalters@305: if (strcmp(argv[i],"-V") == 0) { tomwalters@305: print_version = true; tomwalters@305: continue; tomwalters@305: } tomwalters@305: aimc::LOG_ERROR(_T("Unrecognized command-line argument: %s"), argv[i]); tomwalters@305: } tomwalters@305: tomwalters@305: if (print_version) tomwalters@305: printf("%s", version_string.c_str()); tomwalters@305: tomwalters@305: aimc::Parameters params; tomwalters@305: tomwalters@305: if (!params.Load(config_file.c_str())) { tomwalters@305: aimc::LOG_ERROR(_T("Couldn't load parameters from file %s"), tomwalters@305: config_file.c_str()); tomwalters@305: return -1; tomwalters@305: } tomwalters@305: tomwalters@305: vector > file_list = aimc::FileList::Load(script_file); tomwalters@305: if (file_list.size() == 0) { tomwalters@305: aimc::LOG_ERROR("No data read from file %s", script_file.c_str()); tomwalters@305: return -1; tomwalters@305: } tomwalters@305: tomwalters@305: // Set up AIM-C processor here tomwalters@305: aimc::ModuleFileInput input(¶ms); tomwalters@306: aimc::ModuleNoise noise_maker(¶ms); tomwalters@305: aimc::ModuleGammatone bmm(¶ms); tomwalters@305: aimc::ModuleHCL nap(¶ms); tomwalters@306: aimc::ModuleLocalMax strobes(¶ms); tomwalters@305: aimc::ModuleSAI sai(¶ms); tomwalters@305: aimc::ModuleSSI ssi(¶ms); tomwalters@305: tomwalters@305: params.SetBool("slice.all", false); tomwalters@306: params.SetInt("slice.lower_index", 77); tomwalters@306: params.SetInt("slice.upper_index", 150); tomwalters@305: aimc::ModuleSlice slice_1(¶ms); tomwalters@305: tomwalters@306: params.SetInt("slice.lower_index", 210); tomwalters@306: params.SetInt("slice.upper_index", 240); tomwalters@305: aimc::ModuleSlice slice_2(¶ms); tomwalters@305: tomwalters@306: params.SetInt("slice.lower_index", 280); tomwalters@306: params.SetInt("slice.upper_index", 304); tomwalters@305: aimc::ModuleSlice slice_3(¶ms); tomwalters@305: tomwalters@306: params.SetInt("slice.lower_index", 328); tomwalters@306: params.SetInt("slice.upper_index", 352); tomwalters@305: aimc::ModuleSlice slice_4(¶ms); tomwalters@305: tomwalters@305: params.SetBool("slice.all", true); tomwalters@305: aimc::ModuleSlice slice_5(¶ms); tomwalters@305: tomwalters@306: params.SetFloat("nap.lowpass_cutoff", 100.0); tomwalters@306: aimc::ModuleHCL smooth_nap(¶ms); tomwalters@306: params.SetBool("slice.all", true); tomwalters@306: aimc::ModuleSlice nap_profile(¶ms); tomwalters@306: aimc::ModuleScaler nap_scaler(¶ms); tomwalters@306: aimc::ModuleGaussians nap_features(¶ms); tomwalters@306: aimc::FileOutputHTK nap_out(¶ms); tomwalters@306: tomwalters@305: aimc::ModuleGaussians features_1(¶ms); tomwalters@305: aimc::ModuleGaussians features_2(¶ms); tomwalters@305: aimc::ModuleGaussians features_3(¶ms); tomwalters@305: aimc::ModuleGaussians features_4(¶ms); tomwalters@305: aimc::ModuleGaussians features_5(¶ms); tomwalters@305: tomwalters@305: aimc::FileOutputHTK output_1(¶ms); tomwalters@305: aimc::FileOutputHTK output_2(¶ms); tomwalters@305: aimc::FileOutputHTK output_3(¶ms); tomwalters@305: aimc::FileOutputHTK output_4(¶ms); tomwalters@305: aimc::FileOutputHTK output_5(¶ms); tomwalters@305: tomwalters@306: input.AddTarget(&noise_maker); tomwalters@306: noise_maker.AddTarget(&bmm); tomwalters@305: bmm.AddTarget(&nap); tomwalters@306: bmm.AddTarget(&smooth_nap); tomwalters@306: smooth_nap.AddTarget(&nap_profile); tomwalters@306: nap_profile.AddTarget(&nap_scaler); tomwalters@306: nap_scaler.AddTarget(&nap_features); tomwalters@306: nap_features.AddTarget(&nap_out); tomwalters@305: nap.AddTarget(&strobes); tomwalters@305: strobes.AddTarget(&sai); tomwalters@305: sai.AddTarget(&ssi); tomwalters@305: tomwalters@305: ssi.AddTarget(&slice_1); tomwalters@305: ssi.AddTarget(&slice_2); tomwalters@305: ssi.AddTarget(&slice_3); tomwalters@305: ssi.AddTarget(&slice_4); tomwalters@305: ssi.AddTarget(&slice_5); tomwalters@305: tomwalters@305: slice_1.AddTarget(&features_1); tomwalters@305: slice_2.AddTarget(&features_2); tomwalters@305: slice_3.AddTarget(&features_3); tomwalters@305: slice_4.AddTarget(&features_4); tomwalters@305: slice_5.AddTarget(&features_5); tomwalters@305: tomwalters@305: features_1.AddTarget(&output_1); tomwalters@305: features_2.AddTarget(&output_2); tomwalters@305: features_3.AddTarget(&output_3); tomwalters@305: features_4.AddTarget(&output_4); tomwalters@305: features_5.AddTarget(&output_5); tomwalters@305: tomwalters@305: if (write_data) { tomwalters@305: ofstream outfile(data_file.c_str()); tomwalters@305: if (outfile.fail()) { tomwalters@305: aimc::LOG_ERROR("Couldn't open data file %s for writing", tomwalters@305: data_file.c_str()); tomwalters@305: return -1; tomwalters@305: } tomwalters@305: time_t rawtime; tomwalters@305: struct tm * timeinfo; tomwalters@305: time(&rawtime); tomwalters@305: timeinfo = localtime(&rawtime); tomwalters@305: tomwalters@305: tomwalters@305: outfile << "# AIM-C AIMCopy\n"; tomwalters@305: outfile << "# Run on: " << asctime(timeinfo); tomwalters@305: char * descr = getenv("USER"); tomwalters@305: if (descr) { tomwalters@305: outfile << "# By user: " << descr <<"\n"; tomwalters@305: } tomwalters@306: outfile << "#Module chain: "; tomwalters@306: outfile << "#input"; tomwalters@306: outfile << "# noise_maker"; tomwalters@305: outfile << "# gt"; tomwalters@306: outfile << "# nap"; tomwalters@306: outfile << "# slice"; tomwalters@306: outfile << "# scaler"; tomwalters@306: outfile << "# features"; tomwalters@306: outfile << "# output"; tomwalters@306: outfile << "# local_max"; tomwalters@306: outfile << "# sai_weighted"; tomwalters@306: outfile << "# ssi"; tomwalters@306: outfile << "# slice"; tomwalters@306: outfile << "# features"; tomwalters@306: outfile << "# output"; tomwalters@306: outfile << "# slice"; tomwalters@306: outfile << "# features"; tomwalters@306: outfile << "# output"; tomwalters@306: outfile << "# slice"; tomwalters@306: outfile << "# features"; tomwalters@306: outfile << "# output"; tomwalters@306: outfile << "# slice"; tomwalters@306: outfile << "# features"; tomwalters@306: outfile << "# output"; tomwalters@306: outfile << "# slice"; tomwalters@306: outfile << "# features"; tomwalters@306: outfile << "# output"; tomwalters@305: outfile << "# "; tomwalters@305: outfile << "# Module versions:\n"; tomwalters@305: outfile << "# " << input.id() << " : " << input.version() << "\n"; tomwalters@305: outfile << "# " << bmm.id() << " : " << bmm.version() << "\n"; tomwalters@305: outfile << "# " << nap.id() << " : " << nap.version() << "\n"; tomwalters@305: outfile << "# " << strobes.id() << " : " << strobes.version() << "\n"; tomwalters@305: outfile << "# " << sai.id() << " : " << sai.version() << "\n"; tomwalters@305: outfile << "# " << slice_1.id() << " : " << slice_1.version() << "\n"; tomwalters@305: // outfile << "# " << profile.id() << " : " << profile.version() << "\n"; tomwalters@305: // outfile << "# " << scaler.id() << " : " << scaler.version() << "\n"; tomwalters@305: outfile << "# " << features_1.id() << " : " << features_1.version() << "\n"; tomwalters@305: outfile << "# " << output_1.id() << " : " << output_1.version() << "\n"; tomwalters@305: outfile << "#\n"; tomwalters@305: outfile << "# Parameters:\n"; tomwalters@305: outfile << params.WriteString(); tomwalters@305: outfile.close(); tomwalters@305: } tomwalters@305: tomwalters@305: for (unsigned int i = 0; i < file_list.size(); ++i) { tomwalters@306: // aimc::LOG_INFO(_T("In: %s"), file_list[i].first.c_str()); tomwalters@305: aimc::LOG_INFO(_T("Out: %s"), file_list[i].second.c_str()); tomwalters@305: tomwalters@306: string filename = file_list[i].second + ".slice_1"; tomwalters@305: output_1.OpenFile(filename.c_str(), 10.0f); tomwalters@306: filename = file_list[i].second + ".slice_2"; tomwalters@305: output_2.OpenFile(filename.c_str(), 10.0f); tomwalters@306: filename = file_list[i].second + ".slice_3"; tomwalters@305: output_3.OpenFile(filename.c_str(), 10.0f); tomwalters@306: filename = file_list[i].second + ".slice_4"; tomwalters@305: output_4.OpenFile(filename.c_str(), 10.0f); tomwalters@306: filename = file_list[i].second + ".ssi_profile"; tomwalters@305: output_5.OpenFile(filename.c_str(), 10.0f); tomwalters@306: filename = file_list[i].second + ".smooth_nap_profile"; tomwalters@306: nap_out.OpenFile(filename.c_str(), 10.0f); tomwalters@305: tomwalters@305: if (input.LoadFile(file_list[i].first.c_str())) { tomwalters@305: input.Process(); tomwalters@305: } else { tomwalters@305: printf("LoadFile failed for file %s\n", file_list[i].first.c_str()); tomwalters@305: } tomwalters@305: input.Reset(); tomwalters@305: } tomwalters@305: tomwalters@305: return 0; tomwalters@305: }