tomwalters@41: // Copyright 2008-2010, Thomas Walters tomwalters@41: // tomwalters@41: // AIM-C: A C++ implementation of the Auditory Image Model tomwalters@41: // http://www.acousticscale.org/AIMC tomwalters@41: // tomwalters@45: // Licensed under the Apache License, Version 2.0 (the "License"); tomwalters@45: // you may not use this file except in compliance with the License. tomwalters@45: // You may obtain a copy of the License at tomwalters@41: // tomwalters@45: // http://www.apache.org/licenses/LICENSE-2.0 tomwalters@41: // tomwalters@45: // Unless required by applicable law or agreed to in writing, software tomwalters@45: // distributed under the License is distributed on an "AS IS" BASIS, tomwalters@45: // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. tomwalters@45: // See the License for the specific language governing permissions and tomwalters@45: // limitations under the License. tomwalters@41: tomwalters@41: /*! tomwalters@41: * \file AIMCopy.cpp tomwalters@41: * \brief AIM-C replacement for HTK's HCopy tomwalters@41: * tomwalters@41: * The following subset of the command-line flags tomwalters@41: * should be implemented from HCopy: tomwalters@41: * -A Print command line arguments off tomwalters@41: * -C cf Set config file to cf default tomwalters@41: * (should be able to take multiple config files) tomwalters@41: * -S f Set script file to f none tomwalters@41: * //! \todo -T N Set trace flags to N 0 tomwalters@41: * -V Print version information off tomwalters@41: * -D of Write configuration data to of none tomwalters@41: * tomwalters@41: * \author Thomas Walters tomwalters@41: * \date created 2008/05/08 tomwalters@41: * \version \$Id$ tomwalters@41: */ tomwalters@41: tomwalters@41: #include tomwalters@41: #include tomwalters@41: #include tomwalters@41: #include tomwalters@41: #include tomwalters@41: tomwalters@41: #include tomwalters@41: #include tomwalters@41: tomwalters@41: #include "Modules/Input/ModuleFileInput.h" tomwalters@41: #include "Modules/BMM/ModuleGammatone.h" tomwalters@41: #include "Modules/BMM/ModulePZFC.h" tomwalters@41: #include "Modules/NAP/ModuleHCL.h" tomwalters@41: #include "Modules/Strobes/ModuleParabola.h" tomwalters@41: #include "Modules/Strobes/ModuleLocalMax.h" tomwalters@41: #include "Modules/SAI/ModuleSAI.h" tomwalters@41: #include "Modules/SSI/ModuleSSI.h" tomwalters@41: #include "Modules/SNR/ModuleNoise.h" tomwalters@41: #include "Modules/Profile/ModuleSlice.h" tomwalters@41: #include "Modules/Profile/ModuleScaler.h" tomwalters@41: #include "Modules/Features/ModuleGaussians.h" tomwalters@41: #include "Modules/Output/FileOutputHTK.h" tomwalters@41: #include "Support/Common.h" tomwalters@41: #include "Support/FileList.h" tomwalters@41: #include "Support/Parameters.h" tomwalters@41: tomwalters@41: using std::ofstream; tomwalters@41: using std::pair; tomwalters@41: using std::vector; tomwalters@41: using std::string; tomwalters@41: int main(int argc, char* argv[]) { tomwalters@41: string sound_file; tomwalters@41: string data_file; tomwalters@41: string config_file; tomwalters@41: string script_file; tomwalters@41: bool write_data = false; tomwalters@41: bool print_version = false; tomwalters@189: bool load_params = false; tomwalters@41: tomwalters@41: string version_string( tomwalters@41: " AIM-C AIMCopy\n" tomwalters@41: " (c) 2006-2010, Thomas Walters and Willem van Engen\n" tomwalters@41: " http://www.acoustiscale.org/AIMC/\n" tomwalters@41: "\n"); tomwalters@41: tomwalters@41: if (argc < 2) { tomwalters@41: printf("%s", version_string.c_str()); tomwalters@41: printf("AIMCopy is intended as a drop-in replacement for HTK's HCopy\n"); tomwalters@41: printf("command. It is used for making features from audio files for\n"); tomwalters@41: printf("use with HTK.\n"); tomwalters@41: printf("Usage: \n"); tomwalters@41: printf(" -A Print command line arguments off\n"); tomwalters@41: printf(" -C cf Set config file to cf none\n"); tomwalters@41: printf(" -S f Set script file to f none\n"); tomwalters@41: printf(" -V Print version information off\n"); tomwalters@41: printf(" -D g Write configuration data to g none\n"); tomwalters@41: return -1; tomwalters@41: } tomwalters@41: tomwalters@41: // Parse command-line arguments tomwalters@41: for (int i = 1; i < argc; i++) { tomwalters@41: if (strcmp(argv[i],"-A") == 0) { tomwalters@41: for (int j = 0; j < argc; j++) tomwalters@41: printf("%s ",argv[j]); tomwalters@41: printf("\n"); tomwalters@41: fflush(stdout); tomwalters@41: continue; tomwalters@41: } tomwalters@41: if (strcmp(argv[i],"-C") == 0) { tomwalters@41: if (++i >= argc) { tomwalters@41: aimc::LOG_ERROR(_T("Configuration file name expected after -C")); tomwalters@41: return(-1); tomwalters@41: } tomwalters@41: config_file = argv[i]; tomwalters@189: load_params = true; tomwalters@41: continue; tomwalters@41: } tomwalters@41: if (strcmp(argv[i],"-S") == 0) { tomwalters@41: if (++i >= argc) { tomwalters@41: aimc::LOG_ERROR(_T("Script file name expected after -S")); tomwalters@41: return(-1); tomwalters@41: } tomwalters@41: script_file = argv[i]; tomwalters@41: continue; tomwalters@41: } tomwalters@41: if (strcmp(argv[i],"-D") == 0) { tomwalters@41: if (++i >= argc) { tomwalters@41: aimc::LOG_ERROR(_T("Data file name expected after -D")); tomwalters@41: return(-1); tomwalters@41: } tomwalters@41: data_file = argv[i]; tomwalters@41: write_data = true; tomwalters@41: continue; tomwalters@41: } tomwalters@41: if (strcmp(argv[i],"-V") == 0) { tomwalters@41: print_version = true; tomwalters@41: continue; tomwalters@41: } tomwalters@41: aimc::LOG_ERROR(_T("Unrecognized command-line argument: %s"), argv[i]); tomwalters@41: } tomwalters@41: tomwalters@41: if (print_version) tomwalters@41: printf("%s", version_string.c_str()); tomwalters@41: tomwalters@41: aimc::Parameters params; tomwalters@41: tomwalters@189: if (load_params) { tomwalters@189: if (!params.Load(config_file.c_str())) { tomwalters@189: aimc::LOG_ERROR(_T("Couldn't load parameters from file %s"), tomwalters@189: config_file.c_str()); tomwalters@189: return -1; tomwalters@189: } tomwalters@41: } tomwalters@41: tomwalters@41: vector > file_list = aimc::FileList::Load(script_file); tomwalters@41: if (file_list.size() == 0) { tomwalters@41: aimc::LOG_ERROR("No data read from file %s", script_file.c_str()); tomwalters@41: return -1; tomwalters@41: } tomwalters@41: tomwalters@41: // Set up AIM-C processor here tomwalters@41: aimc::ModuleFileInput input(¶ms); tomwalters@41: //aimc::ModuleNoise noise_maker(¶ms); tomwalters@41: aimc::ModuleGammatone bmm(¶ms); tomwalters@41: aimc::ModuleHCL nap(¶ms); tomwalters@41: aimc::ModuleLocalMax strobes(¶ms); tomwalters@41: aimc::ModuleSAI sai(¶ms); tomwalters@41: params.SetBool("ssi.pitch_cutoff", false); tomwalters@41: aimc::ModuleSSI ssi_no_cutoff(¶ms); tomwalters@41: tomwalters@41: params.SetBool("ssi.pitch_cutoff", true); tomwalters@41: params.SetFloat("ssi.pitch_search_start_ms", 4.6f); tomwalters@41: aimc::ModuleSSI ssi_cutoff(¶ms); tomwalters@41: tomwalters@41: params.SetBool("slice.all", false); tomwalters@41: params.SetInt("slice.lower_index", 77); tomwalters@41: params.SetInt("slice.upper_index", 150); tomwalters@41: aimc::ModuleSlice slice_ssi_slice_1_no_cutoff(¶ms); tomwalters@41: aimc::ModuleSlice slice_ssi_slice_1_cutoff(¶ms); tomwalters@41: tomwalters@41: params.SetBool("slice.all", true); tomwalters@41: aimc::ModuleSlice slice_ssi_all_no_cutoff(¶ms); tomwalters@41: aimc::ModuleSlice slice_ssi_all_cutoff(¶ms); tomwalters@41: tomwalters@41: params.SetFloat("nap.lowpass_cutoff", 100.0); tomwalters@41: aimc::ModuleHCL smooth_nap(¶ms); tomwalters@41: params.SetBool("slice.all", true); tomwalters@41: aimc::ModuleSlice nap_profile(¶ms); tomwalters@41: aimc::ModuleScaler nap_scaler(¶ms); tomwalters@41: tomwalters@41: aimc::ModuleGaussians nap_features(¶ms); tomwalters@41: aimc::ModuleGaussians features_ssi_slice1_no_cutoff(¶ms); tomwalters@41: aimc::ModuleGaussians features_ssi_slice1_cutoff(¶ms); tomwalters@41: aimc::ModuleGaussians features_ssi_all_no_cutoff(¶ms); tomwalters@41: aimc::ModuleGaussians features_ssi_all_cutoff(¶ms); tomwalters@41: tomwalters@41: aimc::FileOutputHTK nap_out(¶ms); tomwalters@41: aimc::FileOutputHTK output_ssi_slice1_no_cutoff(¶ms); tomwalters@41: aimc::FileOutputHTK output_ssi_slice1_cutoff(¶ms); tomwalters@41: aimc::FileOutputHTK output_ssi_all_no_cutoff(¶ms); tomwalters@41: aimc::FileOutputHTK output_ssi_all_cutoff(¶ms); tomwalters@41: tomwalters@41: input.AddTarget(&bmm); tomwalters@41: //noise_maker.AddTarget(&bmm); tomwalters@41: bmm.AddTarget(&nap); tomwalters@41: bmm.AddTarget(&smooth_nap); tomwalters@41: smooth_nap.AddTarget(&nap_profile); tomwalters@41: nap_profile.AddTarget(&nap_scaler); tomwalters@41: nap_scaler.AddTarget(&nap_features); tomwalters@41: nap_features.AddTarget(&nap_out); tomwalters@41: tomwalters@41: nap.AddTarget(&strobes); tomwalters@41: strobes.AddTarget(&sai); tomwalters@41: sai.AddTarget(&ssi_no_cutoff); tomwalters@41: sai.AddTarget(&ssi_cutoff); tomwalters@41: tomwalters@42: ssi_no_cutoff.AddTarget(&slice_ssi_slice_1_no_cutoff); tomwalters@42: ssi_no_cutoff.AddTarget(&slice_ssi_all_no_cutoff); tomwalters@42: ssi_cutoff.AddTarget(&slice_ssi_slice_1_cutoff); tomwalters@42: ssi_cutoff.AddTarget(&slice_ssi_all_cutoff); tomwalters@41: tomwalters@41: slice_ssi_slice_1_no_cutoff.AddTarget(&features_ssi_slice1_no_cutoff); tomwalters@41: slice_ssi_all_no_cutoff.AddTarget(&features_ssi_all_no_cutoff); tomwalters@41: slice_ssi_slice_1_cutoff.AddTarget(&features_ssi_slice1_cutoff); tomwalters@41: slice_ssi_all_cutoff.AddTarget(&features_ssi_all_cutoff); tomwalters@41: tomwalters@41: tomwalters@41: features_ssi_slice1_no_cutoff.AddTarget(&output_ssi_slice1_no_cutoff); tomwalters@41: features_ssi_all_no_cutoff.AddTarget(&output_ssi_all_no_cutoff); tomwalters@41: features_ssi_slice1_cutoff.AddTarget(&output_ssi_slice1_cutoff); tomwalters@41: features_ssi_all_cutoff.AddTarget(&output_ssi_all_cutoff); tomwalters@41: tomwalters@41: tomwalters@41: if (write_data) { tomwalters@41: ofstream outfile(data_file.c_str()); tomwalters@41: if (outfile.fail()) { tomwalters@41: aimc::LOG_ERROR("Couldn't open data file %s for writing", tomwalters@41: data_file.c_str()); tomwalters@41: return -1; tomwalters@41: } tomwalters@41: time_t rawtime; tomwalters@41: struct tm * timeinfo; tomwalters@41: time(&rawtime); tomwalters@41: timeinfo = localtime(&rawtime); tomwalters@41: tomwalters@41: tomwalters@41: outfile << "# AIM-C AIMCopy\n"; tomwalters@41: outfile << "# Run on: " << asctime(timeinfo); tomwalters@41: char * descr = getenv("USER"); tomwalters@41: if (descr) { tomwalters@41: outfile << "# By user: " << descr <<"\n"; tomwalters@41: } tomwalters@49: outfile << "# Module chain:\n"; tomwalters@49: outfile << "#"; tomwalters@49: input.PrintTargets(outfile); tomwalters@49: outfile << "\n"; tomwalters@49: outfile << "#\n"; tomwalters@49: input.PrintVersions(outfile); tomwalters@49: outfile << "\n"; tomwalters@41: outfile << "#\n"; tomwalters@41: outfile << "# Parameters:\n"; tomwalters@41: outfile << params.WriteString(); tomwalters@41: outfile.close(); tomwalters@41: } tomwalters@41: tomwalters@41: for (unsigned int i = 0; i < file_list.size(); ++i) { tomwalters@41: // aimc::LOG_INFO(_T("In: %s"), file_list[i].first.c_str()); tomwalters@41: aimc::LOG_INFO(_T("Out: %s"), file_list[i].second.c_str()); tomwalters@41: tomwalters@189: string filename = file_list[i].second + "slice_1_no_cutoff"; tomwalters@41: output_ssi_slice1_no_cutoff.OpenFile(filename.c_str(), 10.0f); tomwalters@189: filename = file_list[i].second + "ssi_profile_no_cutoff"; tomwalters@41: output_ssi_all_no_cutoff.OpenFile(filename.c_str(), 10.0f); tomwalters@189: filename = file_list[i].second + "slice_1_cutoff"; tomwalters@41: output_ssi_slice1_cutoff.OpenFile(filename.c_str(), 10.0f); tomwalters@189: filename = file_list[i].second + "ssi_profile_cutoff"; tomwalters@41: output_ssi_all_cutoff.OpenFile(filename.c_str(), 10.0f); tomwalters@189: filename = file_list[i].second + "smooth_nap_profile"; tomwalters@41: nap_out.OpenFile(filename.c_str(), 10.0f); tomwalters@41: tomwalters@41: if (input.LoadFile(file_list[i].first.c_str())) { tomwalters@41: input.Process(); tomwalters@41: } else { tomwalters@41: printf("LoadFile failed for file %s\n", file_list[i].first.c_str()); tomwalters@41: } tomwalters@41: input.Reset(); tomwalters@41: } tomwalters@41: tomwalters@41: return 0; tomwalters@41: }