annotate trunk/src/Main/AIMCopy_SSI_Features_v3.cc @ 706:f8e90b5d85fd tip

Delete CARFAC code from this repository. It has been moved to https://github.com/google/carfac Please email me with your github username to get access. I've also created a new mailing list to discuss CARFAC development: https://groups.google.com/forum/#!forum/carfac-dev
author ronw@google.com
date Thu, 18 Jul 2013 20:56:51 +0000
parents 7074795fd2eb
children
rev   line source
tomwalters@314 1 // Copyright 2008-2010, Thomas Walters
tomwalters@314 2 //
tomwalters@314 3 // AIM-C: A C++ implementation of the Auditory Image Model
tomwalters@314 4 // http://www.acousticscale.org/AIMC
tomwalters@314 5 //
tomwalters@318 6 // Licensed under the Apache License, Version 2.0 (the "License");
tomwalters@318 7 // you may not use this file except in compliance with the License.
tomwalters@318 8 // You may obtain a copy of the License at
tomwalters@314 9 //
tomwalters@318 10 // http://www.apache.org/licenses/LICENSE-2.0
tomwalters@314 11 //
tomwalters@318 12 // Unless required by applicable law or agreed to in writing, software
tomwalters@318 13 // distributed under the License is distributed on an "AS IS" BASIS,
tomwalters@318 14 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
tomwalters@318 15 // See the License for the specific language governing permissions and
tomwalters@318 16 // limitations under the License.
tomwalters@314 17
tomwalters@314 18 /*!
tomwalters@314 19 * \file AIMCopy_SSI_Features_v3.cc
tomwalters@314 20 * \brief AIM-C replacement for HTK's HCopy
tomwalters@314 21 *
tomwalters@314 22 * The following subset of the command-line flags
tomwalters@314 23 * should be implemented from HCopy:
tomwalters@314 24 * -A Print command line arguments off
tomwalters@314 25 * -C cf Set config file to cf default
tomwalters@314 26 * (should be able to take multiple config files)
tomwalters@314 27 * -S f Set script file to f none
tomwalters@314 28 * //! \todo -T N Set trace flags to N 0
tomwalters@314 29 * -V Print version information off
tomwalters@314 30 * -D of Write configuration data to of none
tomwalters@314 31 *
tomwalters@314 32 * \author Thomas Walters <tom@acousticscale.org>
tomwalters@314 33 * \date created 2008/05/08
tomwalters@314 34 * \version \$Id$
tomwalters@314 35 */
tomwalters@314 36
tomwalters@314 37 #include <fstream>
tomwalters@314 38 #include <iostream>
tomwalters@314 39 #include <string>
tomwalters@314 40 #include <utility>
tomwalters@314 41 #include <vector>
tomwalters@314 42
tomwalters@314 43 #include <stdlib.h>
tomwalters@314 44 #include <time.h>
tomwalters@314 45
tomwalters@314 46 #include "Modules/Input/ModuleFileInput.h"
tomwalters@314 47 #include "Modules/BMM/ModuleGammatone.h"
tomwalters@314 48 #include "Modules/BMM/ModulePZFC.h"
tomwalters@314 49 #include "Modules/NAP/ModuleHCL.h"
tomwalters@314 50 #include "Modules/Strobes/ModuleParabola.h"
tomwalters@314 51 #include "Modules/Strobes/ModuleLocalMax.h"
tomwalters@314 52 #include "Modules/SAI/ModuleSAI.h"
tomwalters@314 53 #include "Modules/SSI/ModuleSSI.h"
tomwalters@314 54 #include "Modules/SNR/ModuleNoise.h"
tomwalters@314 55 #include "Modules/Profile/ModuleSlice.h"
tomwalters@314 56 #include "Modules/Profile/ModuleScaler.h"
tomwalters@314 57 #include "Modules/Features/ModuleGaussians.h"
tomwalters@314 58 #include "Modules/Output/FileOutputHTK.h"
tomwalters@314 59 #include "Support/Common.h"
tomwalters@314 60 #include "Support/FileList.h"
tomwalters@314 61 #include "Support/Parameters.h"
tomwalters@314 62
tomwalters@314 63 using std::ofstream;
tomwalters@314 64 using std::pair;
tomwalters@314 65 using std::vector;
tomwalters@314 66 using std::string;
tomwalters@314 67 int main(int argc, char* argv[]) {
tomwalters@314 68 string sound_file;
tomwalters@314 69 string data_file;
tomwalters@314 70 string config_file;
tomwalters@314 71 string script_file;
tomwalters@314 72 bool write_data = false;
tomwalters@314 73 bool print_version = false;
tomwalters@359 74 bool load_params = false;
tomwalters@314 75
tomwalters@314 76 string version_string(
tomwalters@314 77 " AIM-C AIMCopy\n"
tomwalters@314 78 " (c) 2006-2010, Thomas Walters and Willem van Engen\n"
tomwalters@314 79 " http://www.acoustiscale.org/AIMC/\n"
tomwalters@314 80 "\n");
tomwalters@314 81
tomwalters@314 82 if (argc < 2) {
tomwalters@314 83 printf("%s", version_string.c_str());
tomwalters@314 84 printf("AIMCopy is intended as a drop-in replacement for HTK's HCopy\n");
tomwalters@314 85 printf("command. It is used for making features from audio files for\n");
tomwalters@314 86 printf("use with HTK.\n");
tomwalters@314 87 printf("Usage: \n");
tomwalters@314 88 printf(" -A Print command line arguments off\n");
tomwalters@314 89 printf(" -C cf Set config file to cf none\n");
tomwalters@314 90 printf(" -S f Set script file to f none\n");
tomwalters@314 91 printf(" -V Print version information off\n");
tomwalters@314 92 printf(" -D g Write configuration data to g none\n");
tomwalters@314 93 return -1;
tomwalters@314 94 }
tomwalters@314 95
tomwalters@314 96 // Parse command-line arguments
tomwalters@314 97 for (int i = 1; i < argc; i++) {
tomwalters@314 98 if (strcmp(argv[i],"-A") == 0) {
tomwalters@314 99 for (int j = 0; j < argc; j++)
tomwalters@314 100 printf("%s ",argv[j]);
tomwalters@314 101 printf("\n");
tomwalters@314 102 fflush(stdout);
tomwalters@314 103 continue;
tomwalters@314 104 }
tomwalters@314 105 if (strcmp(argv[i],"-C") == 0) {
tomwalters@314 106 if (++i >= argc) {
tomwalters@314 107 aimc::LOG_ERROR(_T("Configuration file name expected after -C"));
tomwalters@314 108 return(-1);
tomwalters@314 109 }
tomwalters@314 110 config_file = argv[i];
tomwalters@359 111 load_params = true;
tomwalters@314 112 continue;
tomwalters@314 113 }
tomwalters@314 114 if (strcmp(argv[i],"-S") == 0) {
tomwalters@314 115 if (++i >= argc) {
tomwalters@314 116 aimc::LOG_ERROR(_T("Script file name expected after -S"));
tomwalters@314 117 return(-1);
tomwalters@314 118 }
tomwalters@314 119 script_file = argv[i];
tomwalters@314 120 continue;
tomwalters@314 121 }
tomwalters@314 122 if (strcmp(argv[i],"-D") == 0) {
tomwalters@314 123 if (++i >= argc) {
tomwalters@314 124 aimc::LOG_ERROR(_T("Data file name expected after -D"));
tomwalters@314 125 return(-1);
tomwalters@314 126 }
tomwalters@314 127 data_file = argv[i];
tomwalters@314 128 write_data = true;
tomwalters@314 129 continue;
tomwalters@314 130 }
tomwalters@314 131 if (strcmp(argv[i],"-V") == 0) {
tomwalters@314 132 print_version = true;
tomwalters@314 133 continue;
tomwalters@314 134 }
tomwalters@314 135 aimc::LOG_ERROR(_T("Unrecognized command-line argument: %s"), argv[i]);
tomwalters@314 136 }
tomwalters@314 137
tomwalters@314 138 if (print_version)
tomwalters@314 139 printf("%s", version_string.c_str());
tomwalters@314 140
tomwalters@314 141 aimc::Parameters params;
tomwalters@314 142
tomwalters@359 143 if (load_params) {
tomwalters@359 144 if (!params.Load(config_file.c_str())) {
tomwalters@359 145 aimc::LOG_ERROR(_T("Couldn't load parameters from file %s"),
tomwalters@359 146 config_file.c_str());
tomwalters@359 147 return -1;
tomwalters@359 148 }
tomwalters@314 149 }
tomwalters@314 150
tomwalters@314 151 vector<pair<string, string> > file_list = aimc::FileList::Load(script_file);
tomwalters@314 152 if (file_list.size() == 0) {
tomwalters@314 153 aimc::LOG_ERROR("No data read from file %s", script_file.c_str());
tomwalters@314 154 return -1;
tomwalters@314 155 }
tomwalters@314 156
tomwalters@314 157 // Set up AIM-C processor here
tomwalters@314 158 aimc::ModuleFileInput input(&params);
tomwalters@314 159 //aimc::ModuleNoise noise_maker(&params);
tomwalters@314 160 aimc::ModuleGammatone bmm(&params);
tomwalters@314 161 aimc::ModuleHCL nap(&params);
tomwalters@314 162 aimc::ModuleLocalMax strobes(&params);
tomwalters@314 163 aimc::ModuleSAI sai(&params);
tomwalters@314 164 params.SetBool("ssi.pitch_cutoff", false);
tomwalters@314 165 aimc::ModuleSSI ssi_no_cutoff(&params);
tomwalters@314 166
tomwalters@314 167 params.SetBool("ssi.pitch_cutoff", true);
tomwalters@314 168 params.SetFloat("ssi.pitch_search_start_ms", 4.6f);
tomwalters@314 169 aimc::ModuleSSI ssi_cutoff(&params);
tomwalters@314 170
tomwalters@314 171 params.SetBool("slice.all", false);
tomwalters@314 172 params.SetInt("slice.lower_index", 77);
tomwalters@314 173 params.SetInt("slice.upper_index", 150);
tomwalters@314 174 aimc::ModuleSlice slice_ssi_slice_1_no_cutoff(&params);
tomwalters@314 175 aimc::ModuleSlice slice_ssi_slice_1_cutoff(&params);
tomwalters@314 176
tomwalters@314 177 params.SetBool("slice.all", true);
tomwalters@314 178 aimc::ModuleSlice slice_ssi_all_no_cutoff(&params);
tomwalters@314 179 aimc::ModuleSlice slice_ssi_all_cutoff(&params);
tomwalters@314 180
tomwalters@314 181 params.SetFloat("nap.lowpass_cutoff", 100.0);
tomwalters@314 182 aimc::ModuleHCL smooth_nap(&params);
tomwalters@314 183 params.SetBool("slice.all", true);
tomwalters@314 184 aimc::ModuleSlice nap_profile(&params);
tomwalters@314 185 aimc::ModuleScaler nap_scaler(&params);
tomwalters@314 186
tomwalters@314 187 aimc::ModuleGaussians nap_features(&params);
tomwalters@314 188 aimc::ModuleGaussians features_ssi_slice1_no_cutoff(&params);
tomwalters@314 189 aimc::ModuleGaussians features_ssi_slice1_cutoff(&params);
tomwalters@314 190 aimc::ModuleGaussians features_ssi_all_no_cutoff(&params);
tomwalters@314 191 aimc::ModuleGaussians features_ssi_all_cutoff(&params);
tomwalters@314 192
tomwalters@314 193 aimc::FileOutputHTK nap_out(&params);
tomwalters@314 194 aimc::FileOutputHTK output_ssi_slice1_no_cutoff(&params);
tomwalters@314 195 aimc::FileOutputHTK output_ssi_slice1_cutoff(&params);
tomwalters@314 196 aimc::FileOutputHTK output_ssi_all_no_cutoff(&params);
tomwalters@314 197 aimc::FileOutputHTK output_ssi_all_cutoff(&params);
tomwalters@314 198
tomwalters@314 199 input.AddTarget(&bmm);
tomwalters@314 200 //noise_maker.AddTarget(&bmm);
tomwalters@314 201 bmm.AddTarget(&nap);
tomwalters@314 202 bmm.AddTarget(&smooth_nap);
tomwalters@314 203 smooth_nap.AddTarget(&nap_profile);
tomwalters@314 204 nap_profile.AddTarget(&nap_scaler);
tomwalters@314 205 nap_scaler.AddTarget(&nap_features);
tomwalters@314 206 nap_features.AddTarget(&nap_out);
tomwalters@314 207
tomwalters@314 208 nap.AddTarget(&strobes);
tomwalters@314 209 strobes.AddTarget(&sai);
tomwalters@314 210 sai.AddTarget(&ssi_no_cutoff);
tomwalters@314 211 sai.AddTarget(&ssi_cutoff);
tomwalters@314 212
tomwalters@315 213 ssi_no_cutoff.AddTarget(&slice_ssi_slice_1_no_cutoff);
tomwalters@315 214 ssi_no_cutoff.AddTarget(&slice_ssi_all_no_cutoff);
tomwalters@315 215 ssi_cutoff.AddTarget(&slice_ssi_slice_1_cutoff);
tomwalters@315 216 ssi_cutoff.AddTarget(&slice_ssi_all_cutoff);
tomwalters@314 217
tomwalters@314 218 slice_ssi_slice_1_no_cutoff.AddTarget(&features_ssi_slice1_no_cutoff);
tomwalters@314 219 slice_ssi_all_no_cutoff.AddTarget(&features_ssi_all_no_cutoff);
tomwalters@314 220 slice_ssi_slice_1_cutoff.AddTarget(&features_ssi_slice1_cutoff);
tomwalters@314 221 slice_ssi_all_cutoff.AddTarget(&features_ssi_all_cutoff);
tomwalters@314 222
tomwalters@314 223
tomwalters@314 224 features_ssi_slice1_no_cutoff.AddTarget(&output_ssi_slice1_no_cutoff);
tomwalters@314 225 features_ssi_all_no_cutoff.AddTarget(&output_ssi_all_no_cutoff);
tomwalters@314 226 features_ssi_slice1_cutoff.AddTarget(&output_ssi_slice1_cutoff);
tomwalters@314 227 features_ssi_all_cutoff.AddTarget(&output_ssi_all_cutoff);
tomwalters@314 228
tomwalters@314 229
tomwalters@314 230 if (write_data) {
tomwalters@314 231 ofstream outfile(data_file.c_str());
tomwalters@314 232 if (outfile.fail()) {
tomwalters@314 233 aimc::LOG_ERROR("Couldn't open data file %s for writing",
tomwalters@314 234 data_file.c_str());
tomwalters@314 235 return -1;
tomwalters@314 236 }
tomwalters@314 237 time_t rawtime;
tomwalters@314 238 struct tm * timeinfo;
tomwalters@314 239 time(&rawtime);
tomwalters@314 240 timeinfo = localtime(&rawtime);
tomwalters@314 241
tomwalters@314 242
tomwalters@314 243 outfile << "# AIM-C AIMCopy\n";
tomwalters@314 244 outfile << "# Run on: " << asctime(timeinfo);
tomwalters@314 245 char * descr = getenv("USER");
tomwalters@314 246 if (descr) {
tomwalters@314 247 outfile << "# By user: " << descr <<"\n";
tomwalters@314 248 }
tomwalters@323 249 outfile << "# Module chain:\n";
tomwalters@323 250 outfile << "#";
tomwalters@323 251 input.PrintTargets(outfile);
tomwalters@323 252 outfile << "\n";
tomwalters@323 253 outfile << "#\n";
tomwalters@323 254 input.PrintVersions(outfile);
tomwalters@323 255 outfile << "\n";
tomwalters@314 256 outfile << "#\n";
tomwalters@314 257 outfile << "# Parameters:\n";
tomwalters@314 258 outfile << params.WriteString();
tomwalters@314 259 outfile.close();
tomwalters@314 260 }
tomwalters@314 261
tomwalters@314 262 for (unsigned int i = 0; i < file_list.size(); ++i) {
tomwalters@314 263 // aimc::LOG_INFO(_T("In: %s"), file_list[i].first.c_str());
tomwalters@314 264 aimc::LOG_INFO(_T("Out: %s"), file_list[i].second.c_str());
tomwalters@314 265
tomwalters@359 266 string filename = file_list[i].second + "slice_1_no_cutoff";
tomwalters@314 267 output_ssi_slice1_no_cutoff.OpenFile(filename.c_str(), 10.0f);
tomwalters@359 268 filename = file_list[i].second + "ssi_profile_no_cutoff";
tomwalters@314 269 output_ssi_all_no_cutoff.OpenFile(filename.c_str(), 10.0f);
tomwalters@359 270 filename = file_list[i].second + "slice_1_cutoff";
tomwalters@314 271 output_ssi_slice1_cutoff.OpenFile(filename.c_str(), 10.0f);
tomwalters@359 272 filename = file_list[i].second + "ssi_profile_cutoff";
tomwalters@314 273 output_ssi_all_cutoff.OpenFile(filename.c_str(), 10.0f);
tomwalters@359 274 filename = file_list[i].second + "smooth_nap_profile";
tomwalters@314 275 nap_out.OpenFile(filename.c_str(), 10.0f);
tomwalters@314 276
tomwalters@314 277 if (input.LoadFile(file_list[i].first.c_str())) {
tomwalters@314 278 input.Process();
tomwalters@314 279 } else {
tomwalters@314 280 printf("LoadFile failed for file %s\n", file_list[i].first.c_str());
tomwalters@314 281 }
tomwalters@314 282 input.Reset();
tomwalters@314 283 }
tomwalters@314 284
tomwalters@314 285 return 0;
tomwalters@314 286 }