annotate src/Main/AIMCopy_SSI_Features.cc @ 32:9122efd2b227

-New AIMCopy main for the SSI features (temporary hack till I get a working module load system) -LocalMax strobe criterion. This is faster and better than the parabola version, which still seems buggy. -Noise generator module. Adds noise to a signal. Uses boost for the random number generator. -New options for the SSI -Slice now respects all its flags (oops!). -MATLAB functions for visualisation -Scripts for generating data to view in MATLAB -Script to download and build HTK - useful for running experiments
author tomwalters
date Thu, 25 Feb 2010 22:02:00 +0000
parents
children f8fe1aadf097
rev   line source
tomwalters@32 1 // Copyright 2008-2010, Thomas Walters
tomwalters@32 2 //
tomwalters@32 3 // AIM-C: A C++ implementation of the Auditory Image Model
tomwalters@32 4 // http://www.acousticscale.org/AIMC
tomwalters@32 5 //
tomwalters@32 6 // This program is free software: you can redistribute it and/or modify
tomwalters@32 7 // it under the terms of the GNU General Public License as published by
tomwalters@32 8 // the Free Software Foundation, either version 3 of the License, or
tomwalters@32 9 // (at your option) any later version.
tomwalters@32 10 //
tomwalters@32 11 // This program is distributed in the hope that it will be useful,
tomwalters@32 12 // but WITHOUT ANY WARRANTY; without even the implied warranty of
tomwalters@32 13 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
tomwalters@32 14 // GNU General Public License for more details.
tomwalters@32 15 //
tomwalters@32 16 // You should have received a copy of the GNU General Public License
tomwalters@32 17 // along with this program. If not, see <http://www.gnu.org/licenses/>.
tomwalters@32 18
tomwalters@32 19 /*!
tomwalters@32 20 * \file AIMCopy_SSI_Features.cc
tomwalters@32 21 * \brief AIM-C replacement for HTK's HCopy, producing SSI-based features
tomwalters@32 22 *
tomwalters@32 23 * The following subset of the command-line flags
tomwalters@32 24 * should be implemented from HCopy:
tomwalters@32 25 * -A Print command line arguments off
tomwalters@32 26 * -C cf Set config file to cf default
tomwalters@32 27 * (should be able to take multiple config files)
tomwalters@32 28 * -S f Set script file to f none
tomwalters@32 29 * //! \todo -T N Set trace flags to N 0
tomwalters@32 30 * -V Print version information off
tomwalters@32 31 * -D of Write configuration data to of none
tomwalters@32 32 *
tomwalters@32 33 * \author Thomas Walters <tom@acousticscale.org>
tomwalters@32 34 * \date created 2008/05/08
tomwalters@32 35 * \version \$Id$
tomwalters@32 36 */
tomwalters@32 37
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>

#include <fstream>
#include <iostream>
#include <string>
#include <utility>
#include <vector>
tomwalters@32 46
tomwalters@32 47 #include "Modules/Input/ModuleFileInput.h"
tomwalters@32 48 #include "Modules/BMM/ModuleGammatone.h"
tomwalters@32 49 #include "Modules/BMM/ModulePZFC.h"
tomwalters@32 50 #include "Modules/NAP/ModuleHCL.h"
tomwalters@32 51 #include "Modules/Strobes/ModuleParabola.h"
tomwalters@32 52 #include "Modules/SAI/ModuleSAI.h"
tomwalters@32 53 #include "Modules/SSI/ModuleSSI.h"
tomwalters@32 54 #include "Modules/SNR/ModuleNoise.h"
tomwalters@32 55 #include "Modules/Profile/ModuleSlice.h"
tomwalters@32 56 #include "Modules/Profile/ModuleScaler.h"
tomwalters@32 57 #include "Modules/Features/ModuleGaussians.h"
tomwalters@32 58 #include "Modules/Output/FileOutputHTK.h"
tomwalters@32 59 #include "Support/Common.h"
tomwalters@32 60 #include "Support/FileList.h"
tomwalters@32 61 #include "Support/Parameters.h"
tomwalters@32 62
tomwalters@32 63 using std::ofstream;
tomwalters@32 64 using std::pair;
tomwalters@32 65 using std::vector;
tomwalters@32 66 using std::string;
tomwalters@32 67 int main(int argc, char* argv[]) {
tomwalters@32 68 string sound_file;
tomwalters@32 69 string data_file;
tomwalters@32 70 string config_file;
tomwalters@32 71 string script_file;
tomwalters@32 72 bool write_data = false;
tomwalters@32 73 bool print_version = false;
tomwalters@32 74
tomwalters@32 75 string version_string(
tomwalters@32 76 " AIM-C AIMCopy\n"
tomwalters@32 77 " (c) 2006-2010, Thomas Walters and Willem van Engen\n"
tomwalters@32 78 " http://www.acoustiscale.org/AIMC/\n"
tomwalters@32 79 "\n");
tomwalters@32 80
tomwalters@32 81 if (argc < 2) {
tomwalters@32 82 printf("%s", version_string.c_str());
tomwalters@32 83 printf("AIMCopy is intended as a drop-in replacement for HTK's HCopy\n");
tomwalters@32 84 printf("command. It is used for making features from audio files for\n");
tomwalters@32 85 printf("use with HTK.\n");
tomwalters@32 86 printf("Usage: \n");
tomwalters@32 87 printf(" -A Print command line arguments off\n");
tomwalters@32 88 printf(" -C cf Set config file to cf none\n");
tomwalters@32 89 printf(" -S f Set script file to f none\n");
tomwalters@32 90 printf(" -V Print version information off\n");
tomwalters@32 91 printf(" -D g Write configuration data to g none\n");
tomwalters@32 92 return -1;
tomwalters@32 93 }
tomwalters@32 94
tomwalters@32 95 // Parse command-line arguments
tomwalters@32 96 for (int i = 1; i < argc; i++) {
tomwalters@32 97 if (strcmp(argv[i],"-A") == 0) {
tomwalters@32 98 for (int j = 0; j < argc; j++)
tomwalters@32 99 printf("%s ",argv[j]);
tomwalters@32 100 printf("\n");
tomwalters@32 101 fflush(stdout);
tomwalters@32 102 continue;
tomwalters@32 103 }
tomwalters@32 104 if (strcmp(argv[i],"-C") == 0) {
tomwalters@32 105 if (++i >= argc) {
tomwalters@32 106 aimc::LOG_ERROR(_T("Configuration file name expected after -C"));
tomwalters@32 107 return(-1);
tomwalters@32 108 }
tomwalters@32 109 config_file = argv[i];
tomwalters@32 110 continue;
tomwalters@32 111 }
tomwalters@32 112 if (strcmp(argv[i],"-S") == 0) {
tomwalters@32 113 if (++i >= argc) {
tomwalters@32 114 aimc::LOG_ERROR(_T("Script file name expected after -S"));
tomwalters@32 115 return(-1);
tomwalters@32 116 }
tomwalters@32 117 script_file = argv[i];
tomwalters@32 118 continue;
tomwalters@32 119 }
tomwalters@32 120 if (strcmp(argv[i],"-D") == 0) {
tomwalters@32 121 if (++i >= argc) {
tomwalters@32 122 aimc::LOG_ERROR(_T("Data file name expected after -D"));
tomwalters@32 123 return(-1);
tomwalters@32 124 }
tomwalters@32 125 data_file = argv[i];
tomwalters@32 126 write_data = true;
tomwalters@32 127 continue;
tomwalters@32 128 }
tomwalters@32 129 if (strcmp(argv[i],"-V") == 0) {
tomwalters@32 130 print_version = true;
tomwalters@32 131 continue;
tomwalters@32 132 }
tomwalters@32 133 aimc::LOG_ERROR(_T("Unrecognized command-line argument: %s"), argv[i]);
tomwalters@32 134 }
tomwalters@32 135
tomwalters@32 136 if (print_version)
tomwalters@32 137 printf("%s", version_string.c_str());
tomwalters@32 138
tomwalters@32 139 aimc::Parameters params;
tomwalters@32 140
tomwalters@32 141 if (!params.Load(config_file.c_str())) {
tomwalters@32 142 aimc::LOG_ERROR(_T("Couldn't load parameters from file %s"),
tomwalters@32 143 config_file.c_str());
tomwalters@32 144 return -1;
tomwalters@32 145 }
tomwalters@32 146
tomwalters@32 147 vector<pair<string, string> > file_list = aimc::FileList::Load(script_file);
tomwalters@32 148 if (file_list.size() == 0) {
tomwalters@32 149 aimc::LOG_ERROR("No data read from file %s", script_file.c_str());
tomwalters@32 150 return -1;
tomwalters@32 151 }
tomwalters@32 152
tomwalters@32 153 // Set up AIM-C processor here
tomwalters@32 154 aimc::ModuleFileInput input(&params);
tomwalters@32 155 //aimc::ModuleNoise noise_maker(&params);
tomwalters@32 156 aimc::ModuleGammatone bmm(&params);
tomwalters@32 157 aimc::ModuleHCL nap(&params);
tomwalters@32 158 aimc::ModuleParabola strobes(&params);
tomwalters@32 159 aimc::ModuleSAI sai(&params);
tomwalters@32 160 aimc::ModuleSSI ssi(&params);
tomwalters@32 161
tomwalters@32 162 params.SetBool("slice.all", false);
tomwalters@32 163 params.SetInt("slice.lower_index", 40);
tomwalters@32 164 params.SetInt("slice.upper_index", 56);
tomwalters@32 165 aimc::ModuleSlice slice_1(&params);
tomwalters@32 166
tomwalters@32 167 params.SetInt("slice.lower_index", 88);
tomwalters@32 168 params.SetInt("slice.upper_index", 104);
tomwalters@32 169 aimc::ModuleSlice slice_2(&params);
tomwalters@32 170
tomwalters@32 171 params.SetInt("slice.lower_index", 184);
tomwalters@32 172 params.SetInt("slice.upper_index", 200);
tomwalters@32 173 aimc::ModuleSlice slice_3(&params);
tomwalters@32 174
tomwalters@32 175 params.SetInt("slice.lower_index", 376);
tomwalters@32 176 params.SetInt("slice.upper_index", 392);
tomwalters@32 177 aimc::ModuleSlice slice_4(&params);
tomwalters@32 178
tomwalters@32 179 params.SetBool("slice.all", true);
tomwalters@32 180 aimc::ModuleSlice slice_5(&params);
tomwalters@32 181
tomwalters@32 182 aimc::ModuleGaussians features_1(&params);
tomwalters@32 183 aimc::ModuleGaussians features_2(&params);
tomwalters@32 184 aimc::ModuleGaussians features_3(&params);
tomwalters@32 185 aimc::ModuleGaussians features_4(&params);
tomwalters@32 186 aimc::ModuleGaussians features_5(&params);
tomwalters@32 187
tomwalters@32 188 aimc::FileOutputHTK output_1(&params);
tomwalters@32 189 aimc::FileOutputHTK output_2(&params);
tomwalters@32 190 aimc::FileOutputHTK output_3(&params);
tomwalters@32 191 aimc::FileOutputHTK output_4(&params);
tomwalters@32 192 aimc::FileOutputHTK output_5(&params);
tomwalters@32 193
tomwalters@32 194 input.AddTarget(&bmm);
tomwalters@32 195 // No noise for now
tomwalters@32 196 //noise_maker.AddTarget(&bmm);
tomwalters@32 197 bmm.AddTarget(&nap);
tomwalters@32 198 nap.AddTarget(&strobes);
tomwalters@32 199 strobes.AddTarget(&sai);
tomwalters@32 200 sai.AddTarget(&ssi);
tomwalters@32 201
tomwalters@32 202 ssi.AddTarget(&slice_1);
tomwalters@32 203 ssi.AddTarget(&slice_2);
tomwalters@32 204 ssi.AddTarget(&slice_3);
tomwalters@32 205 ssi.AddTarget(&slice_4);
tomwalters@32 206 ssi.AddTarget(&slice_5);
tomwalters@32 207
tomwalters@32 208 slice_1.AddTarget(&features_1);
tomwalters@32 209 slice_2.AddTarget(&features_2);
tomwalters@32 210 slice_3.AddTarget(&features_3);
tomwalters@32 211 slice_4.AddTarget(&features_4);
tomwalters@32 212 slice_5.AddTarget(&features_5);
tomwalters@32 213
tomwalters@32 214 features_1.AddTarget(&output_1);
tomwalters@32 215 features_2.AddTarget(&output_2);
tomwalters@32 216 features_3.AddTarget(&output_3);
tomwalters@32 217 features_4.AddTarget(&output_4);
tomwalters@32 218 features_5.AddTarget(&output_5);
tomwalters@32 219
tomwalters@32 220 if (write_data) {
tomwalters@32 221 ofstream outfile(data_file.c_str());
tomwalters@32 222 if (outfile.fail()) {
tomwalters@32 223 aimc::LOG_ERROR("Couldn't open data file %s for writing",
tomwalters@32 224 data_file.c_str());
tomwalters@32 225 return -1;
tomwalters@32 226 }
tomwalters@32 227 time_t rawtime;
tomwalters@32 228 struct tm * timeinfo;
tomwalters@32 229 time(&rawtime);
tomwalters@32 230 timeinfo = localtime(&rawtime);
tomwalters@32 231
tomwalters@32 232
tomwalters@32 233 outfile << "# AIM-C AIMCopy\n";
tomwalters@32 234 outfile << "# Run on: " << asctime(timeinfo);
tomwalters@32 235 char * descr = getenv("USER");
tomwalters@32 236 if (descr) {
tomwalters@32 237 outfile << "# By user: " << descr <<"\n";
tomwalters@32 238 }
tomwalters@32 239 outfile << "# Module chain: ";
tomwalters@32 240 outfile << "# gt";
tomwalters@32 241 outfile << "# parabola";
tomwalters@32 242 outfile << "# sai_weighted";
tomwalters@32 243 outfile << "# ssi";
tomwalters@32 244 outfile << "# slice";
tomwalters@32 245 outfile << "# features";
tomwalters@32 246 outfile << "# output";
tomwalters@32 247 outfile << "# slice";
tomwalters@32 248 outfile << "# features";
tomwalters@32 249 outfile << "# output";
tomwalters@32 250 outfile << "# slice";
tomwalters@32 251 outfile << "# features";
tomwalters@32 252 outfile << "# output";
tomwalters@32 253 outfile << "# slice";
tomwalters@32 254 outfile << "# features";
tomwalters@32 255 outfile << "# output";
tomwalters@32 256 outfile << "# slice";
tomwalters@32 257 outfile << "# features";
tomwalters@32 258 outfile << "# output";
tomwalters@32 259 outfile << "# ";
tomwalters@32 260 outfile << "# Module versions:\n";
tomwalters@32 261 outfile << "# " << input.id() << " : " << input.version() << "\n";
tomwalters@32 262 outfile << "# " << bmm.id() << " : " << bmm.version() << "\n";
tomwalters@32 263 outfile << "# " << nap.id() << " : " << nap.version() << "\n";
tomwalters@32 264 outfile << "# " << strobes.id() << " : " << strobes.version() << "\n";
tomwalters@32 265 outfile << "# " << sai.id() << " : " << sai.version() << "\n";
tomwalters@32 266 outfile << "# " << slice_1.id() << " : " << slice_1.version() << "\n";
tomwalters@32 267 // outfile << "# " << profile.id() << " : " << profile.version() << "\n";
tomwalters@32 268 // outfile << "# " << scaler.id() << " : " << scaler.version() << "\n";
tomwalters@32 269 outfile << "# " << features_1.id() << " : " << features_1.version() << "\n";
tomwalters@32 270 outfile << "# " << output_1.id() << " : " << output_1.version() << "\n";
tomwalters@32 271 outfile << "#\n";
tomwalters@32 272 outfile << "# Parameters:\n";
tomwalters@32 273 outfile << params.WriteString();
tomwalters@32 274 outfile.close();
tomwalters@32 275 }
tomwalters@32 276
tomwalters@32 277 for (unsigned int i = 0; i < file_list.size(); ++i) {
tomwalters@32 278 aimc::LOG_INFO(_T("In: %s"), file_list[i].first.c_str());
tomwalters@32 279 aimc::LOG_INFO(_T("Out: %s"), file_list[i].second.c_str());
tomwalters@32 280
tomwalters@32 281 string filename = file_list[i].second + "_1";
tomwalters@32 282 output_1.OpenFile(filename.c_str(), 10.0f);
tomwalters@32 283 filename = file_list[i].second + "_2";
tomwalters@32 284 output_2.OpenFile(filename.c_str(), 10.0f);
tomwalters@32 285 filename = file_list[i].second + "_3";
tomwalters@32 286 output_3.OpenFile(filename.c_str(), 10.0f);
tomwalters@32 287 filename = file_list[i].second + "_4";
tomwalters@32 288 output_4.OpenFile(filename.c_str(), 10.0f);
tomwalters@32 289 filename = file_list[i].second + "_5";
tomwalters@32 290 output_5.OpenFile(filename.c_str(), 10.0f);
tomwalters@32 291
tomwalters@32 292 if (input.LoadFile(file_list[i].first.c_str())) {
tomwalters@32 293 input.Process();
tomwalters@32 294 } else {
tomwalters@32 295 printf("LoadFile failed for file %s\n", file_list[i].first.c_str());
tomwalters@32 296 }
tomwalters@32 297 input.Reset();
tomwalters@32 298 }
tomwalters@32 299
tomwalters@32 300 return 0;
tomwalters@32 301 }