// Copyright 2008-2010, Thomas Walters
//
// AIM-C: A C++ implementation of the Auditory Image Model
// http://www.acousticscale.org/AIMC
//
// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program. If not, see <http://www.gnu.org/licenses/>.

/*!
 * \file AIMCopy.cpp
 * \brief AIM-C replacement for HTK's HCopy
 *
 * The following subset of the command-line flags
 * should be implemented from HCopy:
 *  -A      Print command line arguments         off
 *  -C cf   Set config file to cf                default
 *          (should be able to take multiple config files)
 *  -S f    Set script file to f                 none
 *  //! \todo -T N    Set trace flags to N       0
 *  -V      Print version information            off
 *  -D of   Write configuration data to of       none
 *
 * \author Thomas Walters <tom@acousticscale.org>
 * \date created 2008/05/08
 * \version \$Id$
 */

#include <fstream>
#include <iostream>
#include <string>
#include <utility>
#include <vector>

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>

#include "Modules/Input/ModuleFileInput.h"
#include "Modules/BMM/ModuleGammatone.h"
#include "Modules/BMM/ModulePZFC.h"
#include "Modules/NAP/ModuleHCL.h"
#include "Modules/Strobes/ModuleParabola.h"
#include "Modules/Strobes/ModuleLocalMax.h"
#include "Modules/SAI/ModuleSAI.h"
#include "Modules/SSI/ModuleSSI.h"
#include "Modules/SNR/ModuleNoise.h"
#include "Modules/Profile/ModuleSlice.h"
#include "Modules/Profile/ModuleScaler.h"
#include "Modules/Features/ModuleGaussians.h"
#include "Modules/Output/FileOutputHTK.h"
#include "Support/Common.h"
#include "Support/FileList.h"
#include "Support/Parameters.h"

using std::ofstream;
using std::pair;
using std::vector;
using std::string;
68 int main(int argc, char* argv[]) {
|
tomwalters@314
|
69 string sound_file;
|
tomwalters@314
|
70 string data_file;
|
tomwalters@314
|
71 string config_file;
|
tomwalters@314
|
72 string script_file;
|
tomwalters@314
|
73 bool write_data = false;
|
tomwalters@314
|
74 bool print_version = false;
|
tomwalters@314
|
75
|
tomwalters@314
|
76 string version_string(
|
tomwalters@314
|
77 " AIM-C AIMCopy\n"
|
tomwalters@314
|
78 " (c) 2006-2010, Thomas Walters and Willem van Engen\n"
|
tomwalters@314
|
79 " http://www.acoustiscale.org/AIMC/\n"
|
tomwalters@314
|
80 "\n");
|
tomwalters@314
|
81
|
tomwalters@314
|
82 if (argc < 2) {
|
tomwalters@314
|
83 printf("%s", version_string.c_str());
|
tomwalters@314
|
84 printf("AIMCopy is intended as a drop-in replacement for HTK's HCopy\n");
|
tomwalters@314
|
85 printf("command. It is used for making features from audio files for\n");
|
tomwalters@314
|
86 printf("use with HTK.\n");
|
tomwalters@314
|
87 printf("Usage: \n");
|
tomwalters@314
|
88 printf(" -A Print command line arguments off\n");
|
tomwalters@314
|
89 printf(" -C cf Set config file to cf none\n");
|
tomwalters@314
|
90 printf(" -S f Set script file to f none\n");
|
tomwalters@314
|
91 printf(" -V Print version information off\n");
|
tomwalters@314
|
92 printf(" -D g Write configuration data to g none\n");
|
tomwalters@314
|
93 return -1;
|
tomwalters@314
|
94 }
|
tomwalters@314
|
95
|
tomwalters@314
|
96 // Parse command-line arguments
|
tomwalters@314
|
97 for (int i = 1; i < argc; i++) {
|
tomwalters@314
|
98 if (strcmp(argv[i],"-A") == 0) {
|
tomwalters@314
|
99 for (int j = 0; j < argc; j++)
|
tomwalters@314
|
100 printf("%s ",argv[j]);
|
tomwalters@314
|
101 printf("\n");
|
tomwalters@314
|
102 fflush(stdout);
|
tomwalters@314
|
103 continue;
|
tomwalters@314
|
104 }
|
tomwalters@314
|
105 if (strcmp(argv[i],"-C") == 0) {
|
tomwalters@314
|
106 if (++i >= argc) {
|
tomwalters@314
|
107 aimc::LOG_ERROR(_T("Configuration file name expected after -C"));
|
tomwalters@314
|
108 return(-1);
|
tomwalters@314
|
109 }
|
tomwalters@314
|
110 config_file = argv[i];
|
tomwalters@314
|
111 continue;
|
tomwalters@314
|
112 }
|
tomwalters@314
|
113 if (strcmp(argv[i],"-S") == 0) {
|
tomwalters@314
|
114 if (++i >= argc) {
|
tomwalters@314
|
115 aimc::LOG_ERROR(_T("Script file name expected after -S"));
|
tomwalters@314
|
116 return(-1);
|
tomwalters@314
|
117 }
|
tomwalters@314
|
118 script_file = argv[i];
|
tomwalters@314
|
119 continue;
|
tomwalters@314
|
120 }
|
tomwalters@314
|
121 if (strcmp(argv[i],"-D") == 0) {
|
tomwalters@314
|
122 if (++i >= argc) {
|
tomwalters@314
|
123 aimc::LOG_ERROR(_T("Data file name expected after -D"));
|
tomwalters@314
|
124 return(-1);
|
tomwalters@314
|
125 }
|
tomwalters@314
|
126 data_file = argv[i];
|
tomwalters@314
|
127 write_data = true;
|
tomwalters@314
|
128 continue;
|
tomwalters@314
|
129 }
|
tomwalters@314
|
130 if (strcmp(argv[i],"-V") == 0) {
|
tomwalters@314
|
131 print_version = true;
|
tomwalters@314
|
132 continue;
|
tomwalters@314
|
133 }
|
tomwalters@314
|
134 aimc::LOG_ERROR(_T("Unrecognized command-line argument: %s"), argv[i]);
|
tomwalters@314
|
135 }
|
tomwalters@314
|
136
|
tomwalters@314
|
137 if (print_version)
|
tomwalters@314
|
138 printf("%s", version_string.c_str());
|
tomwalters@314
|
139
|
tomwalters@314
|
140 aimc::Parameters params;
|
tomwalters@314
|
141
|
tomwalters@314
|
142 if (!params.Load(config_file.c_str())) {
|
tomwalters@314
|
143 aimc::LOG_ERROR(_T("Couldn't load parameters from file %s"),
|
tomwalters@314
|
144 config_file.c_str());
|
tomwalters@314
|
145 return -1;
|
tomwalters@314
|
146 }
|
tomwalters@314
|
147
|
tomwalters@314
|
148 vector<pair<string, string> > file_list = aimc::FileList::Load(script_file);
|
tomwalters@314
|
149 if (file_list.size() == 0) {
|
tomwalters@314
|
150 aimc::LOG_ERROR("No data read from file %s", script_file.c_str());
|
tomwalters@314
|
151 return -1;
|
tomwalters@314
|
152 }
|
tomwalters@314
|
153
|
tomwalters@314
|
154 // Set up AIM-C processor here
|
tomwalters@314
|
155 aimc::ModuleFileInput input(¶ms);
|
tomwalters@314
|
156 //aimc::ModuleNoise noise_maker(¶ms);
|
tomwalters@314
|
157 aimc::ModuleGammatone bmm(¶ms);
|
tomwalters@314
|
158 aimc::ModuleHCL nap(¶ms);
|
tomwalters@314
|
159 aimc::ModuleLocalMax strobes(¶ms);
|
tomwalters@314
|
160 aimc::ModuleSAI sai(¶ms);
|
tomwalters@314
|
161 params.SetBool("ssi.pitch_cutoff", false);
|
tomwalters@314
|
162 aimc::ModuleSSI ssi_no_cutoff(¶ms);
|
tomwalters@314
|
163
|
tomwalters@314
|
164 params.SetBool("ssi.pitch_cutoff", true);
|
tomwalters@314
|
165 params.SetFloat("ssi.pitch_search_start_ms", 4.6f);
|
tomwalters@314
|
166 aimc::ModuleSSI ssi_cutoff(¶ms);
|
tomwalters@314
|
167
|
tomwalters@314
|
168 params.SetBool("slice.all", false);
|
tomwalters@314
|
169 params.SetInt("slice.lower_index", 77);
|
tomwalters@314
|
170 params.SetInt("slice.upper_index", 150);
|
tomwalters@314
|
171 aimc::ModuleSlice slice_ssi_slice_1_no_cutoff(¶ms);
|
tomwalters@314
|
172 aimc::ModuleSlice slice_ssi_slice_1_cutoff(¶ms);
|
tomwalters@314
|
173
|
tomwalters@314
|
174 params.SetBool("slice.all", true);
|
tomwalters@314
|
175 aimc::ModuleSlice slice_ssi_all_no_cutoff(¶ms);
|
tomwalters@314
|
176 aimc::ModuleSlice slice_ssi_all_cutoff(¶ms);
|
tomwalters@314
|
177
|
tomwalters@314
|
178 params.SetFloat("nap.lowpass_cutoff", 100.0);
|
tomwalters@314
|
179 aimc::ModuleHCL smooth_nap(¶ms);
|
tomwalters@314
|
180 params.SetBool("slice.all", true);
|
tomwalters@314
|
181 aimc::ModuleSlice nap_profile(¶ms);
|
tomwalters@314
|
182 aimc::ModuleScaler nap_scaler(¶ms);
|
tomwalters@314
|
183
|
tomwalters@314
|
184 aimc::ModuleGaussians nap_features(¶ms);
|
tomwalters@314
|
185 aimc::ModuleGaussians features_ssi_slice1_no_cutoff(¶ms);
|
tomwalters@314
|
186 aimc::ModuleGaussians features_ssi_slice1_cutoff(¶ms);
|
tomwalters@314
|
187 aimc::ModuleGaussians features_ssi_all_no_cutoff(¶ms);
|
tomwalters@314
|
188 aimc::ModuleGaussians features_ssi_all_cutoff(¶ms);
|
tomwalters@314
|
189
|
tomwalters@314
|
190 aimc::FileOutputHTK nap_out(¶ms);
|
tomwalters@314
|
191 aimc::FileOutputHTK output_ssi_slice1_no_cutoff(¶ms);
|
tomwalters@314
|
192 aimc::FileOutputHTK output_ssi_slice1_cutoff(¶ms);
|
tomwalters@314
|
193 aimc::FileOutputHTK output_ssi_all_no_cutoff(¶ms);
|
tomwalters@314
|
194 aimc::FileOutputHTK output_ssi_all_cutoff(¶ms);
|
tomwalters@314
|
195
|
tomwalters@314
|
196 input.AddTarget(&bmm);
|
tomwalters@314
|
197 //noise_maker.AddTarget(&bmm);
|
tomwalters@314
|
198 bmm.AddTarget(&nap);
|
tomwalters@314
|
199 bmm.AddTarget(&smooth_nap);
|
tomwalters@314
|
200 smooth_nap.AddTarget(&nap_profile);
|
tomwalters@314
|
201 nap_profile.AddTarget(&nap_scaler);
|
tomwalters@314
|
202 nap_scaler.AddTarget(&nap_features);
|
tomwalters@314
|
203 nap_features.AddTarget(&nap_out);
|
tomwalters@314
|
204
|
tomwalters@314
|
205 nap.AddTarget(&strobes);
|
tomwalters@314
|
206 strobes.AddTarget(&sai);
|
tomwalters@314
|
207 sai.AddTarget(&ssi_no_cutoff);
|
tomwalters@314
|
208 sai.AddTarget(&ssi_cutoff);
|
tomwalters@314
|
209
|
tomwalters@315
|
210 ssi_no_cutoff.AddTarget(&slice_ssi_slice_1_no_cutoff);
|
tomwalters@315
|
211 ssi_no_cutoff.AddTarget(&slice_ssi_all_no_cutoff);
|
tomwalters@315
|
212 ssi_cutoff.AddTarget(&slice_ssi_slice_1_cutoff);
|
tomwalters@315
|
213 ssi_cutoff.AddTarget(&slice_ssi_all_cutoff);
|
tomwalters@314
|
214
|
tomwalters@314
|
215 slice_ssi_slice_1_no_cutoff.AddTarget(&features_ssi_slice1_no_cutoff);
|
tomwalters@314
|
216 slice_ssi_all_no_cutoff.AddTarget(&features_ssi_all_no_cutoff);
|
tomwalters@314
|
217 slice_ssi_slice_1_cutoff.AddTarget(&features_ssi_slice1_cutoff);
|
tomwalters@314
|
218 slice_ssi_all_cutoff.AddTarget(&features_ssi_all_cutoff);
|
tomwalters@314
|
219
|
tomwalters@314
|
220
|
tomwalters@314
|
221 features_ssi_slice1_no_cutoff.AddTarget(&output_ssi_slice1_no_cutoff);
|
tomwalters@314
|
222 features_ssi_all_no_cutoff.AddTarget(&output_ssi_all_no_cutoff);
|
tomwalters@314
|
223 features_ssi_slice1_cutoff.AddTarget(&output_ssi_slice1_cutoff);
|
tomwalters@314
|
224 features_ssi_all_cutoff.AddTarget(&output_ssi_all_cutoff);
|
tomwalters@314
|
225
|
tomwalters@314
|
226
|
tomwalters@314
|
227 if (write_data) {
|
tomwalters@314
|
228 ofstream outfile(data_file.c_str());
|
tomwalters@314
|
229 if (outfile.fail()) {
|
tomwalters@314
|
230 aimc::LOG_ERROR("Couldn't open data file %s for writing",
|
tomwalters@314
|
231 data_file.c_str());
|
tomwalters@314
|
232 return -1;
|
tomwalters@314
|
233 }
|
tomwalters@314
|
234 time_t rawtime;
|
tomwalters@314
|
235 struct tm * timeinfo;
|
tomwalters@314
|
236 time(&rawtime);
|
tomwalters@314
|
237 timeinfo = localtime(&rawtime);
|
tomwalters@314
|
238
|
tomwalters@314
|
239
|
tomwalters@314
|
240 outfile << "# AIM-C AIMCopy\n";
|
tomwalters@314
|
241 outfile << "# Run on: " << asctime(timeinfo);
|
tomwalters@314
|
242 char * descr = getenv("USER");
|
tomwalters@314
|
243 if (descr) {
|
tomwalters@314
|
244 outfile << "# By user: " << descr <<"\n";
|
tomwalters@314
|
245 }
|
tomwalters@314
|
246 outfile << "#Module chain: ";
|
tomwalters@314
|
247 outfile << "#input";
|
tomwalters@314
|
248 outfile << "# noise_maker";
|
tomwalters@314
|
249 outfile << "# gt";
|
tomwalters@314
|
250 outfile << "# nap";
|
tomwalters@314
|
251 outfile << "# slice";
|
tomwalters@314
|
252 outfile << "# scaler";
|
tomwalters@314
|
253 outfile << "# features";
|
tomwalters@314
|
254 outfile << "# output";
|
tomwalters@314
|
255 outfile << "# local_max";
|
tomwalters@314
|
256 outfile << "# sai_weighted";
|
tomwalters@314
|
257 outfile << "# ssi";
|
tomwalters@314
|
258 outfile << "# slice";
|
tomwalters@314
|
259 outfile << "# features";
|
tomwalters@314
|
260 outfile << "# output";
|
tomwalters@314
|
261 outfile << "# slice";
|
tomwalters@314
|
262 outfile << "# features";
|
tomwalters@314
|
263 outfile << "# output";
|
tomwalters@314
|
264 outfile << "# slice";
|
tomwalters@314
|
265 outfile << "# features";
|
tomwalters@314
|
266 outfile << "# output";
|
tomwalters@314
|
267 outfile << "# slice";
|
tomwalters@314
|
268 outfile << "# features";
|
tomwalters@314
|
269 outfile << "# output";
|
tomwalters@314
|
270 outfile << "# slice";
|
tomwalters@314
|
271 outfile << "# features";
|
tomwalters@314
|
272 outfile << "# output";
|
tomwalters@314
|
273 outfile << "# ";
|
tomwalters@314
|
274 outfile << "# Module versions:\n";
|
tomwalters@314
|
275 outfile << "# " << input.id() << " : " << input.version() << "\n";
|
tomwalters@314
|
276 outfile << "# " << bmm.id() << " : " << bmm.version() << "\n";
|
tomwalters@314
|
277 outfile << "# " << nap.id() << " : " << nap.version() << "\n";
|
tomwalters@314
|
278 outfile << "# " << strobes.id() << " : " << strobes.version() << "\n";
|
tomwalters@314
|
279 outfile << "# " << sai.id() << " : " << sai.version() << "\n";
|
tomwalters@314
|
280 outfile << "#\n";
|
tomwalters@314
|
281 outfile << "# Parameters:\n";
|
tomwalters@314
|
282 outfile << params.WriteString();
|
tomwalters@314
|
283 outfile.close();
|
tomwalters@314
|
284 }
|
tomwalters@314
|
285
|
tomwalters@314
|
286 for (unsigned int i = 0; i < file_list.size(); ++i) {
|
tomwalters@314
|
287 // aimc::LOG_INFO(_T("In: %s"), file_list[i].first.c_str());
|
tomwalters@314
|
288 aimc::LOG_INFO(_T("Out: %s"), file_list[i].second.c_str());
|
tomwalters@314
|
289
|
tomwalters@314
|
290 string filename = file_list[i].second + ".slice_1_no_cutoff";
|
tomwalters@314
|
291 output_ssi_slice1_no_cutoff.OpenFile(filename.c_str(), 10.0f);
|
tomwalters@314
|
292 filename = file_list[i].second + ".ssi_profile_no_cutoff";
|
tomwalters@314
|
293 output_ssi_all_no_cutoff.OpenFile(filename.c_str(), 10.0f);
|
tomwalters@314
|
294 filename = file_list[i].second + ".slice_1_cutoff";
|
tomwalters@314
|
295 output_ssi_slice1_cutoff.OpenFile(filename.c_str(), 10.0f);
|
tomwalters@314
|
296 filename = file_list[i].second + ".ssi_profile_cutoff";
|
tomwalters@314
|
297 output_ssi_all_cutoff.OpenFile(filename.c_str(), 10.0f);
|
tomwalters@314
|
298 filename = file_list[i].second + ".smooth_nap_profile";
|
tomwalters@314
|
299 nap_out.OpenFile(filename.c_str(), 10.0f);
|
tomwalters@314
|
300
|
tomwalters@314
|
301 if (input.LoadFile(file_list[i].first.c_str())) {
|
tomwalters@314
|
302 input.Process();
|
tomwalters@314
|
303 } else {
|
tomwalters@314
|
304 printf("LoadFile failed for file %s\n", file_list[i].first.c_str());
|
tomwalters@314
|
305 }
|
tomwalters@314
|
306 input.Reset();
|
tomwalters@314
|
307 }
|
tomwalters@314
|
308
|
tomwalters@314
|
309 return 0;
|
tomwalters@314
|
310 }
|