tomwalters@277
|
1 // Copyright 2006-2010, Thomas Walters
|
tomwalters@277
|
2 //
|
tomwalters@277
|
3 // AIM-C: A C++ implementation of the Auditory Image Model
|
tomwalters@277
|
4 // http://www.acousticscale.org/AIMC
|
tomwalters@277
|
5 //
|
tomwalters@277
|
6 // This program is free software: you can redistribute it and/or modify
|
tomwalters@277
|
7 // it under the terms of the GNU General Public License as published by
|
tomwalters@277
|
8 // the Free Software Foundation, either version 3 of the License, or
|
tomwalters@277
|
9 // (at your option) any later version.
|
tomwalters@277
|
10 //
|
tomwalters@277
|
11 // This program is distributed in the hope that it will be useful,
|
tomwalters@277
|
12 // but WITHOUT ANY WARRANTY; without even the implied warranty of
|
tomwalters@277
|
13 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
tomwalters@277
|
14 // GNU General Public License for more details.
|
tomwalters@277
|
15 //
|
tomwalters@277
|
16 // You should have received a copy of the GNU General Public License
|
tomwalters@277
|
17 // along with this program. If not, see <http://www.gnu.org/licenses/>.
|
tomwalters@277
|
18
|
tomwalters@277
|
19 /*!
|
tomwalters@277
|
20 * \file
|
tomwalters@279
|
21 * \brief File output in the HTK format.
|
tomwalters@277
|
22 *
|
tomwalters@279
|
23 * \author Tom Walters <tom@acousticscale.org>
|
tomwalters@277
|
24 * \author Willem van Engen <cnbh@willem.engen.nl>
|
tomwalters@277
|
25 * \date created 2006/10/30
|
tomwalters@277
|
26 * \version \$Id$
|
tomwalters@277
|
27 */
|
tomwalters@277
|
28
|
tomwalters@277
|
29 #ifdef _WINDOWS
|
tomwalters@280
|
30 # include <direct.h> // for _mkdir&_rmdir
|
tomwalters@277
|
31 #else
|
tomwalters@279
|
32 # include <sys/types.h>
|
tomwalters@280
|
33 # include <dirent.h> // for opendir&friends
|
tomwalters@277
|
34 #endif
|
tomwalters@277
|
35 #include <stdio.h>
|
tomwalters@277
|
36 #include <string.h>
|
tomwalters@277
|
37 #include <cmath>
|
tomwalters@277
|
38
|
tomwalters@277
|
39 #include "Modules/Output/FileOutputHTK.h"
|
tomwalters@277
|
40
|
tomwalters@277
|
41 namespace aimc {
|
tomwalters@277
|
42 FileOutputHTK::FileOutputHTK(Parameters *params) : Module(params) {
|
tomwalters@278
|
43 module_description_ = "File output in HTK format";
|
tomwalters@278
|
44 module_identifier_ = "htk_out";
|
tomwalters@278
|
45 module_type_ = "output";
|
tomwalters@278
|
46 module_version_ = "$Id$";
|
tomwalters@278
|
47
|
tomwalters@279
|
48 file_handle_ = NULL;
|
tomwalters@279
|
49 header_written_ = false;
|
tomwalters@277
|
50 frame_period_ms_ = 0.0f;
|
tomwalters@277
|
51 }
|
tomwalters@277
|
52
|
tomwalters@277
|
53 FileOutputHTK::~FileOutputHTK() {
|
tomwalters@279
|
54 if (file_handle_ != NULL)
|
tomwalters@279
|
55 CloseFile();
|
tomwalters@277
|
56 }
|
tomwalters@277
|
57
|
tomwalters@277
|
58 bool FileOutputHTK::OpenFile(const char* filename, float frame_period_ms) {
|
tomwalters@279
|
59 if (file_handle_ != NULL) {
|
tomwalters@279
|
60 LOG_ERROR(_T("Couldn't open output file. A file is already open."));
|
tomwalters@279
|
61 return false;
|
tomwalters@279
|
62 }
|
tomwalters@277
|
63
|
tomwalters@279
|
64 // Check that the output file exists and is writeable
|
tomwalters@280
|
65 if ((file_handle_ = fopen(filename, "wb")) == NULL) {
|
tomwalters@279
|
66 LOG_ERROR(_T("Couldn't open output file '%s' for writing."), filename);
|
tomwalters@279
|
67 return false;
|
tomwalters@279
|
68 }
|
tomwalters@279
|
69 sample_count_ = 0;
|
tomwalters@277
|
70 frame_period_ms_ = frame_period_ms;
|
tomwalters@277
|
71 header_written_ = false;
|
tomwalters@292
|
72 if (initialized_) {
|
tomwalters@292
|
73 WriteHeader(channel_count_ * buffer_length_, frame_period_ms_);
|
tomwalters@292
|
74 }
|
tomwalters@279
|
75 return true;
|
tomwalters@277
|
76 }
|
tomwalters@277
|
77
|
tomwalters@277
|
78 bool FileOutputHTK::InitializeInternal(const SignalBank &input) {
|
tomwalters@277
|
79 if (file_handle_ == NULL) {
|
tomwalters@277
|
80 LOG_ERROR(_T("Couldn't initialize file output. "
|
tomwalters@277
|
81 "Please call FileOutputHTK::OpenFile first"));
|
tomwalters@279
|
82 return false;
|
tomwalters@277
|
83 }
|
tomwalters@277
|
84 if (header_written_) {
|
tomwalters@292
|
85 LOG_ERROR(_T("A header has already been written on the output file. "
|
tomwalters@277
|
86 "Please call FileOutputHTK::CloseFile to close that file, "
|
tomwalters@277
|
87 "and FileOutputHTK::OpenFile to open an new one before "
|
tomwalters@277
|
88 "calling FileOutputHTK::Initialize again."));
|
tomwalters@279
|
89 return false;
|
tomwalters@277
|
90 }
|
tomwalters@277
|
91 channel_count_ = input.channel_count();
|
tomwalters@277
|
92 buffer_length_ = input.buffer_length();
|
tomwalters@277
|
93 WriteHeader(channel_count_ * buffer_length_, frame_period_ms_);
|
tomwalters@277
|
94 return true;
|
tomwalters@277
|
95 }
|
tomwalters@277
|
96
|
tomwalters@277
|
97 void FileOutputHTK::ResetInternal() {
|
tomwalters@277
|
98 if (file_handle_ != NULL && !header_written_) {
|
tomwalters@277
|
99 WriteHeader(channel_count_ * buffer_length_, frame_period_ms_);
|
tomwalters@277
|
100 }
|
tomwalters@292
|
101 if (file_handle_ != NULL)
|
tomwalters@292
|
102 CloseFile();
|
tomwalters@277
|
103 }
|
tomwalters@277
|
104
|
tomwalters@277
|
105 void FileOutputHTK::WriteHeader(int num_elements, float period_ms) {
|
tomwalters@279
|
106 if (header_written_)
|
tomwalters@279
|
107 return;
|
tomwalters@277
|
108
|
tomwalters@279
|
109 /* HTK format file: (taken from the HTK book - section 5.10.1)
|
tomwalters@279
|
110 * Header: 12 bytes in total, contains:
|
tomwalters@279
|
111 * sample_count - number of samples in file (4-byte integer)(long)
|
tomwalters@279
|
112 * sample_period - sample period in 100ns units (4-byte integer)(long)
|
tomwalters@279
|
113 * sample_size - number of bytes per sample (2-byte integer)(short)
|
tomwalters@279
|
114 * parameter_kind - a code indicating the sample kind (2-byte integer)(short)
|
tomwalters@279
|
115 */
|
tomwalters@277
|
116
|
tomwalters@279
|
117 // To be filled in when the file is done
|
tomwalters@279
|
118 int32_t sample_count = 0;
|
tomwalters@277
|
119
|
tomwalters@277
|
120 int32_t sample_period = floor(1e4 * period_ms);
|
tomwalters@289
|
121 int16_t sample_size = num_elements * sizeof(float); // NOLINT
|
tomwalters@277
|
122
|
tomwalters@277
|
123 // User-defined coefficients with energy term
|
tomwalters@279
|
124 int16_t parameter_kind = H_USER + H_E;
|
tomwalters@277
|
125
|
tomwalters@279
|
126 // Fix endianness
|
tomwalters@279
|
127 sample_count = ByteSwap32(sample_count);
|
tomwalters@279
|
128 sample_period = ByteSwap32(sample_period);
|
tomwalters@279
|
129 sample_size = ByteSwap16(sample_size);
|
tomwalters@279
|
130 parameter_kind = ByteSwap16(parameter_kind);
|
tomwalters@277
|
131
|
tomwalters@277
|
132 // Enter header values. sample_count is a dummy value which is filled in on
|
tomwalters@277
|
133 // file close
|
tomwalters@279
|
134 fwrite(&sample_count, sizeof(sample_count), 1, file_handle_);
|
tomwalters@279
|
135 fwrite(&sample_period, sizeof(sample_period), 1, file_handle_);
|
tomwalters@279
|
136 fwrite(&sample_size, sizeof(sample_size), 1, file_handle_);
|
tomwalters@279
|
137 fwrite(¶meter_kind, sizeof(parameter_kind), 1, file_handle_);
|
tomwalters@279
|
138 fflush(file_handle_);
|
tomwalters@277
|
139
|
tomwalters@279
|
140 header_written_ = true;
|
tomwalters@277
|
141 }
|
tomwalters@277
|
142
|
tomwalters@277
|
143
|
tomwalters@277
|
144 void FileOutputHTK::Process(const SignalBank &input) {
|
tomwalters@277
|
145 if (file_handle_ == NULL) {
|
tomwalters@277
|
146 LOG_ERROR(_T("Couldn't process file output. No file is open."
|
tomwalters@277
|
147 "Please call FileOutputHTK::OpenFile first"));
|
tomwalters@279
|
148 return;
|
tomwalters@277
|
149 }
|
tomwalters@277
|
150
|
tomwalters@277
|
151 if (!header_written_) {
|
tomwalters@292
|
152 LOG_ERROR(_T("No header has been written on the output file yet. Please "
|
tomwalters@277
|
153 "call FileOutputHTK::Initialize() before calling "
|
tomwalters@277
|
154 "FileOutputHTK::Process()"));
|
tomwalters@279
|
155 return;
|
tomwalters@277
|
156 }
|
tomwalters@279
|
157 float s;
|
tomwalters@277
|
158
|
tomwalters@279
|
159 for (int ch = 0; ch < input.channel_count(); ch++) {
|
tomwalters@277
|
160 for (int i = 0; i < input.buffer_length(); i++) {
|
tomwalters@277
|
161 s = input.sample(ch, i);
|
tomwalters@277
|
162 s = ByteSwapFloat(s);
|
tomwalters@280
|
163 fwrite(&s, sizeof(s), 1, file_handle_);
|
tomwalters@277
|
164 }
|
tomwalters@277
|
165 }
|
tomwalters@279
|
166 sample_count_++;
|
tomwalters@277
|
167 }
|
tomwalters@277
|
168
|
tomwalters@277
|
169 bool FileOutputHTK::CloseFile() {
|
tomwalters@279
|
170 if (file_handle_ == NULL)
|
tomwalters@277
|
171 return false;
|
tomwalters@277
|
172
|
tomwalters@279
|
173 // Write the first 4 bytes of the file
|
tomwalters@279
|
174 // with how many samples there are in the file
|
tomwalters@279
|
175 fflush(file_handle_);
|
tomwalters@279
|
176 rewind(file_handle_);
|
tomwalters@279
|
177 fflush(file_handle_);
|
tomwalters@277
|
178 int32_t samples = sample_count_;
|
tomwalters@279
|
179 samples = ByteSwap32(samples);
|
tomwalters@279
|
180 fwrite(&samples, sizeof(samples), 1, file_handle_);
|
tomwalters@277
|
181
|
tomwalters@279
|
182 // And close the file
|
tomwalters@279
|
183 fclose(file_handle_);
|
tomwalters@279
|
184 file_handle_ = NULL;
|
tomwalters@292
|
185 header_written_ = false;
|
tomwalters@279
|
186 return true;
|
tomwalters@277
|
187 }
|
tomwalters@277
|
188
|
tomwalters@277
|
189 float FileOutputHTK::ByteSwapFloat(float d) {
|
tomwalters@277
|
190 // Endianness fix
|
tomwalters@277
|
191 float a;
|
tomwalters@277
|
192 unsigned char *dst = (unsigned char *)&a;
|
tomwalters@277
|
193 unsigned char *src = (unsigned char *)&d;
|
tomwalters@277
|
194
|
tomwalters@277
|
195 dst[0] = src[3];
|
tomwalters@277
|
196 dst[1] = src[2];
|
tomwalters@277
|
197 dst[2] = src[1];
|
tomwalters@277
|
198 dst[3] = src[0];
|
tomwalters@277
|
199
|
tomwalters@277
|
200 return a;
|
tomwalters@277
|
201 }
|
tomwalters@280
|
202 } // namespace aimc
|
tomwalters@277
|
203
|