annotate trunk/src/Modules/Output/FileOutputHTK.cc @ 278:5b8b9ea1218a

- Added a basic main function to test that all the can be fitted together - Fixed an initialisation bug in ModuleFileInput that left the buffer size at zero - Added proper description strings to the input and output modules - Fixed an out-by-a-factor-of-1000 bug in the SAI memory allocation (oops) - Added LOG_INFO_NN fucnction to log without a newline. Useful for the ASCII art module chain in aimc.cc.
author tomwalters
date Thu, 18 Feb 2010 19:35:07 +0000
parents 6b4921704eb1
children f469d936337f
rev   line source
tomwalters@277 1 // Copyright 2006-2010, Thomas Walters
tomwalters@277 2 //
tomwalters@277 3 // AIM-C: A C++ implementation of the Auditory Image Model
tomwalters@277 4 // http://www.acousticscale.org/AIMC
tomwalters@277 5 //
tomwalters@277 6 // This program is free software: you can redistribute it and/or modify
tomwalters@277 7 // it under the terms of the GNU General Public License as published by
tomwalters@277 8 // the Free Software Foundation, either version 3 of the License, or
tomwalters@277 9 // (at your option) any later version.
tomwalters@277 10 //
tomwalters@277 11 // This program is distributed in the hope that it will be useful,
tomwalters@277 12 // but WITHOUT ANY WARRANTY; without even the implied warranty of
tomwalters@277 13 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
tomwalters@277 14 // GNU General Public License for more details.
tomwalters@277 15 //
tomwalters@277 16 // You should have received a copy of the GNU General Public License
tomwalters@277 17 // along with this program. If not, see <http://www.gnu.org/licenses/>.
tomwalters@277 18
tomwalters@277 19 /*!
tomwalters@277 20 * \file
tomwalters@277 21 * \brief File output in the HTK format.
tomwalters@277 22 *
tomwalters@277 23 * \author Tom Walters <tom@acousticscale.org>
tomwalters@277 24 * \author Willem van Engen <cnbh@willem.engen.nl>
tomwalters@277 25 * \date created 2006/10/30
tomwalters@277 26 * \version \$Id$
tomwalters@277 27 */
tomwalters@277 28
tomwalters@277 29 #ifdef _WINDOWS
tomwalters@277 30 # include <direct.h> // for _mkdir&_rmdir
tomwalters@277 31 #else
tomwalters@277 32 # include <sys/types.h>
tomwalters@277 33 # include <dirent.h> // for opendir&friends
tomwalters@277 34 #endif
tomwalters@277 35 #include <stdio.h>
tomwalters@277 36 #include <string.h>
tomwalters@277 37 #include <cmath>
tomwalters@277 38
tomwalters@277 39 #include "Modules/Output/FileOutputHTK.h"
tomwalters@277 40
tomwalters@277 41 namespace aimc {
tomwalters@277 42 FileOutputHTK::FileOutputHTK(Parameters *params) : Module(params) {
tomwalters@278 43 module_description_ = "File output in HTK format";
tomwalters@278 44 module_identifier_ = "htk_out";
tomwalters@278 45 module_type_ = "output";
tomwalters@278 46 module_version_ = "$Id$";
tomwalters@278 47
tomwalters@277 48 file_handle_ = NULL;
tomwalters@277 49 header_written_ = false;
tomwalters@277 50 filename_[0] = '\0';
tomwalters@277 51 frame_period_ms_ = 0.0f;
tomwalters@277 52 }
tomwalters@277 53
tomwalters@277 54 FileOutputHTK::~FileOutputHTK() {
tomwalters@277 55 if (file_handle_ != NULL)
tomwalters@277 56 CloseFile();
tomwalters@277 57 }
tomwalters@277 58
tomwalters@277 59 bool FileOutputHTK::OpenFile(const char* filename, float frame_period_ms) {
tomwalters@277 60 if (file_handle_ != NULL) {
tomwalters@277 61 LOG_ERROR(_T("Couldn't open output file. A file is already open."));
tomwalters@277 62 return false;
tomwalters@277 63 }
tomwalters@277 64
tomwalters@277 65 // Check that the output file exists and is writeable
tomwalters@277 66 if ((file_handle_ = fopen(filename, "wb"))==NULL ) {
tomwalters@277 67 LOG_ERROR(_T("Couldn't open output file '%s' for writing."), filename);
tomwalters@277 68 return false;
tomwalters@277 69 }
tomwalters@277 70 strcpy(filename_, filename);
tomwalters@277 71 sample_count_ = 0;
tomwalters@277 72 frame_period_ms_ = frame_period_ms;
tomwalters@277 73 header_written_ = false;
tomwalters@277 74 return true;
tomwalters@277 75 }
tomwalters@277 76
tomwalters@277 77 bool FileOutputHTK::InitializeInternal(const SignalBank &input) {
tomwalters@277 78 if (file_handle_ == NULL) {
tomwalters@277 79 LOG_ERROR(_T("Couldn't initialize file output. "
tomwalters@277 80 "Please call FileOutputHTK::OpenFile first"));
tomwalters@277 81 return false;
tomwalters@277 82 }
tomwalters@277 83 if (header_written_) {
tomwalters@277 84 LOG_ERROR(_T("A header has already been written on the output file."
tomwalters@277 85 "Please call FileOutputHTK::CloseFile to close that file, "
tomwalters@277 86 "and FileOutputHTK::OpenFile to open an new one before "
tomwalters@277 87 "calling FileOutputHTK::Initialize again."));
tomwalters@277 88 return false;
tomwalters@277 89 }
tomwalters@277 90 channel_count_ = input.channel_count();
tomwalters@277 91 buffer_length_ = input.buffer_length();
tomwalters@277 92 WriteHeader(channel_count_ * buffer_length_, frame_period_ms_);
tomwalters@277 93 return true;
tomwalters@277 94 }
tomwalters@277 95
tomwalters@277 96 void FileOutputHTK::ResetInternal() {
tomwalters@277 97 if (file_handle_ != NULL && !header_written_) {
tomwalters@277 98 WriteHeader(channel_count_ * buffer_length_, frame_period_ms_);
tomwalters@277 99 }
tomwalters@277 100 }
tomwalters@277 101
tomwalters@277 102 void FileOutputHTK::WriteHeader(int num_elements, float period_ms) {
tomwalters@277 103 if (header_written_)
tomwalters@277 104 return;
tomwalters@277 105
tomwalters@277 106 /* HTK format file: (taken from the HTK book - section 5.10.1)
tomwalters@277 107 * Header: 12 bytes in total, contains:
tomwalters@277 108 * sample_count - number of samples in file (4-byte integer)(long)
tomwalters@277 109 * sample_period - sample period in 100ns units (4-byte integer)(long)
tomwalters@277 110 * sample_size - number of bytes per sample (2-byte integer)(short)
tomwalters@277 111 * parameter_kind - a code indicating the sample kind (2-byte integer)(short)
tomwalters@277 112 */
tomwalters@277 113
tomwalters@277 114 // To be filled in when the file is done
tomwalters@277 115 int32_t sample_count = 0;
tomwalters@277 116
tomwalters@277 117 int32_t sample_period = floor(1e4 * period_ms);
tomwalters@277 118 int16_t sample_size = num_elements * sizeof(float);
tomwalters@277 119
tomwalters@277 120 // User-defined coefficients with energy term
tomwalters@277 121 int16_t parameter_kind = H_USER + H_E;
tomwalters@277 122
tomwalters@277 123 // Fix endianness
tomwalters@277 124 sample_count = ByteSwap32(sample_count);
tomwalters@277 125 sample_period = ByteSwap32(sample_period);
tomwalters@277 126 sample_size = ByteSwap16(sample_size);
tomwalters@277 127 parameter_kind = ByteSwap16(parameter_kind);
tomwalters@277 128
tomwalters@277 129 // Enter header values. sample_count is a dummy value which is filled in on
tomwalters@277 130 // file close
tomwalters@277 131 fwrite(&sample_count, sizeof(sample_count), 1, file_handle_);
tomwalters@277 132 fwrite(&sample_period, sizeof(sample_period), 1, file_handle_);
tomwalters@277 133 fwrite(&sample_size, sizeof(sample_size), 1, file_handle_);
tomwalters@277 134 fwrite(&parameter_kind, sizeof(parameter_kind), 1, file_handle_);
tomwalters@277 135 fflush(file_handle_);
tomwalters@277 136
tomwalters@277 137 header_written_ = true;
tomwalters@277 138 }
tomwalters@277 139
tomwalters@277 140
tomwalters@277 141 void FileOutputHTK::Process(const SignalBank &input) {
tomwalters@277 142 if (file_handle_ == NULL) {
tomwalters@277 143 LOG_ERROR(_T("Couldn't process file output. No file is open."
tomwalters@277 144 "Please call FileOutputHTK::OpenFile first"));
tomwalters@277 145 return;
tomwalters@277 146 }
tomwalters@277 147
tomwalters@277 148 if (!header_written_) {
tomwalters@277 149 LOG_ERROR(_T("No header has been written on the output file yet. Please"
tomwalters@277 150 "call FileOutputHTK::Initialize() before calling "
tomwalters@277 151 "FileOutputHTK::Process()"));
tomwalters@277 152 return;
tomwalters@277 153 }
tomwalters@277 154 float s;
tomwalters@277 155
tomwalters@277 156 for (int ch = 0; ch < input.channel_count(); ch++) {
tomwalters@277 157 for (int i = 0; i < input.buffer_length(); i++) {
tomwalters@277 158 s = input.sample(ch, i);
tomwalters@277 159 s = ByteSwapFloat(s);
tomwalters@277 160 fwrite(&s, sizeof(float), 1, file_handle_);
tomwalters@277 161 }
tomwalters@277 162 }
tomwalters@277 163 sample_count_++;
tomwalters@277 164 }
tomwalters@277 165
tomwalters@277 166 bool FileOutputHTK::CloseFile() {
tomwalters@277 167 if (file_handle_ == NULL)
tomwalters@277 168 return false;
tomwalters@277 169
tomwalters@277 170 // Write the first 4 bytes of the file
tomwalters@277 171 // with how many samples there are in the file
tomwalters@277 172 fflush(file_handle_);
tomwalters@277 173 rewind(file_handle_);
tomwalters@277 174 fflush(file_handle_);
tomwalters@277 175 int32_t samples = sample_count_;
tomwalters@277 176 samples = ByteSwap32(samples);
tomwalters@277 177 fwrite(&samples, sizeof(samples), 1, file_handle_);
tomwalters@277 178
tomwalters@277 179 // And close the file
tomwalters@277 180 fclose(file_handle_);
tomwalters@277 181 file_handle_ = NULL;
tomwalters@277 182 return true;
tomwalters@277 183 }
tomwalters@277 184
tomwalters@277 185 float FileOutputHTK::ByteSwapFloat(float d) {
tomwalters@277 186 // Endianness fix
tomwalters@277 187 float a;
tomwalters@277 188 unsigned char *dst = (unsigned char *)&a;
tomwalters@277 189 unsigned char *src = (unsigned char *)&d;
tomwalters@277 190
tomwalters@277 191 dst[0] = src[3];
tomwalters@277 192 dst[1] = src[2];
tomwalters@277 193 dst[2] = src[1];
tomwalters@277 194 dst[3] = src[0];
tomwalters@277 195
tomwalters@277 196 return a;
tomwalters@277 197 }
tomwalters@277 198 } //namespace aimc
tomwalters@277 199