annotate trunk/src/Modules/Output/FileOutputHTK.cc @ 706:f8e90b5d85fd tip

Delete CARFAC code from this repository. It has been moved to https://github.com/google/carfac Please email me with your github username to get access. I've also created a new mailing list to discuss CARFAC development: https://groups.google.com/forum/#!forum/carfac-dev
author ronw@google.com
date Thu, 18 Jul 2013 20:56:51 +0000
parents 2d0b057e525c
children
rev   line source
tomwalters@277 1 // Copyright 2006-2010, Thomas Walters
tomwalters@277 2 //
tomwalters@277 3 // AIM-C: A C++ implementation of the Auditory Image Model
tomwalters@277 4 // http://www.acousticscale.org/AIMC
tomwalters@277 5 //
tomwalters@318 6 // Licensed under the Apache License, Version 2.0 (the "License");
tomwalters@318 7 // you may not use this file except in compliance with the License.
tomwalters@318 8 // You may obtain a copy of the License at
tomwalters@277 9 //
tomwalters@318 10 // http://www.apache.org/licenses/LICENSE-2.0
tomwalters@277 11 //
tomwalters@318 12 // Unless required by applicable law or agreed to in writing, software
tomwalters@318 13 // distributed under the License is distributed on an "AS IS" BASIS,
tomwalters@318 14 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
tomwalters@318 15 // See the License for the specific language governing permissions and
tomwalters@318 16 // limitations under the License.
tomwalters@277 17
tomwalters@277 18 /*!
tomwalters@277 19 * \file
tomwalters@279 20 * \brief File output in the HTK format.
tomwalters@277 21 *
tomwalters@279 22 * \author Tom Walters <tom@acousticscale.org>
tomwalters@277 23 * \author Willem van Engen <cnbh@willem.engen.nl>
tomwalters@277 24 * \date created 2006/10/30
tomwalters@277 25 * \version \$Id$
tomwalters@277 26 */
tomwalters@277 27
tomwalters@277 28 #ifdef _WINDOWS
tomwalters@320 29 # include <direct.h> // for _mkdir & _rmdir
tomwalters@277 30 #else
tomwalters@279 31 # include <sys/types.h>
tomwalters@320 32 # include <dirent.h> // for opendir & friends
tomwalters@277 33 #endif
tomwalters@293 34
tomwalters@293 35 #include <stdint.h>
tomwalters@277 36 #include <stdio.h>
tomwalters@277 37 #include <string.h>
tomwalters@277 38 #include <cmath>
tomwalters@277 39
tomwalters@277 40 #include "Modules/Output/FileOutputHTK.h"
tomwalters@277 41
tomwalters@277 42 namespace aimc {
tomwalters@277 43 FileOutputHTK::FileOutputHTK(Parameters *params) : Module(params) {
tomwalters@278 44 module_description_ = "File output in HTK format";
tomwalters@278 45 module_identifier_ = "htk_out";
tomwalters@278 46 module_type_ = "output";
tomwalters@278 47 module_version_ = "$Id$";
tomwalters@402 48
tomwalters@402 49 file_suffix_ = parameters_->DefaultString("htk_out.file_suffix", ".htk");
tomwalters@278 50
tomwalters@279 51 file_handle_ = NULL;
tomwalters@279 52 header_written_ = false;
tomwalters@277 53 frame_period_ms_ = 0.0f;
tomwalters@402 54 previous_start_time_ = 0;
tomwalters@277 55 }
tomwalters@277 56
tomwalters@277 57 FileOutputHTK::~FileOutputHTK() {
tomwalters@279 58 if (file_handle_ != NULL)
tomwalters@279 59 CloseFile();
tomwalters@277 60 }
tomwalters@277 61
tomwalters@402 62 bool FileOutputHTK::InitializeInternal(const SignalBank &input) {
tomwalters@402 63 channel_count_ = input.channel_count();
tomwalters@402 64 buffer_length_ = input.buffer_length();
tomwalters@402 65 ResetInternal();
tomwalters@402 66 if (file_handle_ == NULL) {
tomwalters@402 67 LOG_ERROR(_T("Couldn't initialize file output."));
tomwalters@279 68 return false;
tomwalters@279 69 }
tomwalters@402 70 if (!header_written_) {
tom@421 71 WriteHeader(channel_count_ * buffer_length_);
tomwalters@292 72 }
tomwalters@402 73
tomwalters@277 74 return true;
tomwalters@277 75 }
tomwalters@277 76
tomwalters@277 77 void FileOutputHTK::ResetInternal() {
tomwalters@402 78 // Finalize and close the open file, if there is one.
tomwalters@277 79 if (file_handle_ != NULL && !header_written_) {
tom@421 80 WriteHeader(channel_count_ * buffer_length_);
tomwalters@277 81 }
tomwalters@292 82 if (file_handle_ != NULL)
tomwalters@292 83 CloseFile();
tomwalters@402 84
tomwalters@402 85 // Now open and set up the new file.
tomwalters@402 86 // Check that the output file exists and is writeable.
tomwalters@402 87 string out_filename;
tomwalters@402 88 out_filename = global_parameters_->GetString("output_filename_base") + file_suffix_;
tomwalters@402 89 if ((file_handle_ = fopen(out_filename.c_str(),
tomwalters@402 90 "wb")) == NULL) {
tomwalters@402 91 LOG_ERROR(_T("Couldn't open output file '%s' for writing."),
tomwalters@402 92 out_filename.c_str());
tomwalters@402 93 return;
tomwalters@402 94 }
tomwalters@402 95 sample_count_ = 0;
tomwalters@402 96 header_written_ = false;
tom@421 97 WriteHeader(channel_count_ * buffer_length_);
tomwalters@277 98 }
tomwalters@277 99
tom@421 100 void FileOutputHTK::WriteHeader(int num_elements) {
tomwalters@279 101 if (header_written_)
tomwalters@279 102 return;
tomwalters@277 103
tomwalters@279 104 /* HTK format file: (taken from the HTK book - section 5.10.1)
tomwalters@279 105 * Header: 12 bytes in total, contains:
tomwalters@279 106 * sample_count - number of samples in file (4-byte integer)(long)
tomwalters@279 107 * sample_period - sample period in 100ns units (4-byte integer)(long)
tomwalters@279 108 * sample_size - number of bytes per sample (2-byte integer)(short)
tomwalters@279 109 * parameter_kind - a code indicating the sample kind (2-byte integer)(short)
tomwalters@279 110 */
tomwalters@277 111
tomwalters@279 112 // To be filled in when the file is done
tomwalters@279 113 int32_t sample_count = 0;
tomwalters@277 114
tom@421 115 int32_t sample_period = floor(1e4 * frame_period_ms_);
tomwalters@289 116 int16_t sample_size = num_elements * sizeof(float); // NOLINT
tomwalters@277 117
tomwalters@277 118 // User-defined coefficients with energy term
tomwalters@279 119 int16_t parameter_kind = H_USER + H_E;
tomwalters@277 120
tomwalters@279 121 // Fix endianness
tomwalters@279 122 sample_count = ByteSwap32(sample_count);
tomwalters@279 123 sample_period = ByteSwap32(sample_period);
tomwalters@279 124 sample_size = ByteSwap16(sample_size);
tomwalters@279 125 parameter_kind = ByteSwap16(parameter_kind);
tomwalters@277 126
tomwalters@277 127 // Enter header values. sample_count is a dummy value which is filled in on
tomwalters@277 128 // file close
tomwalters@279 129 fwrite(&sample_count, sizeof(sample_count), 1, file_handle_);
tomwalters@279 130 fwrite(&sample_period, sizeof(sample_period), 1, file_handle_);
tomwalters@279 131 fwrite(&sample_size, sizeof(sample_size), 1, file_handle_);
tomwalters@279 132 fwrite(&parameter_kind, sizeof(parameter_kind), 1, file_handle_);
tomwalters@279 133 fflush(file_handle_);
tomwalters@277 134
tomwalters@279 135 header_written_ = true;
tomwalters@277 136 }
tomwalters@277 137
tomwalters@277 138 void FileOutputHTK::Process(const SignalBank &input) {
tomwalters@277 139 if (file_handle_ == NULL) {
tomwalters@277 140 LOG_ERROR(_T("Couldn't process file output. No file is open."
tomwalters@277 141 "Please call FileOutputHTK::OpenFile first"));
tomwalters@279 142 return;
tomwalters@277 143 }
tomwalters@277 144
tomwalters@277 145 if (!header_written_) {
tomwalters@292 146 LOG_ERROR(_T("No header has been written on the output file yet. Please "
tomwalters@402 147 "call FileOutputHTK::Initialize() or FileOutputHTK::Reset() "
tom@442 148 "before calling FileOutputHTK::Process()"));
tomwalters@279 149 return;
tomwalters@277 150 }
tomwalters@279 151 float s;
tomwalters@277 152
tomwalters@279 153 for (int ch = 0; ch < input.channel_count(); ch++) {
tomwalters@277 154 for (int i = 0; i < input.buffer_length(); i++) {
tomwalters@277 155 s = input.sample(ch, i);
tomwalters@277 156 s = ByteSwapFloat(s);
tomwalters@280 157 fwrite(&s, sizeof(s), 1, file_handle_);
tomwalters@277 158 }
tomwalters@277 159 }
tomwalters@279 160 sample_count_++;
tomwalters@402 161 frame_period_ms_ = 1000.0
tomwalters@402 162 * (input.start_time() - previous_start_time_)
tomwalters@402 163 / input.sample_rate();
tomwalters@402 164 previous_start_time_ = input.start_time();
tomwalters@277 165 }
tomwalters@277 166
tomwalters@277 167 bool FileOutputHTK::CloseFile() {
tomwalters@279 168 if (file_handle_ == NULL)
tomwalters@277 169 return false;
tomwalters@277 170
tomwalters@279 171 // Write the first 4 bytes of the file
tomwalters@279 172 // with how many samples there are in the file
tom@421 173 // and the next 4 bytes with the frame period.
tomwalters@279 174 fflush(file_handle_);
tomwalters@279 175 rewind(file_handle_);
tomwalters@279 176 fflush(file_handle_);
tomwalters@277 177 int32_t samples = sample_count_;
tomwalters@279 178 samples = ByteSwap32(samples);
tom@421 179 int32_t sample_period = floor(1e4 * frame_period_ms_);
tom@421 180 sample_period = ByteSwap32(sample_period);
tomwalters@279 181 fwrite(&samples, sizeof(samples), 1, file_handle_);
tom@421 182 fwrite(&sample_period, sizeof(sample_period), 1, file_handle_);
tomwalters@277 183
tomwalters@279 184 // And close the file
tomwalters@279 185 fclose(file_handle_);
tomwalters@279 186 file_handle_ = NULL;
tomwalters@292 187 header_written_ = false;
tomwalters@279 188 return true;
tomwalters@277 189 }
tomwalters@277 190
tomwalters@277 191 float FileOutputHTK::ByteSwapFloat(float d) {
tomwalters@277 192 // Endianness fix
tomwalters@277 193 float a;
tomwalters@277 194 unsigned char *dst = (unsigned char *)&a;
tomwalters@277 195 unsigned char *src = (unsigned char *)&d;
tomwalters@277 196
tomwalters@277 197 dst[0] = src[3];
tomwalters@277 198 dst[1] = src[2];
tomwalters@277 199 dst[2] = src[1];
tomwalters@277 200 dst[3] = src[0];
tomwalters@277 201
tomwalters@277 202 return a;
tomwalters@277 203 }
tomwalters@280 204 } // namespace aimc
tomwalters@277 205