annotate data/fileio/test/AudioFileReaderTest.h @ 779:15cd67fcbdad

Fix calculation of timestamps for fixed-rate features
author Chris Cannam
date Wed, 27 Mar 2013 15:27:33 +0000
parents a43acbe3988f
children 2b3a8ae04597
rev   line source
Chris@756 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@756 2
Chris@756 3 /*
Chris@756 4 Sonic Visualiser
Chris@756 5 An audio file viewer and annotation editor.
Chris@756 6 Centre for Digital Music, Queen Mary, University of London.
Chris@756 7 This file copyright 2013 Chris Cannam.
Chris@756 8
Chris@756 9 This program is free software; you can redistribute it and/or
Chris@756 10 modify it under the terms of the GNU General Public License as
Chris@756 11 published by the Free Software Foundation; either version 2 of the
Chris@756 12 License, or (at your option) any later version. See the file
Chris@756 13 COPYING included with this distribution for more information.
Chris@756 14 */
Chris@756 15
Chris@756 16 #ifndef TEST_AUDIO_FILE_READER_H
Chris@756 17 #define TEST_AUDIO_FILE_READER_H
Chris@756 18
Chris@756 19 #include "../AudioFileReaderFactory.h"
Chris@756 20 #include "../AudioFileReader.h"
Chris@756 21
Chris@756 22 #include "AudioTestData.h"
Chris@756 23
Chris@756 24 #include <cmath>
Chris@756 25
Chris@756 26 #include <QObject>
Chris@756 27 #include <QtTest>
Chris@756 28 #include <QDir>
Chris@756 29
Chris@756 30 #include <iostream>
Chris@756 31
Chris@756 32 using namespace std;
Chris@756 33
Chris@756 34 static QString audioDir = "testfiles";
Chris@756 35
Chris@756 36 class AudioFileReaderTest : public QObject
Chris@756 37 {
Chris@756 38 Q_OBJECT
Chris@756 39
Chris@756 40 const char *strOf(QString s) {
Chris@756 41 return strdup(s.toLocal8Bit().data());
Chris@756 42 }
Chris@756 43
Chris@756 44 private slots:
Chris@756 45 void init()
Chris@756 46 {
Chris@756 47 if (!QDir(audioDir).exists()) {
Chris@756 48 cerr << "ERROR: Audio test file directory \"" << audioDir << "\" does not exist" << endl;
Chris@756 49 QVERIFY2(QDir(audioDir).exists(), "Audio test file directory not found");
Chris@756 50 }
Chris@756 51 }
Chris@756 52
Chris@756 53 void read_data()
Chris@756 54 {
Chris@756 55 QTest::addColumn<QString>("audiofile");
Chris@756 56 QStringList files = QDir(audioDir).entryList(QDir::Files);
Chris@756 57 foreach (QString filename, files) {
Chris@756 58 QTest::newRow(strOf(filename)) << filename;
Chris@756 59 }
Chris@756 60 }
Chris@756 61
Chris@756 62 void read()
Chris@756 63 {
Chris@756 64 QFETCH(QString, audiofile);
Chris@756 65
Chris@757 66 int readRate = 48000;
Chris@757 67
Chris@756 68 AudioFileReader *reader =
Chris@756 69 AudioFileReaderFactory::createReader
Chris@757 70 (audioDir + "/" + audiofile, readRate);
Chris@757 71
Chris@757 72 QStringList fileAndExt = audiofile.split(".");
Chris@757 73 QStringList bits = fileAndExt[0].split("-");
Chris@757 74 QString extension = fileAndExt[1];
Chris@757 75 int nominalRate = bits[0].toInt();
Chris@757 76 int nominalChannels = bits[1].toInt();
Chris@757 77 int nominalDepth = 16;
Chris@757 78 if (bits.length() > 2) nominalDepth = bits[2].toInt();
Chris@756 79
Chris@756 80 if (!reader) {
Chris@757 81 QSKIP("Unsupported file, skipping", SkipSingle);
Chris@756 82 }
Chris@756 83
Chris@757 84 QCOMPARE((int)reader->getChannelCount(), nominalChannels);
Chris@757 85 QCOMPARE((int)reader->getNativeRate(), nominalRate);
Chris@757 86 QCOMPARE((int)reader->getSampleRate(), readRate);
Chris@757 87
Chris@756 88 int channels = reader->getChannelCount();
Chris@757 89 AudioTestData tdata(readRate, channels);
Chris@756 90
Chris@756 91 float *reference = tdata.getInterleavedData();
Chris@759 92 int refFrames = tdata.getFrameCount();
Chris@759 93 int refsize = refFrames * channels;
Chris@756 94
Chris@756 95 vector<float> test;
Chris@756 96
Chris@756 97 // The reader should give us exactly the expected number of
Chris@759 98 // frames, except for mp3/aac files. We ask for quite a lot
Chris@759 99 // more, though, so we can (a) check that we only get the
Chris@759 100 // expected number back (if this is not mp3/aac) or (b) take
Chris@759 101 // into account silence at beginning and end (if it is).
Chris@759 102 reader->getInterleavedFrames(0, refFrames + 5000, test);
Chris@756 103 int read = test.size() / channels;
Chris@756 104
Chris@759 105 if (extension == "mp3" || extension == "aac" || extension == "m4a") {
Chris@759 106 // mp3s and aacs can have silence at start and end
Chris@759 107 QVERIFY(read >= refFrames);
Chris@757 108 } else {
Chris@759 109 QCOMPARE(read, refFrames);
Chris@757 110 }
Chris@757 111
Chris@757 112 // Our limits are pretty relaxed -- we're not testing decoder
Chris@757 113 // or resampler quality here, just whether the results are
Chris@757 114 // plainly wrong (e.g. at wrong samplerate or with an offset)
Chris@757 115
Chris@757 116 float limit = 0.01;
Chris@759 117 float edgeLimit = limit * 10; // in first or final edgeSize frames
Chris@759 118 int edgeSize = 100;
Chris@759 119
Chris@757 120 if (nominalDepth < 16) {
Chris@757 121 limit = 0.02;
Chris@757 122 }
Chris@759 123 if (extension == "ogg" || extension == "mp3" ||
Chris@759 124 extension == "aac" || extension == "m4a") {
Chris@759 125 limit = 0.2;
Chris@759 126 edgeLimit = limit * 3;
Chris@757 127 }
Chris@757 128
Chris@759 129 // And we ignore completely the last few frames when upsampling
Chris@759 130 int discard = 1 + readRate / nominalRate;
Chris@759 131
Chris@759 132 int offset = 0;
Chris@759 133
Chris@759 134 if (extension == "aac" || extension == "m4a") {
Chris@759 135 // our m4a file appears to have a fixed offset of 1024 (at
Chris@759 136 // file sample rate)
Chris@759 137 offset = (1024 / float(nominalRate)) * readRate;
Chris@759 138 }
Chris@759 139
Chris@759 140 if (extension == "mp3") {
Chris@759 141 // while mp3s appear to vary
Chris@759 142 for (int i = 0; i < read; ++i) {
Chris@759 143 bool any = false;
Chris@759 144 float thresh = 0.01;
Chris@759 145 for (int c = 0; c < channels; ++c) {
Chris@759 146 if (fabsf(test[i * channels + c]) > thresh) {
Chris@759 147 any = true;
Chris@759 148 break;
Chris@759 149 }
Chris@759 150 }
Chris@759 151 if (any) {
Chris@759 152 offset = i;
Chris@759 153 break;
Chris@759 154 }
Chris@759 155 }
Chris@759 156 // std::cerr << "offset = " << offset << std::endl;
Chris@759 157 }
Chris@756 158
Chris@756 159 for (int c = 0; c < channels; ++c) {
Chris@756 160 float maxdiff = 0.f;
Chris@756 161 int maxAt = 0;
Chris@756 162 float totdiff = 0.f;
Chris@759 163 for (int i = 0; i < read - offset - discard && i < refFrames; ++i) {
Chris@759 164 float diff = fabsf(test[(i + offset) * channels + c] -
Chris@756 165 reference[i * channels + c]);
Chris@756 166 totdiff += diff;
Chris@757 167 // in edge areas, record this only if it exceeds edgeLimit
Chris@759 168 if (i < edgeSize || i + edgeSize >= read - offset) {
Chris@757 169 if (diff > edgeLimit) {
Chris@757 170 maxdiff = diff;
Chris@757 171 maxAt = i;
Chris@757 172 }
Chris@757 173 } else {
Chris@757 174 if (diff > maxdiff) {
Chris@757 175 maxdiff = diff;
Chris@757 176 maxAt = i;
Chris@757 177 }
Chris@756 178 }
Chris@756 179 }
Chris@756 180 float meandiff = totdiff / read;
Chris@756 181 // cerr << "meandiff on channel " << c << ": " << meandiff << endl;
Chris@756 182 // cerr << "maxdiff on channel " << c << ": " << maxdiff << " at " << maxAt << endl;
Chris@759 183 if (meandiff >= limit) {
Chris@759 184 cerr << "ERROR: for audiofile " << audiofile << ": mean diff = " << meandiff << " for channel " << c << endl;
Chris@759 185 QVERIFY(meandiff < limit);
Chris@759 186 }
Chris@756 187 if (maxdiff >= limit) {
Chris@759 188 cerr << "ERROR: for audiofile " << audiofile << ": max diff = " << maxdiff << " at frame " << maxAt << " of " << read << " on channel " << c << " (mean diff = " << meandiff << ")" << endl;
Chris@756 189 QVERIFY(maxdiff < limit);
Chris@756 190 }
Chris@756 191 }
Chris@756 192 }
Chris@756 193 };
Chris@756 194
Chris@756 195 #endif