annotate data/fileio/test/AudioFileReaderTest.h @ 876:47aa3aeb687b tonioni

For outputs with unknown bin count or multiple bins with variable sample rate, create additional output models for bins beyond the first
author Chris Cannam
date Wed, 29 Jan 2014 09:31:22 +0000
parents bb7ea947c60d
children e06f03013f46
rev   line source
Chris@756 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@756 2
Chris@756 3 /*
Chris@756 4 Sonic Visualiser
Chris@756 5 An audio file viewer and annotation editor.
Chris@756 6 Centre for Digital Music, Queen Mary, University of London.
Chris@756 7 This file copyright 2013 Chris Cannam.
Chris@756 8
Chris@756 9 This program is free software; you can redistribute it and/or
Chris@756 10 modify it under the terms of the GNU General Public License as
Chris@756 11 published by the Free Software Foundation; either version 2 of the
Chris@756 12 License, or (at your option) any later version. See the file
Chris@756 13 COPYING included with this distribution for more information.
Chris@756 14 */
Chris@756 15
Chris@756 16 #ifndef TEST_AUDIO_FILE_READER_H
Chris@756 17 #define TEST_AUDIO_FILE_READER_H
Chris@756 18
Chris@756 19 #include "../AudioFileReaderFactory.h"
Chris@756 20 #include "../AudioFileReader.h"
Chris@756 21
Chris@756 22 #include "AudioTestData.h"
Chris@756 23
Chris@756 24 #include <cmath>
Chris@756 25
Chris@756 26 #include <QObject>
Chris@756 27 #include <QtTest>
Chris@756 28 #include <QDir>
Chris@756 29
Chris@756 30 #include <iostream>
Chris@756 31
Chris@756 32 using namespace std;
Chris@756 33
Chris@756 34 static QString audioDir = "testfiles";
Chris@756 35
Chris@756 36 class AudioFileReaderTest : public QObject
Chris@756 37 {
Chris@756 38 Q_OBJECT
Chris@756 39
Chris@756 40 const char *strOf(QString s) {
Chris@756 41 return strdup(s.toLocal8Bit().data());
Chris@756 42 }
Chris@756 43
Chris@756 44 private slots:
Chris@756 45 void init()
Chris@756 46 {
Chris@756 47 if (!QDir(audioDir).exists()) {
Chris@756 48 cerr << "ERROR: Audio test file directory \"" << audioDir << "\" does not exist" << endl;
Chris@756 49 QVERIFY2(QDir(audioDir).exists(), "Audio test file directory not found");
Chris@756 50 }
Chris@756 51 }
Chris@756 52
Chris@756 53 void read_data()
Chris@756 54 {
Chris@756 55 QTest::addColumn<QString>("audiofile");
Chris@756 56 QStringList files = QDir(audioDir).entryList(QDir::Files);
Chris@756 57 foreach (QString filename, files) {
Chris@756 58 QTest::newRow(strOf(filename)) << filename;
Chris@756 59 }
Chris@756 60 }
Chris@756 61
Chris@756 62 void read()
Chris@756 63 {
Chris@756 64 QFETCH(QString, audiofile);
Chris@756 65
Chris@757 66 int readRate = 48000;
Chris@757 67
Chris@756 68 AudioFileReader *reader =
Chris@756 69 AudioFileReaderFactory::createReader
Chris@757 70 (audioDir + "/" + audiofile, readRate);
Chris@757 71
Chris@757 72 QStringList fileAndExt = audiofile.split(".");
Chris@757 73 QStringList bits = fileAndExt[0].split("-");
Chris@757 74 QString extension = fileAndExt[1];
Chris@757 75 int nominalRate = bits[0].toInt();
Chris@757 76 int nominalChannels = bits[1].toInt();
Chris@757 77 int nominalDepth = 16;
Chris@757 78 if (bits.length() > 2) nominalDepth = bits[2].toInt();
Chris@756 79
Chris@756 80 if (!reader) {
Chris@820 81 #if ( QT_VERSION >= 0x050000 )
Chris@763 82 QSKIP("Unsupported file, skipping");
Chris@820 83 #else
Chris@820 84 QSKIP("Unsupported file, skipping", SkipSingle);
Chris@820 85 #endif
Chris@756 86 }
Chris@756 87
Chris@757 88 QCOMPARE((int)reader->getChannelCount(), nominalChannels);
Chris@757 89 QCOMPARE((int)reader->getNativeRate(), nominalRate);
Chris@757 90 QCOMPARE((int)reader->getSampleRate(), readRate);
Chris@757 91
Chris@756 92 int channels = reader->getChannelCount();
Chris@757 93 AudioTestData tdata(readRate, channels);
Chris@756 94
Chris@756 95 float *reference = tdata.getInterleavedData();
Chris@759 96 int refFrames = tdata.getFrameCount();
Chris@759 97 int refsize = refFrames * channels;
Chris@756 98
Chris@756 99 vector<float> test;
Chris@756 100
Chris@756 101 // The reader should give us exactly the expected number of
Chris@759 102 // frames, except for mp3/aac files. We ask for quite a lot
Chris@759 103 // more, though, so we can (a) check that we only get the
Chris@759 104 // expected number back (if this is not mp3/aac) or (b) take
Chris@759 105 // into account silence at beginning and end (if it is).
Chris@759 106 reader->getInterleavedFrames(0, refFrames + 5000, test);
Chris@756 107 int read = test.size() / channels;
Chris@756 108
Chris@759 109 if (extension == "mp3" || extension == "aac" || extension == "m4a") {
Chris@759 110 // mp3s and aacs can have silence at start and end
Chris@759 111 QVERIFY(read >= refFrames);
Chris@757 112 } else {
Chris@759 113 QCOMPARE(read, refFrames);
Chris@757 114 }
Chris@757 115
Chris@757 116 // Our limits are pretty relaxed -- we're not testing decoder
Chris@757 117 // or resampler quality here, just whether the results are
Chris@757 118 // plainly wrong (e.g. at wrong samplerate or with an offset)
Chris@757 119
Chris@757 120 float limit = 0.01;
Chris@759 121 float edgeLimit = limit * 10; // in first or final edgeSize frames
Chris@759 122 int edgeSize = 100;
Chris@759 123
Chris@757 124 if (nominalDepth < 16) {
Chris@757 125 limit = 0.02;
Chris@757 126 }
Chris@759 127 if (extension == "ogg" || extension == "mp3" ||
Chris@759 128 extension == "aac" || extension == "m4a") {
Chris@759 129 limit = 0.2;
Chris@759 130 edgeLimit = limit * 3;
Chris@757 131 }
Chris@757 132
Chris@759 133 // And we ignore completely the last few frames when upsampling
Chris@759 134 int discard = 1 + readRate / nominalRate;
Chris@759 135
Chris@759 136 int offset = 0;
Chris@759 137
Chris@759 138 if (extension == "aac" || extension == "m4a") {
Chris@759 139 // our m4a file appears to have a fixed offset of 1024 (at
Chris@759 140 // file sample rate)
Chris@759 141 offset = (1024 / float(nominalRate)) * readRate;
Chris@759 142 }
Chris@759 143
Chris@759 144 if (extension == "mp3") {
Chris@759 145 // while mp3s appear to vary
Chris@759 146 for (int i = 0; i < read; ++i) {
Chris@759 147 bool any = false;
Chris@759 148 float thresh = 0.01;
Chris@759 149 for (int c = 0; c < channels; ++c) {
Chris@759 150 if (fabsf(test[i * channels + c]) > thresh) {
Chris@759 151 any = true;
Chris@759 152 break;
Chris@759 153 }
Chris@759 154 }
Chris@759 155 if (any) {
Chris@759 156 offset = i;
Chris@759 157 break;
Chris@759 158 }
Chris@759 159 }
Chris@759 160 // std::cerr << "offset = " << offset << std::endl;
Chris@759 161 }
Chris@756 162
Chris@756 163 for (int c = 0; c < channels; ++c) {
Chris@756 164 float maxdiff = 0.f;
Chris@756 165 int maxAt = 0;
Chris@756 166 float totdiff = 0.f;
Chris@759 167 for (int i = 0; i < read - offset - discard && i < refFrames; ++i) {
Chris@759 168 float diff = fabsf(test[(i + offset) * channels + c] -
Chris@756 169 reference[i * channels + c]);
Chris@756 170 totdiff += diff;
Chris@757 171 // in edge areas, record this only if it exceeds edgeLimit
Chris@759 172 if (i < edgeSize || i + edgeSize >= read - offset) {
Chris@757 173 if (diff > edgeLimit) {
Chris@757 174 maxdiff = diff;
Chris@757 175 maxAt = i;
Chris@757 176 }
Chris@757 177 } else {
Chris@757 178 if (diff > maxdiff) {
Chris@757 179 maxdiff = diff;
Chris@757 180 maxAt = i;
Chris@757 181 }
Chris@756 182 }
Chris@756 183 }
Chris@756 184 float meandiff = totdiff / read;
Chris@756 185 // cerr << "meandiff on channel " << c << ": " << meandiff << endl;
Chris@756 186 // cerr << "maxdiff on channel " << c << ": " << maxdiff << " at " << maxAt << endl;
Chris@759 187 if (meandiff >= limit) {
Chris@759 188 cerr << "ERROR: for audiofile " << audiofile << ": mean diff = " << meandiff << " for channel " << c << endl;
Chris@759 189 QVERIFY(meandiff < limit);
Chris@759 190 }
Chris@756 191 if (maxdiff >= limit) {
Chris@759 192 cerr << "ERROR: for audiofile " << audiofile << ": max diff = " << maxdiff << " at frame " << maxAt << " of " << read << " on channel " << c << " (mean diff = " << meandiff << ")" << endl;
Chris@756 193 QVERIFY(maxdiff < limit);
Chris@756 194 }
Chris@756 195 }
Chris@756 196 }
Chris@756 197 };
Chris@756 198
Chris@756 199 #endif