annotate data/fileio/test/AudioFileReaderTest.h @ 1195:c118d2022ffa spectrogram-minor-refactor

Scale range matching
author Chris Cannam
date Mon, 01 Aug 2016 15:06:16 +0100
parents 843f67be0ed9
children abfc498c52bc
rev   line source
Chris@756 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@756 2
Chris@756 3 /*
Chris@756 4 Sonic Visualiser
Chris@756 5 An audio file viewer and annotation editor.
Chris@756 6 Centre for Digital Music, Queen Mary, University of London.
Chris@756 7 This file copyright 2013 Chris Cannam.
Chris@756 8
Chris@756 9 This program is free software; you can redistribute it and/or
Chris@756 10 modify it under the terms of the GNU General Public License as
Chris@756 11 published by the Free Software Foundation; either version 2 of the
Chris@756 12 License, or (at your option) any later version. See the file
Chris@756 13 COPYING included with this distribution for more information.
Chris@756 14 */
Chris@756 15
Chris@756 16 #ifndef TEST_AUDIO_FILE_READER_H
Chris@756 17 #define TEST_AUDIO_FILE_READER_H
Chris@756 18
Chris@756 19 #include "../AudioFileReaderFactory.h"
Chris@756 20 #include "../AudioFileReader.h"
Chris@756 21
Chris@756 22 #include "AudioTestData.h"
Chris@756 23
Chris@756 24 #include <cmath>
Chris@756 25
Chris@756 26 #include <QObject>
Chris@756 27 #include <QtTest>
Chris@756 28 #include <QDir>
Chris@756 29
Chris@756 30 #include <iostream>
Chris@756 31
Chris@756 32 using namespace std;
Chris@756 33
// Name of the directory holding the audio files exercised by
// AudioFileReaderTest: its existence is checked in init(), its files are
// enumerated in read_data(), and read() opens each file from it.
Chris@756 34 static QString audioDir = "testfiles";
Chris@756 35
Chris@756 36 class AudioFileReaderTest : public QObject
Chris@756 37 {
Chris@756 38 Q_OBJECT
Chris@756 39
Chris@756 40 const char *strOf(QString s) {
Chris@756 41 return strdup(s.toLocal8Bit().data());
Chris@756 42 }
Chris@756 43
Chris@756 44 private slots:
Chris@756 45 void init()
Chris@756 46 {
Chris@756 47 if (!QDir(audioDir).exists()) {
Chris@756 48 cerr << "ERROR: Audio test file directory \"" << audioDir << "\" does not exist" << endl;
Chris@756 49 QVERIFY2(QDir(audioDir).exists(), "Audio test file directory not found");
Chris@756 50 }
Chris@756 51 }
Chris@756 52
Chris@756 53 void read_data()
Chris@756 54 {
Chris@756 55 QTest::addColumn<QString>("audiofile");
Chris@756 56 QStringList files = QDir(audioDir).entryList(QDir::Files);
Chris@756 57 foreach (QString filename, files) {
Chris@756 58 QTest::newRow(strOf(filename)) << filename;
Chris@756 59 }
Chris@756 60 }
Chris@756 61
Chris@756 62 void read()
Chris@756 63 {
Chris@756 64 QFETCH(QString, audiofile);
Chris@756 65
Chris@1040 66 sv_samplerate_t readRate = 48000;
Chris@757 67
Chris@756 68 AudioFileReader *reader =
Chris@756 69 AudioFileReaderFactory::createReader
Chris@757 70 (audioDir + "/" + audiofile, readRate);
Chris@757 71
Chris@757 72 QStringList fileAndExt = audiofile.split(".");
Chris@757 73 QStringList bits = fileAndExt[0].split("-");
Chris@757 74 QString extension = fileAndExt[1];
Chris@1040 75 sv_samplerate_t nominalRate = bits[0].toInt();
Chris@757 76 int nominalChannels = bits[1].toInt();
Chris@757 77 int nominalDepth = 16;
Chris@757 78 if (bits.length() > 2) nominalDepth = bits[2].toInt();
Chris@756 79
Chris@756 80 if (!reader) {
Chris@820 81 #if ( QT_VERSION >= 0x050000 )
Chris@763 82 QSKIP("Unsupported file, skipping");
Chris@820 83 #else
Chris@820 84 QSKIP("Unsupported file, skipping", SkipSingle);
Chris@820 85 #endif
Chris@756 86 }
Chris@756 87
Chris@757 88 QCOMPARE((int)reader->getChannelCount(), nominalChannels);
Chris@1040 89 QCOMPARE(reader->getNativeRate(), nominalRate);
Chris@1040 90 QCOMPARE(reader->getSampleRate(), readRate);
Chris@757 91
Chris@756 92 int channels = reader->getChannelCount();
Chris@757 93 AudioTestData tdata(readRate, channels);
Chris@756 94
Chris@756 95 float *reference = tdata.getInterleavedData();
Chris@1040 96 sv_frame_t refFrames = tdata.getFrameCount();
Chris@756 97
Chris@756 98 // The reader should give us exactly the expected number of
Chris@759 99 // frames, except for mp3/aac files. We ask for quite a lot
Chris@759 100 // more, though, so we can (a) check that we only get the
Chris@759 101 // expected number back (if this is not mp3/aac) or (b) take
Chris@759 102 // into account silence at beginning and end (if it is).
Chris@1041 103 vector<float> test = reader->getInterleavedFrames(0, refFrames + 5000);
Chris@1040 104 sv_frame_t read = test.size() / channels;
Chris@756 105
Chris@759 106 if (extension == "mp3" || extension == "aac" || extension == "m4a") {
Chris@759 107 // mp3s and aacs can have silence at start and end
Chris@759 108 QVERIFY(read >= refFrames);
Chris@757 109 } else {
Chris@759 110 QCOMPARE(read, refFrames);
Chris@757 111 }
Chris@757 112
Chris@757 113 // Our limits are pretty relaxed -- we're not testing decoder
Chris@757 114 // or resampler quality here, just whether the results are
Chris@757 115 // plainly wrong (e.g. at wrong samplerate or with an offset)
Chris@757 116
Chris@1040 117 double limit = 0.01;
Chris@1040 118 double edgeLimit = limit * 10; // in first or final edgeSize frames
Chris@759 119 int edgeSize = 100;
Chris@759 120
Chris@757 121 if (nominalDepth < 16) {
Chris@757 122 limit = 0.02;
Chris@757 123 }
Chris@759 124 if (extension == "ogg" || extension == "mp3" ||
Chris@759 125 extension == "aac" || extension == "m4a") {
Chris@759 126 limit = 0.2;
Chris@759 127 edgeLimit = limit * 3;
Chris@757 128 }
Chris@757 129
Chris@759 130 // And we ignore completely the last few frames when upsampling
Chris@1040 131 int discard = 1 + int(round(readRate / nominalRate));
Chris@759 132
Chris@759 133 int offset = 0;
Chris@759 134
Chris@759 135 if (extension == "aac" || extension == "m4a") {
Chris@759 136 // our m4a file appears to have a fixed offset of 1024 (at
Chris@759 137 // file sample rate)
Chris@1040 138 offset = int(round((1024 / nominalRate) * readRate));
Chris@759 139 }
Chris@759 140
Chris@759 141 if (extension == "mp3") {
Chris@759 142 // while mp3s appear to vary
Chris@759 143 for (int i = 0; i < read; ++i) {
Chris@759 144 bool any = false;
Chris@1040 145 double thresh = 0.01;
Chris@759 146 for (int c = 0; c < channels; ++c) {
Chris@1040 147 if (fabs(test[i * channels + c]) > thresh) {
Chris@759 148 any = true;
Chris@759 149 break;
Chris@759 150 }
Chris@759 151 }
Chris@759 152 if (any) {
Chris@759 153 offset = i;
Chris@759 154 break;
Chris@759 155 }
Chris@759 156 }
Chris@759 157 // std::cerr << "offset = " << offset << std::endl;
Chris@759 158 }
Chris@756 159
Chris@756 160 for (int c = 0; c < channels; ++c) {
Chris@756 161 float maxdiff = 0.f;
Chris@756 162 int maxAt = 0;
Chris@756 163 float totdiff = 0.f;
Chris@759 164 for (int i = 0; i < read - offset - discard && i < refFrames; ++i) {
Chris@759 165 float diff = fabsf(test[(i + offset) * channels + c] -
Chris@756 166 reference[i * channels + c]);
Chris@756 167 totdiff += diff;
Chris@757 168 // in edge areas, record this only if it exceeds edgeLimit
Chris@759 169 if (i < edgeSize || i + edgeSize >= read - offset) {
Chris@968 170 if (diff > edgeLimit && diff > maxdiff) {
Chris@757 171 maxdiff = diff;
Chris@757 172 maxAt = i;
Chris@757 173 }
Chris@757 174 } else {
Chris@757 175 if (diff > maxdiff) {
Chris@757 176 maxdiff = diff;
Chris@757 177 maxAt = i;
Chris@757 178 }
Chris@756 179 }
Chris@756 180 }
Chris@1040 181 float meandiff = totdiff / float(read);
Chris@756 182 // cerr << "meandiff on channel " << c << ": " << meandiff << endl;
Chris@756 183 // cerr << "maxdiff on channel " << c << ": " << maxdiff << " at " << maxAt << endl;
Chris@759 184 if (meandiff >= limit) {
Chris@759 185 cerr << "ERROR: for audiofile " << audiofile << ": mean diff = " << meandiff << " for channel " << c << endl;
Chris@759 186 QVERIFY(meandiff < limit);
Chris@759 187 }
Chris@756 188 if (maxdiff >= limit) {
Chris@759 189 cerr << "ERROR: for audiofile " << audiofile << ": max diff = " << maxdiff << " at frame " << maxAt << " of " << read << " on channel " << c << " (mean diff = " << meandiff << ")" << endl;
Chris@756 190 QVERIFY(maxdiff < limit);
Chris@756 191 }
Chris@756 192 }
Chris@756 193 }
Chris@756 194 };
Chris@756 195
Chris@756 196 #endif