annotate runner/JAMSFeatureWriter.cpp @ 199:c8b934ed4ddd

Fix typo
author Chris Cannam
date Tue, 01 Sep 2015 17:29:20 +0100
parents 3b7ec45abd1c
children f35bbb3e4d41
rev   line source
Chris@145 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@145 2
Chris@145 3 /*
Chris@145 4 Sonic Annotator
Chris@145 5 A utility for batch feature extraction from audio files.
Chris@145 6 Mark Levy, Chris Sutton and Chris Cannam, Queen Mary, University of London.
Chris@145 7 Copyright 2007-2014 QMUL.
Chris@145 8
Chris@145 9 This program is free software; you can redistribute it and/or
Chris@145 10 modify it under the terms of the GNU General Public License as
Chris@145 11 published by the Free Software Foundation; either version 2 of the
Chris@145 12 License, or (at your option) any later version. See the file
Chris@145 13 COPYING included with this distribution for more information.
Chris@145 14 */
Chris@145 15
Chris@145 16 #include "JAMSFeatureWriter.h"
Chris@145 17
Chris@145 18 using namespace std;
Chris@145 19 using Vamp::Plugin;
Chris@145 20 using Vamp::PluginBase;
Chris@145 21
Chris@145 22 #include "base/Exceptions.h"
Chris@145 23 #include "rdf/PluginRDFIndexer.h"
Chris@145 24
Chris@166 25 #include <QFileInfo>
Chris@189 26 #include <QTextCodec>
Chris@166 27
Chris@162 28 #include "version.h"
Chris@162 29
Chris@145 30 JAMSFeatureWriter::JAMSFeatureWriter() :
Chris@145 31 FileFeatureWriter(SupportOneFilePerTrackTransform |
Chris@145 32 SupportOneFilePerTrack |
Chris@152 33 SupportOneFileTotal |
Chris@145 34 SupportStdOut,
Chris@145 35 "json"),
Chris@145 36 m_network(false),
Chris@169 37 m_networkRetrieved(false),
Chris@169 38 m_n(1),
Chris@169 39 m_m(1)
Chris@145 40 {
Chris@145 41 }
Chris@145 42
Chris@145 43 JAMSFeatureWriter::~JAMSFeatureWriter()
Chris@145 44 {
Chris@145 45 }
Chris@145 46
Chris@145 47 string
Chris@145 48 JAMSFeatureWriter::getDescription() const
Chris@145 49 {
Chris@170 50 return "Write features to JSON files in JAMS (JSON Annotated Music Specification) format. WARNING: This is a provisional implementation! The output format may change in future releases to comply more effectively with the specification. Please report any problems you find with the current implementation.";
Chris@145 51 }
Chris@145 52
Chris@145 53 JAMSFeatureWriter::ParameterList
Chris@145 54 JAMSFeatureWriter::getSupportedParameters() const
Chris@145 55 {
Chris@145 56 ParameterList pl = FileFeatureWriter::getSupportedParameters();
Chris@145 57 Parameter p;
Chris@145 58
Chris@145 59 p.name = "network";
Chris@197 60 p.description = "Attempt to retrieve RDF descriptions of plugins from network, if not available locally.";
Chris@145 61 p.hasArg = false;
Chris@145 62 pl.push_back(p);
Chris@145 63
Chris@197 64 p.name = "format";
Chris@197 65 p.description = "JSON format to use. Currently the only supported value is \"jams\". Other formats may be supported in future.";
Chris@197 66 p.hasArg = true;
Chris@197 67 p.mandatory = true;
Chris@197 68 pl.push_back(p);
Chris@197 69
Chris@145 70 return pl;
Chris@145 71 }
Chris@145 72
Chris@145 73 void
Chris@145 74 JAMSFeatureWriter::setParameters(map<string, string> &params)
Chris@145 75 {
Chris@145 76 FileFeatureWriter::setParameters(params);
Chris@145 77
Chris@145 78 for (map<string, string>::iterator i = params.begin();
Chris@145 79 i != params.end(); ++i) {
Chris@145 80 if (i->first == "network") {
Chris@145 81 m_network = true;
Chris@197 82 } else if (i->first == "format") {
Chris@197 83 if (i->second == "jams") {
Chris@197 84 m_format = i->second;
Chris@197 85 } else {
Chris@197 86 throw std::runtime_error
Chris@197 87 ("Unknown or invalid --json-format parameter \"" + i->second + "\"");
Chris@197 88 }
Chris@145 89 }
Chris@145 90 }
Chris@145 91 }
Chris@145 92
Chris@145 93 void
Chris@145 94 JAMSFeatureWriter::setTrackMetadata(QString trackId, TrackMetadata metadata)
Chris@145 95 {
Chris@167 96 m_trackMetadata[trackId] = metadata;
Chris@145 97 }
Chris@145 98
Chris@153 99 static double
Chris@153 100 realTime2Sec(const Vamp::RealTime &r)
Chris@153 101 {
Chris@153 102 return r / Vamp::RealTime(1, 0);
Chris@153 103 }
Chris@153 104
Chris@145 105 void
Chris@145 106 JAMSFeatureWriter::write(QString trackId,
Chris@145 107 const Transform &transform,
Chris@145 108 const Plugin::OutputDescriptor& ,
Chris@145 109 const Plugin::FeatureList& features,
Chris@145 110 std::string /* summaryType */)
Chris@145 111 {
Chris@145 112 QString transformId = transform.getIdentifier();
Chris@145 113
Chris@189 114 QTextStream *sptr = getOutputStream
Chris@189 115 (trackId, transformId, QTextCodec::codecForName("UTF-8"));
Chris@145 116 if (!sptr) {
Chris@145 117 throw FailedToOpenOutputStream(trackId, transformId);
Chris@145 118 }
Chris@145 119
Chris@167 120 DataId did(trackId, transform);
Chris@145 121
Chris@167 122 if (m_data.find(did) == m_data.end()) {
Chris@167 123 identifyTask(transform);
Chris@167 124 m_streamTracks[sptr].insert(trackId);
Chris@167 125 m_streamTasks[sptr].insert(m_tasks[transformId]);
Chris@167 126 m_streamData[sptr].insert(did);
Chris@152 127 }
Chris@152 128
Chris@167 129 QString d = m_data[did];
Chris@153 130
Chris@145 131 for (int i = 0; i < int(features.size()); ++i) {
Chris@153 132
Chris@167 133 if (d != "") {
Chris@153 134 d += ",\n";
Chris@153 135 }
Chris@153 136
Chris@153 137 d += " { ";
Chris@145 138
Chris@153 139 Plugin::Feature f(features[i]);
Chris@153 140
Chris@168 141 if (f.hasDuration) {
Chris@168 142 d += QString
Chris@168 143 ("\"start\": { \"value\": %1 }, "
Chris@168 144 "\"end\": { \"value\": %2 }")
Chris@168 145 .arg(realTime2Sec(f.timestamp))
Chris@168 146 .arg(realTime2Sec
Chris@168 147 (f.timestamp +
Chris@168 148 (f.hasDuration ? f.duration : Vamp::RealTime::zeroTime)));
Chris@168 149 } else {
Chris@153 150 d += QString("\"time\": { \"value\": %1 }")
Chris@153 151 .arg(realTime2Sec(f.timestamp));
Chris@153 152 }
Chris@153 153
Chris@153 154 if (f.label != "") {
Chris@153 155 d += QString(", \"label\": { \"value\": \"%2\" }")
Chris@153 156 .arg(f.label.c_str());
Chris@167 157 }
Chris@167 158
Chris@167 159 if (f.values.size() > 0) {
Chris@167 160 d += QString(", \"value\": [ ");
Chris@167 161 for (int j = 0; j < int(f.values.size()); ++j) {
Chris@169 162 if (isnan(f.values[j])) {
Chris@192 163 d += "\"NaN\"";
Chris@169 164 } else if (isinf(f.values[j])) {
Chris@192 165 d += "\"Inf\"";
Chris@169 166 } else {
Chris@192 167 d += QString("%1").arg(f.values[j]);
Chris@192 168 }
Chris@192 169 if (j + 1 < int(f.values.size())) {
Chris@192 170 d += ", ";
Chris@169 171 }
Chris@167 172 }
Chris@192 173 d += " ]";
Chris@153 174 }
Chris@153 175
Chris@153 176 d += " }";
Chris@145 177 }
Chris@153 178
Chris@167 179 m_data[did] = d;
Chris@145 180 }
Chris@145 181
Chris@145 182 void
Chris@169 183 JAMSFeatureWriter::setNofM(int n, int m)
Chris@169 184 {
Chris@169 185 if (m_singleFileName != "" || m_stdout) {
Chris@169 186 m_n = n;
Chris@169 187 m_m = m;
Chris@169 188 } else {
Chris@169 189 m_n = 1;
Chris@169 190 m_m = 1;
Chris@169 191 }
Chris@169 192 }
Chris@169 193
Chris@169 194 void
Chris@152 195 JAMSFeatureWriter::finish()
Chris@152 196 {
Chris@167 197 for (FileStreamMap::const_iterator stri = m_streams.begin();
Chris@167 198 stri != m_streams.end(); ++stri) {
Chris@152 199
Chris@167 200 QTextStream *sptr = stri->second;
Chris@167 201 QTextStream &stream = *sptr;
Chris@152 202
Chris@167 203 bool firstInStream = true;
Chris@167 204
Chris@167 205 for (TrackIds::const_iterator tri = m_streamTracks[sptr].begin();
Chris@167 206 tri != m_streamTracks[sptr].end(); ++tri) {
Chris@167 207
Chris@167 208 TrackId trackId = *tri;
Chris@167 209
Chris@169 210 if (firstInStream) {
Chris@169 211 if (m_streamTracks[sptr].size() > 1 || (m_m > 1 && m_n == 1)) {
Chris@169 212 stream << "[\n";
Chris@169 213 }
Chris@169 214 }
Chris@169 215
Chris@169 216 if (!firstInStream || (m_m > 1 && m_n > 1)) {
Chris@167 217 stream << ",\n";
Chris@167 218 }
Chris@167 219
Chris@167 220 stream << "{\n"
Chris@167 221 << QString("\"file_metadata\": {\n"
Chris@167 222 " \"filename\": \"%1\"")
Chris@167 223 .arg(QFileInfo(trackId).fileName());
Chris@167 224
Chris@167 225 if (m_trackMetadata.find(trackId) != m_trackMetadata.end()) {
Chris@167 226 if (m_trackMetadata[trackId].maker != "") {
Chris@167 227 stream << QString(",\n \"artist\": \"%1\"")
Chris@167 228 .arg(m_trackMetadata[trackId].maker);
Chris@167 229 }
Chris@167 230 if (m_trackMetadata[trackId].title != "") {
Chris@167 231 stream << QString(",\n \"title\": \"%1\"")
Chris@167 232 .arg(m_trackMetadata[trackId].title);
Chris@167 233 }
Chris@167 234 }
Chris@167 235
Chris@167 236 stream << "\n},\n";
Chris@167 237
Chris@167 238 bool firstInTrack = true;
Chris@167 239
Chris@167 240 for (Tasks::const_iterator ti = m_streamTasks[sptr].begin();
Chris@167 241 ti != m_streamTasks[sptr].end(); ++ti) {
Chris@167 242
Chris@167 243 Task task = *ti;
Chris@167 244
Chris@167 245 if (!firstInTrack) {
Chris@167 246 stream << ",\n";
Chris@167 247 }
Chris@167 248
Chris@167 249 stream << "\"" << getTaskKey(task) << "\": [\n";
Chris@167 250
Chris@167 251 bool firstInTask = true;
Chris@167 252
Chris@167 253 for (DataIds::const_iterator di = m_streamData[sptr].begin();
Chris@167 254 di != m_streamData[sptr].end(); ++di) {
Chris@167 255
Chris@167 256 DataId did = *di;
Chris@167 257
Chris@167 258 QString trackId = did.first;
Chris@167 259 Transform transform = did.second;
Chris@167 260
Chris@167 261 if (m_tasks[transform.getIdentifier()] != task) continue;
Chris@167 262
Chris@167 263 QString data = m_data[did];
Chris@167 264
Chris@167 265 if (!firstInTask) {
Chris@167 266 stream << ",\n";
Chris@167 267 }
Chris@167 268
Chris@167 269 stream << QString
Chris@167 270 ("{ \n"
Chris@167 271 " \"annotation_metadata\": {\n"
Chris@167 272 " \"annotation_tools\": \"Sonic Annotator v%2\",\n"
Chris@167 273 " \"data_source\": \"Automatic feature extraction\",\n"
Chris@167 274 " \"annotator\": {\n"
Chris@167 275 "%3"
Chris@167 276 " }\n"
Chris@167 277 " },\n"
Chris@167 278 " \"data\": [\n")
Chris@167 279 .arg(RUNNER_VERSION)
Chris@167 280 .arg(writeTransformToObjectContents(transform));
Chris@167 281
Chris@167 282 stream << data;
Chris@167 283
Chris@167 284 stream << "\n ]\n}";
Chris@167 285 firstInTask = false;
Chris@167 286 }
Chris@167 287
Chris@167 288 stream << "\n]";
Chris@167 289 firstInTrack = false;
Chris@167 290 }
Chris@167 291
Chris@167 292 stream << "\n}";
Chris@167 293 firstInStream = false;
Chris@152 294 }
Chris@167 295
Chris@169 296 if (!firstInStream) {
Chris@169 297 if (m_streamTracks[sptr].size() > 1 || (m_m > 1 && m_n == m_m)) {
Chris@169 298 stream << "\n]";
Chris@169 299 }
Chris@169 300 stream << "\n";
Chris@167 301 }
Chris@152 302 }
Chris@152 303
Chris@167 304 m_streamTracks.clear();
Chris@167 305 m_streamTasks.clear();
Chris@167 306 m_streamData.clear();
Chris@152 307 m_data.clear();
Chris@152 308
Chris@152 309 FileFeatureWriter::finish();
Chris@152 310 }
Chris@152 311
Chris@152 312 void
Chris@145 313 JAMSFeatureWriter::loadRDFDescription(const Transform &transform)
Chris@145 314 {
Chris@145 315 QString pluginId = transform.getPluginIdentifier();
Chris@145 316 if (m_rdfDescriptions.find(pluginId) != m_rdfDescriptions.end()) return;
Chris@145 317
Chris@145 318 if (m_network && !m_networkRetrieved) {
Chris@145 319 PluginRDFIndexer::getInstance()->indexConfiguredURLs();
Chris@145 320 m_networkRetrieved = true;
Chris@145 321 }
Chris@145 322
Chris@145 323 m_rdfDescriptions[pluginId] = PluginRDFDescription(pluginId);
Chris@145 324
Chris@145 325 if (m_rdfDescriptions[pluginId].haveDescription()) {
Chris@145 326 cerr << "NOTE: Have RDF description for plugin ID \""
Chris@145 327 << pluginId << "\"" << endl;
Chris@145 328 } else {
Chris@145 329 cerr << "NOTE: No RDF description for plugin ID \""
Chris@145 330 << pluginId << "\"" << endl;
Chris@145 331 if (!m_network) {
Chris@145 332 cerr << " Consider using the --json-network option to retrieve plugin descriptions" << endl;
Chris@145 333 cerr << " from the network where possible." << endl;
Chris@145 334 }
Chris@145 335 }
Chris@145 336 }
Chris@145 337
Chris@145 338 void
Chris@145 339 JAMSFeatureWriter::identifyTask(const Transform &transform)
Chris@145 340 {
Chris@145 341 QString transformId = transform.getIdentifier();
Chris@145 342 if (m_tasks.find(transformId) != m_tasks.end()) return;
Chris@145 343
Chris@145 344 loadRDFDescription(transform);
Chris@145 345
Chris@145 346 Task task = UnknownTask;
Chris@145 347
Chris@145 348 QString pluginId = transform.getPluginIdentifier();
Chris@145 349 QString outputId = transform.getOutput();
Chris@145 350
Chris@145 351 const PluginRDFDescription &desc = m_rdfDescriptions[pluginId];
Chris@145 352
Chris@145 353 if (desc.haveDescription()) {
Chris@145 354
Chris@145 355 PluginRDFDescription::OutputDisposition disp =
Chris@145 356 desc.getOutputDisposition(outputId);
Chris@145 357
Chris@145 358 QString af = "http://purl.org/ontology/af/";
Chris@145 359
Chris@145 360 if (disp == PluginRDFDescription::OutputSparse) {
Chris@145 361
Chris@145 362 QString eventUri = desc.getOutputEventTypeURI(outputId);
Chris@145 363
Chris@145 364 //!!! todo: allow user to prod writer for task type
Chris@145 365
Chris@145 366 if (eventUri == af + "Note") {
Chris@145 367 task = NoteTask;
Chris@145 368 } else if (eventUri == af + "Beat") {
Chris@145 369 task = BeatTask;
Chris@145 370 } else if (eventUri == af + "ChordSegment") {
Chris@145 371 task = ChordTask;
Chris@145 372 } else if (eventUri == af + "KeyChange") {
Chris@145 373 task = KeyTask;
Chris@145 374 } else if (eventUri == af + "KeySegment") {
Chris@145 375 task = KeyTask;
Chris@145 376 } else if (eventUri == af + "Onset") {
Chris@145 377 task = OnsetTask;
Chris@145 378 } else if (eventUri == af + "NonTonalOnset") {
Chris@145 379 task = OnsetTask;
Chris@145 380 } else if (eventUri == af + "Segment") {
Chris@145 381 task = SegmentTask;
Chris@145 382 } else if (eventUri == af + "SpeechSegment") {
Chris@145 383 task = SegmentTask;
Chris@145 384 } else if (eventUri == af + "StructuralSegment") {
Chris@145 385 task = SegmentTask;
Chris@145 386 } else {
Chris@145 387 cerr << "WARNING: Unsupported event type URI <"
Chris@145 388 << eventUri << ">, proceeding with UnknownTask type"
Chris@145 389 << endl;
Chris@145 390 }
Chris@145 391
Chris@145 392 } else {
Chris@145 393
Chris@145 394 cerr << "WARNING: Cannot currently write dense or track-level outputs to JSON format (only sparse ones). Will proceed using UnknownTask type, but this probably isn't going to work" << endl;
Chris@145 395 }
Chris@145 396 }
Chris@145 397
Chris@145 398 m_tasks[transformId] = task;
Chris@145 399 }
Chris@145 400
Chris@145 401 QString
Chris@145 402 JAMSFeatureWriter::getTaskKey(Task task)
Chris@145 403 {
Chris@145 404 switch (task) {
Chris@145 405 case UnknownTask: return "unknown";
Chris@145 406 case BeatTask: return "beat";
Chris@145 407 case OnsetTask: return "onset";
Chris@145 408 case ChordTask: return "chord";
Chris@145 409 case SegmentTask: return "segment";
Chris@145 410 case KeyTask: return "key";
Chris@145 411 case NoteTask: return "note";
Chris@145 412 case MelodyTask: return "melody";
Chris@145 413 case PitchTask: return "pitch";
Chris@145 414 }
Chris@145 415 return "unknown";
Chris@145 416 }
Chris@165 417
Chris@165 418 QString
Chris@165 419 JAMSFeatureWriter::writeTransformToObjectContents(const Transform &t)
Chris@165 420 {
Chris@165 421 QString json;
Chris@165 422 QString stpl(" \"%1\": \"%2\",\n");
Chris@165 423 QString ntpl(" \"%1\": %2,\n");
Chris@165 424
Chris@165 425 json += stpl.arg("plugin_id").arg(t.getPluginIdentifier());
Chris@165 426 json += stpl.arg("output_id").arg(t.getOutput());
Chris@165 427
Chris@165 428 if (t.getSummaryType() != Transform::NoSummary) {
Chris@165 429 json += stpl.arg("summary_type")
Chris@165 430 .arg(Transform::summaryTypeToString(t.getSummaryType()));
Chris@165 431 }
Chris@165 432
Chris@165 433 if (t.getPluginVersion() != QString()) {
Chris@165 434 json += stpl.arg("plugin_version").arg(t.getPluginVersion());
Chris@165 435 }
Chris@165 436
Chris@165 437 if (t.getProgram() != QString()) {
Chris@165 438 json += stpl.arg("program").arg(t.getProgram());
Chris@165 439 }
Chris@165 440
Chris@165 441 if (t.getStepSize() != 0) {
Chris@165 442 json += ntpl.arg("step_size").arg(t.getStepSize());
Chris@165 443 }
Chris@165 444
Chris@165 445 if (t.getBlockSize() != 0) {
Chris@165 446 json += ntpl.arg("block_size").arg(t.getBlockSize());
Chris@165 447 }
Chris@165 448
Chris@165 449 if (t.getWindowType() != HanningWindow) {
Chris@165 450 json += stpl.arg("window_type")
Chris@165 451 .arg(Window<float>::getNameForType(t.getWindowType()).c_str());
Chris@165 452 }
Chris@165 453
Chris@165 454 if (t.getStartTime() != RealTime::zeroTime) {
Chris@165 455 json += ntpl.arg("start").arg(t.getStartTime().toDouble());
Chris@165 456 }
Chris@165 457
Chris@165 458 if (t.getDuration() != RealTime::zeroTime) {
Chris@165 459 json += ntpl.arg("duration").arg(t.getDuration().toDouble());
Chris@165 460 }
Chris@165 461
Chris@165 462 if (t.getSampleRate() != 0) {
Chris@165 463 json += ntpl.arg("sample_rate").arg(t.getSampleRate());
Chris@165 464 }
Chris@165 465
Chris@165 466 if (!t.getParameters().empty()) {
Chris@165 467 json += QString(" \"parameters\": {\n");
Chris@165 468 Transform::ParameterMap parameters = t.getParameters();
Chris@165 469 for (Transform::ParameterMap::const_iterator i = parameters.begin();
Chris@165 470 i != parameters.end(); ++i) {
Chris@167 471 if (i != parameters.begin()) {
Chris@167 472 json += ",\n";
Chris@167 473 }
Chris@165 474 QString name = i->first;
Chris@165 475 float value = i->second;
Chris@167 476 json += QString(" \"%1\": %2").arg(name).arg(value);
Chris@165 477 }
Chris@167 478 json += QString("\n },\n");
Chris@165 479 }
Chris@165 480
Chris@165 481 // no trailing comma on final property:
Chris@165 482 json += QString(" \"transform_id\": \"%1\"\n").arg(t.getIdentifier());
Chris@165 483
Chris@165 484 return json;
Chris@165 485 }
Chris@165 486