annotate rdf/RDFImporter.cpp @ 520:e340b2fb9471

* Make FileSource able to indicate its preferred content type (e.g. application/rdf+xml in preference to text/html for rdf content) * Temp directory on Windows -- make $HOME expand to homedrive+homepath instead of user profile location (which may be networked)
author Chris Cannam
date Thu, 11 Dec 2008 15:18:10 +0000
parents af7b6e55895b
children 76f6971c8433
rev   line source
Chris@439 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@439 2
Chris@439 3 /*
Chris@439 4 Sonic Visualiser
Chris@439 5 An audio file viewer and annotation editor.
Chris@439 6 Centre for Digital Music, Queen Mary, University of London.
Chris@439 7 This file copyright 2008 QMUL.
Chris@439 8
Chris@439 9 This program is free software; you can redistribute it and/or
Chris@439 10 modify it under the terms of the GNU General Public License as
Chris@439 11 published by the Free Software Foundation; either version 2 of the
Chris@439 12 License, or (at your option) any later version. See the file
Chris@439 13 COPYING included with this distribution for more information.
Chris@439 14 */
Chris@439 15
Chris@439 16 #include "RDFImporter.h"
Chris@439 17
Chris@439 18 #include <map>
Chris@439 19 #include <vector>
Chris@439 20
Chris@439 21 #include <iostream>
Chris@439 22 #include <cmath>
Chris@439 23
Chris@439 24 #include "SimpleSPARQLQuery.h"
Chris@439 25
Chris@439 26 #include "base/ProgressReporter.h"
Chris@439 27 #include "base/RealTime.h"
Chris@439 28
Chris@439 29 #include "data/model/SparseOneDimensionalModel.h"
Chris@439 30 #include "data/model/SparseTimeValueModel.h"
Chris@439 31 #include "data/model/EditableDenseThreeDimensionalModel.h"
Chris@449 32 #include "data/model/NoteModel.h"
Chris@510 33 #include "data/model/TextModel.h"
Chris@449 34 #include "data/model/RegionModel.h"
Chris@499 35 #include "data/model/WaveFileModel.h"
Chris@499 36
Chris@499 37 #include "data/fileio/FileSource.h"
Chris@520 38 #include "data/fileio/CachedFile.h"
Chris@439 39
Chris@439 40 using std::cerr;
Chris@439 41 using std::endl;
Chris@439 42
Chris@439 43 class RDFImporterImpl
Chris@439 44 {
Chris@439 45 public:
Chris@439 46 RDFImporterImpl(QString url, int sampleRate);
Chris@439 47 virtual ~RDFImporterImpl();
Chris@490 48
Chris@490 49 void setSampleRate(int sampleRate) { m_sampleRate = sampleRate; }
Chris@439 50
Chris@439 51 bool isOK();
Chris@439 52 QString getErrorString() const;
Chris@439 53
Chris@439 54 std::vector<Model *> getDataModels(ProgressReporter *);
Chris@439 55
Chris@439 56 protected:
Chris@439 57 QString m_uristring;
Chris@439 58 QString m_errorString;
Chris@499 59 std::map<QString, Model *> m_audioModelMap;
Chris@439 60 int m_sampleRate;
Chris@439 61
Chris@520 62 static bool m_prefixesLoaded;
Chris@520 63 static void loadPrefixes(ProgressReporter *reporter);
Chris@520 64
Chris@499 65 void getDataModelsAudio(std::vector<Model *> &, ProgressReporter *);
Chris@440 66 void getDataModelsSparse(std::vector<Model *> &, ProgressReporter *);
Chris@440 67 void getDataModelsDense(std::vector<Model *> &, ProgressReporter *);
Chris@440 68
Chris@493 69 void getDenseModelTitle(Model *, QString, QString);
Chris@493 70
Chris@440 71 void getDenseFeatureProperties(QString featureUri,
Chris@440 72 int &sampleRate, int &windowLength,
Chris@440 73 int &hopSize, int &width, int &height);
Chris@440 74
Chris@449 75 void fillModel(Model *, long, long, bool, std::vector<float> &, QString);
Chris@439 76 };
Chris@439 77
Chris@520 78 bool RDFImporterImpl::m_prefixesLoaded = false;
Chris@439 79
Chris@439 80 QString
Chris@439 81 RDFImporter::getKnownExtensions()
Chris@439 82 {
Chris@439 83 return "*.rdf *.n3 *.ttl";
Chris@439 84 }
Chris@439 85
Chris@439 86 RDFImporter::RDFImporter(QString url, int sampleRate) :
Chris@439 87 m_d(new RDFImporterImpl(url, sampleRate))
Chris@439 88 {
Chris@439 89 }
Chris@439 90
Chris@439 91 RDFImporter::~RDFImporter()
Chris@439 92 {
Chris@439 93 delete m_d;
Chris@439 94 }
Chris@439 95
Chris@490 96 void
Chris@490 97 RDFImporter::setSampleRate(int sampleRate)
Chris@490 98 {
Chris@490 99 m_d->setSampleRate(sampleRate);
Chris@490 100 }
Chris@490 101
Chris@439 102 bool
Chris@439 103 RDFImporter::isOK()
Chris@439 104 {
Chris@439 105 return m_d->isOK();
Chris@439 106 }
Chris@439 107
Chris@439 108 QString
Chris@439 109 RDFImporter::getErrorString() const
Chris@439 110 {
Chris@439 111 return m_d->getErrorString();
Chris@439 112 }
Chris@439 113
Chris@439 114 std::vector<Model *>
Chris@439 115 RDFImporter::getDataModels(ProgressReporter *r)
Chris@439 116 {
Chris@439 117 return m_d->getDataModels(r);
Chris@439 118 }
Chris@439 119
Chris@439 120 RDFImporterImpl::RDFImporterImpl(QString uri, int sampleRate) :
Chris@439 121 m_uristring(uri),
Chris@439 122 m_sampleRate(sampleRate)
Chris@439 123 {
Chris@439 124 }
Chris@439 125
Chris@439 126 RDFImporterImpl::~RDFImporterImpl()
Chris@439 127 {
Chris@492 128 SimpleSPARQLQuery::closeSingleSource(m_uristring);
Chris@439 129 }
Chris@439 130
Chris@439 131 bool
Chris@439 132 RDFImporterImpl::isOK()
Chris@439 133 {
Chris@439 134 return (m_errorString == "");
Chris@439 135 }
Chris@439 136
Chris@439 137 QString
Chris@439 138 RDFImporterImpl::getErrorString() const
Chris@439 139 {
Chris@439 140 return m_errorString;
Chris@439 141 }
Chris@439 142
Chris@439 143 std::vector<Model *>
Chris@439 144 RDFImporterImpl::getDataModels(ProgressReporter *reporter)
Chris@439 145 {
Chris@520 146 loadPrefixes(reporter);
Chris@520 147
Chris@439 148 std::vector<Model *> models;
Chris@439 149
Chris@499 150 getDataModelsAudio(models, reporter);
Chris@499 151
Chris@490 152 if (m_sampleRate == 0) {
Chris@490 153 std::cerr << "RDFImporter::getDataModels: invalid sample rate" << std::endl;
Chris@490 154 return models;
Chris@490 155 }
Chris@490 156
Chris@508 157 QString error;
Chris@508 158
Chris@508 159 if (!isOK()) error = m_errorString;
Chris@508 160 m_errorString = "";
Chris@508 161
Chris@440 162 getDataModelsDense(models, reporter);
Chris@440 163
Chris@440 164 if (!isOK()) error = m_errorString;
Chris@440 165 m_errorString = "";
Chris@440 166
Chris@440 167 getDataModelsSparse(models, reporter);
Chris@440 168
Chris@440 169 if (isOK()) m_errorString = error;
Chris@440 170
Chris@440 171 return models;
Chris@440 172 }
Chris@440 173
Chris@440 174 void
Chris@499 175 RDFImporterImpl::getDataModelsAudio(std::vector<Model *> &models,
Chris@499 176 ProgressReporter *reporter)
Chris@499 177 {
Chris@499 178 SimpleSPARQLQuery query = SimpleSPARQLQuery
Chris@499 179 (SimpleSPARQLQuery::QueryFromSingleSource,
Chris@499 180 QString
Chris@499 181 (
Chris@499 182 " PREFIX mo: <http://purl.org/ontology/mo/> "
Chris@499 183 " SELECT ?signal ?source FROM <%1> "
Chris@499 184 " WHERE { ?signal a mo:Signal ; mo:available_as ?source } "
Chris@499 185 )
Chris@499 186 .arg(m_uristring));
Chris@499 187
Chris@499 188 SimpleSPARQLQuery::ResultList results = query.execute();
Chris@499 189
Chris@499 190 for (int i = 0; i < results.size(); ++i) {
Chris@499 191
Chris@499 192 QString signal = results[i]["signal"].value;
Chris@499 193 QString source = results[i]["source"].value;
Chris@499 194
Chris@499 195 FileSource fs(source, reporter);
Chris@499 196 if (fs.isAvailable()) {
Chris@499 197 if (reporter) {
Chris@499 198 reporter->setMessage(RDFImporter::tr("Importing audio referenced in RDF..."));
Chris@499 199 }
Chris@499 200 fs.waitForData();
Chris@499 201 WaveFileModel *newModel = new WaveFileModel(fs, m_sampleRate);
Chris@499 202 if (newModel->isOK()) {
Chris@499 203 std::cerr << "Successfully created wave file model from source at \"" << source.toStdString() << "\"" << std::endl;
Chris@499 204 models.push_back(newModel);
Chris@499 205 m_audioModelMap[signal] = newModel;
Chris@499 206 if (m_sampleRate == 0) {
Chris@499 207 m_sampleRate = newModel->getSampleRate();
Chris@499 208 }
Chris@499 209 } else {
Chris@508 210 m_errorString = QString("Failed to create wave file model from source at \"%1\"").arg(source);
Chris@499 211 delete newModel;
Chris@499 212 }
Chris@508 213 } else {
Chris@508 214 m_errorString = QString("Signal source \"%1\" is not available").arg(source);
Chris@499 215 }
Chris@499 216 }
Chris@499 217 }
Chris@499 218
Chris@499 219 void
Chris@440 220 RDFImporterImpl::getDataModelsDense(std::vector<Model *> &models,
Chris@440 221 ProgressReporter *reporter)
Chris@440 222 {
Chris@499 223 if (reporter) {
Chris@499 224 reporter->setMessage(RDFImporter::tr("Importing dense signal data from RDF..."));
Chris@499 225 }
Chris@499 226
Chris@440 227 SimpleSPARQLQuery query = SimpleSPARQLQuery
Chris@489 228 (SimpleSPARQLQuery::QueryFromSingleSource,
Chris@480 229 QString
Chris@440 230 (
Chris@440 231 " PREFIX mo: <http://purl.org/ontology/mo/>"
Chris@440 232 " PREFIX af: <http://purl.org/ontology/af/>"
Chris@440 233
Chris@493 234 " SELECT ?feature ?feature_signal_type ?value "
Chris@440 235 " FROM <%1> "
Chris@440 236
Chris@440 237 " WHERE { "
Chris@440 238
Chris@493 239 " ?signal af:signal_feature ?feature . "
Chris@440 240
Chris@440 241 " ?feature a ?feature_signal_type ; "
Chris@440 242 " af:value ?value . "
Chris@440 243
Chris@440 244 " } "
Chris@440 245 )
Chris@440 246 .arg(m_uristring));
Chris@440 247
Chris@440 248 SimpleSPARQLQuery::ResultList results = query.execute();
Chris@440 249
Chris@440 250 if (!query.isOK()) {
Chris@440 251 m_errorString = query.getErrorString();
Chris@440 252 return;
Chris@440 253 }
Chris@440 254
Chris@440 255 if (query.wasCancelled()) {
Chris@440 256 m_errorString = "Query cancelled";
Chris@440 257 return;
Chris@440 258 }
Chris@440 259
Chris@440 260 for (int i = 0; i < results.size(); ++i) {
Chris@440 261
Chris@440 262 QString feature = results[i]["feature"].value;
Chris@440 263 QString type = results[i]["feature_signal_type"].value;
Chris@440 264 QString value = results[i]["value"].value;
Chris@440 265
Chris@440 266 int sampleRate = 0;
Chris@440 267 int windowLength = 0;
Chris@440 268 int hopSize = 0;
Chris@440 269 int width = 0;
Chris@440 270 int height = 0;
Chris@440 271 getDenseFeatureProperties
Chris@440 272 (feature, sampleRate, windowLength, hopSize, width, height);
Chris@440 273
Chris@440 274 if (sampleRate != 0 && sampleRate != m_sampleRate) {
Chris@440 275 cerr << "WARNING: Sample rate in dense feature description does not match our underlying rate -- using rate from feature description" << endl;
Chris@440 276 }
Chris@440 277 if (sampleRate == 0) sampleRate = m_sampleRate;
Chris@440 278
Chris@440 279 if (hopSize == 0) {
Chris@440 280 cerr << "WARNING: Dense feature description does not specify a hop size -- assuming 1" << endl;
Chris@440 281 hopSize = 1;
Chris@440 282 }
Chris@440 283
Chris@440 284 if (height == 0) {
Chris@440 285 cerr << "WARNING: Dense feature description does not specify feature signal dimensions -- assuming one-dimensional (height = 1)" << endl;
Chris@440 286 height = 1;
Chris@440 287 }
Chris@440 288
Chris@440 289 QStringList values = value.split(' ', QString::SkipEmptyParts);
Chris@440 290
Chris@440 291 if (values.empty()) {
Chris@440 292 cerr << "WARNING: Dense feature description does not specify any values!" << endl;
Chris@440 293 continue;
Chris@440 294 }
Chris@440 295
Chris@440 296 if (height == 1) {
Chris@440 297
Chris@440 298 SparseTimeValueModel *m = new SparseTimeValueModel
Chris@440 299 (sampleRate, hopSize, false);
Chris@440 300
Chris@440 301 for (int j = 0; j < values.size(); ++j) {
Chris@440 302 float f = values[j].toFloat();
Chris@440 303 SparseTimeValueModel::Point point(j * hopSize, f, "");
Chris@440 304 m->addPoint(point);
Chris@440 305 }
Chris@493 306
Chris@493 307 getDenseModelTitle(m, feature, type);
Chris@440 308
Chris@440 309 models.push_back(m);
Chris@440 310
Chris@440 311 } else {
Chris@440 312
Chris@440 313 EditableDenseThreeDimensionalModel *m =
Chris@440 314 new EditableDenseThreeDimensionalModel(sampleRate, hopSize,
Chris@440 315 height, false);
Chris@440 316
Chris@440 317 EditableDenseThreeDimensionalModel::Column column;
Chris@440 318
Chris@440 319 int x = 0;
Chris@440 320
Chris@440 321 for (int j = 0; j < values.size(); ++j) {
Chris@440 322 if (j % height == 0 && !column.empty()) {
Chris@440 323 m->setColumn(x++, column);
Chris@440 324 column.clear();
Chris@440 325 }
Chris@440 326 column.push_back(values[j].toFloat());
Chris@440 327 }
Chris@440 328
Chris@440 329 if (!column.empty()) {
Chris@440 330 m->setColumn(x++, column);
Chris@440 331 }
Chris@440 332
Chris@493 333 getDenseModelTitle(m, feature, type);
Chris@493 334
Chris@440 335 models.push_back(m);
Chris@440 336 }
Chris@440 337 }
Chris@440 338 }
Chris@440 339
Chris@440 340 void
Chris@493 341 RDFImporterImpl::getDenseModelTitle(Model *m,
Chris@493 342 QString featureUri,
Chris@493 343 QString featureTypeUri)
Chris@493 344 {
Chris@493 345 QString titleQuery = QString
Chris@493 346 (
Chris@493 347 " PREFIX dc: <http://purl.org/dc/elements/1.1/> "
Chris@493 348 " SELECT ?title "
Chris@493 349 " FROM <%1> "
Chris@493 350 " WHERE { "
Chris@493 351 " <%2> dc:title ?title . "
Chris@493 352 " } "
Chris@493 353 ).arg(m_uristring);
Chris@493 354
Chris@493 355 SimpleSPARQLQuery::Value v;
Chris@493 356
Chris@493 357 v = SimpleSPARQLQuery::singleResultQuery
Chris@493 358 (SimpleSPARQLQuery::QueryFromSingleSource,
Chris@493 359 titleQuery.arg(featureUri),
Chris@493 360 "title");
Chris@493 361
Chris@493 362 if (v.value != "") {
Chris@493 363 std::cerr << "RDFImporterImpl::getDenseModelTitle: Title (from signal) \"" << v.value.toStdString() << "\"" << std::endl;
Chris@493 364 m->setObjectName(v.value);
Chris@493 365 return;
Chris@493 366 }
Chris@493 367
Chris@493 368 v = SimpleSPARQLQuery::singleResultQuery
Chris@493 369 (SimpleSPARQLQuery::QueryFromSingleSource,
Chris@493 370 titleQuery.arg(featureTypeUri),
Chris@493 371 "title");
Chris@493 372
Chris@493 373 if (v.value != "") {
Chris@493 374 std::cerr << "RDFImporterImpl::getDenseModelTitle: Title (from signal type) \"" << v.value.toStdString() << "\"" << std::endl;
Chris@493 375 m->setObjectName(v.value);
Chris@493 376 return;
Chris@493 377 }
Chris@493 378
Chris@493 379 std::cerr << "RDFImporterImpl::getDenseModelTitle: No title available for feature <" << featureUri.toStdString() << ">" << std::endl;
Chris@493 380 }
Chris@493 381
Chris@493 382 void
Chris@440 383 RDFImporterImpl::getDenseFeatureProperties(QString featureUri,
Chris@440 384 int &sampleRate, int &windowLength,
Chris@440 385 int &hopSize, int &width, int &height)
Chris@440 386 {
Chris@489 387 SimpleSPARQLQuery::QueryType s = SimpleSPARQLQuery::QueryFromSingleSource;
Chris@489 388
Chris@440 389 QString dimensionsQuery
Chris@440 390 (
Chris@440 391 " PREFIX mo: <http://purl.org/ontology/mo/>"
Chris@440 392 " PREFIX af: <http://purl.org/ontology/af/>"
Chris@440 393
Chris@440 394 " SELECT ?dimensions "
Chris@440 395 " FROM <%1> "
Chris@440 396
Chris@440 397 " WHERE { "
Chris@440 398
Chris@440 399 " <%2> af:dimensions ?dimensions . "
Chris@440 400
Chris@440 401 " } "
Chris@440 402 );
Chris@440 403
Chris@440 404 SimpleSPARQLQuery::Value dimensionsValue =
Chris@489 405 SimpleSPARQLQuery::singleResultQuery
Chris@489 406 (s, dimensionsQuery.arg(m_uristring).arg(featureUri), "dimensions");
Chris@440 407
Chris@440 408 cerr << "Dimensions = \"" << dimensionsValue.value.toStdString() << "\""
Chris@440 409 << endl;
Chris@440 410
Chris@440 411 if (dimensionsValue.value != "") {
Chris@440 412 QStringList dl = dimensionsValue.value.split(" ");
Chris@440 413 if (dl.empty()) dl.push_back(dimensionsValue.value);
Chris@440 414 if (dl.size() > 0) height = dl[0].toInt();
Chris@440 415 if (dl.size() > 1) width = dl[1].toInt();
Chris@440 416 }
Chris@440 417
Chris@440 418 QString queryTemplate
Chris@440 419 (
Chris@440 420 " PREFIX mo: <http://purl.org/ontology/mo/>"
Chris@440 421 " PREFIX af: <http://purl.org/ontology/af/>"
Chris@440 422 " PREFIX tl: <http://purl.org/NET/c4dm/timeline.owl#>"
Chris@440 423
Chris@440 424 " SELECT ?%3 "
Chris@440 425 " FROM <%1> "
Chris@440 426
Chris@440 427 " WHERE { "
Chris@440 428
Chris@440 429 " <%2> mo:time ?time . "
Chris@440 430
Chris@440 431 " ?time a tl:Interval ; "
Chris@440 432 " tl:onTimeLine ?timeline . "
Chris@440 433
Chris@440 434 " ?map tl:rangeTimeLine ?timeline . "
Chris@440 435
Chris@440 436 " ?map tl:%3 ?%3 . "
Chris@440 437
Chris@440 438 " } "
Chris@440 439 );
Chris@440 440
Chris@440 441 // Another laborious workaround for rasqal's failure to handle
Chris@440 442 // multiple optionals properly
Chris@440 443
Chris@440 444 SimpleSPARQLQuery::Value srValue =
Chris@489 445 SimpleSPARQLQuery::singleResultQuery(s,
Chris@480 446 queryTemplate
Chris@440 447 .arg(m_uristring).arg(featureUri)
Chris@440 448 .arg("sampleRate"),
Chris@440 449 "sampleRate");
Chris@440 450 if (srValue.value != "") {
Chris@440 451 sampleRate = srValue.value.toInt();
Chris@440 452 }
Chris@440 453
Chris@440 454 SimpleSPARQLQuery::Value hopValue =
Chris@489 455 SimpleSPARQLQuery::singleResultQuery(s,
Chris@480 456 queryTemplate
Chris@440 457 .arg(m_uristring).arg(featureUri)
Chris@440 458 .arg("hopSize"),
Chris@440 459 "hopSize");
Chris@440 460 if (srValue.value != "") {
Chris@440 461 hopSize = hopValue.value.toInt();
Chris@440 462 }
Chris@440 463
Chris@440 464 SimpleSPARQLQuery::Value winValue =
Chris@489 465 SimpleSPARQLQuery::singleResultQuery(s,
Chris@480 466 queryTemplate
Chris@440 467 .arg(m_uristring).arg(featureUri)
Chris@440 468 .arg("windowLength"),
Chris@440 469 "windowLength");
Chris@440 470 if (winValue.value != "") {
Chris@440 471 windowLength = winValue.value.toInt();
Chris@440 472 }
Chris@440 473
Chris@440 474 cerr << "sr = " << sampleRate << ", hop = " << hopSize << ", win = " << windowLength << endl;
Chris@440 475 }
Chris@440 476
Chris@440 477 void
Chris@440 478 RDFImporterImpl::getDataModelsSparse(std::vector<Model *> &models,
Chris@440 479 ProgressReporter *reporter)
Chris@440 480 {
Chris@499 481 if (reporter) {
Chris@499 482 reporter->setMessage(RDFImporter::tr("Importing event data from RDF..."));
Chris@499 483 }
Chris@499 484
Chris@489 485 SimpleSPARQLQuery::QueryType s = SimpleSPARQLQuery::QueryFromSingleSource;
Chris@489 486
Chris@439 487 // Our query is intended to retrieve every thing that has a time,
Chris@439 488 // and every feature type and value associated with a thing that
Chris@439 489 // has a time.
Chris@439 490
Chris@439 491 // We will then need to refine this big bag of results into a set
Chris@439 492 // of data models.
Chris@439 493
Chris@439 494 // Results that have different source signals should go into
Chris@439 495 // different models.
Chris@439 496
Chris@439 497 // Results that have different feature types should go into
Chris@439 498 // different models.
Chris@439 499
Chris@439 500 // Results that are sparse should go into different models from
Chris@439 501 // those that are dense (we need to examine the timestamps to
Chris@439 502 // establish this -- if the timestamps are regular, the results
Chris@439 503 // are dense -- so we can't do it as we go along, only after
Chris@439 504 // collecting all results).
Chris@439 505
Chris@439 506 // Timed things that have features associated with them should not
Chris@439 507 // appear directly in any model -- their features should appear
Chris@439 508 // instead -- and these should be different models from those used
Chris@439 509 // for timed things that do not have features.
Chris@439 510
Chris@439 511 // As we load the results, we'll push them into a partially
Chris@439 512 // structured container that maps from source signal (URI as
Chris@439 513 // string) -> feature type (likewise) -> time -> list of values.
Chris@439 514 // If the source signal or feature type is unavailable, the empty
Chris@439 515 // string will do.
Chris@439 516
Chris@449 517 QString prefixes = QString(
Chris@439 518 " PREFIX event: <http://purl.org/NET/c4dm/event.owl#>"
Chris@449 519 " PREFIX tl: <http://purl.org/NET/c4dm/timeline.owl#>"
Chris@439 520 " PREFIX mo: <http://purl.org/ontology/mo/>"
Chris@439 521 " PREFIX af: <http://purl.org/ontology/af/>"
Chris@449 522 " PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>"
Chris@449 523 );
Chris@439 524
Chris@449 525 QString queryString = prefixes + QString(
Chris@449 526
Chris@499 527 " SELECT ?signal ?timed_thing ?event_type ?value"
Chris@439 528 " FROM <%1>"
Chris@439 529
Chris@439 530 " WHERE {"
Chris@440 531
Chris@440 532 " ?signal a mo:Signal ."
Chris@440 533
Chris@439 534 " ?signal mo:time ?interval ."
Chris@449 535 " ?interval tl:onTimeLine ?tl ."
Chris@449 536 " ?time tl:onTimeLine ?tl ."
Chris@449 537 " ?timed_thing event:time ?time ."
Chris@440 538 " ?timed_thing a ?event_type ."
Chris@440 539
Chris@439 540 " OPTIONAL {"
Chris@440 541 " ?timed_thing af:feature ?value"
Chris@439 542 " }"
Chris@439 543 " }"
Chris@439 544
Chris@439 545 ).arg(m_uristring);
Chris@439 546
Chris@449 547 QString timeQueryString = prefixes + QString(
Chris@449 548
Chris@449 549 " SELECT ?time FROM <%1> "
Chris@449 550 " WHERE { "
Chris@449 551 " <%2> event:time ?t . "
Chris@449 552 " ?t tl:at ?time . "
Chris@449 553 " } "
Chris@449 554
Chris@449 555 ).arg(m_uristring);
Chris@449 556
Chris@449 557 QString rangeQueryString = prefixes + QString(
Chris@449 558
Chris@449 559 " SELECT ?time ?duration FROM <%1> "
Chris@449 560 " WHERE { "
Chris@449 561 " <%2> event:time ?t . "
Chris@449 562 " ?t tl:beginsAt ?time . "
Chris@449 563 " ?t tl:duration ?duration . "
Chris@449 564 " } "
Chris@449 565
Chris@449 566 ).arg(m_uristring);
Chris@449 567
Chris@449 568 QString labelQueryString = prefixes + QString(
Chris@449 569
Chris@449 570 " SELECT ?label FROM <%1> "
Chris@449 571 " WHERE { "
Chris@449 572 " <%2> rdfs:label ?label . "
Chris@449 573 " } "
Chris@449 574
Chris@449 575 ).arg(m_uristring);
Chris@449 576
Chris@510 577 QString textQueryString = prefixes + QString(
Chris@510 578
Chris@510 579 " SELECT ?label FROM <%1> "
Chris@510 580 " WHERE { "
Chris@510 581 " <%2> af:text ?label . "
Chris@510 582 " } "
Chris@510 583
Chris@510 584 ).arg(m_uristring);
Chris@510 585
Chris@489 586 SimpleSPARQLQuery query(s, queryString);
Chris@439 587 query.setProgressReporter(reporter);
Chris@439 588
Chris@500 589 // cerr << "Query will be: " << queryString.toStdString() << endl;
Chris@439 590
Chris@439 591 SimpleSPARQLQuery::ResultList results = query.execute();
Chris@439 592
Chris@439 593 if (!query.isOK()) {
Chris@439 594 m_errorString = query.getErrorString();
Chris@440 595 return;
Chris@439 596 }
Chris@439 597
Chris@439 598 if (query.wasCancelled()) {
Chris@439 599 m_errorString = "Query cancelled";
Chris@440 600 return;
Chris@439 601 }
Chris@439 602
Chris@449 603 /*
Chris@449 604 This function is now only used for sparse data (for dense data
Chris@449 605 we would be in getDataModelsDense instead).
Chris@449 606
Chris@449 607 For sparse data, the determining factors in deciding what model
Chris@449 608 to use are: Do the features have values? and Do the features
Chris@449 609 have duration?
Chris@449 610
Chris@449 611 We can run through the results and check off whether we find
Chris@449 612 values and duration for each of the source+type keys, and then
Chris@449 613 run through the source+type keys pushing each of the results
Chris@449 614 into a suitable model.
Chris@449 615
Chris@449 616 Unfortunately, at this point we do not yet have any actual
Chris@449 617 timing data (time/duration) -- just the time URI.
Chris@449 618
Chris@449 619 What we _could_ do is to create one of each type of model at the
Chris@449 620 start, for each of the source+type keys, and then push each
Chris@449 621 feature into the relevant model depending on what we find out
Chris@449 622 about it. Then return only non-empty models.
Chris@449 623 */
Chris@449 624
Chris@449 625 // Map from signal source to event type to dimensionality to
Chris@449 626 // presence of duration to model ptr. Whee!
Chris@449 627 std::map<QString, std::map<QString, std::map<int, std::map<bool, Model *> > > >
Chris@449 628 modelMap;
Chris@449 629
Chris@439 630 for (int i = 0; i < results.size(); ++i) {
Chris@439 631
Chris@499 632 if (i % 4 == 0) {
Chris@499 633 if (reporter) reporter->setProgress(i/4);
Chris@499 634 }
Chris@499 635
Chris@499 636 QString source = results[i]["signal"].value;
Chris@449 637 QString type = results[i]["event_type"].value;
Chris@449 638 QString thinguri = results[i]["timed_thing"].value;
Chris@449 639
Chris@449 640 RealTime time;
Chris@449 641 RealTime duration;
Chris@439 642
Chris@449 643 bool haveTime = false;
Chris@449 644 bool haveDuration = false;
Chris@439 645
Chris@510 646 QString label = "";
Chris@510 647 bool text = (type.contains("Text") || type.contains("text")); // Ha, ha
Chris@510 648
Chris@510 649 if (text) {
Chris@510 650 label = SimpleSPARQLQuery::singleResultQuery
Chris@510 651 (s, textQueryString.arg(thinguri), "label").value;
Chris@510 652 }
Chris@510 653
Chris@510 654 if (label == "") {
Chris@510 655 label = SimpleSPARQLQuery::singleResultQuery
Chris@510 656 (s, labelQueryString.arg(thinguri), "label").value;
Chris@510 657 }
Chris@449 658
Chris@489 659 SimpleSPARQLQuery rangeQuery(s, rangeQueryString.arg(thinguri));
Chris@450 660 SimpleSPARQLQuery::ResultList rangeResults = rangeQuery.execute();
Chris@450 661 if (!rangeResults.empty()) {
Chris@450 662 // std::cerr << rangeResults.size() << " range results" << std::endl;
Chris@450 663 time = RealTime::fromXsdDuration
Chris@450 664 (rangeResults[0]["time"].value.toStdString());
Chris@450 665 duration = RealTime::fromXsdDuration
Chris@450 666 (rangeResults[0]["duration"].value.toStdString());
Chris@450 667 // std::cerr << "duration string " << rangeResults[0]["duration"].value.toStdString() << std::endl;
Chris@449 668 haveTime = true;
Chris@450 669 haveDuration = true;
Chris@449 670 } else {
Chris@450 671 QString timestring = SimpleSPARQLQuery::singleResultQuery
Chris@489 672 (s, timeQueryString.arg(thinguri), "time").value;
Chris@520 673 // std::cerr << "timestring = " << timestring.toStdString() << std::endl;
Chris@450 674 if (timestring != "") {
Chris@450 675 time = RealTime::fromXsdDuration(timestring.toStdString());
Chris@449 676 haveTime = true;
Chris@449 677 }
Chris@449 678 }
Chris@439 679
Chris@439 680 QString valuestring = results[i]["value"].value;
Chris@449 681 std::vector<float> values;
Chris@449 682
Chris@439 683 if (valuestring != "") {
Chris@449 684 QStringList vsl = valuestring.split(" ", QString::SkipEmptyParts);
Chris@449 685 for (int j = 0; j < vsl.size(); ++j) {
Chris@449 686 bool success = false;
Chris@449 687 float v = vsl[j].toFloat(&success);
Chris@449 688 if (success) values.push_back(v);
Chris@449 689 }
Chris@439 690 }
Chris@439 691
Chris@449 692 int dimensions = 1;
Chris@449 693 if (values.size() == 1) dimensions = 2;
Chris@449 694 else if (values.size() > 1) dimensions = 3;
Chris@449 695
Chris@449 696 Model *model = 0;
Chris@449 697
Chris@449 698 if (modelMap[source][type][dimensions].find(haveDuration) ==
Chris@449 699 modelMap[source][type][dimensions].end()) {
Chris@449 700
Chris@449 701 /*
Chris@449 702 std::cerr << "Creating new model: source = " << source.toStdString()
Chris@449 703 << ", type = " << type.toStdString() << ", dimensions = "
Chris@449 704 << dimensions << ", haveDuration = " << haveDuration
Chris@449 705 << ", time = " << time << ", duration = " << duration
Chris@449 706 << std::endl;
Chris@449 707 */
Chris@449 708
Chris@449 709 if (!haveDuration) {
Chris@449 710
Chris@449 711 if (dimensions == 1) {
Chris@449 712
Chris@510 713 if (text) {
Chris@510 714
Chris@510 715 model = new TextModel(m_sampleRate, 1, false);
Chris@510 716
Chris@510 717 } else {
Chris@510 718
Chris@510 719 model = new SparseOneDimensionalModel(m_sampleRate, 1, false);
Chris@510 720 }
Chris@449 721
Chris@449 722 } else if (dimensions == 2) {
Chris@449 723
Chris@510 724 if (text) {
Chris@510 725
Chris@510 726 model = new TextModel(m_sampleRate, 1, false);
Chris@510 727
Chris@510 728 } else {
Chris@510 729
Chris@510 730 model = new SparseTimeValueModel(m_sampleRate, 1, false);
Chris@510 731 }
Chris@449 732
Chris@449 733 } else {
Chris@449 734
Chris@449 735 // We don't have a three-dimensional sparse model,
Chris@449 736 // so use a note model. We do have some logic (in
Chris@449 737 // extractStructure below) for guessing whether
Chris@449 738 // this should after all have been a dense model,
Chris@449 739 // but it's hard to apply it because we don't have
Chris@449 740 // all the necessary timing data yet... hmm
Chris@449 741
Chris@449 742 model = new NoteModel(m_sampleRate, 1, false);
Chris@449 743 }
Chris@449 744
Chris@449 745 } else { // haveDuration
Chris@449 746
Chris@449 747 if (dimensions == 1 || dimensions == 2) {
Chris@449 748
Chris@449 749 // If our units are frequency or midi pitch, we
Chris@449 750 // should be using a note model... hm
Chris@449 751
Chris@449 752 model = new RegionModel(m_sampleRate, 1, false);
Chris@449 753
Chris@449 754 } else {
Chris@449 755
Chris@449 756 // We don't have a three-dimensional sparse model,
Chris@449 757 // so use a note model. We do have some logic (in
Chris@449 758 // extractStructure below) for guessing whether
Chris@449 759 // this should after all have been a dense model,
Chris@449 760 // but it's hard to apply it because we don't have
Chris@449 761 // all the necessary timing data yet... hmm
Chris@449 762
Chris@449 763 model = new NoteModel(m_sampleRate, 1, false);
Chris@449 764 }
Chris@449 765 }
Chris@449 766
Chris@499 767 if (m_audioModelMap.find(source) != m_audioModelMap.end()) {
Chris@499 768 std::cerr << "source model for " << model << " is " << m_audioModelMap[source] << std::endl;
Chris@499 769 model->setSourceModel(m_audioModelMap[source]);
Chris@499 770 }
Chris@499 771
Chris@493 772 QString titleQuery = QString
Chris@493 773 (
Chris@493 774 " PREFIX dc: <http://purl.org/dc/elements/1.1/> "
Chris@493 775 " SELECT ?title "
Chris@493 776 " FROM <%1> "
Chris@493 777 " WHERE { "
Chris@493 778 " <%2> dc:title ?title . "
Chris@493 779 " } "
Chris@493 780 ).arg(m_uristring).arg(type);
Chris@493 781 QString title = SimpleSPARQLQuery::singleResultQuery
Chris@493 782 (s, titleQuery, "title").value;
Chris@493 783 if (title != "") model->setObjectName(title);
Chris@493 784
Chris@449 785 modelMap[source][type][dimensions][haveDuration] = model;
Chris@449 786 models.push_back(model);
Chris@449 787 }
Chris@449 788
Chris@449 789 model = modelMap[source][type][dimensions][haveDuration];
Chris@449 790
Chris@449 791 if (model) {
Chris@449 792 long ftime = RealTime::realTime2Frame(time, m_sampleRate);
Chris@449 793 long fduration = RealTime::realTime2Frame(duration, m_sampleRate);
Chris@449 794 fillModel(model, ftime, fduration, haveDuration, values, label);
Chris@439 795 }
Chris@439 796 }
Chris@439 797 }
Chris@439 798
Chris@439 799 void
Chris@449 800 RDFImporterImpl::fillModel(Model *model,
Chris@449 801 long ftime,
Chris@449 802 long fduration,
Chris@449 803 bool haveDuration,
Chris@449 804 std::vector<float> &values,
Chris@449 805 QString label)
Chris@449 806 {
Chris@493 807 // std::cerr << "RDFImporterImpl::fillModel: adding point at frame " << ftime << std::endl;
Chris@492 808
Chris@449 809 SparseOneDimensionalModel *sodm =
Chris@449 810 dynamic_cast<SparseOneDimensionalModel *>(model);
Chris@449 811 if (sodm) {
Chris@449 812 SparseOneDimensionalModel::Point point(ftime, label);
Chris@449 813 sodm->addPoint(point);
Chris@449 814 return;
Chris@449 815 }
Chris@449 816
Chris@510 817 TextModel *tm =
Chris@510 818 dynamic_cast<TextModel *>(model);
Chris@510 819 if (tm) {
Chris@510 820 TextModel::Point point
Chris@510 821 (ftime,
Chris@510 822 values.empty() ? 0.5f : values[0] < 0.f ? 0.f : values[0] > 1.f ? 1.f : values[0], // I was young and feckless once too
Chris@510 823 label);
Chris@510 824 tm->addPoint(point);
Chris@510 825 return;
Chris@510 826 }
Chris@510 827
Chris@449 828 SparseTimeValueModel *stvm =
Chris@449 829 dynamic_cast<SparseTimeValueModel *>(model);
Chris@449 830 if (stvm) {
Chris@449 831 SparseTimeValueModel::Point point
Chris@449 832 (ftime, values.empty() ? 0.f : values[0], label);
Chris@449 833 stvm->addPoint(point);
Chris@449 834 return;
Chris@449 835 }
Chris@449 836
Chris@449 837 NoteModel *nm =
Chris@449 838 dynamic_cast<NoteModel *>(model);
Chris@449 839 if (nm) {
Chris@449 840 if (haveDuration) {
Chris@449 841 float value = 0.f, level = 1.f;
Chris@449 842 if (!values.empty()) {
Chris@449 843 value = values[0];
Chris@449 844 if (values.size() > 1) {
Chris@449 845 level = values[1];
Chris@449 846 }
Chris@449 847 }
Chris@449 848 NoteModel::Point point(ftime, value, fduration, level, label);
Chris@449 849 nm->addPoint(point);
Chris@449 850 } else {
Chris@449 851 float value = 0.f, duration = 1.f, level = 1.f;
Chris@449 852 if (!values.empty()) {
Chris@449 853 value = values[0];
Chris@449 854 if (values.size() > 1) {
Chris@449 855 duration = values[1];
Chris@449 856 if (values.size() > 2) {
Chris@449 857 level = values[2];
Chris@449 858 }
Chris@449 859 }
Chris@449 860 }
Chris@449 861 NoteModel::Point point(ftime, value, duration, level, label);
Chris@449 862 nm->addPoint(point);
Chris@449 863 }
Chris@449 864 return;
Chris@449 865 }
Chris@449 866
Chris@449 867 RegionModel *rm =
Chris@449 868 dynamic_cast<RegionModel *>(model);
Chris@449 869 if (rm) {
Chris@449 870 if (haveDuration) {
Chris@449 871 RegionModel::Point point
Chris@449 872 (ftime, values.empty() ? 0.f : values[0], fduration, label);
Chris@449 873 rm->addPoint(point);
Chris@449 874 } else {
Chris@449 875 // This won't actually happen -- we only create region models
Chris@449 876 // if we do have duration -- but just for completeness
Chris@449 877 float value = 0.f, duration = 1.f;
Chris@449 878 if (!values.empty()) {
Chris@449 879 value = values[0];
Chris@449 880 if (values.size() > 1) {
Chris@449 881 duration = values[1];
Chris@449 882 }
Chris@449 883 }
Chris@449 884 RegionModel::Point point(ftime, value, duration, label);
Chris@449 885 rm->addPoint(point);
Chris@449 886 }
Chris@449 887 return;
Chris@449 888 }
Chris@449 889
Chris@449 890 std::cerr << "WARNING: RDFImporterImpl::fillModel: Unknown or unexpected model type" << std::endl;
Chris@449 891 return;
Chris@449 892 }
Chris@449 893
Chris@490 894 RDFImporter::RDFDocumentType
Chris@490 895 RDFImporter::identifyDocumentType(QString url)
Chris@490 896 {
Chris@490 897 bool haveAudio = false;
Chris@490 898 bool haveAnnotations = false;
Chris@449 899
Chris@499 900 // This query is not expected to return any values, but if it
Chris@499 901 // executes successfully (leaving no error in the error string)
Chris@499 902 // then we know we have RDF
Chris@499 903 SimpleSPARQLQuery q(SimpleSPARQLQuery::QueryFromSingleSource,
Chris@499 904 QString(" SELECT ?x FROM <%1> WHERE { ?x <y> <z> } ")
Chris@499 905 .arg(url));
Chris@499 906
Chris@499 907 SimpleSPARQLQuery::ResultList r = q.execute();
Chris@499 908 if (!q.isOK()) {
Chris@499 909 return NotRDF;
Chris@499 910 }
Chris@499 911
Chris@490 912 SimpleSPARQLQuery::Value value =
Chris@490 913 SimpleSPARQLQuery::singleResultQuery
Chris@490 914 (SimpleSPARQLQuery::QueryFromSingleSource,
Chris@490 915 QString
Chris@490 916 (" PREFIX mo: <http://purl.org/ontology/mo/> "
Chris@490 917 " SELECT ?url FROM <%1> "
Chris@490 918 " WHERE { ?signal a mo:Signal ; mo:available_as ?url } "
Chris@490 919 ).arg(url),
Chris@490 920 "url");
Chris@490 921
Chris@490 922 if (value.type == SimpleSPARQLQuery::URIValue) {
Chris@490 923 haveAudio = true;
Chris@490 924 }
Chris@490 925
Chris@490 926 value =
Chris@490 927 SimpleSPARQLQuery::singleResultQuery
Chris@490 928 (SimpleSPARQLQuery::QueryFromSingleSource,
Chris@490 929 QString
Chris@490 930 (" PREFIX event: <http://purl.org/NET/c4dm/event.owl#> "
Chris@490 931 " SELECT ?thing FROM <%1> "
Chris@490 932 " WHERE { ?thing event:time ?time } "
Chris@490 933 ).arg(url),
Chris@490 934 "thing");
Chris@490 935
Chris@490 936 if (value.type == SimpleSPARQLQuery::URIValue) {
Chris@490 937 haveAnnotations = true;
Chris@490 938 }
Chris@490 939
Chris@490 940 if (!haveAnnotations) {
Chris@490 941
Chris@490 942 value =
Chris@490 943 SimpleSPARQLQuery::singleResultQuery
Chris@490 944 (SimpleSPARQLQuery::QueryFromSingleSource,
Chris@490 945 QString
Chris@490 946 (" PREFIX af: <http://purl.org/ontology/af/> "
Chris@490 947 " SELECT ?thing FROM <%1> "
Chris@490 948 " WHERE { ?signal af:signal_feature ?thing } "
Chris@490 949 ).arg(url),
Chris@490 950 "thing");
Chris@490 951
Chris@490 952 if (value.type == SimpleSPARQLQuery::URIValue) {
Chris@490 953 haveAnnotations = true;
Chris@490 954 }
Chris@490 955 }
Chris@490 956
Chris@490 957 if (haveAudio) {
Chris@490 958 if (haveAnnotations) {
Chris@490 959 return AudioRefAndAnnotations;
Chris@490 960 } else {
Chris@490 961 return AudioRef;
Chris@490 962 }
Chris@490 963 } else {
Chris@490 964 if (haveAnnotations) {
Chris@490 965 return Annotations;
Chris@490 966 } else {
Chris@499 967 return OtherRDFDocument;
Chris@490 968 }
Chris@490 969 }
Chris@492 970
Chris@492 971 SimpleSPARQLQuery::closeSingleSource(url);
Chris@490 972 }
Chris@490 973
Chris@520 974 void
Chris@520 975 RDFImporterImpl::loadPrefixes(ProgressReporter *reporter)
Chris@520 976 {
Chris@520 977 return;
Chris@520 978 //!!!
Chris@520 979 if (m_prefixesLoaded) return;
Chris@520 980 const char *prefixes[] = {
Chris@520 981 "http://purl.org/NET/c4dm/event.owl",
Chris@520 982 "http://purl.org/NET/c4dm/timeline.owl",
Chris@520 983 "http://purl.org/ontology/mo/",
Chris@520 984 "http://purl.org/ontology/af/",
Chris@520 985 "http://www.w3.org/2000/01/rdf-schema",
Chris@520 986 "http://purl.org/dc/elements/1.1/",
Chris@520 987 };
Chris@520 988 for (size_t i = 0; i < sizeof(prefixes)/sizeof(prefixes[0]); ++i) {
Chris@520 989 CachedFile cf(prefixes[i], reporter, "application/rdf+xml");
Chris@520 990 if (!cf.isOK()) continue;
Chris@520 991 SimpleSPARQLQuery::addSourceToModel
Chris@520 992 (QUrl::fromLocalFile(cf.getLocalFilename()).toString());
Chris@520 993 }
Chris@520 994 m_prefixesLoaded = true;
Chris@520 995 }