annotate rdf/PluginRDFIndexer.cpp @ 476:acddcc3cca36

* Avoid deadlock in indexer
author Chris Cannam
date Fri, 07 Nov 2008 20:25:57 +0000
parents a70dcfed59c1
children e0784311a103
rev   line source
Chris@439 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@439 2
Chris@439 3 /*
Chris@439 4 Sonic Visualiser
Chris@439 5 An audio file viewer and annotation editor.
Chris@439 6 Centre for Digital Music, Queen Mary, University of London.
Chris@439 7 This file copyright 2008 QMUL.
Chris@439 8
Chris@439 9 This program is free software; you can redistribute it and/or
Chris@439 10 modify it under the terms of the GNU General Public License as
Chris@439 11 published by the Free Software Foundation; either version 2 of the
Chris@439 12 License, or (at your option) any later version. See the file
Chris@439 13 COPYING included with this distribution for more information.
Chris@439 14 */
Chris@439 15
Chris@439 16 #include "PluginRDFIndexer.h"
Chris@439 17
Chris@439 18 #include "SimpleSPARQLQuery.h"
Chris@439 19
Chris@467 20 #include "data/fileio/CachedFile.h"
Chris@471 21 #include "data/fileio/FileSource.h"
Chris@461 22 #include "data/fileio/PlaylistFileReader.h"
Chris@439 23 #include "plugin/PluginIdentifier.h"
Chris@439 24
Chris@457 25 #include "base/Profiler.h"
Chris@457 26
Chris@475 27 #include <vamp-hostsdk/PluginHostAdapter.h>
Chris@439 28
Chris@439 29 #include <QFileInfo>
Chris@439 30 #include <QDir>
Chris@439 31 #include <QUrl>
Chris@461 32 #include <QDateTime>
Chris@461 33 #include <QSettings>
Chris@461 34 #include <QFile>
Chris@439 35
Chris@439 36 #include <iostream>
Chris@439 37 using std::cerr;
Chris@439 38 using std::endl;
Chris@439 39 using std::vector;
Chris@439 40 using std::string;
Chris@439 41 using Vamp::PluginHostAdapter;
Chris@439 42
Chris@439 43 PluginRDFIndexer *
Chris@439 44 PluginRDFIndexer::m_instance = 0;
Chris@439 45
Chris@439 46 PluginRDFIndexer *
Chris@439 47 PluginRDFIndexer::getInstance()
Chris@439 48 {
Chris@439 49 if (!m_instance) m_instance = new PluginRDFIndexer();
Chris@439 50 return m_instance;
Chris@439 51 }
Chris@439 52
Chris@439 53 PluginRDFIndexer::PluginRDFIndexer()
Chris@439 54 {
Chris@439 55 vector<string> paths = PluginHostAdapter::getPluginPath();
Chris@439 56
Chris@439 57 QStringList filters;
Chris@439 58 filters << "*.n3";
Chris@439 59 filters << "*.N3";
Chris@439 60 filters << "*.rdf";
Chris@439 61 filters << "*.RDF";
Chris@439 62
Chris@439 63 // Search each Vamp plugin path for a .rdf file that either has
Chris@439 64 // name "soname", "soname:label" or "soname/label" plus RDF
Chris@439 65 // extension. Use that order of preference, and prefer n3 over
Chris@439 66 // rdf extension.
Chris@439 67
Chris@439 68 for (vector<string>::const_iterator i = paths.begin(); i != paths.end(); ++i) {
Chris@439 69
Chris@439 70 QDir dir(i->c_str());
Chris@439 71 if (!dir.exists()) continue;
Chris@439 72
Chris@439 73 QStringList entries = dir.entryList
Chris@439 74 (filters, QDir::Files | QDir::Readable);
Chris@439 75
Chris@439 76 for (QStringList::const_iterator j = entries.begin();
Chris@439 77 j != entries.end(); ++j) {
Chris@439 78 QFileInfo fi(dir.filePath(*j));
Chris@439 79 indexFile(fi.absoluteFilePath());
Chris@439 80 }
Chris@439 81
Chris@439 82 QStringList subdirs = dir.entryList
Chris@439 83 (QDir::AllDirs | QDir::NoDotAndDotDot | QDir::Readable);
Chris@439 84
Chris@439 85 for (QStringList::const_iterator j = subdirs.begin();
Chris@439 86 j != subdirs.end(); ++j) {
Chris@439 87 QDir subdir(dir.filePath(*j));
Chris@439 88 if (subdir.exists()) {
Chris@439 89 entries = subdir.entryList
Chris@439 90 (filters, QDir::Files | QDir::Readable);
Chris@439 91 for (QStringList::const_iterator k = entries.begin();
Chris@439 92 k != entries.end(); ++k) {
Chris@439 93 QFileInfo fi(subdir.filePath(*k));
Chris@439 94 indexFile(fi.absoluteFilePath());
Chris@439 95 }
Chris@439 96 }
Chris@439 97 }
Chris@439 98 }
Chris@439 99 }
Chris@439 100
Chris@439 101 PluginRDFIndexer::~PluginRDFIndexer()
Chris@439 102 {
Chris@461 103 QMutexLocker locker(&m_mutex);
Chris@439 104 }
Chris@439 105
Chris@461 106 bool
Chris@461 107 PluginRDFIndexer::indexConfiguredURLs()
Chris@461 108 {
Chris@461 109 std::cerr << "PluginRDFIndexer::indexConfiguredURLs" << std::endl;
Chris@461 110
Chris@461 111 QSettings settings;
Chris@461 112 settings.beginGroup("RDF");
Chris@461 113
Chris@461 114 QString indexKey("rdf-indices");
Chris@461 115 QStringList indices = settings.value(indexKey).toStringList();
Chris@461 116
Chris@461 117 for (int i = 0; i < indices.size(); ++i) {
Chris@461 118
Chris@461 119 QString index = indices[i];
Chris@461 120
Chris@461 121 std::cerr << "PluginRDFIndexer::indexConfiguredURLs: index url is "
Chris@461 122 << index.toStdString() << std::endl;
Chris@461 123
Chris@467 124 CachedFile cf(index);
Chris@467 125 if (!cf.isOK()) continue;
Chris@467 126
Chris@467 127 FileSource indexSource(cf.getLocalFilename());
Chris@461 128
Chris@461 129 PlaylistFileReader reader(indexSource);
Chris@461 130 if (!reader.isOK()) continue;
Chris@461 131
Chris@461 132 PlaylistFileReader::Playlist list = reader.load();
Chris@461 133 for (PlaylistFileReader::Playlist::const_iterator j = list.begin();
Chris@461 134 j != list.end(); ++j) {
Chris@461 135 std::cerr << "PluginRDFIndexer::indexConfiguredURLs: url is "
Chris@461 136 << j->toStdString() << std::endl;
Chris@461 137 indexURL(*j);
Chris@461 138 }
Chris@461 139 }
Chris@461 140
Chris@461 141 QString urlListKey("rdf-urls");
Chris@461 142 QStringList urls = settings.value(urlListKey).toStringList();
Chris@461 143
Chris@461 144 for (int i = 0; i < urls.size(); ++i) {
Chris@461 145 indexURL(urls[i]);
Chris@461 146 }
Chris@461 147
Chris@461 148 settings.endGroup();
Chris@461 149 return true;
Chris@461 150 }
Chris@461 151
Chris@439 152 QString
Chris@439 153 PluginRDFIndexer::getURIForPluginId(QString pluginId)
Chris@439 154 {
Chris@461 155 QMutexLocker locker(&m_mutex);
Chris@461 156
Chris@439 157 if (m_idToUriMap.find(pluginId) == m_idToUriMap.end()) return "";
Chris@439 158 return m_idToUriMap[pluginId];
Chris@439 159 }
Chris@439 160
Chris@439 161 QString
Chris@439 162 PluginRDFIndexer::getIdForPluginURI(QString uri)
Chris@439 163 {
Chris@476 164 m_mutex.lock();
Chris@461 165
Chris@439 166 if (m_uriToIdMap.find(uri) == m_uriToIdMap.end()) {
Chris@439 167
Chris@476 168 m_mutex.unlock();
Chris@476 169
Chris@439 170 // Haven't found this uri referenced in any document on the
Chris@439 171 // local filesystem; try resolving the pre-fragment part of
Chris@439 172 // the uri as a document URL and reading that if possible.
Chris@439 173
Chris@439 174 // Because we may want to refer to this document again, we
Chris@439 175 // cache it locally if it turns out to exist.
Chris@439 176
Chris@439 177 cerr << "PluginRDFIndexer::getIdForPluginURI: NOTE: Failed to find a local RDF document describing plugin <" << uri.toStdString() << ">: attempting to retrieve one remotely by guesswork" << endl;
Chris@439 178
Chris@439 179 QString baseUrl = QUrl(uri).toString(QUrl::RemoveFragment);
Chris@439 180
Chris@457 181 indexURL(baseUrl);
Chris@439 182
Chris@476 183 m_mutex.lock();
Chris@476 184
Chris@439 185 if (m_uriToIdMap.find(uri) == m_uriToIdMap.end()) {
Chris@439 186 m_uriToIdMap[uri] = "";
Chris@439 187 }
Chris@439 188 }
Chris@439 189
Chris@476 190 QString id = m_uriToIdMap[uri];
Chris@476 191 m_mutex.unlock();
Chris@476 192 return id;
Chris@439 193 }
Chris@439 194
Chris@439 195 QString
Chris@439 196 PluginRDFIndexer::getDescriptionURLForPluginId(QString pluginId)
Chris@439 197 {
Chris@461 198 QMutexLocker locker(&m_mutex);
Chris@461 199
Chris@439 200 if (m_idToDescriptionMap.find(pluginId) == m_idToDescriptionMap.end()) return "";
Chris@439 201 return m_idToDescriptionMap[pluginId];
Chris@439 202 }
Chris@439 203
Chris@439 204 QString
Chris@439 205 PluginRDFIndexer::getDescriptionURLForPluginURI(QString uri)
Chris@439 206 {
Chris@461 207 QMutexLocker locker(&m_mutex);
Chris@461 208
Chris@439 209 QString id = getIdForPluginURI(uri);
Chris@439 210 if (id == "") return "";
Chris@439 211 return getDescriptionURLForPluginId(id);
Chris@439 212 }
Chris@439 213
Chris@456 214 QStringList
Chris@456 215 PluginRDFIndexer::getIndexedPluginIds()
Chris@456 216 {
Chris@461 217 QMutexLocker locker(&m_mutex);
Chris@461 218
Chris@456 219 QStringList ids;
Chris@456 220 for (StringMap::const_iterator i = m_idToDescriptionMap.begin();
Chris@456 221 i != m_idToDescriptionMap.end(); ++i) {
Chris@456 222 ids.push_back(i->first);
Chris@456 223 }
Chris@456 224 return ids;
Chris@456 225 }
Chris@456 226
Chris@439 227 bool
Chris@439 228 PluginRDFIndexer::indexFile(QString filepath)
Chris@439 229 {
Chris@439 230 QUrl url = QUrl::fromLocalFile(filepath);
Chris@439 231 QString urlString = url.toString();
Chris@439 232 return indexURL(urlString);
Chris@439 233 }
Chris@461 234
Chris@439 235 bool
Chris@439 236 PluginRDFIndexer::indexURL(QString urlString)
Chris@439 237 {
Chris@457 238 Profiler profiler("PluginRDFIndexer::indexURL");
Chris@457 239
Chris@461 240 std::cerr << "PluginRDFIndexer::indexURL(" << urlString.toStdString() << ")" << std::endl;
Chris@461 241
Chris@461 242 QMutexLocker locker(&m_mutex);
Chris@461 243
Chris@457 244 QString localString = urlString;
Chris@457 245
Chris@457 246 if (FileSource::isRemote(urlString) &&
Chris@457 247 FileSource::canHandleScheme(urlString)) {
Chris@457 248
Chris@467 249 CachedFile cf(urlString);
Chris@467 250 if (!cf.isOK()) {
Chris@467 251 return false;
Chris@467 252 }
Chris@467 253
Chris@467 254 localString = cf.getLocalFilename();
Chris@457 255 }
Chris@457 256
Chris@439 257 // cerr << "PluginRDFIndexer::indexURL: url = <" << urlString.toStdString() << ">" << endl;
Chris@439 258
Chris@439 259 SimpleSPARQLQuery query
Chris@439 260 (QString
Chris@439 261 (
Chris@439 262 " PREFIX vamp: <http://purl.org/ontology/vamp/> "
Chris@439 263
Chris@439 264 " SELECT ?plugin ?library_id ?plugin_id "
Chris@439 265 " FROM <%1> "
Chris@439 266
Chris@439 267 " WHERE { "
Chris@439 268 " ?plugin a vamp:Plugin . "
Chris@439 269
Chris@439 270 // Make the identifier and library parts optional, so
Chris@439 271 // that we can check and report helpfully if one or both
Chris@439 272 // is absent instead of just getting no results
Chris@439 273
Chris@440 274 //!!! No -- because of rasqal's inability to correctly
Chris@440 275 // handle more than one OPTIONAL graph in a query, let's
Chris@440 276 // make identifier compulsory after all
Chris@440 277 //" OPTIONAL { ?plugin vamp:identifier ?plugin_id } . "
Chris@440 278
Chris@440 279 " ?plugin vamp:identifier ?plugin_id . "
Chris@439 280
Chris@439 281 " OPTIONAL { "
Chris@439 282 " ?library a vamp:PluginLibrary ; "
Chris@439 283 " vamp:available_plugin ?plugin ; "
Chris@439 284 " vamp:identifier ?library_id "
Chris@439 285 " } "
Chris@439 286 " } "
Chris@439 287 )
Chris@457 288 .arg(localString));
Chris@439 289
Chris@439 290 SimpleSPARQLQuery::ResultList results = query.execute();
Chris@439 291
Chris@439 292 if (!query.isOK()) {
Chris@439 293 cerr << "ERROR: PluginRDFIndexer::indexURL: ERROR: Failed to index document at <"
Chris@439 294 << urlString.toStdString() << ">: "
Chris@439 295 << query.getErrorString().toStdString() << endl;
Chris@439 296 return false;
Chris@439 297 }
Chris@439 298
Chris@439 299 if (results.empty()) {
Chris@439 300 cerr << "PluginRDFIndexer::indexURL: NOTE: Document at <"
Chris@439 301 << urlString.toStdString()
Chris@439 302 << "> does not describe any vamp:Plugin resources" << endl;
Chris@439 303 return false;
Chris@439 304 }
Chris@439 305
Chris@439 306 bool foundSomething = false;
Chris@439 307 bool addedSomething = false;
Chris@439 308
Chris@439 309 for (SimpleSPARQLQuery::ResultList::iterator i = results.begin();
Chris@439 310 i != results.end(); ++i) {
Chris@439 311
Chris@439 312 QString pluginUri = (*i)["plugin"].value;
Chris@439 313 QString soname = (*i)["library_id"].value;
Chris@439 314 QString identifier = (*i)["plugin_id"].value;
Chris@439 315
Chris@439 316 if (identifier == "") {
Chris@439 317 cerr << "PluginRDFIndexer::indexURL: NOTE: Document at <"
Chris@439 318 << urlString.toStdString()
Chris@439 319 << "> fails to define any vamp:identifier for plugin <"
Chris@439 320 << pluginUri.toStdString() << ">"
Chris@439 321 << endl;
Chris@439 322 continue;
Chris@439 323 }
Chris@439 324 if (soname == "") {
Chris@439 325 cerr << "PluginRDFIndexer::indexURL: NOTE: Document at <"
Chris@439 326 << urlString.toStdString() << "> does not associate plugin <"
Chris@439 327 << pluginUri.toStdString() << "> with any implementation library"
Chris@439 328 << endl;
Chris@439 329 continue;
Chris@439 330 }
Chris@439 331 /*
Chris@439 332 cerr << "PluginRDFIndexer::indexURL: Document for plugin \""
Chris@439 333 << soname.toStdString() << ":" << identifier.toStdString()
Chris@439 334 << "\" (uri <" << pluginUri.toStdString() << ">) is at url <"
Chris@439 335 << urlString.toStdString() << ">" << endl;
Chris@439 336 */
Chris@439 337 QString pluginId = PluginIdentifier::createIdentifier
Chris@439 338 ("vamp", soname, identifier);
Chris@439 339
Chris@439 340 foundSomething = true;
Chris@439 341
Chris@439 342 if (m_idToDescriptionMap.find(pluginId) != m_idToDescriptionMap.end()) {
Chris@439 343 cerr << "PluginRDFIndexer::indexURL: NOTE: Plugin id \""
Chris@439 344 << pluginId.toStdString() << "\", described in document at <"
Chris@439 345 << urlString.toStdString()
Chris@439 346 << ">, has already been described in document <"
Chris@439 347 << m_idToDescriptionMap[pluginId].toStdString()
Chris@439 348 << ">: ignoring this new description" << endl;
Chris@439 349 continue;
Chris@439 350 }
Chris@439 351
Chris@439 352 m_idToDescriptionMap[pluginId] = urlString;
Chris@439 353 m_idToUriMap[pluginId] = pluginUri;
Chris@439 354
Chris@439 355 addedSomething = true;
Chris@439 356
Chris@439 357 if (pluginUri != "") {
Chris@439 358 if (m_uriToIdMap.find(pluginUri) != m_uriToIdMap.end()) {
Chris@439 359 cerr << "PluginRDFIndexer::indexURL: WARNING: Found multiple plugins with the same URI:" << endl;
Chris@439 360 cerr << " 1. Plugin id \"" << m_uriToIdMap[pluginUri].toStdString() << "\"" << endl;
Chris@439 361 cerr << " described in <" << m_idToDescriptionMap[m_uriToIdMap[pluginUri]].toStdString() << ">" << endl;
Chris@439 362 cerr << " 2. Plugin id \"" << pluginId.toStdString() << "\"" << endl;
Chris@439 363 cerr << " described in <" << urlString.toStdString() << ">" << endl;
Chris@439 364 cerr << "both claim URI <" << pluginUri.toStdString() << ">" << endl;
Chris@439 365 } else {
Chris@439 366 m_uriToIdMap[pluginUri] = pluginId;
Chris@439 367 }
Chris@439 368 }
Chris@439 369 }
Chris@439 370
Chris@439 371 if (!foundSomething) {
Chris@439 372 cerr << "PluginRDFIndexer::indexURL: NOTE: Document at <"
Chris@439 373 << urlString.toStdString()
Chris@439 374 << "> does not sufficiently describe any plugins" << endl;
Chris@439 375 }
Chris@439 376
Chris@439 377 return addedSomething;
Chris@439 378 }
Chris@439 379
Chris@439 380
Chris@439 381