sonic-annotator: runner/FeatureExtractionManager.cpp comparison

comparison runner/FeatureExtractionManager.cpp @ 248:c8e5fcddf8be

Merge

author	Chris Cannam
date	Fri, 18 Mar 2016 15:15:55 +0000
parents	9a10c3ffff47
children	857ce6ecb163

comparison

equal deleted inserted replaced

-:5eadb3b687bb
+:c8e5fcddf8be
 << "\" with plugin step size " << actualStepSize
 << " and block size " << actualBlockSize
 << " (adapter step and block size " << m_blockSize << ")"
 << endl;
+//            cerr << "NOTE: That transform is: " << transform.toXmlString() << endl;
 if (pida) {
 cerr << "NOTE: PluginInputDomainAdapter timestamp adjustment is "
 << pida->getTimestampAdjustment() << endl;
 }
 }
 }
 m_transformPluginMap[transform] = plugin;
+//        cerr << "NOTE: Assigned plugin " << plugin << " for transform: " << transform.toXmlString() << endl;
 if (!(originalTransform == transform)) {
 m_transformPluginMap[originalTransform] = plugin;
+//            cerr << "NOTE: Also assigned plugin " << plugin << " for original transform: " << originalTransform.toXmlString() << endl;
 }
 } else {
 plugin = m_transformPluginMap[transform];
 }
 return result;
 }
 bool FeatureExtractionManager::addFeatureExtractorFromFile
-(QString transformXmlFile, const vector<FeatureWriter*> &writers)
+(QString transformFile, const vector<FeatureWriter*> &writers)
 {
+// We support two formats for transform description files: XML (in
+// a format specific to Sonic Annotator) and RDF/Turtle. The RDF
+// format can describe multiple transforms in a single file; the
+// XML format describes only one.
+// Possible errors we should report:
+//
+// 1. File does not exist or cannot be opened
+// 2. File is ostensibly XML, but is not parseable
+// 3. File is ostensibly Turtle, but is not parseable
+// 4. File is XML, but contains no valid transform (e.g. is unrelated XML)
+// 5. File is Turtle, but contains no valid transform(s)
+// 6. File is Turtle and contains both valid and invalid transform(s)
+{
+// We don't actually need to open this here yet; we just hoist
+// it to the top for error reporting purposes
+QFile file(transformFile);
+if (!file.open(QIODevice::ReadOnly | QIODevice::Text)) {
+// Error case 1. File does not exist or cannot be opened
+cerr << "ERROR: Failed to open transform file \"" << transformFile
+<< "\" for reading" << endl;
+return false;
+}
+}
 bool tryRdf = true;
+if (transformFile.endsWith(".xml") || transformFile.endsWith(".XML")) {
-if (transformXmlFile.endsWith(".xml") || transformXmlFile.endsWith(".XML")) {
 // We don't support RDF-XML (and nor does the underlying
 // parser library) so skip the RDF parse if the filename
 // suggests XML, to avoid puking out a load of errors from
 // feeding XML to a Turtle parser
 tryRdf = false;
 }
+bool tryXml = true;
+if (transformFile.endsWith(".ttl") || transformFile.endsWith(".TTL") ||
+transformFile.endsWith(".ntriples") || transformFile.endsWith(".NTRIPLES") ||
+transformFile.endsWith(".n3") || transformFile.endsWith(".N3")) {
+tryXml = false;
+}
+QString rdfError, xmlError;
 if (tryRdf) {
 RDFTransformFactory factory
-(QUrl::fromLocalFile(QFileInfo(transformXmlFile).absoluteFilePath())
+(QUrl::fromLocalFile(QFileInfo(transformFile).absoluteFilePath())
 .toString());
 ProgressPrinter printer("Parsing transforms RDF file");
 std::vector<Transform> transforms = factory.getTransforms(&printer);
-if (!factory.isOK()) {
-cerr << "WARNING: FeatureExtractionManager::addFeatureExtractorFromFile: Failed to parse transforms file: " << factory.getErrorString().toStdString() << endl;
+if (factory.isOK()) {
+if (transforms.empty()) {
+cerr << "ERROR: Transform file \"" << transformFile
+<< "\" is valid RDF but defines no transforms" << endl;
+return false;
+} else {
+bool success = true;
+for (int i = 0; i < (int)transforms.size(); ++i) {
+if (!addFeatureExtractor(transforms[i], writers)) {
+success = false;
+}
+}
+return success;
+}
+} else { // !factory.isOK()
 if (factory.isRDF()) {
-return false; // no point trying it as XML
+cerr << "ERROR: Invalid transform RDF file \"" << transformFile
-}
+<< "\": " << factory.getErrorString() << endl;
-}
+return false;
-if (!transforms.empty()) {
+}
-bool success = true;
-for (int i = 0; i < (int)transforms.size(); ++i) {
+// the not-RDF case: fall through without reporting an
-if (!addFeatureExtractor(transforms[i], writers)) {
+// error, so we try the file as XML, and if that fails, we
-success = false;
+// print a general unparseable-file error
-}
+rdfError = factory.getErrorString();
 }
-return success;
+}
-}
-}
+if (tryXml) {
-QFile file(transformXmlFile);
+QFile file(transformFile);
 if (!file.open(QIODevice::ReadOnly | QIODevice::Text)) {
-cerr << "ERROR: Failed to open transform XML file \""
+cerr << "ERROR: Failed to open transform file \""
-<< transformXmlFile.toStdString() << "\" for reading" << endl;
+<< transformFile.toStdString() << "\" for reading" << endl;
 return false;
 }
 QTextStream *qts = new QTextStream(&file);
 QString qs = qts->readAll();
 delete qts;
 file.close();
 Transform transform(qs);
+xmlError = transform.getErrorString();
-return addFeatureExtractor(transform, writers);
+if (xmlError == "") {
+if (transform.getIdentifier() == "") {
+cerr << "ERROR: Transform file \"" << transformFile
+<< "\" is valid XML but defines no transform" << endl;
+return false;
+}
+return addFeatureExtractor(transform, writers);
+}
+}
+cerr << "ERROR: Transform file \"" << transformFile
+<< "\" could not be parsed" << endl;
+if (rdfError != "") {
+cerr << "ERROR: RDF parser reported: " << rdfError << endl;
+}
+if (xmlError != "") {
+cerr << "ERROR: XML parser reported: " << xmlError << endl;
+}
+return false;
 }
 void FeatureExtractionManager::addSource(QString audioSource, bool willMultiplex)
 {
 std::cerr << "Have audio source: \"" << audioSource.toStdString() << "\"" << std::endl;
 // first audio source and we need it to establish default channel
 // count and sample rate
 if (m_channels == 0 || m_defaultSampleRate == 0) {
-ProgressPrinter retrievalProgress("Determining default rate and channel count from first input file...");
+ProgressPrinter retrievalProgress("Retrieving first input file to determine default rate and channel count...");
 FileSource source(audioSource, &retrievalProgress);
 if (!source.isAvailable()) {
 cerr << "ERROR: File or URL \"" << audioSource.toStdString()
 << "\" could not be located";
 if (!willMultiplex) {
 if (m_channels == 0) {
 m_channels = reader->getChannelCount();
 cerr << "Taking default channel count of "
-<< reader->getChannelCount() << " from file" << endl;
+<< reader->getChannelCount() << " from audio file" << endl;
 }
 }
 if (m_defaultSampleRate == 0) {
 m_defaultSampleRate = reader->getNativeRate();
 cerr << "Taking default sample rate of "
-<< reader->getNativeRate() << "Hz from file" << endl;
+<< reader->getNativeRate() << "Hz from audio file" << endl;
 cerr << "(Note: Default may be overridden by transforms)" << endl;
 }
 m_readyReaders[audioSource] = reader;
 }
 retrievalProgress.done();
 }
 if (!reader) {
 throw FailedToOpenFile(source);
 }
-return reader;
-}
-void
-FeatureExtractionManager::extractFeaturesFor(AudioFileReader *reader,
-QString audioSource)
-{
-// Note: This also deletes reader
-cerr << "Audio file \"" << audioSource.toStdString() << "\": "
-<< reader->getChannelCount() << "ch at "
-<< reader->getNativeRate() << "Hz" << endl;
 if (reader->getChannelCount() != m_channels ||
 reader->getNativeRate() != m_sampleRate) {
 cerr << "NOTE: File will be mixed or resampled for processing, to: "
 << m_channels << "ch at "
 << m_sampleRate << "Hz" << endl;
 }
+return reader;
+}
+void
+FeatureExtractionManager::extractFeaturesFor(AudioFileReader *reader,
+QString audioSource)
+{
+// Note: This also deletes reader
+cerr << "Audio file \"" << audioSource.toStdString() << "\": "
+<< reader->getChannelCount() << "ch at "
+<< reader->getNativeRate() << "Hz" << endl;
 // allocate audio buffers
 float **data = new float *[m_channels];
 for (int c = 0; c < m_channels; ++c) {
 data[c] = new float[m_blockSize];
 foreach (Plugin *plugin, m_orderedPlugins) {
 PluginMap::iterator pi = m_plugins.find(plugin);
-std::cerr << "Calling reset on " << plugin << std::endl;
+//        std::cerr << "Calling reset on " << plugin << std::endl;
 plugin->reset();
 for (TransformWriterMap::iterator ti = pi->second.begin();
 ti != pi->second.end(); ++ti) {
 if (!m_summariesOnly) {
 writeFeatures(audioSource, plugin, featureSet);
 }
 if (!m_summaries.empty()) {
+// Summaries requested on the command line, for all transforms
 PluginSummarisingAdapter *adapter =
 dynamic_cast<PluginSummarisingAdapter *>(plugin);
 if (!adapter) {
 cerr << "WARNING: Summaries requested, but plugin is not a summarising adapter" << endl;
 } else {
 //!!! on whether their features have duration or
 //!!! not
 featureSet = adapter->getSummaryForAllOutputs
 (getSummaryType(*sni),
 PluginSummarisingAdapter::ContinuousTimeAverage);
-writeFeatures(audioSource, plugin, featureSet,//!!! *sni);
+writeFeatures(audioSource, plugin, featureSet,
 Transform::stringToSummaryType(sni->c_str()));
 }
 }
 }
+// Summaries specified in transform definitions themselves
 writeSummaries(audioSource, plugin);
 }
 extractionProgress.done();
 for (TransformWriterMap::const_iterator ti = pi->second.begin();
 ti != pi->second.end(); ++ti) {
 const Transform &transform = ti->first;
+//        cerr << "FeatureExtractionManager::writeSummaries: plugin is " << plugin
+//             << ", found transform: " << transform.toXmlString() << endl;
 Transform::SummaryType summaryType = transform.getSummaryType();
 PluginSummarisingAdapter::SummaryType pType =
 (PluginSummarisingAdapter::SummaryType)summaryType;
 if (transform.getSummaryType() == Transform::NoSummary) {
+//            cerr << "(no summary, continuing)" << endl;
 continue;
 }
 PluginSummarisingAdapter *adapter =
 dynamic_cast<PluginSummarisingAdapter *>(plugin);
 }
 Plugin::FeatureSet featureSet = adapter->getSummaryForAllOutputs
 (pType, PluginSummarisingAdapter::ContinuousTimeAverage);
-//        cout << "summary type " << int(pType) << " for transform:" << endl << transform.toXmlString().toStdString()<< endl << "... feature set with " << featureSet.size() << " elts" << endl;
+//        cerr << "summary type " << int(pType) << " for transform:" << endl << transform.toXmlString().toStdString()<< endl << "... feature set with " << featureSet.size() << " elts" << endl;
 writeFeatures(audioSource, plugin, featureSet, summaryType);
 }
 }
 Transform::SummaryType summaryType)
 {
 // caller should have ensured plugin is in m_plugins
 PluginMap::iterator pi = m_plugins.find(plugin);
+// Write features from the feature set passed in, according to the
+// transforms listed for the given plugin with the given summary type
 for (TransformWriterMap::const_iterator ti = pi->second.begin();
 ti != pi->second.end(); ++ti) {
 const Transform &transform = ti->first;
 const vector<FeatureWriter *> &writers = ti->second;
-if (transform.getSummaryType() != Transform::NoSummary &&
+//        cerr << "writeFeatures: plugin " << plugin << " has transform: " << transform.toXmlString() << endl;
-m_summaries.empty() &&
-summaryType == Transform::NoSummary) {
+if (transform.getSummaryType() == Transform::NoSummary &&
-continue;
+!m_summaries.empty()) {
-}
+//            cerr << "transform has no summary, but summaries requested on command line, so going for it anyway" << endl;
+} else if (transform.getSummaryType() != summaryType) {
-if (transform.getSummaryType() != Transform::NoSummary &&
+// Either we're not writing a summary and the transform
-summaryType != Transform::NoSummary &&
+// has one, or we're writing a summary but the transform
-transform.getSummaryType() != summaryType) {
+// has none or a different one; either way, skip it
+//            cerr << "summary type differs from passed-in one " << summaryType << endl;
 continue;
 }
 string outputId = transform.getOutput().toStdString();
 int outputIndex = m_pluginOutputIndices[outputId];
 Plugin::FeatureSet::const_iterator fsi = features.find(outputIndex);
 if (fsi == features.end()) continue;
+//        cerr << "this transform has " << writers.size() << " writer(s)" << endl;
 for (int j = 0; j < (int)writers.size(); ++j) {
 writers[j]->write
 (audioSource, transform, desc, fsi->second,
 Transform::summaryTypeToString(summaryType).toStdString());
 }

Mercurial > hg > sonic-annotator

comparison runner/FeatureExtractionManager.cpp @ 248:c8e5fcddf8be