annotate query.cpp @ 444:4fe90fd568fc api-inversion

No more audioDB::set_up_query{,_from_key}. Go through audiodb_query_spec_qpointers() instead. It's a little bit horrible, but less horrible than two almost-identical separate functions...
author mas01cr
date Wed, 24 Dec 2008 10:56:37 +0000
parents cb44e57a96fa
children d1771f436ff7
rev   line source
mas01cr@239 1 #include "audioDB.h"
mas01cr@239 2 #include "reporter.h"
mas01cr@239 3
mas01cr@422 4 #include "audioDB-internals.h"
mas01cr@422 5 #include "accumulators.h"
mas01cr@422 6
mas01cr@444 7 bool audiodb_powers_acceptable(adb_query_refine_t *r, double p1, double p2) {
mas01cr@425 8 if (r->flags & ADB_REFINE_ABSOLUTE_THRESHOLD) {
mas01cr@425 9 if ((p1 < r->absolute_threshold) || (p2 < r->absolute_threshold)) {
mas01cr@239 10 return false;
mas01cr@239 11 }
mas01cr@239 12 }
mas01cr@425 13 if (r->flags & ADB_REFINE_RELATIVE_THRESHOLD) {
mas01cr@425 14 if (fabs(p1-p2) > fabs(r->relative_threshold)) {
mas01cr@239 15 return false;
mas01cr@239 16 }
mas01cr@239 17 }
mas01cr@239 18 return true;
mas01cr@239 19 }
mas01cr@239 20
mas01cr@239 21 void audioDB::query(const char* dbName, const char* inFile, adb__queryResponse *adbQueryResponse) {
mas01cr@425 22
mas01cr@431 23 // init database tables and dbH first
mas01cr@431 24 if(query_from_key)
mas01cr@431 25 initTables(dbName);
mas01cr@431 26 else
mas01cr@431 27 initTables(dbName, inFile);
mas01cr@431 28
mas01cr@435 29 adb_query_spec_t qspec;
mas01cr@444 30 adb_datum_t datum = {0};
mas01cr@435 31
mas01cr@435 32 qspec.refine.flags = 0;
mas01cr@425 33 /* FIXME: trackFile / ADB_REFINE_KEYLIST */
mas01cr@425 34 if(radius) {
mas01cr@435 35 qspec.refine.flags |= ADB_REFINE_RADIUS;
mas01cr@435 36 qspec.refine.radius = radius;
mas01cr@425 37 }
mas01cr@425 38 if(use_absolute_threshold) {
mas01cr@435 39 qspec.refine.flags |= ADB_REFINE_ABSOLUTE_THRESHOLD;
mas01cr@435 40 qspec.refine.absolute_threshold = absolute_threshold;
mas01cr@425 41 }
mas01cr@425 42 if(use_relative_threshold) {
mas01cr@435 43 qspec.refine.flags |= ADB_REFINE_RELATIVE_THRESHOLD;
mas01cr@435 44 qspec.refine.relative_threshold = relative_threshold;
mas01cr@425 45 }
mas01cr@425 46 if(usingTimes) {
mas01cr@435 47 qspec.refine.flags |= ADB_REFINE_DURATION_RATIO;
mas01cr@435 48 qspec.refine.duration_ratio = timesTol;
mas01cr@425 49 }
mas01cr@439 50 /* FIXME: not sure about this any more; maybe it belongs in
mas01cr@439 51 query_id? Or maybe we just don't need a flag for it? */
mas01cr@439 52 qspec.refine.hopsize = sequenceHop;
mas01cr@425 53 if(sequenceHop != 1) {
mas01cr@435 54 qspec.refine.flags |= ADB_REFINE_HOP_SIZE;
mas01cr@425 55 }
mas01cr@425 56
mas01cr@444 57 if(query_from_key) {
mas01cr@444 58 datum.key = key;
mas01cr@444 59 } else {
mas01cr@444 60 int fd;
mas01cr@444 61 struct stat st;
mas01cr@444 62
mas01cr@444 63 /* FIXME: around here there are all sorts of hideous leaks. */
mas01cr@444 64 fd = open(inFile, O_RDONLY);
mas01cr@444 65 if(fd < 0) {
mas01cr@444 66 error("failed to open feature file", inFile);
mas01cr@444 67 }
mas01cr@444 68 fstat(fd, &st);
mas01cr@444 69 read(fd, &datum.dim, sizeof(uint32_t));
mas01cr@444 70 datum.nvectors = (st.st_size - sizeof(uint32_t)) / (datum.dim * sizeof(double));
mas01cr@444 71 datum.data = (double *) malloc(st.st_size - sizeof(uint32_t));
mas01cr@444 72 read(fd, datum.data, st.st_size - sizeof(uint32_t));
mas01cr@444 73 close(fd);
mas01cr@444 74 if(usingPower) {
mas01cr@444 75 uint32_t one;
mas01cr@444 76 fd = open(powerFileName, O_RDONLY);
mas01cr@444 77 if(fd < 0) {
mas01cr@444 78 error("failed to open power file", powerFileName);
mas01cr@444 79 }
mas01cr@444 80 read(fd, &one, sizeof(uint32_t));
mas01cr@444 81 if(one != 1) {
mas01cr@444 82 error("malformed power file dimensionality", powerFileName);
mas01cr@444 83 }
mas01cr@444 84 datum.power = (double *) malloc(datum.nvectors * sizeof(double));
mas01cr@444 85 if(read(fd, datum.power, datum.nvectors * sizeof(double)) != (ssize_t) (datum.nvectors * sizeof(double))) {
mas01cr@444 86 error("malformed power file", powerFileName);
mas01cr@444 87 }
mas01cr@444 88 close(fd);
mas01cr@444 89 }
mas01cr@444 90 if(usingTimes) {
mas01cr@444 91 datum.times = (double *) malloc(2 * datum.nvectors * sizeof(double));
mas01cr@444 92 insertTimeStamps(datum.nvectors, timesFile, datum.times);
mas01cr@444 93 }
mas01cr@444 94 }
mas01cr@444 95
mas01cr@444 96 qspec.qid.datum = &datum;
mas01cr@435 97 qspec.qid.sequence_length = sequenceLength;
mas01cr@435 98 qspec.qid.flags = usingQueryPoint ? 0 : ADB_QUERY_ID_FLAG_EXHAUSTIVE;
mas01cr@435 99 qspec.qid.sequence_start = queryPoint;
mas01cr@435 100
mas01cr@431 101 switch(queryType) {
mas01cr@431 102 case O2_POINT_QUERY:
mas01cr@435 103 qspec.qid.sequence_length = 1;
mas01cr@435 104 qspec.params.accumulation = ADB_ACCUMULATION_DB;
mas01cr@435 105 qspec.params.distance = ADB_DISTANCE_DOT_PRODUCT;
mas01cr@435 106 qspec.params.npoints = pointNN;
mas01cr@435 107 qspec.params.ntracks = 0;
mas01cr@431 108 reporter = new pointQueryReporter< std::greater < NNresult > >(pointNN);
mas01cr@431 109 break;
mas01cr@431 110 case O2_TRACK_QUERY:
mas01cr@435 111 qspec.qid.sequence_length = 1;
mas01cr@435 112 qspec.params.accumulation = ADB_ACCUMULATION_PER_TRACK;
mas01cr@435 113 qspec.params.distance = ADB_DISTANCE_DOT_PRODUCT;
mas01cr@435 114 qspec.params.npoints = pointNN;
mas01cr@435 115 qspec.params.ntracks = trackNN;
mas01cr@431 116 reporter = new trackAveragingReporter< std::greater< NNresult > >(pointNN, trackNN, dbH->numFiles);
mas01cr@431 117 break;
mas01cr@431 118 case O2_SEQUENCE_QUERY:
mas01cr@431 119 case O2_N_SEQUENCE_QUERY:
mas01cr@435 120 qspec.params.accumulation = ADB_ACCUMULATION_PER_TRACK;
mas01cr@435 121 qspec.params.distance = no_unit_norming ? ADB_DISTANCE_EUCLIDEAN : ADB_DISTANCE_EUCLIDEAN_NORMED;
mas01cr@435 122 qspec.params.npoints = pointNN;
mas01cr@435 123 qspec.params.ntracks = trackNN;
mas01cr@431 124 switch(queryType) {
mas01cr@431 125 case O2_SEQUENCE_QUERY:
mas01cr@435 126 if(!(qspec.refine.flags & ADB_REFINE_RADIUS)) {
mas01cr@431 127 reporter = new trackAveragingReporter< std::less< NNresult > >(pointNN, trackNN, dbH->numFiles);
mas01cr@435 128 } else if (index_exists(adb->path, qspec.refine.radius, qspec.qid.sequence_length)) {
mas01cr@435 129 char* indexName = index_get_name(adb->path, qspec.refine.radius, qspec.qid.sequence_length);
mas01cr@431 130 lsh = index_allocate(indexName, false);
mas01cr@431 131 reporter = new trackSequenceQueryRadReporter(trackNN, index_to_trackID(lsh->get_maxp(), lsh_n_point_bits)+1);
mas01cr@431 132 delete[] indexName;
mas01cr@431 133 } else {
mas01cr@431 134 reporter = new trackSequenceQueryRadReporter(trackNN, dbH->numFiles);
mas01cr@431 135 }
mas01cr@431 136 break;
mas01cr@431 137 case O2_N_SEQUENCE_QUERY:
mas01cr@435 138 if(!(qspec.refine.flags & ADB_REFINE_RADIUS)) {
mas01cr@431 139 reporter = new trackSequenceQueryNNReporter< std::less < NNresult > >(pointNN, trackNN, dbH->numFiles);
mas01cr@435 140 } else if (index_exists(adb->path, qspec.refine.radius, qspec.qid.sequence_length)){
mas01cr@435 141 char* indexName = index_get_name(adb->path, qspec.refine.radius, qspec.qid.sequence_length);
mas01cr@431 142 lsh = index_allocate(indexName, false);
mas01cr@431 143 reporter = new trackSequenceQueryRadNNReporter(pointNN,trackNN, index_to_trackID(lsh->get_maxp(), lsh_n_point_bits)+1);
mas01cr@431 144 delete[] indexName;
mas01cr@431 145 } else {
mas01cr@431 146 reporter = new trackSequenceQueryRadNNReporter(pointNN,trackNN, dbH->numFiles);
mas01cr@431 147 }
mas01cr@431 148 break;
mas01cr@431 149 }
mas01cr@431 150 break;
mas01cr@431 151 case O2_ONE_TO_ONE_N_SEQUENCE_QUERY:
mas01cr@435 152 qspec.params.accumulation = ADB_ACCUMULATION_ONE_TO_ONE;
mas01cr@435 153 qspec.params.distance = ADB_DISTANCE_EUCLIDEAN_NORMED;
mas01cr@435 154 qspec.params.npoints = 0;
mas01cr@435 155 qspec.params.ntracks = 0;
mas01cr@431 156 break;
mas01cr@431 157 default:
mas01cr@431 158 error("unrecognized queryType");
mas01cr@431 159 }
mas01mc@292 160
mas01mc@292 161 // keyKeyPos requires dbH to be initialized
mas01cr@430 162 if(query_from_key && (!key || (query_from_key_index = audiodb_key_index(adb, key)) == (uint32_t) -1))
mas01cr@430 163 error("Query key not found", key);
mas01cr@431 164
mas01cr@435 165 switch(qspec.params.distance) {
mas01cr@431 166 case ADB_DISTANCE_DOT_PRODUCT:
mas01cr@435 167 switch(qspec.params.accumulation) {
mas01cr@431 168 case ADB_ACCUMULATION_DB:
mas01cr@435 169 accumulator = new DBAccumulator<adb_result_dist_gt>(qspec.params.npoints);
mas01cr@431 170 break;
mas01cr@431 171 case ADB_ACCUMULATION_PER_TRACK:
mas01cr@435 172 accumulator = new PerTrackAccumulator<adb_result_dist_gt>(qspec.params.npoints, qspec.params.ntracks);
mas01cr@431 173 break;
mas01cr@431 174 case ADB_ACCUMULATION_ONE_TO_ONE:
mas01cr@431 175 accumulator = new NearestAccumulator<adb_result_dist_gt>();
mas01cr@431 176 break;
mas01cr@431 177 default:
mas01cr@431 178 error("unknown accumulation");
mas01cr@239 179 }
mas01cr@239 180 break;
mas01cr@431 181 case ADB_DISTANCE_EUCLIDEAN_NORMED:
mas01cr@431 182 case ADB_DISTANCE_EUCLIDEAN:
mas01cr@435 183 switch(qspec.params.accumulation) {
mas01cr@431 184 case ADB_ACCUMULATION_DB:
mas01cr@435 185 accumulator = new DBAccumulator<adb_result_dist_lt>(qspec.params.npoints);
mas01cr@431 186 break;
mas01cr@431 187 case ADB_ACCUMULATION_PER_TRACK:
mas01cr@435 188 accumulator = new PerTrackAccumulator<adb_result_dist_lt>(qspec.params.npoints, qspec.params.ntracks);
mas01cr@431 189 break;
mas01cr@431 190 case ADB_ACCUMULATION_ONE_TO_ONE:
mas01cr@431 191 accumulator = new NearestAccumulator<adb_result_dist_lt>();
mas01cr@431 192 break;
mas01cr@431 193 default:
mas01cr@431 194 error("unknown accumulation");
mas01mc@263 195 }
mas01mc@263 196 break;
mas01cr@239 197 default:
mas01cr@431 198 error("unknown distance function");
mas01cr@431 199 }
mas01cr@431 200
mas01mc@292 201 // Test for index (again) here
mas01cr@435 202 if((qspec.refine.flags & ADB_REFINE_RADIUS) && index_exists(adb->path, qspec.refine.radius, qspec.qid.sequence_length)){
mas01cr@436 203 VERB_LOG(1, "Calling indexed query on database %s, radius=%f, sequence_length=%d\n", adb->path, qspec.refine.radius, qspec.qid.sequence_length);
mas01cr@435 204 index_query_loop(&qspec, dbName, query_from_key_index);
mas01mc@329 205 }
mas01mc@329 206 else{
mas01mc@329 207 VERB_LOG(1, "Calling brute-force query on database %s\n", dbName);
mas01cr@435 208 query_loop(&qspec, query_from_key_index);
mas01mc@329 209 }
mas01mc@292 210
mas01cr@423 211 adb_query_results_t *rs = accumulator->get_points();
mas01cr@423 212 for(unsigned int k = 0; k < rs->nresults; k++) {
mas01cr@423 213 adb_result_t r = rs->results[k];
mas01cr@430 214 reporter->add_point(audiodb_key_index(adb, r.key), r.qpos, r.ipos, r.dist);
mas01cr@423 215 }
mas01cr@423 216
mas01mc@292 217 reporter->report(fileTable, adbQueryResponse);
mas01cr@239 218 }
mas01cr@239 219
mas01cr@439 220 static void audiodb_initialize_arrays(adb_t *adb, adb_query_spec_t *spec, int track, unsigned int numVectors, double *query, double *data_buffer, double **D, double **DD) {
mas01cr@239 221 unsigned int j, k, l, w;
mas01cr@239 222 double *dp, *qp, *sp;
mas01cr@239 223
mas01cr@439 224 const unsigned HOP_SIZE = spec->refine.hopsize;
mas01cr@435 225 const unsigned wL = spec->qid.sequence_length;
mas01cr@239 226
mas01cr@239 227 for(j = 0; j < numVectors; j++) {
mas01cr@239 228 // Sum products matrix
mas01cr@433 229 D[j] = new double[(*adb->track_lengths)[track]];
mas01cr@239 230 assert(D[j]);
mas01cr@239 231 // Matched filter matrix
mas01cr@433 232 DD[j]=new double[(*adb->track_lengths)[track]];
mas01cr@239 233 assert(DD[j]);
mas01cr@239 234 }
mas01cr@239 235
mas01cr@239 236 // Dot product
mas01cr@239 237 for(j = 0; j < numVectors; j++)
mas01cr@433 238 for(k = 0; k < (*adb->track_lengths)[track]; k++){
mas01cr@439 239 qp = query + j * adb->header->dim;
mas01cr@439 240 sp = data_buffer + k * adb->header->dim;
mas01cr@239 241 DD[j][k] = 0.0; // Initialize matched filter array
mas01cr@239 242 dp = &D[j][k]; // point to correlation cell j,k
mas01cr@239 243 *dp = 0.0; // initialize correlation cell
mas01cr@439 244 l = adb->header->dim; // size of vectors
mas01cr@239 245 while(l--)
mas01cr@239 246 *dp += *qp++ * *sp++;
mas01cr@239 247 }
mas01cr@239 248
mas01cr@239 249 // Matched Filter
mas01cr@239 250 // HOP SIZE == 1
mas01cr@239 251 double* spd;
mas01cr@239 252 if(HOP_SIZE == 1) { // HOP_SIZE = shingleHop
mas01cr@239 253 for(w = 0; w < wL; w++) {
mas01cr@239 254 for(j = 0; j < numVectors - w; j++) {
mas01cr@239 255 sp = DD[j];
mas01cr@239 256 spd = D[j+w] + w;
mas01cr@433 257 k = (*adb->track_lengths)[track] - w;
mas01mc@292 258 while(k--)
mas01mc@292 259 *sp++ += *spd++;
mas01cr@239 260 }
mas01cr@239 261 }
mas01cr@239 262 } else { // HOP_SIZE != 1
mas01cr@239 263 for(w = 0; w < wL; w++) {
mas01cr@239 264 for(j = 0; j < numVectors - w; j += HOP_SIZE) {
mas01cr@239 265 sp = DD[j];
mas01cr@239 266 spd = D[j+w]+w;
mas01cr@433 267 for(k = 0; k < (*adb->track_lengths)[track] - w; k += HOP_SIZE) {
mas01cr@239 268 *sp += *spd;
mas01cr@239 269 sp += HOP_SIZE;
mas01cr@239 270 spd += HOP_SIZE;
mas01cr@239 271 }
mas01cr@239 272 }
mas01cr@239 273 }
mas01cr@239 274 }
mas01cr@239 275 }
mas01cr@239 276
/* Release the rows of the work matrices D and DD.
 *
 * Each of the first numVectors rows is released with delete[].  A NULL
 * matrix is skipped.  The row-pointer arrays themselves are not freed
 * and their entries are not reset.  `track` is not used. */
static void audiodb_delete_arrays(int track, unsigned int numVectors, double **D, double **DD) {
  double **matrices[2] = { D, DD };

  for(int m = 0; m < 2; ++m) {
    double **rows = matrices[m];
    if(rows == NULL) {
      continue;
    }
    for(unsigned int row = 0; row < numVectors; ++row) {
      delete[] rows[row];
    }
  }
}
mas01cr@239 289
mas01cr@433 290 int audiodb_read_data(adb_t *adb, int trkfid, int track, double **data_buffer_p, size_t *data_buffer_size_p) {
mas01cr@433 291 uint32_t track_length = (*adb->track_lengths)[track];
mas01cr@433 292 size_t track_size = track_length * sizeof(double) * adb->header->dim;
mas01cr@433 293 if (track_size > *data_buffer_size_p) {
mas01cr@239 294 if(*data_buffer_p) {
mas01cr@239 295 free(*data_buffer_p);
mas01cr@239 296 }
mas01cr@239 297 {
mas01cr@433 298 *data_buffer_size_p = track_size;
mas01cr@433 299 void *tmp = malloc(track_size);
mas01cr@239 300 if (tmp == NULL) {
mas01cr@433 301 goto error;
mas01cr@239 302 }
mas01cr@239 303 *data_buffer_p = (double *) tmp;
mas01cr@239 304 }
mas01cr@239 305 }
mas01cr@239 306
mas01cr@433 307 read_or_goto_error(trkfid, *data_buffer_p, track_size);
mas01cr@433 308 return 0;
mas01cr@433 309
mas01cr@433 310 error:
mas01cr@433 311 return 1;
mas01cr@239 312 }
mas01cr@239 313
mas01cr@405 314 void audioDB::insertTimeStamps(unsigned numVectors, std::ifstream *timesFile, double *timesdata) {
mas01cr@405 315 assert(usingTimes);
mas01cr@405 316
mas01cr@405 317 unsigned numtimes = 0;
mas01cr@405 318
mas01cr@405 319 if(!timesFile->is_open()) {
mas01cr@405 320 error("problem opening times file on timestamped database", timesFileName);
mas01cr@405 321 }
mas01cr@405 322
mas01cr@405 323 double timepoint, next;
mas01cr@405 324 *timesFile >> timepoint;
mas01cr@405 325 if (timesFile->eof()) {
mas01cr@405 326 error("no entries in times file", timesFileName);
mas01cr@405 327 }
mas01cr@405 328 numtimes++;
mas01cr@405 329 do {
mas01cr@405 330 *timesFile >> next;
mas01cr@405 331 if (timesFile->eof()) {
mas01cr@405 332 break;
mas01cr@405 333 }
mas01cr@405 334 numtimes++;
mas01cr@405 335 timesdata[0] = timepoint;
mas01cr@405 336 timepoint = (timesdata[1] = next);
mas01cr@405 337 timesdata += 2;
mas01cr@405 338 } while (numtimes < numVectors + 1);
mas01cr@405 339
mas01cr@405 340 if (numtimes < numVectors + 1) {
mas01cr@405 341 error("too few timepoints in times file", timesFileName);
mas01cr@405 342 }
mas01cr@405 343
mas01cr@405 344 *timesFile >> next;
mas01cr@405 345 if (!timesFile->eof()) {
mas01cr@405 346 error("too many timepoints in times file", timesFileName);
mas01cr@405 347 }
mas01cr@405 348 }
mas01cr@405 349
mas01cr@444 350 int audiodb_query_spec_qpointers(adb_t *adb, adb_query_spec_t *spec, double **vector_data, double **vector, adb_qpointers_internal_t *qpointers) {
mas01cr@443 351 adb_datum_t *datum;
mas01cr@443 352 adb_datum_t d = {0};
mas01cr@443 353 uint32_t nvectors;
mas01cr@443 354 uint32_t sequence_length;
mas01cr@443 355 uint32_t sequence_start;
mas01cr@443 356
mas01cr@443 357 datum = spec->qid.datum;
mas01cr@443 358 sequence_length = spec->qid.sequence_length;
mas01cr@443 359 sequence_start = spec->qid.sequence_start;
mas01cr@443 360
mas01cr@443 361 if(datum->data) {
mas01cr@443 362 if(datum->dim != adb->header->dim) {
mas01cr@443 363 return 1;
mas01cr@443 364 }
mas01cr@443 365 /* initialize d, and mark that nothing needs freeing later. */
mas01cr@443 366 d = *datum;
mas01cr@443 367 datum = &d;
mas01cr@443 368 } else if (datum->key) {
mas01cr@443 369 std::map<std::string,uint32_t>::iterator it;
mas01cr@443 370 it = adb->keys->find(datum->key);
mas01cr@443 371 if(it == adb->keys->end()) {
mas01cr@443 372 return 1;
mas01cr@443 373 }
mas01cr@443 374 uint32_t track_id = (*it).second;
mas01cr@443 375 off_t track_offset = (*adb->track_offsets)[track_id];
mas01cr@443 376
mas01cr@443 377 if(adb->header->flags & O2_FLAG_LARGE_ADB) {
mas01cr@443 378 /* create a reference/insert, then use adb_insert_create_datum() */
mas01cr@443 379 adb_reference_t reference = {0};
mas01cr@443 380 char features[MAXSTR], power[MAXSTR], times[MAXSTR];
mas01cr@443 381 lseek(adb->fd, adb->header->dataOffset + track_id * O2_FILETABLE_ENTRY_SIZE, SEEK_SET);
mas01cr@443 382 /* FIXME: learn not to worry and love the bomb^Wbuffer overflow */
mas01cr@443 383 read(adb->fd, features, MAXSTR);
mas01cr@443 384 reference.features = features;
mas01cr@443 385 if(adb->header->flags & O2_FLAG_POWER) {
mas01cr@443 386 lseek(adb->fd, adb->header->powerTableOffset + track_id * O2_FILETABLE_ENTRY_SIZE, SEEK_SET);
mas01cr@443 387 read(adb->fd, power, MAXSTR);
mas01cr@443 388 reference.power = power;
mas01cr@443 389 }
mas01cr@443 390 if(adb->header->flags & O2_FLAG_TIMES) {
mas01cr@443 391 lseek(adb->fd, adb->header->timesTableOffset + track_id * O2_FILETABLE_ENTRY_SIZE, SEEK_SET);
mas01cr@443 392 read(adb->fd, times, MAXSTR);
mas01cr@443 393 reference.times = times;
mas01cr@443 394 }
mas01cr@443 395 audiodb_insert_create_datum(&reference, &d);
mas01cr@443 396 } else {
mas01cr@443 397 /* initialize from sources of data that we already have */
mas01cr@443 398 d.nvectors = (*adb->track_lengths)[track_id];
mas01cr@443 399 d.dim = adb->header->dim;
mas01cr@443 400 d.key = datum->key;
mas01cr@443 401 /* read out stuff from the database tables */
mas01cr@443 402 d.data = (double *) malloc(d.nvectors * d.dim * sizeof(double));
mas01cr@443 403 lseek(adb->fd, adb->header->dataOffset + track_offset, SEEK_SET);
mas01cr@443 404 read(adb->fd, d.data, d.nvectors * d.dim * sizeof(double));
mas01cr@443 405 if(adb->header->flags & O2_FLAG_POWER) {
mas01cr@443 406 d.power = (double *) malloc(d.nvectors * sizeof(double));
mas01cr@443 407 lseek(adb->fd, adb->header->powerTableOffset + track_offset / d.dim, SEEK_SET);
mas01cr@443 408 read(adb->fd, d.power, d.nvectors * sizeof(double));
mas01cr@443 409 }
mas01cr@443 410 if(adb->header->flags & O2_FLAG_TIMES) {
mas01cr@443 411 d.times = (double *) malloc(2 * d.nvectors * sizeof(double));
mas01cr@443 412 lseek(adb->fd, adb->header->timesTableOffset + track_offset / d.dim, SEEK_SET);
mas01cr@443 413 read(adb->fd, d.times, 2 * d.nvectors * sizeof(double));
mas01cr@443 414 }
mas01cr@443 415 }
mas01cr@443 416 } else {
mas01cr@443 417 return 1;
mas01cr@443 418 }
mas01cr@443 419
mas01cr@443 420 /* Now we have a full(ish) datum, compute all the qpointery stuff
mas01cr@443 421 that we care about (l2norm/power/mean duration). (This bit could
mas01cr@443 422 conceivably become a new function) */
mas01cr@443 423 nvectors = d.nvectors;
mas01cr@444 424 /* FIXME: check the overflow logic here */
mas01cr@444 425 if(sequence_start + sequence_length > nvectors) {
mas01cr@443 426 /* is there something to free? goto error */
mas01cr@443 427 return 1;
mas01cr@443 428 }
mas01cr@443 429
mas01cr@443 430 qpointers->nvectors = nvectors;
mas01cr@443 431
mas01cr@443 432 size_t vector_size = nvectors * sizeof(double) * d.dim;
mas01cr@443 433 *vector_data = (double *) malloc(vector_size);
mas01cr@443 434 memcpy(*vector_data, d.data, vector_size);
mas01cr@443 435
mas01cr@443 436 qpointers->l2norm_data = (double *) malloc(vector_size / d.dim);
mas01cr@443 437 audiodb_l2norm_buffer(*vector_data, d.dim, nvectors, qpointers->l2norm_data);
mas01cr@443 438 audiodb_sequence_sum(qpointers->l2norm_data, nvectors, sequence_length);
mas01cr@443 439 audiodb_sequence_sqrt(qpointers->l2norm_data, nvectors, sequence_length);
mas01cr@443 440
mas01cr@443 441 if(d.power) {
mas01cr@443 442 qpointers->power_data = (double *) malloc(vector_size / d.dim);
mas01cr@443 443 memcpy(qpointers->power_data, d.power, vector_size / d.dim);
mas01cr@443 444 audiodb_sequence_sum(qpointers->power_data, nvectors, sequence_length);
mas01cr@443 445 audiodb_sequence_average(qpointers->power_data, nvectors, sequence_length);
mas01cr@443 446 }
mas01cr@443 447
mas01cr@443 448 if(d.times) {
mas01cr@443 449 qpointers->mean_duration = (double *) calloc(1, sizeof(double));
mas01cr@443 450 for(unsigned int k = 0; k < nvectors; k++) {
mas01cr@443 451 *qpointers->mean_duration += d.times[2*k+1] - d.times[2*k];
mas01cr@443 452 }
mas01cr@443 453 *qpointers->mean_duration /= nvectors;
mas01cr@443 454 }
mas01cr@443 455
mas01cr@443 456
mas01cr@443 457 /* Finally, set up the moving qpointers. */
mas01cr@443 458 if(spec->qid.flags & ADB_QUERY_ID_FLAG_EXHAUSTIVE) {
mas01cr@443 459 *vector = *vector_data;
mas01cr@443 460 qpointers->l2norm = qpointers->l2norm_data;
mas01cr@443 461 qpointers->power = qpointers->power_data;
mas01cr@443 462 } else {
mas01cr@443 463 *vector = *vector_data + spec->qid.sequence_start * d.dim;
mas01cr@443 464 qpointers->l2norm = qpointers->l2norm_data + spec->qid.sequence_start;
mas01cr@444 465 if(d.power) {
mas01cr@444 466 qpointers->power = qpointers->power_data + spec->qid.sequence_start;
mas01cr@444 467 }
mas01cr@444 468 /* FIXME: this is a little bit ugly. No, a lot ugly. But at the
mas01cr@444 469 * moment this is how query_loop() knows when to stop, so for
mas01cr@444 470 * now... */
mas01cr@444 471 qpointers->nvectors = sequence_length;
mas01cr@443 472 }
mas01cr@443 473
mas01cr@443 474 /* Clean up: free any bits of datum that we have ourselves
mas01cr@443 475 * allocated. */
mas01cr@443 476 if(datum != &d) {
mas01cr@443 477 audiodb_free_datum(&d);
mas01cr@443 478 }
mas01cr@444 479
mas01cr@444 480 return 0;
mas01cr@443 481 }
mas01cr@443 482
mas01cr@239 483 // FIXME: this is not the right name; we're not actually setting up
mas01cr@239 484 // the database, but copying various bits of it out of mmap()ed tables
mas01cr@239 485 // in order to reduce seeks.
mas01cr@438 486 static int audiodb_set_up_db(adb_t *adb, adb_query_spec_t *spec, adb_qpointers_internal_t *dbpointers) {
mas01cr@438 487 uint32_t nvectors = adb->header->length / (adb->header->dim * sizeof(double));
mas01cr@435 488 uint32_t sequence_length = spec->qid.sequence_length;
mas01cr@438 489
mas01cr@437 490 bool using_power = spec->refine.flags & (ADB_REFINE_ABSOLUTE_THRESHOLD|ADB_REFINE_RELATIVE_THRESHOLD);
mas01cr@437 491 bool using_times = spec->refine.flags & ADB_REFINE_DURATION_RATIO;
mas01cr@437 492 double *times_table = NULL;
mas01cr@435 493
mas01cr@239 494
mas01cr@438 495 dbpointers->nvectors = nvectors;
mas01cr@438 496 dbpointers->l2norm_data = new double[nvectors];
mas01cr@438 497
mas01cr@438 498 double *snpp = dbpointers->l2norm_data, *sppp = 0;
mas01cr@434 499 lseek(adb->fd, adb->header->l2normTableOffset, SEEK_SET);
mas01cr@438 500 read_or_goto_error(adb->fd, dbpointers->l2norm_data, nvectors * sizeof(double));
mas01cr@239 501
mas01cr@437 502 if (using_power) {
mas01cr@434 503 if (!(adb->header->flags & O2_FLAG_POWER)) {
mas01cr@434 504 goto error;
mas01cr@239 505 }
mas01cr@438 506 dbpointers->power_data = new double[nvectors];
mas01cr@438 507 sppp = dbpointers->power_data;
mas01cr@434 508 lseek(adb->fd, adb->header->powerTableOffset, SEEK_SET);
mas01cr@438 509 read_or_goto_error(adb->fd, dbpointers->power_data, nvectors * sizeof(double));
mas01cr@239 510 }
mas01cr@239 511
mas01cr@434 512 for(unsigned int i = 0; i < adb->header->numFiles; i++){
mas01cr@434 513 size_t track_length = (*adb->track_lengths)[i];
mas01cr@435 514 if(track_length >= sequence_length) {
mas01cr@435 515 audiodb_sequence_sum(snpp, track_length, sequence_length);
mas01cr@435 516 audiodb_sequence_sqrt(snpp, track_length, sequence_length);
mas01cr@437 517 if (using_power) {
mas01cr@435 518 audiodb_sequence_sum(sppp, track_length, sequence_length);
mas01cr@435 519 audiodb_sequence_average(sppp, track_length, sequence_length);
mas01cr@239 520 }
mas01cr@239 521 }
mas01cr@434 522 snpp += track_length;
mas01cr@437 523 if (using_power) {
mas01cr@434 524 sppp += track_length;
mas01cr@239 525 }
mas01cr@239 526 }
mas01cr@239 527
mas01cr@437 528 if (using_times) {
mas01cr@434 529 if(!(adb->header->flags & O2_FLAG_TIMES)) {
mas01cr@437 530 goto error;
mas01cr@239 531 }
mas01cr@239 532
mas01cr@438 533 dbpointers->mean_duration = new double[adb->header->numFiles];
mas01cr@239 534
mas01cr@438 535 times_table = (double *) malloc(2 * nvectors * sizeof(double));
mas01cr@437 536 if(!times_table) {
mas01cr@437 537 goto error;
mas01cr@437 538 }
mas01cr@437 539 lseek(adb->fd, adb->header->timesTableOffset, SEEK_SET);
mas01cr@438 540 read_or_goto_error(adb->fd, times_table, 2 * nvectors * sizeof(double));
mas01cr@434 541 for(unsigned int k = 0; k < adb->header->numFiles; k++) {
mas01cr@434 542 size_t track_length = (*adb->track_lengths)[k];
mas01cr@239 543 unsigned int j;
mas01cr@438 544 dbpointers->mean_duration[k] = 0.0;
mas01cr@434 545 for(j = 0; j < track_length; j++) {
mas01cr@438 546 dbpointers->mean_duration[k] += times_table[2*j+1] - times_table[2*j];
mas01cr@239 547 }
mas01cr@438 548 dbpointers->mean_duration[k] /= j;
mas01cr@239 549 }
mas01cr@437 550
mas01cr@437 551 free(times_table);
mas01cr@437 552 times_table = NULL;
mas01cr@239 553 }
mas01cr@239 554
mas01cr@438 555 dbpointers->l2norm = dbpointers->l2norm_data;
mas01cr@438 556 dbpointers->power = dbpointers->power_data;
mas01cr@434 557 return 0;
mas01cr@434 558
mas01cr@434 559 error:
mas01cr@438 560 if(dbpointers->l2norm_data) {
mas01cr@438 561 delete [] dbpointers->l2norm_data;
mas01cr@434 562 }
mas01cr@438 563 if(dbpointers->power_data) {
mas01cr@438 564 delete [] dbpointers->power_data;
mas01cr@434 565 }
mas01cr@438 566 if(dbpointers->mean_duration) {
mas01cr@438 567 delete [] dbpointers->mean_duration;
mas01cr@434 568 }
mas01cr@437 569 if(times_table) {
mas01cr@437 570 free(times_table);
mas01cr@437 571 }
mas01cr@434 572 return 1;
mas01cr@434 573
mas01cr@239 574 }
mas01cr@239 575
mas01mc@292 576 // query_points()
mas01mc@292 577 //
mas01mc@292 578 // using PointPairs held in the exact_evaluation_queue compute squared distance for each PointPair
mas01mc@292 579 // and insert result into the current reporter.
mas01mc@292 580 //
mas01mc@292 581 // Preconditions:
mas01mc@292 582 // A query inFile has been opened with setup_query(...) and query pointers initialized
mas01mc@292 583 // The database contains some points
mas01mc@292 584 // An exact_evaluation_queue has been allocated and populated
mas01mc@292 585 // A reporter has been allocated
mas01mc@292 586 //
mas01mc@292 587 // Postconditions:
mas01mc@292 588 // reporter contains the points and distances that meet the reporter constraints
mas01mc@292 589
mas01cr@437 590 void audioDB::query_loop_points(adb_query_spec_t *spec, double* query, adb_qpointers_internal_t *qpointers) {
mas01cr@438 591 adb_qpointers_internal_t dbpointers = {0};
mas01mc@292 592
mas01cr@436 593 uint32_t sequence_length = spec->qid.sequence_length;
mas01cr@437 594 bool power_refine = spec->refine.flags & (ADB_REFINE_ABSOLUTE_THRESHOLD|ADB_REFINE_RELATIVE_THRESHOLD);
mas01cr@436 595
mas01mc@292 596 // check pre-conditions
mas01mc@292 597 assert(exact_evaluation_queue&&reporter);
mas01mc@292 598 if(!exact_evaluation_queue->size()) // Exit if no points to evaluate
mas01mc@292 599 return;
mas01mc@292 600
mas01mc@292 601 // Compute database info
mas01mc@292 602 // FIXME: we more than likely don't need very much of the database
mas01mc@292 603 // so make a new method to build these values per-track or, even better, per-point
mas01mc@324 604 if( !( dbH->flags & O2_FLAG_LARGE_ADB) )
mas01cr@438 605 if(audiodb_set_up_db(adb, spec, &dbpointers)) {
mas01cr@434 606 error("failed to set up db");
mas01cr@434 607 }
mas01mc@292 608
mas01mc@292 609 VERB_LOG(1, "matching points...");
mas01mc@292 610
mas01mc@292 611 // We are guaranteed that the order of points is sorted by:
mas01mc@324 612 // trackID, spos, qpos
mas01mc@292 613 // so we can be relatively efficient in initialization of track data.
mas01mc@292 614 // Here we assume that points don't overlap, so we will use exhaustive dot
mas01mc@324 615 // product evaluation instead of memoization of partial sums which is used
mas01mc@324 616 // for exhaustive brute-force evaluation from smaller databases: e.g. query_loop()
mas01mc@292 617 double dist;
mas01mc@292 618 size_t data_buffer_size = 0;
mas01mc@292 619 double *data_buffer = 0;
mas01mc@324 620 Uns32T trackOffset = 0;
mas01mc@324 621 Uns32T trackIndexOffset = 0;
mas01mc@292 622 Uns32T currentTrack = 0x80000000; // Initialize with a value outside of track index range
mas01mc@292 623 Uns32T npairs = exact_evaluation_queue->size();
mas01mc@292 624 while(npairs--){
mas01mc@292 625 PointPair pp = exact_evaluation_queue->top();
mas01mc@324 626 // Large ADB track data must be loaded here for sPower
mas01mc@324 627 if(dbH->flags & O2_FLAG_LARGE_ADB){
mas01mc@324 628 trackOffset=0;
mas01mc@324 629 trackIndexOffset=0;
mas01mc@292 630 if(currentTrack!=pp.trackID){
mas01mc@324 631 char* prefixedString = new char[O2_MAXFILESTR];
mas01mc@324 632 char* tmpStr = prefixedString;
mas01mc@324 633 // On currentTrack change, allocate and load track data
mas01mc@292 634 currentTrack=pp.trackID;
mas01cr@438 635 SAFE_DELETE_ARRAY(dbpointers.l2norm_data);
mas01cr@438 636 SAFE_DELETE_ARRAY(dbpointers.power_data);
mas01mc@324 637 if(infid>0)
mas01mc@324 638 close(infid);
mas01mc@324 639 // Open and check dimensions of feature file
mas01mc@324 640 strncpy(prefixedString, featureFileNameTable+pp.trackID*O2_FILETABLE_ENTRY_SIZE, O2_MAXFILESTR);
mas01mc@324 641 prefix_name((char ** const) &prefixedString, adb_feature_root);
mas01mc@324 642 if (prefixedString!=tmpStr)
mas01mc@324 643 delete[] tmpStr;
mas01mc@324 644 initInputFile(prefixedString, false); // nommap, file pointer at correct position
mas01mc@324 645 // Load the feature vector data for current track into data_buffer
mas01cr@433 646 if(audiodb_read_data(adb, infid, pp.trackID, &data_buffer, &data_buffer_size))
mas01cr@433 647 error("failed to read data");
mas01mc@324 648 // Load power and calculate power and l2norm sequence sums
mas01cr@438 649 init_track_aux_data(pp.trackID, data_buffer, &dbpointers.l2norm_data, &dbpointers.l2norm, &dbpointers.power_data, &dbpointers.power);
mas01mc@292 650 }
mas01mc@324 651 }
mas01mc@324 652 else{
mas01mc@324 653 // These offsets are w.r.t. the entire database of feature vectors and auxillary variables
mas01mc@324 654 trackOffset=trackOffsetTable[pp.trackID]; // num data elements offset
mas01mc@324 655 trackIndexOffset=trackOffset/dbH->dim; // num vectors offset
mas01mc@324 656 }
mas01mc@324 657 Uns32T qPos = usingQueryPoint?0:pp.qpos;// index for query point
mas01mc@324 658 Uns32T sPos = trackIndexOffset+pp.spos; // index into l2norm table
mas01mc@324 659 // Test power thresholds before computing distance
mas01cr@438 660 if( ( (!power_refine) || audiodb_powers_acceptable(&spec->refine, qpointers->power[qPos], dbpointers.power[sPos])) &&
mas01cr@437 661 ( qPos<qpointers->nvectors-sequence_length+1 && pp.spos<trackTable[pp.trackID]-sequence_length+1 ) ){
mas01mc@324 662 // Non-large ADB track data is loaded inside power test for efficiency
mas01mc@324 663 if( !(dbH->flags & O2_FLAG_LARGE_ADB) && (currentTrack!=pp.trackID) ){
mas01mc@324 664 // On currentTrack change, allocate and load track data
mas01mc@324 665 currentTrack=pp.trackID;
mas01mc@324 666 lseek(dbfid, dbH->dataOffset + trackOffset * sizeof(double), SEEK_SET);
mas01cr@433 667 if(audiodb_read_data(adb, dbfid, currentTrack, &data_buffer, &data_buffer_size))
mas01cr@433 668 error("failed to read data");
mas01mc@324 669 }
mas01mc@324 670 // Compute distance
mas01cr@436 671 dist = audiodb_dot_product(query+qPos*dbH->dim, data_buffer+pp.spos*dbH->dim, dbH->dim*sequence_length);
mas01cr@437 672 double qn = qpointers->l2norm[qPos];
mas01cr@438 673 double sn = dbpointers.l2norm[sPos];
mas01cr@435 674 switch(spec->params.distance) {
mas01cr@431 675 case ADB_DISTANCE_EUCLIDEAN_NORMED:
mas01mc@324 676 dist = 2 - (2/(qn*sn))*dist;
mas01cr@431 677 break;
mas01cr@431 678 case ADB_DISTANCE_EUCLIDEAN:
mas01cr@431 679 dist = qn*qn + sn*sn - 2*dist;
mas01cr@431 680 break;
mas01cr@431 681 }
mas01cr@424 682 if((!radius) || dist <= (O2_LSH_EXACT_MULT*radius+O2_DISTANCE_TOLERANCE)) {
mas01cr@424 683 adb_result_t r;
mas01cr@424 684 r.key = fileTable + pp.trackID * O2_FILETABLE_ENTRY_SIZE;
mas01cr@424 685 r.dist = dist;
mas01cr@424 686 r.qpos = pp.qpos;
mas01cr@424 687 r.ipos = pp.spos;
mas01cr@424 688 accumulator->add_point(&r);
mas01cr@424 689 }
mas01mc@292 690 }
mas01mc@292 691 exact_evaluation_queue->pop();
mas01mc@292 692 }
mas01mc@315 693 // Cleanup
mas01cr@438 694 SAFE_DELETE_ARRAY(dbpointers.l2norm_data);
mas01cr@438 695 SAFE_DELETE_ARRAY(dbpointers.power_data);
mas01cr@438 696 SAFE_DELETE_ARRAY(dbpointers.mean_duration);
mas01mc@292 697 }
mas01mc@292 698
mas01cr@435 699 void audioDB::query_loop(adb_query_spec_t *spec, Uns32T queryIndex) {
mas01cr@239 700
mas01cr@239 701 double *query, *query_data;
mas01cr@438 702 adb_qpointers_internal_t qpointers = {0}, dbpointers = {0};
mas01cr@437 703
mas01cr@437 704 bool power_refine = spec->refine.flags & (ADB_REFINE_ABSOLUTE_THRESHOLD|ADB_REFINE_RELATIVE_THRESHOLD);
mas01cr@239 705
mas01mc@324 706 if( dbH->flags & O2_FLAG_LARGE_ADB )
mas01mc@324 707 error("error: LARGE_ADB requires indexed query");
mas01mc@324 708
mas01cr@444 709 if(audiodb_query_spec_qpointers(adb, spec, &query_data, &query, &qpointers)) {
mas01cr@444 710 error("failed to set up qpointers");
mas01cr@444 711 }
mas01cr@239 712
mas01cr@438 713 if(audiodb_set_up_db(adb, spec, &dbpointers)) {
mas01cr@434 714 error("failed to set up db");
mas01cr@434 715 }
mas01cr@239 716
mas01cr@239 717 VERB_LOG(1, "matching tracks...");
mas01cr@239 718
mas01cr@435 719 unsigned j,k,track,trackOffset=0, HOP_SIZE=sequenceHop;
mas01cr@435 720 unsigned wL = spec->qid.sequence_length;
mas01cr@239 721 double **D = 0; // Differences query and target
mas01cr@239 722 double **DD = 0; // Matched filter distance
mas01cr@239 723
mas01cr@437 724 D = new double*[qpointers.nvectors]; // pre-allocate
mas01cr@437 725 DD = new double*[qpointers.nvectors];
mas01cr@239 726
mas01cr@239 727 gettimeofday(&tv1, NULL);
mas01cr@239 728 unsigned processedTracks = 0;
mas01cr@239 729 off_t trackIndexOffset;
mas01cr@239 730 char nextKey[MAXSTR];
mas01cr@239 731
mas01cr@239 732 // Track loop
mas01cr@239 733 size_t data_buffer_size = 0;
mas01cr@239 734 double *data_buffer = 0;
mas01cr@239 735 lseek(dbfid, dbH->dataOffset, SEEK_SET);
mas01cr@239 736
mas01cr@239 737 for(processedTracks=0, track=0 ; processedTracks < dbH->numFiles ; track++, processedTracks++) {
mas01cr@239 738
mas01cr@239 739 trackOffset = trackOffsetTable[track]; // numDoubles offset
mas01cr@239 740
mas01cr@239 741 // get trackID from file if using a control file
mas01cr@239 742 if(trackFile) {
mas01cr@239 743 trackFile->getline(nextKey,MAXSTR);
mas01cr@239 744 if(!trackFile->eof()) {
mas01cr@430 745 track = audiodb_key_index(adb, nextKey);
mas01cr@430 746 if(track == (uint32_t) -1) {
mas01cr@430 747 error("key not found", nextKey);
mas01cr@430 748 }
mas01cr@239 749 trackOffset = trackOffsetTable[track];
mas01cr@239 750 lseek(dbfid, dbH->dataOffset + trackOffset * sizeof(double), SEEK_SET);
mas01cr@239 751 } else {
mas01cr@239 752 break;
mas01cr@239 753 }
mas01cr@239 754 }
mas01cr@239 755
mas01mc@292 756 // skip identity on query_from_key
mas01mc@292 757 if( query_from_key && (track == queryIndex) ) {
mas01mc@292 758 if(queryIndex!=dbH->numFiles-1){
mas01mc@292 759 track++;
mas01mc@292 760 trackOffset = trackOffsetTable[track];
mas01mc@292 761 lseek(dbfid, dbH->dataOffset + trackOffset * sizeof(double), SEEK_SET);
mas01mc@292 762 }
mas01mc@292 763 else{
mas01mc@292 764 break;
mas01mc@292 765 }
mas01mc@292 766 }
mas01mc@292 767
mas01cr@437 768 trackIndexOffset=trackOffset/dbH->dim; // qpointers.nvectors offset
mas01cr@239 769
mas01cr@433 770 if(audiodb_read_data(adb, dbfid, track, &data_buffer, &data_buffer_size))
mas01cr@433 771 error("failed to read data");
mas01cr@435 772 if(wL <= trackTable[track]) { // test for short sequences
mas01cr@239 773
mas01cr@239 774 VERB_LOG(7,"%u.%jd.%u | ", track, (intmax_t) trackIndexOffset, trackTable[track]);
mas01cr@239 775
mas01cr@439 776 audiodb_initialize_arrays(adb, spec, track, qpointers.nvectors, query, data_buffer, D, DD);
mas01cr@239 777
mas01cr@435 778 if(spec->refine.flags & ADB_REFINE_DURATION_RATIO) {
mas01cr@438 779 VERB_LOG(3,"meanQdur=%f meanDBdur=%f\n", qpointers.mean_duration[0], dbpointers.mean_duration[track]);
mas01cr@239 780 }
mas01cr@239 781
mas01cr@437 782 if((!(spec->refine.flags & ADB_REFINE_DURATION_RATIO)) ||
mas01cr@438 783 fabs(dbpointers.mean_duration[track]-qpointers.mean_duration[0]) < qpointers.mean_duration[0]*spec->refine.duration_ratio) {
mas01cr@435 784 if(spec->refine.flags & ADB_REFINE_DURATION_RATIO) {
mas01cr@239 785 VERB_LOG(3,"within duration tolerance.\n");
mas01cr@239 786 }
mas01cr@239 787
mas01cr@239 788 // Search for minimum distance by shingles (concatenated vectors)
mas01cr@437 789 for(j = 0; j <= qpointers.nvectors - wL; j += HOP_SIZE) {
mas01cr@239 790 for(k = 0; k <= trackTable[track] - wL; k += HOP_SIZE) {
mas01cr@431 791 double thisDist = 0;
mas01cr@438 792 double qn = qpointers.l2norm[j];
mas01cr@438 793 double sn = dbpointers.l2norm[trackIndexOffset + k];
mas01cr@435 794 switch(spec->params.distance) {
mas01cr@431 795 case ADB_DISTANCE_EUCLIDEAN_NORMED:
mas01cr@438 796 thisDist = 2-(2/(qn*sn))*DD[j][k];
mas01cr@431 797 break;
mas01cr@431 798 case ADB_DISTANCE_EUCLIDEAN:
mas01cr@438 799 thisDist = qn*qn + sn*sn - 2*DD[j][k];
mas01cr@431 800 break;
mas01cr@431 801 case ADB_DISTANCE_DOT_PRODUCT:
mas01cr@431 802 thisDist = DD[j][k];
mas01cr@431 803 break;
mas01cr@431 804 }
mas01cr@239 805 // Power test
mas01cr@438 806 if ((!power_refine) || audiodb_powers_acceptable(&spec->refine, qpointers.power[j], dbpointers.power[trackIndexOffset + k])) {
mas01cr@239 807 // radius test
mas01cr@435 808 if((!(spec->refine.flags & ADB_REFINE_RADIUS)) ||
mas01cr@435 809 thisDist <= (spec->refine.radius+O2_DISTANCE_TOLERANCE)) {
mas01cr@423 810 adb_result_t r;
mas01cr@423 811 r.key = fileTable + track * O2_FILETABLE_ENTRY_SIZE;
mas01cr@423 812 r.dist = thisDist;
mas01cr@423 813 r.qpos = usingQueryPoint ? queryPoint : j;
mas01cr@423 814 r.ipos = k;
mas01cr@423 815 accumulator->add_point(&r);
mas01cr@239 816 }
mas01cr@239 817 }
mas01cr@239 818 }
mas01cr@239 819 }
mas01cr@239 820 } // Duration match
mas01cr@437 821 audiodb_delete_arrays(track, qpointers.nvectors, D, DD);
mas01cr@239 822 }
mas01cr@239 823 }
mas01cr@239 824
mas01cr@239 825 free(data_buffer);
mas01cr@239 826
mas01cr@239 827 gettimeofday(&tv2,NULL);
mas01cr@239 828 VERB_LOG(1,"elapsed time: %ld msec\n",
mas01cr@239 829 (tv2.tv_sec*1000 + tv2.tv_usec/1000) -
mas01cr@239 830 (tv1.tv_sec*1000 + tv1.tv_usec/1000))
mas01cr@239 831
mas01cr@239 832 // Clean up
mas01cr@239 833 if(query_data)
mas01cr@239 834 delete[] query_data;
mas01cr@437 835 if(qpointers.l2norm_data)
mas01cr@437 836 delete[] qpointers.l2norm_data;
mas01cr@437 837 if(qpointers.power_data)
mas01cr@437 838 delete[] qpointers.power_data;
mas01cr@437 839 if(qpointers.mean_duration)
mas01cr@437 840 delete[] qpointers.mean_duration;
mas01cr@438 841 if(dbpointers.power_data)
mas01cr@438 842 delete[] dbpointers.power_data;
mas01cr@438 843 if(dbpointers.l2norm_data)
mas01cr@438 844 delete[] dbpointers.l2norm_data;
mas01cr@239 845 if(D)
mas01cr@239 846 delete[] D;
mas01cr@239 847 if(DD)
mas01cr@239 848 delete[] DD;
mas01cr@438 849 if(dbpointers.mean_duration)
mas01cr@438 850 delete[] dbpointers.mean_duration;
mas01cr@239 851 }