annotate query.cpp @ 435:53c487885b2c api-inversion

begin pushing an adb_query_spec_t * all the way through query. Almost all of the query specification data is in there now; missing are the key list refinement and the query datum. Mostly eliminate uses of the audioDB::sequenceLength member variable throughout query.cpp. It's still used in functions in index.cpp, though, so make sure that a correct value is installed before calling audioDB::index_query_loop()
author mas01cr
date Wed, 24 Dec 2008 10:55:56 +0000
parents 7af140bf8a0a
children e43f8a7aca93
rev   line source
mas01cr@239 1 #include "audioDB.h"
mas01cr@239 2 #include "reporter.h"
mas01cr@239 3
mas01cr@422 4 #include "audioDB-internals.h"
mas01cr@422 5 #include "accumulators.h"
mas01cr@422 6
mas01cr@425 7 static bool audiodb_powers_acceptable(adb_query_refine_t *r, double p1, double p2) {
mas01cr@425 8 if (r->flags & ADB_REFINE_ABSOLUTE_THRESHOLD) {
mas01cr@425 9 if ((p1 < r->absolute_threshold) || (p2 < r->absolute_threshold)) {
mas01cr@239 10 return false;
mas01cr@239 11 }
mas01cr@239 12 }
mas01cr@425 13 if (r->flags & ADB_REFINE_RELATIVE_THRESHOLD) {
mas01cr@425 14 if (fabs(p1-p2) > fabs(r->relative_threshold)) {
mas01cr@239 15 return false;
mas01cr@239 16 }
mas01cr@239 17 }
mas01cr@239 18 return true;
mas01cr@239 19 }
mas01cr@239 20
mas01cr@239 21 void audioDB::query(const char* dbName, const char* inFile, adb__queryResponse *adbQueryResponse) {
mas01cr@425 22
mas01cr@431 23 // init database tables and dbH first
mas01cr@431 24 if(query_from_key)
mas01cr@431 25 initTables(dbName);
mas01cr@431 26 else
mas01cr@431 27 initTables(dbName, inFile);
mas01cr@431 28
mas01cr@435 29 adb_query_spec_t qspec;
mas01cr@435 30
mas01cr@435 31 qspec.refine.flags = 0;
mas01cr@425 32 /* FIXME: trackFile / ADB_REFINE_KEYLIST */
mas01cr@425 33 if(radius) {
mas01cr@435 34 qspec.refine.flags |= ADB_REFINE_RADIUS;
mas01cr@435 35 qspec.refine.radius = radius;
mas01cr@425 36 }
mas01cr@425 37 if(use_absolute_threshold) {
mas01cr@435 38 qspec.refine.flags |= ADB_REFINE_ABSOLUTE_THRESHOLD;
mas01cr@435 39 qspec.refine.absolute_threshold = absolute_threshold;
mas01cr@425 40 }
mas01cr@425 41 if(use_relative_threshold) {
mas01cr@435 42 qspec.refine.flags |= ADB_REFINE_RELATIVE_THRESHOLD;
mas01cr@435 43 qspec.refine.relative_threshold = relative_threshold;
mas01cr@425 44 }
mas01cr@425 45 if(usingTimes) {
mas01cr@435 46 qspec.refine.flags |= ADB_REFINE_DURATION_RATIO;
mas01cr@435 47 qspec.refine.duration_ratio = timesTol;
mas01cr@425 48 }
mas01cr@425 49 /* FIXME: not sure about this any more; maybe it belongs in query_id */
mas01cr@425 50 if(sequenceHop != 1) {
mas01cr@435 51 qspec.refine.flags |= ADB_REFINE_HOP_SIZE;
mas01cr@435 52 qspec.refine.hopsize = sequenceHop;
mas01cr@425 53 }
mas01cr@425 54
mas01cr@435 55 /* FIXME qspec.qid.datum */
mas01cr@435 56 qspec.qid.sequence_length = sequenceLength;
mas01cr@435 57 qspec.qid.flags = usingQueryPoint ? 0 : ADB_QUERY_ID_FLAG_EXHAUSTIVE;
mas01cr@435 58 qspec.qid.sequence_start = queryPoint;
mas01cr@435 59
mas01cr@431 60 switch(queryType) {
mas01cr@431 61 case O2_POINT_QUERY:
mas01cr@435 62 qspec.qid.sequence_length = 1;
mas01cr@435 63 qspec.params.accumulation = ADB_ACCUMULATION_DB;
mas01cr@435 64 qspec.params.distance = ADB_DISTANCE_DOT_PRODUCT;
mas01cr@435 65 qspec.params.npoints = pointNN;
mas01cr@435 66 qspec.params.ntracks = 0;
mas01cr@431 67 reporter = new pointQueryReporter< std::greater < NNresult > >(pointNN);
mas01cr@431 68 break;
mas01cr@431 69 case O2_TRACK_QUERY:
mas01cr@435 70 qspec.qid.sequence_length = 1;
mas01cr@435 71 qspec.params.accumulation = ADB_ACCUMULATION_PER_TRACK;
mas01cr@435 72 qspec.params.distance = ADB_DISTANCE_DOT_PRODUCT;
mas01cr@435 73 qspec.params.npoints = pointNN;
mas01cr@435 74 qspec.params.ntracks = trackNN;
mas01cr@431 75 reporter = new trackAveragingReporter< std::greater< NNresult > >(pointNN, trackNN, dbH->numFiles);
mas01cr@431 76 break;
mas01cr@431 77 case O2_SEQUENCE_QUERY:
mas01cr@431 78 case O2_N_SEQUENCE_QUERY:
mas01cr@435 79 qspec.params.accumulation = ADB_ACCUMULATION_PER_TRACK;
mas01cr@435 80 qspec.params.distance = no_unit_norming ? ADB_DISTANCE_EUCLIDEAN : ADB_DISTANCE_EUCLIDEAN_NORMED;
mas01cr@435 81 qspec.params.npoints = pointNN;
mas01cr@435 82 qspec.params.ntracks = trackNN;
mas01cr@431 83 switch(queryType) {
mas01cr@431 84 case O2_SEQUENCE_QUERY:
mas01cr@435 85 if(!(qspec.refine.flags & ADB_REFINE_RADIUS)) {
mas01cr@431 86 reporter = new trackAveragingReporter< std::less< NNresult > >(pointNN, trackNN, dbH->numFiles);
mas01cr@435 87 } else if (index_exists(adb->path, qspec.refine.radius, qspec.qid.sequence_length)) {
mas01cr@435 88 char* indexName = index_get_name(adb->path, qspec.refine.radius, qspec.qid.sequence_length);
mas01cr@431 89 lsh = index_allocate(indexName, false);
mas01cr@431 90 reporter = new trackSequenceQueryRadReporter(trackNN, index_to_trackID(lsh->get_maxp(), lsh_n_point_bits)+1);
mas01cr@431 91 delete[] indexName;
mas01cr@431 92 } else {
mas01cr@431 93 reporter = new trackSequenceQueryRadReporter(trackNN, dbH->numFiles);
mas01cr@431 94 }
mas01cr@431 95 break;
mas01cr@431 96 case O2_N_SEQUENCE_QUERY:
mas01cr@435 97 if(!(qspec.refine.flags & ADB_REFINE_RADIUS)) {
mas01cr@431 98 reporter = new trackSequenceQueryNNReporter< std::less < NNresult > >(pointNN, trackNN, dbH->numFiles);
mas01cr@435 99 } else if (index_exists(adb->path, qspec.refine.radius, qspec.qid.sequence_length)){
mas01cr@435 100 char* indexName = index_get_name(adb->path, qspec.refine.radius, qspec.qid.sequence_length);
mas01cr@431 101 lsh = index_allocate(indexName, false);
mas01cr@431 102 reporter = new trackSequenceQueryRadNNReporter(pointNN,trackNN, index_to_trackID(lsh->get_maxp(), lsh_n_point_bits)+1);
mas01cr@431 103 delete[] indexName;
mas01cr@431 104 } else {
mas01cr@431 105 reporter = new trackSequenceQueryRadNNReporter(pointNN,trackNN, dbH->numFiles);
mas01cr@431 106 }
mas01cr@431 107 break;
mas01cr@431 108 }
mas01cr@431 109 break;
mas01cr@431 110 case O2_ONE_TO_ONE_N_SEQUENCE_QUERY:
mas01cr@435 111 qspec.params.accumulation = ADB_ACCUMULATION_ONE_TO_ONE;
mas01cr@435 112 qspec.params.distance = ADB_DISTANCE_EUCLIDEAN_NORMED;
mas01cr@435 113 qspec.params.npoints = 0;
mas01cr@435 114 qspec.params.ntracks = 0;
mas01cr@431 115 break;
mas01cr@431 116 default:
mas01cr@431 117 error("unrecognized queryType");
mas01cr@431 118 }
mas01mc@292 119
mas01mc@292 120 // keyKeyPos requires dbH to be initialized
mas01cr@430 121 if(query_from_key && (!key || (query_from_key_index = audiodb_key_index(adb, key)) == (uint32_t) -1))
mas01cr@430 122 error("Query key not found", key);
mas01cr@431 123
mas01cr@435 124 switch(qspec.params.distance) {
mas01cr@431 125 case ADB_DISTANCE_DOT_PRODUCT:
mas01cr@435 126 switch(qspec.params.accumulation) {
mas01cr@431 127 case ADB_ACCUMULATION_DB:
mas01cr@435 128 accumulator = new DBAccumulator<adb_result_dist_gt>(qspec.params.npoints);
mas01cr@431 129 break;
mas01cr@431 130 case ADB_ACCUMULATION_PER_TRACK:
mas01cr@435 131 accumulator = new PerTrackAccumulator<adb_result_dist_gt>(qspec.params.npoints, qspec.params.ntracks);
mas01cr@431 132 break;
mas01cr@431 133 case ADB_ACCUMULATION_ONE_TO_ONE:
mas01cr@431 134 accumulator = new NearestAccumulator<adb_result_dist_gt>();
mas01cr@431 135 break;
mas01cr@431 136 default:
mas01cr@431 137 error("unknown accumulation");
mas01cr@239 138 }
mas01cr@239 139 break;
mas01cr@431 140 case ADB_DISTANCE_EUCLIDEAN_NORMED:
mas01cr@431 141 case ADB_DISTANCE_EUCLIDEAN:
mas01cr@435 142 switch(qspec.params.accumulation) {
mas01cr@431 143 case ADB_ACCUMULATION_DB:
mas01cr@435 144 accumulator = new DBAccumulator<adb_result_dist_lt>(qspec.params.npoints);
mas01cr@431 145 break;
mas01cr@431 146 case ADB_ACCUMULATION_PER_TRACK:
mas01cr@435 147 accumulator = new PerTrackAccumulator<adb_result_dist_lt>(qspec.params.npoints, qspec.params.ntracks);
mas01cr@431 148 break;
mas01cr@431 149 case ADB_ACCUMULATION_ONE_TO_ONE:
mas01cr@431 150 accumulator = new NearestAccumulator<adb_result_dist_lt>();
mas01cr@431 151 break;
mas01cr@431 152 default:
mas01cr@431 153 error("unknown accumulation");
mas01mc@263 154 }
mas01mc@263 155 break;
mas01cr@239 156 default:
mas01cr@431 157 error("unknown distance function");
mas01cr@431 158 }
mas01cr@431 159
mas01mc@292 160 // Test for index (again) here
mas01cr@435 161 if((qspec.refine.flags & ADB_REFINE_RADIUS) && index_exists(adb->path, qspec.refine.radius, qspec.qid.sequence_length)){
mas01cr@435 162 /* FIXME: remaining use of sequenceLength */
mas01cr@435 163 sequenceLength = qspec.qid.sequence_length;
mas01cr@435 164 VERB_LOG(1, "Calling indexed query on database %s, radius=%f, sequenceLength=%d\n", adb->path, qspec.refine.radius, sequenceLength);
mas01cr@435 165 index_query_loop(&qspec, dbName, query_from_key_index);
mas01mc@329 166 }
mas01mc@329 167 else{
mas01mc@329 168 VERB_LOG(1, "Calling brute-force query on database %s\n", dbName);
mas01cr@435 169 query_loop(&qspec, query_from_key_index);
mas01mc@329 170 }
mas01mc@292 171
mas01cr@423 172 adb_query_results_t *rs = accumulator->get_points();
mas01cr@423 173 for(unsigned int k = 0; k < rs->nresults; k++) {
mas01cr@423 174 adb_result_t r = rs->results[k];
mas01cr@430 175 reporter->add_point(audiodb_key_index(adb, r.key), r.qpos, r.ipos, r.dist);
mas01cr@423 176 }
mas01cr@423 177
mas01mc@292 178 reporter->report(fileTable, adbQueryResponse);
mas01cr@239 179 }
mas01cr@239 180
mas01cr@435 181 void audioDB::initialize_arrays(adb_t *adb, adb_query_spec_t *spec, int track, unsigned int numVectors, double *query, double *data_buffer, double **D, double **DD) {
mas01cr@239 182 unsigned int j, k, l, w;
mas01cr@239 183 double *dp, *qp, *sp;
mas01cr@239 184
mas01cr@239 185 const unsigned HOP_SIZE = sequenceHop;
mas01cr@435 186 const unsigned wL = spec->qid.sequence_length;
mas01cr@239 187
mas01cr@239 188 for(j = 0; j < numVectors; j++) {
mas01cr@239 189 // Sum products matrix
mas01cr@433 190 D[j] = new double[(*adb->track_lengths)[track]];
mas01cr@239 191 assert(D[j]);
mas01cr@239 192 // Matched filter matrix
mas01cr@433 193 DD[j]=new double[(*adb->track_lengths)[track]];
mas01cr@239 194 assert(DD[j]);
mas01cr@239 195 }
mas01cr@239 196
mas01cr@239 197 // Dot product
mas01cr@239 198 for(j = 0; j < numVectors; j++)
mas01cr@433 199 for(k = 0; k < (*adb->track_lengths)[track]; k++){
mas01cr@239 200 qp = query + j * dbH->dim;
mas01cr@239 201 sp = data_buffer + k * dbH->dim;
mas01cr@239 202 DD[j][k] = 0.0; // Initialize matched filter array
mas01cr@239 203 dp = &D[j][k]; // point to correlation cell j,k
mas01cr@239 204 *dp = 0.0; // initialize correlation cell
mas01cr@239 205 l = dbH->dim; // size of vectors
mas01cr@239 206 while(l--)
mas01cr@239 207 *dp += *qp++ * *sp++;
mas01cr@239 208 }
mas01cr@239 209
mas01cr@239 210 // Matched Filter
mas01cr@239 211 // HOP SIZE == 1
mas01cr@239 212 double* spd;
mas01cr@239 213 if(HOP_SIZE == 1) { // HOP_SIZE = shingleHop
mas01cr@239 214 for(w = 0; w < wL; w++) {
mas01cr@239 215 for(j = 0; j < numVectors - w; j++) {
mas01cr@239 216 sp = DD[j];
mas01cr@239 217 spd = D[j+w] + w;
mas01cr@433 218 k = (*adb->track_lengths)[track] - w;
mas01mc@292 219 while(k--)
mas01mc@292 220 *sp++ += *spd++;
mas01cr@239 221 }
mas01cr@239 222 }
mas01cr@239 223 } else { // HOP_SIZE != 1
mas01cr@239 224 for(w = 0; w < wL; w++) {
mas01cr@239 225 for(j = 0; j < numVectors - w; j += HOP_SIZE) {
mas01cr@239 226 sp = DD[j];
mas01cr@239 227 spd = D[j+w]+w;
mas01cr@433 228 for(k = 0; k < (*adb->track_lengths)[track] - w; k += HOP_SIZE) {
mas01cr@239 229 *sp += *spd;
mas01cr@239 230 sp += HOP_SIZE;
mas01cr@239 231 spd += HOP_SIZE;
mas01cr@239 232 }
mas01cr@239 233 }
mas01cr@239 234 }
mas01cr@239 235 }
mas01cr@239 236 }
mas01cr@239 237
// Release the rows of the two correlation matrices.
//
//   track       not used by this function.
//   numVectors  number of rows in each matrix.
//   D, DD       arrays of row pointers; either may be NULL, in which case
//               it is skipped.
//
// Only the rows are deleted; the arrays of row pointers themselves are left
// to the caller.
static void audiodb_delete_arrays(int track, unsigned int numVectors, double **D, double **DD) {
  double **matrices[2] = { D, DD };

  for(unsigned int m = 0; m < 2; m++) {
    double **rows = matrices[m];
    if(rows == NULL) {
      continue;
    }
    for(unsigned int row = 0; row < numVectors; row++) {
      delete[] rows[row];
    }
  }
}
mas01cr@239 250
mas01cr@433 251 int audiodb_read_data(adb_t *adb, int trkfid, int track, double **data_buffer_p, size_t *data_buffer_size_p) {
mas01cr@433 252 uint32_t track_length = (*adb->track_lengths)[track];
mas01cr@433 253 size_t track_size = track_length * sizeof(double) * adb->header->dim;
mas01cr@433 254 if (track_size > *data_buffer_size_p) {
mas01cr@239 255 if(*data_buffer_p) {
mas01cr@239 256 free(*data_buffer_p);
mas01cr@239 257 }
mas01cr@239 258 {
mas01cr@433 259 *data_buffer_size_p = track_size;
mas01cr@433 260 void *tmp = malloc(track_size);
mas01cr@239 261 if (tmp == NULL) {
mas01cr@433 262 goto error;
mas01cr@239 263 }
mas01cr@239 264 *data_buffer_p = (double *) tmp;
mas01cr@239 265 }
mas01cr@239 266 }
mas01cr@239 267
mas01cr@433 268 read_or_goto_error(trkfid, *data_buffer_p, track_size);
mas01cr@433 269 return 0;
mas01cr@433 270
mas01cr@433 271 error:
mas01cr@433 272 return 1;
mas01cr@239 273 }
mas01cr@239 274
mas01cr@405 275 void audioDB::insertTimeStamps(unsigned numVectors, std::ifstream *timesFile, double *timesdata) {
mas01cr@405 276 assert(usingTimes);
mas01cr@405 277
mas01cr@405 278 unsigned numtimes = 0;
mas01cr@405 279
mas01cr@405 280 if(!timesFile->is_open()) {
mas01cr@405 281 error("problem opening times file on timestamped database", timesFileName);
mas01cr@405 282 }
mas01cr@405 283
mas01cr@405 284 double timepoint, next;
mas01cr@405 285 *timesFile >> timepoint;
mas01cr@405 286 if (timesFile->eof()) {
mas01cr@405 287 error("no entries in times file", timesFileName);
mas01cr@405 288 }
mas01cr@405 289 numtimes++;
mas01cr@405 290 do {
mas01cr@405 291 *timesFile >> next;
mas01cr@405 292 if (timesFile->eof()) {
mas01cr@405 293 break;
mas01cr@405 294 }
mas01cr@405 295 numtimes++;
mas01cr@405 296 timesdata[0] = timepoint;
mas01cr@405 297 timepoint = (timesdata[1] = next);
mas01cr@405 298 timesdata += 2;
mas01cr@405 299 } while (numtimes < numVectors + 1);
mas01cr@405 300
mas01cr@405 301 if (numtimes < numVectors + 1) {
mas01cr@405 302 error("too few timepoints in times file", timesFileName);
mas01cr@405 303 }
mas01cr@405 304
mas01cr@405 305 *timesFile >> next;
mas01cr@405 306 if (!timesFile->eof()) {
mas01cr@405 307 error("too many timepoints in times file", timesFileName);
mas01cr@405 308 }
mas01cr@405 309 }
mas01cr@405 310
mas01cr@239 311 // These names deserve some unpicking. The names starting with a "q"
mas01cr@239 312 // are pointers to the query, norm and power vectors; the names
mas01cr@239 313 // starting with "v" are things that will end up pointing to the
mas01cr@239 314 // actual query point's information. -- CSR, 2007-12-05
mas01cr@435 315 void audioDB::set_up_query(adb_query_spec_t *spec, double **qp, double **vqp, double **qnp, double **vqnp, double **qpp, double **vqpp, double *mqdp, unsigned *nvp) {
mas01cr@239 316 *nvp = (statbuf.st_size - sizeof(int)) / (dbH->dim * sizeof(double));
mas01mc@292 317
mas01cr@435 318 uint32_t sequence_length = spec->qid.sequence_length;
mas01cr@239 319 if(!(dbH->flags & O2_FLAG_L2NORM)) {
mas01cr@239 320 error("Database must be L2 normed for sequence query","use -L2NORM");
mas01cr@239 321 }
mas01cr@239 322
mas01cr@435 323 if(*nvp < sequence_length) {
mas01cr@239 324 error("Query shorter than requested sequence length", "maybe use -l");
mas01cr@239 325 }
mas01cr@239 326
mas01cr@239 327 VERB_LOG(1, "performing norms... ");
mas01cr@239 328
mas01cr@239 329 *qp = new double[*nvp * dbH->dim];
mas01cr@239 330 memcpy(*qp, indata+sizeof(int), *nvp * dbH->dim * sizeof(double));
mas01cr@239 331 *qnp = new double[*nvp];
mas01cr@426 332 audiodb_l2norm_buffer(*qp, dbH->dim, *nvp, *qnp);
mas01cr@239 333
mas01cr@435 334 audiodb_sequence_sum(*qnp, *nvp, sequence_length);
mas01cr@435 335 audiodb_sequence_sqrt(*qnp, *nvp, sequence_length);
mas01cr@239 336
mas01cr@239 337 if (usingPower) {
mas01cr@239 338 *qpp = new double[*nvp];
mas01cr@239 339 if (lseek(powerfd, sizeof(int), SEEK_SET) == (off_t) -1) {
mas01cr@239 340 error("error seeking to data", powerFileName, "lseek");
mas01cr@239 341 }
mas01cr@239 342 int count = read(powerfd, *qpp, *nvp * sizeof(double));
mas01cr@239 343 if (count == -1) {
mas01cr@239 344 error("error reading data", powerFileName, "read");
mas01cr@239 345 }
mas01cr@239 346 if ((unsigned) count != *nvp * sizeof(double)) {
mas01cr@239 347 error("short read", powerFileName);
mas01cr@239 348 }
mas01cr@239 349
mas01cr@435 350 audiodb_sequence_sum(*qpp, *nvp, sequence_length);
mas01cr@435 351 audiodb_sequence_average(*qpp, *nvp, sequence_length);
mas01cr@239 352 }
mas01cr@239 353
mas01cr@239 354 if (usingTimes) {
mas01cr@239 355 unsigned int k;
mas01cr@239 356 *mqdp = 0.0;
mas01cr@239 357 double *querydurs = new double[*nvp];
mas01cr@239 358 double *timesdata = new double[*nvp*2];
mas01cr@239 359 insertTimeStamps(*nvp, timesFile, timesdata);
mas01cr@239 360 for(k = 0; k < *nvp; k++) {
mas01cr@239 361 querydurs[k] = timesdata[2*k+1] - timesdata[2*k];
mas01cr@239 362 *mqdp += querydurs[k];
mas01cr@239 363 }
mas01cr@239 364 *mqdp /= k;
mas01cr@239 365
mas01cr@239 366 VERB_LOG(1, "mean query file duration: %f\n", *mqdp);
mas01cr@239 367
mas01cr@239 368 delete [] querydurs;
mas01cr@239 369 delete [] timesdata;
mas01cr@239 370 }
mas01cr@239 371
mas01cr@239 372 // Defaults, for exhaustive search (!usingQueryPoint)
mas01cr@239 373 *vqp = *qp;
mas01cr@239 374 *vqnp = *qnp;
mas01cr@239 375 *vqpp = *qpp;
mas01cr@239 376
mas01cr@239 377 if(usingQueryPoint) {
mas01cr@435 378 if( !(queryPoint < *nvp && queryPoint < *nvp - sequence_length + 1) ) {
mas01mc@342 379 error("queryPoint >= numVectors-sequenceLength+1 in query");
mas01cr@239 380 } else {
mas01cr@239 381 VERB_LOG(1, "query point: %u\n", queryPoint);
mas01cr@239 382 *vqp = *qp + queryPoint * dbH->dim;
mas01cr@239 383 *vqnp = *qnp + queryPoint;
mas01cr@239 384 if (usingPower) {
mas01cr@239 385 *vqpp = *qpp + queryPoint;
mas01cr@239 386 }
mas01cr@435 387 *nvp = sequence_length;
mas01cr@239 388 }
mas01cr@239 389 }
mas01cr@239 390 }
mas01cr@239 391
mas01mc@292 392 // Does the same as set_up_query(...) but from database features instead of from a file
mas01mc@292 393 // Constructs the same outputs as set_up_query
mas01cr@435 394 void audioDB::set_up_query_from_key(adb_query_spec_t *spec, double **qp, double **vqp, double **qnp, double **vqnp, double **qpp, double **vqpp, double *mqdp, unsigned *nvp, Uns32T queryIndex) {
mas01cr@435 395 uint32_t sequence_length = spec->qid.sequence_length;
mas01mc@292 396 if(!trackTable)
mas01mc@292 397 error("trackTable not initialized","set_up_query_from_key");
mas01mc@292 398
mas01mc@292 399 if(!(dbH->flags & O2_FLAG_L2NORM)) {
mas01mc@292 400 error("Database must be L2 normed for sequence query","use -L2NORM");
mas01mc@292 401 }
mas01mc@292 402
mas01mc@292 403 if(dbH->flags & O2_FLAG_POWER)
mas01mc@292 404 usingPower = true;
mas01mc@292 405
mas01mc@292 406 if(dbH->flags & O2_FLAG_TIMES)
mas01mc@292 407 usingTimes = true;
mas01mc@292 408
mas01mc@292 409 *nvp = trackTable[queryIndex];
mas01cr@435 410 if(*nvp < sequence_length) {
mas01mc@292 411 error("Query shorter than requested sequence length", "maybe use -l");
mas01mc@292 412 }
mas01mc@292 413
mas01mc@292 414 VERB_LOG(1, "performing norms... ");
mas01mc@292 415
mas01mc@324 416 // For LARGE_ADB load query features from file
mas01mc@324 417 if( dbH->flags & O2_FLAG_LARGE_ADB ){
mas01mc@324 418 if(infid>0)
mas01mc@324 419 close(infid);
mas01mc@324 420 char* prefixedString = new char[O2_MAXFILESTR];
mas01mc@324 421 char* tmpStr = prefixedString;
mas01mc@324 422 strncpy(prefixedString, featureFileNameTable+queryIndex*O2_FILETABLE_ENTRY_SIZE, O2_MAXFILESTR);
mas01mc@324 423 prefix_name(&prefixedString, adb_feature_root);
mas01mc@324 424 if(tmpStr!=prefixedString)
mas01mc@324 425 delete[] tmpStr;
mas01mc@324 426 initInputFile(prefixedString, false); // nommap, file pointer at correct position
mas01mc@324 427 size_t allocatedSize = 0;
mas01cr@433 428 if(audiodb_read_data(adb, infid, queryIndex, qp, &allocatedSize))
mas01cr@433 429 error("failed to read data"); // over-writes qp and allocatedSize
mas01mc@324 430 // Consistency check on allocated memory and query feature size
mas01mc@324 431 if(*nvp*sizeof(double)*dbH->dim != allocatedSize)
mas01mc@324 432 error("Query memory allocation failed consitency check","set_up_query_from_key");
mas01mc@324 433 // Allocated and calculate auxillary sequences: l2norm and power
mas01mc@324 434 init_track_aux_data(queryIndex, *qp, qnp, vqnp, qpp, vqpp);
mas01mc@324 435 }
mas01mc@324 436 else{ // Load from self-contained ADB database
mas01mc@324 437 // Read query feature vectors from database
mas01mc@324 438 *qp = NULL;
mas01mc@324 439 lseek(dbfid, dbH->dataOffset + trackOffsetTable[queryIndex] * sizeof(double), SEEK_SET);
mas01mc@324 440 size_t allocatedSize = 0;
mas01cr@433 441 if(audiodb_read_data(adb, dbfid, queryIndex, qp, &allocatedSize))
mas01cr@433 442 error("failed to read data");
mas01mc@324 443 // Consistency check on allocated memory and query feature size
mas01mc@324 444 if(*nvp*sizeof(double)*dbH->dim != allocatedSize)
mas01mc@324 445 error("Query memory allocation failed consitency check","set_up_query_from_key");
mas01mc@324 446
mas01mc@324 447 Uns32T trackIndexOffset = trackOffsetTable[queryIndex]/dbH->dim; // Convert num data elements to num vectors
mas01mc@324 448 // Copy L2 norm partial-sum coefficients
mas01mc@324 449 assert(*qnp = new double[*nvp]);
mas01mc@324 450 memcpy(*qnp, l2normTable+trackIndexOffset, *nvp*sizeof(double));
mas01cr@435 451 audiodb_sequence_sum(*qnp, *nvp, sequence_length);
mas01cr@435 452 audiodb_sequence_sqrt(*qnp, *nvp, sequence_length);
mas01mc@324 453
mas01mc@324 454 if( usingPower ){
mas01mc@324 455 // Copy Power partial-sum coefficients
mas01mc@324 456 assert(*qpp = new double[*nvp]);
mas01mc@324 457 memcpy(*qpp, powerTable+trackIndexOffset, *nvp*sizeof(double));
mas01cr@435 458 audiodb_sequence_sum(*qpp, *nvp, sequence_length);
mas01cr@435 459 audiodb_sequence_average(*qpp, *nvp, sequence_length);
mas01mc@324 460 }
mas01mc@324 461
mas01mc@324 462 if (usingTimes) {
mas01mc@324 463 unsigned int k;
mas01mc@324 464 *mqdp = 0.0;
mas01mc@324 465 double *querydurs = new double[*nvp];
mas01mc@324 466 double *timesdata = new double[*nvp*2];
mas01mc@324 467 assert(querydurs && timesdata);
mas01mc@324 468 memcpy(timesdata, timesTable+trackIndexOffset, *nvp*sizeof(double));
mas01mc@324 469 for(k = 0; k < *nvp; k++) {
mas01mc@324 470 querydurs[k] = timesdata[2*k+1] - timesdata[2*k];
mas01mc@324 471 *mqdp += querydurs[k];
mas01mc@324 472 }
mas01mc@324 473 *mqdp /= k;
mas01mc@324 474
mas01mc@324 475 VERB_LOG(1, "mean query file duration: %f\n", *mqdp);
mas01mc@324 476
mas01mc@324 477 delete [] querydurs;
mas01mc@324 478 delete [] timesdata;
mas01mc@324 479 }
mas01mc@292 480 }
mas01mc@292 481
mas01mc@292 482 // Defaults, for exhaustive search (!usingQueryPoint)
mas01mc@292 483 *vqp = *qp;
mas01mc@292 484 *vqnp = *qnp;
mas01mc@292 485 *vqpp = *qpp;
mas01mc@292 486
mas01mc@292 487 if(usingQueryPoint) {
mas01cr@435 488 if( !(queryPoint < *nvp && queryPoint < *nvp - sequence_length + 1) ) {
mas01mc@342 489 error("queryPoint >= numVectors-sequenceLength+1 in query");
mas01mc@292 490 } else {
mas01mc@292 491 VERB_LOG(1, "query point: %u\n", queryPoint);
mas01mc@292 492 *vqp = *qp + queryPoint * dbH->dim;
mas01mc@292 493 *vqnp = *qnp + queryPoint;
mas01mc@292 494 if (usingPower) {
mas01mc@292 495 *vqpp = *qpp + queryPoint;
mas01mc@292 496 }
mas01cr@435 497 *nvp = sequence_length;
mas01mc@292 498 }
mas01mc@292 499 }
mas01mc@292 500 }
mas01mc@292 501
mas01mc@292 502
mas01cr@239 503 // FIXME: this is not the right name; we're not actually setting up
mas01cr@239 504 // the database, but copying various bits of it out of mmap()ed tables
mas01cr@239 505 // in order to reduce seeks.
mas01cr@435 506 int audioDB::set_up_db(adb_t *adb, adb_query_spec_t *spec, double **snp, double **vsnp, double **spp, double **vspp, double **mddp, unsigned int *dvp) {
mas01cr@435 507 uint32_t sequence_length = spec->qid.sequence_length;
mas01cr@435 508
mas01cr@434 509 *dvp = adb->header->length / (adb->header->dim * sizeof(double));
mas01cr@239 510 *snp = new double[*dvp];
mas01cr@239 511
mas01cr@239 512 double *snpp = *snp, *sppp = 0;
mas01cr@434 513 lseek(adb->fd, adb->header->l2normTableOffset, SEEK_SET);
mas01cr@434 514 read_or_goto_error(adb->fd, *snp, *dvp * sizeof(double));
mas01cr@239 515
mas01cr@239 516 if (usingPower) {
mas01cr@434 517 if (!(adb->header->flags & O2_FLAG_POWER)) {
mas01cr@434 518 goto error;
mas01cr@239 519 }
mas01cr@239 520 *spp = new double[*dvp];
mas01cr@239 521 sppp = *spp;
mas01cr@434 522 lseek(adb->fd, adb->header->powerTableOffset, SEEK_SET);
mas01cr@434 523 read_or_goto_error(adb->fd, *spp, *dvp * sizeof(double));
mas01cr@239 524 }
mas01cr@239 525
mas01cr@434 526 for(unsigned int i = 0; i < adb->header->numFiles; i++){
mas01cr@434 527 size_t track_length = (*adb->track_lengths)[i];
mas01cr@435 528 if(track_length >= sequence_length) {
mas01cr@435 529 audiodb_sequence_sum(snpp, track_length, sequence_length);
mas01cr@435 530 audiodb_sequence_sqrt(snpp, track_length, sequence_length);
mas01cr@239 531 if (usingPower) {
mas01cr@435 532 audiodb_sequence_sum(sppp, track_length, sequence_length);
mas01cr@435 533 audiodb_sequence_average(sppp, track_length, sequence_length);
mas01cr@239 534 }
mas01cr@239 535 }
mas01cr@434 536 snpp += track_length;
mas01cr@239 537 if (usingPower) {
mas01cr@434 538 sppp += track_length;
mas01cr@239 539 }
mas01cr@239 540 }
mas01cr@239 541
mas01cr@239 542 if (usingTimes) {
mas01cr@434 543 if(!(adb->header->flags & O2_FLAG_TIMES)) {
mas01cr@239 544 error("query timestamps provided for non-timed database", dbName);
mas01cr@239 545 }
mas01cr@239 546
mas01cr@434 547 *mddp = new double[adb->header->numFiles];
mas01cr@239 548
mas01cr@434 549 for(unsigned int k = 0; k < adb->header->numFiles; k++) {
mas01cr@434 550 size_t track_length = (*adb->track_lengths)[k];
mas01cr@239 551 unsigned int j;
mas01cr@239 552 (*mddp)[k] = 0.0;
mas01cr@434 553 for(j = 0; j < track_length; j++) {
mas01cr@239 554 (*mddp)[k] += timesTable[2*j+1] - timesTable[2*j];
mas01cr@239 555 }
mas01cr@239 556 (*mddp)[k] /= j;
mas01cr@239 557 }
mas01cr@239 558 }
mas01cr@239 559
mas01cr@239 560 *vsnp = *snp;
mas01cr@239 561 *vspp = *spp;
mas01cr@434 562 return 0;
mas01cr@434 563
mas01cr@434 564 error:
mas01cr@434 565 if(*snp) {
mas01cr@434 566 delete [] *snp;
mas01cr@434 567 }
mas01cr@434 568 if(*spp) {
mas01cr@434 569 delete [] *spp;
mas01cr@434 570 }
mas01cr@434 571 if(*mddp) {
mas01cr@434 572 delete [] *mddp;
mas01cr@434 573 }
mas01cr@434 574 return 1;
mas01cr@434 575
mas01cr@239 576 }
mas01cr@239 577
mas01mc@292 578 // query_points()
mas01mc@292 579 //
mas01mc@292 580 // using PointPairs held in the exact_evaluation_queue compute squared distance for each PointPair
mas01mc@292 581 // and insert result into the current reporter.
mas01mc@292 582 //
mas01mc@292 583 // Preconditions:
mas01mc@292 584 // A query inFile has been opened with setup_query(...) and query pointers initialized
mas01mc@292 585 // The database contains some points
mas01mc@292 586 // An exact_evaluation_queue has been allocated and populated
mas01mc@292 587 // A reporter has been allocated
mas01mc@292 588 //
mas01mc@292 589 // Postconditions:
mas01mc@292 590 // reporter contains the points and distances that meet the reporter constraints
mas01mc@292 591
mas01cr@435 592 void audioDB::query_loop_points(adb_query_spec_t *spec, double* query, double* qnPtr, double* qpPtr, double meanQdur, Uns32T numVectors){
mas01mc@292 593 unsigned int dbVectors;
mas01mc@315 594 double *sNorm = 0, *snPtr, *sPower = 0, *spPtr = 0;
mas01mc@292 595 double *meanDBdur = 0;
mas01mc@292 596
mas01mc@292 597 // check pre-conditions
mas01mc@292 598 assert(exact_evaluation_queue&&reporter);
mas01mc@292 599 if(!exact_evaluation_queue->size()) // Exit if no points to evaluate
mas01mc@292 600 return;
mas01mc@292 601
mas01mc@292 602 // Compute database info
mas01mc@292 603 // FIXME: we more than likely don't need very much of the database
mas01mc@292 604 // so make a new method to build these values per-track or, even better, per-point
mas01mc@324 605 if( !( dbH->flags & O2_FLAG_LARGE_ADB) )
mas01cr@435 606 if(set_up_db(adb, spec, &sNorm, &snPtr, &sPower, &spPtr, &meanDBdur, &dbVectors)) {
mas01cr@434 607 error("failed to set up db");
mas01cr@434 608 }
mas01mc@292 609
mas01mc@292 610 VERB_LOG(1, "matching points...");
mas01mc@292 611
mas01mc@292 612 // We are guaranteed that the order of points is sorted by:
mas01mc@324 613 // trackID, spos, qpos
mas01mc@292 614 // so we can be relatively efficient in initialization of track data.
mas01mc@292 615 // Here we assume that points don't overlap, so we will use exhaustive dot
mas01mc@324 616 // product evaluation instead of memoization of partial sums which is used
mas01mc@324 617 // for exhaustive brute-force evaluation from smaller databases: e.g. query_loop()
mas01mc@292 618 double dist;
mas01mc@292 619 size_t data_buffer_size = 0;
mas01mc@292 620 double *data_buffer = 0;
mas01mc@324 621 Uns32T trackOffset = 0;
mas01mc@324 622 Uns32T trackIndexOffset = 0;
mas01mc@292 623 Uns32T currentTrack = 0x80000000; // Initialize with a value outside of track index range
mas01mc@292 624 Uns32T npairs = exact_evaluation_queue->size();
mas01mc@292 625 while(npairs--){
mas01mc@292 626 PointPair pp = exact_evaluation_queue->top();
mas01mc@324 627 // Large ADB track data must be loaded here for sPower
mas01mc@324 628 if(dbH->flags & O2_FLAG_LARGE_ADB){
mas01mc@324 629 trackOffset=0;
mas01mc@324 630 trackIndexOffset=0;
mas01mc@292 631 if(currentTrack!=pp.trackID){
mas01mc@324 632 char* prefixedString = new char[O2_MAXFILESTR];
mas01mc@324 633 char* tmpStr = prefixedString;
mas01mc@324 634 // On currentTrack change, allocate and load track data
mas01mc@292 635 currentTrack=pp.trackID;
mas01mc@324 636 SAFE_DELETE_ARRAY(sNorm);
mas01mc@324 637 SAFE_DELETE_ARRAY(sPower);
mas01mc@324 638 if(infid>0)
mas01mc@324 639 close(infid);
mas01mc@324 640 // Open and check dimensions of feature file
mas01mc@324 641 strncpy(prefixedString, featureFileNameTable+pp.trackID*O2_FILETABLE_ENTRY_SIZE, O2_MAXFILESTR);
mas01mc@324 642 prefix_name((char ** const) &prefixedString, adb_feature_root);
mas01mc@324 643 if (prefixedString!=tmpStr)
mas01mc@324 644 delete[] tmpStr;
mas01mc@324 645 initInputFile(prefixedString, false); // nommap, file pointer at correct position
mas01mc@324 646 // Load the feature vector data for current track into data_buffer
mas01cr@433 647 if(audiodb_read_data(adb, infid, pp.trackID, &data_buffer, &data_buffer_size))
mas01cr@433 648 error("failed to read data");
mas01mc@324 649 // Load power and calculate power and l2norm sequence sums
mas01mc@324 650 init_track_aux_data(pp.trackID, data_buffer, &sNorm, &snPtr, &sPower, &spPtr);
mas01mc@292 651 }
mas01mc@324 652 }
mas01mc@324 653 else{
mas01mc@324 654 // These offsets are w.r.t. the entire database of feature vectors and auxillary variables
mas01mc@324 655 trackOffset=trackOffsetTable[pp.trackID]; // num data elements offset
mas01mc@324 656 trackIndexOffset=trackOffset/dbH->dim; // num vectors offset
mas01mc@324 657 }
mas01mc@324 658 Uns32T qPos = usingQueryPoint?0:pp.qpos;// index for query point
mas01mc@324 659 Uns32T sPos = trackIndexOffset+pp.spos; // index into l2norm table
mas01mc@324 660 // Test power thresholds before computing distance
mas01cr@435 661 if( ( !usingPower || audiodb_powers_acceptable(&spec->refine, qpPtr[qPos], sPower[sPos])) &&
mas01mc@324 662 ( qPos<numVectors-sequenceLength+1 && pp.spos<trackTable[pp.trackID]-sequenceLength+1 ) ){
mas01mc@324 663 // Non-large ADB track data is loaded inside power test for efficiency
mas01mc@324 664 if( !(dbH->flags & O2_FLAG_LARGE_ADB) && (currentTrack!=pp.trackID) ){
mas01mc@324 665 // On currentTrack change, allocate and load track data
mas01mc@324 666 currentTrack=pp.trackID;
mas01mc@324 667 lseek(dbfid, dbH->dataOffset + trackOffset * sizeof(double), SEEK_SET);
mas01cr@433 668 if(audiodb_read_data(adb, dbfid, currentTrack, &data_buffer, &data_buffer_size))
mas01cr@433 669 error("failed to read data");
mas01mc@324 670 }
mas01mc@324 671 // Compute distance
mas01cr@425 672 dist = audiodb_dot_product(query+qPos*dbH->dim, data_buffer+pp.spos*dbH->dim, dbH->dim*sequenceLength);
mas01mc@324 673 double qn = qnPtr[qPos];
mas01mc@324 674 double sn = sNorm[sPos];
mas01cr@435 675 switch(spec->params.distance) {
mas01cr@431 676 case ADB_DISTANCE_EUCLIDEAN_NORMED:
mas01mc@324 677 dist = 2 - (2/(qn*sn))*dist;
mas01cr@431 678 break;
mas01cr@431 679 case ADB_DISTANCE_EUCLIDEAN:
mas01cr@431 680 dist = qn*qn + sn*sn - 2*dist;
mas01cr@431 681 break;
mas01cr@431 682 }
mas01cr@424 683 if((!radius) || dist <= (O2_LSH_EXACT_MULT*radius+O2_DISTANCE_TOLERANCE)) {
mas01cr@424 684 adb_result_t r;
mas01cr@424 685 r.key = fileTable + pp.trackID * O2_FILETABLE_ENTRY_SIZE;
mas01cr@424 686 r.dist = dist;
mas01cr@424 687 r.qpos = pp.qpos;
mas01cr@424 688 r.ipos = pp.spos;
mas01cr@424 689 accumulator->add_point(&r);
mas01cr@424 690 }
mas01mc@292 691 }
mas01mc@292 692 exact_evaluation_queue->pop();
mas01mc@292 693 }
mas01mc@315 694 // Cleanup
mas01mc@324 695 SAFE_DELETE_ARRAY(sNorm);
mas01mc@324 696 SAFE_DELETE_ARRAY(sPower);
mas01mc@324 697 SAFE_DELETE_ARRAY(meanDBdur);
mas01mc@292 698 }
mas01mc@292 699
mas01cr@435 700 void audioDB::query_loop(adb_query_spec_t *spec, Uns32T queryIndex) {
mas01cr@239 701
mas01cr@239 702 unsigned int numVectors;
mas01cr@239 703 double *query, *query_data;
mas01cr@239 704 double *qNorm, *qnPtr, *qPower = 0, *qpPtr = 0;
mas01cr@239 705 double meanQdur;
mas01cr@239 706
mas01mc@324 707 if( dbH->flags & O2_FLAG_LARGE_ADB )
mas01mc@324 708 error("error: LARGE_ADB requires indexed query");
mas01mc@324 709
mas01mc@292 710 if(query_from_key)
mas01cr@435 711 set_up_query_from_key(spec, &query_data, &query, &qNorm, &qnPtr, &qPower, &qpPtr, &meanQdur, &numVectors, queryIndex);
mas01mc@292 712 else
mas01cr@435 713 set_up_query(spec, &query_data, &query, &qNorm, &qnPtr, &qPower, &qpPtr, &meanQdur, &numVectors);
mas01cr@239 714
mas01cr@239 715 unsigned int dbVectors;
mas01cr@239 716 double *sNorm, *snPtr, *sPower = 0, *spPtr = 0;
mas01cr@239 717 double *meanDBdur = 0;
mas01cr@239 718
mas01cr@435 719 if(set_up_db(adb, spec, &sNorm, &snPtr, &sPower, &spPtr, &meanDBdur, &dbVectors)) {
mas01cr@434 720 error("failed to set up db");
mas01cr@434 721 }
mas01cr@239 722
mas01cr@239 723 VERB_LOG(1, "matching tracks...");
mas01cr@239 724
mas01cr@435 725 unsigned j,k,track,trackOffset=0, HOP_SIZE=sequenceHop;
mas01cr@435 726 unsigned wL = spec->qid.sequence_length;
mas01cr@239 727 double **D = 0; // Differences query and target
mas01cr@239 728 double **DD = 0; // Matched filter distance
mas01cr@239 729
mas01mc@292 730 D = new double*[numVectors]; // pre-allocate
mas01cr@239 731 DD = new double*[numVectors];
mas01cr@239 732
mas01cr@239 733 gettimeofday(&tv1, NULL);
mas01cr@239 734 unsigned processedTracks = 0;
mas01cr@239 735 off_t trackIndexOffset;
mas01cr@239 736 char nextKey[MAXSTR];
mas01cr@239 737
mas01cr@239 738 // Track loop
mas01cr@239 739 size_t data_buffer_size = 0;
mas01cr@239 740 double *data_buffer = 0;
mas01cr@239 741 lseek(dbfid, dbH->dataOffset, SEEK_SET);
mas01cr@239 742
mas01cr@239 743 for(processedTracks=0, track=0 ; processedTracks < dbH->numFiles ; track++, processedTracks++) {
mas01cr@239 744
mas01cr@239 745 trackOffset = trackOffsetTable[track]; // numDoubles offset
mas01cr@239 746
mas01cr@239 747 // get trackID from file if using a control file
mas01cr@239 748 if(trackFile) {
mas01cr@239 749 trackFile->getline(nextKey,MAXSTR);
mas01cr@239 750 if(!trackFile->eof()) {
mas01cr@430 751 track = audiodb_key_index(adb, nextKey);
mas01cr@430 752 if(track == (uint32_t) -1) {
mas01cr@430 753 error("key not found", nextKey);
mas01cr@430 754 }
mas01cr@239 755 trackOffset = trackOffsetTable[track];
mas01cr@239 756 lseek(dbfid, dbH->dataOffset + trackOffset * sizeof(double), SEEK_SET);
mas01cr@239 757 } else {
mas01cr@239 758 break;
mas01cr@239 759 }
mas01cr@239 760 }
mas01cr@239 761
mas01mc@292 762 // skip identity on query_from_key
mas01mc@292 763 if( query_from_key && (track == queryIndex) ) {
mas01mc@292 764 if(queryIndex!=dbH->numFiles-1){
mas01mc@292 765 track++;
mas01mc@292 766 trackOffset = trackOffsetTable[track];
mas01mc@292 767 lseek(dbfid, dbH->dataOffset + trackOffset * sizeof(double), SEEK_SET);
mas01mc@292 768 }
mas01mc@292 769 else{
mas01mc@292 770 break;
mas01mc@292 771 }
mas01mc@292 772 }
mas01mc@292 773
mas01cr@239 774 trackIndexOffset=trackOffset/dbH->dim; // numVectors offset
mas01cr@239 775
mas01cr@433 776 if(audiodb_read_data(adb, dbfid, track, &data_buffer, &data_buffer_size))
mas01cr@433 777 error("failed to read data");
mas01cr@435 778 if(wL <= trackTable[track]) { // test for short sequences
mas01cr@239 779
mas01cr@239 780 VERB_LOG(7,"%u.%jd.%u | ", track, (intmax_t) trackIndexOffset, trackTable[track]);
mas01cr@239 781
mas01cr@435 782 initialize_arrays(adb, spec, track, numVectors, query, data_buffer, D, DD);
mas01cr@239 783
mas01cr@435 784 if(spec->refine.flags & ADB_REFINE_DURATION_RATIO) {
mas01cr@239 785 VERB_LOG(3,"meanQdur=%f meanDBdur=%f\n", meanQdur, meanDBdur[track]);
mas01cr@239 786 }
mas01cr@239 787
mas01cr@435 788 if((!(spec->refine.flags & ADB_REFINE_DURATION_RATIO)) || fabs(meanDBdur[track]-meanQdur) < meanQdur*spec->refine.duration_ratio) {
mas01cr@435 789 if(spec->refine.flags & ADB_REFINE_DURATION_RATIO) {
mas01cr@239 790 VERB_LOG(3,"within duration tolerance.\n");
mas01cr@239 791 }
mas01cr@239 792
mas01cr@239 793 // Search for minimum distance by shingles (concatenated vectors)
mas01cr@239 794 for(j = 0; j <= numVectors - wL; j += HOP_SIZE) {
mas01cr@239 795 for(k = 0; k <= trackTable[track] - wL; k += HOP_SIZE) {
mas01cr@431 796 double thisDist = 0;
mas01cr@435 797 switch(spec->params.distance) {
mas01cr@431 798 case ADB_DISTANCE_EUCLIDEAN_NORMED:
mas01cr@239 799 thisDist = 2-(2/(qnPtr[j]*sNorm[trackIndexOffset+k]))*DD[j][k];
mas01cr@431 800 break;
mas01cr@431 801 case ADB_DISTANCE_EUCLIDEAN:
mas01cr@431 802 thisDist = qnPtr[j]*qnPtr[j]+sNorm[trackIndexOffset+k]*sNorm[trackIndexOffset+k] - 2*DD[j][k];
mas01cr@431 803 break;
mas01cr@431 804 case ADB_DISTANCE_DOT_PRODUCT:
mas01cr@431 805 thisDist = DD[j][k];
mas01cr@431 806 break;
mas01cr@431 807 }
mas01cr@239 808 // Power test
mas01cr@435 809 if ((!usingPower) || audiodb_powers_acceptable(&spec->refine, qpPtr[j], sPower[trackIndexOffset + k])) {
mas01cr@239 810 // radius test
mas01cr@435 811 if((!(spec->refine.flags & ADB_REFINE_RADIUS)) ||
mas01cr@435 812 thisDist <= (spec->refine.radius+O2_DISTANCE_TOLERANCE)) {
mas01cr@423 813 adb_result_t r;
mas01cr@423 814 r.key = fileTable + track * O2_FILETABLE_ENTRY_SIZE;
mas01cr@423 815 r.dist = thisDist;
mas01cr@423 816 r.qpos = usingQueryPoint ? queryPoint : j;
mas01cr@423 817 r.ipos = k;
mas01cr@423 818 accumulator->add_point(&r);
mas01cr@239 819 }
mas01cr@239 820 }
mas01cr@239 821 }
mas01cr@239 822 }
mas01cr@239 823 } // Duration match
mas01cr@433 824 audiodb_delete_arrays(track, numVectors, D, DD);
mas01cr@239 825 }
mas01cr@239 826 }
mas01cr@239 827
mas01cr@239 828 free(data_buffer);
mas01cr@239 829
mas01cr@239 830 gettimeofday(&tv2,NULL);
mas01cr@239 831 VERB_LOG(1,"elapsed time: %ld msec\n",
mas01cr@239 832 (tv2.tv_sec*1000 + tv2.tv_usec/1000) -
mas01cr@239 833 (tv1.tv_sec*1000 + tv1.tv_usec/1000))
mas01cr@239 834
mas01cr@239 835 // Clean up
mas01cr@239 836 if(query_data)
mas01cr@239 837 delete[] query_data;
mas01cr@239 838 if(qNorm)
mas01cr@239 839 delete[] qNorm;
mas01cr@239 840 if(sNorm)
mas01cr@239 841 delete[] sNorm;
mas01cr@239 842 if(qPower)
mas01cr@239 843 delete[] qPower;
mas01cr@239 844 if(sPower)
mas01cr@239 845 delete[] sPower;
mas01cr@239 846 if(D)
mas01cr@239 847 delete[] D;
mas01cr@239 848 if(DD)
mas01cr@239 849 delete[] DD;
mas01cr@239 850 if(meanDBdur)
mas01cr@239 851 delete[] meanDBdur;
mas01cr@239 852 }