annotate query.cpp @ 216:cd3dced4f534 refactoring

Comment fixes.
author mas01cr
date Tue, 04 Dec 2007 10:23:28 +0000
parents 241bc55a1a4e
children 685eb707b660
rev   line source
mas01cr@204 1 #include "audioDB.h"
mas01cr@204 2
mas01cr@204 3 bool audioDB::powers_acceptable(double p1, double p2) {
mas01cr@204 4 if (use_absolute_threshold) {
mas01cr@204 5 if ((p1 < absolute_threshold) || (p2 < absolute_threshold)) {
mas01cr@204 6 return false;
mas01cr@204 7 }
mas01cr@204 8 }
mas01cr@204 9 if (use_relative_threshold) {
mas01cr@204 10 if (fabs(p1-p2) > fabs(relative_threshold)) {
mas01cr@204 11 return false;
mas01cr@204 12 }
mas01cr@204 13 }
mas01cr@204 14 return true;
mas01cr@204 15 }
mas01cr@204 16
mas01cr@206 17 void audioDB::query(const char* dbName, const char* inFile, adb__queryResponse *adbQueryResponse) {
mas01cr@206 18 switch(queryType) {
mas01cr@204 19 case O2_SEQUENCE_QUERY:
mas01cr@204 20 if(radius==0)
mas01cr@204 21 trackSequenceQueryNN(dbName, inFile, adbQueryResponse);
mas01cr@204 22 else
mas01cr@204 23 trackSequenceQueryRad(dbName, inFile, adbQueryResponse);
mas01cr@204 24 break;
mas01cr@204 25 default:
mas01cr@204 26 error("unrecognized queryType in query()");
mas01cr@204 27 }
mas01cr@204 28 }
mas01cr@204 29
mas01cr@206 30 // return ordinal position of key in keyTable
mas01cr@204 31 unsigned audioDB::getKeyPos(char* key){
mas01cr@204 32 for(unsigned k=0; k<dbH->numFiles; k++)
mas01cr@204 33 if(strncmp(fileTable + k*O2_FILETABLESIZE, key, strlen(key))==0)
mas01cr@204 34 return k;
mas01cr@204 35 error("Key not found",key);
mas01cr@204 36 return O2_ERR_KEYNOTFOUND;
mas01cr@204 37 }
mas01cr@204 38
mas01cr@204 39 // This is a common pattern in sequence queries: what we are doing is
mas01cr@204 40 // taking a window of length seqlen over a buffer of length length,
mas01cr@204 41 // and placing the sum of the elements in that window in the first
mas01cr@204 42 // element of the window: thus replacing all but the last seqlen
mas01cr@216 43 // elements in the buffer with the corresponding windowed sum.
mas01cr@204 44 void audioDB::sequence_sum(double *buffer, int length, int seqlen) {
mas01cr@204 45 double tmp1, tmp2, *ps;
mas01cr@204 46 int j, w;
mas01cr@204 47
mas01cr@204 48 tmp1 = *buffer;
mas01cr@204 49 j = 1;
mas01cr@204 50 w = seqlen - 1;
mas01cr@204 51 while(w--) {
mas01cr@204 52 *buffer += buffer[j++];
mas01cr@204 53 }
mas01cr@204 54 ps = buffer + 1;
mas01cr@204 55 w = length - seqlen; // +1 - 1
mas01cr@204 56 while(w--) {
mas01cr@204 57 tmp2 = *ps;
mas01cr@204 58 *ps = *(ps - 1) - tmp1 + *(ps + seqlen - 1);
mas01cr@204 59 tmp1 = tmp2;
mas01cr@204 60 ps++;
mas01cr@204 61 }
mas01cr@204 62 }
mas01cr@204 63
mas01cr@216 64 // In contrast to sequence_sum() above, sequence_sqrt() and
mas01cr@216 65 // sequence_average() below are simple mappers across the sequence.
mas01cr@204 66 void audioDB::sequence_sqrt(double *buffer, int length, int seqlen) {
mas01cr@204 67 int w = length - seqlen + 1;
mas01cr@204 68 while(w--) {
mas01cr@204 69 *buffer = sqrt(*buffer);
mas01cr@204 70 buffer++;
mas01cr@204 71 }
mas01cr@204 72 }
mas01cr@204 73
mas01cr@204 74 void audioDB::sequence_average(double *buffer, int length, int seqlen) {
mas01cr@204 75 int w = length - seqlen + 1;
mas01cr@204 76 while(w--) {
mas01cr@204 77 *buffer /= seqlen;
mas01cr@204 78 buffer++;
mas01cr@204 79 }
mas01cr@204 80 }
mas01cr@204 81
mas01cr@208 82 void audioDB::initialize_arrays(int track, unsigned int numVectors, double *query, double *data_buffer, double **D, double **DD) {
mas01cr@208 83 unsigned int j, k, l, w;
mas01cr@208 84 double *dp, *qp, *sp;
mas01cr@208 85
mas01cr@208 86 const unsigned HOP_SIZE = sequenceHop;
mas01cr@208 87 const unsigned wL = sequenceLength;
mas01cr@208 88
mas01cr@208 89 for(j = 0; j < numVectors; j++) {
mas01cr@208 90 // Sum products matrix
mas01cr@208 91 D[j] = new double[trackTable[track]];
mas01cr@208 92 assert(D[j]);
mas01cr@208 93 // Matched filter matrix
mas01cr@208 94 DD[j]=new double[trackTable[track]];
mas01cr@208 95 assert(DD[j]);
mas01cr@208 96 }
mas01cr@208 97
mas01cr@208 98 // Dot product
mas01cr@208 99 for(j = 0; j < numVectors; j++)
mas01cr@208 100 for(k = 0; k < trackTable[track]; k++){
mas01cr@208 101 qp = query + j * dbH->dim;
mas01cr@208 102 sp = data_buffer + k * dbH->dim;
mas01cr@208 103 DD[j][k] = 0.0; // Initialize matched filter array
mas01cr@208 104 dp = &D[j][k]; // point to correlation cell j,k
mas01cr@208 105 *dp = 0.0; // initialize correlation cell
mas01cr@208 106 l = dbH->dim; // size of vectors
mas01cr@208 107 while(l--)
mas01cr@208 108 *dp += *qp++ * *sp++;
mas01cr@208 109 }
mas01cr@208 110
mas01cr@208 111 // Matched Filter
mas01cr@208 112 // HOP SIZE == 1
mas01cr@208 113 double* spd;
mas01cr@208 114 if(HOP_SIZE == 1) { // HOP_SIZE = shingleHop
mas01cr@209 115 for(w = 0; w < wL; w++) {
mas01cr@208 116 for(j = 0; j < numVectors - w; j++) {
mas01cr@208 117 sp = DD[j];
mas01cr@208 118 spd = D[j+w] + w;
mas01cr@208 119 k = trackTable[track] - w;
mas01cr@208 120 while(k--)
mas01cr@208 121 *sp++ += *spd++;
mas01cr@208 122 }
mas01cr@209 123 }
mas01cr@208 124 } else { // HOP_SIZE != 1
mas01cr@209 125 for(w = 0; w < wL; w++) {
mas01cr@208 126 for(j = 0; j < numVectors - w; j += HOP_SIZE) {
mas01cr@208 127 sp = DD[j];
mas01cr@208 128 spd = D[j+w]+w;
mas01cr@208 129 for(k = 0; k < trackTable[track] - w; k += HOP_SIZE) {
mas01cr@208 130 *sp += *spd;
mas01cr@208 131 sp += HOP_SIZE;
mas01cr@208 132 spd += HOP_SIZE;
mas01cr@208 133 }
mas01cr@208 134 }
mas01cr@209 135 }
mas01cr@208 136 }
mas01cr@208 137 }
mas01cr@208 138
mas01cr@211 139 void audioDB::delete_arrays(int track, unsigned int numVectors, double **D, double **DD) {
mas01cr@211 140 if(D != NULL) {
mas01cr@211 141 for(unsigned int j = 0; j < numVectors; j++) {
mas01cr@211 142 delete[] D[j];
mas01cr@211 143 }
mas01cr@211 144 }
mas01cr@211 145 if(DD != NULL) {
mas01cr@211 146 for(unsigned int j = 0; j < numVectors; j++) {
mas01cr@211 147 delete[] DD[j];
mas01cr@211 148 }
mas01cr@211 149 }
mas01cr@211 150 }
mas01cr@211 151
mas01cr@209 152 void audioDB::read_data(int track, double **data_buffer_p, size_t *data_buffer_size_p) {
mas01cr@209 153 if (trackTable[track] * sizeof(double) * dbH->dim > *data_buffer_size_p) {
mas01cr@209 154 if(*data_buffer_p) {
mas01cr@209 155 free(*data_buffer_p);
mas01cr@209 156 }
mas01cr@209 157 {
mas01cr@209 158 *data_buffer_size_p = trackTable[track] * sizeof(double) * dbH->dim;
mas01cr@209 159 void *tmp = malloc(*data_buffer_size_p);
mas01cr@209 160 if (tmp == NULL) {
mas01cr@209 161 error("error allocating data buffer");
mas01cr@209 162 }
mas01cr@209 163 *data_buffer_p = (double *) tmp;
mas01cr@209 164 }
mas01cr@209 165 }
mas01cr@209 166
mas01cr@209 167 read(dbfid, *data_buffer_p, trackTable[track] * sizeof(double) * dbH->dim);
mas01cr@209 168 }
mas01cr@209 169
mas01cr@215 170 void audioDB::set_up_query(double **qp, double **qnp, double **qpp, unsigned *nvp) {
mas01cr@214 171 *nvp = (statbuf.st_size - sizeof(int)) / (dbH->dim * sizeof(double));
mas01cr@214 172
mas01cr@214 173 if(!(dbH->flags & O2_FLAG_L2NORM)) {
mas01cr@214 174 error("Database must be L2 normed for sequence query","use -L2NORM");
mas01cr@214 175 }
mas01cr@214 176
mas01cr@214 177 if(*nvp < sequenceLength) {
mas01cr@214 178 error("Query shorter than requested sequence length", "maybe use -l");
mas01cr@214 179 }
mas01cr@214 180
mas01cr@214 181 if(verbosity>1) {
mas01cr@214 182 std::cerr << "performing norms ... "; std::cerr.flush();
mas01cr@214 183 }
mas01cr@214 184
mas01cr@214 185 *qp = new double[*nvp * dbH->dim];
mas01cr@214 186 memcpy(*qp, indata+sizeof(int), *nvp * dbH->dim * sizeof(double));
mas01cr@214 187 *qnp = new double[*nvp];
mas01cr@214 188 unitNorm(*qp, dbH->dim, *nvp, *qnp);
mas01cr@215 189
mas01cr@215 190 sequence_sum(*qnp, *nvp, sequenceLength);
mas01cr@215 191 sequence_sqrt(*qnp, *nvp, sequenceLength);
mas01cr@215 192
mas01cr@215 193 if (usingPower) {
mas01cr@215 194 *qpp = new double[*nvp];
mas01cr@215 195 if (lseek(powerfd, sizeof(int), SEEK_SET) == (off_t) -1) {
mas01cr@215 196 error("error seeking to data", powerFileName, "lseek");
mas01cr@215 197 }
mas01cr@215 198 int count = read(powerfd, *qpp, *nvp * sizeof(double));
mas01cr@215 199 if (count == -1) {
mas01cr@215 200 error("error reading data", powerFileName, "read");
mas01cr@215 201 }
mas01cr@215 202 if ((unsigned) count != *nvp * sizeof(double)) {
mas01cr@215 203 error("short read", powerFileName);
mas01cr@215 204 }
mas01cr@215 205
mas01cr@215 206 sequence_sum(*qpp, *nvp, sequenceLength);
mas01cr@215 207 sequence_average(*qpp, *nvp, sequenceLength);
mas01cr@215 208 }
mas01cr@214 209 }
mas01cr@214 210
mas01cr@204 211 void audioDB::trackSequenceQueryNN(const char* dbName, const char* inFile, adb__queryResponse *adbQueryResponse){
mas01cr@204 212
mas01cr@204 213 initTables(dbName, inFile);
mas01cr@204 214
mas01cr@214 215 unsigned int numVectors;
mas01cr@214 216 double *query, *query_data;
mas01cr@215 217 double *qNorm, *qnPtr, *qPower = 0, *qpPtr = 0;
mas01cr@204 218
mas01cr@215 219 set_up_query(&query, &qNorm, &qPower, &numVectors);
mas01cr@214 220 query_data = query;
mas01cr@215 221 qpPtr = qPower;
mas01cr@215 222 qnPtr = qNorm;
mas01cr@204 223
mas01cr@204 224 unsigned dbVectors = dbH->length/(sizeof(double)*dbH->dim);
mas01cr@204 225
mas01cr@215 226 double *sNorm = new double[dbVectors];
mas01cr@204 227
mas01cr@204 228 // Make norm measurements relative to sequenceLength
mas01cr@204 229 unsigned i,j;
mas01cr@204 230
mas01cr@204 231 // Copy the L2 norm values to core to avoid disk random access later on
mas01cr@204 232 memcpy(sNorm, l2normTable, dbVectors*sizeof(double));
mas01cr@204 233 double* snPtr = sNorm;
mas01cr@204 234
mas01cr@215 235 double *sPower = 0, *spPtr = 0;
mas01cr@204 236
mas01cr@204 237 if (usingPower) {
mas01cr@204 238 if (!(dbH->flags & O2_FLAG_POWER)) {
mas01cr@204 239 error("database not power-enabled", dbName);
mas01cr@204 240 }
mas01cr@204 241 sPower = new double[dbVectors];
mas01cr@204 242 spPtr = sPower;
mas01cr@204 243 memcpy(sPower, powerTable, dbVectors * sizeof(double));
mas01cr@204 244 }
mas01cr@204 245
mas01cr@204 246 for(i=0; i<dbH->numFiles; i++){
mas01cr@204 247 if(trackTable[i]>=sequenceLength) {
mas01cr@204 248 sequence_sum(snPtr, trackTable[i], sequenceLength);
mas01cr@204 249 sequence_sqrt(snPtr, trackTable[i], sequenceLength);
mas01cr@204 250
mas01cr@204 251 if (usingPower) {
mas01cr@204 252 sequence_sum(spPtr, trackTable[i], sequenceLength);
mas01cr@204 253 sequence_average(spPtr, trackTable[i], sequenceLength);
mas01cr@204 254 }
mas01cr@204 255 }
mas01cr@204 256 snPtr += trackTable[i];
mas01cr@204 257 if (usingPower) {
mas01cr@204 258 spPtr += trackTable[i];
mas01cr@204 259 }
mas01cr@204 260 }
mas01cr@204 261
mas01cr@204 262 if(verbosity>1) {
mas01cr@204 263 std::cerr << "done." << std::endl;
mas01cr@204 264 }
mas01cr@204 265
mas01cr@204 266 if(verbosity>1) {
mas01cr@204 267 std::cerr << "matching tracks..." << std::endl;
mas01cr@204 268 }
mas01cr@204 269
mas01cr@204 270 assert(pointNN>0 && pointNN<=O2_MAXNN);
mas01cr@204 271 assert(trackNN>0 && trackNN<=O2_MAXNN);
mas01cr@204 272
mas01cr@204 273 // Make temporary dynamic memory for results
mas01cr@204 274 double trackDistances[trackNN];
mas01cr@204 275 unsigned trackIDs[trackNN];
mas01cr@204 276 unsigned trackQIndexes[trackNN];
mas01cr@204 277 unsigned trackSIndexes[trackNN];
mas01cr@204 278
mas01cr@204 279 double distances[pointNN];
mas01cr@204 280 unsigned qIndexes[pointNN];
mas01cr@204 281 unsigned sIndexes[pointNN];
mas01cr@204 282
mas01cr@204 283
mas01cr@204 284 unsigned k,l,m,n,track,trackOffset=0, HOP_SIZE=sequenceHop, wL=sequenceLength;
mas01cr@204 285 double thisDist;
mas01cr@204 286
mas01cr@204 287 for(k=0; k<pointNN; k++){
mas01cr@204 288 distances[k]=1.0e6;
mas01cr@204 289 qIndexes[k]=~0;
mas01cr@204 290 sIndexes[k]=~0;
mas01cr@204 291 }
mas01cr@204 292
mas01cr@204 293 for(k=0; k<trackNN; k++){
mas01cr@204 294 trackDistances[k]=1.0e6;
mas01cr@204 295 trackQIndexes[k]=~0;
mas01cr@204 296 trackSIndexes[k]=~0;
mas01cr@204 297 trackIDs[k]=~0;
mas01cr@204 298 }
mas01cr@204 299
mas01cr@204 300 // Timestamp and durations processing
mas01cr@204 301 double meanQdur = 0;
mas01cr@204 302 double *timesdata = 0;
mas01cr@204 303 double *querydurs = 0;
mas01cr@204 304 double *meanDBdur = 0;
mas01cr@204 305
mas01cr@204 306 if(usingTimes && !(dbH->flags & O2_FLAG_TIMES)){
mas01cr@204 307 std::cerr << "warning: ignoring query timestamps for non-timestamped database" << std::endl;
mas01cr@204 308 usingTimes=0;
mas01cr@204 309 }
mas01cr@204 310
mas01cr@204 311 else if(!usingTimes && (dbH->flags & O2_FLAG_TIMES))
mas01cr@204 312 std::cerr << "warning: no timestamps given for query. Ignoring database timestamps." << std::endl;
mas01cr@204 313
mas01cr@204 314 else if(usingTimes && (dbH->flags & O2_FLAG_TIMES)){
mas01cr@204 315 timesdata = new double[2*numVectors];
mas01cr@204 316 querydurs = new double[numVectors];
mas01cr@204 317
mas01cr@204 318 insertTimeStamps(numVectors, timesFile, timesdata);
mas01cr@204 319 // Calculate durations of points
mas01cr@204 320 for(k=0; k<numVectors-1; k++) {
mas01cr@204 321 querydurs[k] = timesdata[2*k+1] - timesdata[2*k];
mas01cr@204 322 meanQdur += querydurs[k];
mas01cr@204 323 }
mas01cr@204 324 meanQdur/=k;
mas01cr@204 325 if(verbosity>1) {
mas01cr@204 326 std::cerr << "mean query file duration: " << meanQdur << std::endl;
mas01cr@204 327 }
mas01cr@204 328 meanDBdur = new double[dbH->numFiles];
mas01cr@204 329 assert(meanDBdur);
mas01cr@204 330 for(k=0; k<dbH->numFiles; k++){
mas01cr@204 331 meanDBdur[k]=0.0;
mas01cr@204 332 for(j=0; j<trackTable[k]-1 ; j++) {
mas01cr@204 333 meanDBdur[k]+=timesTable[2*j+1]-timesTable[2*j];
mas01cr@204 334 }
mas01cr@204 335 meanDBdur[k]/=j;
mas01cr@204 336 }
mas01cr@204 337 }
mas01cr@204 338
mas01cr@204 339 if(usingQueryPoint)
mas01cr@204 340 if(queryPoint>numVectors || queryPoint>numVectors-wL+1)
mas01cr@204 341 error("queryPoint > numVectors-wL+1 in query");
mas01cr@204 342 else{
mas01cr@204 343 if(verbosity>1) {
mas01cr@204 344 std::cerr << "query point: " << queryPoint << std::endl; std::cerr.flush();
mas01cr@204 345 }
mas01cr@204 346 query = query + queryPoint * dbH->dim;
mas01cr@204 347 qnPtr = qnPtr + queryPoint;
mas01cr@204 348 if (usingPower) {
mas01cr@204 349 qpPtr = qpPtr + queryPoint;
mas01cr@204 350 }
mas01cr@204 351 numVectors=wL;
mas01cr@204 352 }
mas01cr@204 353
mas01cr@204 354 double ** D = 0; // Differences query and target
mas01cr@204 355 double ** DD = 0; // Matched filter distance
mas01cr@204 356
mas01cr@204 357 D = new double*[numVectors];
mas01cr@204 358 assert(D);
mas01cr@204 359 DD = new double*[numVectors];
mas01cr@204 360 assert(DD);
mas01cr@204 361
mas01cr@204 362 gettimeofday(&tv1, NULL);
mas01cr@204 363 unsigned processedTracks = 0;
mas01cr@204 364 unsigned successfulTracks=0;
mas01cr@204 365
mas01cr@204 366 // build track offset table
mas01cr@204 367 off_t *trackOffsetTable = new off_t[dbH->numFiles];
mas01cr@204 368 unsigned cumTrack=0;
mas01cr@204 369 off_t trackIndexOffset;
mas01cr@204 370 for(k=0; k<dbH->numFiles;k++){
mas01cr@204 371 trackOffsetTable[k]=cumTrack;
mas01cr@204 372 cumTrack+=trackTable[k]*dbH->dim;
mas01cr@204 373 }
mas01cr@204 374
mas01cr@204 375 char nextKey [MAXSTR];
mas01cr@204 376
mas01cr@204 377 // chi^2 statistics
mas01cr@204 378 double sampleCount = 0;
mas01cr@204 379 double sampleSum = 0;
mas01cr@204 380 double logSampleSum = 0;
mas01cr@204 381 double minSample = 1e9;
mas01cr@204 382 double maxSample = 0;
mas01cr@204 383
mas01cr@204 384 // Track loop
mas01cr@204 385 size_t data_buffer_size = 0;
mas01cr@204 386 double *data_buffer = 0;
mas01cr@204 387 lseek(dbfid, dbH->dataOffset, SEEK_SET);
mas01cr@204 388
mas01cr@204 389 for(processedTracks=0, track=0 ; processedTracks < dbH->numFiles ; track++, processedTracks++) {
mas01cr@204 390
mas01cr@204 391 trackOffset = trackOffsetTable[track]; // numDoubles offset
mas01cr@204 392
mas01cr@204 393 // get trackID from file if using a control file
mas01cr@204 394 if(trackFile) {
mas01cr@204 395 trackFile->getline(nextKey,MAXSTR);
mas01cr@204 396 if(!trackFile->eof()) {
mas01cr@204 397 track = getKeyPos(nextKey);
mas01cr@204 398 trackOffset = trackOffsetTable[track];
mas01cr@204 399 lseek(dbfid, dbH->dataOffset + trackOffset * sizeof(double), SEEK_SET);
mas01cr@204 400 } else {
mas01cr@204 401 break;
mas01cr@204 402 }
mas01cr@204 403 }
mas01cr@204 404
mas01cr@204 405 trackIndexOffset=trackOffset/dbH->dim; // numVectors offset
mas01cr@204 406
mas01cr@204 407 if(sequenceLength<=trackTable[track]){ // test for short sequences
mas01cr@204 408
mas01cr@204 409 if(verbosity>7) {
mas01cr@204 410 std::cerr << track << "." << trackIndexOffset << "." << trackTable[track] << " | ";std::cerr.flush();
mas01cr@204 411 }
mas01cr@209 412
mas01cr@209 413 read_data(track, &data_buffer, &data_buffer_size);
mas01cr@208 414 initialize_arrays(track, numVectors, query, data_buffer, D, DD);
mas01cr@207 415
mas01cr@204 416 if(verbosity>3 && usingTimes) {
mas01cr@204 417 std::cerr << "meanQdur=" << meanQdur << " meanDBdur=" << meanDBdur[track] << std::endl;
mas01cr@204 418 std::cerr.flush();
mas01cr@204 419 }
mas01cr@204 420
mas01cr@204 421 if(!usingTimes ||
mas01cr@204 422 (usingTimes
mas01cr@204 423 && fabs(meanDBdur[track]-meanQdur)<meanQdur*timesTol)){
mas01cr@204 424
mas01cr@204 425 if(verbosity>3 && usingTimes) {
mas01cr@204 426 std::cerr << "within duration tolerance." << std::endl;
mas01cr@204 427 std::cerr.flush();
mas01cr@204 428 }
mas01cr@204 429
mas01cr@204 430 // Search for minimum distance by shingles (concatenated vectors)
mas01cr@204 431 for(j=0;j<=numVectors-wL;j+=HOP_SIZE)
mas01cr@204 432 for(k=0;k<=trackTable[track]-wL;k+=HOP_SIZE){
mas01cr@204 433 thisDist=2-(2/(qnPtr[j]*sNorm[trackIndexOffset+k]))*DD[j][k];
mas01cr@204 434 if(verbosity>9) {
mas01cr@204 435 std::cerr << thisDist << " " << qnPtr[j] << " " << sNorm[trackIndexOffset+k] << std::endl;
mas01cr@204 436 }
mas01cr@204 437 // Gather chi^2 statistics
mas01cr@204 438 if(thisDist<minSample)
mas01cr@204 439 minSample=thisDist;
mas01cr@204 440 else if(thisDist>maxSample)
mas01cr@204 441 maxSample=thisDist;
mas01cr@204 442 if(thisDist>1e-9){
mas01cr@204 443 sampleCount++;
mas01cr@204 444 sampleSum+=thisDist;
mas01cr@204 445 logSampleSum+=log(thisDist);
mas01cr@204 446 }
mas01cr@204 447
mas01cr@204 448 // diffL2 = fabs(qnPtr[j] - sNorm[trackIndexOffset+k]);
mas01cr@204 449 // Power test
mas01cr@204 450 if (usingPower) {
mas01cr@204 451 if (!(powers_acceptable(qpPtr[j], sPower[trackIndexOffset + k]))) {
mas01cr@204 452 thisDist = 1000000.0;
mas01cr@204 453 }
mas01cr@204 454 }
mas01cr@204 455
mas01cr@204 456 // k-NN match algorithm
mas01cr@204 457 m=pointNN;
mas01cr@204 458 while(m--){
mas01cr@204 459 if(thisDist<=distances[m])
mas01cr@204 460 if(m==0 || thisDist>=distances[m-1]){
mas01cr@204 461 // Shuffle distances up the list
mas01cr@204 462 for(l=pointNN-1; l>m; l--){
mas01cr@204 463 distances[l]=distances[l-1];
mas01cr@204 464 qIndexes[l]=qIndexes[l-1];
mas01cr@204 465 sIndexes[l]=sIndexes[l-1];
mas01cr@204 466 }
mas01cr@204 467 distances[m]=thisDist;
mas01cr@204 468 if(usingQueryPoint)
mas01cr@204 469 qIndexes[m]=queryPoint;
mas01cr@204 470 else
mas01cr@204 471 qIndexes[m]=j;
mas01cr@204 472 sIndexes[m]=k;
mas01cr@204 473 break;
mas01cr@204 474 }
mas01cr@204 475 }
mas01cr@204 476 }
mas01cr@204 477 // Calculate the mean of the N-Best matches
mas01cr@204 478 thisDist=0.0;
mas01cr@204 479 for(m=0; m<pointNN; m++) {
mas01cr@204 480 if (distances[m] == 1000000.0) break;
mas01cr@204 481 thisDist+=distances[m];
mas01cr@204 482 }
mas01cr@204 483 thisDist/=m;
mas01cr@204 484
mas01cr@204 485 // Let's see the distances then...
mas01cr@204 486 if(verbosity>3) {
mas01cr@204 487 std::cerr << fileTable+track*O2_FILETABLESIZE << " " << thisDist << std::endl;
mas01cr@204 488 }
mas01cr@204 489
mas01cr@204 490
mas01cr@204 491 // All the track stuff goes here
mas01cr@204 492 n=trackNN;
mas01cr@204 493 while(n--){
mas01cr@204 494 if(thisDist<=trackDistances[n]){
mas01cr@204 495 if((n==0 || thisDist>=trackDistances[n-1])){
mas01cr@204 496 // Copy all values above up the queue
mas01cr@204 497 for( l=trackNN-1 ; l > n ; l--){
mas01cr@204 498 trackDistances[l]=trackDistances[l-1];
mas01cr@204 499 trackQIndexes[l]=trackQIndexes[l-1];
mas01cr@204 500 trackSIndexes[l]=trackSIndexes[l-1];
mas01cr@204 501 trackIDs[l]=trackIDs[l-1];
mas01cr@204 502 }
mas01cr@204 503 trackDistances[n]=thisDist;
mas01cr@204 504 trackQIndexes[n]=qIndexes[0];
mas01cr@204 505 trackSIndexes[n]=sIndexes[0];
mas01cr@204 506 successfulTracks++;
mas01cr@204 507 trackIDs[n]=track;
mas01cr@204 508 break;
mas01cr@204 509 }
mas01cr@204 510 }
mas01cr@204 511 else
mas01cr@204 512 break;
mas01cr@204 513 }
mas01cr@211 514 } // Duration match
mas01cr@211 515 delete_arrays(track, numVectors, D, DD);
mas01cr@204 516 }
mas01cr@204 517 // per-track reset array values
mas01cr@204 518 for(unsigned k=0; k<pointNN; k++){
mas01cr@204 519 distances[k]=1.0e6;
mas01cr@204 520 qIndexes[k]=~0;
mas01cr@204 521 sIndexes[k]=~0;
mas01cr@204 522 }
mas01cr@204 523 }
mas01cr@204 524
mas01cr@204 525 free(data_buffer);
mas01cr@204 526
mas01cr@204 527 gettimeofday(&tv2,NULL);
mas01cr@204 528 if(verbosity>1) {
mas01cr@204 529 std::cerr << std::endl << "processed tracks :" << processedTracks << " matched tracks: " << successfulTracks << " elapsed time:"
mas01cr@204 530 << ( tv2.tv_sec*1000 + tv2.tv_usec/1000 ) - ( tv1.tv_sec*1000+tv1.tv_usec/1000 ) << " msec" << std::endl;
mas01cr@204 531 std::cerr << "sampleCount: " << sampleCount << " sampleSum: " << sampleSum << " logSampleSum: " << logSampleSum
mas01cr@204 532 << " minSample: " << minSample << " maxSample: " << maxSample << std::endl;
mas01cr@204 533 }
mas01cr@204 534 if(adbQueryResponse==0){
mas01cr@204 535 if(verbosity>1) {
mas01cr@204 536 std::cerr<<std::endl;
mas01cr@204 537 }
mas01cr@204 538 // Output answer
mas01cr@204 539 // Loop over nearest neighbours
mas01cr@204 540 for(k=0; k < std::min(trackNN,successfulTracks); k++)
mas01cr@204 541 std::cout << fileTable+trackIDs[k]*O2_FILETABLESIZE << " " << trackDistances[k] << " "
mas01cr@204 542 << trackQIndexes[k] << " " << trackSIndexes[k] << std::endl;
mas01cr@204 543 }
mas01cr@204 544 else{ // Process Web Services Query
mas01cr@204 545 int listLen = std::min(trackNN, processedTracks);
mas01cr@204 546 adbQueryResponse->result.__sizeRlist=listLen;
mas01cr@204 547 adbQueryResponse->result.__sizeDist=listLen;
mas01cr@204 548 adbQueryResponse->result.__sizeQpos=listLen;
mas01cr@204 549 adbQueryResponse->result.__sizeSpos=listLen;
mas01cr@204 550 adbQueryResponse->result.Rlist= new char*[listLen];
mas01cr@204 551 adbQueryResponse->result.Dist = new double[listLen];
mas01cr@204 552 adbQueryResponse->result.Qpos = new unsigned int[listLen];
mas01cr@204 553 adbQueryResponse->result.Spos = new unsigned int[listLen];
mas01cr@204 554 for(k=0; k<(unsigned)adbQueryResponse->result.__sizeRlist; k++){
mas01cr@204 555 adbQueryResponse->result.Rlist[k]=new char[O2_MAXFILESTR];
mas01cr@204 556 adbQueryResponse->result.Dist[k]=trackDistances[k];
mas01cr@204 557 adbQueryResponse->result.Qpos[k]=trackQIndexes[k];
mas01cr@204 558 adbQueryResponse->result.Spos[k]=trackSIndexes[k];
mas01cr@204 559 sprintf(adbQueryResponse->result.Rlist[k], "%s", fileTable+trackIDs[k]*O2_FILETABLESIZE);
mas01cr@204 560 }
mas01cr@204 561 }
mas01cr@204 562
mas01cr@204 563 // Clean up
mas01cr@204 564 if(trackOffsetTable)
mas01cr@204 565 delete[] trackOffsetTable;
mas01cr@214 566 if(query_data)
mas01cr@214 567 delete[] query_data;
mas01cr@204 568 if(qNorm)
mas01cr@204 569 delete[] qNorm;
mas01cr@204 570 if(sNorm)
mas01cr@204 571 delete[] sNorm;
mas01cr@204 572 if(qPower)
mas01cr@204 573 delete[] qPower;
mas01cr@204 574 if(sPower)
mas01cr@204 575 delete[] sPower;
mas01cr@204 576 if(D)
mas01cr@204 577 delete[] D;
mas01cr@204 578 if(DD)
mas01cr@204 579 delete[] DD;
mas01cr@204 580 if(timesdata)
mas01cr@204 581 delete[] timesdata;
mas01cr@204 582 if(querydurs)
mas01cr@204 583 delete[] querydurs;
mas01cr@204 584 if(meanDBdur)
mas01cr@204 585 delete[] meanDBdur;
mas01cr@204 586 }
mas01cr@204 587
mas01cr@204 588 void audioDB::trackSequenceQueryRad(const char* dbName, const char* inFile, adb__queryResponse *adbQueryResponse){
mas01cr@204 589
mas01cr@204 590 initTables(dbName, inFile);
mas01cr@204 591
mas01cr@214 592 unsigned int numVectors;
mas01cr@214 593 double *query, *query_data;
mas01cr@215 594 double *qNorm, *qnPtr, *qPower = 0, *qpPtr = 0;
mas01cr@204 595
mas01cr@215 596 set_up_query(&query, &qNorm, &qPower, &numVectors);
mas01cr@214 597 query_data = query;
mas01cr@215 598 qpPtr = qPower;
mas01cr@215 599 qnPtr = qNorm;
mas01cr@214 600
mas01cr@204 601 unsigned dbVectors = dbH->length/(sizeof(double)*dbH->dim);
mas01cr@204 602
mas01cr@215 603 double *sNorm = new double[dbVectors];
mas01cr@204 604
mas01cr@204 605 // Make norm measurements relative to sequenceLength
mas01cr@204 606 unsigned i,j;
mas01cr@204 607
mas01cr@204 608 // Copy the L2 norm values to core to avoid disk random access later on
mas01cr@204 609 memcpy(sNorm, l2normTable, dbVectors*sizeof(double));
mas01cr@204 610 double* snPtr = sNorm;
mas01cr@204 611
mas01cr@215 612 double *sPower = 0, *spPtr = 0;
mas01cr@204 613
mas01cr@204 614 if (usingPower) {
mas01cr@204 615 if(!(dbH->flags & O2_FLAG_POWER)) {
mas01cr@204 616 error("database not power-enabled", dbName);
mas01cr@204 617 }
mas01cr@204 618 sPower = new double[dbVectors];
mas01cr@204 619 spPtr = sPower;
mas01cr@204 620 memcpy(sPower, powerTable, dbVectors * sizeof(double));
mas01cr@204 621 }
mas01cr@204 622
mas01cr@204 623 for(i=0; i<dbH->numFiles; i++){
mas01cr@204 624 if(trackTable[i]>=sequenceLength) {
mas01cr@204 625 sequence_sum(snPtr, trackTable[i], sequenceLength);
mas01cr@204 626 sequence_sqrt(snPtr, trackTable[i], sequenceLength);
mas01cr@204 627 if (usingPower) {
mas01cr@204 628 sequence_sum(spPtr, trackTable[i], sequenceLength);
mas01cr@204 629 sequence_average(spPtr, trackTable[i], sequenceLength);
mas01cr@204 630 }
mas01cr@204 631 }
mas01cr@204 632 snPtr += trackTable[i];
mas01cr@204 633 if (usingPower) {
mas01cr@204 634 spPtr += trackTable[i];
mas01cr@204 635 }
mas01cr@204 636 }
mas01cr@204 637
mas01cr@204 638 if(verbosity>1) {
mas01cr@204 639 std::cerr << "done." << std::endl;
mas01cr@204 640 }
mas01cr@204 641
mas01cr@204 642 if(verbosity>1) {
mas01cr@204 643 std::cerr << "matching tracks..." << std::endl;
mas01cr@204 644 }
mas01cr@204 645
mas01cr@204 646 assert(pointNN>0 && pointNN<=O2_MAXNN);
mas01cr@204 647 assert(trackNN>0 && trackNN<=O2_MAXNN);
mas01cr@204 648
mas01cr@204 649 // Make temporary dynamic memory for results
mas01cr@204 650 double trackDistances[trackNN];
mas01cr@204 651 unsigned trackIDs[trackNN];
mas01cr@204 652 unsigned trackQIndexes[trackNN];
mas01cr@204 653 unsigned trackSIndexes[trackNN];
mas01cr@204 654
mas01cr@204 655 double distances[pointNN];
mas01cr@204 656 unsigned qIndexes[pointNN];
mas01cr@204 657 unsigned sIndexes[pointNN];
mas01cr@204 658
mas01cr@204 659
mas01cr@208 660 unsigned k,l,n,track,trackOffset=0;
mas01cr@208 661 unsigned const HOP_SIZE=sequenceHop;
mas01cr@208 662 unsigned const wL=sequenceLength;
mas01cr@204 663 double thisDist;
mas01cr@204 664
mas01cr@204 665 for(k=0; k<pointNN; k++){
mas01cr@204 666 distances[k]=0.0;
mas01cr@204 667 qIndexes[k]=~0;
mas01cr@204 668 sIndexes[k]=~0;
mas01cr@204 669 }
mas01cr@204 670
mas01cr@204 671 for(k=0; k<trackNN; k++){
mas01cr@204 672 trackDistances[k]=0.0;
mas01cr@204 673 trackQIndexes[k]=~0;
mas01cr@204 674 trackSIndexes[k]=~0;
mas01cr@204 675 trackIDs[k]=~0;
mas01cr@204 676 }
mas01cr@204 677
mas01cr@204 678 // Timestamp and durations processing
mas01cr@204 679 double meanQdur = 0;
mas01cr@204 680 double *timesdata = 0;
mas01cr@204 681 double *querydurs = 0;
mas01cr@204 682 double *meanDBdur = 0;
mas01cr@204 683
mas01cr@204 684 if(usingTimes && !(dbH->flags & O2_FLAG_TIMES)){
mas01cr@204 685 std::cerr << "warning: ignoring query timestamps for non-timestamped database" << std::endl;
mas01cr@204 686 usingTimes=0;
mas01cr@204 687 }
mas01cr@204 688
mas01cr@204 689 else if(!usingTimes && (dbH->flags & O2_FLAG_TIMES))
mas01cr@204 690 std::cerr << "warning: no timestamps given for query. Ignoring database timestamps." << std::endl;
mas01cr@204 691
mas01cr@204 692 else if(usingTimes && (dbH->flags & O2_FLAG_TIMES)){
mas01cr@204 693 timesdata = new double[2*numVectors];
mas01cr@204 694 querydurs = new double[numVectors];
mas01cr@204 695
mas01cr@204 696 insertTimeStamps(numVectors, timesFile, timesdata);
mas01cr@204 697 // Calculate durations of points
mas01cr@204 698 for(k=0; k<numVectors-1; k++){
mas01cr@204 699 querydurs[k] = timesdata[2*k+1] - timesdata[2*k];
mas01cr@204 700 meanQdur += querydurs[k];
mas01cr@204 701 }
mas01cr@204 702 meanQdur/=k;
mas01cr@204 703 if(verbosity>1) {
mas01cr@204 704 std::cerr << "mean query file duration: " << meanQdur << std::endl;
mas01cr@204 705 }
mas01cr@204 706 meanDBdur = new double[dbH->numFiles];
mas01cr@204 707 assert(meanDBdur);
mas01cr@204 708 for(k=0; k<dbH->numFiles; k++){
mas01cr@204 709 meanDBdur[k]=0.0;
mas01cr@204 710 for(j=0; j<trackTable[k]-1 ; j++) {
mas01cr@204 711 meanDBdur[k]+=timesTable[2*j+1]-timesTable[2*j];
mas01cr@204 712 }
mas01cr@204 713 meanDBdur[k]/=j;
mas01cr@204 714 }
mas01cr@204 715 }
mas01cr@204 716
mas01cr@204 717 if(usingQueryPoint)
mas01cr@204 718 if(queryPoint>numVectors || queryPoint>numVectors-wL+1)
mas01cr@204 719 error("queryPoint > numVectors-wL+1 in query");
mas01cr@204 720 else{
mas01cr@204 721 if(verbosity>1) {
mas01cr@204 722 std::cerr << "query point: " << queryPoint << std::endl; std::cerr.flush();
mas01cr@204 723 }
mas01cr@204 724 query = query + queryPoint*dbH->dim;
mas01cr@204 725 qnPtr = qnPtr + queryPoint;
mas01cr@204 726 if (usingPower) {
mas01cr@204 727 qpPtr = qpPtr + queryPoint;
mas01cr@204 728 }
mas01cr@204 729 numVectors=wL;
mas01cr@204 730 }
mas01cr@204 731
mas01cr@204 732 double ** D = 0; // Differences query and target
mas01cr@204 733 double ** DD = 0; // Matched filter distance
mas01cr@204 734
mas01cr@204 735 D = new double*[numVectors];
mas01cr@204 736 assert(D);
mas01cr@204 737 DD = new double*[numVectors];
mas01cr@204 738 assert(DD);
mas01cr@204 739
mas01cr@204 740 gettimeofday(&tv1, NULL);
mas01cr@204 741 unsigned processedTracks = 0;
mas01cr@204 742 unsigned successfulTracks=0;
mas01cr@204 743
mas01cr@204 744 // build track offset table
mas01cr@204 745 off_t *trackOffsetTable = new off_t[dbH->numFiles];
mas01cr@204 746 unsigned cumTrack=0;
mas01cr@204 747 off_t trackIndexOffset;
mas01cr@204 748 for(k=0; k<dbH->numFiles;k++){
mas01cr@204 749 trackOffsetTable[k]=cumTrack;
mas01cr@204 750 cumTrack+=trackTable[k]*dbH->dim;
mas01cr@204 751 }
mas01cr@204 752
mas01cr@204 753 char nextKey [MAXSTR];
mas01cr@204 754
mas01cr@204 755 // chi^2 statistics
mas01cr@204 756 double sampleCount = 0;
mas01cr@204 757 double sampleSum = 0;
mas01cr@204 758 double logSampleSum = 0;
mas01cr@204 759 double minSample = 1e9;
mas01cr@204 760 double maxSample = 0;
mas01cr@204 761
mas01cr@204 762 // Track loop
mas01cr@204 763 size_t data_buffer_size = 0;
mas01cr@204 764 double *data_buffer = 0;
mas01cr@204 765 lseek(dbfid, dbH->dataOffset, SEEK_SET);
mas01cr@204 766
mas01cr@204 767 for(processedTracks=0, track=0 ; processedTracks < dbH->numFiles ; track++, processedTracks++){
mas01cr@204 768
mas01cr@204 769 trackOffset = trackOffsetTable[track]; // numDoubles offset
mas01cr@204 770
mas01cr@204 771 // get trackID from file if using a control file
mas01cr@204 772 if(trackFile) {
mas01cr@204 773 trackFile->getline(nextKey,MAXSTR);
mas01cr@204 774 if(!trackFile->eof()) {
mas01cr@204 775 track = getKeyPos(nextKey);
mas01cr@204 776 trackOffset = trackOffsetTable[track];
mas01cr@204 777 lseek(dbfid, dbH->dataOffset + trackOffset * sizeof(double), SEEK_SET);
mas01cr@204 778 } else {
mas01cr@204 779 break;
mas01cr@204 780 }
mas01cr@204 781 }
mas01cr@204 782
mas01cr@204 783 trackIndexOffset=trackOffset/dbH->dim; // numVectors offset
mas01cr@204 784
mas01cr@204 785 if(sequenceLength<=trackTable[track]){ // test for short sequences
mas01cr@204 786
mas01cr@204 787 if(verbosity>7) {
mas01cr@204 788 std::cerr << track << "." << trackIndexOffset << "." << trackTable[track] << " | ";std::cerr.flush();
mas01cr@204 789 }
mas01cr@204 790
mas01cr@209 791 read_data(track, &data_buffer, &data_buffer_size);
mas01cr@208 792 initialize_arrays(track, numVectors, query, data_buffer, D, DD);
mas01cr@207 793
mas01cr@204 794 if(verbosity>3 && usingTimes) {
mas01cr@204 795 std::cerr << "meanQdur=" << meanQdur << " meanDBdur=" << meanDBdur[track] << std::endl;
mas01cr@204 796 std::cerr.flush();
mas01cr@204 797 }
mas01cr@204 798
mas01cr@204 799 if(!usingTimes ||
mas01cr@204 800 (usingTimes
mas01cr@204 801 && fabs(meanDBdur[track]-meanQdur)<meanQdur*timesTol)){
mas01cr@204 802
mas01cr@204 803 if(verbosity>3 && usingTimes) {
mas01cr@204 804 std::cerr << "within duration tolerance." << std::endl;
mas01cr@204 805 std::cerr.flush();
mas01cr@204 806 }
mas01cr@204 807
mas01cr@204 808 // Search for minimum distance by shingles (concatenated vectors)
mas01cr@204 809 for(j=0;j<=numVectors-wL;j+=HOP_SIZE)
mas01cr@204 810 for(k=0;k<=trackTable[track]-wL;k+=HOP_SIZE){
mas01cr@204 811 thisDist=2-(2/(qnPtr[j]*sNorm[trackIndexOffset+k]))*DD[j][k];
mas01cr@204 812 if(verbosity>9) {
mas01cr@204 813 std::cerr << thisDist << " " << qnPtr[j] << " " << sNorm[trackIndexOffset+k] << std::endl;
mas01cr@204 814 }
mas01cr@204 815 // Gather chi^2 statistics
mas01cr@204 816 if(thisDist<minSample)
mas01cr@204 817 minSample=thisDist;
mas01cr@204 818 else if(thisDist>maxSample)
mas01cr@204 819 maxSample=thisDist;
mas01cr@204 820 if(thisDist>1e-9){
mas01cr@204 821 sampleCount++;
mas01cr@204 822 sampleSum+=thisDist;
mas01cr@204 823 logSampleSum+=log(thisDist);
mas01cr@204 824 }
mas01cr@204 825
mas01cr@204 826 // diffL2 = fabs(qnPtr[j] - sNorm[trackIndexOffset+k]);
mas01cr@204 827 // Power test
mas01cr@204 828 if (usingPower) {
mas01cr@204 829 if (!(powers_acceptable(qpPtr[j], sPower[trackIndexOffset + k]))) {
mas01cr@204 830 thisDist = 1000000.0;
mas01cr@204 831 }
mas01cr@204 832 }
mas01cr@204 833
mas01cr@204 834 if(thisDist>=0 && thisDist<=radius){
mas01cr@204 835 distances[0]++; // increment count
mas01cr@204 836 break; // only need one track point per query point
mas01cr@204 837 }
mas01cr@204 838 }
mas01cr@204 839 // How many points were below threshold ?
mas01cr@204 840 thisDist=distances[0];
mas01cr@204 841
mas01cr@204 842 // Let's see the distances then...
mas01cr@204 843 if(verbosity>3) {
mas01cr@204 844 std::cerr << fileTable+track*O2_FILETABLESIZE << " " << thisDist << std::endl;
mas01cr@204 845 }
mas01cr@204 846
mas01cr@204 847 // All the track stuff goes here
mas01cr@204 848 n=trackNN;
mas01cr@204 849 while(n--){
mas01cr@204 850 if(thisDist>trackDistances[n]){
mas01cr@204 851 if((n==0 || thisDist<=trackDistances[n-1])){
mas01cr@204 852 // Copy all values above up the queue
mas01cr@204 853 for( l=trackNN-1 ; l > n ; l--){
mas01cr@204 854 trackDistances[l]=trackDistances[l-1];
mas01cr@204 855 trackQIndexes[l]=trackQIndexes[l-1];
mas01cr@204 856 trackSIndexes[l]=trackSIndexes[l-1];
mas01cr@204 857 trackIDs[l]=trackIDs[l-1];
mas01cr@204 858 }
mas01cr@204 859 trackDistances[n]=thisDist;
mas01cr@204 860 trackQIndexes[n]=qIndexes[0];
mas01cr@204 861 trackSIndexes[n]=sIndexes[0];
mas01cr@204 862 successfulTracks++;
mas01cr@204 863 trackIDs[n]=track;
mas01cr@204 864 break;
mas01cr@204 865 }
mas01cr@204 866 }
mas01cr@204 867 else
mas01cr@204 868 break;
mas01cr@204 869 }
mas01cr@204 870 } // Duration match
mas01cr@211 871 delete_arrays(track, numVectors, D, DD);
mas01cr@204 872 }
mas01cr@204 873 // per-track reset array values
mas01cr@204 874 for(unsigned k=0; k<pointNN; k++){
mas01cr@204 875 distances[k]=0.0;
mas01cr@204 876 qIndexes[k]=~0;
mas01cr@204 877 sIndexes[k]=~0;
mas01cr@204 878 }
mas01cr@204 879 }
mas01cr@204 880
mas01cr@204 881 free(data_buffer);
mas01cr@204 882
mas01cr@204 883 gettimeofday(&tv2,NULL);
mas01cr@204 884 if(verbosity>1) {
mas01cr@204 885 std::cerr << std::endl << "processed tracks :" << processedTracks << " matched tracks: " << successfulTracks << " elapsed time:"
mas01cr@204 886 << ( tv2.tv_sec*1000 + tv2.tv_usec/1000 ) - ( tv1.tv_sec*1000+tv1.tv_usec/1000 ) << " msec" << std::endl;
mas01cr@204 887 std::cerr << "sampleCount: " << sampleCount << " sampleSum: " << sampleSum << " logSampleSum: " << logSampleSum
mas01cr@204 888 << " minSample: " << minSample << " maxSample: " << maxSample << std::endl;
mas01cr@204 889 }
mas01cr@204 890
mas01cr@204 891 if(adbQueryResponse==0){
mas01cr@204 892 if(verbosity>1) {
mas01cr@204 893 std::cerr<<std::endl;
mas01cr@204 894 }
mas01cr@204 895 // Output answer
mas01cr@204 896 // Loop over nearest neighbours
mas01cr@204 897 for(k=0; k < std::min(trackNN,successfulTracks); k++)
mas01cr@204 898 std::cout << fileTable+trackIDs[k]*O2_FILETABLESIZE << " " << trackDistances[k] << std::endl;
mas01cr@204 899 }
mas01cr@204 900 else{ // Process Web Services Query
mas01cr@204 901 int listLen = std::min(trackNN, processedTracks);
mas01cr@204 902 adbQueryResponse->result.__sizeRlist=listLen;
mas01cr@204 903 adbQueryResponse->result.__sizeDist=listLen;
mas01cr@204 904 adbQueryResponse->result.__sizeQpos=listLen;
mas01cr@204 905 adbQueryResponse->result.__sizeSpos=listLen;
mas01cr@204 906 adbQueryResponse->result.Rlist= new char*[listLen];
mas01cr@204 907 adbQueryResponse->result.Dist = new double[listLen];
mas01cr@204 908 adbQueryResponse->result.Qpos = new unsigned int[listLen];
mas01cr@204 909 adbQueryResponse->result.Spos = new unsigned int[listLen];
mas01cr@204 910 for(k=0; k<(unsigned)adbQueryResponse->result.__sizeRlist; k++){
mas01cr@204 911 adbQueryResponse->result.Rlist[k]=new char[O2_MAXFILESTR];
mas01cr@204 912 adbQueryResponse->result.Dist[k]=trackDistances[k];
mas01cr@204 913 adbQueryResponse->result.Qpos[k]=trackQIndexes[k];
mas01cr@204 914 adbQueryResponse->result.Spos[k]=trackSIndexes[k];
mas01cr@204 915 sprintf(adbQueryResponse->result.Rlist[k], "%s", fileTable+trackIDs[k]*O2_FILETABLESIZE);
mas01cr@204 916 }
mas01cr@204 917 }
mas01cr@204 918
mas01cr@204 919 // Clean up
mas01cr@204 920 if(trackOffsetTable)
mas01cr@204 921 delete[] trackOffsetTable;
mas01cr@214 922 if(query_data)
mas01cr@214 923 delete[] query_data;
mas01cr@204 924 if(qNorm)
mas01cr@204 925 delete[] qNorm;
mas01cr@204 926 if(sNorm)
mas01cr@204 927 delete[] sNorm;
mas01cr@204 928 if(qPower)
mas01cr@204 929 delete[] qPower;
mas01cr@204 930 if(sPower)
mas01cr@204 931 delete[] sPower;
mas01cr@204 932 if(D)
mas01cr@204 933 delete[] D;
mas01cr@204 934 if(DD)
mas01cr@204 935 delete[] DD;
mas01cr@204 936 if(timesdata)
mas01cr@204 937 delete[] timesdata;
mas01cr@204 938 if(querydurs)
mas01cr@204 939 delete[] querydurs;
mas01cr@204 940 if(meanDBdur)
mas01cr@204 941 delete[] meanDBdur;
mas01cr@204 942 }
mas01cr@204 943
mas01cr@204 944 // Unit norm block of features
mas01cr@204 945 void audioDB::unitNorm(double* X, unsigned dim, unsigned n, double* qNorm){
mas01cr@204 946 unsigned d;
mas01cr@204 947 double L2, *p;
mas01cr@204 948 if(verbosity>2) {
mas01cr@204 949 std::cerr << "norming " << n << " vectors...";std::cerr.flush();
mas01cr@204 950 }
mas01cr@212 951 while(n--) {
mas01cr@212 952 p = X;
mas01cr@212 953 L2 = 0.0;
mas01cr@212 954 d = dim;
mas01cr@212 955 while(d--) {
mas01cr@212 956 L2 += *p * *p;
mas01cr@204 957 p++;
mas01cr@204 958 }
mas01cr@212 959 if(qNorm) {
mas01cr@204 960 *qNorm++=L2;
mas01cr@212 961 }
mas01cr@212 962 X += dim;
mas01cr@204 963 }
mas01cr@204 964 if(verbosity>2) {
mas01cr@204 965 std::cerr << "done..." << std::endl;
mas01cr@204 966 }
mas01cr@204 967 }