annotate audioDB.cpp @ 280:3be15407e814

Merge sampling branch (-r361:405, though I hope that the branch is now finished) onto trunk. API developers take note. Things still to clear up: * whether the threshold distance it currently reports bears any relation to reality; * if not, how to bring it a bit more into alignment; * minor code cleanup issues in sample.cpp; * incorporating --absolute-threshold handling into sampling; * writing suitable test cases.
author mas01cr
date Wed, 02 Jul 2008 14:07:10 +0000
parents 210b2f661b88
children cacad987d785
rev   line source
mas01cr@0 1 #include "audioDB.h"
mas01cr@0 2
mas01cr@76 3 audioDB::audioDB(const unsigned argc, char* const argv[]): O2_AUDIODB_INITIALIZERS
mas01cr@76 4 {
mas01cr@0 5 if(processArgs(argc, argv)<0){
mas01cr@0 6 printf("No command found.\n");
mas01cr@0 7 cmdline_parser_print_version ();
mas01cr@0 8 if (strlen(gengetopt_args_info_purpose) > 0)
mas01cr@0 9 printf("%s\n", gengetopt_args_info_purpose);
mas01cr@0 10 printf("%s\n", gengetopt_args_info_usage);
mas01cr@0 11 printf("%s\n", gengetopt_args_info_help[1]);
mas01cr@0 12 printf("%s\n", gengetopt_args_info_help[2]);
mas01cr@0 13 printf("%s\n", gengetopt_args_info_help[0]);
mas01cr@151 14 error("No command found");
mas01cr@0 15 }
mas01cr@77 16
mas01cr@0 17 if(O2_ACTION(COM_SERVER))
mas01cr@0 18 startServer();
mas01cr@0 19
mas01cr@0 20 else if(O2_ACTION(COM_CREATE))
mas01cr@0 21 create(dbName);
mas01cr@0 22
mas01cr@0 23 else if(O2_ACTION(COM_INSERT))
mas01cr@0 24 insert(dbName, inFile);
mas01cr@0 25
mas01cr@0 26 else if(O2_ACTION(COM_BATCHINSERT))
mas01cr@0 27 batchinsert(dbName, inFile);
mas01cr@0 28
mas01cr@0 29 else if(O2_ACTION(COM_QUERY))
mas01cr@0 30 if(isClient)
mas01cr@0 31 ws_query(dbName, inFile, (char*)hostport);
mas01cr@0 32 else
mas01cr@76 33 query(dbName, inFile);
mas01cr@0 34
mas01cr@0 35 else if(O2_ACTION(COM_STATUS))
mas01cr@0 36 if(isClient)
mas01cr@0 37 ws_status(dbName,(char*)hostport);
mas01cr@0 38 else
mas01cr@0 39 status(dbName);
mas01cr@280 40
mas01cr@280 41 else if(O2_ACTION(COM_SAMPLE))
mas01cr@280 42 sample(dbName);
mas01cr@0 43
mas01cr@0 44 else if(O2_ACTION(COM_L2NORM))
mas01cr@0 45 l2norm(dbName);
mas01cr@0 46
mas01cr@193 47 else if(O2_ACTION(COM_POWER))
mas01cr@193 48 power_flag(dbName);
mas01cr@193 49
mas01cr@0 50 else if(O2_ACTION(COM_DUMP))
mas01cr@0 51 dump(dbName);
mas01cr@0 52
mas01cr@0 53 else
mas01cr@0 54 error("Unrecognized command",command);
mas01cr@0 55 }
mas01cr@0 56
mas01cr@133 57 audioDB::audioDB(const unsigned argc, char* const argv[], adb__queryResponse *adbQueryResponse): O2_AUDIODB_INITIALIZERS
mas01cr@76 58 {
mas01cr@97 59 try {
mas01cr@151 60 isServer = 1; // FIXME: Hack
mas01cr@97 61 processArgs(argc, argv);
mas01cr@97 62 assert(O2_ACTION(COM_QUERY));
mas01cr@133 63 query(dbName, inFile, adbQueryResponse);
mas01cr@97 64 } catch(char *err) {
mas01cr@97 65 cleanup();
mas01cr@97 66 throw(err);
mas01cr@97 67 }
mas01cr@76 68 }
mas01cr@76 69
mas01cr@133 70 audioDB::audioDB(const unsigned argc, char* const argv[], adb__statusResponse *adbStatusResponse): O2_AUDIODB_INITIALIZERS
mas01cr@76 71 {
mas01cr@97 72 try {
mas01cr@151 73 isServer = 1; // FIXME: Hack
mas01cr@97 74 processArgs(argc, argv);
mas01cr@97 75 assert(O2_ACTION(COM_STATUS));
mas01cr@133 76 status(dbName, adbStatusResponse);
mas01cr@97 77 } catch(char *err) {
mas01cr@97 78 cleanup();
mas01cr@97 79 throw(err);
mas01cr@97 80 }
mas01cr@76 81 }
mas01cr@76 82
mas01cr@97 83 void audioDB::cleanup() {
mas01cr@122 84 cmdline_parser_free(&args_info);
mas01cr@0 85 if(indata)
mas01cr@0 86 munmap(indata,statbuf.st_size);
mas01cr@0 87 if(db)
mas01cr@196 88 munmap(db,getpagesize());
mas01cr@196 89 if(fileTable)
mas01cr@196 90 munmap(fileTable, fileTableLength);
mas01cr@196 91 if(trackTable)
mas01cr@196 92 munmap(trackTable, trackTableLength);
mas01cr@196 93 if(dataBuf)
mas01cr@196 94 munmap(dataBuf, dataBufLength);
mas01cr@196 95 if(timesTable)
mas01cr@196 96 munmap(timesTable, timesTableLength);
mas01cr@196 97 if(l2normTable)
mas01cr@196 98 munmap(l2normTable, l2normTableLength);
mas01cr@196 99
mas01cr@0 100 if(dbfid>0)
mas01cr@0 101 close(dbfid);
mas01cr@0 102 if(infid>0)
mas01cr@0 103 close(infid);
mas01cr@0 104 if(dbH)
mas01cr@0 105 delete dbH;
mas01cr@0 106 }
mas01cr@0 107
mas01cr@97 108 audioDB::~audioDB(){
mas01cr@97 109 cleanup();
mas01cr@97 110 }
mas01cr@97 111
mas01cr@0 112 int audioDB::processArgs(const unsigned argc, char* const argv[]){
mas01cr@0 113
mas01cr@0 114 if(argc<2){
mas01cr@0 115 cmdline_parser_print_version ();
mas01cr@0 116 if (strlen(gengetopt_args_info_purpose) > 0)
mas01cr@0 117 printf("%s\n", gengetopt_args_info_purpose);
mas01cr@0 118 printf("%s\n", gengetopt_args_info_usage);
mas01cr@0 119 printf("%s\n", gengetopt_args_info_help[1]);
mas01cr@0 120 printf("%s\n", gengetopt_args_info_help[2]);
mas01cr@0 121 printf("%s\n", gengetopt_args_info_help[0]);
mas01cr@0 122 exit(0);
mas01cr@0 123 }
mas01cr@0 124
mas01cr@0 125 if (cmdline_parser (argc, argv, &args_info) != 0)
mas01cr@151 126 error("Error parsing command line");
mas01cr@0 127
mas01cr@0 128 if(args_info.help_given){
mas01cr@0 129 cmdline_parser_print_help();
mas01cr@0 130 exit(0);
mas01cr@0 131 }
mas01cr@0 132
mas01cr@0 133 if(args_info.verbosity_given){
mas01cr@239 134 verbosity = args_info.verbosity_arg;
mas01cr@239 135 if(verbosity < 0 || verbosity > 10){
mas01cr@239 136 std::cerr << "Warning: verbosity out of range, setting to 1" << std::endl;
mas01cr@239 137 verbosity = 1;
mas01cr@0 138 }
mas01cr@0 139 }
mas01cr@0 140
mas01cr@129 141 if(args_info.size_given) {
mas01cr@256 142 if(args_info.datasize_given) {
mas01cr@256 143 error("both --size and --datasize given", "");
mas01cr@256 144 }
mas01cr@256 145 if(args_info.ntracks_given) {
mas01cr@256 146 error("both --size and --ntracks given", "");
mas01cr@256 147 }
mas01cr@256 148 if(args_info.datadim_given) {
mas01cr@256 149 error("both --size and --datadim given", "");
mas01cr@256 150 }
mas01cr@196 151 if (args_info.size_arg < 50 || args_info.size_arg > 32000) {
mas01cr@129 152 error("Size out of range", "");
mas01cr@129 153 }
mas01cr@256 154 double ratio = (double) args_info.size_arg * 1000000 / ((double) O2_DEFAULTDBSIZE);
mas01cr@256 155 /* FIXME: what's the safe way of doing this? */
mas01cr@256 156 datasize = (unsigned int) ceil(datasize * ratio);
mas01cr@256 157 ntracks = (unsigned int) ceil(ntracks * ratio);
mas01cr@256 158 } else {
mas01cr@256 159 if(args_info.datasize_given) {
mas01cr@256 160 datasize = args_info.datasize_arg;
mas01cr@256 161 }
mas01cr@256 162 if(args_info.ntracks_given) {
mas01cr@256 163 ntracks = args_info.ntracks_arg;
mas01cr@256 164 }
mas01cr@256 165 if(args_info.datadim_given) {
mas01cr@256 166 datadim = args_info.datadim_arg;
mas01cr@256 167 }
mas01cr@129 168 }
mas01cr@129 169
mas01cr@239 170 if(args_info.radius_given) {
mas01cr@239 171 radius = args_info.radius_arg;
mas01cr@239 172 if(radius <= 0 || radius > 1000000000) {
mas01cr@77 173 error("radius out of range");
mas01cr@239 174 } else {
mas01cr@239 175 VERB_LOG(3, "Setting radius to %f\n", radius);
mas01mc@17 176 }
mas01mc@17 177 }
mas01mc@17 178
mas01cr@0 179 if(args_info.SERVER_given){
mas01cr@0 180 command=COM_SERVER;
mas01cr@0 181 port=args_info.SERVER_arg;
mas01cr@0 182 if(port<100 || port > 100000)
mas01cr@0 183 error("port out of range");
mas01cr@151 184 isServer = 1;
mas01cr@105 185 #if defined(O2_DEBUG)
mas01cr@104 186 struct sigaction sa;
mas01cr@104 187 sa.sa_sigaction = sigterm_action;
mas01cr@104 188 sa.sa_flags = SA_SIGINFO | SA_RESTART | SA_NODEFER;
mas01cr@104 189 sigaction(SIGTERM, &sa, NULL);
mas01cr@104 190 sa.sa_sigaction = sighup_action;
mas01cr@104 191 sa.sa_flags = SA_SIGINFO | SA_RESTART | SA_NODEFER;
mas01cr@104 192 sigaction(SIGHUP, &sa, NULL);
mas01cr@105 193 #endif
mas01cr@0 194 return 0;
mas01cr@0 195 }
mas01cr@0 196
mas01cr@0 197 // No return on client command, find database command
mas01cr@105 198 if(args_info.client_given){
mas01cr@105 199 command=COM_CLIENT;
mas01cr@105 200 hostport=args_info.client_arg;
mas01cr@105 201 isClient=1;
mas01cr@105 202 }
mas01cr@0 203
mas01cr@105 204 if(args_info.NEW_given){
mas01cr@105 205 command=COM_CREATE;
mas01cr@105 206 dbName=args_info.database_arg;
mas01cr@105 207 return 0;
mas01cr@105 208 }
mas01cr@0 209
mas01cr@105 210 if(args_info.STATUS_given){
mas01cr@105 211 command=COM_STATUS;
mas01cr@105 212 dbName=args_info.database_arg;
mas01cr@105 213 return 0;
mas01cr@105 214 }
mas01cr@0 215
mas01cr@280 216 if(args_info.SAMPLE_given) {
mas01cr@280 217 command = COM_SAMPLE;
mas01cr@280 218 dbName = args_info.database_arg;
mas01cr@280 219 sequenceLength = args_info.sequencelength_arg;
mas01cr@280 220 if(sequenceLength < 1 || sequenceLength > 1000) {
mas01cr@280 221 error("seqlen out of range: 1 <= seqlen <= 1000");
mas01cr@280 222 }
mas01cr@280 223 nsamples = args_info.nsamples_arg;
mas01cr@280 224 return 0;
mas01cr@280 225 }
mas01cr@280 226
mas01cr@105 227 if(args_info.DUMP_given){
mas01cr@105 228 command=COM_DUMP;
mas01cr@105 229 dbName=args_info.database_arg;
mas01cr@131 230 output = args_info.output_arg;
mas01cr@105 231 return 0;
mas01cr@105 232 }
mas01cr@0 233
mas01cr@105 234 if(args_info.L2NORM_given){
mas01cr@105 235 command=COM_L2NORM;
mas01cr@105 236 dbName=args_info.database_arg;
mas01cr@105 237 return 0;
mas01cr@105 238 }
mas01cr@0 239
mas01cr@193 240 if(args_info.POWER_given){
mas01cr@193 241 command=COM_POWER;
mas01cr@193 242 dbName=args_info.database_arg;
mas01cr@193 243 return 0;
mas01cr@193 244 }
mas01cr@193 245
mas01cr@105 246 if(args_info.INSERT_given){
mas01cr@105 247 command=COM_INSERT;
mas01cr@105 248 dbName=args_info.database_arg;
mas01cr@105 249 inFile=args_info.features_arg;
mas01cr@105 250 if(args_info.key_given)
mas01cr@105 251 key=args_info.key_arg;
mas01cr@105 252 if(args_info.times_given){
mas01cr@105 253 timesFileName=args_info.times_arg;
mas01cr@105 254 if(strlen(timesFileName)>0){
mas01cr@239 255 if(!(timesFile = new std::ifstream(timesFileName,std::ios::in)))
mas01cr@105 256 error("Could not open times file for reading", timesFileName);
mas01cr@105 257 usingTimes=1;
mas01cr@105 258 }
mas01cr@105 259 }
mas01cr@193 260 if (args_info.power_given) {
mas01cr@193 261 powerFileName = args_info.power_arg;
mas01cr@193 262 if (strlen(powerFileName) > 0) {
mas01cr@193 263 if (!(powerfd = open(powerFileName, O_RDONLY))) {
mas01cr@193 264 error("Could not open power file for reading", powerFileName, "open");
mas01cr@193 265 }
mas01cr@193 266 usingPower = 1;
mas01cr@193 267 }
mas01cr@193 268 }
mas01cr@105 269 return 0;
mas01cr@105 270 }
mas01cr@105 271
mas01cr@105 272 if(args_info.BATCHINSERT_given){
mas01cr@105 273 command=COM_BATCHINSERT;
mas01cr@105 274 dbName=args_info.database_arg;
mas01cr@105 275 inFile=args_info.featureList_arg;
mas01cr@105 276 if(args_info.keyList_given)
mas01cr@105 277 key=args_info.keyList_arg; // INCONSISTENT NO CHECK
mas01cr@0 278
mas01cr@105 279 /* TO DO: REPLACE WITH
mas01cr@0 280 if(args_info.keyList_given){
mas01mc@18 281 trackFileName=args_info.keyList_arg;
mas01cr@239 282 if(strlen(trackFileName)>0 && !(trackFile = new std::ifstream(trackFileName,std::ios::in)))
mas01mc@18 283 error("Could not open keyList file for reading",trackFileName);
mas01cr@0 284 }
mas01cr@0 285 AND UPDATE BATCHINSERT()
mas01cr@105 286 */
mas01cr@105 287
mas01cr@105 288 if(args_info.timesList_given){
mas01cr@105 289 timesFileName=args_info.timesList_arg;
mas01cr@105 290 if(strlen(timesFileName)>0){
mas01cr@239 291 if(!(timesFile = new std::ifstream(timesFileName,std::ios::in)))
mas01cr@105 292 error("Could not open timesList file for reading", timesFileName);
mas01cr@105 293 usingTimes=1;
mas01cr@105 294 }
mas01cr@105 295 }
mas01cr@193 296 if(args_info.powerList_given){
mas01cr@193 297 powerFileName=args_info.powerList_arg;
mas01cr@193 298 if(strlen(powerFileName)>0){
mas01cr@239 299 if(!(powerFile = new std::ifstream(powerFileName,std::ios::in)))
mas01cr@193 300 error("Could not open powerList file for reading", powerFileName);
mas01cr@193 301 usingPower=1;
mas01cr@193 302 }
mas01cr@193 303 }
mas01cr@105 304 return 0;
mas01cr@105 305 }
mas01cr@105 306
mas01cr@105 307 // Query command and arguments
mas01cr@105 308 if(args_info.QUERY_given){
mas01cr@105 309 command=COM_QUERY;
mas01cr@105 310 dbName=args_info.database_arg;
mas01cr@105 311 inFile=args_info.features_arg;
mas01cr@105 312
mas01cr@105 313 if(args_info.keyList_given){
mas01cr@105 314 trackFileName=args_info.keyList_arg;
mas01cr@239 315 if(strlen(trackFileName)>0 && !(trackFile = new std::ifstream(trackFileName,std::ios::in)))
mas01cr@105 316 error("Could not open keyList file for reading",trackFileName);
mas01cr@105 317 }
mas01cr@105 318
mas01cr@105 319 if(args_info.times_given){
mas01cr@105 320 timesFileName=args_info.times_arg;
mas01cr@105 321 if(strlen(timesFileName)>0){
mas01cr@239 322 if(!(timesFile = new std::ifstream(timesFileName,std::ios::in)))
mas01cr@105 323 error("Could not open times file for reading", timesFileName);
mas01cr@105 324 usingTimes=1;
mas01cr@105 325 }
mas01cr@105 326 }
mas01cr@193 327
mas01cr@193 328 if(args_info.power_given){
mas01cr@193 329 powerFileName=args_info.power_arg;
mas01cr@193 330 if(strlen(powerFileName)>0){
mas01cr@193 331 if (!(powerfd = open(powerFileName, O_RDONLY))) {
mas01cr@193 332 error("Could not open power file for reading", powerFileName, "open");
mas01cr@193 333 }
mas01cr@193 334 usingPower = 1;
mas01cr@193 335 }
mas01cr@193 336 }
mas01cr@105 337
mas01cr@105 338 // query type
mas01cr@105 339 if(strncmp(args_info.QUERY_arg, "track", MAXSTR)==0)
mas01cr@105 340 queryType=O2_TRACK_QUERY;
mas01cr@105 341 else if(strncmp(args_info.QUERY_arg, "point", MAXSTR)==0)
mas01cr@105 342 queryType=O2_POINT_QUERY;
mas01cr@105 343 else if(strncmp(args_info.QUERY_arg, "sequence", MAXSTR)==0)
mas01cr@105 344 queryType=O2_SEQUENCE_QUERY;
mas01mc@248 345 else if(strncmp(args_info.QUERY_arg, "nsequence", MAXSTR)==0)
mas01mc@248 346 queryType=O2_N_SEQUENCE_QUERY;
mas01mc@263 347 else if(strncmp(args_info.QUERY_arg, "onetoonensequence", MAXSTR)==0)
mas01mc@263 348 queryType=O2_ONE_TO_ONE_N_SEQUENCE_QUERY;
mas01cr@105 349 else
mas01cr@105 350 error("unsupported query type",args_info.QUERY_arg);
mas01cr@105 351
mas01cr@105 352 if(!args_info.exhaustive_flag){
mas01cr@105 353 queryPoint = args_info.qpoint_arg;
mas01cr@105 354 usingQueryPoint=1;
mas01cr@105 355 if(queryPoint<0 || queryPoint >10000)
mas01cr@105 356 error("queryPoint out of range: 0 <= queryPoint <= 10000");
mas01cr@105 357 }
mas01cr@105 358
mas01cr@105 359 pointNN = args_info.pointnn_arg;
mas01mc@263 360 if(pointNN < 1 || pointNN > O2_MAXNN) {
mas01mc@263 361 error("pointNN out of range: 1 <= pointNN <= 1000000");
mas01cr@105 362 }
mas01cr@105 363 trackNN = args_info.resultlength_arg;
mas01mc@263 364 if(trackNN < 1 || trackNN > O2_MAXNN) {
mas01mc@263 365 error("resultlength out of range: 1 <= resultlength <= 1000000");
mas01cr@105 366 }
mas01cr@105 367 sequenceLength = args_info.sequencelength_arg;
mas01cr@105 368 if(sequenceLength < 1 || sequenceLength > 1000) {
mas01cr@105 369 error("seqlen out of range: 1 <= seqlen <= 1000");
mas01cr@105 370 }
mas01cr@105 371 sequenceHop = args_info.sequencehop_arg;
mas01cr@105 372 if(sequenceHop < 1 || sequenceHop > 1000) {
mas01cr@105 373 error("seqhop out of range: 1 <= seqhop <= 1000");
mas01cr@105 374 }
mas01cr@193 375
mas01cr@193 376 if (args_info.absolute_threshold_given) {
mas01cr@193 377 if (args_info.absolute_threshold_arg >= 0) {
mas01cr@193 378 error("absolute threshold out of range: should be negative");
mas01cr@193 379 }
mas01cr@193 380 use_absolute_threshold = true;
mas01cr@193 381 absolute_threshold = args_info.absolute_threshold_arg;
mas01cr@193 382 }
mas01cr@193 383 if (args_info.relative_threshold_given) {
mas01cr@193 384 use_relative_threshold = true;
mas01cr@193 385 relative_threshold = args_info.relative_threshold_arg;
mas01cr@193 386 }
mas01cr@105 387 return 0;
mas01cr@105 388 }
mas01cr@105 389 return -1; // no command found
mas01cr@0 390 }
mas01cr@0 391
mas01cr@133 392 void audioDB::status(const char* dbName, adb__statusResponse *adbStatusResponse){
mas01cr@0 393 if(!dbH)
mas01cr@196 394 initTables(dbName, 0);
mas01cr@0 395
mas01cr@0 396 unsigned dudCount=0;
mas01cr@0 397 unsigned nullCount=0;
mas01cr@0 398 for(unsigned k=0; k<dbH->numFiles; k++){
mas01mc@18 399 if(trackTable[k]<sequenceLength){
mas01cr@0 400 dudCount++;
mas01mc@18 401 if(!trackTable[k])
mas01cr@76 402 nullCount++;
mas01cr@0 403 }
mas01cr@0 404 }
mas01cr@76 405
mas01cr@133 406 if(adbStatusResponse == 0) {
mas01cr@76 407
mas01cr@76 408 // Update Header information
mas01cr@239 409 std::cout << "num files:" << dbH->numFiles << std::endl;
mas01cr@239 410 std::cout << "data dim:" << dbH->dim <<std::endl;
mas01cr@76 411 if(dbH->dim>0){
mas01cr@239 412 std::cout << "total vectors:" << dbH->length/(sizeof(double)*dbH->dim)<<std::endl;
mas01cr@239 413 std::cout << "vectors available:" << (dbH->timesTableOffset-(dbH->dataOffset+dbH->length))/(sizeof(double)*dbH->dim) << std::endl;
mas01cr@76 414 }
mas01cr@239 415 std::cout << "total bytes:" << dbH->length << " (" << (100.0*dbH->length)/(dbH->timesTableOffset-dbH->dataOffset) << "%)" << std::endl;
mas01cr@239 416 std::cout << "bytes available:" << dbH->timesTableOffset-(dbH->dataOffset+dbH->length) << " (" <<
mas01cr@239 417 (100.0*(dbH->timesTableOffset-(dbH->dataOffset+dbH->length)))/(dbH->timesTableOffset-dbH->dataOffset) << "%)" << std::endl;
mas01cr@239 418 std::cout << "flags:" << dbH->flags << std::endl;
mas01cr@76 419
mas01cr@239 420 std::cout << "null count: " << nullCount << " small sequence count " << dudCount-nullCount << std::endl;
mas01cr@76 421 } else {
mas01cr@133 422 adbStatusResponse->result.numFiles = dbH->numFiles;
mas01cr@133 423 adbStatusResponse->result.dim = dbH->dim;
mas01cr@133 424 adbStatusResponse->result.length = dbH->length;
mas01cr@133 425 adbStatusResponse->result.dudCount = dudCount;
mas01cr@133 426 adbStatusResponse->result.nullCount = nullCount;
mas01cr@133 427 adbStatusResponse->result.flags = dbH->flags;
mas01cr@76 428 }
mas01cr@0 429 }
mas01cr@0 430
mas01cr@196 431 void audioDB::l2norm(const char* dbName) {
mas01cr@196 432 forWrite = true;
mas01cr@196 433 initTables(dbName, 0);
mas01cr@0 434 if(dbH->length>0){
mas01cr@196 435 /* FIXME: should probably be uint64_t */
mas01cr@0 436 unsigned numVectors = dbH->length/(sizeof(double)*dbH->dim);
mas01cr@196 437 CHECKED_MMAP(double *, dataBuf, dbH->dataOffset, dataBufLength);
mas01cr@0 438 unitNormAndInsertL2(dataBuf, dbH->dim, numVectors, 0); // No append
mas01cr@0 439 }
mas01cr@0 440 // Update database flags
mas01cr@0 441 dbH->flags = dbH->flags|O2_FLAG_L2NORM;
mas01cr@0 442 memcpy (db, dbH, O2_HEADERSIZE);
mas01cr@0 443 }
mas01cr@193 444
mas01cr@193 445 void audioDB::power_flag(const char *dbName) {
mas01cr@196 446 forWrite = true;
mas01cr@196 447 initTables(dbName, 0);
mas01cr@193 448 if (dbH->length > 0) {
mas01cr@193 449 error("cannot turn on power storage for non-empty database", dbName);
mas01cr@193 450 }
mas01cr@193 451 dbH->flags |= O2_FLAG_POWER;
mas01cr@193 452 memcpy(db, dbH, O2_HEADERSIZE);
mas01cr@193 453 }
mas01cr@193 454
mas01cr@239 455 // Unit norm block of features
mas01cr@0 456
mas01cr@239 457 /* FIXME: in fact this does not unit norm a block of features, it just
mas01cr@239 458 records the L2 norms somewhere. unitNorm() does in fact unit norm
mas01cr@239 459 a block of features. */
mas01cr@0 460 void audioDB::unitNormAndInsertL2(double* X, unsigned dim, unsigned n, unsigned append=0){
mas01cr@0 461 unsigned d;
mas01cr@59 462 double *p;
mas01cr@0 463 unsigned nn = n;
mas01cr@0 464
mas01cr@0 465 assert(l2normTable);
mas01cr@0 466
mas01cr@0 467 if( !append && (dbH->flags & O2_FLAG_L2NORM) )
mas01cr@0 468 error("Database is already L2 normed", "automatic norm on insert is enabled");
mas01cr@0 469
mas01cr@239 470 VERB_LOG(2, "norming %u vectors...", n);
mas01cr@0 471
mas01cr@0 472 double* l2buf = new double[n];
mas01cr@0 473 double* l2ptr = l2buf;
mas01cr@0 474 assert(l2buf);
mas01cr@0 475 assert(X);
mas01cr@0 476
mas01cr@0 477 while(nn--){
mas01cr@0 478 p=X;
mas01cr@0 479 *l2ptr=0.0;
mas01cr@0 480 d=dim;
mas01cr@0 481 while(d--){
mas01cr@0 482 *l2ptr+=*p**p;
mas01cr@0 483 p++;
mas01cr@0 484 }
mas01mc@17 485 l2ptr++;
mas01mc@17 486 X+=dim;
mas01cr@0 487 }
mas01cr@0 488 unsigned offset;
mas01cr@84 489 if(append) {
mas01cr@84 490 // FIXME: a hack, a very palpable hack: the vectors have already
mas01cr@84 491 // been inserted, and dbH->length has already been updated. We
mas01cr@84 492 // need to subtract off again the number of vectors that we've
mas01cr@84 493 // inserted this time...
mas01cr@84 494 offset=(dbH->length/(dbH->dim*sizeof(double)))-n; // number of vectors
mas01cr@84 495 } else {
mas01cr@0 496 offset=0;
mas01cr@84 497 }
mas01cr@0 498 memcpy(l2normTable+offset, l2buf, n*sizeof(double));
mas01cr@0 499 if(l2buf)
mas01mc@17 500 delete[] l2buf;
mas01cr@239 501 VERB_LOG(2, " done.");
mas01cr@193 502 }
mas01cr@193 503
mas01cr@0 504 int main(const unsigned argc, char* const argv[]){
mas01cr@0 505 audioDB(argc, argv);
mas01cr@0 506 }