mas01cr@0
|
1 #include <stdio.h>
|
mas01cr@0
|
2 #include <stdlib.h>
|
mas01cr@0
|
3 #include <sys/types.h>
|
mas01cr@0
|
4 #include <sys/stat.h>
|
mas01cr@0
|
5 #include <sys/mman.h>
|
mas01cr@0
|
6 #include <fcntl.h>
|
mas01cr@0
|
7 #include <string.h>
|
mas01cr@0
|
8 #include <iostream>
|
mas01cr@0
|
9 #include <fstream>
|
mas01cr@0
|
10 #include <math.h>
|
mas01cr@0
|
11 #include <sys/time.h>
|
mas01cr@0
|
12 #include <assert.h>
|
mas01cr@62
|
13 #include <float.h>
|
mas01cr@104
|
14 #include <signal.h>
|
mas01cr@0
|
15
|
mas01cr@0
|
16 // includes for web services
|
mas01cr@0
|
17 #include "soapH.h"
|
mas01cr@0
|
18 #include "adb.nsmap"
|
mas01cr@0
|
19 #include "cmdline.h"
|
mas01cr@0
|
20
|
mas01cr@0
|
#define MAXSTR 512

// ---------------------------------------------------------------
// Command-line vocabulary
// ---------------------------------------------------------------

// Database PRIMARY commands
#define COM_CREATE       "--NEW"
#define COM_INSERT       "--INSERT"
#define COM_BATCHINSERT  "--BATCHINSERT"
#define COM_QUERY        "--QUERY"
#define COM_STATUS       "--STATUS"
#define COM_L2NORM       "--L2NORM"
#define COM_DUMP         "--DUMP"
#define COM_SERVER       "--SERVER"

// Parameters accompanying a primary command
#define COM_CLIENT       "--client"
#define COM_DATABASE     "--database"
#define COM_QTYPE        "--qtype"
#define COM_SEQLEN       "--sequencelength"
#define COM_SEQHOP       "--sequencehop"
#define COM_POINTNN      "--pointnn"
#define COM_TRACKNN      "--resultlength"
#define COM_QPOINT       "--qpoint"
#define COM_FEATURES     "--features"
#define COM_QUERYKEY     "--key"
#define COM_KEYLIST      "--keyList"
#define COM_TIMES        "--times"

// ---------------------------------------------------------------
// File identification: four characters packed into one word,
// first character in the lowest byte.
// ---------------------------------------------------------------
#define O2_OLD_MAGIC ('O'|'2'<<8|'D'<<16|'B'<<24)
#define O2_MAGIC ('o'|'2'<<8|'d'<<16|'b'<<24)
#define O2_FORMAT_VERSION (0U)

// ---------------------------------------------------------------
// Defaults and size limits
// ---------------------------------------------------------------
#define O2_DEFAULT_POINTNN (10U)
#define O2_DEFAULT_TRACKNN (10U)

// 2GB table size (a 1GB alternative would be (1000000000U))
#define O2_DEFAULTDBSIZE (2000000000)

// 10,000 files (a larger alternative would be (1000000))
#define O2_MAXFILES (10000U)
#define O2_MAXFILESTR (256U)
#define O2_FILETABLESIZE (O2_MAXFILESTR)
#define O2_TRACKTABLESIZE (sizeof(unsigned))
#define O2_HEADERSIZE (sizeof(dbTableHeaderT))
#define O2_MEANNUMVECTORS (1000U)
#define O2_MAXDIM (1000U)
#define O2_MAXNN (10000U)

// ---------------------------------------------------------------
// Bit values: database flags and query types share one numbering
// space (no two values below overlap).
// ---------------------------------------------------------------

// Flags
#define O2_FLAG_L2NORM (0x1U)
#define O2_FLAG_MINMAX (0x2U)
#define O2_FLAG_TIMES (0x20U)

// Query types
#define O2_POINT_QUERY (0x4U)
#define O2_SEQUENCE_QUERY (0x8U)
#define O2_TRACK_QUERY (0x10U)

// Error Codes
#define O2_ERR_KEYNOTFOUND (0xFFFFFF00)
|
mas01cr@0
|
79
|
mas01cr@0
|
80 // Macros
|
mas01cr@0
|
// O2_ACTION(a): non-zero when the string `command` (resolved in the
// scope where the macro is expanded) compares equal to `a`.
#define O2_ACTION(a) (strcmp(command,(a))==0)

// ALIGN_UP(x,w): round x up to the nearest multiple of 2^w; a value
// that is already a multiple of 2^w is returned unchanged.
// ALIGN_DOWN(x,w): round x down to the nearest multiple of 2^w.
//
// Every argument is parenthesized so that expressions containing
// low-precedence operators (e.g. `a|b`, `c ? d : e`) can be passed
// safely, and the addition in ALIGN_UP is grouped explicitly rather
// than relying on `+` binding tighter than `&`.  The mask is built
// from the int constant 1, so w must be smaller than the bit width
// of int.
#define ALIGN_UP(x,w) (((x) + ((1<<(w))-1)) & ~((1<<(w))-1))
#define ALIGN_DOWN(x,w) ((x) & ~((1<<(w))-1))
|
mas01cr@108
|
85
|
mas01cr@0
|
86 using namespace std;
|
mas01cr@0
|
87
|
mas01cr@0
|
// Header record of an audioDB file.  It consists of eleven `unsigned`
// fields and nothing else.
struct dbTableHeader {
  // Identification and global properties.
  // NOTE(review): magic/version are presumably matched against
  // O2_MAGIC / O2_FORMAT_VERSION and flags presumably holds O2_FLAG_*
  // bits -- confirm against the code that reads the header.
  unsigned magic;
  unsigned version;
  unsigned numFiles;
  unsigned dim;
  unsigned flags;

  // Lengths and offsets.
  //
  // FIXME: these really ought to be size_t or off_t, but using those
  // types would make this header (and therefore audioDB files)
  // unportable between 32-bit and 64-bit architectures.  Declaring
  // them unsigned is not the real answer; it merely works around the
  // problem.  -- CSR, 2007-10-05
  unsigned length;
  unsigned fileTableOffset;
  unsigned trackTableOffset;
  unsigned dataOffset;
  unsigned l2normTableOffset;
  unsigned timesTableOffset;
};

// Value and pointer aliases for the header record.
typedef struct dbTableHeader dbTableHeaderT;
typedef struct dbTableHeader *dbTableHeaderPtr;
|
mas01cr@0
|
106
|
mas01cr@0
|
107
|
mas01cr@0
|
108 class audioDB{
|
mas01cr@0
|
109
|
mas01cr@0
|
110 private:
|
mas01cr@0
|
111 gengetopt_args_info args_info;
|
mas01cr@0
|
112 unsigned dim;
|
mas01cr@0
|
113 const char *dbName;
|
mas01cr@0
|
114 const char *inFile;
|
mas01cr@0
|
115 const char *hostport;
|
mas01cr@0
|
116 const char *key;
|
mas01mc@18
|
117 const char* trackFileName;
|
mas01mc@18
|
118 ifstream *trackFile;
|
mas01cr@0
|
119 const char *command;
|
mas01cr@0
|
120 const char *timesFileName;
|
mas01cr@0
|
121 ifstream *timesFile;
|
mas01cr@0
|
122
|
mas01cr@0
|
123 int dbfid;
|
mas01cr@0
|
124 int infid;
|
mas01cr@0
|
125 char* db;
|
mas01cr@0
|
126 char* indata;
|
mas01cr@0
|
127 struct stat statbuf;
|
mas01cr@0
|
128 dbTableHeaderPtr dbH;
|
mas01cr@0
|
129
|
mas01cr@0
|
130 char *fileTable;
|
mas01mc@18
|
131 unsigned* trackTable;
|
mas01cr@0
|
132 double* dataBuf;
|
mas01cr@0
|
133 double* inBuf;
|
mas01cr@0
|
134 double* l2normTable;
|
mas01cr@0
|
135 double* qNorm;
|
mas01cr@0
|
136 double* sNorm;
|
mas01cr@0
|
137 double* timesTable;
|
mas01cr@0
|
138
|
mas01cr@0
|
139 // Flags and parameters
|
mas01cr@0
|
140 unsigned verbosity; // how much do we want to know?
|
mas01cr@0
|
141 unsigned queryType; // point queries default
|
mas01cr@0
|
142 unsigned pointNN; // how many point NNs ?
|
mas01mc@18
|
143 unsigned trackNN; // how many track NNs ?
|
mas01cr@0
|
144 unsigned sequenceLength;
|
mas01cr@0
|
145 unsigned sequenceHop;
|
mas01cr@0
|
146 unsigned queryPoint;
|
mas01cr@0
|
147 unsigned usingQueryPoint;
|
mas01cr@0
|
148 unsigned usingTimes;
|
mas01cr@0
|
149 unsigned isClient;
|
mas01cr@0
|
150 unsigned isServer;
|
mas01cr@0
|
151 unsigned port;
|
mas01cr@0
|
152 double timesTol;
|
mas01mc@17
|
153 double radius;
|
mas01mc@17
|
154
|
mas01cr@0
|
155 // Timers
|
mas01cr@0
|
156 struct timeval tv1;
|
mas01cr@0
|
157 struct timeval tv2;
|
mas01cr@0
|
158
|
mas01cr@0
|
159 // private methods
|
mas01cr@32
|
160 void error(const char* a, const char* b = "", const char *sysFunc = 0);
|
mas01cr@0
|
161 void pointQuery(const char* dbName, const char* inFile, adb__queryResult *adbQueryResult=0);
|
mas01mc@18
|
162 void trackPointQuery(const char* dbName, const char* inFile, adb__queryResult *adbQueryResult=0);
|
mas01mc@20
|
163 void trackSequenceQueryNN(const char* dbName, const char* inFile, adb__queryResult *adbQueryResult=0);
|
mas01mc@20
|
164 void trackSequenceQueryRad(const char* dbName, const char* inFile, adb__queryResult *adbQueryResult=0);
|
mas01cr@0
|
165
|
mas01cr@27
|
166 void initTables(const char* dbName, bool forWrite, const char* inFile);
|
mas01cr@0
|
167 void unitNorm(double* X, unsigned d, unsigned n, double* qNorm);
|
mas01cr@0
|
168 void unitNormAndInsertL2(double* X, unsigned dim, unsigned n, unsigned append);
|
mas01cr@0
|
169 void insertTimeStamps(unsigned n, ifstream* timesFile, double* timesdata);
|
mas01cr@0
|
170 unsigned getKeyPos(char* key);
|
mas01cr@0
|
171 public:
|
mas01cr@0
|
172
|
mas01cr@76
|
173 audioDB(const unsigned argc, char* const argv[]);
|
mas01cr@76
|
174 audioDB(const unsigned argc, char* const argv[], adb__queryResult *adbQueryResult);
|
mas01cr@76
|
175 audioDB(const unsigned argc, char* const argv[], adb__statusResult *adbStatusResult);
|
mas01cr@97
|
176 void cleanup();
|
mas01cr@0
|
177 ~audioDB();
|
mas01cr@0
|
178 int processArgs(const unsigned argc, char* const argv[]);
|
mas01cr@30
|
179 void get_lock(int fd, bool exclusive);
|
mas01cr@30
|
180 void release_lock(int fd);
|
mas01cr@0
|
181 void create(const char* dbName);
|
mas01cr@0
|
182 void drop();
|
mas01cr@0
|
183 void insert(const char* dbName, const char* inFile);
|
mas01cr@0
|
184 void batchinsert(const char* dbName, const char* inFile);
|
mas01cr@0
|
185 void query(const char* dbName, const char* inFile, adb__queryResult *adbQueryResult=0);
|
mas01cr@76
|
186 void status(const char* dbName, adb__statusResult *adbStatusResult=0);
|
mas01cr@0
|
187 void ws_status(const char*dbName, char* hostport);
|
mas01mc@18
|
188 void ws_query(const char*dbName, const char *trackKey, const char* hostport);
|
mas01cr@0
|
189 void l2norm(const char* dbName);
|
mas01cr@0
|
190 void dump(const char* dbName);
|
mas01cr@0
|
191
|
mas01cr@0
|
192 // web services
|
mas01cr@0
|
193 void startServer();
|
mas01cr@0
|
194
|
mas01cr@0
|
195 };
|
mas01mc@17
|
196
|
mas01cr@105
|
// Member-initializer list for audioDB, written to be pasted after the
// colon of a constructor definition (the constructor definitions are
// outside this view).
//
// Entries appear in the same order as the data members are declared in
// class audioDB, which is also the order in which they are initialized.
// Every pointer member is set to 0, including hostport, inBuf and sNorm,
// so that no pointer is left indeterminate after construction.  The
// aggregate members args_info, statbuf, tv1 and tv2 are not listed here.
//
// Do not put comments inside the macro body: every line except the
// last ends in a line continuation.
#define O2_AUDIODB_INITIALIZERS \
  dim(0), \
  dbName(0), \
  inFile(0), \
  hostport(0), \
  key(0), \
  trackFileName(0), \
  trackFile(0), \
  command(0), \
  timesFileName(0), \
  timesFile(0), \
  dbfid(0), \
  infid(0), \
  db(0), \
  indata(0), \
  dbH(0), \
  fileTable(0), \
  trackTable(0), \
  dataBuf(0), \
  inBuf(0), \
  l2normTable(0), \
  qNorm(0), \
  sNorm(0), \
  timesTable(0), \
  verbosity(1), \
  queryType(O2_POINT_QUERY), \
  pointNN(O2_DEFAULT_POINTNN), \
  trackNN(O2_DEFAULT_TRACKNN), \
  sequenceLength(16), \
  sequenceHop(1), \
  queryPoint(0), \
  usingQueryPoint(0), \
  usingTimes(0), \
  isClient(0), \
  isServer(0), \
  port(0), \
  timesTol(0.1), \
  radius(0)
|