wolffd@0
|
function [Y,FS,NBITS,OPTS] = mp3read(FILE,N,MONO,DOWNSAMP,DELAY)
% MP3READ   Read MP3 audio file via use of external binaries.
%   Y = MP3READ(FILE) reads an mp3-encoded audio file into the
%   vector Y just like wavread reads a wav-encoded file (one channel
%   per column).  Extension ".mp3" is added if FILE has none.
%   Also accepts other formats of wavread, such as
%   Y = MP3READ(FILE,N) to read just the first N sample frames (N
%   scalar), or the frames from N(1) to N(2) if N is a two-element vector.
%   Y = MP3READ(FILE,FMT) or Y = mp3read(FILE,N,FMT)
%   with FMT as 'native' returns int16 samples instead of doubles;
%   FMT can be 'double' for default behavior (to exactly mirror the
%   syntax of wavread).
%
%   [Y,FS,NBITS,OPTS] = MP3READ(FILE...) returns extra information:
%   FS is the sampling rate,  NBITS is the bit depth (always 16),
%   OPTS.fmt is a format info string; OPTS has multiple other
%   fields, see WAVREAD.
%
%   SIZ = MP3READ(FILE,'size') returns the size of the audio data contained
%   in the file in place of the actual audio data, returning the
%   2-element vector SIZ=[samples channels].
%
%   [Y...] = MP3READ(FILE,N,MONO,DOWNSAMP,DELAY) extends the
%   WAVREAD syntax to allow access to special features of the
%   mpg123 engine:  MONO = 1 forces output to be mono (by
%   averaging stereo channels); DOWNSAMP = 2 or 4 downsamples by
%   a factor of 2 or 4 (thus FS returns as 22050 or 11025
%   respectively for a 44 kHz mp3 file); DELAY controls how many
%   "warm up" samples to drop at the start of the file; the
%   default value of 2257 makes an mp3write/mp3read loop for a 44
%   kHz mp3 file be as close as possible to being temporally
%   aligned; specify as 0 to prevent discard of initial samples.
%
%   Errors are raised if DOWNSAMP is not 1, 2 or 4, if FMT is not
%   'native', 'double' or 'size', if an external binary cannot be run,
%   or if the mp3info output cannot be parsed.
%
%   Example:
%   To read an mp3 file as doubles at its original width and sampling rate:
%     [Y,FS] = mp3read('piano.mp3');
%   To read the first 1 second of the same file, downsampled by a
%   factor of 4, cast to mono, using the default filename
%   extension:
%     [Y,FS4] = mp3read('piano', FS/4, 1, 4);
%
%   Note: Because the mp3 format encodes samples in blocks of 26 ms (at
%   44 kHz), and because of the "warm up" period of the encoder,
%   the file length may not be exactly what you expect.
%
%   Note: requires external binaries mpg123 and mp3info; you
%   can find binaries for several platforms at:
%     http://labrosa.ee.columbia.edu/matlab/mp3read.html
%
%   See also mp3write, wavread.

% 2003-07-20 dpwe@ee.columbia.edu  This version calls mpg123.
% 2004-08-31 Fixed to read whole files correctly
% 2004-09-08 Uses mp3info to get info about mp3 files too
% 2004-09-18 Reports all mp3info fields in OPTS.fmt; handles MPG2LSF sizes
%            + added MONO, DOWNSAMP flags, changed default behavior.
% 2005-09-28 Fixed bug reading full-rate stereo as 1ch (thx bjoerns@vjk.dk)
% 2006-09-17 Chop off initial 2257 sample delay (for 44.1 kHz mp3)
%            so read-write loop doesn't get progressively delayed.
%            You can suppress this with a 5th argument of 0.
% 2007-02-04 Added support for FMT argument to match wavread
%            Added automatic selection of binary etc. to allow it
%            to work cross-platform without editing prior to
%            submitting to Matlab File Exchange
% 2007-07-23 Tweaks to 'size' mode so it exactly agrees with read data.

% Find our baseline directory (the helper binaries are expected next to
% this file).  Deliberately not called "path", which would shadow the
% MATLAB PATH function.
bindir = fileparts(which('mp3read'));

%%%%% Directory for temporary file (if needed)
% Try to read from environment, or use /tmp if it exists, or use CWD
tmpdir = getenv('TMPDIR');
if isempty(tmpdir) || exist(tmpdir,'file')==0
  tmpdir = '/tmp';
end
if exist(tmpdir,'file')==0
  tmpdir = '';
end

%%%%%% Location of the binaries - attempt to choose automatically
%%%%%% (or edit to be hard-coded for your installation)
binext = lower(computer);
if ispc
  binext = 'exe';
end
mpg123 = fullfile(bindir,['mpg123.',binext]);
mp3info = fullfile(bindir,['mp3info.',binext]);

%%%%% Process input arguments
if nargin < 2
  N = 0;
end

% Check for FMT spec (per wavread)
FMT = 'double';
if ischar(N)
  FMT = lower(N);
  N = 0;
end

if length(N) == 1
  % Specified N was upper limit
  N = [1 N];
end
if nargin < 3
  forcemono = 0;
else
  % Check for 3rd arg as FMT
  if ischar(MONO)
    FMT = lower(MONO);
    MONO = 0;
  end
  forcemono = (MONO ~= 0);
end
if nargin < 4
  downsamp = 1;
else
  downsamp = DOWNSAMP;
end
if downsamp ~= 1 && downsamp ~= 2 && downsamp ~= 4
  error('DOWNSAMP can only be 1, 2, or 4');
end
if nargin < 5
  mpg123delay44kHz = 2257;  % empirical delay of lame/mpg123 loop
  delay = round(mpg123delay44kHz/downsamp);
else
  delay = DELAY;
end

if strcmp(FMT,'native') == 0 && strcmp(FMT,'double') == 0 && ...
      strcmp(FMT,'size') == 0
  error(['FMT must be ''native'' or ''double'' (or ''size''), not ''',FMT,'''']);
end

%%%%%% Constants
NBITS=16;

%%%%% add extension if none (like wavread)
[unusedDir,unusedName,fileext] = fileparts(FILE);
if isempty(fileext)
  FILE = [FILE, '.mp3'];
end

%%%%%% Probe file to find format, size, etc. using "mp3info" utility
% NOTE(review): FILE is interpolated into a shell command line; a name
% containing a double quote would break the quoting.
cmd = ['"',mp3info, '" -r m -p "%Q %u %b %r %v * %C %e %E %L %O %o %p" "', FILE,'"'];
% Q = samprate, u = #frames, b = #badframes (needed to get right answer from %u)
% r = bitrate, v = mpeg version (1/2/2.5)
% C = Copyright, e = emph, E = CRC, L = layer, O = orig, o = mono, p = pad
w = mysystem(cmd);
% Break into numerical and ascii parts by finding the delimiter we put in
starpos = strfind(w,'*');
if isempty(starpos)
  error(['unable to parse mp3info output for ',FILE,' (',w,')']);
end
starpos = starpos(1);
% sscanf only parses numbers; unlike str2num it never evaluates the text
% produced by the external program.
nums = sscanf(w(1:(starpos - 2)), '%f');
strs = tokenize(w((starpos+2):end));
if length(nums) < 5 || length(strs) < 7
  error(['unable to parse mp3info output for ',FILE,' (',w,')']);
end

% The channel mode (%o) and padding (%p) are the last two fields.  The
% mode may be reported as several words (e.g. "joint stereo" - confirm
% against your mp3info build), so everything between the sixth token and
% the final one is treated as the mode.  With exactly seven tokens this
% is the plain positional reading.
chanmode = strs{6};
for k = 7:(length(strs)-1)
  chanmode = [chanmode,' ',strs{k}]; %#ok<AGROW>
end
padflag = strs{end};

SR = nums(1);
nframes = nums(2);
nchans = 2 - strcmp(chanmode, 'mono');
% layer is taken from the length of the layer field (the original code
% relies on this, i.e. a roman-numeral style "I"/"II"/"III" string)
layer = length(strs{4});
bitrate = nums(4)*1000;
mpgv = nums(5);
% Figure samples per frame, after
% http://board.mp3-tech.org/view.php3?bn=agora_mp3techorg&key=1019510889
if layer == 1
  smpspfrm = 384;
elseif SR < 32000 && layer ==3
  smpspfrm = 576;
  if mpgv == 1
    error('SR < 32000 but mpeg version = 1');
  end
else
  smpspfrm = 1152;
end

OPTS.fmt.mpgBitrate = bitrate;
OPTS.fmt.mpgVersion = mpgv;
% fields from wavread's OPTS
OPTS.fmt.nAvgBytesPerSec = bitrate/8;
OPTS.fmt.nSamplesPerSec = SR;
OPTS.fmt.nChannels = nchans;
OPTS.fmt.nBlockAlign = smpspfrm/SR*bitrate/8;
OPTS.fmt.nBitsPerSample = NBITS;
OPTS.fmt.mpgNFrames = nframes;
OPTS.fmt.mpgCopyright = strs{1};
OPTS.fmt.mpgEmphasis = strs{2};
OPTS.fmt.mpgCRC = strs{3};
OPTS.fmt.mpgLayer = strs{4};
OPTS.fmt.mpgOriginal = strs{5};
OPTS.fmt.mpgChanmode = chanmode;
OPTS.fmt.mpgPad = padflag;
OPTS.fmt.mpgSampsPerFrame = smpspfrm;

if SR == 16000 && downsamp == 4
  error('mpg123 will not downsample 16 kHz files by 4 (only 2)');
end

if downsamp == 1
  downsampstr = '';
else
  downsampstr = [' -',num2str(downsamp)];
end
FS = SR/downsamp;

if forcemono
  nchans = 1;
  chansstr = ' -m';
else
  chansstr = '';
end

% Size-reading version
if strcmp(FMT,'size') == 1
  Y = [floor(smpspfrm*nframes/downsamp)-delay, nchans];
else

  % Temporary file to use.  Borrow the unique base name generated by
  % TEMPNAME so that concurrent or repeated calls cannot collide, but
  % keep it in the directory selected above.
  [unusedDir, tmpbase] = fileparts(tempname);
  tmpfile = fullfile(tmpdir, [tmpbase,'.wav']);

  skipx = 0;
  skipblks = 0;
  skipstr = '';
  sttfrm = N(1)-1;

  % chop off transcoding delay?
  %sttfrm = sttfrm + delay;  % empirically measured
  % no, we want to *decode* those samples, then drop them
  % so delay gets added to skipx instead

  if sttfrm > 0
    skipblks = floor(sttfrm*downsamp/smpspfrm);
    skipx = sttfrm - (skipblks*smpspfrm/downsamp);
    skipstr = [' -k ', num2str(skipblks)];
  end
  skipx = skipx + delay;

  lenstr = '';
  endfrm = -1;
  decblk = 0;
  if length(N) > 1
    endfrm = N(2);
    if endfrm > sttfrm
      decblk = ceil((endfrm+delay)*downsamp/smpspfrm) - skipblks + 10;
      % we read 10 extra blks (+10) to cover the case where up to 10 bad
      % blocks are included in the part we are trying to read (it happened)
      lenstr = [' -n ', num2str(decblk)];
      % This generates a spurious "Warn: requested..." if reading right
      % to the last sample by index (or bad blks), but no matter.
    end
  end

  % Run the decode and load the data.  Whatever happens, the temporary
  % file must not be left behind.
  cmd=['"',mpg123,'"', downsampstr, chansstr, skipstr, lenstr, ...
       ' -q -w "', tmpfile,'" "',FILE,'"'];
  try
    mysystem(cmd);
    % wavread is absent from recent MATLAB releases; use audioread
    % when it is available and fall back to wavread otherwise.
    if exist('audioread','file') || exist('audioread','builtin')
      Y = audioread(tmpfile);
    else
      Y = wavread(tmpfile);
    end
  catch
    % lasterror/rethrow keeps this usable on releases that predate the
    % "catch ME" syntax.
    decodeErr = lasterror;
    if exist(tmpfile,'file')
      delete(tmpfile);
    end
    rethrow(decodeErr);
  end

  % Delete tmp file
  if exist(tmpfile,'file')
    delete(tmpfile);
  end

  % Number of sample frames actually decoded (rows of Y).  length(Y)
  % would return the channel count for data shorter than nchans frames.
  nread = size(Y,1);

  if decblk > 0 && nread < decblk*smpspfrm/downsamp
    % This will happen if the selected block range includes >1 bad block
    disp(['Warn: requested ', num2str(decblk*smpspfrm/downsamp),' frames, returned ',num2str(nread)]);
  end

  % debug
  %  disp(['sttfrm=',num2str(sttfrm),' endfrm=',num2str(endfrm),' skipx=',num2str(skipx),' delay=',num2str(delay),' len=',num2str(nread)]);

  % Select the desired part
  if skipx+endfrm-sttfrm > nread
    endfrm = nread+sttfrm-skipx;
  end

  if endfrm > sttfrm
    Y = Y(skipx+(1:(endfrm-sttfrm)),:);
  elseif skipx > 0
    Y = Y((skipx+1):end,:);
  end

  % Convert to int if format = 'native'
  if strcmp(FMT,'native')
    Y = int16((2^15)*Y);
  end

end
|
wolffd@0
|
300
|
wolffd@0
|
301 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
|
wolffd@0
|
function w = mysystem(cmd)
% MYSYSTEM  Run a system command and return the last line of its output.
%   W = MYSYSTEM(CMD) passes the string CMD to SYSTEM.  If the command
%   exits with a non-zero status an error is raised that includes the
%   command and whatever it printed.  Otherwise W is the final non-empty
%   line of the command's output, without its line terminator.
[s,w] = system(cmd);
if s ~= 0
  error(['unable to execute ',cmd,' (',w,')']);
end
% Drop trailing line terminators (LF and CR) first; otherwise output that
% ends with a newline would make the "final line" an empty string.
lastkeep = find(w ~= 10 & w ~= 13, 1, 'last');
if isempty(lastkeep)
  w = '';
  return;
end
w = w(1:lastkeep);
% Keep just final line
w = w((1+max([0,find(w == 10)])):end);
% Debug
%disp([cmd,' -> ','*',w,'*']);
|
wolffd@0
|
312
|
wolffd@0
|
313 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
|
wolffd@0
|
function a = tokenize(s)
% TOKENIZE  Split a space-separated string into a cell array of strings.
%   A = TOKENIZE(S) returns a 1-by-n cell array holding each maximal run
%   of non-space characters in S, in order.  Leading, trailing and
%   repeated spaces produce no empty entries.  Only the space character
%   separates tokens.  When S holds no tokens, A is the empty matrix [].
% 2004-09-18 dpwe@ee.columbia.edu
a = regexp(s, '[^ ]+', 'match');
if isempty(a)
  % no tokens found: return a plain empty matrix rather than an empty cell
  a = [];
end
|
wolffd@0
|
334
|