annotate Problems/generateAudioDenoiseProblem.m @ 128:8e660fd14774 ivand_dev

Feature 186
author Ivan Damnjanovic lnx <ivan.damnjanovic@eecs.qmul.ac.uk>
date Mon, 13 Jun 2011 14:55:45 +0100
parents 0211faef9add
children f42aa8bcb82f
rev   line source
idamnjanovic@10 1 function data=generateAudioDenoiseProblem(au, trainnum, blocksize, dictsize, overlap, sigma, gain, maxval, initdict);
ivan@128 2 %% Audio Denoising Problem - needs revision, not yet finalised
idamnjanovic@10 3 %
idamnjanovic@10 4 % generateAudioDenoiseProblem is part of the SMALLbox and generate a
idamnjanovic@10 5 % problem for comaprison of Dictionary Learning/Sparse Representation
idamnjanovic@10 6 % techniques in audio denoising scenario. It is based on KSVD image
idamnjanovic@10 7 % denoise demo by Ron Rubinstein (see bellow).
idamnjanovic@10 8 % The fuction takes as an optional input
idamnjanovic@10 9 % au - audio samples to be denoised
idamnjanovic@10 10 % trainnum - number of frames for training
idamnjanovic@10 11 % blocksize - 1D frame size (eg 512)
idamnjanovic@10 12 % dictsize - number of atoms to be trained
idamnjanovic@10 13 % overlap - ammount of overlaping frames between 0 and 1
idamnjanovic@21 14 %
idamnjanovic@10 15
ivan@128 16 % Centre for Digital Music, Queen Mary, University of London.
ivan@128 17 % This file copyright 2010 Ivan Damnjanovic.
ivan@128 18 %
ivan@128 19 % This program is free software; you can redistribute it and/or
ivan@128 20 % modify it under the terms of the GNU General Public License as
ivan@128 21 % published by the Free Software Foundation; either version 2 of the
ivan@128 22 % License, or (at your option) any later version. See the file
ivan@128 23 % COPYING included with this distribution for more information.
ivan@128 24 %%
idamnjanovic@10 25 disp(' ');
idamnjanovic@10 26 disp(' ********** Denoising Problem **********');
idamnjanovic@10 27 disp(' ');
idamnjanovic@10 28 disp(' This function reads an audio, adds random Gaussian noise,');
idamnjanovic@10 29 disp(' that can be later denoised by using dictionary learning techniques.');
idamnjanovic@10 30 disp(' ');
idamnjanovic@10 31
idamnjanovic@10 32 FS=filesep;
idamnjanovic@10 33 if ~ exist( 'sigma', 'var' ) || isempty(sigma), sigma = 26.74; end
idamnjanovic@10 34 if ~ exist( 'gain', 'var' ) || isempty(gain), gain = 1.15; end
idamnjanovic@10 35
idamnjanovic@10 36 if ~ exist( 'initdict', 'var' ) || isempty(initdict), initdict = 'odct'; end
idamnjanovic@10 37 if ~ exist( 'overlap', 'var' ) || isempty(overlap), overlap = 15/16; end
idamnjanovic@10 38 %% prompt user for wav file %%
idamnjanovic@10 39 %ask for file name
idamnjanovic@10 40
idamnjanovic@10 41 TMPpath=pwd;
idamnjanovic@10 42 if ~ exist( 'au', 'var' ) || isempty(au)
idamnjanovic@10 43 [pathstr1, name, ext, versn] = fileparts(which('SMALLboxSetup.m'));
idamnjanovic@10 44 cd([pathstr1,FS,'data',FS,'audio',FS,'wav']);
idamnjanovic@10 45 [filename,pathname] = uigetfile({'*.wav;'},'Select a wav file');
idamnjanovic@10 46 [pathstr, name, ext, versn] = fileparts(filename);
idamnjanovic@10 47 data.name=name;
idamnjanovic@10 48
idamnjanovic@10 49 au = wavread(filename);
idamnjanovic@10 50 au = mean(au,2); % turn it into mono.
idamnjanovic@10 51 end;
idamnjanovic@10 52 if ~ exist( 'maxval', 'var' ) || isempty(maxval), maxval = max(au); end
idamnjanovic@10 53
idamnjanovic@10 54 %% generate noisy audio %%
idamnjanovic@10 55
idamnjanovic@10 56 disp(' ');
idamnjanovic@10 57 disp('Generating noisy audio...');
idamnjanovic@10 58 sigma = max(au)/10^(sigma/20);
idamnjanovic@10 59 n = randn(size(au)) .* sigma;
idamnjanovic@10 60 aunoise = au + n;% here we can load noise audio if available
idamnjanovic@10 61 % for example: wavread('icassp06_x.wav');%
idamnjanovic@10 62
idamnjanovic@10 63
idamnjanovic@10 64
idamnjanovic@10 65 %% set parameters %%
idamnjanovic@10 66
idamnjanovic@10 67 x = aunoise;
idamnjanovic@10 68 if ~ exist( 'blocksize', 'var' ) || isempty(blocksize),blocksize = 512;end
idamnjanovic@10 69 if ~ exist( 'dictsize', 'var' ) || isempty(dictsize), dictsize = 2048;end
idamnjanovic@10 70
idamnjanovic@10 71 if ~ exist( 'trainnum', 'var' ) || isempty(trainnum),trainnum = (size(x,1)-blocksize+1);end
idamnjanovic@10 72
idamnjanovic@10 73
idamnjanovic@10 74
idamnjanovic@10 75
idamnjanovic@10 76
idamnjanovic@10 77 p=1;
idamnjanovic@10 78
idamnjanovic@10 79
idamnjanovic@10 80 %
idamnjanovic@10 81 % msgdelta = 5;
idamnjanovic@10 82 %
idamnjanovic@10 83 % verbose = 't';
idamnjanovic@10 84 % if (msgdelta <= 0)
idamnjanovic@10 85 % verbose='';
idamnjanovic@10 86 % msgdelta = -1;
idamnjanovic@10 87 % end
idamnjanovic@10 88 %
idamnjanovic@10 89 %
idamnjanovic@10 90 % % initial dictionary %
idamnjanovic@10 91 %
idamnjanovic@10 92 if (strcmpi(initdict,'odct'))
idamnjanovic@10 93 initdict = odctndict(blocksize,dictsize,p);
idamnjanovic@10 94 elseif (strcmpi(initdict,'data'))
idamnjanovic@10 95 clear initdict; % causes initialization using random examples
idamnjanovic@10 96 else
idamnjanovic@10 97 error('Invalid initial dictionary specified.');
idamnjanovic@10 98 end
idamnjanovic@10 99
idamnjanovic@10 100 if exist( 'initdict', 'var' )
idamnjanovic@10 101 initdict = initdict(:,1:dictsize);
idamnjanovic@10 102 end
idamnjanovic@10 103
idamnjanovic@10 104
idamnjanovic@10 105 % noise mode %
idamnjanovic@10 106 % if (isfield(params,'noisemode'))
idamnjanovic@10 107 % switch lower(params.noisemode)
idamnjanovic@10 108 % case 'psnr'
idamnjanovic@10 109 % sigma = maxval / 10^(params.psnr/20);
idamnjanovic@10 110 % case 'sigma'
idamnjanovic@10 111 % sigma = params.sigma;
idamnjanovic@10 112 % otherwise
idamnjanovic@10 113 % error('Invalid noise mode specified');
idamnjanovic@10 114 % end
idamnjanovic@10 115 % elseif (isfield(params,'sigma'))
idamnjanovic@10 116 % sigma = params.sigma;
idamnjanovic@10 117 % elseif (isfield(params,'psnr'))
idamnjanovic@10 118 % sigma = maxval / 10^(params.psnr/20);
idamnjanovic@10 119 % else
idamnjanovic@10 120 % error('Noise strength not specified');
idamnjanovic@10 121 % end
idamnjanovic@10 122
idamnjanovic@10 123 % params.Edata = sqrt(prod(blocksize)) * sigma * gain; % target error for omp
idamnjanovic@10 124 % params.codemode = 'error';
idamnjanovic@10 125 %
idamnjanovic@10 126 % params.sigma = sigma;
idamnjanovic@10 127 % params.noisemode = 'sigma';
idamnjanovic@10 128 %
idamnjanovic@10 129 %
idamnjanovic@10 130 % % make sure test data is not present in params
idamnjanovic@10 131 % if (isfield(params,'testdata'))
idamnjanovic@10 132 % params = rmfield(params,'testdata');
idamnjanovic@10 133 % end
idamnjanovic@10 134
idamnjanovic@10 135
idamnjanovic@10 136 %%%% create training data %%%
idamnjanovic@10 137
idamnjanovic@10 138
idamnjanovic@10 139 X = buffer( x(1:trainnum),blocksize, overlap*blocksize);
idamnjanovic@10 140
idamnjanovic@10 141 % remove dc in blocks to conserve memory %
idamnjanovic@10 142 % bsize = 2000;
idamnjanovic@10 143 % for i = 1:bsize:size(X,2)
idamnjanovic@10 144 % blockids = i : min(i+bsize-1,size(X,2));
idamnjanovic@10 145 % X(:,blockids) = remove_dc(X(:,blockids),'columns');
idamnjanovic@10 146 % end
idamnjanovic@10 147 data.Original = au;
idamnjanovic@10 148 data.Noisy = aunoise;
idamnjanovic@10 149 data.b = X;
idamnjanovic@10 150 data.m = size(X,1);
idamnjanovic@10 151 data.n = size(X,2);
idamnjanovic@10 152 data.p = dictsize;
idamnjanovic@10 153 data.blocksize=blocksize;
idamnjanovic@10 154 data.sigma = sigma;
idamnjanovic@10 155 data.gain = gain;
idamnjanovic@10 156 data.maxval = maxval;
idamnjanovic@10 157 data.initdict= initdict;
idamnjanovic@10 158 data.signalDim=1;
idamnjanovic@10 159 cd(TMPpath);
idamnjanovic@10 160