Chris@1: /******************************************************************** Chris@1: * * Chris@1: * THIS FILE IS PART OF THE OggVorbis SOFTWARE CODEC SOURCE CODE. * Chris@1: * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS * Chris@1: * GOVERNED BY A BSD-STYLE SOURCE LICENSE INCLUDED WITH THIS SOURCE * Chris@1: * IN 'COPYING'. PLEASE READ THESE TERMS BEFORE DISTRIBUTING. * Chris@1: * * Chris@1: * THE OggVorbis SOURCE CODE IS (C) COPYRIGHT 1994-2009 * Chris@1: * by the Xiph.Org Foundation http://www.xiph.org/ * Chris@1: * * Chris@1: ******************************************************************** Chris@1: Chris@1: function: PCM data envelope analysis Chris@1: last mod: $Id: envelope.c 16227 2009-07-08 06:58:46Z xiphmont $ Chris@1: Chris@1: ********************************************************************/ Chris@1: Chris@1: #include Chris@1: #include Chris@1: #include Chris@1: #include Chris@1: #include Chris@1: #include "vorbis/codec.h" Chris@1: #include "codec_internal.h" Chris@1: Chris@1: #include "os.h" Chris@1: #include "scales.h" Chris@1: #include "envelope.h" Chris@1: #include "mdct.h" Chris@1: #include "misc.h" Chris@1: Chris@1: void _ve_envelope_init(envelope_lookup *e,vorbis_info *vi){ Chris@1: codec_setup_info *ci=vi->codec_setup; Chris@1: vorbis_info_psy_global *gi=&ci->psy_g_param; Chris@1: int ch=vi->channels; Chris@1: int i,j; Chris@1: int n=e->winlength=128; Chris@1: e->searchstep=64; /* not random */ Chris@1: Chris@1: e->minenergy=gi->preecho_minenergy; Chris@1: e->ch=ch; Chris@1: e->storage=128; Chris@1: e->cursor=ci->blocksizes[1]/2; Chris@1: e->mdct_win=_ogg_calloc(n,sizeof(*e->mdct_win)); Chris@1: mdct_init(&e->mdct,n); Chris@1: Chris@1: for(i=0;imdct_win[i]=sin(i/(n-1.)*M_PI); Chris@1: e->mdct_win[i]*=e->mdct_win[i]; Chris@1: } Chris@1: Chris@1: /* magic follows */ Chris@1: e->band[0].begin=2; e->band[0].end=4; Chris@1: e->band[1].begin=4; e->band[1].end=5; Chris@1: e->band[2].begin=6; e->band[2].end=6; Chris@1: e->band[3].begin=9; e->band[3].end=8; Chris@1: e->band[4].begin=13; e->band[4].end=8; Chris@1: e->band[5].begin=17; e->band[5].end=8; Chris@1: e->band[6].begin=22; e->band[6].end=8; Chris@1: Chris@1: for(j=0;jband[j].end; Chris@1: e->band[j].window=_ogg_malloc(n*sizeof(*e->band[0].window)); Chris@1: for(i=0;iband[j].window[i]=sin((i+.5)/n*M_PI); Chris@1: e->band[j].total+=e->band[j].window[i]; Chris@1: } Chris@1: e->band[j].total=1./e->band[j].total; Chris@1: } Chris@1: Chris@1: e->filter=_ogg_calloc(VE_BANDS*ch,sizeof(*e->filter)); Chris@1: e->mark=_ogg_calloc(e->storage,sizeof(*e->mark)); Chris@1: Chris@1: } Chris@1: Chris@1: void _ve_envelope_clear(envelope_lookup *e){ Chris@1: int i; Chris@1: mdct_clear(&e->mdct); Chris@1: for(i=0;iband[i].window); Chris@1: _ogg_free(e->mdct_win); Chris@1: _ogg_free(e->filter); Chris@1: _ogg_free(e->mark); Chris@1: memset(e,0,sizeof(*e)); Chris@1: } Chris@1: Chris@1: /* fairly straight threshhold-by-band based until we find something Chris@1: that works better and isn't patented. */ Chris@1: Chris@1: static int _ve_amp(envelope_lookup *ve, Chris@1: vorbis_info_psy_global *gi, Chris@1: float *data, Chris@1: envelope_band *bands, Chris@1: envelope_filter_state *filters){ Chris@1: long n=ve->winlength; Chris@1: int ret=0; Chris@1: long i,j; Chris@1: float decay; Chris@1: Chris@1: /* we want to have a 'minimum bar' for energy, else we're just Chris@1: basing blocks on quantization noise that outweighs the signal Chris@1: itself (for low power signals) */ Chris@1: Chris@1: float minV=ve->minenergy; Chris@1: float *vec=alloca(n*sizeof(*vec)); Chris@1: Chris@1: /* stretch is used to gradually lengthen the number of windows Chris@1: considered prevoius-to-potential-trigger */ Chris@1: int stretch=max(VE_MINSTRETCH,ve->stretch/2); Chris@1: float penalty=gi->stretch_penalty-(ve->stretch/2-VE_MINSTRETCH); Chris@1: if(penalty<0.f)penalty=0.f; Chris@1: if(penalty>gi->stretch_penalty)penalty=gi->stretch_penalty; Chris@1: Chris@1: /*_analysis_output_always("lpcm",seq2,data,n,0,0, Chris@1: totalshift+pos*ve->searchstep);*/ Chris@1: Chris@1: /* window and transform */ Chris@1: for(i=0;imdct_win[i]; Chris@1: mdct_forward(&ve->mdct,vec,vec); Chris@1: Chris@1: /*_analysis_output_always("mdct",seq2,vec,n/2,0,1,0); */ Chris@1: Chris@1: /* near-DC spreading function; this has nothing to do with Chris@1: psychoacoustics, just sidelobe leakage and window size */ Chris@1: { Chris@1: float temp=vec[0]*vec[0]+.7*vec[1]*vec[1]+.2*vec[2]*vec[2]; Chris@1: int ptr=filters->nearptr; Chris@1: Chris@1: /* the accumulation is regularly refreshed from scratch to avoid Chris@1: floating point creep */ Chris@1: if(ptr==0){ Chris@1: decay=filters->nearDC_acc=filters->nearDC_partialacc+temp; Chris@1: filters->nearDC_partialacc=temp; Chris@1: }else{ Chris@1: decay=filters->nearDC_acc+=temp; Chris@1: filters->nearDC_partialacc+=temp; Chris@1: } Chris@1: filters->nearDC_acc-=filters->nearDC[ptr]; Chris@1: filters->nearDC[ptr]=temp; Chris@1: Chris@1: decay*=(1./(VE_NEARDC+1)); Chris@1: filters->nearptr++; Chris@1: if(filters->nearptr>=VE_NEARDC)filters->nearptr=0; Chris@1: decay=todB(&decay)*.5-15.f; Chris@1: } Chris@1: Chris@1: /* perform spreading and limiting, also smooth the spectrum. yes, Chris@1: the MDCT results in all real coefficients, but it still *behaves* Chris@1: like real/imaginary pairs */ Chris@1: for(i=0;i>1]=val; Chris@1: decay-=8.; Chris@1: } Chris@1: Chris@1: /*_analysis_output_always("spread",seq2++,vec,n/4,0,0,0);*/ Chris@1: Chris@1: /* perform preecho/postecho triggering by band */ Chris@1: for(j=0;j=VE_AMP)filters[j].ampptr=0; Chris@1: } Chris@1: Chris@1: /* look at min/max, decide trigger */ Chris@1: if(valmax>gi->preecho_thresh[j]+penalty){ Chris@1: ret|=1; Chris@1: ret|=4; Chris@1: } Chris@1: if(valminpostecho_thresh[j]-penalty)ret|=2; Chris@1: } Chris@1: Chris@1: return(ret); Chris@1: } Chris@1: Chris@1: #if 0 Chris@1: static int seq=0; Chris@1: static ogg_int64_t totalshift=-1024; Chris@1: #endif Chris@1: Chris@1: long _ve_envelope_search(vorbis_dsp_state *v){ Chris@1: vorbis_info *vi=v->vi; Chris@1: codec_setup_info *ci=vi->codec_setup; Chris@1: vorbis_info_psy_global *gi=&ci->psy_g_param; Chris@1: envelope_lookup *ve=((private_state *)(v->backend_state))->ve; Chris@1: long i,j; Chris@1: Chris@1: int first=ve->current/ve->searchstep; Chris@1: int last=v->pcm_current/ve->searchstep-VE_WIN; Chris@1: if(first<0)first=0; Chris@1: Chris@1: /* make sure we have enough storage to match the PCM */ Chris@1: if(last+VE_WIN+VE_POST>ve->storage){ Chris@1: ve->storage=last+VE_WIN+VE_POST; /* be sure */ Chris@1: ve->mark=_ogg_realloc(ve->mark,ve->storage*sizeof(*ve->mark)); Chris@1: } Chris@1: Chris@1: for(j=first;jstretch++; Chris@1: if(ve->stretch>VE_MAXSTRETCH*2) Chris@1: ve->stretch=VE_MAXSTRETCH*2; Chris@1: Chris@1: for(i=0;ich;i++){ Chris@1: float *pcm=v->pcm[i]+ve->searchstep*(j); Chris@1: ret|=_ve_amp(ve,gi,pcm,ve->band,ve->filter+i*VE_BANDS); Chris@1: } Chris@1: Chris@1: ve->mark[j+VE_POST]=0; Chris@1: if(ret&1){ Chris@1: ve->mark[j]=1; Chris@1: ve->mark[j+1]=1; Chris@1: } Chris@1: Chris@1: if(ret&2){ Chris@1: ve->mark[j]=1; Chris@1: if(j>0)ve->mark[j-1]=1; Chris@1: } Chris@1: Chris@1: if(ret&4)ve->stretch=-1; Chris@1: } Chris@1: Chris@1: ve->current=last*ve->searchstep; Chris@1: Chris@1: { Chris@1: long centerW=v->centerW; Chris@1: long testW= Chris@1: centerW+ Chris@1: ci->blocksizes[v->W]/4+ Chris@1: ci->blocksizes[1]/2+ Chris@1: ci->blocksizes[0]/4; Chris@1: Chris@1: j=ve->cursor; Chris@1: Chris@1: while(jcurrent-(ve->searchstep)){/* account for postecho Chris@1: working back one window */ Chris@1: if(j>=testW)return(1); Chris@1: Chris@1: ve->cursor=j; Chris@1: Chris@1: if(ve->mark[j/ve->searchstep]){ Chris@1: if(j>centerW){ Chris@1: Chris@1: #if 0 Chris@1: if(j>ve->curmark){ Chris@1: float *marker=alloca(v->pcm_current*sizeof(*marker)); Chris@1: int l,m; Chris@1: memset(marker,0,sizeof(*marker)*v->pcm_current); Chris@1: fprintf(stderr,"mark! seq=%d, cursor:%fs time:%fs\n", Chris@1: seq, Chris@1: (totalshift+ve->cursor)/44100., Chris@1: (totalshift+j)/44100.); Chris@1: _analysis_output_always("pcmL",seq,v->pcm[0],v->pcm_current,0,0,totalshift); Chris@1: _analysis_output_always("pcmR",seq,v->pcm[1],v->pcm_current,0,0,totalshift); Chris@1: Chris@1: _analysis_output_always("markL",seq,v->pcm[0],j,0,0,totalshift); Chris@1: _analysis_output_always("markR",seq,v->pcm[1],j,0,0,totalshift); Chris@1: Chris@1: for(m=0;msearchstep]=ve->filter[m].markers[l]*.1; Chris@1: _analysis_output_always(buf,seq,marker,v->pcm_current,0,0,totalshift); Chris@1: } Chris@1: Chris@1: for(m=0;msearchstep]=ve->filter[m+VE_BANDS].markers[l]*.1; Chris@1: _analysis_output_always(buf,seq,marker,v->pcm_current,0,0,totalshift); Chris@1: } Chris@1: Chris@1: for(l=0;lsearchstep]=ve->mark[l]*.4; Chris@1: _analysis_output_always("mark",seq,marker,v->pcm_current,0,0,totalshift); Chris@1: Chris@1: Chris@1: seq++; Chris@1: Chris@1: } Chris@1: #endif Chris@1: Chris@1: ve->curmark=j; Chris@1: if(j>=testW)return(1); Chris@1: return(0); Chris@1: } Chris@1: } Chris@1: j+=ve->searchstep; Chris@1: } Chris@1: } Chris@1: Chris@1: return(-1); Chris@1: } Chris@1: Chris@1: int _ve_envelope_mark(vorbis_dsp_state *v){ Chris@1: envelope_lookup *ve=((private_state *)(v->backend_state))->ve; Chris@1: vorbis_info *vi=v->vi; Chris@1: codec_setup_info *ci=vi->codec_setup; Chris@1: long centerW=v->centerW; Chris@1: long beginW=centerW-ci->blocksizes[v->W]/4; Chris@1: long endW=centerW+ci->blocksizes[v->W]/4; Chris@1: if(v->W){ Chris@1: beginW-=ci->blocksizes[v->lW]/4; Chris@1: endW+=ci->blocksizes[v->nW]/4; Chris@1: }else{ Chris@1: beginW-=ci->blocksizes[0]/4; Chris@1: endW+=ci->blocksizes[0]/4; Chris@1: } Chris@1: Chris@1: if(ve->curmark>=beginW && ve->curmarksearchstep; Chris@1: long last=endW/ve->searchstep; Chris@1: long i; Chris@1: for(i=first;imark[i])return(1); Chris@1: } Chris@1: return(0); Chris@1: } Chris@1: Chris@1: void _ve_envelope_shift(envelope_lookup *e,long shift){ Chris@1: int smallsize=e->current/e->searchstep+VE_POST; /* adjust for placing marks Chris@1: ahead of ve->current */ Chris@1: int smallshift=shift/e->searchstep; Chris@1: Chris@1: memmove(e->mark,e->mark+smallshift,(smallsize-smallshift)*sizeof(*e->mark)); Chris@1: Chris@1: #if 0 Chris@1: for(i=0;ich;i++) Chris@1: memmove(e->filter[i].markers, Chris@1: e->filter[i].markers+smallshift, Chris@1: (1024-smallshift)*sizeof(*(*e->filter).markers)); Chris@1: totalshift+=shift; Chris@1: #endif Chris@1: Chris@1: e->current-=shift; Chris@1: if(e->curmark>=0) Chris@1: e->curmark-=shift; Chris@1: e->cursor-=shift; Chris@1: }