cannam@154
|
1 /* Copyright (c) 2007-2008 CSIRO
|
cannam@154
|
2 Copyright (c) 2007-2009 Xiph.Org Foundation
|
cannam@154
|
3 Written by Jean-Marc Valin */
|
cannam@154
|
4 /**
|
cannam@154
|
5 @file pitch.c
|
cannam@154
|
6 @brief Pitch analysis
|
cannam@154
|
7 */
|
cannam@154
|
8
|
cannam@154
|
9 /*
|
cannam@154
|
10 Redistribution and use in source and binary forms, with or without
|
cannam@154
|
11 modification, are permitted provided that the following conditions
|
cannam@154
|
12 are met:
|
cannam@154
|
13
|
cannam@154
|
14 - Redistributions of source code must retain the above copyright
|
cannam@154
|
15 notice, this list of conditions and the following disclaimer.
|
cannam@154
|
16
|
cannam@154
|
17 - Redistributions in binary form must reproduce the above copyright
|
cannam@154
|
18 notice, this list of conditions and the following disclaimer in the
|
cannam@154
|
19 documentation and/or other materials provided with the distribution.
|
cannam@154
|
20
|
cannam@154
|
21 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
cannam@154
|
22 ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
cannam@154
|
23 LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
cannam@154
|
24 A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
|
cannam@154
|
25 OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
cannam@154
|
26 EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
cannam@154
|
27 PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
cannam@154
|
28 PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
cannam@154
|
29 LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
cannam@154
|
30 NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
cannam@154
|
31 SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
cannam@154
|
32 */
|
cannam@154
|
33
|
cannam@154
|
34 #ifdef HAVE_CONFIG_H
|
cannam@154
|
35 #include "config.h"
|
cannam@154
|
36 #endif
|
cannam@154
|
37
|
cannam@154
|
38 #include "pitch.h"
|
cannam@154
|
39 #include "os_support.h"
|
cannam@154
|
40 #include "modes.h"
|
cannam@154
|
41 #include "stack_alloc.h"
|
cannam@154
|
42 #include "mathops.h"
|
cannam@154
|
43 #include "celt_lpc.h"
|
cannam@154
|
44
|
cannam@154
|
45 static void find_best_pitch(opus_val32 *xcorr, opus_val16 *y, int len,
|
cannam@154
|
46 int max_pitch, int *best_pitch
|
cannam@154
|
47 #ifdef FIXED_POINT
|
cannam@154
|
48 , int yshift, opus_val32 maxcorr
|
cannam@154
|
49 #endif
|
cannam@154
|
50 )
|
cannam@154
|
51 {
|
cannam@154
|
52 int i, j;
|
cannam@154
|
53 opus_val32 Syy=1;
|
cannam@154
|
54 opus_val16 best_num[2];
|
cannam@154
|
55 opus_val32 best_den[2];
|
cannam@154
|
56 #ifdef FIXED_POINT
|
cannam@154
|
57 int xshift;
|
cannam@154
|
58
|
cannam@154
|
59 xshift = celt_ilog2(maxcorr)-14;
|
cannam@154
|
60 #endif
|
cannam@154
|
61
|
cannam@154
|
62 best_num[0] = -1;
|
cannam@154
|
63 best_num[1] = -1;
|
cannam@154
|
64 best_den[0] = 0;
|
cannam@154
|
65 best_den[1] = 0;
|
cannam@154
|
66 best_pitch[0] = 0;
|
cannam@154
|
67 best_pitch[1] = 1;
|
cannam@154
|
68 for (j=0;j<len;j++)
|
cannam@154
|
69 Syy = ADD32(Syy, SHR32(MULT16_16(y[j],y[j]), yshift));
|
cannam@154
|
70 for (i=0;i<max_pitch;i++)
|
cannam@154
|
71 {
|
cannam@154
|
72 if (xcorr[i]>0)
|
cannam@154
|
73 {
|
cannam@154
|
74 opus_val16 num;
|
cannam@154
|
75 opus_val32 xcorr16;
|
cannam@154
|
76 xcorr16 = EXTRACT16(VSHR32(xcorr[i], xshift));
|
cannam@154
|
77 #ifndef FIXED_POINT
|
cannam@154
|
78 /* Considering the range of xcorr16, this should avoid both underflows
|
cannam@154
|
79 and overflows (inf) when squaring xcorr16 */
|
cannam@154
|
80 xcorr16 *= 1e-12f;
|
cannam@154
|
81 #endif
|
cannam@154
|
82 num = MULT16_16_Q15(xcorr16,xcorr16);
|
cannam@154
|
83 if (MULT16_32_Q15(num,best_den[1]) > MULT16_32_Q15(best_num[1],Syy))
|
cannam@154
|
84 {
|
cannam@154
|
85 if (MULT16_32_Q15(num,best_den[0]) > MULT16_32_Q15(best_num[0],Syy))
|
cannam@154
|
86 {
|
cannam@154
|
87 best_num[1] = best_num[0];
|
cannam@154
|
88 best_den[1] = best_den[0];
|
cannam@154
|
89 best_pitch[1] = best_pitch[0];
|
cannam@154
|
90 best_num[0] = num;
|
cannam@154
|
91 best_den[0] = Syy;
|
cannam@154
|
92 best_pitch[0] = i;
|
cannam@154
|
93 } else {
|
cannam@154
|
94 best_num[1] = num;
|
cannam@154
|
95 best_den[1] = Syy;
|
cannam@154
|
96 best_pitch[1] = i;
|
cannam@154
|
97 }
|
cannam@154
|
98 }
|
cannam@154
|
99 }
|
cannam@154
|
100 Syy += SHR32(MULT16_16(y[i+len],y[i+len]),yshift) - SHR32(MULT16_16(y[i],y[i]),yshift);
|
cannam@154
|
101 Syy = MAX32(1, Syy);
|
cannam@154
|
102 }
|
cannam@154
|
103 }
|
cannam@154
|
104
|
cannam@154
|
105 static void celt_fir5(opus_val16 *x,
|
cannam@154
|
106 const opus_val16 *num,
|
cannam@154
|
107 int N)
|
cannam@154
|
108 {
|
cannam@154
|
109 int i;
|
cannam@154
|
110 opus_val16 num0, num1, num2, num3, num4;
|
cannam@154
|
111 opus_val32 mem0, mem1, mem2, mem3, mem4;
|
cannam@154
|
112 num0=num[0];
|
cannam@154
|
113 num1=num[1];
|
cannam@154
|
114 num2=num[2];
|
cannam@154
|
115 num3=num[3];
|
cannam@154
|
116 num4=num[4];
|
cannam@154
|
117 mem0=0;
|
cannam@154
|
118 mem1=0;
|
cannam@154
|
119 mem2=0;
|
cannam@154
|
120 mem3=0;
|
cannam@154
|
121 mem4=0;
|
cannam@154
|
122 for (i=0;i<N;i++)
|
cannam@154
|
123 {
|
cannam@154
|
124 opus_val32 sum = SHL32(EXTEND32(x[i]), SIG_SHIFT);
|
cannam@154
|
125 sum = MAC16_16(sum,num0,mem0);
|
cannam@154
|
126 sum = MAC16_16(sum,num1,mem1);
|
cannam@154
|
127 sum = MAC16_16(sum,num2,mem2);
|
cannam@154
|
128 sum = MAC16_16(sum,num3,mem3);
|
cannam@154
|
129 sum = MAC16_16(sum,num4,mem4);
|
cannam@154
|
130 mem4 = mem3;
|
cannam@154
|
131 mem3 = mem2;
|
cannam@154
|
132 mem2 = mem1;
|
cannam@154
|
133 mem1 = mem0;
|
cannam@154
|
134 mem0 = x[i];
|
cannam@154
|
135 x[i] = ROUND16(sum, SIG_SHIFT);
|
cannam@154
|
136 }
|
cannam@154
|
137 }
|
cannam@154
|
138
|
cannam@154
|
139
|
cannam@154
|
140 void pitch_downsample(celt_sig * OPUS_RESTRICT x[], opus_val16 * OPUS_RESTRICT x_lp,
|
cannam@154
|
141 int len, int C, int arch)
|
cannam@154
|
142 {
|
cannam@154
|
143 int i;
|
cannam@154
|
144 opus_val32 ac[5];
|
cannam@154
|
145 opus_val16 tmp=Q15ONE;
|
cannam@154
|
146 opus_val16 lpc[4];
|
cannam@154
|
147 opus_val16 lpc2[5];
|
cannam@154
|
148 opus_val16 c1 = QCONST16(.8f,15);
|
cannam@154
|
149 #ifdef FIXED_POINT
|
cannam@154
|
150 int shift;
|
cannam@154
|
151 opus_val32 maxabs = celt_maxabs32(x[0], len);
|
cannam@154
|
152 if (C==2)
|
cannam@154
|
153 {
|
cannam@154
|
154 opus_val32 maxabs_1 = celt_maxabs32(x[1], len);
|
cannam@154
|
155 maxabs = MAX32(maxabs, maxabs_1);
|
cannam@154
|
156 }
|
cannam@154
|
157 if (maxabs<1)
|
cannam@154
|
158 maxabs=1;
|
cannam@154
|
159 shift = celt_ilog2(maxabs)-10;
|
cannam@154
|
160 if (shift<0)
|
cannam@154
|
161 shift=0;
|
cannam@154
|
162 if (C==2)
|
cannam@154
|
163 shift++;
|
cannam@154
|
164 #endif
|
cannam@154
|
165 for (i=1;i<len>>1;i++)
|
cannam@154
|
166 x_lp[i] = SHR32(HALF32(HALF32(x[0][(2*i-1)]+x[0][(2*i+1)])+x[0][2*i]), shift);
|
cannam@154
|
167 x_lp[0] = SHR32(HALF32(HALF32(x[0][1])+x[0][0]), shift);
|
cannam@154
|
168 if (C==2)
|
cannam@154
|
169 {
|
cannam@154
|
170 for (i=1;i<len>>1;i++)
|
cannam@154
|
171 x_lp[i] += SHR32(HALF32(HALF32(x[1][(2*i-1)]+x[1][(2*i+1)])+x[1][2*i]), shift);
|
cannam@154
|
172 x_lp[0] += SHR32(HALF32(HALF32(x[1][1])+x[1][0]), shift);
|
cannam@154
|
173 }
|
cannam@154
|
174
|
cannam@154
|
175 _celt_autocorr(x_lp, ac, NULL, 0,
|
cannam@154
|
176 4, len>>1, arch);
|
cannam@154
|
177
|
cannam@154
|
178 /* Noise floor -40 dB */
|
cannam@154
|
179 #ifdef FIXED_POINT
|
cannam@154
|
180 ac[0] += SHR32(ac[0],13);
|
cannam@154
|
181 #else
|
cannam@154
|
182 ac[0] *= 1.0001f;
|
cannam@154
|
183 #endif
|
cannam@154
|
184 /* Lag windowing */
|
cannam@154
|
185 for (i=1;i<=4;i++)
|
cannam@154
|
186 {
|
cannam@154
|
187 /*ac[i] *= exp(-.5*(2*M_PI*.002*i)*(2*M_PI*.002*i));*/
|
cannam@154
|
188 #ifdef FIXED_POINT
|
cannam@154
|
189 ac[i] -= MULT16_32_Q15(2*i*i, ac[i]);
|
cannam@154
|
190 #else
|
cannam@154
|
191 ac[i] -= ac[i]*(.008f*i)*(.008f*i);
|
cannam@154
|
192 #endif
|
cannam@154
|
193 }
|
cannam@154
|
194
|
cannam@154
|
195 _celt_lpc(lpc, ac, 4);
|
cannam@154
|
196 for (i=0;i<4;i++)
|
cannam@154
|
197 {
|
cannam@154
|
198 tmp = MULT16_16_Q15(QCONST16(.9f,15), tmp);
|
cannam@154
|
199 lpc[i] = MULT16_16_Q15(lpc[i], tmp);
|
cannam@154
|
200 }
|
cannam@154
|
201 /* Add a zero */
|
cannam@154
|
202 lpc2[0] = lpc[0] + QCONST16(.8f,SIG_SHIFT);
|
cannam@154
|
203 lpc2[1] = lpc[1] + MULT16_16_Q15(c1,lpc[0]);
|
cannam@154
|
204 lpc2[2] = lpc[2] + MULT16_16_Q15(c1,lpc[1]);
|
cannam@154
|
205 lpc2[3] = lpc[3] + MULT16_16_Q15(c1,lpc[2]);
|
cannam@154
|
206 lpc2[4] = MULT16_16_Q15(c1,lpc[3]);
|
cannam@154
|
207 celt_fir5(x_lp, lpc2, len>>1);
|
cannam@154
|
208 }
|
cannam@154
|
209
|
cannam@154
|
210 /* Pure C implementation. */
|
cannam@154
|
211 #ifdef FIXED_POINT
|
cannam@154
|
212 opus_val32
|
cannam@154
|
213 #else
|
cannam@154
|
214 void
|
cannam@154
|
215 #endif
|
cannam@154
|
216 celt_pitch_xcorr_c(const opus_val16 *_x, const opus_val16 *_y,
|
cannam@154
|
217 opus_val32 *xcorr, int len, int max_pitch, int arch)
|
cannam@154
|
218 {
|
cannam@154
|
219
|
cannam@154
|
220 #if 0 /* This is a simple version of the pitch correlation that should work
|
cannam@154
|
221 well on DSPs like Blackfin and TI C5x/C6x */
|
cannam@154
|
222 int i, j;
|
cannam@154
|
223 #ifdef FIXED_POINT
|
cannam@154
|
224 opus_val32 maxcorr=1;
|
cannam@154
|
225 #endif
|
cannam@154
|
226 #if !defined(OVERRIDE_PITCH_XCORR)
|
cannam@154
|
227 (void)arch;
|
cannam@154
|
228 #endif
|
cannam@154
|
229 for (i=0;i<max_pitch;i++)
|
cannam@154
|
230 {
|
cannam@154
|
231 opus_val32 sum = 0;
|
cannam@154
|
232 for (j=0;j<len;j++)
|
cannam@154
|
233 sum = MAC16_16(sum, _x[j], _y[i+j]);
|
cannam@154
|
234 xcorr[i] = sum;
|
cannam@154
|
235 #ifdef FIXED_POINT
|
cannam@154
|
236 maxcorr = MAX32(maxcorr, sum);
|
cannam@154
|
237 #endif
|
cannam@154
|
238 }
|
cannam@154
|
239 #ifdef FIXED_POINT
|
cannam@154
|
240 return maxcorr;
|
cannam@154
|
241 #endif
|
cannam@154
|
242
|
cannam@154
|
243 #else /* Unrolled version of the pitch correlation -- runs faster on x86 and ARM */
|
cannam@154
|
244 int i;
|
cannam@154
|
245 /*The EDSP version requires that max_pitch is at least 1, and that _x is
|
cannam@154
|
246 32-bit aligned.
|
cannam@154
|
247 Since it's hard to put asserts in assembly, put them here.*/
|
cannam@154
|
248 #ifdef FIXED_POINT
|
cannam@154
|
249 opus_val32 maxcorr=1;
|
cannam@154
|
250 #endif
|
cannam@154
|
251 celt_assert(max_pitch>0);
|
cannam@154
|
252 celt_sig_assert((((unsigned char *)_x-(unsigned char *)NULL)&3)==0);
|
cannam@154
|
253 for (i=0;i<max_pitch-3;i+=4)
|
cannam@154
|
254 {
|
cannam@154
|
255 opus_val32 sum[4]={0,0,0,0};
|
cannam@154
|
256 xcorr_kernel(_x, _y+i, sum, len, arch);
|
cannam@154
|
257 xcorr[i]=sum[0];
|
cannam@154
|
258 xcorr[i+1]=sum[1];
|
cannam@154
|
259 xcorr[i+2]=sum[2];
|
cannam@154
|
260 xcorr[i+3]=sum[3];
|
cannam@154
|
261 #ifdef FIXED_POINT
|
cannam@154
|
262 sum[0] = MAX32(sum[0], sum[1]);
|
cannam@154
|
263 sum[2] = MAX32(sum[2], sum[3]);
|
cannam@154
|
264 sum[0] = MAX32(sum[0], sum[2]);
|
cannam@154
|
265 maxcorr = MAX32(maxcorr, sum[0]);
|
cannam@154
|
266 #endif
|
cannam@154
|
267 }
|
cannam@154
|
268 /* In case max_pitch isn't a multiple of 4, do non-unrolled version. */
|
cannam@154
|
269 for (;i<max_pitch;i++)
|
cannam@154
|
270 {
|
cannam@154
|
271 opus_val32 sum;
|
cannam@154
|
272 sum = celt_inner_prod(_x, _y+i, len, arch);
|
cannam@154
|
273 xcorr[i] = sum;
|
cannam@154
|
274 #ifdef FIXED_POINT
|
cannam@154
|
275 maxcorr = MAX32(maxcorr, sum);
|
cannam@154
|
276 #endif
|
cannam@154
|
277 }
|
cannam@154
|
278 #ifdef FIXED_POINT
|
cannam@154
|
279 return maxcorr;
|
cannam@154
|
280 #endif
|
cannam@154
|
281 #endif
|
cannam@154
|
282 }
|
cannam@154
|
283
|
cannam@154
|
284 void pitch_search(const opus_val16 * OPUS_RESTRICT x_lp, opus_val16 * OPUS_RESTRICT y,
|
cannam@154
|
285 int len, int max_pitch, int *pitch, int arch)
|
cannam@154
|
286 {
|
cannam@154
|
287 int i, j;
|
cannam@154
|
288 int lag;
|
cannam@154
|
289 int best_pitch[2]={0,0};
|
cannam@154
|
290 VARDECL(opus_val16, x_lp4);
|
cannam@154
|
291 VARDECL(opus_val16, y_lp4);
|
cannam@154
|
292 VARDECL(opus_val32, xcorr);
|
cannam@154
|
293 #ifdef FIXED_POINT
|
cannam@154
|
294 opus_val32 maxcorr;
|
cannam@154
|
295 opus_val32 xmax, ymax;
|
cannam@154
|
296 int shift=0;
|
cannam@154
|
297 #endif
|
cannam@154
|
298 int offset;
|
cannam@154
|
299
|
cannam@154
|
300 SAVE_STACK;
|
cannam@154
|
301
|
cannam@154
|
302 celt_assert(len>0);
|
cannam@154
|
303 celt_assert(max_pitch>0);
|
cannam@154
|
304 lag = len+max_pitch;
|
cannam@154
|
305
|
cannam@154
|
306 ALLOC(x_lp4, len>>2, opus_val16);
|
cannam@154
|
307 ALLOC(y_lp4, lag>>2, opus_val16);
|
cannam@154
|
308 ALLOC(xcorr, max_pitch>>1, opus_val32);
|
cannam@154
|
309
|
cannam@154
|
310 /* Downsample by 2 again */
|
cannam@154
|
311 for (j=0;j<len>>2;j++)
|
cannam@154
|
312 x_lp4[j] = x_lp[2*j];
|
cannam@154
|
313 for (j=0;j<lag>>2;j++)
|
cannam@154
|
314 y_lp4[j] = y[2*j];
|
cannam@154
|
315
|
cannam@154
|
316 #ifdef FIXED_POINT
|
cannam@154
|
317 xmax = celt_maxabs16(x_lp4, len>>2);
|
cannam@154
|
318 ymax = celt_maxabs16(y_lp4, lag>>2);
|
cannam@154
|
319 shift = celt_ilog2(MAX32(1, MAX32(xmax, ymax)))-11;
|
cannam@154
|
320 if (shift>0)
|
cannam@154
|
321 {
|
cannam@154
|
322 for (j=0;j<len>>2;j++)
|
cannam@154
|
323 x_lp4[j] = SHR16(x_lp4[j], shift);
|
cannam@154
|
324 for (j=0;j<lag>>2;j++)
|
cannam@154
|
325 y_lp4[j] = SHR16(y_lp4[j], shift);
|
cannam@154
|
326 /* Use double the shift for a MAC */
|
cannam@154
|
327 shift *= 2;
|
cannam@154
|
328 } else {
|
cannam@154
|
329 shift = 0;
|
cannam@154
|
330 }
|
cannam@154
|
331 #endif
|
cannam@154
|
332
|
cannam@154
|
333 /* Coarse search with 4x decimation */
|
cannam@154
|
334
|
cannam@154
|
335 #ifdef FIXED_POINT
|
cannam@154
|
336 maxcorr =
|
cannam@154
|
337 #endif
|
cannam@154
|
338 celt_pitch_xcorr(x_lp4, y_lp4, xcorr, len>>2, max_pitch>>2, arch);
|
cannam@154
|
339
|
cannam@154
|
340 find_best_pitch(xcorr, y_lp4, len>>2, max_pitch>>2, best_pitch
|
cannam@154
|
341 #ifdef FIXED_POINT
|
cannam@154
|
342 , 0, maxcorr
|
cannam@154
|
343 #endif
|
cannam@154
|
344 );
|
cannam@154
|
345
|
cannam@154
|
346 /* Finer search with 2x decimation */
|
cannam@154
|
347 #ifdef FIXED_POINT
|
cannam@154
|
348 maxcorr=1;
|
cannam@154
|
349 #endif
|
cannam@154
|
350 for (i=0;i<max_pitch>>1;i++)
|
cannam@154
|
351 {
|
cannam@154
|
352 opus_val32 sum;
|
cannam@154
|
353 xcorr[i] = 0;
|
cannam@154
|
354 if (abs(i-2*best_pitch[0])>2 && abs(i-2*best_pitch[1])>2)
|
cannam@154
|
355 continue;
|
cannam@154
|
356 #ifdef FIXED_POINT
|
cannam@154
|
357 sum = 0;
|
cannam@154
|
358 for (j=0;j<len>>1;j++)
|
cannam@154
|
359 sum += SHR32(MULT16_16(x_lp[j],y[i+j]), shift);
|
cannam@154
|
360 #else
|
cannam@154
|
361 sum = celt_inner_prod(x_lp, y+i, len>>1, arch);
|
cannam@154
|
362 #endif
|
cannam@154
|
363 xcorr[i] = MAX32(-1, sum);
|
cannam@154
|
364 #ifdef FIXED_POINT
|
cannam@154
|
365 maxcorr = MAX32(maxcorr, sum);
|
cannam@154
|
366 #endif
|
cannam@154
|
367 }
|
cannam@154
|
368 find_best_pitch(xcorr, y, len>>1, max_pitch>>1, best_pitch
|
cannam@154
|
369 #ifdef FIXED_POINT
|
cannam@154
|
370 , shift+1, maxcorr
|
cannam@154
|
371 #endif
|
cannam@154
|
372 );
|
cannam@154
|
373
|
cannam@154
|
374 /* Refine by pseudo-interpolation */
|
cannam@154
|
375 if (best_pitch[0]>0 && best_pitch[0]<(max_pitch>>1)-1)
|
cannam@154
|
376 {
|
cannam@154
|
377 opus_val32 a, b, c;
|
cannam@154
|
378 a = xcorr[best_pitch[0]-1];
|
cannam@154
|
379 b = xcorr[best_pitch[0]];
|
cannam@154
|
380 c = xcorr[best_pitch[0]+1];
|
cannam@154
|
381 if ((c-a) > MULT16_32_Q15(QCONST16(.7f,15),b-a))
|
cannam@154
|
382 offset = 1;
|
cannam@154
|
383 else if ((a-c) > MULT16_32_Q15(QCONST16(.7f,15),b-c))
|
cannam@154
|
384 offset = -1;
|
cannam@154
|
385 else
|
cannam@154
|
386 offset = 0;
|
cannam@154
|
387 } else {
|
cannam@154
|
388 offset = 0;
|
cannam@154
|
389 }
|
cannam@154
|
390 *pitch = 2*best_pitch[0]-offset;
|
cannam@154
|
391
|
cannam@154
|
392 RESTORE_STACK;
|
cannam@154
|
393 }
|
cannam@154
|
394
|
cannam@154
|
395 #ifdef FIXED_POINT
|
cannam@154
|
396 static opus_val16 compute_pitch_gain(opus_val32 xy, opus_val32 xx, opus_val32 yy)
|
cannam@154
|
397 {
|
cannam@154
|
398 opus_val32 x2y2;
|
cannam@154
|
399 int sx, sy, shift;
|
cannam@154
|
400 opus_val32 g;
|
cannam@154
|
401 opus_val16 den;
|
cannam@154
|
402 if (xy == 0 || xx == 0 || yy == 0)
|
cannam@154
|
403 return 0;
|
cannam@154
|
404 sx = celt_ilog2(xx)-14;
|
cannam@154
|
405 sy = celt_ilog2(yy)-14;
|
cannam@154
|
406 shift = sx + sy;
|
cannam@154
|
407 x2y2 = SHR32(MULT16_16(VSHR32(xx, sx), VSHR32(yy, sy)), 14);
|
cannam@154
|
408 if (shift & 1) {
|
cannam@154
|
409 if (x2y2 < 32768)
|
cannam@154
|
410 {
|
cannam@154
|
411 x2y2 <<= 1;
|
cannam@154
|
412 shift--;
|
cannam@154
|
413 } else {
|
cannam@154
|
414 x2y2 >>= 1;
|
cannam@154
|
415 shift++;
|
cannam@154
|
416 }
|
cannam@154
|
417 }
|
cannam@154
|
418 den = celt_rsqrt_norm(x2y2);
|
cannam@154
|
419 g = MULT16_32_Q15(den, xy);
|
cannam@154
|
420 g = VSHR32(g, (shift>>1)-1);
|
cannam@154
|
421 return EXTRACT16(MIN32(g, Q15ONE));
|
cannam@154
|
422 }
|
cannam@154
|
423 #else
|
cannam@154
|
424 static opus_val16 compute_pitch_gain(opus_val32 xy, opus_val32 xx, opus_val32 yy)
|
cannam@154
|
425 {
|
cannam@154
|
426 return xy/celt_sqrt(1+xx*yy);
|
cannam@154
|
427 }
|
cannam@154
|
428 #endif
|
cannam@154
|
429
|
cannam@154
|
430 static const int second_check[16] = {0, 0, 3, 2, 3, 2, 5, 2, 3, 2, 3, 2, 5, 2, 3, 2};
|
cannam@154
|
431 opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod,
|
cannam@154
|
432 int N, int *T0_, int prev_period, opus_val16 prev_gain, int arch)
|
cannam@154
|
433 {
|
cannam@154
|
434 int k, i, T, T0;
|
cannam@154
|
435 opus_val16 g, g0;
|
cannam@154
|
436 opus_val16 pg;
|
cannam@154
|
437 opus_val32 xy,xx,yy,xy2;
|
cannam@154
|
438 opus_val32 xcorr[3];
|
cannam@154
|
439 opus_val32 best_xy, best_yy;
|
cannam@154
|
440 int offset;
|
cannam@154
|
441 int minperiod0;
|
cannam@154
|
442 VARDECL(opus_val32, yy_lookup);
|
cannam@154
|
443 SAVE_STACK;
|
cannam@154
|
444
|
cannam@154
|
445 minperiod0 = minperiod;
|
cannam@154
|
446 maxperiod /= 2;
|
cannam@154
|
447 minperiod /= 2;
|
cannam@154
|
448 *T0_ /= 2;
|
cannam@154
|
449 prev_period /= 2;
|
cannam@154
|
450 N /= 2;
|
cannam@154
|
451 x += maxperiod;
|
cannam@154
|
452 if (*T0_>=maxperiod)
|
cannam@154
|
453 *T0_=maxperiod-1;
|
cannam@154
|
454
|
cannam@154
|
455 T = T0 = *T0_;
|
cannam@154
|
456 ALLOC(yy_lookup, maxperiod+1, opus_val32);
|
cannam@154
|
457 dual_inner_prod(x, x, x-T0, N, &xx, &xy, arch);
|
cannam@154
|
458 yy_lookup[0] = xx;
|
cannam@154
|
459 yy=xx;
|
cannam@154
|
460 for (i=1;i<=maxperiod;i++)
|
cannam@154
|
461 {
|
cannam@154
|
462 yy = yy+MULT16_16(x[-i],x[-i])-MULT16_16(x[N-i],x[N-i]);
|
cannam@154
|
463 yy_lookup[i] = MAX32(0, yy);
|
cannam@154
|
464 }
|
cannam@154
|
465 yy = yy_lookup[T0];
|
cannam@154
|
466 best_xy = xy;
|
cannam@154
|
467 best_yy = yy;
|
cannam@154
|
468 g = g0 = compute_pitch_gain(xy, xx, yy);
|
cannam@154
|
469 /* Look for any pitch at T/k */
|
cannam@154
|
470 for (k=2;k<=15;k++)
|
cannam@154
|
471 {
|
cannam@154
|
472 int T1, T1b;
|
cannam@154
|
473 opus_val16 g1;
|
cannam@154
|
474 opus_val16 cont=0;
|
cannam@154
|
475 opus_val16 thresh;
|
cannam@154
|
476 T1 = celt_udiv(2*T0+k, 2*k);
|
cannam@154
|
477 if (T1 < minperiod)
|
cannam@154
|
478 break;
|
cannam@154
|
479 /* Look for another strong correlation at T1b */
|
cannam@154
|
480 if (k==2)
|
cannam@154
|
481 {
|
cannam@154
|
482 if (T1+T0>maxperiod)
|
cannam@154
|
483 T1b = T0;
|
cannam@154
|
484 else
|
cannam@154
|
485 T1b = T0+T1;
|
cannam@154
|
486 } else
|
cannam@154
|
487 {
|
cannam@154
|
488 T1b = celt_udiv(2*second_check[k]*T0+k, 2*k);
|
cannam@154
|
489 }
|
cannam@154
|
490 dual_inner_prod(x, &x[-T1], &x[-T1b], N, &xy, &xy2, arch);
|
cannam@154
|
491 xy = HALF32(xy + xy2);
|
cannam@154
|
492 yy = HALF32(yy_lookup[T1] + yy_lookup[T1b]);
|
cannam@154
|
493 g1 = compute_pitch_gain(xy, xx, yy);
|
cannam@154
|
494 if (abs(T1-prev_period)<=1)
|
cannam@154
|
495 cont = prev_gain;
|
cannam@154
|
496 else if (abs(T1-prev_period)<=2 && 5*k*k < T0)
|
cannam@154
|
497 cont = HALF16(prev_gain);
|
cannam@154
|
498 else
|
cannam@154
|
499 cont = 0;
|
cannam@154
|
500 thresh = MAX16(QCONST16(.3f,15), MULT16_16_Q15(QCONST16(.7f,15),g0)-cont);
|
cannam@154
|
501 /* Bias against very high pitch (very short period) to avoid false-positives
|
cannam@154
|
502 due to short-term correlation */
|
cannam@154
|
503 if (T1<3*minperiod)
|
cannam@154
|
504 thresh = MAX16(QCONST16(.4f,15), MULT16_16_Q15(QCONST16(.85f,15),g0)-cont);
|
cannam@154
|
505 else if (T1<2*minperiod)
|
cannam@154
|
506 thresh = MAX16(QCONST16(.5f,15), MULT16_16_Q15(QCONST16(.9f,15),g0)-cont);
|
cannam@154
|
507 if (g1 > thresh)
|
cannam@154
|
508 {
|
cannam@154
|
509 best_xy = xy;
|
cannam@154
|
510 best_yy = yy;
|
cannam@154
|
511 T = T1;
|
cannam@154
|
512 g = g1;
|
cannam@154
|
513 }
|
cannam@154
|
514 }
|
cannam@154
|
515 best_xy = MAX32(0, best_xy);
|
cannam@154
|
516 if (best_yy <= best_xy)
|
cannam@154
|
517 pg = Q15ONE;
|
cannam@154
|
518 else
|
cannam@154
|
519 pg = SHR32(frac_div32(best_xy,best_yy+1),16);
|
cannam@154
|
520
|
cannam@154
|
521 for (k=0;k<3;k++)
|
cannam@154
|
522 xcorr[k] = celt_inner_prod(x, x-(T+k-1), N, arch);
|
cannam@154
|
523 if ((xcorr[2]-xcorr[0]) > MULT16_32_Q15(QCONST16(.7f,15),xcorr[1]-xcorr[0]))
|
cannam@154
|
524 offset = 1;
|
cannam@154
|
525 else if ((xcorr[0]-xcorr[2]) > MULT16_32_Q15(QCONST16(.7f,15),xcorr[1]-xcorr[2]))
|
cannam@154
|
526 offset = -1;
|
cannam@154
|
527 else
|
cannam@154
|
528 offset = 0;
|
cannam@154
|
529 if (pg > g)
|
cannam@154
|
530 pg = g;
|
cannam@154
|
531 *T0_ = 2*T+offset;
|
cannam@154
|
532
|
cannam@154
|
533 if (*T0_<minperiod0)
|
cannam@154
|
534 *T0_=minperiod0;
|
cannam@154
|
535 RESTORE_STACK;
|
cannam@154
|
536 return pg;
|
cannam@154
|
537 }
|