Jean-Marc Valin | 8b2ff0d | 2009-10-17 21:40:10 -0400 | [diff] [blame] | 1 | /* Copyright (c) 2007-2008 CSIRO |
| 2 | Copyright (c) 2007-2009 Xiph.Org Foundation |
| 3 | Written by Jean-Marc Valin */ |
Jean-Marc Valin | 14191b3 | 2007-11-30 12:15:49 +1100 | [diff] [blame] | 4 | /** |
| 5 | @file pitch.c |
| 6 | @brief Pitch analysis |
Jean-Marc Valin | 879fbfd | 2008-02-20 17:17:13 +1100 | [diff] [blame] | 7 | */ |
| 8 | |
| 9 | /* |
| 10 | Redistribution and use in source and binary forms, with or without |
| 11 | modification, are permitted provided that the following conditions |
| 12 | are met: |
Gregory Maxwell | 71d39ad | 2011-07-30 00:00:29 -0400 | [diff] [blame] | 13 | |
Jean-Marc Valin | 879fbfd | 2008-02-20 17:17:13 +1100 | [diff] [blame] | 14 | - Redistributions of source code must retain the above copyright |
| 15 | notice, this list of conditions and the following disclaimer. |
Gregory Maxwell | 71d39ad | 2011-07-30 00:00:29 -0400 | [diff] [blame] | 16 | |
Jean-Marc Valin | 879fbfd | 2008-02-20 17:17:13 +1100 | [diff] [blame] | 17 | - Redistributions in binary form must reproduce the above copyright |
| 18 | notice, this list of conditions and the following disclaimer in the |
| 19 | documentation and/or other materials provided with the distribution. |
Gregory Maxwell | 71d39ad | 2011-07-30 00:00:29 -0400 | [diff] [blame] | 20 | |
Jean-Marc Valin | 879fbfd | 2008-02-20 17:17:13 +1100 | [diff] [blame] | 21 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| 22 | ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| 23 | LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
Jean-Marc Valin | cb05e7c | 2012-04-20 16:40:24 -0400 | [diff] [blame] | 24 | A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER |
| 25 | OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
Jean-Marc Valin | 879fbfd | 2008-02-20 17:17:13 +1100 | [diff] [blame] | 26 | EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| 27 | PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
| 28 | PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF |
| 29 | LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING |
| 30 | NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
| 31 | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
Jean-Marc Valin | 14191b3 | 2007-11-30 12:15:49 +1100 | [diff] [blame] | 32 | */ |
| 33 | |
Jean-Marc Valin | 02fa913 | 2008-02-20 12:09:29 +1100 | [diff] [blame] | 34 | #ifdef HAVE_CONFIG_H |
| 35 | #include "config.h" |
| 36 | #endif |
Jean-Marc Valin | 14191b3 | 2007-11-30 12:15:49 +1100 | [diff] [blame] | 37 | |
Jean-Marc Valin | f3efa3e | 2007-12-01 01:55:17 +1100 | [diff] [blame] | 38 | #include "pitch.h" |
Jean-Marc Valin | f93747c | 2008-03-05 17:20:30 +1100 | [diff] [blame] | 39 | #include "os_support.h" |
Jean-Marc Valin | f11d6f4 | 2008-04-18 23:13:14 +1000 | [diff] [blame] | 40 | #include "modes.h" |
Jean-Marc Valin | c7e0b76 | 2008-03-16 07:55:29 +1100 | [diff] [blame] | 41 | #include "stack_alloc.h" |
Jean-Marc Valin | 9319e3e | 2009-11-09 13:51:54 +0900 | [diff] [blame] | 42 | #include "mathops.h" |
Jean-Marc Valin | 2779df7 | 2011-10-04 13:26:53 -0400 | [diff] [blame] | 43 | #include "celt_lpc.h" |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 44 | |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 45 | static void find_best_pitch(opus_val32 *xcorr, opus_val16 *y, int len, |
| 46 | int max_pitch, int *best_pitch |
| 47 | #ifdef FIXED_POINT |
| 48 | , int yshift, opus_val32 maxcorr |
| 49 | #endif |
| 50 | ) |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 51 | { |
| 52 | int i, j; |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 53 | opus_val32 Syy=1; |
| 54 | opus_val16 best_num[2]; |
| 55 | opus_val32 best_den[2]; |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 56 | #ifdef FIXED_POINT |
| 57 | int xshift; |
| 58 | |
| 59 | xshift = celt_ilog2(maxcorr)-14; |
| 60 | #endif |
| 61 | |
| 62 | best_num[0] = -1; |
| 63 | best_num[1] = -1; |
| 64 | best_den[0] = 0; |
| 65 | best_den[1] = 0; |
| 66 | best_pitch[0] = 0; |
| 67 | best_pitch[1] = 1; |
| 68 | for (j=0;j<len;j++) |
Jean-Marc Valin | 178758b | 2012-04-06 23:32:11 -0400 | [diff] [blame] | 69 | Syy = ADD32(Syy, SHR32(MULT16_16(y[j],y[j]), yshift)); |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 70 | for (i=0;i<max_pitch;i++) |
| 71 | { |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 72 | if (xcorr[i]>0) |
| 73 | { |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 74 | opus_val16 num; |
| 75 | opus_val32 xcorr16; |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 76 | xcorr16 = EXTRACT16(VSHR32(xcorr[i], xshift)); |
Jean-Marc Valin | 9faea25 | 2012-05-08 13:58:57 -0400 | [diff] [blame] | 77 | #ifndef FIXED_POINT |
| 78 | /* Considering the range of xcorr16, this should avoid both underflows |
| 79 | and overflows (inf) when squaring xcorr16 */ |
Ralph Giles | 027ec51 | 2012-10-23 10:49:18 -0700 | [diff] [blame] | 80 | xcorr16 *= 1e-12f; |
Jean-Marc Valin | 9faea25 | 2012-05-08 13:58:57 -0400 | [diff] [blame] | 81 | #endif |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 82 | num = MULT16_16_Q15(xcorr16,xcorr16); |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 83 | if (MULT16_32_Q15(num,best_den[1]) > MULT16_32_Q15(best_num[1],Syy)) |
| 84 | { |
| 85 | if (MULT16_32_Q15(num,best_den[0]) > MULT16_32_Q15(best_num[0],Syy)) |
| 86 | { |
| 87 | best_num[1] = best_num[0]; |
| 88 | best_den[1] = best_den[0]; |
| 89 | best_pitch[1] = best_pitch[0]; |
| 90 | best_num[0] = num; |
| 91 | best_den[0] = Syy; |
| 92 | best_pitch[0] = i; |
| 93 | } else { |
| 94 | best_num[1] = num; |
| 95 | best_den[1] = Syy; |
| 96 | best_pitch[1] = i; |
| 97 | } |
| 98 | } |
| 99 | } |
| 100 | Syy += SHR32(MULT16_16(y[i+len],y[i+len]),yshift) - SHR32(MULT16_16(y[i],y[i]),yshift); |
| 101 | Syy = MAX32(1, Syy); |
| 102 | } |
| 103 | } |
| 104 | |
Jean-Marc Valin | fbf9998 | 2013-05-24 17:18:41 -0400 | [diff] [blame] | 105 | static void celt_fir5(const opus_val16 *x, |
| 106 | const opus_val16 *num, |
| 107 | opus_val16 *y, |
| 108 | int N, |
| 109 | opus_val16 *mem) |
| 110 | { |
| 111 | int i; |
| 112 | opus_val16 num0, num1, num2, num3, num4; |
| 113 | opus_val32 mem0, mem1, mem2, mem3, mem4; |
| 114 | num0=num[0]; |
| 115 | num1=num[1]; |
| 116 | num2=num[2]; |
| 117 | num3=num[3]; |
| 118 | num4=num[4]; |
| 119 | mem0=mem[0]; |
| 120 | mem1=mem[1]; |
| 121 | mem2=mem[2]; |
| 122 | mem3=mem[3]; |
| 123 | mem4=mem[4]; |
| 124 | for (i=0;i<N;i++) |
| 125 | { |
| 126 | opus_val32 sum = SHL32(EXTEND32(x[i]), SIG_SHIFT); |
| 127 | sum = MAC16_16(sum,num0,mem0); |
| 128 | sum = MAC16_16(sum,num1,mem1); |
| 129 | sum = MAC16_16(sum,num2,mem2); |
| 130 | sum = MAC16_16(sum,num3,mem3); |
| 131 | sum = MAC16_16(sum,num4,mem4); |
| 132 | mem4 = mem3; |
| 133 | mem3 = mem2; |
| 134 | mem2 = mem1; |
| 135 | mem1 = mem0; |
| 136 | mem0 = x[i]; |
| 137 | y[i] = ROUND16(sum, SIG_SHIFT); |
| 138 | } |
| 139 | mem[0]=mem0; |
| 140 | mem[1]=mem1; |
| 141 | mem[2]=mem2; |
| 142 | mem[3]=mem3; |
| 143 | mem[4]=mem4; |
| 144 | } |
| 145 | |
| 146 | |
Gregory Maxwell | de0b532 | 2012-07-18 12:12:35 -0400 | [diff] [blame] | 147 | void pitch_downsample(celt_sig * OPUS_RESTRICT x[], opus_val16 * OPUS_RESTRICT x_lp, |
Ralph Giles | 120800f | 2011-11-25 13:02:00 -0800 | [diff] [blame] | 148 | int len, int C) |
Jean-Marc Valin | e465c14 | 2009-11-26 00:39:36 -0500 | [diff] [blame] | 149 | { |
| 150 | int i; |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 151 | opus_val32 ac[5]; |
| 152 | opus_val16 tmp=Q15ONE; |
Jean-Marc Valin | fbf9998 | 2013-05-24 17:18:41 -0400 | [diff] [blame] | 153 | opus_val16 lpc[4], mem[5]={0,0,0,0,0}; |
| 154 | opus_val16 lpc2[5]; |
| 155 | opus_val16 c1 = QCONST16(.8f,15); |
Jean-Marc Valin | 178758b | 2012-04-06 23:32:11 -0400 | [diff] [blame] | 156 | #ifdef FIXED_POINT |
| 157 | int shift; |
Jean-Marc Valin | 66ac102 | 2012-05-29 17:01:35 -0400 | [diff] [blame] | 158 | opus_val32 maxabs = celt_maxabs32(x[0], len); |
Jean-Marc Valin | 178758b | 2012-04-06 23:32:11 -0400 | [diff] [blame] | 159 | if (C==2) |
Jean-Marc Valin | 66ac102 | 2012-05-29 17:01:35 -0400 | [diff] [blame] | 160 | { |
| 161 | opus_val32 maxabs_1 = celt_maxabs32(x[1], len); |
| 162 | maxabs = MAX32(maxabs, maxabs_1); |
| 163 | } |
| 164 | if (maxabs<1) |
| 165 | maxabs=1; |
| 166 | shift = celt_ilog2(maxabs)-10; |
| 167 | if (shift<0) |
| 168 | shift=0; |
Jean-Marc Valin | 178758b | 2012-04-06 23:32:11 -0400 | [diff] [blame] | 169 | if (C==2) |
| 170 | shift++; |
| 171 | #endif |
Jean-Marc Valin | e465c14 | 2009-11-26 00:39:36 -0500 | [diff] [blame] | 172 | for (i=1;i<len>>1;i++) |
Jean-Marc Valin | 178758b | 2012-04-06 23:32:11 -0400 | [diff] [blame] | 173 | x_lp[i] = SHR32(HALF32(HALF32(x[0][(2*i-1)]+x[0][(2*i+1)])+x[0][2*i]), shift); |
| 174 | x_lp[0] = SHR32(HALF32(HALF32(x[0][1])+x[0][0]), shift); |
Jean-Marc Valin | e465c14 | 2009-11-26 00:39:36 -0500 | [diff] [blame] | 175 | if (C==2) |
| 176 | { |
| 177 | for (i=1;i<len>>1;i++) |
Jean-Marc Valin | 178758b | 2012-04-06 23:32:11 -0400 | [diff] [blame] | 178 | x_lp[i] += SHR32(HALF32(HALF32(x[1][(2*i-1)]+x[1][(2*i+1)])+x[1][2*i]), shift); |
| 179 | x_lp[0] += SHR32(HALF32(HALF32(x[1][1])+x[1][0]), shift); |
Jean-Marc Valin | e465c14 | 2009-11-26 00:39:36 -0500 | [diff] [blame] | 180 | } |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 181 | |
| 182 | _celt_autocorr(x_lp, ac, NULL, 0, |
| 183 | 4, len>>1); |
| 184 | |
| 185 | /* Noise floor -40 dB */ |
| 186 | #ifdef FIXED_POINT |
| 187 | ac[0] += SHR32(ac[0],13); |
| 188 | #else |
| 189 | ac[0] *= 1.0001f; |
| 190 | #endif |
| 191 | /* Lag windowing */ |
| 192 | for (i=1;i<=4;i++) |
| 193 | { |
| 194 | /*ac[i] *= exp(-.5*(2*M_PI*.002*i)*(2*M_PI*.002*i));*/ |
| 195 | #ifdef FIXED_POINT |
| 196 | ac[i] -= MULT16_32_Q15(2*i*i, ac[i]); |
| 197 | #else |
| 198 | ac[i] -= ac[i]*(.008f*i)*(.008f*i); |
| 199 | #endif |
| 200 | } |
| 201 | |
| 202 | _celt_lpc(lpc, ac, 4); |
| 203 | for (i=0;i<4;i++) |
| 204 | { |
| 205 | tmp = MULT16_16_Q15(QCONST16(.9f,15), tmp); |
| 206 | lpc[i] = MULT16_16_Q15(lpc[i], tmp); |
| 207 | } |
Jean-Marc Valin | fbf9998 | 2013-05-24 17:18:41 -0400 | [diff] [blame] | 208 | /* Add a zero */ |
| 209 | lpc2[0] = lpc[0] + QCONST16(.8f,SIG_SHIFT); |
| 210 | lpc2[1] = lpc[1] + MULT16_16_Q15(c1,lpc[0]); |
| 211 | lpc2[2] = lpc[2] + MULT16_16_Q15(c1,lpc[1]); |
| 212 | lpc2[3] = lpc[3] + MULT16_16_Q15(c1,lpc[2]); |
| 213 | lpc2[4] = MULT16_16_Q15(c1,lpc[3]); |
| 214 | celt_fir5(x_lp, lpc2, x_lp, len>>1, mem); |
Jean-Marc Valin | e465c14 | 2009-11-26 00:39:36 -0500 | [diff] [blame] | 215 | } |
| 216 | |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 217 | #if 0 /* This is a simple version of the pitch correlation that should work |
| 218 | well on DSPs like Blackfin and TI C5x/C6x */ |
| 219 | |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 220 | #ifdef FIXED_POINT |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 221 | opus_val32 |
| 222 | #else |
| 223 | void |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 224 | #endif |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 225 | pitch_xcorr(opus_val16 *x, opus_val16 *y, opus_val32 *xcorr, int len, int max_pitch) |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 226 | { |
| 227 | int i, j; |
| 228 | #ifdef FIXED_POINT |
Jean-Marc Valin | 088929d | 2013-05-24 01:38:06 -0400 | [diff] [blame] | 229 | opus_val32 maxcorr=1; |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 230 | #endif |
| 231 | for (i=0;i<max_pitch;i++) |
| 232 | { |
| 233 | opus_val32 sum = 0; |
| 234 | for (j=0;j<len;j++) |
| 235 | sum = MAC16_16(sum, x[j],y[i+j]); |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 236 | xcorr[i] = sum; |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 237 | #ifdef FIXED_POINT |
| 238 | maxcorr = MAX32(maxcorr, sum); |
| 239 | #endif |
| 240 | } |
| 241 | #ifdef FIXED_POINT |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 242 | return maxcorr; |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 243 | #endif |
| 244 | } |
| 245 | |
| 246 | #else /* Unrolled version of the pitch correlation -- runs faster on x86 and ARM */ |
| 247 | |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 248 | #ifdef FIXED_POINT |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 249 | opus_val32 |
| 250 | #else |
| 251 | void |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 252 | #endif |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 253 | pitch_xcorr(opus_val16 *_x, opus_val16 *_y, opus_val32 *xcorr, int len, int max_pitch) |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 254 | { |
| 255 | int i,j; |
| 256 | #ifdef FIXED_POINT |
Jean-Marc Valin | 088929d | 2013-05-24 01:38:06 -0400 | [diff] [blame] | 257 | opus_val32 maxcorr=1; |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 258 | #endif |
Jean-Marc Valin | 85a6618 | 2013-05-24 03:41:04 -0400 | [diff] [blame] | 259 | for (i=0;i<max_pitch-3;i+=4) |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 260 | { |
| 261 | /* Compute correlation*/ |
| 262 | /*corr[nb_pitch-1-i]=inner_prod(x, _y+i, len);*/ |
| 263 | opus_val32 sum1=0; |
| 264 | opus_val32 sum2=0; |
| 265 | opus_val32 sum3=0; |
| 266 | opus_val32 sum4=0; |
| 267 | const opus_val16 *y = _y+i; |
| 268 | const opus_val16 *x = _x; |
| 269 | opus_val16 y0, y1, y2, y3; |
| 270 | /*y0=y[0];y1=y[1];y2=y[2];y3=y[3];*/ |
| 271 | y0=*y++; |
| 272 | y1=*y++; |
| 273 | y2=*y++; |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 274 | for (j=0;j<len-3;j+=4) |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 275 | { |
| 276 | opus_val16 tmp; |
| 277 | tmp = *x++; |
| 278 | y3=*y++; |
| 279 | sum1 = MAC16_16(sum1,tmp,y0); |
| 280 | sum2 = MAC16_16(sum2,tmp,y1); |
| 281 | sum3 = MAC16_16(sum3,tmp,y2); |
| 282 | sum4 = MAC16_16(sum4,tmp,y3); |
| 283 | tmp=*x++; |
| 284 | y0=*y++; |
| 285 | sum1 = MAC16_16(sum1,tmp,y1); |
| 286 | sum2 = MAC16_16(sum2,tmp,y2); |
| 287 | sum3 = MAC16_16(sum3,tmp,y3); |
| 288 | sum4 = MAC16_16(sum4,tmp,y0); |
| 289 | tmp=*x++; |
| 290 | y1=*y++; |
| 291 | sum1 = MAC16_16(sum1,tmp,y2); |
| 292 | sum2 = MAC16_16(sum2,tmp,y3); |
| 293 | sum3 = MAC16_16(sum3,tmp,y0); |
| 294 | sum4 = MAC16_16(sum4,tmp,y1); |
| 295 | tmp=*x++; |
| 296 | y2=*y++; |
| 297 | sum1 = MAC16_16(sum1,tmp,y3); |
| 298 | sum2 = MAC16_16(sum2,tmp,y0); |
| 299 | sum3 = MAC16_16(sum3,tmp,y1); |
| 300 | sum4 = MAC16_16(sum4,tmp,y2); |
| 301 | } |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 302 | if (j++<len) |
| 303 | { |
| 304 | opus_val16 tmp = *x++; |
| 305 | y3=*y++; |
| 306 | sum1 = MAC16_16(sum1,tmp,y0); |
| 307 | sum2 = MAC16_16(sum2,tmp,y1); |
| 308 | sum3 = MAC16_16(sum3,tmp,y2); |
| 309 | sum4 = MAC16_16(sum4,tmp,y3); |
| 310 | } |
| 311 | if (j++<len) |
| 312 | { |
| 313 | opus_val16 tmp=*x++; |
| 314 | y0=*y++; |
| 315 | sum1 = MAC16_16(sum1,tmp,y1); |
| 316 | sum2 = MAC16_16(sum2,tmp,y2); |
| 317 | sum3 = MAC16_16(sum3,tmp,y3); |
| 318 | sum4 = MAC16_16(sum4,tmp,y0); |
| 319 | } |
| 320 | if (j<len) |
| 321 | { |
| 322 | opus_val16 tmp=*x++; |
| 323 | y1=*y++; |
| 324 | sum1 = MAC16_16(sum1,tmp,y2); |
| 325 | sum2 = MAC16_16(sum2,tmp,y3); |
| 326 | sum3 = MAC16_16(sum3,tmp,y0); |
| 327 | sum4 = MAC16_16(sum4,tmp,y1); |
| 328 | } |
| 329 | xcorr[i]=sum1; |
| 330 | xcorr[i+1]=sum2; |
| 331 | xcorr[i+2]=sum3; |
| 332 | xcorr[i+3]=sum4; |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 333 | #ifdef FIXED_POINT |
| 334 | sum1 = MAX32(sum1, sum2); |
| 335 | sum3 = MAX32(sum3, sum4); |
| 336 | sum1 = MAX32(sum1, sum3); |
| 337 | maxcorr = MAX32(maxcorr, sum1); |
| 338 | #endif |
| 339 | } |
Jean-Marc Valin | 85a6618 | 2013-05-24 03:41:04 -0400 | [diff] [blame] | 340 | /* In case max_pitch isn't a multiple of 4, do non-unrolled version. */ |
| 341 | for (;i<max_pitch;i++) |
| 342 | { |
| 343 | opus_val32 sum = 0; |
| 344 | for (j=0;j<len;j++) |
| 345 | sum = MAC16_16(sum, _x[j],_y[i+j]); |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 346 | xcorr[i] = sum; |
Jean-Marc Valin | 85a6618 | 2013-05-24 03:41:04 -0400 | [diff] [blame] | 347 | #ifdef FIXED_POINT |
| 348 | maxcorr = MAX32(maxcorr, sum); |
| 349 | #endif |
| 350 | } |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 351 | #ifdef FIXED_POINT |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 352 | return maxcorr; |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 353 | #endif |
| 354 | } |
| 355 | |
| 356 | #endif |
Gregory Maxwell | de0b532 | 2012-07-18 12:12:35 -0400 | [diff] [blame] | 357 | void pitch_search(const opus_val16 * OPUS_RESTRICT x_lp, opus_val16 * OPUS_RESTRICT y, |
Jean-Marc Valin | e3e2c26 | 2011-01-26 13:09:53 -0500 | [diff] [blame] | 358 | int len, int max_pitch, int *pitch) |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 359 | { |
| 360 | int i, j; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 361 | int lag; |
Gregory Maxwell | 06d57b2 | 2011-08-01 22:02:25 -0400 | [diff] [blame] | 362 | int best_pitch[2]={0,0}; |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 363 | VARDECL(opus_val16, x_lp4); |
| 364 | VARDECL(opus_val16, y_lp4); |
| 365 | VARDECL(opus_val32, xcorr); |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 366 | #ifdef FIXED_POINT |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 367 | opus_val32 maxcorr; |
Jean-Marc Valin | b7bd4c2 | 2013-05-18 23:33:48 -0400 | [diff] [blame] | 368 | opus_val32 xmax, ymax; |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 369 | int shift=0; |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 370 | #endif |
| 371 | int offset; |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 372 | |
Thorvald Natvig | 065dafd | 2009-11-25 01:02:42 +0100 | [diff] [blame] | 373 | SAVE_STACK; |
| 374 | |
Gregory Maxwell | 5d5875a | 2011-10-03 21:07:39 -0400 | [diff] [blame] | 375 | celt_assert(len>0); |
| 376 | celt_assert(max_pitch>0); |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 377 | lag = len+max_pitch; |
| 378 | |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 379 | ALLOC(x_lp4, len>>2, opus_val16); |
| 380 | ALLOC(y_lp4, lag>>2, opus_val16); |
| 381 | ALLOC(xcorr, max_pitch>>1, opus_val32); |
Thorvald Natvig | 065dafd | 2009-11-25 01:02:42 +0100 | [diff] [blame] | 382 | |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 383 | /* Downsample by 2 again */ |
| 384 | for (j=0;j<len>>2;j++) |
| 385 | x_lp4[j] = x_lp[2*j]; |
| 386 | for (j=0;j<lag>>2;j++) |
| 387 | y_lp4[j] = y[2*j]; |
| 388 | |
| 389 | #ifdef FIXED_POINT |
Jean-Marc Valin | 66ac102 | 2012-05-29 17:01:35 -0400 | [diff] [blame] | 390 | xmax = celt_maxabs16(x_lp4, len>>2); |
| 391 | ymax = celt_maxabs16(y_lp4, lag>>2); |
Jean-Marc Valin | b7bd4c2 | 2013-05-18 23:33:48 -0400 | [diff] [blame] | 392 | shift = celt_ilog2(MAX32(1, MAX32(xmax, ymax)))-11; |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 393 | if (shift>0) |
| 394 | { |
| 395 | for (j=0;j<len>>2;j++) |
| 396 | x_lp4[j] = SHR16(x_lp4[j], shift); |
| 397 | for (j=0;j<lag>>2;j++) |
| 398 | y_lp4[j] = SHR16(y_lp4[j], shift); |
| 399 | /* Use double the shift for a MAC */ |
| 400 | shift *= 2; |
| 401 | } else { |
| 402 | shift = 0; |
| 403 | } |
| 404 | #endif |
| 405 | |
| 406 | /* Coarse search with 4x decimation */ |
| 407 | |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 408 | #ifdef FIXED_POINT |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 409 | maxcorr = |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 410 | #endif |
Jean-Marc Valin | e8e57a3 | 2013-05-25 02:14:25 -0400 | [diff] [blame^] | 411 | pitch_xcorr(x_lp4, y_lp4, xcorr, len>>2, max_pitch>>2); |
Jean-Marc Valin | 559fbe8 | 2013-05-24 01:09:31 -0400 | [diff] [blame] | 412 | |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 413 | find_best_pitch(xcorr, y_lp4, len>>2, max_pitch>>2, best_pitch |
| 414 | #ifdef FIXED_POINT |
| 415 | , 0, maxcorr |
| 416 | #endif |
| 417 | ); |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 418 | |
| 419 | /* Finer search with 2x decimation */ |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 420 | #ifdef FIXED_POINT |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 421 | maxcorr=1; |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 422 | #endif |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 423 | for (i=0;i<max_pitch>>1;i++) |
| 424 | { |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 425 | opus_val32 sum=0; |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 426 | xcorr[i] = 0; |
| 427 | if (abs(i-2*best_pitch[0])>2 && abs(i-2*best_pitch[1])>2) |
| 428 | continue; |
| 429 | for (j=0;j<len>>1;j++) |
| 430 | sum += SHR32(MULT16_16(x_lp[j],y[i+j]), shift); |
| 431 | xcorr[i] = MAX32(-1, sum); |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 432 | #ifdef FIXED_POINT |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 433 | maxcorr = MAX32(maxcorr, sum); |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 434 | #endif |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 435 | } |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 436 | find_best_pitch(xcorr, y, len>>1, max_pitch>>1, best_pitch |
| 437 | #ifdef FIXED_POINT |
Jean-Marc Valin | 178758b | 2012-04-06 23:32:11 -0400 | [diff] [blame] | 438 | , shift+1, maxcorr |
Gregory Maxwell | 40f956e | 2011-09-01 19:42:37 -0400 | [diff] [blame] | 439 | #endif |
| 440 | ); |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 441 | |
| 442 | /* Refine by pseudo-interpolation */ |
| 443 | if (best_pitch[0]>0 && best_pitch[0]<(max_pitch>>1)-1) |
| 444 | { |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 445 | opus_val32 a, b, c; |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 446 | a = xcorr[best_pitch[0]-1]; |
| 447 | b = xcorr[best_pitch[0]]; |
| 448 | c = xcorr[best_pitch[0]+1]; |
| 449 | if ((c-a) > MULT16_32_Q15(QCONST16(.7f,15),b-a)) |
| 450 | offset = 1; |
| 451 | else if ((a-c) > MULT16_32_Q15(QCONST16(.7f,15),b-c)) |
| 452 | offset = -1; |
Gregory Maxwell | 71d39ad | 2011-07-30 00:00:29 -0400 | [diff] [blame] | 453 | else |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 454 | offset = 0; |
| 455 | } else { |
| 456 | offset = 0; |
| 457 | } |
| 458 | *pitch = 2*best_pitch[0]-offset; |
| 459 | |
Thorvald Natvig | 065dafd | 2009-11-25 01:02:42 +0100 | [diff] [blame] | 460 | RESTORE_STACK; |
Jean-Marc Valin | 294863b | 2009-11-08 22:29:54 +0900 | [diff] [blame] | 461 | } |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 462 | |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 463 | static const int second_check[16] = {0, 0, 3, 2, 3, 2, 5, 2, 3, 2, 3, 2, 5, 2, 3, 2}; |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 464 | opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod, |
Ralph Giles | 120800f | 2011-11-25 13:02:00 -0800 | [diff] [blame] | 465 | int N, int *T0_, int prev_period, opus_val16 prev_gain) |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 466 | { |
Gregory Maxwell | b8a6b31 | 2011-02-03 22:56:01 -0500 | [diff] [blame] | 467 | int k, i, T, T0; |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 468 | opus_val16 g, g0; |
| 469 | opus_val16 pg; |
| 470 | opus_val32 xy,xx,yy; |
| 471 | opus_val32 xcorr[3]; |
| 472 | opus_val32 best_xy, best_yy; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 473 | int offset; |
Jean-Marc Valin | d121260 | 2011-01-25 13:11:36 -0500 | [diff] [blame] | 474 | int minperiod0; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 475 | |
Jean-Marc Valin | d121260 | 2011-01-25 13:11:36 -0500 | [diff] [blame] | 476 | minperiod0 = minperiod; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 477 | maxperiod /= 2; |
| 478 | minperiod /= 2; |
Ralph Giles | 120800f | 2011-11-25 13:02:00 -0800 | [diff] [blame] | 479 | *T0_ /= 2; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 480 | prev_period /= 2; |
| 481 | N /= 2; |
| 482 | x += maxperiod; |
Ralph Giles | 120800f | 2011-11-25 13:02:00 -0800 | [diff] [blame] | 483 | if (*T0_>=maxperiod) |
| 484 | *T0_=maxperiod-1; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 485 | |
Ralph Giles | 120800f | 2011-11-25 13:02:00 -0800 | [diff] [blame] | 486 | T = T0 = *T0_; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 487 | xx=xy=yy=0; |
| 488 | for (i=0;i<N;i++) |
| 489 | { |
| 490 | xy = MAC16_16(xy, x[i], x[i-T0]); |
| 491 | xx = MAC16_16(xx, x[i], x[i]); |
| 492 | yy = MAC16_16(yy, x[i-T0],x[i-T0]); |
| 493 | } |
| 494 | best_xy = xy; |
| 495 | best_yy = yy; |
| 496 | #ifdef FIXED_POINT |
| 497 | { |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 498 | opus_val32 x2y2; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 499 | int sh, t; |
| 500 | x2y2 = 1+HALF32(MULT32_32_Q31(xx,yy)); |
| 501 | sh = celt_ilog2(x2y2)>>1; |
| 502 | t = VSHR32(x2y2, 2*(sh-7)); |
| 503 | g = g0 = VSHR32(MULT16_32_Q15(celt_rsqrt_norm(t), xy),sh+1); |
| 504 | } |
| 505 | #else |
Gregory Maxwell | 662587d | 2011-08-01 20:41:54 -0400 | [diff] [blame] | 506 | g = g0 = xy/celt_sqrt(1+xx*yy); |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 507 | #endif |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 508 | /* Look for any pitch at T/k */ |
| 509 | for (k=2;k<=15;k++) |
| 510 | { |
| 511 | int T1, T1b; |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 512 | opus_val16 g1; |
| 513 | opus_val16 cont=0; |
Jean-Marc Valin | 0892c16 | 2012-01-12 03:44:49 -0500 | [diff] [blame] | 514 | opus_val16 thresh; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 515 | T1 = (2*T0+k)/(2*k); |
| 516 | if (T1 < minperiod) |
| 517 | break; |
| 518 | /* Look for another strong correlation at T1b */ |
| 519 | if (k==2) |
| 520 | { |
| 521 | if (T1+T0>maxperiod) |
| 522 | T1b = T0; |
| 523 | else |
| 524 | T1b = T0+T1; |
| 525 | } else |
| 526 | { |
| 527 | T1b = (2*second_check[k]*T0+k)/(2*k); |
| 528 | } |
| 529 | xy=yy=0; |
| 530 | for (i=0;i<N;i++) |
| 531 | { |
| 532 | xy = MAC16_16(xy, x[i], x[i-T1]); |
| 533 | yy = MAC16_16(yy, x[i-T1], x[i-T1]); |
| 534 | |
| 535 | xy = MAC16_16(xy, x[i], x[i-T1b]); |
| 536 | yy = MAC16_16(yy, x[i-T1b], x[i-T1b]); |
| 537 | } |
| 538 | #ifdef FIXED_POINT |
| 539 | { |
Jean-Marc Valin | ff5f722 | 2011-07-29 18:59:12 -0400 | [diff] [blame] | 540 | opus_val32 x2y2; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 541 | int sh, t; |
| 542 | x2y2 = 1+MULT32_32_Q31(xx,yy); |
| 543 | sh = celt_ilog2(x2y2)>>1; |
| 544 | t = VSHR32(x2y2, 2*(sh-7)); |
| 545 | g1 = VSHR32(MULT16_32_Q15(celt_rsqrt_norm(t), xy),sh+1); |
| 546 | } |
| 547 | #else |
Gregory Maxwell | 662587d | 2011-08-01 20:41:54 -0400 | [diff] [blame] | 548 | g1 = xy/celt_sqrt(1+2.f*xx*1.f*yy); |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 549 | #endif |
| 550 | if (abs(T1-prev_period)<=1) |
| 551 | cont = prev_gain; |
| 552 | else if (abs(T1-prev_period)<=2 && 5*k*k < T0) |
| 553 | cont = HALF32(prev_gain); |
| 554 | else |
| 555 | cont = 0; |
Ralph Giles | 027ec51 | 2012-10-23 10:49:18 -0700 | [diff] [blame] | 556 | thresh = MAX16(QCONST16(.3f,15), MULT16_16_Q15(QCONST16(.7f,15),g0)-cont); |
Jean-Marc Valin | 0892c16 | 2012-01-12 03:44:49 -0500 | [diff] [blame] | 557 | /* Bias against very high pitch (very short period) to avoid false-positives |
| 558 | due to short-term correlation */ |
| 559 | if (T1<3*minperiod) |
Ralph Giles | 027ec51 | 2012-10-23 10:49:18 -0700 | [diff] [blame] | 560 | thresh = MAX16(QCONST16(.4f,15), MULT16_16_Q15(QCONST16(.85f,15),g0)-cont); |
Jean-Marc Valin | 0892c16 | 2012-01-12 03:44:49 -0500 | [diff] [blame] | 561 | else if (T1<2*minperiod) |
Ralph Giles | 027ec51 | 2012-10-23 10:49:18 -0700 | [diff] [blame] | 562 | thresh = MAX16(QCONST16(.5f,15), MULT16_16_Q15(QCONST16(.9f,15),g0)-cont); |
Jean-Marc Valin | 0892c16 | 2012-01-12 03:44:49 -0500 | [diff] [blame] | 563 | if (g1 > thresh) |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 564 | { |
| 565 | best_xy = xy; |
| 566 | best_yy = yy; |
| 567 | T = T1; |
| 568 | g = g1; |
| 569 | } |
| 570 | } |
Jean-Marc Valin | b3deb53 | 2012-04-24 17:00:54 -0400 | [diff] [blame] | 571 | best_xy = MAX32(0, best_xy); |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 572 | if (best_yy <= best_xy) |
| 573 | pg = Q15ONE; |
| 574 | else |
| 575 | pg = SHR32(frac_div32(best_xy,best_yy+1),16); |
| 576 | |
| 577 | for (k=0;k<3;k++) |
| 578 | { |
| 579 | int T1 = T+k-1; |
| 580 | xy = 0; |
| 581 | for (i=0;i<N;i++) |
| 582 | xy = MAC16_16(xy, x[i], x[i-T1]); |
| 583 | xcorr[k] = xy; |
| 584 | } |
| 585 | if ((xcorr[2]-xcorr[0]) > MULT16_32_Q15(QCONST16(.7f,15),xcorr[1]-xcorr[0])) |
| 586 | offset = 1; |
| 587 | else if ((xcorr[0]-xcorr[2]) > MULT16_32_Q15(QCONST16(.7f,15),xcorr[1]-xcorr[2])) |
| 588 | offset = -1; |
| 589 | else |
| 590 | offset = 0; |
| 591 | if (pg > g) |
| 592 | pg = g; |
Ralph Giles | 120800f | 2011-11-25 13:02:00 -0800 | [diff] [blame] | 593 | *T0_ = 2*T+offset; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 594 | |
Ralph Giles | 120800f | 2011-11-25 13:02:00 -0800 | [diff] [blame] | 595 | if (*T0_<minperiod0) |
| 596 | *T0_=minperiod0; |
Jean-Marc Valin | 35095c6 | 2010-11-04 13:24:44 -0400 | [diff] [blame] | 597 | return pg; |
| 598 | } |