Blame - libcelt/vq.c - platform/external/libopus

blob: 1d14c2c17d44bad5254adcb8933b344210a8cbde [file] [log] [blame]

Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	1	/* (C) 2007-2008 Jean-Marc Valin, CSIRO
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	2	*/
				3	/*
				4	Redistribution and use in source and binary forms, with or without
				5	modification, are permitted provided that the following conditions
				6	are met:
				7
				8	- Redistributions of source code must retain the above copyright
				9	notice, this list of conditions and the following disclaimer.
				10
				11	- Redistributions in binary form must reproduce the above copyright
				12	notice, this list of conditions and the following disclaimer in the
				13	documentation and/or other materials provided with the distribution.
				14
				15	- Neither the name of the Xiph.org Foundation nor the names of its
				16	contributors may be used to endorse or promote products derived from
				17	this software without specific prior written permission.
				18
				19	THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
				20	``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
				21	LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
				22	A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
				23	CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
				24	EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
				25	PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
				26	PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
				27	LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
				28	NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
				29	SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
				30	*/
				31
Jean-Marc Valin	02fa913	2008-02-20 12:09:29 +1100	[diff] [blame]	32	#ifdef HAVE_CONFIG_H
				33	#include "config.h"
				34	#endif
				35
Jean-Marc Valin	3ca9b1d	2008-02-27 23:50:31 +1100	[diff] [blame]	36	#include "mathops.h"
Jean-Marc Valin	29ccab8	2007-12-06 15:39:38 +1100	[diff] [blame]	37	#include "cwrs.h"
Jean-Marc Valin	9cace64	2007-12-06 17:44:09 +1100	[diff] [blame]	38	#include "vq.h"
Jean-Marc Valin	9a0bba1	2008-02-20 14:08:50 +1100	[diff] [blame]	39	#include "arch.h"
Jean-Marc Valin	b60340f	2008-02-26 15:41:51 +1100	[diff] [blame]	40	#include "os_support.h"
Jean-Marc Valin	164a229	2009-07-22 07:48:35 -0400	[diff] [blame]	41	#include "rate.h"
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	42
Jean-Marc Valin	a7750b9	2009-08-29 22:52:03 +0100	[diff] [blame]	43	static void exp_rotation(celt_norm_t *X, int len, int dir, int stride, int K)
				44	{
				45	int i, k, iter;
				46	celt_word16_t c, s;
				47	celt_word16_t gain, theta;
				48	celt_norm_t *Xptr;
				49	gain = celt_div((celt_word32_t)MULT16_16(Q15_ONE,len),(celt_word32_t)(len+2K((K>>1)+1)));
				50	/* FIXME: Make that HALF16 instead of HALF32 */
				51	theta = SUB16(Q15ONE, HALF32(MULT16_16_Q15(gain,gain)));
				52	/*if (len==30)
				53	{
				54	for (i=0;i<len;i++)
				55	X[i] = 0;
				56	X[14] = 1;
				57	}*/
				58	c = celt_cos_norm(EXTEND32(theta));
				59	s = dircelt_cos_norm(EXTEND32(SUB16(Q15ONE,theta))); / sin(theta) */
				60	if (stride == 1)
				61	stride = 2;
				62	iter = 1;
				63	for (k=0;k<iter;k++)
				64	{
				65	/* We could use MULT16_16_P15 instead of MULT16_16_Q15 for more accuracy,
				66	but at this point, I really don't think it's necessary */
				67	Xptr = X;
				68	for (i=0;i<len-stride;i++)
				69	{
				70	celt_norm_t x1, x2;
				71	x1 = Xptr[0];
				72	x2 = Xptr[stride];
				73	Xptr[stride] = MULT16_16_Q15(c,x2) + MULT16_16_Q15(s,x1);
				74	*Xptr++ = MULT16_16_Q15(c,x1) - MULT16_16_Q15(s,x2);
				75	}
				76	Xptr = &X[len-2*stride-1];
				77	for (i=len-2*stride-1;i>=0;i--)
				78	{
				79	celt_norm_t x1, x2;
				80	x1 = Xptr[0];
				81	x2 = Xptr[stride];
				82	Xptr[stride] = MULT16_16_Q15(c,x2) + MULT16_16_Q15(s,x1);
				83	*Xptr-- = MULT16_16_Q15(c,x1) - MULT16_16_Q15(s,x2);
				84	}
				85	}
				86	/*if (len==30)
				87	{
				88	for (i=0;i<len;i++)
				89	printf ("%f ", X[i]);
				90	printf ("\n");
				91	exit(0);
				92	}*/
				93	}
				94
				95
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	96	/** Takes the pitch vector and the decoded residual vector, computes the gain
				97	that will give \|\|p+gy\|\|=1 and mixes the residual with the pitch. /
Jean-Marc Valin	5de868c	2008-03-25 22:38:58 +1100	[diff] [blame]	98	static void mix_pitch_and_residual(int * restrict iy, celt_norm_t * restrict X, int N, int K, const celt_norm_t * restrict P)
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	99	{
				100	int i;
Jean-Marc Valin	b50c541	2008-02-27 17:05:43 +1100	[diff] [blame]	101	celt_word32_t Ryp, Ryy, Rpp;
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	102	celt_word16_t ryp, ryy, rpp;
Jean-Marc Valin	a847b77	2008-02-27 17:46:49 +1100	[diff] [blame]	103	celt_word32_t g;
Jean-Marc Valin	31b79d1	2008-03-12 17:17:23 +1100	[diff] [blame]	104	VARDECL(celt_norm_t, y);
Jean-Marc Valin	d9de593	2008-03-05 08:11:57 +1100	[diff] [blame]	105	#ifdef FIXED_POINT
				106	int yshift;
				107	#endif
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	108	SAVE_STACK;
Jean-Marc Valin	d17edd3	2008-02-27 16:52:30 +1100	[diff] [blame]	109	#ifdef FIXED_POINT
Jean-Marc Valin	98c86c7	2008-03-27 08:40:45 +1100	[diff] [blame]	110	yshift = 13-celt_ilog2(K);
Jean-Marc Valin	d17edd3	2008-02-27 16:52:30 +1100	[diff] [blame]	111	#endif
				112	ALLOC(y, N, celt_norm_t);
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	113
Jean-Marc Valin	b50c541	2008-02-27 17:05:43 +1100	[diff] [blame]	114	Rpp = 0;
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	115	i=0;
				116	do {
Jean-Marc Valin	b50c541	2008-02-27 17:05:43 +1100	[diff] [blame]	117	Rpp = MAC16_16(Rpp,P[i],P[i]);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	118	y[i] = SHL16(iy[i],yshift);
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	119	} while (++i < N);
				120
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	121	Ryp = 0;
Jean-Marc Valin	b50c541	2008-02-27 17:05:43 +1100	[diff] [blame]	122	Ryy = 0;
Jean-Marc Valin	df7ab43	2008-03-26 18:03:22 +1100	[diff] [blame]	123	/* If this doesn't generate a dual MAC (on supported archs), fire the compiler guy */
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	124	i=0;
				125	do {
Jean-Marc Valin	df7ab43	2008-03-26 18:03:22 +1100	[diff] [blame]	126	Ryp = MAC16_16(Ryp, y[i], P[i]);
				127	Ryy = MAC16_16(Ryy, y[i], y[i]);
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	128	} while (++i < N);
				129
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	130	ryp = ROUND16(Ryp,14);
				131	ryy = ROUND16(Ryy,14);
				132	rpp = ROUND16(Rpp,14);
Jean-Marc Valin	1ca0722	2008-02-27 17:23:04 +1100	[diff] [blame]	133	/* g = (sqrt(Ryp^2 + Ryy - RppRyy)-Ryp)/Ryy /
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	134	g = MULT16_32_Q15(celt_sqrt(MAC16_16(Ryy, ryp,ryp) - MULT16_16(ryy,rpp)) - ryp,
				135	celt_rcp(SHR32(Ryy,9)));
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	136
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	137	i=0;
				138	do
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	139	X[i] = ADD16(P[i], ROUND16(MULT16_16(y[i], g),11));
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	140	while (++i < N);
				141
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	142	RESTORE_STACK;
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	143	}
				144
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	145
Jean-Marc Valin	a7750b9	2009-08-29 22:52:03 +0100	[diff] [blame]	146	void alg_quant(celt_norm_t X, celt_mask_t W, int N, int K, int spread, celt_norm_t P, ec_enc enc)
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	147	{
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	148	VARDECL(celt_norm_t, y);
				149	VARDECL(int, iy);
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	150	VARDECL(celt_word16_t, signx);
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	151	int j, is;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	152	celt_word16_t s;
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	153	int pulsesLeft;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	154	celt_word32_t sum;
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	155	celt_word32_t xy, yy, yp;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	156	celt_word16_t Rpp;
Jean-Marc Valin	f958477	2008-03-27 12:22:44 +1100	[diff] [blame]	157	int N_1; /* Inverse of N, in Q14 format (even for float) */
Jean-Marc Valin	f675adc	2008-02-28 12:15:17 +1100	[diff] [blame]	158	#ifdef FIXED_POINT
Jean-Marc Valin	d748cd5	2008-03-01 07:27:03 +1100	[diff] [blame]	159	int yshift;
				160	#endif
				161	SAVE_STACK;
				162
Jean-Marc Valin	164a229	2009-07-22 07:48:35 -0400	[diff] [blame]	163	K = get_pulses(K);
Jean-Marc Valin	d748cd5	2008-03-01 07:27:03 +1100	[diff] [blame]	164	#ifdef FIXED_POINT
Jean-Marc Valin	98c86c7	2008-03-27 08:40:45 +1100	[diff] [blame]	165	yshift = 13-celt_ilog2(K);
Jean-Marc Valin	f675adc	2008-02-28 12:15:17 +1100	[diff] [blame]	166	#endif
Jean-Marc Valin	9d8d9b3	2008-02-27 16:17:39 +1100	[diff] [blame]	167
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	168	ALLOC(y, N, celt_norm_t);
				169	ALLOC(iy, N, int);
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	170	ALLOC(signx, N, celt_word16_t);
Jean-Marc Valin	124d1cd	2008-03-28 00:33:04 +1100	[diff] [blame]	171	N_1 = 512/N;
Jean-Marc Valin	a7750b9	2009-08-29 22:52:03 +0100	[diff] [blame]	172
				173	if (spread)
				174	exp_rotation(X, N, 1, spread, K);
Jean-Marc Valin	3d152a5	2008-04-15 07:46:48 +1000	[diff] [blame]	175
				176	sum = 0;
Jean-Marc Valin	dff9b7e	2008-04-21 11:43:51 +1000	[diff] [blame]	177	j=0; do {
Jean-Marc Valin	bf2d648	2008-05-23 16:57:34 +1000	[diff] [blame]	178	X[j] -= P[j];
Jean-Marc Valin	4913438	2008-03-25 16:07:05 +1100	[diff] [blame]	179	if (X[j]>0)
				180	signx[j]=1;
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	181	else {
Jean-Marc Valin	4913438	2008-03-25 16:07:05 +1100	[diff] [blame]	182	signx[j]=-1;
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	183	X[j]=-X[j];
				184	P[j]=-P[j];
				185	}
Jean-Marc Valin	3d152a5	2008-04-15 07:46:48 +1000	[diff] [blame]	186	iy[j] = 0;
				187	y[j] = 0;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	188	sum = MAC16_16(sum, P[j],P[j]);
Jean-Marc Valin	dff9b7e	2008-04-21 11:43:51 +1000	[diff] [blame]	189	} while (++j<N);
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	190	Rpp = ROUND16(sum, NORM_SHIFT);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	191
Jean-Marc Valin	4ff068e	2008-03-15 23:34:39 +1100	[diff] [blame]	192	celt_assert2(Rpp<=NORM_SCALING, "Rpp should never have a norm greater than unity");
Jean-Marc Valin	b60340f	2008-02-26 15:41:51 +1100	[diff] [blame]	193
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	194	xy = yy = yp = 0;
Jean-Marc Valin	0d587d8	2008-02-14 21:29:50 +1100	[diff] [blame]	195
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	196	pulsesLeft = K;
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	197
				198	/* Do a pre-search by projecting on the pyramid */
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	199	if (K > (N>>1))
				200	{
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	201	celt_word16_t rcp;
Gregory Maxwell	61832f1	2008-12-22 18:15:42 -0500	[diff] [blame]	202	sum=0;
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	203	j=0; do {
				204	sum += X[j];
				205	} while (++j<N);
Jean-Marc Valin	6d454d8	2009-06-30 10:31:00 -0400	[diff] [blame]	206
				207	#ifdef FIXED_POINT
				208	if (sum <= K)
				209	#else
				210	if (sum <= EPSILON)
				211	#endif
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	212	{
Jean-Marc Valin	da1156a	2009-07-01 01:27:48 -0400	[diff] [blame]	213	X[0] = QCONST16(1.f,14);
Jean-Marc Valin	6d454d8	2009-06-30 10:31:00 -0400	[diff] [blame]	214	j=1; do
				215	X[j]=0;
				216	while (++j<N);
Jean-Marc Valin	da1156a	2009-07-01 01:27:48 -0400	[diff] [blame]	217	sum = QCONST16(1.f,14);
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	218	}
				219	/* Do we have sufficient accuracy here? */
				220	rcp = EXTRACT16(MULT16_32_Q16(K-1, celt_rcp(sum)));
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	221	j=0; do {
Jean-Marc Valin	09dc5a1	2008-12-05 00:28:28 -0500	[diff] [blame]	222	#ifdef FIXED_POINT
Jean-Marc Valin	137241d	2008-12-06 23:44:55 -0500	[diff] [blame]	223	/* It's really important to round towards zero here */
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	224	iy[j] = MULT16_16_Q15(X[j],rcp);
Jean-Marc Valin	09dc5a1	2008-12-05 00:28:28 -0500	[diff] [blame]	225	#else
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	226	iy[j] = floor(rcp*X[j]);
Jean-Marc Valin	09dc5a1	2008-12-05 00:28:28 -0500	[diff] [blame]	227	#endif
Jean-Marc Valin	c7635b4	2008-12-04 23:26:32 -0500	[diff] [blame]	228	y[j] = SHL16(iy[j],yshift);
				229	yy = MAC16_16(yy, y[j],y[j]);
				230	xy = MAC16_16(xy, X[j],y[j]);
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	231	yp += P[j]*y[j];
Jean-Marc Valin	09dc5a1	2008-12-05 00:28:28 -0500	[diff] [blame]	232	y[j] *= 2;
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	233	pulsesLeft -= iy[j];
				234	} while (++j<N);
				235	}
Jean-Marc Valin	137241d	2008-12-06 23:44:55 -0500	[diff] [blame]	236	celt_assert2(pulsesLeft>=1, "Allocated too many pulses in the quick pass");
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	237
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	238	while (pulsesLeft > 1)
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	239	{
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	240	int pulsesAtOnce=1;
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	241	int best_id;
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	242	celt_word16_t magnitude;
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	243	celt_word32_t best_num = -VERY_LARGE16;
				244	celt_word16_t best_den = 0;
Jean-Marc Valin	0bc5f7f	2008-04-20 17:16:18 +1000	[diff] [blame]	245	#ifdef FIXED_POINT
				246	int rshift;
				247	#endif
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	248	/* Decide on how many pulses to find at once */
Jean-Marc Valin	124d1cd	2008-03-28 00:33:04 +1100	[diff] [blame]	249	pulsesAtOnce = (pulsesLeftN_1)>>9; / pulsesLeft/N */
Jean-Marc Valin	cab576e	2008-02-12 17:21:14 +1100	[diff] [blame]	250	if (pulsesAtOnce<1)
				251	pulsesAtOnce = 1;
Jean-Marc Valin	0bc5f7f	2008-04-20 17:16:18 +1000	[diff] [blame]	252	#ifdef FIXED_POINT
				253	rshift = yshift+1+celt_ilog2(K-pulsesLeft+pulsesAtOnce);
				254	#endif
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	255	magnitude = SHL16(pulsesAtOnce, yshift);
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	256
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	257	best_id = 0;
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	258	/* The squared magnitude term gets added anyway, so we might as well
				259	add it outside the loop */
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	260	yy = MAC16_16(yy, magnitude,magnitude);
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	261	/* Choose between fast and accurate strategy depending on where we are in the search */
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	262	/* This should ensure that anything we can process will have a better score */
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	263	j=0;
				264	do {
				265	celt_word16_t Rxy, Ryy;
				266	/* Select sign based on X[j] alone */
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	267	s = magnitude;
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	268	/* Temporary sums of the new pulse(s) */
				269	Rxy = EXTRACT16(SHR32(MAC16_16(xy, s,X[j]),rshift));
				270	/* We're multiplying y[j] by two so we don't have to do it here */
				271	Ryy = EXTRACT16(SHR32(MAC16_16(yy, s,y[j]),rshift));
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	272
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	273	/* Approximate score: we maximise Rxy/sqrt(Ryy) (we're guaranteed that
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	274	Rxy is positive because the sign is pre-computed) */
				275	Rxy = MULT16_16_Q15(Rxy,Rxy);
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	276	/* The idea is to check for num/den >= best_num/best_den, but that way
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	277	we can do it without any division */
				278	/* OPT: Make sure to use conditional moves here */
				279	if (MULT16_16(best_den, Rxy) > MULT16_16(Ryy, best_num))
				280	{
				281	best_den = Ryy;
				282	best_num = Rxy;
				283	best_id = j;
				284	}
				285	} while (++j<N);
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	286
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	287	j = best_id;
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	288	is = pulsesAtOnce;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	289	s = SHL16(is, yshift);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	290
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	291	/* Updating the sums of the new pulse(s) */
				292	xy = xy + MULT16_16(s,X[j]);
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	293	/* We're multiplying y[j] by two so we don't have to do it here */
				294	yy = yy + MULT16_16(s,y[j]);
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	295	yp = yp + MULT16_16(s, P[j]);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	296
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	297	/* Only now that we've made the final choice, update y/iy */
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	298	/* Multiplying y[j] by 2 so we don't have to do it everywhere else */
				299	y[j] += 2*s;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	300	iy[j] += is;
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	301	pulsesLeft -= pulsesAtOnce;
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	302	}
				303
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	304	if (pulsesLeft > 0)
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	305	{
				306	celt_word16_t g;
				307	celt_word16_t best_num = -VERY_LARGE16;
				308	celt_word16_t best_den = 0;
				309	int best_id = 0;
Jean-Marc Valin	0ec7c14	2008-09-22 10:25:46 -0400	[diff] [blame]	310	celt_word16_t magnitude = SHL16(1, yshift);
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	311
				312	/* The squared magnitude term gets added anyway, so we might as well
				313	add it outside the loop */
Jean-Marc Valin	0ec7c14	2008-09-22 10:25:46 -0400	[diff] [blame]	314	yy = MAC16_16(yy, magnitude,magnitude);
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	315	j=0;
				316	do {
				317	celt_word16_t Rxy, Ryy, Ryp;
				318	celt_word16_t num;
				319	/* Select sign based on X[j] alone */
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	320	s = magnitude;
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	321	/* Temporary sums of the new pulse(s) */
				322	Rxy = ROUND16(MAC16_16(xy, s,X[j]), 14);
				323	/* We're multiplying y[j] by two so we don't have to do it here */
				324	Ryy = ROUND16(MAC16_16(yy, s,y[j]), 14);
				325	Ryp = ROUND16(MAC16_16(yp, s,P[j]), 14);
				326
				327	/* Compute the gain such that \|\|p + g*y\|\| = 1
				328	...but instead, we compute gRyy to avoid dividing /
				329	g = celt_psqrt(MULT16_16(Ryp,Ryp) + MULT16_16(Ryy,QCONST16(1.f,14)-Rpp)) - Ryp;
				330	/* Knowing that gain, what's the error: (x-g*y)^2
				331	(result is negated and we discard x^2 because it's constant) */
				332	/* score = 2gRxy - ggRyy;*/
				333	#ifdef FIXED_POINT
				334	/* No need to multiply Rxy by 2 because we did it earlier */
				335	num = MULT16_16_Q15(ADD16(SUB16(Rxy,g),Rxy),g);
				336	#else
				337	num = g(2Rxy-g);
				338	#endif
				339	if (MULT16_16(best_den, num) > MULT16_16(Ryy, best_num))
				340	{
				341	best_den = Ryy;
				342	best_num = num;
				343	best_id = j;
				344	}
				345	} while (++j<N);
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	346	iy[best_id] += 1;
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	347	}
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	348	j=0;
				349	do {
				350	P[j] = MULT16_16(signx[j],P[j]);
				351	X[j] = MULT16_16(signx[j],X[j]);
				352	if (signx[j] < 0)
				353	iy[j] = -iy[j];
				354	} while (++j<N);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	355	encode_pulses(iy, N, K, enc);
Jean-Marc Valin	5fa5995	2008-02-14 13:50:44 +1100	[diff] [blame]	356
Jean-Marc Valin	a4833ff	2008-01-10 15:34:00 +1100	[diff] [blame]	357	/* Recompute the gain in one pass to reduce the encoder-decoder mismatch
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	358	due to the recursive computation used in quantisation. */
				359	mix_pitch_and_residual(iy, X, N, K, P);
Jean-Marc Valin	a7750b9	2009-08-29 22:52:03 +0100	[diff] [blame]	360	if (spread)
				361	exp_rotation(X, N, -1, spread, K);
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	362	RESTORE_STACK;
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	363	}
				364
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	365
Jean-Marc Valin	879fbfd	2008-02-20 17:17:13 +1100	[diff] [blame]	366	/** Decode pulse vector and combine the result with the pitch vector to produce
				367	the final normalised signal in the current band. */
Jean-Marc Valin	a7750b9	2009-08-29 22:52:03 +0100	[diff] [blame]	368	void alg_unquant(celt_norm_t X, int N, int K, int spread, celt_norm_t P, ec_dec *dec)
Jean-Marc Valin	0d227d8	2007-12-31 16:12:12 +1100	[diff] [blame]	369	{
Jean-Marc Valin	31b79d1	2008-03-12 17:17:23 +1100	[diff] [blame]	370	VARDECL(int, iy);
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	371	SAVE_STACK;
Jean-Marc Valin	164a229	2009-07-22 07:48:35 -0400	[diff] [blame]	372	K = get_pulses(K);
Jean-Marc Valin	9a0bba1	2008-02-20 14:08:50 +1100	[diff] [blame]	373	ALLOC(iy, N, int);
Jean-Marc Valin	5fa5995	2008-02-14 13:50:44 +1100	[diff] [blame]	374	decode_pulses(iy, N, K, dec);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	375	mix_pitch_and_residual(iy, X, N, K, P);
Jean-Marc Valin	a7750b9	2009-08-29 22:52:03 +0100	[diff] [blame]	376	if (spread)
				377	exp_rotation(X, N, -1, spread, K);
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	378	RESTORE_STACK;
Jean-Marc Valin	0d227d8	2007-12-31 16:12:12 +1100	[diff] [blame]	379	}
				380
Jean-Marc Valin	ca53b7c	2009-03-26 20:23:14 -0400	[diff] [blame]	381	celt_word16_t renormalise_vector(celt_norm_t *X, celt_word16_t value, int N, int stride)
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	382	{
				383	int i;
				384	celt_word32_t E = EPSILON;
Jean-Marc Valin	ca53b7c	2009-03-26 20:23:14 -0400	[diff] [blame]	385	celt_word16_t rE;
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	386	celt_word16_t g;
				387	celt_norm_t *xptr = X;
				388	for (i=0;i<N;i++)
				389	{
				390	E = MAC16_16(E, xptr, xptr);
				391	xptr += stride;
				392	}
				393
Jean-Marc Valin	ca53b7c	2009-03-26 20:23:14 -0400	[diff] [blame]	394	rE = celt_sqrt(E);
Jean-Marc Valin	cd29b02	2009-07-01 09:59:21 -0400	[diff] [blame]	395	#ifdef FIXED_POINT
				396	if (rE <= 128)
				397	g = Q15ONE;
				398	else
				399	#endif
				400	g = MULT16_16_Q15(value,celt_rcp(SHL32(rE,9)));
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	401	xptr = X;
				402	for (i=0;i<N;i++)
				403	{
				404	xptr = PSHR32(MULT16_16(g, xptr),8);
				405	xptr += stride;
				406	}
Jean-Marc Valin	ca53b7c	2009-03-26 20:23:14 -0400	[diff] [blame]	407	return rE;
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	408	}
				409
				410	static void fold(const CELTMode m, int N, celt_norm_t Y, celt_norm_t * restrict P, int N0, int B)
Jean-Marc Valin	4841a0a	2007-12-03 13:54:30 +1100	[diff] [blame]	411	{
Jean-Marc Valin	df38f2b	2008-07-20 20:36:54 -0400	[diff] [blame]	412	int j;
Jean-Marc Valin	ba11d78	2008-04-21 21:59:37 +1000	[diff] [blame]	413	const int C = CHANNELS(m);
Jean-Marc Valin	9edb7b4	2009-06-15 11:22:01 -0400	[diff] [blame]	414	int id = (N0C) % (CB);
Jean-Marc Valin	df38f2b	2008-07-20 20:36:54 -0400	[diff] [blame]	415	/* Here, we assume that id will never be greater than N0, i.e. that
Jean-Marc Valin	5eef264	2008-08-06 23:06:31 -0400	[diff] [blame]	416	no band is wider than N0. In the unlikely case it happens, we set
				417	everything to zero */
Jean-Marc Valin	4e5b7bc	2009-07-03 15:09:07 -0400	[diff] [blame]	418	/*{
				419	int offset = (N0C - (id+CN))/2;
				420	if (offset > C*N0/16)
				421	offset = C*N0/16;
				422	offset -= offset % (C*B);
				423	if (offset < 0)
				424	offset = 0;
				425	//printf ("%d\n", offset);
				426	id += offset;
				427	}*/
Jean-Marc Valin	9edb7b4	2009-06-15 11:22:01 -0400	[diff] [blame]	428	if (id+CN>N0C)
Jean-Marc Valin	5eef264	2008-08-06 23:06:31 -0400	[diff] [blame]	429	for (j=0;j<C*N;j++)
				430	P[j] = 0;
				431	else
				432	for (j=0;j<C*N;j++)
				433	P[j] = Y[id++];
Jean-Marc Valin	2c73306	2008-07-17 16:22:23 -0400	[diff] [blame]	434	}
				435
Jean-Marc Valin	3aa3afe	2009-09-11 20:28:29 -0400	[diff] [blame]	436	void intra_fold(const CELTMode m, celt_norm_t restrict x, int N, celt_norm_t Y, celt_norm_t restrict P, int N0, int B)
Jean-Marc Valin	2c73306	2008-07-17 16:22:23 -0400	[diff] [blame]	437	{
Jean-Marc Valin	798ab38	2009-07-12 20:41:29 -0400	[diff] [blame]	438	int c;
Jean-Marc Valin	ba11d78	2008-04-21 21:59:37 +1000	[diff] [blame]	439	const int C = CHANNELS(m);
Jean-Marc Valin	896471d	2008-11-06 21:55:41 -0500	[diff] [blame]	440
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	441	fold(m, N, Y, P, N0, B);
Jean-Marc Valin	798ab38	2009-07-12 20:41:29 -0400	[diff] [blame]	442	c=0;
				443	do {
Jean-Marc Valin	3aa3afe	2009-09-11 20:28:29 -0400	[diff] [blame]	444	renormalise_vector(P+c, Q15ONE, N, C);
Jean-Marc Valin	798ab38	2009-07-12 20:41:29 -0400	[diff] [blame]	445	} while (++c < C);
Jean-Marc Valin	0e20ca0	2008-02-11 15:33:53 +1100	[diff] [blame]	446	}
				447