Blame - libcelt/vq.c - platform/external/libopus

blob: 009fcb7f9496d217bf21141061c6a25ba7b7d63c [file] [log] [blame]

Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	1	/* (C) 2007-2008 Jean-Marc Valin, CSIRO
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	2	*/
				3	/*
				4	Redistribution and use in source and binary forms, with or without
				5	modification, are permitted provided that the following conditions
				6	are met:
				7
				8	- Redistributions of source code must retain the above copyright
				9	notice, this list of conditions and the following disclaimer.
				10
				11	- Redistributions in binary form must reproduce the above copyright
				12	notice, this list of conditions and the following disclaimer in the
				13	documentation and/or other materials provided with the distribution.
				14
				15	- Neither the name of the Xiph.org Foundation nor the names of its
				16	contributors may be used to endorse or promote products derived from
				17	this software without specific prior written permission.
				18
				19	THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
				20	``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
				21	LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
				22	A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
				23	CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
				24	EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
				25	PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
				26	PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
				27	LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
				28	NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
				29	SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
				30	*/
				31
Jean-Marc Valin	02fa913	2008-02-20 12:09:29 +1100	[diff] [blame]	32	#ifdef HAVE_CONFIG_H
				33	#include "config.h"
				34	#endif
				35
Jean-Marc Valin	3ca9b1d	2008-02-27 23:50:31 +1100	[diff] [blame]	36	#include "mathops.h"
Jean-Marc Valin	29ccab8	2007-12-06 15:39:38 +1100	[diff] [blame]	37	#include "cwrs.h"
Jean-Marc Valin	9cace64	2007-12-06 17:44:09 +1100	[diff] [blame]	38	#include "vq.h"
Jean-Marc Valin	9a0bba1	2008-02-20 14:08:50 +1100	[diff] [blame]	39	#include "arch.h"
Jean-Marc Valin	b60340f	2008-02-26 15:41:51 +1100	[diff] [blame]	40	#include "os_support.h"
Jean-Marc Valin	164a229	2009-07-22 07:48:35 -0400	[diff] [blame]	41	#include "rate.h"
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	42
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	43	/** Takes the pitch vector and the decoded residual vector, computes the gain
				44	that will give ||p+g*y||=1 and mixes the residual with the pitch. */
Jean-Marc Valin	5de868c	2008-03-25 22:38:58 +1100	[diff] [blame]	45	static void mix_pitch_and_residual(int * restrict iy, celt_norm_t * restrict X, int N, int K, const celt_norm_t * restrict P)
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	46	{
				47	int i;
Jean-Marc Valin	b50c541	2008-02-27 17:05:43 +1100	[diff] [blame]	48	celt_word32_t Ryp, Ryy, Rpp;
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	49	celt_word16_t ryp, ryy, rpp;
Jean-Marc Valin	a847b77	2008-02-27 17:46:49 +1100	[diff] [blame]	50	celt_word32_t g;
Jean-Marc Valin	31b79d1	2008-03-12 17:17:23 +1100	[diff] [blame]	51	VARDECL(celt_norm_t, y);
Jean-Marc Valin	d9de593	2008-03-05 08:11:57 +1100	[diff] [blame]	52	#ifdef FIXED_POINT
				53	int yshift;
				54	#endif
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	55	SAVE_STACK;
Jean-Marc Valin	d17edd3	2008-02-27 16:52:30 +1100	[diff] [blame]	56	#ifdef FIXED_POINT
Jean-Marc Valin	98c86c7	2008-03-27 08:40:45 +1100	[diff] [blame]	57	yshift = 13-celt_ilog2(K);
Jean-Marc Valin	d17edd3	2008-02-27 16:52:30 +1100	[diff] [blame]	58	#endif
				59	ALLOC(y, N, celt_norm_t);
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	60
Jean-Marc Valin	b50c541	2008-02-27 17:05:43 +1100	[diff] [blame]	61	Rpp = 0;
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	62	i=0;
				63	do {
Jean-Marc Valin	b50c541	2008-02-27 17:05:43 +1100	[diff] [blame]	64	Rpp = MAC16_16(Rpp,P[i],P[i]);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	65	y[i] = SHL16(iy[i],yshift);
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	66	} while (++i < N);
				67
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	68	Ryp = 0;
Jean-Marc Valin	b50c541	2008-02-27 17:05:43 +1100	[diff] [blame]	69	Ryy = 0;
Jean-Marc Valin	df7ab43	2008-03-26 18:03:22 +1100	[diff] [blame]	70	/* If this doesn't generate a dual MAC (on supported archs), fire the compiler guy */
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	71	i=0;
				72	do {
Jean-Marc Valin	df7ab43	2008-03-26 18:03:22 +1100	[diff] [blame]	73	Ryp = MAC16_16(Ryp, y[i], P[i]);
				74	Ryy = MAC16_16(Ryy, y[i], y[i]);
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	75	} while (++i < N);
				76
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	77	ryp = ROUND16(Ryp,14);
				78	ryy = ROUND16(Ryy,14);
				79	rpp = ROUND16(Rpp,14);
Jean-Marc Valin	1ca0722	2008-02-27 17:23:04 +1100	[diff] [blame]	80	/* g = (sqrt(Ryp^2 + Ryy - Rpp*Ryy)-Ryp)/Ryy */
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	81	g = MULT16_32_Q15(celt_sqrt(MAC16_16(Ryy, ryp,ryp) - MULT16_16(ryy,rpp)) - ryp,
				82	celt_rcp(SHR32(Ryy,9)));
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	83
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	84	i=0;
				85	do
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	86	X[i] = ADD16(P[i], ROUND16(MULT16_16(y[i], g),11));
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	87	while (++i < N);
				88
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	89	RESTORE_STACK;
Jean-Marc Valin	d4018c3	2008-02-27 10:09:48 +1100	[diff] [blame]	90	}
				91
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	92
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	93	void alg_quant(celt_norm_t *X, celt_mask_t *W, int N, int K, celt_norm_t *P, ec_enc *enc)
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	94	{
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	95	VARDECL(celt_norm_t, y);
				96	VARDECL(int, iy);
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	97	VARDECL(celt_word16_t, signx);
Jean-Marc Valin	6ea8bae	2008-04-15 08:01:33 +1000	[diff] [blame]	98	int j, is;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	99	celt_word16_t s;
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	100	int pulsesLeft;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	101	celt_word32_t sum;
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	102	celt_word32_t xy, yy, yp;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	103	celt_word16_t Rpp;
Jean-Marc Valin	f958477	2008-03-27 12:22:44 +1100	[diff] [blame]	104	int N_1; /* Inverse of N, in Q14 format (even for float) */
Jean-Marc Valin	f675adc	2008-02-28 12:15:17 +1100	[diff] [blame]	105	#ifdef FIXED_POINT
Jean-Marc Valin	d748cd5	2008-03-01 07:27:03 +1100	[diff] [blame]	106	int yshift;
				107	#endif
				108	SAVE_STACK;
				109
Jean-Marc Valin	164a229	2009-07-22 07:48:35 -0400	[diff] [blame]	110	K = get_pulses(K);
Jean-Marc Valin	d748cd5	2008-03-01 07:27:03 +1100	[diff] [blame]	111	#ifdef FIXED_POINT
Jean-Marc Valin	98c86c7	2008-03-27 08:40:45 +1100	[diff] [blame]	112	yshift = 13-celt_ilog2(K);
Jean-Marc Valin	f675adc	2008-02-28 12:15:17 +1100	[diff] [blame]	113	#endif
Jean-Marc Valin	9d8d9b3	2008-02-27 16:17:39 +1100	[diff] [blame]	114
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	115	ALLOC(y, N, celt_norm_t);
				116	ALLOC(iy, N, int);
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	117	ALLOC(signx, N, celt_word16_t);
Jean-Marc Valin	124d1cd	2008-03-28 00:33:04 +1100	[diff] [blame]	118	N_1 = 512/N;
Jean-Marc Valin	3d152a5	2008-04-15 07:46:48 +1000	[diff] [blame]	119
				120	sum = 0;
Jean-Marc Valin	dff9b7e	2008-04-21 11:43:51 +1000	[diff] [blame]	121	j=0; do {
Jean-Marc Valin	bf2d648	2008-05-23 16:57:34 +1000	[diff] [blame]	122	X[j] -= P[j];
Jean-Marc Valin	4913438	2008-03-25 16:07:05 +1100	[diff] [blame]	123	if (X[j]>0)
				124	signx[j]=1;
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	125	else {
Jean-Marc Valin	4913438	2008-03-25 16:07:05 +1100	[diff] [blame]	126	signx[j]=-1;
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	127	X[j]=-X[j];
				128	P[j]=-P[j];
				129	}
Jean-Marc Valin	3d152a5	2008-04-15 07:46:48 +1000	[diff] [blame]	130	iy[j] = 0;
				131	y[j] = 0;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	132	sum = MAC16_16(sum, P[j],P[j]);
Jean-Marc Valin	dff9b7e	2008-04-21 11:43:51 +1000	[diff] [blame]	133	} while (++j<N);
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	134	Rpp = ROUND16(sum, NORM_SHIFT);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	135
Jean-Marc Valin	4ff068e	2008-03-15 23:34:39 +1100	[diff] [blame]	136	celt_assert2(Rpp<=NORM_SCALING, "Rpp should never have a norm greater than unity");
Jean-Marc Valin	b60340f	2008-02-26 15:41:51 +1100	[diff] [blame]	137
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	138	xy = yy = yp = 0;
Jean-Marc Valin	0d587d8	2008-02-14 21:29:50 +1100	[diff] [blame]	139
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	140	pulsesLeft = K;
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	141
				142	/* Do a pre-search by projecting on the pyramid */
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	143	if (K > (N>>1))
				144	{
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	145	celt_word16_t rcp;
Gregory Maxwell	61832f1	2008-12-22 18:15:42 -0500	[diff] [blame]	146	sum=0;
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	147	j=0; do {
				148	sum += X[j];
				149	} while (++j<N);
Jean-Marc Valin	6d454d8	2009-06-30 10:31:00 -0400	[diff] [blame]	150
				151	#ifdef FIXED_POINT
				152	if (sum <= K)
				153	#else
				154	if (sum <= EPSILON)
				155	#endif
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	156	{
Jean-Marc Valin	da1156a	2009-07-01 01:27:48 -0400	[diff] [blame]	157	X[0] = QCONST16(1.f,14);
Jean-Marc Valin	6d454d8	2009-06-30 10:31:00 -0400	[diff] [blame]	158	j=1; do
				159	X[j]=0;
				160	while (++j<N);
Jean-Marc Valin	da1156a	2009-07-01 01:27:48 -0400	[diff] [blame]	161	sum = QCONST16(1.f,14);
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	162	}
				163	/* Do we have sufficient accuracy here? */
				164	rcp = EXTRACT16(MULT16_32_Q16(K-1, celt_rcp(sum)));
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	165	j=0; do {
Jean-Marc Valin	09dc5a1	2008-12-05 00:28:28 -0500	[diff] [blame]	166	#ifdef FIXED_POINT
Jean-Marc Valin	137241d	2008-12-06 23:44:55 -0500	[diff] [blame]	167	/* It's really important to round towards zero here */
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	168	iy[j] = MULT16_16_Q15(X[j],rcp);
Jean-Marc Valin	09dc5a1	2008-12-05 00:28:28 -0500	[diff] [blame]	169	#else
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	170	iy[j] = floor(rcp*X[j]);
Jean-Marc Valin	09dc5a1	2008-12-05 00:28:28 -0500	[diff] [blame]	171	#endif
Jean-Marc Valin	c7635b4	2008-12-04 23:26:32 -0500	[diff] [blame]	172	y[j] = SHL16(iy[j],yshift);
				173	yy = MAC16_16(yy, y[j],y[j]);
				174	xy = MAC16_16(xy, X[j],y[j]);
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	175	yp += P[j]*y[j];
Jean-Marc Valin	09dc5a1	2008-12-05 00:28:28 -0500	[diff] [blame]	176	y[j] *= 2;
Jean-Marc Valin	a733f08	2008-12-04 22:52:26 -0500	[diff] [blame]	177	pulsesLeft -= iy[j];
				178	} while (++j<N);
				179	}
Jean-Marc Valin	137241d	2008-12-06 23:44:55 -0500	[diff] [blame]	180	celt_assert2(pulsesLeft>=1, "Allocated too many pulses in the quick pass");
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	181
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	182	while (pulsesLeft > 1)
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	183	{
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	184	int pulsesAtOnce=1;
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	185	int best_id;
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	186	celt_word16_t magnitude;
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	187	celt_word32_t best_num = -VERY_LARGE16;
				188	celt_word16_t best_den = 0;
Jean-Marc Valin	0bc5f7f	2008-04-20 17:16:18 +1000	[diff] [blame]	189	#ifdef FIXED_POINT
				190	int rshift;
				191	#endif
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	192	/* Decide on how many pulses to find at once */
Jean-Marc Valin	124d1cd	2008-03-28 00:33:04 +1100	[diff] [blame]	193	pulsesAtOnce = (pulsesLeft*N_1)>>9; /* pulsesLeft/N */
Jean-Marc Valin	cab576e	2008-02-12 17:21:14 +1100	[diff] [blame]	194	if (pulsesAtOnce<1)
				195	pulsesAtOnce = 1;
Jean-Marc Valin	0bc5f7f	2008-04-20 17:16:18 +1000	[diff] [blame]	196	#ifdef FIXED_POINT
				197	rshift = yshift+1+celt_ilog2(K-pulsesLeft+pulsesAtOnce);
				198	#endif
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	199	magnitude = SHL16(pulsesAtOnce, yshift);
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	200
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	201	best_id = 0;
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	202	/* The squared magnitude term gets added anyway, so we might as well
				203	add it outside the loop */
Jean-Marc Valin	1dab60c	2008-09-16 13:29:37 -0400	[diff] [blame]	204	yy = MAC16_16(yy, magnitude,magnitude);
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	205	/* Choose between fast and accurate strategy depending on where we are in the search */
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	206	/* This should ensure that anything we can process will have a better score */
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	207	j=0;
				208	do {
				209	celt_word16_t Rxy, Ryy;
				210	/* Select sign based on X[j] alone */
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	211	s = magnitude;
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	212	/* Temporary sums of the new pulse(s) */
				213	Rxy = EXTRACT16(SHR32(MAC16_16(xy, s,X[j]),rshift));
				214	/* We're multiplying y[j] by two so we don't have to do it here */
				215	Ryy = EXTRACT16(SHR32(MAC16_16(yy, s,y[j]),rshift));
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	216
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	217	/* Approximate score: we maximise Rxy/sqrt(Ryy) (we're guaranteed that
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	218	Rxy is positive because the sign is pre-computed) */
				219	Rxy = MULT16_16_Q15(Rxy,Rxy);
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	220	/* The idea is to check for num/den >= best_num/best_den, but that way
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	221	we can do it without any division */
				222	/* OPT: Make sure to use conditional moves here */
				223	if (MULT16_16(best_den, Rxy) > MULT16_16(Ryy, best_num))
				224	{
				225	best_den = Ryy;
				226	best_num = Rxy;
				227	best_id = j;
				228	}
				229	} while (++j<N);
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	230
Jean-Marc Valin	35a1f88	2008-03-26 10:34:23 +1100	[diff] [blame]	231	j = best_id;
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	232	is = pulsesAtOnce;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	233	s = SHL16(is, yshift);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	234
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	235	/* Updating the sums of the new pulse(s) */
				236	xy = xy + MULT16_16(s,X[j]);
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	237	/* We're multiplying y[j] by two so we don't have to do it here */
				238	yy = yy + MULT16_16(s,y[j]);
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	239	yp = yp + MULT16_16(s, P[j]);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	240
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	241	/* Only now that we've made the final choice, update y/iy */
Jean-Marc Valin	ed317c9	2008-04-15 17:31:23 +1000	[diff] [blame]	242	/* Multiplying y[j] by 2 so we don't have to do it everywhere else */
				243	y[j] += 2*s;
Jean-Marc Valin	44c6335	2008-03-25 21:28:40 +1100	[diff] [blame]	244	iy[j] += is;
Jean-Marc Valin	846d4e2	2008-02-12 13:48:48 +1100	[diff] [blame]	245	pulsesLeft -= pulsesAtOnce;
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	246	}
				247
Jean-Marc Valin	8256ed4	2008-12-12 20:50:56 -0500	[diff] [blame]	248	if (pulsesLeft > 0)
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	249	{
				250	celt_word16_t g;
				251	celt_word16_t best_num = -VERY_LARGE16;
				252	celt_word16_t best_den = 0;
				253	int best_id = 0;
Jean-Marc Valin	0ec7c14	2008-09-22 10:25:46 -0400	[diff] [blame]	254	celt_word16_t magnitude = SHL16(1, yshift);
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	255
				256	/* The squared magnitude term gets added anyway, so we might as well
				257	add it outside the loop */
Jean-Marc Valin	0ec7c14	2008-09-22 10:25:46 -0400	[diff] [blame]	258	yy = MAC16_16(yy, magnitude,magnitude);
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	259	j=0;
				260	do {
				261	celt_word16_t Rxy, Ryy, Ryp;
				262	celt_word16_t num;
				263	/* Select sign based on X[j] alone */
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	264	s = magnitude;
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	265	/* Temporary sums of the new pulse(s) */
				266	Rxy = ROUND16(MAC16_16(xy, s,X[j]), 14);
				267	/* We're multiplying y[j] by two so we don't have to do it here */
				268	Ryy = ROUND16(MAC16_16(yy, s,y[j]), 14);
				269	Ryp = ROUND16(MAC16_16(yp, s,P[j]), 14);
				270
				271	/* Compute the gain such that ||p + g*y|| = 1
				272	...but instead, we compute g*Ryy to avoid dividing */
				273	g = celt_psqrt(MULT16_16(Ryp,Ryp) + MULT16_16(Ryy,QCONST16(1.f,14)-Rpp)) - Ryp;
				274	/* Knowing that gain, what's the error: (x-g*y)^2
				275	(result is negated and we discard x^2 because it's constant) */
				276	/* score = 2*g*Rxy - g*g*Ryy;*/
				277	#ifdef FIXED_POINT
				278	/* No need to multiply Rxy by 2 because we did it earlier */
				279	num = MULT16_16_Q15(ADD16(SUB16(Rxy,g),Rxy),g);
				280	#else
				281	num = g*(2*Rxy-g);
				282	#endif
				283	if (MULT16_16(best_den, num) > MULT16_16(Ryy, best_num))
				284	{
				285	best_den = Ryy;
				286	best_num = num;
				287	best_id = j;
				288	}
				289	} while (++j<N);
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	290	iy[best_id] += 1;
Jean-Marc Valin	7bb339d	2008-09-21 21:11:39 -0400	[diff] [blame]	291	}
Jean-Marc Valin	6cde5dd	2008-12-04 21:21:41 -0500	[diff] [blame]	292	j=0;
				293	do {
				294	P[j] = MULT16_16(signx[j],P[j]);
				295	X[j] = MULT16_16(signx[j],X[j]);
				296	if (signx[j] < 0)
				297	iy[j] = -iy[j];
				298	} while (++j<N);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	299	encode_pulses(iy, N, K, enc);
Jean-Marc Valin	5fa5995	2008-02-14 13:50:44 +1100	[diff] [blame]	300
Jean-Marc Valin	a4833ff	2008-01-10 15:34:00 +1100	[diff] [blame]	301	/* Recompute the gain in one pass to reduce the encoder-decoder mismatch
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	302	due to the recursive computation used in quantisation. */
				303	mix_pitch_and_residual(iy, X, N, K, P);
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	304	RESTORE_STACK;
Jean-Marc Valin	41af421	2007-11-30 18:35:37 +1100	[diff] [blame]	305	}
				306
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	307
Jean-Marc Valin	879fbfd	2008-02-20 17:17:13 +1100	[diff] [blame]	308	/** Decode pulse vector and combine the result with the pitch vector to produce
				309	the final normalised signal in the current band. */
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	310	void alg_unquant(celt_norm_t *X, int N, int K, celt_norm_t *P, ec_dec *dec)
Jean-Marc Valin	0d227d8	2007-12-31 16:12:12 +1100	[diff] [blame]	311	{
Jean-Marc Valin	31b79d1	2008-03-12 17:17:23 +1100	[diff] [blame]	312	VARDECL(int, iy);
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	313	SAVE_STACK;
Jean-Marc Valin	164a229	2009-07-22 07:48:35 -0400	[diff] [blame]	314	K = get_pulses(K);
Jean-Marc Valin	9a0bba1	2008-02-20 14:08:50 +1100	[diff] [blame]	315	ALLOC(iy, N, int);
Jean-Marc Valin	5fa5995	2008-02-14 13:50:44 +1100	[diff] [blame]	316	decode_pulses(iy, N, K, dec);
Jean-Marc Valin	bd718ba	2008-03-25 14:15:41 +1100	[diff] [blame]	317	mix_pitch_and_residual(iy, X, N, K, P);
Jean-Marc Valin	8600f69	2008-02-29 15:14:12 +1100	[diff] [blame]	318	RESTORE_STACK;
Jean-Marc Valin	0d227d8	2007-12-31 16:12:12 +1100	[diff] [blame]	319	}
				320
Jean-Marc Valin	ca53b7c	2009-03-26 20:23:14 -0400	[diff] [blame]	321	celt_word16_t renormalise_vector(celt_norm_t *X, celt_word16_t value, int N, int stride)
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	322	{
				323	int i;
				324	celt_word32_t E = EPSILON;
Jean-Marc Valin	ca53b7c	2009-03-26 20:23:14 -0400	[diff] [blame]	325	celt_word16_t rE;
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	326	celt_word16_t g;
				327	celt_norm_t *xptr = X;
				328	for (i=0;i<N;i++)
				329	{
				330	E = MAC16_16(E, *xptr, *xptr);
				331	xptr += stride;
				332	}
				333
Jean-Marc Valin	ca53b7c	2009-03-26 20:23:14 -0400	[diff] [blame]	334	rE = celt_sqrt(E);
Jean-Marc Valin	cd29b02	2009-07-01 09:59:21 -0400	[diff] [blame]	335	#ifdef FIXED_POINT
				336	if (rE <= 128)
				337	g = Q15ONE;
				338	else
				339	#endif
				340	g = MULT16_16_Q15(value,celt_rcp(SHL32(rE,9)));
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	341	xptr = X;
				342	for (i=0;i<N;i++)
				343	{
				344	*xptr = PSHR32(MULT16_16(g, *xptr),8);
				345	xptr += stride;
				346	}
Jean-Marc Valin	ca53b7c	2009-03-26 20:23:14 -0400	[diff] [blame]	347	return rE;
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	348	}
				349
				350	static void fold(const CELTMode *m, int N, celt_norm_t *Y, celt_norm_t * restrict P, int N0, int B)
Jean-Marc Valin	4841a0a	2007-12-03 13:54:30 +1100	[diff] [blame]	351	{
Jean-Marc Valin	df38f2b	2008-07-20 20:36:54 -0400	[diff] [blame]	352	int j;
Jean-Marc Valin	ba11d78	2008-04-21 21:59:37 +1000	[diff] [blame]	353	const int C = CHANNELS(m);
Jean-Marc Valin	9edb7b4	2009-06-15 11:22:01 -0400	[diff] [blame]	354	int id = (N0*C) % (C*B);
Jean-Marc Valin	df38f2b	2008-07-20 20:36:54 -0400	[diff] [blame]	355	/* Here, we assume that id will never be greater than N0, i.e. that
Jean-Marc Valin	5eef264	2008-08-06 23:06:31 -0400	[diff] [blame]	356	no band is wider than N0. In the unlikely case it happens, we set
				357	everything to zero */
Jean-Marc Valin	4e5b7bc	2009-07-03 15:09:07 -0400	[diff] [blame]	358	/*{
				359	int offset = (N0*C - (id+C*N))/2;
				360	if (offset > C*N0/16)
				361	offset = C*N0/16;
				362	offset -= offset % (C*B);
				363	if (offset < 0)
				364	offset = 0;
				365	//printf ("%d\n", offset);
				366	id += offset;
				367	}*/
Jean-Marc Valin	9edb7b4	2009-06-15 11:22:01 -0400	[diff] [blame]	368	if (id+CN>N0C)
Jean-Marc Valin	5eef264	2008-08-06 23:06:31 -0400	[diff] [blame]	369	for (j=0;j<C*N;j++)
				370	P[j] = 0;
				371	else
				372	for (j=0;j<C*N;j++)
				373	P[j] = Y[id++];
Jean-Marc Valin	2c73306	2008-07-17 16:22:23 -0400	[diff] [blame]	374	}
				375
Jean-Marc Valin	798ab38	2009-07-12 20:41:29 -0400	[diff] [blame]	376	void intra_fold(const CELTMode *m, celt_norm_t * restrict x, int N, int *pulses, celt_norm_t *Y, celt_norm_t * restrict P, int N0, int B)
Jean-Marc Valin	2c73306	2008-07-17 16:22:23 -0400	[diff] [blame]	377	{
Jean-Marc Valin	798ab38	2009-07-12 20:41:29 -0400	[diff] [blame]	378	int c;
Jean-Marc Valin	9455d1b	2008-03-07 17:17:37 +1100	[diff] [blame]	379	celt_word16_t pred_gain;
Jean-Marc Valin	ba11d78	2008-04-21 21:59:37 +1000	[diff] [blame]	380	const int C = CHANNELS(m);
Jean-Marc Valin	896471d	2008-11-06 21:55:41 -0500	[diff] [blame]	381
Jean-Marc Valin	6361ad8	2008-07-20 23:14:31 -0400	[diff] [blame]	382	fold(m, N, Y, P, N0, B);
Jean-Marc Valin	798ab38	2009-07-12 20:41:29 -0400	[diff] [blame]	383	c=0;
				384	do {
Jean-Marc Valin	164a229	2009-07-22 07:48:35 -0400	[diff] [blame]	385	int K = get_pulses(pulses[c]);
Jean-Marc Valin	798ab38	2009-07-12 20:41:29 -0400	[diff] [blame]	386	if (K==0)
				387	pred_gain = Q15ONE;
				388	else
				389	pred_gain = celt_div((celt_word32_t)MULT16_16(Q15_ONE,N),(celt_word32_t)(N+2*K*(K+1)));
				390
				391	renormalise_vector(P+c, pred_gain, N, C);
				392	} while (++c < C);
Jean-Marc Valin	0e20ca0	2008-02-11 15:33:53 +1100	[diff] [blame]	393	}
				394