2013-02-13 17:08:47 +00:00
|
|
|
/* (C) 2007-2008 Timothy B. Terriberry
|
|
|
|
(C) 2008 Jean-Marc Valin */
|
|
|
|
/*
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
|
|
modification, are permitted provided that the following conditions
|
|
|
|
are met:
|
|
|
|
|
|
|
|
- Redistributions of source code must retain the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer.
|
|
|
|
|
|
|
|
- Redistributions in binary form must reproduce the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer in the
|
|
|
|
documentation and/or other materials provided with the distribution.
|
|
|
|
|
|
|
|
- Neither the name of the Xiph.org Foundation nor the names of its
|
|
|
|
contributors may be used to endorse or promote products derived from
|
|
|
|
this software without specific prior written permission.
|
|
|
|
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
|
|
``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
|
|
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
|
|
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
|
|
|
|
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
|
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
|
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
|
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
|
|
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
|
|
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
|
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
|
|
#include "config.h"
|
|
|
|
#endif
|
|
|
|
|
2013-02-13 18:48:36 +00:00
|
|
|
#include "cc6_os_support.h"
|
2013-02-13 17:08:47 +00:00
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
2013-02-13 17:20:51 +00:00
|
|
|
#include "cc6_cwrs.h"
|
2013-02-13 18:48:36 +00:00
|
|
|
#include "cc6_mathops.h"
|
2013-02-13 17:08:47 +00:00
|
|
|
#include "cc6_arch.h"
|
|
|
|
|
|
|
|
/*Guaranteed to return a conservatively large estimate of the binary logarithm
|
|
|
|
with frac bits of fractional precision.
|
|
|
|
Tested for all possible 32-bit inputs with frac=4, where the maximum
|
|
|
|
overestimation is 0.06254243 bits.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
int cc6_log2_frac(cc6_ec_uint32 val, int frac)
|
2013-02-13 17:08:47 +00:00
|
|
|
{
|
|
|
|
int l;
|
2013-02-15 20:04:02 +00:00
|
|
|
l=cc6_EC_ILOG(val);
|
2013-02-13 17:08:47 +00:00
|
|
|
if(val&val-1){
|
|
|
|
/*This is (val>>l-16), but guaranteed to round up, even if adding a bias
|
|
|
|
before the shift would cause overflow (e.g., for 0xFFFFxxxx).*/
|
|
|
|
if(l>16)val=(val>>l-16)+((val&(1<<l-16)-1)+(1<<l-16)-1>>l-16);
|
|
|
|
else val<<=16-l;
|
|
|
|
l=l-1<<frac;
|
|
|
|
/*Note that we always need one iteration, since the rounding up above means
|
|
|
|
that we might need to adjust the integer part of the logarithm.*/
|
|
|
|
do{
|
|
|
|
int b;
|
|
|
|
b=(int)(val>>16);
|
|
|
|
l+=b<<frac;
|
|
|
|
val=val+b>>b;
|
|
|
|
val=val*val+0x7FFF>>15;
|
|
|
|
}
|
|
|
|
while(frac-->0);
|
|
|
|
/*If val is not exactly 0x8000, then we have to round up the remainder.*/
|
|
|
|
return l+(val>0x8000);
|
|
|
|
}
|
|
|
|
/*Exact powers of two require no rounding.*/
|
|
|
|
else return l-1<<frac;
|
|
|
|
}
|
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
#define cc6_MASK32 (0xFFFFFFFF)
|
2013-02-13 17:08:47 +00:00
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
/*cc6_INV_TABLE[i] holds the multiplicative inverse of (2*i+1) mod 2**32.*/
|
|
|
|
static const cc6_celt_uint32_t cc6_INV_TABLE[128]={
|
2013-02-13 17:08:47 +00:00
|
|
|
0x00000001,0xAAAAAAAB,0xCCCCCCCD,0xB6DB6DB7,
|
|
|
|
0x38E38E39,0xBA2E8BA3,0xC4EC4EC5,0xEEEEEEEF,
|
|
|
|
0xF0F0F0F1,0x286BCA1B,0x3CF3CF3D,0xE9BD37A7,
|
|
|
|
0xC28F5C29,0x684BDA13,0x4F72C235,0xBDEF7BDF,
|
|
|
|
0x3E0F83E1,0x8AF8AF8B,0x914C1BAD,0x96F96F97,
|
|
|
|
0xC18F9C19,0x2FA0BE83,0xA4FA4FA5,0x677D46CF,
|
|
|
|
0x1A1F58D1,0xFAFAFAFB,0x8C13521D,0x586FB587,
|
|
|
|
0xB823EE09,0xA08AD8F3,0xC10C9715,0xBEFBEFBF,
|
|
|
|
0xC0FC0FC1,0x07A44C6B,0xA33F128D,0xE327A977,
|
|
|
|
0xC7E3F1F9,0x962FC963,0x3F2B3885,0x613716AF,
|
|
|
|
0x781948B1,0x2B2E43DB,0xFCFCFCFD,0x6FD0EB67,
|
|
|
|
0xFA3F47E9,0xD2FD2FD3,0x3F4FD3F5,0xD4E25B9F,
|
|
|
|
0x5F02A3A1,0xBF5A814B,0x7C32B16D,0xD3431B57,
|
|
|
|
0xD8FD8FD9,0x8D28AC43,0xDA6C0965,0xDB195E8F,
|
|
|
|
0x0FDBC091,0x61F2A4BB,0xDCFDCFDD,0x46FDD947,
|
|
|
|
0x56BE69C9,0xEB2FDEB3,0x26E978D5,0xEFDFBF7F,
|
|
|
|
0x0FE03F81,0xC9484E2B,0xE133F84D,0xE1A8C537,
|
|
|
|
0x077975B9,0x70586723,0xCD29C245,0xFAA11E6F,
|
|
|
|
0x0FE3C071,0x08B51D9B,0x8CE2CABD,0xBF937F27,
|
|
|
|
0xA8FE53A9,0x592FE593,0x2C0685B5,0x2EB11B5F,
|
|
|
|
0xFCD1E361,0x451AB30B,0x72CFE72D,0xDB35A717,
|
|
|
|
0xFB74A399,0xE80BFA03,0x0D516325,0x1BCB564F,
|
|
|
|
0xE02E4851,0xD962AE7B,0x10F8ED9D,0x95AEDD07,
|
|
|
|
0xE9DC0589,0xA18A4473,0xEA53FA95,0xEE936F3F,
|
|
|
|
0x90948F41,0xEAFEAFEB,0x3D137E0D,0xEF46C0F7,
|
|
|
|
0x028C1979,0x791064E3,0xC04FEC05,0xE115062F,
|
|
|
|
0x32385831,0x6E68575B,0xA10D387D,0x6FECF2E7,
|
|
|
|
0x3FB47F69,0xED4BFB53,0x74FED775,0xDB43BB1F,
|
|
|
|
0x87654321,0x9BA144CB,0x478BBCED,0xBFB912D7,
|
|
|
|
0x1FDCD759,0x14B2A7C3,0xCB125CE5,0x437B2E0F,
|
|
|
|
0x10FEF011,0xD2B3183B,0x386CAB5D,0xEF6AC0C7,
|
|
|
|
0x0E64C149,0x9A020A33,0xE6B41C55,0xFEFEFEFF
|
|
|
|
};
|
|
|
|
|
|
|
|
/*Computes (_a*_b-_c)/(2*_d+1) when the quotient is known to be exact.
|
|
|
|
_a, _b, _c, and _d may be arbitrary so long as the arbitrary precision result
|
|
|
|
fits in 32 bits, but currently the table for multiplicative inverses is only
|
|
|
|
valid for _d<128.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_imusdiv32odd(cc6_celt_uint32_t _a,cc6_celt_uint32_t _b,
|
|
|
|
cc6_celt_uint32_t _c,int _d){
|
|
|
|
return (_a*_b-_c)*cc6_INV_TABLE[_d]&cc6_MASK32;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Computes (_a*_b-_c)/_d when the quotient is known to be exact.
|
2013-02-15 20:04:02 +00:00
|
|
|
_d does not actually have to be even, but cc6_imusdiv32odd will be faster when
|
2013-02-13 17:08:47 +00:00
|
|
|
it's odd, so you should use that instead.
|
|
|
|
_a and _d are assumed to be small (e.g., _a*_d fits in 32 bits; currently the
|
|
|
|
table for multiplicative inverses is only valid for _d<=256).
|
|
|
|
_b and _c may be arbitrary so long as the arbitrary precision reuslt fits in
|
|
|
|
32 bits.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_imusdiv32even(cc6_celt_uint32_t _a,cc6_celt_uint32_t _b,
|
|
|
|
cc6_celt_uint32_t _c,int _d){
|
|
|
|
cc6_celt_uint32_t inv;
|
2013-02-13 17:08:47 +00:00
|
|
|
int mask;
|
|
|
|
int shift;
|
|
|
|
int one;
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_assert(_d>0);
|
|
|
|
shift=cc6_EC_ILOG(_d^_d-1);
|
|
|
|
cc6_celt_assert(_d<=256);
|
|
|
|
inv=cc6_INV_TABLE[_d-1>>shift];
|
2013-02-13 17:08:47 +00:00
|
|
|
shift--;
|
|
|
|
one=1<<shift;
|
|
|
|
mask=one-1;
|
|
|
|
return (_a*(_b>>shift)-(_c>>shift)+
|
2013-02-15 20:04:02 +00:00
|
|
|
(_a*(_b&mask)+one-(_c&mask)>>shift)-1)*inv&cc6_MASK32;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute floor(sqrt(_val)) with exact arithmetic.
|
|
|
|
This has been tested on all possible 32-bit inputs.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static unsigned cc6_isqrt32(cc6_celt_uint32_t _val){
|
2013-02-13 17:08:47 +00:00
|
|
|
unsigned b;
|
|
|
|
unsigned g;
|
|
|
|
int bshift;
|
|
|
|
/*Uses the second method from
|
|
|
|
http://www.azillionmonkeys.com/qed/sqroot.html
|
|
|
|
The main idea is to search for the largest binary digit b such that
|
|
|
|
(g+b)*(g+b) <= _val, and add it to the solution g.*/
|
|
|
|
g=0;
|
2013-02-15 20:04:02 +00:00
|
|
|
bshift=cc6_EC_ILOG(_val)-1>>1;
|
2013-02-13 17:08:47 +00:00
|
|
|
b=1U<<bshift;
|
|
|
|
do{
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_uint32_t t;
|
|
|
|
t=((cc6_celt_uint32_t)g<<1)+b<<bshift;
|
2013-02-13 17:08:47 +00:00
|
|
|
if(t<=_val){
|
|
|
|
g+=b;
|
|
|
|
_val-=t;
|
|
|
|
}
|
|
|
|
b>>=1;
|
|
|
|
bshift--;
|
|
|
|
}
|
|
|
|
while(bshift>=0);
|
|
|
|
return g;
|
|
|
|
}
|
|
|
|
|
|
|
|
#if 0
/*Compute floor(sqrt(_val)) with exact arithmetic.
  This has been tested on all possible 36-bit inputs.
  The five most significant result bits are resolved with 64-bit arithmetic;
   what is left of _val is then narrowed to 32 bits for the remaining bits.
  _val: The value to take the square root of.
  Return: The integer square root.*/
static cc6_celt_uint32_t isqrt36(cc6_celt_uint64_t _val){
  cc6_celt_uint32_t rem32;
  cc6_celt_uint32_t bit;
  cc6_celt_uint32_t root;
  int               sh;
  root=0;
  bit=0x20000;
  for(sh=17;sh>=13;sh--){
    cc6_celt_uint64_t t;
    t=(((cc6_celt_uint64_t)root<<1)+bit)<<sh;
    if(t<=_val){
      root+=bit;
      _val-=t;
    }
    bit>>=1;
  }
  /*sh is 12 here, matching the current value of bit (1<<12).*/
  rem32=(cc6_celt_uint32_t)_val;
  for(;sh>=0;sh--){
    cc6_celt_uint32_t t;
    t=((root<<1)+bit)<<sh;
    if(t<=rem32){
      root+=bit;
      rem32-=t;
    }
    bit>>=1;
  }
  return root;
}
#endif
|
|
|
|
|
|
|
|
/*Although derived separately, the pulse vector coding scheme is equivalent to
|
|
|
|
a Pyramid Vector Quantizer \cite{Fis86}.
|
|
|
|
Some additional notes about an early version appear at
|
|
|
|
http://people.xiph.org/~tterribe/notes/cwrs.html, but the codebook ordering
|
|
|
|
and the definitions of some terms have evolved since that was written.
|
|
|
|
|
|
|
|
The conversion from a pulse vector to an integer index (encoding) and back
|
|
|
|
(decoding) is governed by two related functions, V(N,K) and U(N,K).
|
|
|
|
|
|
|
|
V(N,K) = the number of combinations, with replacement, of N items, taken K
|
|
|
|
at a time, when a sign bit is added to each item taken at least once (i.e.,
|
|
|
|
the number of N-dimensional unit pulse vectors with K pulses).
|
|
|
|
One way to compute this is via
|
|
|
|
V(N,K) = K>0 ? sum(k=1...K,2**k*choose(N,k)*choose(K-1,k-1)) : 1,
|
|
|
|
where choose() is the binomial function.
|
|
|
|
A table of values for N<10 and K<10 looks like:
|
|
|
|
V[10][10] = {
|
|
|
|
{1, 0, 0, 0, 0, 0, 0, 0, 0, 0},
|
|
|
|
{1, 2, 2, 2, 2, 2, 2, 2, 2, 2},
|
|
|
|
{1, 4, 8, 12, 16, 20, 24, 28, 32, 36},
|
|
|
|
{1, 6, 18, 38, 66, 102, 146, 198, 258, 326},
|
|
|
|
{1, 8, 32, 88, 192, 360, 608, 952, 1408, 1992},
|
|
|
|
{1, 10, 50, 170, 450, 1002, 1970, 3530, 5890, 9290},
|
|
|
|
{1, 12, 72, 292, 912, 2364, 5336, 10836, 20256, 35436},
|
|
|
|
{1, 14, 98, 462, 1666, 4942, 12642, 28814, 59906, 115598},
|
|
|
|
{1, 16, 128, 688, 2816, 9424, 27008, 68464, 157184, 332688},
|
|
|
|
{1, 18, 162, 978, 4482, 16722, 53154, 148626, 374274, 864146}
|
|
|
|
};
|
|
|
|
|
|
|
|
U(N,K) = the number of such combinations wherein N-1 objects are taken at
|
|
|
|
most K-1 at a time.
|
|
|
|
This is given by
|
|
|
|
U(N,K) = sum(k=0...K-1,V(N-1,k))
|
|
|
|
= K>0 ? (V(N-1,K-1) + V(N,K-1))/2 : 0.
|
|
|
|
The latter expression also makes clear that U(N,K) is half the number of such
|
|
|
|
combinations wherein the first object is taken at least once.
|
|
|
|
Although it may not be clear from either of these definitions, U(N,K) is the
|
|
|
|
natural function to work with when enumerating the pulse vector codebooks,
|
|
|
|
not V(N,K).
|
|
|
|
U(N,K) is not well-defined for N=0, but with the extension
|
|
|
|
U(0,K) = K>0 ? 0 : 1,
|
|
|
|
the function becomes symmetric: U(N,K) = U(K,N), with a similar table:
|
|
|
|
U[10][10] = {
|
|
|
|
{1, 0, 0, 0, 0, 0, 0, 0, 0, 0},
|
|
|
|
{0, 1, 1, 1, 1, 1, 1, 1, 1, 1},
|
|
|
|
{0, 1, 3, 5, 7, 9, 11, 13, 15, 17},
|
|
|
|
{0, 1, 5, 13, 25, 41, 61, 85, 113, 145},
|
|
|
|
{0, 1, 7, 25, 63, 129, 231, 377, 575, 833},
|
|
|
|
{0, 1, 9, 41, 129, 321, 681, 1289, 2241, 3649},
|
|
|
|
{0, 1, 11, 61, 231, 681, 1683, 3653, 7183, 13073},
|
|
|
|
{0, 1, 13, 85, 377, 1289, 3653, 8989, 19825, 40081},
|
|
|
|
{0, 1, 15, 113, 575, 2241, 7183, 19825, 48639, 108545},
|
|
|
|
{0, 1, 17, 145, 833, 3649, 13073, 40081, 108545, 265729}
|
|
|
|
};
|
|
|
|
|
|
|
|
With this extension, V(N,K) may be written in terms of U(N,K):
|
|
|
|
V(N,K) = U(N,K) + U(N,K+1)
|
|
|
|
for all N>=0, K>=0.
|
|
|
|
Thus U(N,K+1) represents the number of combinations where the first element
|
|
|
|
is positive or zero, and U(N,K) represents the number of combinations where
|
|
|
|
it is negative.
|
|
|
|
With a large enough table of U(N,K) values, we could write O(N) encoding
|
|
|
|
and O(min(N*log(K),N+K)) decoding routines, but such a table would be
|
|
|
|
prohibitively large for small embedded devices (K may be as large as 32767
|
|
|
|
for small N, and N may be as large as 200).
|
|
|
|
|
|
|
|
Both functions obey the same recurrence relation:
|
|
|
|
V(N,K) = V(N-1,K) + V(N,K-1) + V(N-1,K-1),
|
|
|
|
U(N,K) = U(N-1,K) + U(N,K-1) + U(N-1,K-1),
|
|
|
|
for all N>0, K>0, with different initial conditions at N=0 or K=0.
|
|
|
|
This allows us to construct a row of one of the tables above given the
|
|
|
|
previous row or the next row.
|
|
|
|
Thus we can derive O(NK) encoding and decoding routines with O(K) memory
|
|
|
|
using only addition and subtraction.
|
|
|
|
|
|
|
|
When encoding, we build up from the U(2,K) row and work our way forwards.
|
|
|
|
When decoding, we need to start at the U(N,K) row and work our way backwards,
|
|
|
|
which requires a means of computing U(N,K).
|
|
|
|
U(N,K) may be computed from two previous values with the same N:
|
|
|
|
U(N,K) = ((2*N-1)*U(N,K-1) - U(N,K-2))/(K-1) + U(N,K-2)
|
|
|
|
for all N>1, and since U(N,K) is symmetric, a similar relation holds for two
|
|
|
|
previous values with the same K:
|
|
|
|
U(N,K>1) = ((2*K-1)*U(N-1,K) - U(N-2,K))/(N-1) + U(N-2,K)
|
|
|
|
for all K>1.
|
|
|
|
This allows us to construct an arbitrary row of the U(N,K) table by starting
|
|
|
|
with the first two values, which are constants.
|
|
|
|
This saves roughly 2/3 the work in our O(NK) decoding routine, but costs O(K)
|
|
|
|
multiplications.
|
|
|
|
Similar relations can be derived for V(N,K), but are not used here.
|
|
|
|
|
|
|
|
For N>0 and K>0, U(N,K) and V(N,K) take on the form of an (N-1)-degree
|
|
|
|
polynomial for fixed N.
|
|
|
|
The first few are
|
|
|
|
U(1,K) = 1,
|
|
|
|
U(2,K) = 2*K-1,
|
|
|
|
U(3,K) = (2*K-2)*K+1,
|
|
|
|
U(4,K) = (((4*K-6)*K+8)*K-3)/3,
|
|
|
|
U(5,K) = ((((2*K-4)*K+10)*K-8)*K+3)/3,
|
|
|
|
and
|
|
|
|
V(1,K) = 2,
|
|
|
|
V(2,K) = 4*K,
|
|
|
|
V(3,K) = 4*K*K+2,
|
|
|
|
V(4,K) = 8*(K*K+2)*K/3,
|
|
|
|
V(5,K) = ((4*K*K+20)*K*K+6)/3,
|
|
|
|
for all K>0.
|
|
|
|
This allows us to derive O(N) encoding and O(N*log(K)) decoding routines for
|
|
|
|
small N (and indeed decoding is also O(N) for N<3).
|
|
|
|
|
|
|
|
@ARTICLE{Fis86,
|
|
|
|
author="Thomas R. Fischer",
|
|
|
|
title="A Pyramid Vector Quantizer",
|
|
|
|
journal="IEEE Transactions on Information Theory",
|
|
|
|
volume="IT-32",
|
|
|
|
number=4,
|
|
|
|
pages="568--583",
|
|
|
|
month=Jul,
|
|
|
|
year=1986
|
|
|
|
}*/
|
|
|
|
|
|
|
|
/*Determines if V(N,K) fits in a 32-bit unsigned integer.
|
|
|
|
N and K are themselves limited to 15 bits.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
int cc6_fits_in32(int _n, int _k)
|
2013-02-13 17:08:47 +00:00
|
|
|
{
|
2013-02-15 20:04:02 +00:00
|
|
|
static const cc6_celt_int16_t maxN[15] = {
|
2013-02-13 17:08:47 +00:00
|
|
|
32767, 32767, 32767, 1476, 283, 109, 60, 40,
|
|
|
|
29, 24, 20, 18, 16, 14, 13};
|
2013-02-15 20:04:02 +00:00
|
|
|
static const cc6_celt_int16_t maxK[15] = {
|
2013-02-13 17:08:47 +00:00
|
|
|
32767, 32767, 32767, 32767, 1172, 238, 95, 53,
|
|
|
|
36, 27, 22, 18, 16, 15, 13};
|
|
|
|
if (_n>=14)
|
|
|
|
{
|
|
|
|
if (_k>=14)
|
|
|
|
return 0;
|
|
|
|
else
|
|
|
|
return _n <= maxN[_k];
|
|
|
|
} else {
|
|
|
|
return _k <= maxK[_n];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute U(1,_k), which is 0 for _k==0 and 1 for every other _k.*/
static __inline unsigned cc6_ucwrs1(int _k){
  return _k!=0;
}
|
|
|
|
|
|
|
|
/*Compute V(1,_k), which is 1 for _k==0 and 2 for every other _k.*/
static __inline unsigned cc6_ncwrs1(int _k){
  if(_k==0)return 1;
  return 2;
}
|
|
|
|
|
|
|
|
/*Compute U(2,_k), i.e., 2*_k-1 for _k>0 and 0 for _k==0.
  Note that this may be called with _k=32768 (maxK[2]+1).*/
static __inline unsigned cc6_ucwrs2(unsigned _k){
  if(_k==0)return 0;
  return 2*_k-1;
}
|
|
|
|
|
|
|
|
/*Compute V(2,_k).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_ncwrs2(int _k){
|
|
|
|
return _k?4*(cc6_celt_uint32_t)_k:1;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute U(3,_k).
|
|
|
|
Note that this may be called with _k=32768 (maxK[3]+1).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_ucwrs3(unsigned _k){
|
|
|
|
return _k?(2*(cc6_celt_uint32_t)_k-2)*_k+1:0;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute V(3,_k).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_ncwrs3(int _k){
|
|
|
|
return _k?2*(2*(unsigned)_k*(cc6_celt_uint32_t)_k+1):1;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute U(4,_k).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_ucwrs4(int _k){
|
|
|
|
return _k?cc6_imusdiv32odd(2*_k,(2*_k-3)*(cc6_celt_uint32_t)_k+4,3,1):0;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute V(4,_k).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_ncwrs4(int _k){
|
|
|
|
return _k?((_k*(cc6_celt_uint32_t)_k+2)*_k)/3<<3:1;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute U(5,_k).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_ucwrs5(int _k){
|
|
|
|
return _k?(((((_k-2)*(unsigned)_k+5)*(cc6_celt_uint32_t)_k-4)*_k)/3<<1)+1:0;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute V(5,_k).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_ncwrs5(int _k){
|
|
|
|
return _k?(((_k*(unsigned)_k+5)*(cc6_celt_uint32_t)_k*_k)/3<<2)+2:1;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Computes the next row/column of any recurrence that obeys the relation
|
|
|
|
u[i][j]=u[i-1][j]+u[i][j-1]+u[i-1][j-1].
|
|
|
|
_ui0 is the base case for the new row/column.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline void cc6_unext(cc6_celt_uint32_t *_ui,unsigned _len,cc6_celt_uint32_t _ui0){
|
|
|
|
cc6_celt_uint32_t ui1;
|
2013-02-13 17:08:47 +00:00
|
|
|
unsigned j;
|
|
|
|
/*This do-while will overrun the array if we don't have storage for at least
|
|
|
|
2 values.*/
|
|
|
|
j=1; do {
|
2013-02-15 20:04:02 +00:00
|
|
|
ui1=cc6_UADD32(cc6_UADD32(_ui[j],_ui[j-1]),_ui0);
|
2013-02-13 17:08:47 +00:00
|
|
|
_ui[j-1]=_ui0;
|
|
|
|
_ui0=ui1;
|
|
|
|
} while (++j<_len);
|
|
|
|
_ui[j-1]=_ui0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Computes the previous row/column of any recurrence that obeys the relation
|
|
|
|
u[i-1][j]=u[i][j]-u[i][j-1]-u[i-1][j-1].
|
|
|
|
_ui0 is the base case for the new row/column.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline void cc6_uprev(cc6_celt_uint32_t *_ui,unsigned _n,cc6_celt_uint32_t _ui0){
|
|
|
|
cc6_celt_uint32_t ui1;
|
2013-02-13 17:08:47 +00:00
|
|
|
unsigned j;
|
|
|
|
/*This do-while will overrun the array if we don't have storage for at least
|
|
|
|
2 values.*/
|
|
|
|
j=1; do {
|
2013-02-15 20:04:02 +00:00
|
|
|
ui1=cc6_USUB32(cc6_USUB32(_ui[j],_ui[j-1]),_ui0);
|
2013-02-13 17:08:47 +00:00
|
|
|
_ui[j-1]=_ui0;
|
|
|
|
_ui0=ui1;
|
|
|
|
} while (++j<_n);
|
|
|
|
_ui[j-1]=_ui0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Compute V(_n,_k), as well as U(_n,0..._k+1).
|
|
|
|
_u: On exit, _u[i] contains U(_n,i) for i in [0..._k+1].*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static cc6_celt_uint32_t cc6_ncwrs_urow(unsigned _n,unsigned _k,cc6_celt_uint32_t *_u){
|
|
|
|
cc6_celt_uint32_t um2;
|
2013-02-13 17:08:47 +00:00
|
|
|
unsigned len;
|
|
|
|
unsigned k;
|
|
|
|
len=_k+2;
|
|
|
|
/*We require storage at least 3 values (e.g., _k>0).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_assert(len>=3);
|
2013-02-13 17:08:47 +00:00
|
|
|
_u[0]=0;
|
|
|
|
_u[1]=um2=1;
|
|
|
|
if(_n<=6 || _k>255){
|
|
|
|
/*If _n==0, _u[0] should be 1 and the rest should be 0.*/
|
|
|
|
/*If _n==1, _u[i] should be 1 for i>1.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_assert(_n>=2);
|
2013-02-13 17:08:47 +00:00
|
|
|
/*If _k==0, the following do-while loop will overflow the buffer.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_assert(_k>0);
|
2013-02-13 17:08:47 +00:00
|
|
|
k=2;
|
|
|
|
do _u[k]=(k<<1)-1;
|
|
|
|
while(++k<len);
|
2013-02-15 20:04:02 +00:00
|
|
|
for(k=2;k<_n;k++)cc6_unext(_u+1,_k+1,1);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
else{
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_uint32_t um1;
|
|
|
|
cc6_celt_uint32_t n2m1;
|
2013-02-13 17:08:47 +00:00
|
|
|
_u[2]=n2m1=um1=(_n<<1)-1;
|
|
|
|
for(k=3;k<len;k++){
|
|
|
|
/*U(N,K) = ((2*N-1)*U(N,K-1)-U(N,K-2))/(K-1) + U(N,K-2)*/
|
2013-02-15 20:04:02 +00:00
|
|
|
_u[k]=um2=cc6_imusdiv32even(n2m1,um1,um2,k-1)+um2;
|
2013-02-13 17:08:47 +00:00
|
|
|
if(++k>=len)break;
|
2013-02-15 20:04:02 +00:00
|
|
|
_u[k]=um1=cc6_imusdiv32odd(n2m1,um2,um1,k-1>>1)+um1;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return _u[_k]+_u[_k+1];
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/*Returns the _i'th combination of _k elements (at most 32767) chosen from a
|
|
|
|
set of size 1 with associated sign bits.
|
|
|
|
_y: Returns the vector of pulses.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline void cc6_cwrsi1(int _k,cc6_celt_uint32_t _i,int *_y){
|
2013-02-13 17:08:47 +00:00
|
|
|
int s;
|
|
|
|
s=-(int)_i;
|
|
|
|
_y[0]=_k+s^s;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the _i'th combination of _k elements (at most 32767) chosen from a
|
|
|
|
set of size 2 with associated sign bits.
|
|
|
|
_y: Returns the vector of pulses.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline void cc6_cwrsi2(int _k,cc6_celt_uint32_t _i,int *_y){
|
|
|
|
cc6_celt_uint32_t p;
|
2013-02-13 17:08:47 +00:00
|
|
|
int s;
|
|
|
|
int yj;
|
2013-02-15 20:04:02 +00:00
|
|
|
p=cc6_ucwrs2(_k+1U);
|
2013-02-13 17:08:47 +00:00
|
|
|
s=-(_i>=p);
|
|
|
|
_i-=p&s;
|
|
|
|
yj=_k;
|
|
|
|
_k=_i+1>>1;
|
2013-02-15 20:04:02 +00:00
|
|
|
p=cc6_ucwrs2(_k);
|
2013-02-13 17:08:47 +00:00
|
|
|
_i-=p;
|
|
|
|
yj-=_k;
|
|
|
|
_y[0]=yj+s^s;
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_cwrsi1(_k,_i,_y+1);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the _i'th combination of _k elements (at most 32767) chosen from a
|
|
|
|
set of size 3 with associated sign bits.
|
|
|
|
_y: Returns the vector of pulses.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static void cc6_cwrsi3(int _k,cc6_celt_uint32_t _i,int *_y){
|
|
|
|
cc6_celt_uint32_t p;
|
2013-02-13 17:08:47 +00:00
|
|
|
int s;
|
|
|
|
int yj;
|
2013-02-15 20:04:02 +00:00
|
|
|
p=cc6_ucwrs3(_k+1U);
|
2013-02-13 17:08:47 +00:00
|
|
|
s=-(_i>=p);
|
|
|
|
_i-=p&s;
|
|
|
|
yj=_k;
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Finds the maximum _k such that cc6_ucwrs3(_k)<=_i (tested for all
|
2013-02-13 17:08:47 +00:00
|
|
|
_i<2147418113=U(3,32768)).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
_k=_i>0?cc6_isqrt32(2*_i-1)+1>>1:0;
|
|
|
|
p=cc6_ucwrs3(_k);
|
2013-02-13 17:08:47 +00:00
|
|
|
_i-=p;
|
|
|
|
yj-=_k;
|
|
|
|
_y[0]=yj+s^s;
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_cwrsi2(_k,_i,_y+1);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the _i'th combination of _k elements (at most 1172) chosen from a set
|
|
|
|
of size 4 with associated sign bits.
|
|
|
|
_y: Returns the vector of pulses.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static void cc6_cwrsi4(int _k,cc6_celt_uint32_t _i,int *_y){
|
|
|
|
cc6_celt_uint32_t p;
|
2013-02-13 17:08:47 +00:00
|
|
|
int s;
|
|
|
|
int yj;
|
|
|
|
int kl;
|
|
|
|
int kr;
|
2013-02-15 20:04:02 +00:00
|
|
|
p=cc6_ucwrs4(_k+1);
|
2013-02-13 17:08:47 +00:00
|
|
|
s=-(_i>=p);
|
|
|
|
_i-=p&s;
|
|
|
|
yj=_k;
|
|
|
|
/*We could solve a cubic for k here, but the form of the direct solution does
|
|
|
|
not lend itself well to exact integer arithmetic.
|
|
|
|
Instead we do a binary search on U(4,K).*/
|
|
|
|
kl=0;
|
|
|
|
kr=_k;
|
|
|
|
for(;;){
|
|
|
|
_k=kl+kr>>1;
|
2013-02-15 20:04:02 +00:00
|
|
|
p=cc6_ucwrs4(_k);
|
2013-02-13 17:08:47 +00:00
|
|
|
if(p<_i){
|
|
|
|
if(_k>=kr)break;
|
|
|
|
kl=_k+1;
|
|
|
|
}
|
|
|
|
else if(p>_i)kr=_k-1;
|
|
|
|
else break;
|
|
|
|
}
|
|
|
|
_i-=p;
|
|
|
|
yj-=_k;
|
|
|
|
_y[0]=yj+s^s;
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_cwrsi3(_k,_i,_y+1);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the _i'th combination of _k elements (at most 238) chosen from a set
|
|
|
|
of size 5 with associated sign bits.
|
|
|
|
_y: Returns the vector of pulses.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static void cc6_cwrsi5(int _k,cc6_celt_uint32_t _i,int *_y){
|
|
|
|
cc6_celt_uint32_t p;
|
2013-02-13 17:08:47 +00:00
|
|
|
int s;
|
|
|
|
int yj;
|
2013-02-15 20:04:02 +00:00
|
|
|
p=cc6_ucwrs5(_k+1);
|
2013-02-13 17:08:47 +00:00
|
|
|
s=-(_i>=p);
|
|
|
|
_i-=p&s;
|
|
|
|
yj=_k;
|
|
|
|
#if 0
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Finds the maximum _k such that cc6_ucwrs5(_k)<=_i (tested for all
|
2013-02-13 17:08:47 +00:00
|
|
|
_i<2157192969=U(5,239)).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
if(_i>=0x2AAAAAA9UL)_k=cc6_isqrt32(2*isqrt36(10+6*(cc6_celt_uint64_t)_i)-7)+1>>1;
|
|
|
|
else _k=_i>0?cc6_isqrt32(2*(cc6_celt_uint32_t)cc6_isqrt32(10+6*_i)-7)+1>>1:0;
|
|
|
|
p=cc6_ucwrs5(_k);
|
2013-02-13 17:08:47 +00:00
|
|
|
#else
|
|
|
|
/* A binary search on U(5,K) avoids the need for 64-bit arithmetic */
|
|
|
|
{
|
|
|
|
int kl=0;
|
|
|
|
int kr=_k;
|
|
|
|
for(;;){
|
|
|
|
_k=kl+kr>>1;
|
2013-02-15 20:04:02 +00:00
|
|
|
p=cc6_ucwrs5(_k);
|
2013-02-13 17:08:47 +00:00
|
|
|
if(p<_i){
|
|
|
|
if(_k>=kr)break;
|
|
|
|
kl=_k+1;
|
|
|
|
}
|
|
|
|
else if(p>_i)kr=_k-1;
|
|
|
|
else break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
_i-=p;
|
|
|
|
yj-=_k;
|
|
|
|
_y[0]=yj+s^s;
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_cwrsi4(_k,_i,_y+1);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the _i'th combination of _k elements chosen from a set of size _n
|
|
|
|
with associated sign bits.
|
|
|
|
_y: Returns the vector of pulses.
|
|
|
|
_u: Must contain entries [0..._k+1] of row _n of U() on input.
|
|
|
|
Its contents will be destructively modified.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static void cc6_cwrsi(int _n,int _k,cc6_celt_uint32_t _i,int *_y,cc6_celt_uint32_t *_u){
|
2013-02-13 17:08:47 +00:00
|
|
|
int j;
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_assert(_n>0);
|
2013-02-13 17:08:47 +00:00
|
|
|
j=0;
|
|
|
|
do{
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_uint32_t p;
|
2013-02-13 17:08:47 +00:00
|
|
|
int s;
|
|
|
|
int yj;
|
|
|
|
p=_u[_k+1];
|
|
|
|
s=-(_i>=p);
|
|
|
|
_i-=p&s;
|
|
|
|
yj=_k;
|
|
|
|
p=_u[_k];
|
|
|
|
while(p>_i)p=_u[--_k];
|
|
|
|
_i-=p;
|
|
|
|
yj-=_k;
|
|
|
|
_y[j]=yj+s^s;
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_uprev(_u,_k+2,0);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
while(++j<_n);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/*Returns the index of the given combination of K elements chosen from a set
|
|
|
|
of size 1 with associated sign bits.
|
|
|
|
_y: The vector of pulses, whose sum of absolute values is K.
|
|
|
|
_k: Returns K.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_icwrs1(const int *_y,int *_k){
|
2013-02-13 17:08:47 +00:00
|
|
|
*_k=abs(_y[0]);
|
|
|
|
return _y[0]<0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the index of the given combination of K elements chosen from a set
|
|
|
|
of size 2 with associated sign bits.
|
|
|
|
_y: The vector of pulses, whose sum of absolute values is K.
|
|
|
|
_k: Returns K.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_icwrs2(const int *_y,int *_k){
|
|
|
|
cc6_celt_uint32_t i;
|
2013-02-13 17:08:47 +00:00
|
|
|
int k;
|
2013-02-15 20:04:02 +00:00
|
|
|
i=cc6_icwrs1(_y+1,&k);
|
|
|
|
i+=cc6_ucwrs2(k);
|
2013-02-13 17:08:47 +00:00
|
|
|
k+=abs(_y[0]);
|
2013-02-15 20:04:02 +00:00
|
|
|
if(_y[0]<0)i+=cc6_ucwrs2(k+1U);
|
2013-02-13 17:08:47 +00:00
|
|
|
*_k=k;
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the index of the given combination of K elements chosen from a set
|
|
|
|
of size 3 with associated sign bits.
|
|
|
|
_y: The vector of pulses, whose sum of absolute values is K.
|
|
|
|
_k: Returns K.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_icwrs3(const int *_y,int *_k){
|
|
|
|
cc6_celt_uint32_t i;
|
2013-02-13 17:08:47 +00:00
|
|
|
int k;
|
2013-02-15 20:04:02 +00:00
|
|
|
i=cc6_icwrs2(_y+1,&k);
|
|
|
|
i+=cc6_ucwrs3(k);
|
2013-02-13 17:08:47 +00:00
|
|
|
k+=abs(_y[0]);
|
2013-02-15 20:04:02 +00:00
|
|
|
if(_y[0]<0)i+=cc6_ucwrs3(k+1U);
|
2013-02-13 17:08:47 +00:00
|
|
|
*_k=k;
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the index of the given combination of K elements chosen from a set
|
|
|
|
of size 4 with associated sign bits.
|
|
|
|
_y: The vector of pulses, whose sum of absolute values is K.
|
|
|
|
_k: Returns K.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_icwrs4(const int *_y,int *_k){
|
|
|
|
cc6_celt_uint32_t i;
|
2013-02-13 17:08:47 +00:00
|
|
|
int k;
|
2013-02-15 20:04:02 +00:00
|
|
|
i=cc6_icwrs3(_y+1,&k);
|
|
|
|
i+=cc6_ucwrs4(k);
|
2013-02-13 17:08:47 +00:00
|
|
|
k+=abs(_y[0]);
|
2013-02-15 20:04:02 +00:00
|
|
|
if(_y[0]<0)i+=cc6_ucwrs4(k+1);
|
2013-02-13 17:08:47 +00:00
|
|
|
*_k=k;
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the index of the given combination of K elements chosen from a set
|
|
|
|
of size 5 with associated sign bits.
|
|
|
|
_y: The vector of pulses, whose sum of absolute values is K.
|
|
|
|
_k: Returns K.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static __inline cc6_celt_uint32_t cc6_icwrs5(const int *_y,int *_k){
|
|
|
|
cc6_celt_uint32_t i;
|
2013-02-13 17:08:47 +00:00
|
|
|
int k;
|
2013-02-15 20:04:02 +00:00
|
|
|
i=cc6_icwrs4(_y+1,&k);
|
|
|
|
i+=cc6_ucwrs5(k);
|
2013-02-13 17:08:47 +00:00
|
|
|
k+=abs(_y[0]);
|
2013-02-15 20:04:02 +00:00
|
|
|
if(_y[0]<0)i+=cc6_ucwrs5(k+1);
|
2013-02-13 17:08:47 +00:00
|
|
|
*_k=k;
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*Returns the index of the given combination of K elements chosen from a set
|
|
|
|
of size _n with associated sign bits.
|
|
|
|
_y: The vector of pulses, whose sum of absolute values must be _k.
|
|
|
|
_nc: Returns V(_n,_k).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_uint32_t cc6_icwrs(int _n,int _k,cc6_celt_uint32_t *_nc,const int *_y,
|
|
|
|
cc6_celt_uint32_t *_u){
|
|
|
|
cc6_celt_uint32_t i;
|
2013-02-13 17:08:47 +00:00
|
|
|
int j;
|
|
|
|
int k;
|
|
|
|
/*We can't unroll the first two iterations of the loop unless _n>=2.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_assert(_n>=2);
|
2013-02-13 17:08:47 +00:00
|
|
|
_u[0]=0;
|
|
|
|
for(k=1;k<=_k+1;k++)_u[k]=(k<<1)-1;
|
2013-02-15 20:04:02 +00:00
|
|
|
i=cc6_icwrs1(_y+_n-1,&k);
|
2013-02-13 17:08:47 +00:00
|
|
|
j=_n-2;
|
|
|
|
i+=_u[k];
|
|
|
|
k+=abs(_y[j]);
|
|
|
|
if(_y[j]<0)i+=_u[k+1];
|
|
|
|
while(j-->0){
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_unext(_u,_k+2,0);
|
2013-02-13 17:08:47 +00:00
|
|
|
i+=_u[k];
|
|
|
|
k+=abs(_y[j]);
|
|
|
|
if(_y[j]<0)i+=_u[k+1];
|
|
|
|
}
|
|
|
|
*_nc=_u[k]+_u[k+1];
|
|
|
|
return i;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Computes cc6_get_required_bits when splitting is required.
|
2013-02-13 17:08:47 +00:00
|
|
|
_left_bits and _right_bits must contain the required bits for the left and
|
|
|
|
right sides of the split, respectively (which themselves may require
|
|
|
|
splitting).*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static void cc6_get_required_split_bits(cc6_celt_int16_t *_bits,
|
|
|
|
const cc6_celt_int16_t *_left_bits,const cc6_celt_int16_t *_right_bits,
|
2013-02-13 17:08:47 +00:00
|
|
|
int _n,int _maxk,int _frac){
|
|
|
|
int k;
|
|
|
|
for(k=_maxk;k-->0;){
|
|
|
|
/*If we've reached a k where everything fits in 32 bits, evaluate the
|
|
|
|
remaining required bits directly.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
if(cc6_fits_in32(_n,k)){
|
|
|
|
cc6_get_required_bits(_bits,_n,k+1,_frac);
|
2013-02-13 17:08:47 +00:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
else{
|
|
|
|
int worst_bits;
|
|
|
|
int i;
|
|
|
|
/*Due to potentially recursive splitting, it's difficult to derive an
|
|
|
|
analytic expression for the location of the worst-case split index.
|
|
|
|
We simply check them all.*/
|
|
|
|
worst_bits=0;
|
|
|
|
for(i=0;i<=k;i++){
|
|
|
|
int split_bits;
|
|
|
|
split_bits=_left_bits[i]+_right_bits[k-i];
|
|
|
|
if(split_bits>worst_bits)worst_bits=split_bits;
|
|
|
|
}
|
2013-02-15 20:04:02 +00:00
|
|
|
_bits[k]=cc6_log2_frac(k+1,_frac)+worst_bits;
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Computes cc6_get_required_bits for a pair of N values.
|
2013-02-13 17:08:47 +00:00
|
|
|
_n1 and _n2 must either be equal or two consecutive integers.
|
|
|
|
Returns the buffer used to store the required bits for _n2, which is either
|
|
|
|
_bits1 if _n1==_n2 or _bits2 if _n1+1==_n2.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
static cc6_celt_int16_t *cc6_get_required_bits_pair(cc6_celt_int16_t *_bits1,
|
|
|
|
cc6_celt_int16_t *_bits2,cc6_celt_int16_t *_tmp,int _n1,int _n2,int _maxk,int _frac){
|
|
|
|
cc6_celt_int16_t *tmp2;
|
2013-02-13 17:08:47 +00:00
|
|
|
/*If we only need a single set of required bits...*/
|
|
|
|
if(_n1==_n2){
|
|
|
|
/*Stop recursing if everything fits.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
if(cc6_fits_in32(_n1,_maxk-1))cc6_get_required_bits(_bits1,_n1,_maxk,_frac);
|
2013-02-13 17:08:47 +00:00
|
|
|
else{
|
2013-02-15 20:04:02 +00:00
|
|
|
_tmp=cc6_get_required_bits_pair(_bits2,_tmp,_bits1,
|
2013-02-13 17:08:47 +00:00
|
|
|
_n1>>1,_n1+1>>1,_maxk,_frac);
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_get_required_split_bits(_bits1,_bits2,_tmp,_n1,_maxk,_frac);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
return _bits1;
|
|
|
|
}
|
|
|
|
/*Otherwise we need two distinct sets...*/
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_celt_assert(_n1+1==_n2);
|
2013-02-13 17:08:47 +00:00
|
|
|
/*Stop recursing if everything fits.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
if(cc6_fits_in32(_n2,_maxk-1)){
|
|
|
|
cc6_get_required_bits(_bits1,_n1,_maxk,_frac);
|
|
|
|
cc6_get_required_bits(_bits2,_n2,_maxk,_frac);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
/*Otherwise choose an evaluation order that doesn't require extra buffers.*/
|
|
|
|
else if(_n1&1){
|
|
|
|
/*This special case isn't really needed, but can save some work.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
if(cc6_fits_in32(_n1,_maxk-1)){
|
|
|
|
tmp2=cc6_get_required_bits_pair(_tmp,_bits1,_bits2,
|
2013-02-13 17:08:47 +00:00
|
|
|
_n2>>1,_n2>>1,_maxk,_frac);
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_get_required_split_bits(_bits2,_tmp,tmp2,_n2,_maxk,_frac);
|
|
|
|
cc6_get_required_bits(_bits1,_n1,_maxk,_frac);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
else{
|
2013-02-15 20:04:02 +00:00
|
|
|
_tmp=cc6_get_required_bits_pair(_bits2,_tmp,_bits1,
|
2013-02-13 17:08:47 +00:00
|
|
|
_n1>>1,_n1+1>>1,_maxk,_frac);
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_get_required_split_bits(_bits1,_bits2,_tmp,_n1,_maxk,_frac);
|
|
|
|
cc6_get_required_split_bits(_bits2,_tmp,_tmp,_n2,_maxk,_frac);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
else{
|
|
|
|
/*There's no need to special case _n1 fitting by itself, since _n2 requires
|
|
|
|
us to recurse for both values anyway.*/
|
2013-02-15 20:04:02 +00:00
|
|
|
tmp2=cc6_get_required_bits_pair(_tmp,_bits1,_bits2,
|
2013-02-13 17:08:47 +00:00
|
|
|
_n2>>1,_n2+1>>1,_maxk,_frac);
|
2013-02-15 20:04:02 +00:00
|
|
|
cc6_get_required_split_bits(_bits2,_tmp,tmp2,_n2,_maxk,_frac);
|
|
|
|
cc6_get_required_split_bits(_bits1,_tmp,_tmp,_n1,_maxk,_frac);
|
2013-02-13 17:08:47 +00:00
|
|
|
}
|
|
|
|
return _bits2;
|
|
|
|
}
|
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Fills _bits[0.._maxk-1] with the bit requirements for a vector of _n
   elements, one entry per pulse count k in [0,_maxk).
  _bits:  Receives the results; must have room for _maxk entries.
  _n:     The vector size.
  _maxk:  The number of entries to compute; must be positive.
  _frac:  Passed through to cc6_log2_frac() (presumably the number of
           fractional bits of the result).*/
void cc6_get_required_bits(cc6_celt_int16_t *_bits,int _n,int _maxk,int _frac){
  /*With _maxk==0 there would be nothing to do.*/
  cc6_celt_assert(_maxk>0);
  if(!cc6_fits_in32(_n,_maxk-1)){
    /*The largest case does not fit in 32 bits: evaluate the two halves of _n
       and combine them.*/
    cc6_VARDECL(cc6_celt_int16_t,n1bits);
    cc6_VARDECL(cc6_celt_int16_t,n2bits_buf);
    cc6_celt_int16_t *n2bits;
    cc6_SAVE_STACK;
    cc6_ALLOC(n1bits,_maxk,cc6_celt_int16_t);
    cc6_ALLOC(n2bits_buf,_maxk,cc6_celt_int16_t);
    /*_bits doubles as the scratch buffer of the pair computation; it is only
       filled with the final values afterwards.*/
    n2bits=cc6_get_required_bits_pair(n1bits,n2bits_buf,_bits,
     _n>>1,(_n+1)>>1,_maxk,_frac);
    cc6_get_required_split_bits(_bits,n1bits,n2bits,_n,_maxk,_frac);
    cc6_RESTORE_STACK;
    return;
  }
  /*Everything fits in 32 bits: evaluate each entry directly.*/
  _bits[0]=0;
  if(_maxk>1){
    int k;
    cc6_VARDECL(cc6_celt_uint32_t,u);
    cc6_SAVE_STACK;
    cc6_ALLOC(u,_maxk+1U,cc6_celt_uint32_t);
    cc6_ncwrs_urow(_n,_maxk-1,u);
    /*u[k]+u[k+1] is the same sum cc6_icwrs() reports as V(_n,k).*/
    for(k=1;k<_maxk;k++){
      _bits[k]=cc6_log2_frac(u[k]+u[k+1],_frac);
    }
    cc6_RESTORE_STACK;
  }
}
|
|
|
|
|
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Encodes the pulse vector _y of _n elements as a single index.
  Called by cc6_encode_pulses() once cc6_fits_in32(_n,_k) holds.
  Sizes 1 through 5 use dedicated index routines; those receive a pointer to
   _k and store the pulse count they find in _y back into it.
  All other sizes go through the generic cc6_icwrs().*/
static __inline void cc6_encode_pulses32(int _n,int _k,const int *_y,cc6_ec_enc *_enc){
  cc6_celt_uint32_t index;
  if(_n==1){
    /*Only two codewords here, so the index is written as one raw bit.*/
    index=cc6_icwrs1(_y,&_k);
    cc6_celt_assert(cc6_ncwrs1(_k)==2);
    cc6_ec_enc_bits(_enc,index,1);
  }
  else if(_n==2){
    index=cc6_icwrs2(_y,&_k);
    cc6_ec_enc_uint(_enc,index,cc6_ncwrs2(_k));
  }
  else if(_n==3){
    index=cc6_icwrs3(_y,&_k);
    cc6_ec_enc_uint(_enc,index,cc6_ncwrs3(_k));
  }
  else if(_n==4){
    index=cc6_icwrs4(_y,&_k);
    cc6_ec_enc_uint(_enc,index,cc6_ncwrs4(_k));
  }
  else if(_n==5){
    index=cc6_icwrs5(_y,&_k);
    cc6_ec_enc_uint(_enc,index,cc6_ncwrs5(_k));
  }
  else{
    /*Generic path: cc6_icwrs() needs _k+2 values of scratch space and
       reports the codebook size in nc.*/
    cc6_VARDECL(cc6_celt_uint32_t,u);
    cc6_celt_uint32_t nc;
    cc6_SAVE_STACK;
    cc6_ALLOC(u,_k+2U,cc6_celt_uint32_t);
    index=cc6_icwrs(_n,_k,&nc,_y,u);
    cc6_ec_enc_uint(_enc,index,nc);
    cc6_RESTORE_STACK;
  }
}
|
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Encodes the pulse vector _y (N elements, K pulses in total) into enc.
  Nothing is written when K is zero.
  If cc6_fits_in32(N,K) holds, the vector is coded directly; otherwise it is
   cut into two halves, the number of pulses in the first half is coded as a
   value in [0,K], and both halves are coded recursively.*/
void cc6_encode_pulses(int *_y, int N, int K, cc6_ec_enc *enc)
{
   int left_len;
   int left_pulses;
   int idx;

   if (K==0)
      return;
   if (cc6_fits_in32(N,K)) {
      cc6_encode_pulses32(N, K, _y, enc);
      return;
   }
   /* The first half gets the extra element when N is odd. */
   left_len = (N+1)/2;
   left_pulses = 0;
   for (idx=0; idx<left_len; idx++) {
      left_pulses += abs(_y[idx]);
   }
   cc6_ec_enc_uint(enc,left_pulses,K+1);
   cc6_encode_pulses(_y, left_len, left_pulses, enc);
   cc6_encode_pulses(_y+left_len, N-left_len, K-left_pulses, enc);
}
|
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Decodes a pulse vector of _n elements and _k pulses into _y from a single
   index read from _dec.
  Called by cc6_decode_pulses() once cc6_fits_in32(_n,_k) holds.
  Sizes 1 through 5 use dedicated routines; all other sizes go through the
   generic cc6_cwrsi().*/
static __inline void cc6_decode_pulses32(int _n,int _k,int *_y,cc6_ec_dec *_dec){
  if(_n==1){
    /*Only two codewords here, so the index is read as one raw bit.*/
    cc6_celt_assert(cc6_ncwrs1(_k)==2);
    cc6_cwrsi1(_k,cc6_ec_dec_bits(_dec,1),_y);
  }
  else if(_n==2){
    cc6_cwrsi2(_k,cc6_ec_dec_uint(_dec,cc6_ncwrs2(_k)),_y);
  }
  else if(_n==3){
    cc6_cwrsi3(_k,cc6_ec_dec_uint(_dec,cc6_ncwrs3(_k)),_y);
  }
  else if(_n==4){
    cc6_cwrsi4(_k,cc6_ec_dec_uint(_dec,cc6_ncwrs4(_k)),_y);
  }
  else if(_n==5){
    cc6_cwrsi5(_k,cc6_ec_dec_uint(_dec,cc6_ncwrs5(_k)),_y);
  }
  else{
    /*Generic path: cc6_ncwrs_urow() fills the _k+2 values of u and returns
       the range of the index, which cc6_cwrsi() then decodes using u.*/
    cc6_VARDECL(cc6_celt_uint32_t,u);
    cc6_SAVE_STACK;
    cc6_ALLOC(u,_k+2U,cc6_celt_uint32_t);
    cc6_cwrsi(_n,_k,cc6_ec_dec_uint(_dec,cc6_ncwrs_urow(_n,_k,u)),_y,u);
    cc6_RESTORE_STACK;
  }
}
|
|
|
|
|
2013-02-15 20:04:02 +00:00
|
|
|
/*Decodes a pulse vector of N elements and K pulses from dec into _y.
  With K equal to zero nothing is read and _y is cleared.
  If cc6_fits_in32(N,K) holds, the vector is decoded directly; otherwise the
   number of pulses in the first half is read as a value in [0,K] and both
   halves are decoded recursively, mirroring cc6_encode_pulses().*/
void cc6_decode_pulses(int *_y, int N, int K, cc6_ec_dec *dec)
{
   int left_len;
   int left_pulses;
   int idx;

   if (K==0) {
      for (idx=0; idx<N; idx++) {
         _y[idx] = 0;
      }
      return;
   }
   if (cc6_fits_in32(N,K)) {
      cc6_decode_pulses32(N, K, _y, dec);
      return;
   }
   left_pulses = cc6_ec_dec_uint(dec,K+1);
   /* The first half gets the extra element when N is odd. */
   left_len = (N+1)/2;
   cc6_decode_pulses(_y, left_len, left_pulses, dec);
   cc6_decode_pulses(_y+left_len, N-left_len, K-left_pulses, dec);
}
|