shithub: opus

--- a/libcelt/arch.h

+++ b/libcelt/arch.h

@@ -154,6 +154,8 @@

 #define SHL(a,shift)       (a)

 #define SATURATE(x,a) (x)

+#define ROUND(a,shift)       (a)

 #define ADD16(a,b) ((a)+(b))

 #define SUB16(a,b) ((a)-(b))

 #define ADD32(a,b) ((a)+(b))

--- /dev/null

+++ b/libcelt/fixed_debug.h

@@ -1,0 +1,491 @@

+/* Copyright (C) 2003 Jean-Marc Valin */

+/**

+   @file fixed_debug.h

+   @brief Fixed-point operations with debugging

+*/

+/*

+   Redistribution and use in source and binary forms, with or without

+   modification, are permitted provided that the following conditions

+   are met:

+   - Redistributions of source code must retain the above copyright

+   notice, this list of conditions and the following disclaimer.

+   - Redistributions in binary form must reproduce the above copyright

+   notice, this list of conditions and the following disclaimer in the

+   documentation and/or other materials provided with the distribution.

+   - Neither the name of the Xiph.org Foundation nor the names of its

+   contributors may be used to endorse or promote products derived from

+   this software without specific prior written permission.

+   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

+   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

+   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

+   A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR

+   CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,

+   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,

+   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR

+   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF

+   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING

+   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

+   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

+*/

+#ifndef FIXED_DEBUG_H

+#define FIXED_DEBUG_H

+#include <stdio.h>

+//extern long long celt_mips;

+static long long celt_mips = 0;

+#define MIPS_INC celt_mips++,

+#define QCONST16(x,bits) ((celt_word16_t)(.5+(x)*(((celt_word32_t)1)<<(bits))))

+#define QCONST32(x,bits) ((celt_word32_t)(.5+(x)*(((celt_word32_t)1)<<(bits))))

+#define VERIFY_SHORT(x) ((x)<=32767&&(x)>=-32768)

+#define VERIFY_INT(x) ((x)<=2147483647LL&&(x)>=-2147483648LL)

+#define SHR(a,b) SHR32(a,b)

+#define PSHR(a,b) PSHR32(a,b)

+static inline short NEG16(int x)

+{

+   int res;

+   if (!VERIFY_SHORT(x))

+   {

+      fprintf (stderr, "NEG16: input is not short: %d\n", (int)x);

+   }

+   res = -x;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "NEG16: output is not short: %d\n", (int)res);

+   celt_mips++;

+   return res;

+}

+static inline int NEG32(long long x)

+{

+   long long res;

+   if (!VERIFY_INT(x))

+   {

+      fprintf (stderr, "NEG16: input is not int: %d\n", (int)x);

+   }

+   res = -x;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "NEG16: output is not int: %d\n", (int)res);

+   celt_mips++;

+   return res;

+}

+#define EXTRACT16(x) _EXTRACT16(x, __FILE__, __LINE__)

+static inline short _EXTRACT16(int x, char *file, int line)

+{

+   int res;

+   if (!VERIFY_SHORT(x))

+   {

+      fprintf (stderr, "EXTRACT16: input is not short: %d in %s: line %d\n", x, file, line);

+   }

+   res = x;

+   celt_mips++;

+   return res;

+}

+#define EXTEND32(x) _EXTEND32(x, __FILE__, __LINE__)

+static inline int _EXTEND32(int x, char *file, int line)

+{

+   int res;

+   if (!VERIFY_SHORT(x))

+   {

+      fprintf (stderr, "EXTEND32: input is not short: %d in %s: line %d\n", x, file, line);

+   }

+   res = x;

+   celt_mips++;

+   return res;

+}

+#define SHR16(a, shift) _SHR16(a, shift, __FILE__, __LINE__)

+static inline short _SHR16(int a, int shift, char *file, int line)

+{

+   int res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(shift))

+   {

+      fprintf (stderr, "SHR16: inputs are not short: %d >> %d in %s: line %d\n", a, shift, file, line);

+   }

+   res = a>>shift;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "SHR16: output is not short: %d in %s: line %d\n", res, file, line);

+   celt_mips++;

+   return res;

+}

+#define SHL16(a, shift) _SHL16(a, shift, __FILE__, __LINE__)

+static inline short _SHL16(int a, int shift, char *file, int line)

+{

+   int res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(shift))

+   {

+      fprintf (stderr, "SHL16: inputs are not short: %d %d in %s: line %d\n", a, shift, file, line);

+   }

+   res = a<<shift;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "SHL16: output is not short: %d in %s: line %d\n", res, file, line);

+   celt_mips++;

+   return res;

+}

+static inline int SHR32(long long a, int shift)

+{

+   long long  res;

+   if (!VERIFY_INT(a) || !VERIFY_SHORT(shift))

+   {

+      fprintf (stderr, "SHR32: inputs are not int: %d %d\n", (int)a, shift);

+   }

+   res = a>>shift;

+   if (!VERIFY_INT(res))

+   {

+      fprintf (stderr, "SHR32: output is not int: %d\n", (int)res);

+   }

+   celt_mips++;

+   return res;

+}

+static inline int SHL32(long long a, int shift)

+{

+   long long  res;

+   if (!VERIFY_INT(a) || !VERIFY_SHORT(shift))

+   {

+      fprintf (stderr, "SHL32: inputs are not int: %d %d\n", (int)a, shift);

+   }

+   res = a<<shift;

+   if (!VERIFY_INT(res))

+   {

+      fprintf (stderr, "SHL32: output is not int: %d\n", (int)res);

+   }

+   celt_mips++;

+   return res;

+}

+#define PSHR16(a,shift) (SHR16(ADD16((a),((1<<((shift))>>1))),shift))

+#define PSHR32(a,shift) (SHR32(ADD32((a),((EXTEND32(1)<<((shift))>>1))),shift))

+#define VSHR32(a, shift) (((shift)>0) ? SHR32(a, shift) : SHL32(a, -(shift)))

+#define SATURATE16(x,a) (((x)>(a) ? (a) : (x)<-(a) ? -(a) : (x)))

+#define SATURATE32(x,a) (((x)>(a) ? (a) : (x)<-(a) ? -(a) : (x)))

+//#define SHR(a,shift) ((a) >> (shift))

+//#define SHL(a,shift) ((a) << (shift))

+#define ADD16(a, b) _ADD16(a, b, __FILE__, __LINE__)

+static inline short _ADD16(int a, int b, char *file, int line)

+{

+   int res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "ADD16: inputs are not short: %d %d in %s: line %d\n", a, b, file, line);

+   }

+   res = a+b;

+   if (!VERIFY_SHORT(res))

+   {

+      fprintf (stderr, "ADD16: output is not short: %d+%d=%d in %s: line %d\n", a,b,res, file, line);

+   }

+   celt_mips++;

+   return res;

+}

+#define SUB16(a, b) _SUB16(a, b, __FILE__, __LINE__)

+static inline short _SUB16(int a, int b, char *file, int line)

+{

+   int res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "SUB16: inputs are not short: %d %d in %s: line %d\n", a, b, file, line);

+   }

+   res = a-b;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "SUB16: output is not short: %d in %s: line %d\n", res, file, line);

+   celt_mips++;

+   return res;

+}

+#define ADD32(a, b) _ADD32(a, b, __FILE__, __LINE__)

+static inline int _ADD32(long long a, long long b, char *file, int line)

+{

+   long long res;

+   if (!VERIFY_INT(a) || !VERIFY_INT(b))

+   {

+      fprintf (stderr, "ADD32: inputs are not int: %d %d in %s: line %d\n", (int)a, (int)b, file, line);

+   }

+   res = a+b;

+   if (!VERIFY_INT(res))

+   {

+      fprintf (stderr, "ADD32: output is not int: %d in %s: line %d\n", (int)res, file, line);

+   }

+   celt_mips++;

+   return res;

+}

+static inline int SUB32(long long a, long long b)

+{

+   long long res;

+   if (!VERIFY_INT(a) || !VERIFY_INT(b))

+   {

+      fprintf (stderr, "SUB32: inputs are not int: %d %d\n", (int)a, (int)b);

+   }

+   res = a-b;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "SUB32: output is not int: %d\n", (int)res);

+   celt_mips++;

+   return res;

+}

+#define ADD64(a,b) (MIPS_INC(a)+(b))

+/* result fits in 16 bits */

+static inline short MULT16_16_16(int a, int b)

+{

+   int res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16_16: inputs are not short: %d %d\n", a, b);

+   }

+   res = a*b;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "MULT16_16_16: output is not short: %d\n", res);

+   celt_mips++;

+   return res;

+}

+#define MULT16_16(a, b) _MULT16_16(a, b, __FILE__, __LINE__)

+static inline int _MULT16_16(int a, int b, char *file, int line)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16: inputs are not short: %d %d in %s: line %d\n", a, b, file, line);

+   }

+   res = ((long long)a)*b;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "MULT16_16: output is not int: %d in %s: line %d\n", (int)res, file, line);

+   celt_mips++;

+   return res;

+}

+#define MAC16_16(c,a,b)     (celt_mips--,ADD32((c),MULT16_16((a),(b))))

+#define MAC16_16_Q11(c,a,b)     (EXTRACT16(ADD16((c),EXTRACT16(SHR32(MULT16_16((a),(b)),11)))))

+#define MAC16_16_Q13(c,a,b)     (EXTRACT16(ADD16((c),EXTRACT16(SHR32(MULT16_16((a),(b)),13)))))

+#define MAC16_16_P13(c,a,b)     (EXTRACT16(ADD32((c),SHR32(ADD32(4096,MULT16_16((a),(b))),13))))

+#define MULT16_32_QX(a, b, Q) _MULT16_32_QX(a, b, Q, __FILE__, __LINE__)

+static inline int _MULT16_32_QX(int a, long long b, int Q, char *file, int line)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_INT(b))

+   {

+      fprintf (stderr, "MULT16_32_Q%d: inputs are not short+int: %d %d in %s: line %d\n", Q, (int)a, (int)b, file, line);

+   }

+   if (ABS32(b)>=(EXTEND32(1)<<(15+Q)))

+      fprintf (stderr, "MULT16_32_Q%d: second operand too large: %d %d in %s: line %d\n", Q, (int)a, (int)b, file, line);

+   res = (((long long)a)*(long long)b) >> Q;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "MULT16_32_Q%d: output is not int: %d*%d=%d in %s: line %d\n", Q, (int)a, (int)b,(int)res, file, line);

+   celt_mips+=5;

+   return res;

+}

+static inline int MULT16_32_PX(int a, long long b, int Q)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_INT(b))

+   {

+      fprintf (stderr, "MULT16_32_P%d: inputs are not short+int: %d %d\n", Q, (int)a, (int)b);

+   }

+   if (ABS32(b)>=(EXTEND32(1)<<(15+Q)))

+      fprintf (stderr, "MULT16_32_Q%d: second operand too large: %d %d\n", Q, (int)a, (int)b);

+   res = ((((long long)a)*(long long)b) + ((EXTEND32(1)<<Q)>>1))>> Q;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "MULT16_32_P%d: output is not int: %d*%d=%d\n", Q, (int)a, (int)b,(int)res);

+   celt_mips+=5;

+   return res;

+}

+#define MULT16_32_Q11(a,b) MULT16_32_QX(a,b,11)

+#define MAC16_32_Q11(c,a,b) ADD32((c),MULT16_32_Q11((a),(b)))

+#define MULT16_32_Q12(a,b) MULT16_32_QX(a,b,12)

+#define MULT16_32_Q13(a,b) MULT16_32_QX(a,b,13)

+#define MULT16_32_Q14(a,b) MULT16_32_QX(a,b,14)

+#define MULT16_32_Q15(a,b) MULT16_32_QX(a,b,15)

+#define MULT16_32_P15(a,b) MULT16_32_PX(a,b,15)

+#define MAC16_32_Q15(c,a,b) ADD32((c),MULT16_32_Q15((a),(b)))

+static inline int SATURATE(int a, int b)

+{

+   if (a>b)

+      a=b;

+   if (a<-b)

+      a = -b;

+   return a;

+}

+static inline int MULT16_16_Q11_32(int a, int b)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16_Q11: inputs are not short: %d %d\n", a, b);

+   }

+   res = ((long long)a)*b;

+   res >>= 11;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "MULT16_16_Q11: output is not short: %d*%d=%d\n", (int)a, (int)b, (int)res);

+   celt_mips+=3;

+   return res;

+}

+static inline short MULT16_16_Q13(int a, int b)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16_Q13: inputs are not short: %d %d\n", a, b);

+   }

+   res = ((long long)a)*b;

+   res >>= 13;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "MULT16_16_Q13: output is not short: %d*%d=%d\n", a, b, (int)res);

+   celt_mips+=3;

+   return res;

+}

+static inline short MULT16_16_Q14(int a, int b)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16_Q14: inputs are not short: %d %d\n", a, b);

+   }

+   res = ((long long)a)*b;

+   res >>= 14;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "MULT16_16_Q14: output is not short: %d\n", (int)res);

+   celt_mips+=3;

+   return res;

+}

+static inline short MULT16_16_Q15(int a, int b)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16_Q15: inputs are not short: %d %d\n", a, b);

+   }

+   res = ((long long)a)*b;

+   res >>= 15;

+   if (!VERIFY_SHORT(res))

+   {

+      fprintf (stderr, "MULT16_16_Q15: output is not short: %d\n", (int)res);

+   }

+   celt_mips+=3;

+   return res;

+}

+static inline short MULT16_16_P13(int a, int b)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16_P13: inputs are not short: %d %d\n", a, b);

+   }

+   res = ((long long)a)*b;

+   res += 4096;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "MULT16_16_P13: overflow: %d*%d=%d\n", a, b, (int)res);

+   res >>= 13;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "MULT16_16_P13: output is not short: %d*%d=%d\n", a, b, (int)res);

+   celt_mips+=4;

+   return res;

+}

+static inline short MULT16_16_P14(int a, int b)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16_P14: inputs are not short: %d %d\n", a, b);

+   }

+   res = ((long long)a)*b;

+   res += 8192;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "MULT16_16_P14: overflow: %d*%d=%d\n", a, b, (int)res);

+   res >>= 14;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "MULT16_16_P14: output is not short: %d*%d=%d\n", a, b, (int)res);

+   celt_mips+=4;

+   return res;

+}

+static inline short MULT16_16_P15(int a, int b)

+{

+   long long res;

+   if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "MULT16_16_P15: inputs are not short: %d %d\n", a, b);

+   }

+   res = ((long long)a)*b;

+   res += 16384;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "MULT16_16_P15: overflow: %d*%d=%d\n", a, b, (int)res);

+   res >>= 15;

+   if (!VERIFY_SHORT(res))

+      fprintf (stderr, "MULT16_16_P15: output is not short: %d*%d=%d\n", a, b, (int)res);

+   celt_mips+=4;

+   return res;

+}

+#define DIV32_16(a, b) _DIV32_16(a, b, __FILE__, __LINE__)

+static inline int _DIV32_16(long long a, long long b, char *file, int line)

+{

+   long long res;

+   if (b==0)

+   {

+      fprintf(stderr, "DIV32_16: divide by zero: %d/%d in %s: line %d\n", (int)a, (int)b, file, line);

+      return 0;

+   }

+   if (!VERIFY_INT(a) || !VERIFY_SHORT(b))

+   {

+      fprintf (stderr, "DIV32_16: inputs are not int/short: %d %d in %s: line %d\n", (int)a, (int)b, file, line);

+   }

+   res = a/b;

+   if (!VERIFY_SHORT(res))

+   {

+      fprintf (stderr, "DIV32_16: output is not short: %d / %d = %d in %s: line %d\n", (int)a,(int)b,(int)res, file, line);

+      if (res>32767)

+         res = 32767;

+      if (res<-32768)

+         res = -32768;

+   }

+   celt_mips+=20;

+   return res;

+}

+#define DIV32(a, b) _DIV32(a, b, __FILE__, __LINE__)

+static inline int _DIV32(long long a, long long b, char *file, int line)

+{

+   long long res;

+   if (b==0)

+   {

+      fprintf(stderr, "DIV32: divide by zero: %d/%d in %s: line %d\n", (int)a, (int)b, file, line);

+      return 0;

+   }

+   if (!VERIFY_INT(a) || !VERIFY_INT(b))

+   {

+      fprintf (stderr, "DIV32: inputs are not int/short: %d %d in %s: line %d\n", (int)a, (int)b, file, line);

+   }

+   res = a/b;

+   if (!VERIFY_INT(res))

+      fprintf (stderr, "DIV32: output is not int: %d in %s: line %d\n", (int)res, file, line);

+   celt_mips+=36;

+   return res;

+}

+#define PDIV32(a,b) DIV32(ADD32((a),(b)>>1),b)

+#define PDIV32_16(a,b) DIV32_16(ADD32((a),(b)>>1),b)

+#endif

--- a/libcelt/fixed_generic.h

+++ b/libcelt/fixed_generic.h

@@ -57,6 +57,7 @@

 #define PSHR(a,shift) (SHR((a)+((EXTEND32(1)<<((shift))>>1)),shift))

 #define SATURATE(x,a) (((x)>(a) ? (a) : (x)<-(a) ? -(a) : (x)))

+#define ROUND(x,a) (EXTRACT16(PSHR32((x),(a))))

 #define ADD16(a,b) ((celt_word16_t)((celt_word16_t)(a)+(celt_word16_t)(b)))

 #define SUB16(a,b) ((celt_word16_t)(a)-(celt_word16_t)(b))

--- a/libcelt/vq.c

+++ b/libcelt/vq.c

@@ -60,11 +60,6 @@

 #define approx_inv(x) (1.f/(x))

 #endif

-#ifdef FIXED_POINT

-#else

-#define celt_sqrt sqrt

-#endif

 /** Takes the pitch vector and the decoded residual vector (non-compressed),

    applies the compression in the pitch direction, computes the gain that will

    give ||p+g*y||=1 and mixes the residual with the pitch. */

@@ -93,7 +88,7 @@

       the encoded (int) one */

    for (i=0;i<N;i++)

       y[i] = SUB16(SHL16(iy[i],yshift),

-                   MULT16_16_Q15(alpha,MULT16_16_Q14(EXTRACT16(SHR32(Ryp,14)),P[i])));

+                   MULT16_16_Q15(alpha,MULT16_16_Q14(ROUND(Ryp,14),P[i])));

    /* Recompute after the projection (I think it's right) */

    Ryp = 0;

@@ -105,7 +100,7 @@

       Ryy = MAC16_16(Ryy, y[i],y[i]);

    /* g = (sqrt(Ryp^2 + Ryy - Rpp*Ryy)-Ryp)/Ryy */

-   g = DIV32(SHL32(celt_sqrt(MULT16_16(PSHR32(Ryp,14),PSHR32(Ryp,14)) + Ryy - MULT16_16(PSHR32(Ryy,14),PSHR32(Rpp,14))) - PSHR32(Ryp,14),14),PSHR32(Ryy,14));

+   g = DIV32(SHL32(celt_sqrt(MULT16_16(ROUND(Ryp,14),ROUND(Ryp,14)) + Ryy - MULT16_16(ROUND(Ryy,14),ROUND(Rpp,14))) - ROUND(Ryp,14),14),ROUND(Ryy,14));

    for (i=0;i<N;i++)

       X[i] = P[i] + MULT16_32_Q14(y[i], g);