mirror of
				https://github.com/Rockbox/rockbox.git
				synced 2025-10-24 15:37:38 -04:00 
			
		
		
		
	Sync opus codec to upstream git
Change-Id: I0cfcc0005c4ad7bfbb1aaf454188ce70fb043dc1
This commit is contained in:
		
							parent
							
								
									75d9393796
								
							
						
					
					
						commit
						14c6bb798d
					
				
					 286 changed files with 48931 additions and 1278 deletions
				
			
		|  | @ -58,12 +58,12 @@ | |||
| #   define S_MUL(a,b) MULT16_32_Q15(b, a) | ||||
| 
 | ||||
| #   define C_MUL(m,a,b) \ | ||||
|       do{ (m).r = SUB32(S_MUL((a).r,(b).r) , S_MUL((a).i,(b).i)); \ | ||||
|           (m).i = ADD32(S_MUL((a).r,(b).i) , S_MUL((a).i,(b).r)); }while(0) | ||||
|       do{ (m).r = SUB32_ovflw(S_MUL((a).r,(b).r) , S_MUL((a).i,(b).i)); \ | ||||
|           (m).i = ADD32_ovflw(S_MUL((a).r,(b).i) , S_MUL((a).i,(b).r)); }while(0) | ||||
| 
 | ||||
| #   define C_MULC(m,a,b) \ | ||||
|       do{ (m).r = ADD32(S_MUL((a).r,(b).r) , S_MUL((a).i,(b).i)); \ | ||||
|           (m).i = SUB32(S_MUL((a).i,(b).r) , S_MUL((a).r,(b).i)); }while(0) | ||||
|       do{ (m).r = ADD32_ovflw(S_MUL((a).r,(b).r) , S_MUL((a).i,(b).i)); \ | ||||
|           (m).i = SUB32_ovflw(S_MUL((a).i,(b).r) , S_MUL((a).r,(b).i)); }while(0) | ||||
| 
 | ||||
| #   define C_MULBYSCALAR( c, s ) \ | ||||
|       do{ (c).r =  S_MUL( (c).r , s ) ;\ | ||||
|  | @ -77,17 +77,17 @@ | |||
|                 DIVSCALAR( (c).i  , div); }while (0) | ||||
| 
 | ||||
| #define  C_ADD( res, a,b)\ | ||||
|     do {(res).r=ADD32((a).r,(b).r);  (res).i=ADD32((a).i,(b).i); \ | ||||
|     do {(res).r=ADD32_ovflw((a).r,(b).r);  (res).i=ADD32_ovflw((a).i,(b).i); \ | ||||
|     }while(0) | ||||
| #define  C_SUB( res, a,b)\ | ||||
|     do {(res).r=SUB32((a).r,(b).r);  (res).i=SUB32((a).i,(b).i); \ | ||||
|     do {(res).r=SUB32_ovflw((a).r,(b).r);  (res).i=SUB32_ovflw((a).i,(b).i); \ | ||||
|     }while(0) | ||||
| #define C_ADDTO( res , a)\ | ||||
|     do {(res).r = ADD32((res).r, (a).r);  (res).i = ADD32((res).i,(a).i);\ | ||||
|     do {(res).r = ADD32_ovflw((res).r, (a).r);  (res).i = ADD32_ovflw((res).i,(a).i);\ | ||||
|     }while(0) | ||||
| 
 | ||||
| #define C_SUBFROM( res , a)\ | ||||
|     do {(res).r = ADD32((res).r,(a).r);  (res).i = SUB32((res).i,(a).i); \ | ||||
|     do {(res).r = ADD32_ovflw((res).r,(a).r);  (res).i = SUB32_ovflw((res).i,(a).i); \ | ||||
|     }while(0) | ||||
| 
 | ||||
| #if defined(OPUS_ARM_INLINE_ASM) | ||||
|  | @ -97,9 +97,8 @@ | |||
| #if defined(OPUS_ARM_INLINE_EDSP) | ||||
| #include "arm/kiss_fft_armv5e.h" | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_CF_INLINE_ASM) | ||||
| #include "cf/kiss_fft_cf.h" | ||||
| #if defined(MIPSr1_ASM) | ||||
| #include "mips/kiss_fft_mipsr1.h" | ||||
| #endif | ||||
| 
 | ||||
| #else  /* not FIXED_POINT*/ | ||||
|  |  | |||
|  | @ -46,30 +46,54 @@ | |||
| #  endif | ||||
| # endif | ||||
| 
 | ||||
| #if OPUS_GNUC_PREREQ(3, 0) | ||||
| #define opus_likely(x)       (__builtin_expect(!!(x), 1)) | ||||
| #define opus_unlikely(x)     (__builtin_expect(!!(x), 0)) | ||||
| #else | ||||
| #define opus_likely(x)       (!!(x)) | ||||
| #define opus_unlikely(x)     (!!(x)) | ||||
| #endif | ||||
| 
 | ||||
| #define CELT_SIG_SCALE 32768.f | ||||
| 
 | ||||
| #define celt_fatal(str) _celt_fatal(str, __FILE__, __LINE__); | ||||
| #ifdef ENABLE_ASSERTIONS | ||||
| #define CELT_FATAL(str) celt_fatal(str, __FILE__, __LINE__); | ||||
| 
 | ||||
| #if defined(ENABLE_ASSERTIONS) || defined(ENABLE_HARDENING) | ||||
| #ifdef __GNUC__ | ||||
| __attribute__((noreturn)) | ||||
| #endif | ||||
| void celt_fatal(const char *str, const char *file, int line); | ||||
| 
 | ||||
| #if defined(CELT_C) && !defined(OVERRIDE_celt_fatal) | ||||
| #include <stdio.h> | ||||
| #include <stdlib.h> | ||||
| #ifdef __GNUC__ | ||||
| __attribute__((noreturn)) | ||||
| #endif | ||||
| static OPUS_INLINE void _celt_fatal(const char *str, const char *file, int line) | ||||
| void celt_fatal(const char *str, const char *file, int line) | ||||
| { | ||||
|    fprintf (stderr, "Fatal (internal) error in %s, line %d: %s\n", file, line, str); | ||||
|    abort(); | ||||
| } | ||||
| #define celt_assert(cond) {if (!(cond)) {celt_fatal("assertion failed: " #cond);}} | ||||
| #define celt_assert2(cond, message) {if (!(cond)) {celt_fatal("assertion failed: " #cond "\n" message);}} | ||||
| #endif | ||||
| 
 | ||||
| #define celt_assert(cond) {if (!(cond)) {CELT_FATAL("assertion failed: " #cond);}} | ||||
| #define celt_assert2(cond, message) {if (!(cond)) {CELT_FATAL("assertion failed: " #cond "\n" message);}} | ||||
| #define MUST_SUCCEED(call) celt_assert((call) == OPUS_OK) | ||||
| #else | ||||
| #define celt_assert(cond) | ||||
| #define celt_assert2(cond, message) | ||||
| #define MUST_SUCCEED(call) do {if((call) != OPUS_OK) {RESTORE_STACK; return OPUS_INTERNAL_ERROR;} } while (0) | ||||
| #endif | ||||
| 
 | ||||
| #if defined(ENABLE_ASSERTIONS) | ||||
| #define celt_sig_assert(cond) {if (!(cond)) {CELT_FATAL("signal assertion failed: " #cond);}} | ||||
| #else | ||||
| #define celt_sig_assert(cond) | ||||
| #endif | ||||
| 
 | ||||
| #define IMUL32(a,b) ((a)*(b)) | ||||
| 
 | ||||
| #define ABS(x) ((x) < 0 ? (-(x)) : (x)) | ||||
| #define MIN16(a,b) ((a) < (b) ? (a) : (b))   /**< Minimum 16-bit value.   */ | ||||
| #define MAX16(a,b) ((a) > (b) ? (a) : (b))   /**< Maximum 16-bit value.   */ | ||||
| #define MIN32(a,b) ((a) < (b) ? (a) : (b))   /**< Minimum 32-bit value.   */ | ||||
|  | @ -79,20 +103,35 @@ static OPUS_INLINE void _celt_fatal(const char *str, const char *file, int line) | |||
| #define UADD32(a,b) ((a)+(b)) | ||||
| #define USUB32(a,b) ((a)-(b)) | ||||
| 
 | ||||
| /* Set this if opus_int64 is a native type of the CPU. */ | ||||
| /* Assume that all LP64 architectures have fast 64-bit types; also x86_64
 | ||||
|    (which can be ILP32 for x32) and Win64 (which is LLP64). */ | ||||
| #if defined(__x86_64__) || defined(__LP64__) || defined(_WIN64) | ||||
| #define OPUS_FAST_INT64 1 | ||||
| #else | ||||
| #define OPUS_FAST_INT64 0 | ||||
| #endif | ||||
| 
 | ||||
| #define PRINT_MIPS(file) | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
| 
 | ||||
| typedef opus_int16 opus_val16; | ||||
| typedef opus_int32 opus_val32; | ||||
| typedef opus_int64 opus_val64; | ||||
| 
 | ||||
| typedef opus_val32 celt_sig; | ||||
| typedef opus_val16 celt_norm; | ||||
| typedef opus_val32 celt_ener; | ||||
| 
 | ||||
| #define celt_isnan(x) 0 | ||||
| 
 | ||||
| #define Q15ONE 32767 | ||||
| 
 | ||||
| #define SIG_SHIFT 12 | ||||
| /* Safe saturation value for 32-bit signals. Should be less than
 | ||||
|    2^31*(1-0.85) to avoid blowing up on DC at deemphasis.*/ | ||||
| #define SIG_SAT (300000000) | ||||
| 
 | ||||
| #define NORM_SCALING 16384 | ||||
| 
 | ||||
|  | @ -119,7 +158,9 @@ static OPUS_INLINE opus_int16 SAT16(opus_int32 x) { | |||
| 
 | ||||
| #include "fixed_generic.h" | ||||
| 
 | ||||
| #ifdef OPUS_ARM_INLINE_EDSP | ||||
| #ifdef OPUS_ARM_PRESUME_AARCH64_NEON_INTR | ||||
| #include "arm/fixed_arm64.h" | ||||
| #elif defined (OPUS_ARM_INLINE_EDSP) | ||||
| #include "arm/fixed_armv5e.h" | ||||
| #elif defined (OPUS_ARM_INLINE_ASM) | ||||
| #include "arm/fixed_armv4.h" | ||||
|  | @ -129,8 +170,6 @@ static OPUS_INLINE opus_int16 SAT16(opus_int32 x) { | |||
| #include "fixed_c5x.h" | ||||
| #elif defined (TI_C6X_ASM) | ||||
| #include "fixed_c6x.h" | ||||
| #elif defined (OPUS_CF_INLINE_ASM) | ||||
| #include "cf/fixed_cf.h" | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
|  | @ -139,6 +178,7 @@ static OPUS_INLINE opus_int16 SAT16(opus_int32 x) { | |||
| 
 | ||||
| typedef float opus_val16; | ||||
| typedef float opus_val32; | ||||
| typedef float opus_val64; | ||||
| 
 | ||||
| typedef float celt_sig; | ||||
| typedef float celt_norm; | ||||
|  | @ -178,6 +218,7 @@ static OPUS_INLINE int celt_isnan(float x) | |||
| 
 | ||||
| #define NEG16(x) (-(x)) | ||||
| #define NEG32(x) (-(x)) | ||||
| #define NEG32_ovflw(x) (-(x)) | ||||
| #define EXTRACT16(x) (x) | ||||
| #define EXTEND32(x) (x) | ||||
| #define SHR16(a,shift) (a) | ||||
|  | @ -194,6 +235,7 @@ static OPUS_INLINE int celt_isnan(float x) | |||
| #define SATURATE16(x)   (x) | ||||
| 
 | ||||
| #define ROUND16(a,shift)  (a) | ||||
| #define SROUND16(a,shift) (a) | ||||
| #define HALF16(x)       (.5f*(x)) | ||||
| #define HALF32(x)       (.5f*(x)) | ||||
| 
 | ||||
|  | @ -201,6 +243,8 @@ static OPUS_INLINE int celt_isnan(float x) | |||
| #define SUB16(a,b) ((a)-(b)) | ||||
| #define ADD32(a,b) ((a)+(b)) | ||||
| #define SUB32(a,b) ((a)-(b)) | ||||
| #define ADD32_ovflw(a,b) ((a)+(b)) | ||||
| #define SUB32_ovflw(a,b) ((a)-(b)) | ||||
| #define MULT16_16_16(a,b)     ((a)*(b)) | ||||
| #define MULT16_16(a,b)     ((opus_val32)(a)*(opus_val32)(b)) | ||||
| #define MAC16_16(c,a,b)     ((c)+(opus_val32)(a)*(opus_val32)(b)) | ||||
|  | @ -235,9 +279,9 @@ static OPUS_INLINE int celt_isnan(float x) | |||
| 
 | ||||
| #ifndef GLOBAL_STACK_SIZE | ||||
| #ifdef FIXED_POINT | ||||
| #define GLOBAL_STACK_SIZE 100000 | ||||
| #define GLOBAL_STACK_SIZE 120000 | ||||
| #else | ||||
| #define GLOBAL_STACK_SIZE 100000 | ||||
| #define GLOBAL_STACK_SIZE 120000 | ||||
| #endif | ||||
| #endif | ||||
| 
 | ||||
|  |  | |||
							
								
								
									
										353
									
								
								lib/rbcodec/codecs/libopus/celt/arm/arm2gnu.pl
									
										
									
									
									
										Executable file
									
								
							
							
						
						
									
										353
									
								
								lib/rbcodec/codecs/libopus/celt/arm/arm2gnu.pl
									
										
									
									
									
										Executable file
									
								
							|  | @ -0,0 +1,353 @@ | |||
| #!/usr/bin/perl | ||||
| # Copyright (C) 2002-2013 Xiph.org Foundation | ||||
| # | ||||
| # Redistribution and use in source and binary forms, with or without | ||||
| # modification, are permitted provided that the following conditions | ||||
| # are met: | ||||
| # | ||||
| # - Redistributions of source code must retain the above copyright | ||||
| # notice, this list of conditions and the following disclaimer. | ||||
| # | ||||
| # - Redistributions in binary form must reproduce the above copyright | ||||
| # notice, this list of conditions and the following disclaimer in the | ||||
| # documentation and/or other materials provided with the distribution. | ||||
| # | ||||
| # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
| # ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
| # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
| # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
| # OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
| # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
| # PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
| # PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
| # LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
| # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| # SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| 
 | ||||
| my $bigend;  # little/big endian | ||||
| my $nxstack; | ||||
| my $apple = 0; | ||||
| my $symprefix = ""; | ||||
| 
 | ||||
| $nxstack = 0; | ||||
| 
 | ||||
| eval 'exec /usr/local/bin/perl -S $0 ${1+"$@"}' | ||||
|     if $running_under_some_shell; | ||||
| 
 | ||||
| while ($ARGV[0] =~ /^-/) { | ||||
|     $_ = shift; | ||||
|   last if /^--$/; | ||||
|     if (/^-n$/) { | ||||
|     $nflag++; | ||||
|     next; | ||||
|     } | ||||
|     if (/^--apple$/) { | ||||
|         $apple = 1; | ||||
|         $symprefix = "_"; | ||||
|         next; | ||||
|     } | ||||
|     die "I don't recognize this switch: $_\\n"; | ||||
| } | ||||
| $printit++ unless $nflag; | ||||
| 
 | ||||
| $\ = "\n";      # automatically add newline on print | ||||
| $n=0; | ||||
| 
 | ||||
| $thumb = 0;     # ARM mode by default, not Thumb. | ||||
| @proc_stack = (); | ||||
| 
 | ||||
| printf ("    .syntax unified\n"); | ||||
| 
 | ||||
| LINE: | ||||
| while (<>) { | ||||
| 
 | ||||
|     # For ADRLs we need to add a new line after the substituted one. | ||||
|     $addPadding = 0; | ||||
| 
 | ||||
|     # First, we do not dare to touch *anything* inside double quotes, do we? | ||||
|     # Second, if you want a dollar character in the string, | ||||
|     # insert two of them -- that's how ARM C and assembler treat strings. | ||||
|     s/^([A-Za-z_]\w*)[ \t]+DCB[ \t]*\"/$1:   .ascii \"/   && do { s/\$\$/\$/g; next }; | ||||
|     s/\bDCB\b[ \t]*\"/.ascii \"/                          && do { s/\$\$/\$/g; next }; | ||||
|     s/^(\S+)\s+RN\s+(\S+)/$1 .req r$2/                    && do { s/\$\$/\$/g; next }; | ||||
|     # If there's nothing on a line but a comment, don't try to apply any further | ||||
|     #  substitutions (this is a cheap hack to avoid mucking up the license header) | ||||
|     s/^([ \t]*);/$1@/                                     && do { s/\$\$/\$/g; next }; | ||||
|     # If substituted -- leave immediately ! | ||||
| 
 | ||||
|     s/@/,:/; | ||||
|     s/;/@/; | ||||
|     while ( /@.*'/ ) { | ||||
|       s/(@.*)'/$1/g; | ||||
|     } | ||||
|     s/\{FALSE\}/0/g; | ||||
|     s/\{TRUE\}/1/g; | ||||
|     s/\{(\w\w\w\w+)\}/$1/g; | ||||
|     s/\bINCLUDE[ \t]*([^ \t\n]+)/.include \"$1\"/; | ||||
|     s/\bGET[ \t]*([^ \t\n]+)/.include \"${ my $x=$1; $x =~ s|\.s|-gnu.S|; \$x }\"/; | ||||
|     s/\bIMPORT\b/.extern/; | ||||
|     s/\bEXPORT\b\s*/.global $symprefix/; | ||||
|     s/^(\s+)\[/$1IF/; | ||||
|     s/^(\s+)\|/$1ELSE/; | ||||
|     s/^(\s+)\]/$1ENDIF/; | ||||
|     s/IF *:DEF:/ .ifdef/; | ||||
|     s/IF *:LNOT: *:DEF:/ .ifndef/; | ||||
|     s/ELSE/ .else/; | ||||
|     s/ENDIF/ .endif/; | ||||
| 
 | ||||
|     if( /\bIF\b/ ) { | ||||
|       s/\bIF\b/ .if/; | ||||
|       s/=/==/; | ||||
|     } | ||||
|     if ( $n == 2) { | ||||
|         s/\$/\\/g; | ||||
|     } | ||||
|     if ($n == 1) { | ||||
|         s/\$//g; | ||||
|         s/label//g; | ||||
|     $n = 2; | ||||
|       } | ||||
|     if ( /MACRO/ ) { | ||||
|       s/MACRO *\n/.macro/; | ||||
|       $n=1; | ||||
|     } | ||||
|     if ( /\bMEND\b/ ) { | ||||
|       s/\bMEND\b/.endm/; | ||||
|       $n=0; | ||||
|     } | ||||
| 
 | ||||
|     # ".rdata" doesn't work in 'as' version 2.13.2, as it is ".rodata" there. | ||||
|     # | ||||
|     if ( /\bAREA\b/ ) { | ||||
|         my $align; | ||||
|         $align = "2"; | ||||
|         if ( /ALIGN=(\d+)/ ) { | ||||
|             $align = $1; | ||||
|         } | ||||
|         if ( /CODE/ ) { | ||||
|             $nxstack = 1; | ||||
|         } | ||||
|         s/^(.+)CODE(.+)READONLY(.*)/    .text/; | ||||
|         s/^(.+)DATA(.+)READONLY(.*)/    .section .rdata/; | ||||
|         s/^(.+)\|\|\.data\|\|(.+)/    .data/; | ||||
|         s/^(.+)\|\|\.bss\|\|(.+)/    .bss/; | ||||
|         s/$/;   .p2align $align/; | ||||
|         # Enable NEON instructions but don't produce a binary that requires | ||||
|         # ARMv7. RVCT does not have equivalent directives, so we just do this | ||||
|         # for all CODE areas. | ||||
|         if ( /.text/ ) { | ||||
|             # Separating .arch, .fpu, etc., by semicolons does not work (gas | ||||
|             # thinks the semicolon is part of the arch name, even when there's | ||||
|             # whitespace separating them). Sadly this means our line numbers | ||||
|             # won't match the original source file (we could use the .line | ||||
|             # directive, which is documented to be obsolete, but then gdb will | ||||
|             # show the wrong line in the translated source file). | ||||
|             s/$/;   .arch armv7-a\n   .fpu neon\n   .object_arch armv4t/ unless ($apple); | ||||
|         } | ||||
|     } | ||||
| 
 | ||||
|     s/\|\|\.constdata\$(\d+)\|\|/.L_CONST$1/;       # ||.constdata$3|| | ||||
|     s/\|\|\.bss\$(\d+)\|\|/.L_BSS$1/;               # ||.bss$2|| | ||||
|     s/\|\|\.data\$(\d+)\|\|/.L_DATA$1/;             # ||.data$2|| | ||||
|     s/\|\|([a-zA-Z0-9_]+)\@([a-zA-Z0-9_]+)\|\|/@ $&/; | ||||
|     s/^(\s+)\%(\s)/    .space $1/; | ||||
| 
 | ||||
|     s/\|(.+)\.(\d+)\|/\.$1_$2/;                     # |L80.123| -> .L80_123 | ||||
|     s/\bCODE32\b/.code 32/ && do {$thumb = 0}; | ||||
|     s/\bCODE16\b/.code 16/ && do {$thumb = 1}; | ||||
|     if (/\bPROC\b/) | ||||
|     { | ||||
|         my $prefix; | ||||
|         my $proc; | ||||
|         /^([A-Za-z_\.]\w+)\b/; | ||||
|         $proc = $1; | ||||
|         $prefix = ""; | ||||
|         if ($proc) | ||||
|         { | ||||
|             $prefix = $prefix.sprintf("\t.type\t%s, %%function", $proc) unless ($apple); | ||||
|             # Make sure we $prefix isn't empty here (for the $apple case). | ||||
|             # We handle mangling the label here, make sure it doesn't match | ||||
|             # the label handling below (if $prefix would be empty). | ||||
|             $prefix = $prefix."; "; | ||||
|             push(@proc_stack, $proc); | ||||
|             s/^[A-Za-z_\.]\w+/$symprefix$&:/; | ||||
|         } | ||||
|         $prefix = $prefix."\t.thumb_func; " if ($thumb); | ||||
|         s/\bPROC\b/@ $&/; | ||||
|         $_ = $prefix.$_; | ||||
|     } | ||||
|     s/^(\s*)(S|Q|SH|U|UQ|UH)ASX\b/$1$2ADDSUBX/; | ||||
|     s/^(\s*)(S|Q|SH|U|UQ|UH)SAX\b/$1$2SUBADDX/; | ||||
|     if (/\bENDP\b/) | ||||
|     { | ||||
|         my $proc; | ||||
|         s/\bENDP\b/@ $&/; | ||||
|         $proc = pop(@proc_stack); | ||||
|         $_ = "\t.size $proc, .-$proc".$_ if ($proc && !$apple); | ||||
|     } | ||||
|     s/\bSUBT\b/@ $&/; | ||||
|     s/\bDATA\b/@ $&/;   # DATA directive is deprecated -- Asm guide, p.7-25 | ||||
|     s/\bKEEP\b/@ $&/; | ||||
|     s/\bEXPORTAS\b/@ $&/; | ||||
|     s/\|\|(.)+\bEQU\b/@ $&/; | ||||
|     s/\|\|([\w\$]+)\|\|/$1/; | ||||
|     s/\bENTRY\b/@ $&/; | ||||
|     s/\bASSERT\b/@ $&/; | ||||
|     s/\bGBLL\b/@ $&/; | ||||
|     s/\bGBLA\b/@ $&/; | ||||
|     s/^\W+OPT\b/@ $&/; | ||||
|     s/:OR:/|/g; | ||||
|     s/:SHL:/<</g; | ||||
|     s/:SHR:/>>/g; | ||||
|     s/:AND:/&/g; | ||||
|     s/:LAND:/&&/g; | ||||
|     s/CPSR/cpsr/; | ||||
|     s/SPSR/spsr/; | ||||
|     s/ALIGN$/.balign 4/; | ||||
|     s/ALIGN\s+([0-9x]+)$/.balign $1/; | ||||
|     s/psr_cxsf/psr_all/; | ||||
|     s/LTORG/.ltorg/; | ||||
|     s/^([A-Za-z_]\w*)[ \t]+EQU/ .set $1,/; | ||||
|     s/^([A-Za-z_]\w*)[ \t]+SETL/ .set $1,/; | ||||
|     s/^([A-Za-z_]\w*)[ \t]+SETA/ .set $1,/; | ||||
|     s/^([A-Za-z_]\w*)[ \t]+\*/ .set $1,/; | ||||
| 
 | ||||
|     #  {PC} + 0xdeadfeed  -->  . + 0xdeadfeed | ||||
|     s/\{PC\} \+/ \. +/; | ||||
| 
 | ||||
|     # Single hex constant on the line ! | ||||
|     # | ||||
|     # >>> NOTE <<< | ||||
|     #   Double-precision floats in gcc are always mixed-endian, which means | ||||
|     #   bytes in two words are little-endian, but words are big-endian. | ||||
|     #   So, 0x0000deadfeed0000 would be stored as 0x0000dead at low address | ||||
|     #   and 0xfeed0000 at high address. | ||||
|     # | ||||
|     s/\bDCFD\b[ \t]+0x([a-fA-F0-9]{8})([a-fA-F0-9]{8})/.long 0x$1, 0x$2/; | ||||
|     # Only decimal constants on the line, no hex ! | ||||
|     s/\bDCFD\b[ \t]+([0-9\.\-]+)/.double $1/; | ||||
| 
 | ||||
|     # Single hex constant on the line ! | ||||
| #    s/\bDCFS\b[ \t]+0x([a-f0-9]{8})([a-f0-9]{8})/.long 0x$1, 0x$2/; | ||||
|     # Only decimal constants on the line, no hex ! | ||||
| #    s/\bDCFS\b[ \t]+([0-9\.\-]+)/.double $1/; | ||||
|     s/\bDCFS[ \t]+0x/.word 0x/; | ||||
|     s/\bDCFS\b/.float/; | ||||
| 
 | ||||
|     s/^([A-Za-z_]\w*)[ \t]+DCD/$1 .word/; | ||||
|     s/\bDCD\b/.word/; | ||||
|     s/^([A-Za-z_]\w*)[ \t]+DCW/$1 .short/; | ||||
|     s/\bDCW\b/.short/; | ||||
|     s/^([A-Za-z_]\w*)[ \t]+DCB/$1 .byte/; | ||||
|     s/\bDCB\b/.byte/; | ||||
|     s/^([A-Za-z_]\w*)[ \t]+\%/.comm $1,/; | ||||
|     s/^[A-Za-z_\.]\w+/$&:/; | ||||
|     s/^(\d+)/$1:/; | ||||
|     s/\%(\d+)/$1b_or_f/; | ||||
|     s/\%[Bb](\d+)/$1b/; | ||||
|     s/\%[Ff](\d+)/$1f/; | ||||
|     s/\%[Ff][Tt](\d+)/$1f/; | ||||
|     s/&([\dA-Fa-f]+)/0x$1/; | ||||
|     if ( /\b2_[01]+\b/ ) { | ||||
|       s/\b2_([01]+)\b/conv$1&&&&/g; | ||||
|       while ( /[01][01][01][01]&&&&/ ) { | ||||
|         s/0000&&&&/&&&&0/g; | ||||
|         s/0001&&&&/&&&&1/g; | ||||
|         s/0010&&&&/&&&&2/g; | ||||
|         s/0011&&&&/&&&&3/g; | ||||
|         s/0100&&&&/&&&&4/g; | ||||
|         s/0101&&&&/&&&&5/g; | ||||
|         s/0110&&&&/&&&&6/g; | ||||
|         s/0111&&&&/&&&&7/g; | ||||
|         s/1000&&&&/&&&&8/g; | ||||
|         s/1001&&&&/&&&&9/g; | ||||
|         s/1010&&&&/&&&&A/g; | ||||
|         s/1011&&&&/&&&&B/g; | ||||
|         s/1100&&&&/&&&&C/g; | ||||
|         s/1101&&&&/&&&&D/g; | ||||
|         s/1110&&&&/&&&&E/g; | ||||
|         s/1111&&&&/&&&&F/g; | ||||
|       } | ||||
|       s/000&&&&/&&&&0/g; | ||||
|       s/001&&&&/&&&&1/g; | ||||
|       s/010&&&&/&&&&2/g; | ||||
|       s/011&&&&/&&&&3/g; | ||||
|       s/100&&&&/&&&&4/g; | ||||
|       s/101&&&&/&&&&5/g; | ||||
|       s/110&&&&/&&&&6/g; | ||||
|       s/111&&&&/&&&&7/g; | ||||
|       s/00&&&&/&&&&0/g; | ||||
|       s/01&&&&/&&&&1/g; | ||||
|       s/10&&&&/&&&&2/g; | ||||
|       s/11&&&&/&&&&3/g; | ||||
|       s/0&&&&/&&&&0/g; | ||||
|       s/1&&&&/&&&&1/g; | ||||
|       s/conv&&&&/0x/g; | ||||
|     } | ||||
| 
 | ||||
|     if ( /commandline/) | ||||
|     { | ||||
|         if( /-bigend/) | ||||
|         { | ||||
|             $bigend=1; | ||||
|         } | ||||
|     } | ||||
| 
 | ||||
|     if ( /\bDCDU\b/ ) | ||||
|     { | ||||
|         my $cmd=$_; | ||||
|         my $value; | ||||
|         my $prefix; | ||||
|         my $w1; | ||||
|         my $w2; | ||||
|         my $w3; | ||||
|         my $w4; | ||||
| 
 | ||||
|         s/\s+DCDU\b/@ $&/; | ||||
| 
 | ||||
|         $cmd =~ /\bDCDU\b\s+0x(\d+)/; | ||||
|         $value = $1; | ||||
|         $value =~ /(\w\w)(\w\w)(\w\w)(\w\w)/; | ||||
|         $w1 = $1; | ||||
|         $w2 = $2; | ||||
|         $w3 = $3; | ||||
|         $w4 = $4; | ||||
| 
 | ||||
|         if( $bigend ne "") | ||||
|         { | ||||
|             # big endian | ||||
|             $prefix = "\t.byte\t0x".$w1.";". | ||||
|                       "\t.byte\t0x".$w2.";". | ||||
|                       "\t.byte\t0x".$w3.";". | ||||
|                       "\t.byte\t0x".$w4."; "; | ||||
|         } | ||||
|         else | ||||
|         { | ||||
|             # little endian | ||||
|             $prefix = "\t.byte\t0x".$w4.";". | ||||
|                       "\t.byte\t0x".$w3.";". | ||||
|                       "\t.byte\t0x".$w2.";". | ||||
|                       "\t.byte\t0x".$w1."; "; | ||||
|         } | ||||
|         $_=$prefix.$_; | ||||
|     } | ||||
| 
 | ||||
|     if ( /\badrl\b/i ) | ||||
|     { | ||||
|         s/\badrl\s+(\w+)\s*,\s*(\w+)/ldr $1,=$2/i; | ||||
|         $addPadding = 1; | ||||
|     } | ||||
|     s/\bEND\b/@ END/; | ||||
| } continue { | ||||
|     printf ("%s", $_) if $printit; | ||||
|     if ($addPadding != 0) | ||||
|     { | ||||
|         printf ("   mov r0,r0\n"); | ||||
|         $addPadding = 0; | ||||
|     } | ||||
| } | ||||
| #If we had a code section, mark that this object doesn't need an executable | ||||
| # stack. | ||||
| if ($nxstack && !$apple) { | ||||
|     printf ("    .section\t.note.GNU-stack,\"\",\%\%progbits\n"); | ||||
| } | ||||
							
								
								
									
										160
									
								
								lib/rbcodec/codecs/libopus/celt/arm/arm_celt_map.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										160
									
								
								lib/rbcodec/codecs/libopus/celt/arm/arm_celt_map.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,160 @@ | |||
| /* Copyright (c) 2010 Xiph.Org Foundation
 | ||||
|  * Copyright (c) 2013 Parrot */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include "pitch.h" | ||||
| #include "kiss_fft.h" | ||||
| #include "mdct.h" | ||||
| 
 | ||||
| #if defined(OPUS_HAVE_RTCD) | ||||
| 
 | ||||
| # if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR) | ||||
| opus_val32 (*const CELT_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *x, const opus_val16 *y, int N) = { | ||||
|   celt_inner_prod_c,   /* ARMv4 */ | ||||
|   celt_inner_prod_c,   /* EDSP */ | ||||
|   celt_inner_prod_c,   /* Media */ | ||||
|   celt_inner_prod_neon /* NEON */ | ||||
| }; | ||||
| 
 | ||||
| void (*const DUAL_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02, | ||||
|       int N, opus_val32 *xy1, opus_val32 *xy2) = { | ||||
|   dual_inner_prod_c,   /* ARMv4 */ | ||||
|   dual_inner_prod_c,   /* EDSP */ | ||||
|   dual_inner_prod_c,   /* Media */ | ||||
|   dual_inner_prod_neon /* NEON */ | ||||
| }; | ||||
| # endif | ||||
| 
 | ||||
| # if defined(FIXED_POINT) | ||||
| #  if ((defined(OPUS_ARM_MAY_HAVE_NEON) && !defined(OPUS_ARM_PRESUME_NEON)) || \ | ||||
|     (defined(OPUS_ARM_MAY_HAVE_MEDIA) && !defined(OPUS_ARM_PRESUME_MEDIA)) || \ | ||||
|     (defined(OPUS_ARM_MAY_HAVE_EDSP) && !defined(OPUS_ARM_PRESUME_EDSP))) | ||||
| opus_val32 (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *, | ||||
|     const opus_val16 *, opus_val32 *, int, int, int) = { | ||||
|   celt_pitch_xcorr_c,               /* ARMv4 */ | ||||
|   MAY_HAVE_EDSP(celt_pitch_xcorr),  /* EDSP */ | ||||
|   MAY_HAVE_MEDIA(celt_pitch_xcorr), /* Media */ | ||||
|   MAY_HAVE_NEON(celt_pitch_xcorr)   /* NEON */ | ||||
| }; | ||||
| 
 | ||||
| #  endif | ||||
| # else /* !FIXED_POINT */ | ||||
| #  if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR) | ||||
| void (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *, | ||||
|     const opus_val16 *, opus_val32 *, int, int, int) = { | ||||
|   celt_pitch_xcorr_c,              /* ARMv4 */ | ||||
|   celt_pitch_xcorr_c,              /* EDSP */ | ||||
|   celt_pitch_xcorr_c,              /* Media */ | ||||
|   celt_pitch_xcorr_float_neon      /* Neon */ | ||||
| }; | ||||
| #  endif | ||||
| # endif /* FIXED_POINT */ | ||||
| 
 | ||||
| #if defined(FIXED_POINT) && defined(OPUS_HAVE_RTCD) && \ | ||||
|  defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR) | ||||
| 
 | ||||
| void (*const XCORR_KERNEL_IMPL[OPUS_ARCHMASK + 1])( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *y, | ||||
|          opus_val32       sum[4], | ||||
|          int              len | ||||
| ) = { | ||||
|   xcorr_kernel_c,                /* ARMv4 */ | ||||
|   xcorr_kernel_c,                /* EDSP */ | ||||
|   xcorr_kernel_c,                /* Media */ | ||||
|   xcorr_kernel_neon_fixed,       /* Neon */ | ||||
| }; | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| # if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
| #  if defined(HAVE_ARM_NE10) | ||||
| #   if defined(CUSTOM_MODES) | ||||
| int (*const OPUS_FFT_ALLOC_ARCH_IMPL[OPUS_ARCHMASK+1])(kiss_fft_state *st) = { | ||||
|    opus_fft_alloc_arch_c,        /* ARMv4 */ | ||||
|    opus_fft_alloc_arch_c,        /* EDSP */ | ||||
|    opus_fft_alloc_arch_c,        /* Media */ | ||||
|    opus_fft_alloc_arm_neon       /* Neon with NE10 library support */ | ||||
| }; | ||||
| 
 | ||||
| void (*const OPUS_FFT_FREE_ARCH_IMPL[OPUS_ARCHMASK+1])(kiss_fft_state *st) = { | ||||
|    opus_fft_free_arch_c,         /* ARMv4 */ | ||||
|    opus_fft_free_arch_c,         /* EDSP */ | ||||
|    opus_fft_free_arch_c,         /* Media */ | ||||
|    opus_fft_free_arm_neon        /* Neon with NE10 */ | ||||
| }; | ||||
| #   endif /* CUSTOM_MODES */ | ||||
| 
 | ||||
| void (*const OPUS_FFT[OPUS_ARCHMASK+1])(const kiss_fft_state *cfg, | ||||
|                                         const kiss_fft_cpx *fin, | ||||
|                                         kiss_fft_cpx *fout) = { | ||||
|    opus_fft_c,                   /* ARMv4 */ | ||||
|    opus_fft_c,                   /* EDSP */ | ||||
|    opus_fft_c,                   /* Media */ | ||||
|    opus_fft_neon                 /* Neon with NE10 */ | ||||
| }; | ||||
| 
 | ||||
| void (*const OPUS_IFFT[OPUS_ARCHMASK+1])(const kiss_fft_state *cfg, | ||||
|                                          const kiss_fft_cpx *fin, | ||||
|                                          kiss_fft_cpx *fout) = { | ||||
|    opus_ifft_c,                   /* ARMv4 */ | ||||
|    opus_ifft_c,                   /* EDSP */ | ||||
|    opus_ifft_c,                   /* Media */ | ||||
|    opus_ifft_neon                 /* Neon with NE10 */ | ||||
| }; | ||||
| 
 | ||||
| void (*const CLT_MDCT_FORWARD_IMPL[OPUS_ARCHMASK+1])(const mdct_lookup *l, | ||||
|                                                      kiss_fft_scalar *in, | ||||
|                                                      kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|                                                      const opus_val16 *window, | ||||
|                                                      int overlap, int shift, | ||||
|                                                      int stride, int arch) = { | ||||
|    clt_mdct_forward_c,           /* ARMv4 */ | ||||
|    clt_mdct_forward_c,           /* EDSP */ | ||||
|    clt_mdct_forward_c,           /* Media */ | ||||
|    clt_mdct_forward_neon         /* Neon with NE10 */ | ||||
| }; | ||||
| 
 | ||||
| void (*const CLT_MDCT_BACKWARD_IMPL[OPUS_ARCHMASK+1])(const mdct_lookup *l, | ||||
|                                                       kiss_fft_scalar *in, | ||||
|                                                       kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|                                                       const opus_val16 *window, | ||||
|                                                       int overlap, int shift, | ||||
|                                                       int stride, int arch) = { | ||||
|    clt_mdct_backward_c,           /* ARMv4 */ | ||||
|    clt_mdct_backward_c,           /* EDSP */ | ||||
|    clt_mdct_backward_c,           /* Media */ | ||||
|    clt_mdct_backward_neon         /* Neon with NE10 */ | ||||
| }; | ||||
| 
 | ||||
| #  endif /* HAVE_ARM_NE10 */ | ||||
| # endif /* OPUS_ARM_MAY_HAVE_NEON_INTR */ | ||||
| 
 | ||||
| #endif /* OPUS_HAVE_RTCD */ | ||||
							
								
								
									
										185
									
								
								lib/rbcodec/codecs/libopus/celt/arm/armcpu.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										185
									
								
								lib/rbcodec/codecs/libopus/celt/arm/armcpu.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,185 @@ | |||
| /* Copyright (c) 2010 Xiph.Org Foundation
 | ||||
|  * Copyright (c) 2013 Parrot */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| /* Original code from libtheora modified to suit to Opus */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #ifdef OPUS_HAVE_RTCD | ||||
| 
 | ||||
| #include "armcpu.h" | ||||
| #include "cpu_support.h" | ||||
| #include "os_support.h" | ||||
| #include "opus_types.h" | ||||
| #include "arch.h" | ||||
| 
 | ||||
| #define OPUS_CPU_ARM_V4_FLAG    (1<<OPUS_ARCH_ARM_V4) | ||||
| #define OPUS_CPU_ARM_EDSP_FLAG  (1<<OPUS_ARCH_ARM_EDSP) | ||||
| #define OPUS_CPU_ARM_MEDIA_FLAG (1<<OPUS_ARCH_ARM_MEDIA) | ||||
| #define OPUS_CPU_ARM_NEON_FLAG  (1<<OPUS_ARCH_ARM_NEON) | ||||
| 
 | ||||
| #if defined(_MSC_VER) | ||||
| /*For GetExceptionCode() and EXCEPTION_ILLEGAL_INSTRUCTION.*/ | ||||
| # define WIN32_LEAN_AND_MEAN | ||||
| # define WIN32_EXTRA_LEAN | ||||
| # include <windows.h> | ||||
| 
 | ||||
| static OPUS_INLINE opus_uint32 opus_cpu_capabilities(void){ | ||||
|   opus_uint32 flags; | ||||
|   flags=0; | ||||
|   /* MSVC has no OPUS_INLINE __asm support for ARM, but it does let you __emit
 | ||||
|    * instructions via their assembled hex code. | ||||
|    * All of these instructions should be essentially nops. */ | ||||
| # if defined(OPUS_ARM_MAY_HAVE_EDSP) || defined(OPUS_ARM_MAY_HAVE_MEDIA) \ | ||||
|  || defined(OPUS_ARM_MAY_HAVE_NEON) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
|   __try{ | ||||
|     /*PLD [r13]*/ | ||||
|     __emit(0xF5DDF000); | ||||
|     flags|=OPUS_CPU_ARM_EDSP_FLAG; | ||||
|   } | ||||
|   __except(GetExceptionCode()==EXCEPTION_ILLEGAL_INSTRUCTION){ | ||||
|     /*Ignore exception.*/ | ||||
|   } | ||||
| #  if defined(OPUS_ARM_MAY_HAVE_MEDIA) \ | ||||
|  || defined(OPUS_ARM_MAY_HAVE_NEON) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
|   __try{ | ||||
|     /*SHADD8 r3,r3,r3*/ | ||||
|     __emit(0xE6333F93); | ||||
|     flags|=OPUS_CPU_ARM_MEDIA_FLAG; | ||||
|   } | ||||
|   __except(GetExceptionCode()==EXCEPTION_ILLEGAL_INSTRUCTION){ | ||||
|     /*Ignore exception.*/ | ||||
|   } | ||||
| #   if defined(OPUS_ARM_MAY_HAVE_NEON) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
|   __try{ | ||||
|     /*VORR q0,q0,q0*/ | ||||
|     __emit(0xF2200150); | ||||
|     flags|=OPUS_CPU_ARM_NEON_FLAG; | ||||
|   } | ||||
|   __except(GetExceptionCode()==EXCEPTION_ILLEGAL_INSTRUCTION){ | ||||
|     /*Ignore exception.*/ | ||||
|   } | ||||
| #   endif | ||||
| #  endif | ||||
| # endif | ||||
|   return flags; | ||||
| } | ||||
| 
 | ||||
| #elif defined(__linux__) | ||||
| /* Linux based */ | ||||
| opus_uint32 opus_cpu_capabilities(void) | ||||
| { | ||||
|   opus_uint32 flags = 0; | ||||
|   FILE *cpuinfo; | ||||
| 
 | ||||
|   /* Reading /proc/self/auxv would be easier, but that doesn't work reliably on
 | ||||
|    * Android */ | ||||
|   cpuinfo = fopen("/proc/cpuinfo", "r"); | ||||
| 
 | ||||
|   if(cpuinfo != NULL) | ||||
|   { | ||||
|     /* 512 should be enough for anybody (it's even enough for all the flags that
 | ||||
|      * x86 has accumulated... so far). */ | ||||
|     char buf[512]; | ||||
| 
 | ||||
|     while(fgets(buf, 512, cpuinfo) != NULL) | ||||
|     { | ||||
| # if defined(OPUS_ARM_MAY_HAVE_EDSP) || defined(OPUS_ARM_MAY_HAVE_MEDIA) \ | ||||
|  || defined(OPUS_ARM_MAY_HAVE_NEON) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
|       /* Search for edsp and neon flag */ | ||||
|       if(memcmp(buf, "Features", 8) == 0) | ||||
|       { | ||||
|         char *p; | ||||
|         p = strstr(buf, " edsp"); | ||||
|         if(p != NULL && (p[5] == ' ' || p[5] == '\n')) | ||||
|           flags |= OPUS_CPU_ARM_EDSP_FLAG; | ||||
| 
 | ||||
| #  if defined(OPUS_ARM_MAY_HAVE_NEON) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
|         p = strstr(buf, " neon"); | ||||
|         if(p != NULL && (p[5] == ' ' || p[5] == '\n')) | ||||
|           flags |= OPUS_CPU_ARM_NEON_FLAG; | ||||
| #  endif | ||||
|       } | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_ARM_MAY_HAVE_MEDIA) \ | ||||
|  || defined(OPUS_ARM_MAY_HAVE_NEON) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
|       /* Search for media capabilities (>= ARMv6) */ | ||||
|       if(memcmp(buf, "CPU architecture:", 17) == 0) | ||||
|       { | ||||
|         int version; | ||||
|         version = atoi(buf+17); | ||||
| 
 | ||||
|         if(version >= 6) | ||||
|           flags |= OPUS_CPU_ARM_MEDIA_FLAG; | ||||
|       } | ||||
| # endif | ||||
|     } | ||||
| 
 | ||||
|     fclose(cpuinfo); | ||||
|   } | ||||
|   return flags; | ||||
| } | ||||
| #else | ||||
| /* The feature registers which can tell us what the processor supports are
 | ||||
|  * accessible in priveleged modes only, so we can't have a general user-space | ||||
|  * detection method like on x86.*/ | ||||
| # error "Configured to use ARM asm but no CPU detection method available for " \ | ||||
|    "your platform.  Reconfigure with --disable-rtcd (or send patches)." | ||||
| #endif | ||||
| 
 | ||||
| int opus_select_arch(void) | ||||
| { | ||||
|   opus_uint32 flags = opus_cpu_capabilities(); | ||||
|   int arch = 0; | ||||
| 
 | ||||
|   if(!(flags & OPUS_CPU_ARM_EDSP_FLAG)) { | ||||
|     /* Asserts ensure arch values are sequential */ | ||||
|     celt_assert(arch == OPUS_ARCH_ARM_V4); | ||||
|     return arch; | ||||
|   } | ||||
|   arch++; | ||||
| 
 | ||||
|   if(!(flags & OPUS_CPU_ARM_MEDIA_FLAG)) { | ||||
|     celt_assert(arch == OPUS_ARCH_ARM_EDSP); | ||||
|     return arch; | ||||
|   } | ||||
|   arch++; | ||||
| 
 | ||||
|   if(!(flags & OPUS_CPU_ARM_NEON_FLAG)) { | ||||
|     celt_assert(arch == OPUS_ARCH_ARM_MEDIA); | ||||
|     return arch; | ||||
|   } | ||||
|   arch++; | ||||
| 
 | ||||
|   celt_assert(arch == OPUS_ARCH_ARM_NEON); | ||||
|   return arch; | ||||
| } | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										77
									
								
								lib/rbcodec/codecs/libopus/celt/arm/armcpu.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										77
									
								
								lib/rbcodec/codecs/libopus/celt/arm/armcpu.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,77 @@ | |||
| /* Copyright (c) 2010 Xiph.Org Foundation
 | ||||
|  * Copyright (c) 2013 Parrot */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #if !defined(ARMCPU_H) | ||||
| # define ARMCPU_H | ||||
| 
 | ||||
| # if defined(OPUS_ARM_MAY_HAVE_EDSP) | ||||
| #  define MAY_HAVE_EDSP(name) name ## _edsp | ||||
| # else | ||||
| #  define MAY_HAVE_EDSP(name) name ## _c | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_ARM_MAY_HAVE_MEDIA) | ||||
| #  define MAY_HAVE_MEDIA(name) name ## _media | ||||
| # else | ||||
| #  define MAY_HAVE_MEDIA(name) MAY_HAVE_EDSP(name) | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_ARM_MAY_HAVE_NEON) | ||||
| #  define MAY_HAVE_NEON(name) name ## _neon | ||||
| # else | ||||
| #  define MAY_HAVE_NEON(name) MAY_HAVE_MEDIA(name) | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_ARM_PRESUME_EDSP) | ||||
| #  define PRESUME_EDSP(name) name ## _edsp | ||||
| # else | ||||
| #  define PRESUME_EDSP(name) name ## _c | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_ARM_PRESUME_MEDIA) | ||||
| #  define PRESUME_MEDIA(name) name ## _media | ||||
| # else | ||||
| #  define PRESUME_MEDIA(name) PRESUME_EDSP(name) | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_ARM_PRESUME_NEON) | ||||
| #  define PRESUME_NEON(name) name ## _neon | ||||
| # else | ||||
| #  define PRESUME_NEON(name) PRESUME_MEDIA(name) | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_HAVE_RTCD) | ||||
| int opus_select_arch(void); | ||||
| 
 | ||||
| #define OPUS_ARCH_ARM_V4    (0) | ||||
| #define OPUS_ARCH_ARM_EDSP  (1) | ||||
| #define OPUS_ARCH_ARM_MEDIA (2) | ||||
| #define OPUS_ARCH_ARM_NEON  (3) | ||||
| 
 | ||||
| # endif | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										37
									
								
								lib/rbcodec/codecs/libopus/celt/arm/armopts.s.in
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										37
									
								
								lib/rbcodec/codecs/libopus/celt/arm/armopts.s.in
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,37 @@ | |||
| /* Copyright (C) 2013 Mozilla Corporation */ | ||||
| /* | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
 | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
 | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| ; Set the following to 1 if we have EDSP instructions
 | ||||
| ;  (LDRD/STRD, etc., ARMv5E and later).
 | ||||
| OPUS_ARM_MAY_HAVE_EDSP  * @OPUS_ARM_MAY_HAVE_EDSP@
 | ||||
| 
 | ||||
| ; Set the following to 1 if we have ARMv6 media instructions.
 | ||||
| OPUS_ARM_MAY_HAVE_MEDIA * @OPUS_ARM_MAY_HAVE_MEDIA@
 | ||||
| 
 | ||||
| ; Set the following to 1 if we have NEON (some ARMv7)
 | ||||
| OPUS_ARM_MAY_HAVE_NEON  * @OPUS_ARM_MAY_HAVE_NEON@
 | ||||
| 
 | ||||
| END | ||||
							
								
								
									
										173
									
								
								lib/rbcodec/codecs/libopus/celt/arm/celt_fft_ne10.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										173
									
								
								lib/rbcodec/codecs/libopus/celt/arm/celt_fft_ne10.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,173 @@ | |||
| /* Copyright (c) 2015 Xiph.Org Foundation
 | ||||
|    Written by Viswanath Puttagunta */ | ||||
| /**
 | ||||
|    @file celt_fft_ne10.c | ||||
|    @brief ARM Neon optimizations for fft using NE10 library | ||||
|  */ | ||||
| 
 | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef SKIP_CONFIG_H | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| #endif | ||||
| 
 | ||||
| #include <NE10_dsp.h> | ||||
| #include "os_support.h" | ||||
| #include "kiss_fft.h" | ||||
| #include "stack_alloc.h" | ||||
| 
 | ||||
| #if !defined(FIXED_POINT) | ||||
| # define NE10_FFT_ALLOC_C2C_TYPE_NEON ne10_fft_alloc_c2c_float32_neon | ||||
| # define NE10_FFT_CFG_TYPE_T ne10_fft_cfg_float32_t | ||||
| # define NE10_FFT_STATE_TYPE_T ne10_fft_state_float32_t | ||||
| # define NE10_FFT_DESTROY_C2C_TYPE ne10_fft_destroy_c2c_float32 | ||||
| # define NE10_FFT_CPX_TYPE_T ne10_fft_cpx_float32_t | ||||
| # define NE10_FFT_C2C_1D_TYPE_NEON ne10_fft_c2c_1d_float32_neon | ||||
| #else | ||||
| # define NE10_FFT_ALLOC_C2C_TYPE_NEON(nfft) ne10_fft_alloc_c2c_int32_neon(nfft) | ||||
| # define NE10_FFT_CFG_TYPE_T ne10_fft_cfg_int32_t | ||||
| # define NE10_FFT_STATE_TYPE_T ne10_fft_state_int32_t | ||||
| # define NE10_FFT_DESTROY_C2C_TYPE ne10_fft_destroy_c2c_int32 | ||||
| # define NE10_FFT_DESTROY_C2C_TYPE ne10_fft_destroy_c2c_int32 | ||||
| # define NE10_FFT_CPX_TYPE_T ne10_fft_cpx_int32_t | ||||
| # define NE10_FFT_C2C_1D_TYPE_NEON ne10_fft_c2c_1d_int32_neon | ||||
| #endif | ||||
| 
 | ||||
| #if defined(CUSTOM_MODES) | ||||
| 
 | ||||
| /* nfft lengths in NE10 that support scaled fft */ | ||||
| # define NE10_FFTSCALED_SUPPORT_MAX 4 | ||||
| static const int ne10_fft_scaled_support[NE10_FFTSCALED_SUPPORT_MAX] = { | ||||
|    480, 240, 120, 60 | ||||
| }; | ||||
| 
 | ||||
| int opus_fft_alloc_arm_neon(kiss_fft_state *st) | ||||
| { | ||||
|    int i; | ||||
|    size_t memneeded = sizeof(struct arch_fft_state); | ||||
| 
 | ||||
|    st->arch_fft = (arch_fft_state *)opus_alloc(memneeded); | ||||
|    if (!st->arch_fft) | ||||
|       return -1; | ||||
| 
 | ||||
|    for (i = 0; i < NE10_FFTSCALED_SUPPORT_MAX; i++) { | ||||
|       if(st->nfft == ne10_fft_scaled_support[i]) | ||||
|          break; | ||||
|    } | ||||
|    if (i == NE10_FFTSCALED_SUPPORT_MAX) { | ||||
|       /* This nfft length (scaled fft) is not supported in NE10 */ | ||||
|       st->arch_fft->is_supported = 0; | ||||
|       st->arch_fft->priv = NULL; | ||||
|    } | ||||
|    else { | ||||
|       st->arch_fft->is_supported = 1; | ||||
|       st->arch_fft->priv = (void *)NE10_FFT_ALLOC_C2C_TYPE_NEON(st->nfft); | ||||
|       if (st->arch_fft->priv == NULL) { | ||||
|          return -1; | ||||
|       } | ||||
|    } | ||||
|    return 0; | ||||
| } | ||||
| 
 | ||||
| void opus_fft_free_arm_neon(kiss_fft_state *st) | ||||
| { | ||||
|    NE10_FFT_CFG_TYPE_T cfg; | ||||
| 
 | ||||
|    if (!st->arch_fft) | ||||
|       return; | ||||
| 
 | ||||
|    cfg = (NE10_FFT_CFG_TYPE_T)st->arch_fft->priv; | ||||
|    if (cfg) | ||||
|       NE10_FFT_DESTROY_C2C_TYPE(cfg); | ||||
|    opus_free(st->arch_fft); | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| void opus_fft_neon(const kiss_fft_state *st, | ||||
|                    const kiss_fft_cpx *fin, | ||||
|                    kiss_fft_cpx *fout) | ||||
| { | ||||
|    NE10_FFT_STATE_TYPE_T state; | ||||
|    NE10_FFT_CFG_TYPE_T cfg = &state; | ||||
|    VARDECL(NE10_FFT_CPX_TYPE_T, buffer); | ||||
|    SAVE_STACK; | ||||
|    ALLOC(buffer, st->nfft, NE10_FFT_CPX_TYPE_T); | ||||
| 
 | ||||
|    if (!st->arch_fft->is_supported) { | ||||
|       /* This nfft length (scaled fft) not supported in NE10 */ | ||||
|       opus_fft_c(st, fin, fout); | ||||
|    } | ||||
|    else { | ||||
|       memcpy((void *)cfg, st->arch_fft->priv, sizeof(NE10_FFT_STATE_TYPE_T)); | ||||
|       state.buffer = (NE10_FFT_CPX_TYPE_T *)&buffer[0]; | ||||
| #if !defined(FIXED_POINT) | ||||
|       state.is_forward_scaled = 1; | ||||
| 
 | ||||
|       NE10_FFT_C2C_1D_TYPE_NEON((NE10_FFT_CPX_TYPE_T *)fout, | ||||
|                                 (NE10_FFT_CPX_TYPE_T *)fin, | ||||
|                                 cfg, 0); | ||||
| #else | ||||
|       NE10_FFT_C2C_1D_TYPE_NEON((NE10_FFT_CPX_TYPE_T *)fout, | ||||
|                                 (NE10_FFT_CPX_TYPE_T *)fin, | ||||
|                                 cfg, 0, 1); | ||||
| #endif | ||||
|    } | ||||
|    RESTORE_STACK; | ||||
| } | ||||
| 
 | ||||
| void opus_ifft_neon(const kiss_fft_state *st, | ||||
|                     const kiss_fft_cpx *fin, | ||||
|                     kiss_fft_cpx *fout) | ||||
| { | ||||
|    NE10_FFT_STATE_TYPE_T state; | ||||
|    NE10_FFT_CFG_TYPE_T cfg = &state; | ||||
|    VARDECL(NE10_FFT_CPX_TYPE_T, buffer); | ||||
|    SAVE_STACK; | ||||
|    ALLOC(buffer, st->nfft, NE10_FFT_CPX_TYPE_T); | ||||
| 
 | ||||
|    if (!st->arch_fft->is_supported) { | ||||
|       /* This nfft length (scaled fft) not supported in NE10 */ | ||||
|       opus_ifft_c(st, fin, fout); | ||||
|    } | ||||
|    else { | ||||
|       memcpy((void *)cfg, st->arch_fft->priv, sizeof(NE10_FFT_STATE_TYPE_T)); | ||||
|       state.buffer = (NE10_FFT_CPX_TYPE_T *)&buffer[0]; | ||||
| #if !defined(FIXED_POINT) | ||||
|       state.is_backward_scaled = 0; | ||||
| 
 | ||||
|       NE10_FFT_C2C_1D_TYPE_NEON((NE10_FFT_CPX_TYPE_T *)fout, | ||||
|                                 (NE10_FFT_CPX_TYPE_T *)fin, | ||||
|                                 cfg, 1); | ||||
| #else | ||||
|       NE10_FFT_C2C_1D_TYPE_NEON((NE10_FFT_CPX_TYPE_T *)fout, | ||||
|                                 (NE10_FFT_CPX_TYPE_T *)fin, | ||||
|                                 cfg, 1, 0); | ||||
| #endif | ||||
|    } | ||||
|    RESTORE_STACK; | ||||
| } | ||||
							
								
								
									
										258
									
								
								lib/rbcodec/codecs/libopus/celt/arm/celt_mdct_ne10.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										258
									
								
								lib/rbcodec/codecs/libopus/celt/arm/celt_mdct_ne10.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,258 @@ | |||
| /* Copyright (c) 2015 Xiph.Org Foundation
 | ||||
|    Written by Viswanath Puttagunta */ | ||||
| /**
 | ||||
|    @file celt_mdct_ne10.c | ||||
|    @brief ARM Neon optimizations for mdct using NE10 library | ||||
|  */ | ||||
| 
 | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef SKIP_CONFIG_H | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| #endif | ||||
| 
 | ||||
| #include "kiss_fft.h" | ||||
| #include "_kiss_fft_guts.h" | ||||
| #include "mdct.h" | ||||
| #include "stack_alloc.h" | ||||
| 
 | ||||
| void clt_mdct_forward_neon(const mdct_lookup *l, | ||||
|                            kiss_fft_scalar *in, | ||||
|                            kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|                            const opus_val16 *window, | ||||
|                            int overlap, int shift, int stride, int arch) | ||||
| { | ||||
|    int i; | ||||
|    int N, N2, N4; | ||||
|    VARDECL(kiss_fft_scalar, f); | ||||
|    VARDECL(kiss_fft_cpx, f2); | ||||
|    const kiss_fft_state *st = l->kfft[shift]; | ||||
|    const kiss_twiddle_scalar *trig; | ||||
| 
 | ||||
|    SAVE_STACK; | ||||
| 
 | ||||
|    N = l->n; | ||||
|    trig = l->trig; | ||||
|    for (i=0;i<shift;i++) | ||||
|    { | ||||
|       N >>= 1; | ||||
|       trig += N; | ||||
|    } | ||||
|    N2 = N>>1; | ||||
|    N4 = N>>2; | ||||
| 
 | ||||
|    ALLOC(f, N2, kiss_fft_scalar); | ||||
|    ALLOC(f2, N4, kiss_fft_cpx); | ||||
| 
 | ||||
|    /* Consider the input to be composed of four blocks: [a, b, c, d] */ | ||||
|    /* Window, shuffle, fold */ | ||||
|    { | ||||
|       /* Temp pointers to make it really clear to the compiler what we're doing */ | ||||
|       const kiss_fft_scalar * OPUS_RESTRICT xp1 = in+(overlap>>1); | ||||
|       const kiss_fft_scalar * OPUS_RESTRICT xp2 = in+N2-1+(overlap>>1); | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp = f; | ||||
|       const opus_val16 * OPUS_RESTRICT wp1 = window+(overlap>>1); | ||||
|       const opus_val16 * OPUS_RESTRICT wp2 = window+(overlap>>1)-1; | ||||
|       for(i=0;i<((overlap+3)>>2);i++) | ||||
|       { | ||||
|          /* Real part arranged as -d-cR, Imag part arranged as -b+aR*/ | ||||
|          *yp++ = MULT16_32_Q15(*wp2, xp1[N2]) + MULT16_32_Q15(*wp1,*xp2); | ||||
|          *yp++ = MULT16_32_Q15(*wp1, *xp1)    - MULT16_32_Q15(*wp2, xp2[-N2]); | ||||
|          xp1+=2; | ||||
|          xp2-=2; | ||||
|          wp1+=2; | ||||
|          wp2-=2; | ||||
|       } | ||||
|       wp1 = window; | ||||
|       wp2 = window+overlap-1; | ||||
|       for(;i<N4-((overlap+3)>>2);i++) | ||||
|       { | ||||
|          /* Real part arranged as a-bR, Imag part arranged as -c-dR */ | ||||
|          *yp++ = *xp2; | ||||
|          *yp++ = *xp1; | ||||
|          xp1+=2; | ||||
|          xp2-=2; | ||||
|       } | ||||
|       for(;i<N4;i++) | ||||
|       { | ||||
|          /* Real part arranged as a-bR, Imag part arranged as -c-dR */ | ||||
|          *yp++ =  -MULT16_32_Q15(*wp1, xp1[-N2]) + MULT16_32_Q15(*wp2, *xp2); | ||||
|          *yp++ = MULT16_32_Q15(*wp2, *xp1)     + MULT16_32_Q15(*wp1, xp2[N2]); | ||||
|          xp1+=2; | ||||
|          xp2-=2; | ||||
|          wp1+=2; | ||||
|          wp2-=2; | ||||
|       } | ||||
|    } | ||||
|    /* Pre-rotation */ | ||||
|    { | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp = f; | ||||
|       const kiss_twiddle_scalar *t = &trig[0]; | ||||
|       for(i=0;i<N4;i++) | ||||
|       { | ||||
|          kiss_fft_cpx yc; | ||||
|          kiss_twiddle_scalar t0, t1; | ||||
|          kiss_fft_scalar re, im, yr, yi; | ||||
|          t0 = t[i]; | ||||
|          t1 = t[N4+i]; | ||||
|          re = *yp++; | ||||
|          im = *yp++; | ||||
|          yr = S_MUL(re,t0)  -  S_MUL(im,t1); | ||||
|          yi = S_MUL(im,t0)  +  S_MUL(re,t1); | ||||
|          yc.r = yr; | ||||
|          yc.i = yi; | ||||
|          f2[i] = yc; | ||||
|       } | ||||
|    } | ||||
| 
 | ||||
|    opus_fft(st, f2, (kiss_fft_cpx *)f, arch); | ||||
| 
 | ||||
|    /* Post-rotate */ | ||||
|    { | ||||
|       /* Temp pointers to make it really clear to the compiler what we're doing */ | ||||
|       const kiss_fft_cpx * OPUS_RESTRICT fp = (kiss_fft_cpx *)f; | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp1 = out; | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp2 = out+stride*(N2-1); | ||||
|       const kiss_twiddle_scalar *t = &trig[0]; | ||||
|       /* Temp pointers to make it really clear to the compiler what we're doing */ | ||||
|       for(i=0;i<N4;i++) | ||||
|       { | ||||
|          kiss_fft_scalar yr, yi; | ||||
|          yr = S_MUL(fp->i,t[N4+i]) - S_MUL(fp->r,t[i]); | ||||
|          yi = S_MUL(fp->r,t[N4+i]) + S_MUL(fp->i,t[i]); | ||||
|          *yp1 = yr; | ||||
|          *yp2 = yi; | ||||
|          fp++; | ||||
|          yp1 += 2*stride; | ||||
|          yp2 -= 2*stride; | ||||
|       } | ||||
|    } | ||||
|    RESTORE_STACK; | ||||
| } | ||||
| 
 | ||||
| void clt_mdct_backward_neon(const mdct_lookup *l, | ||||
|                             kiss_fft_scalar *in, | ||||
|                             kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|                             const opus_val16 * OPUS_RESTRICT window, | ||||
|                             int overlap, int shift, int stride, int arch) | ||||
| { | ||||
|    int i; | ||||
|    int N, N2, N4; | ||||
|    VARDECL(kiss_fft_scalar, f); | ||||
|    const kiss_twiddle_scalar *trig; | ||||
|    const kiss_fft_state *st = l->kfft[shift]; | ||||
| 
 | ||||
|    N = l->n; | ||||
|    trig = l->trig; | ||||
|    for (i=0;i<shift;i++) | ||||
|    { | ||||
|       N >>= 1; | ||||
|       trig += N; | ||||
|    } | ||||
|    N2 = N>>1; | ||||
|    N4 = N>>2; | ||||
| 
 | ||||
|    ALLOC(f, N2, kiss_fft_scalar); | ||||
| 
 | ||||
|    /* Pre-rotate */ | ||||
|    { | ||||
|       /* Temp pointers to make it really clear to the compiler what we're doing */ | ||||
|       const kiss_fft_scalar * OPUS_RESTRICT xp1 = in; | ||||
|       const kiss_fft_scalar * OPUS_RESTRICT xp2 = in+stride*(N2-1); | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp = f; | ||||
|       const kiss_twiddle_scalar * OPUS_RESTRICT t = &trig[0]; | ||||
|       for(i=0;i<N4;i++) | ||||
|       { | ||||
|          kiss_fft_scalar yr, yi; | ||||
|          yr = S_MUL(*xp2, t[i]) + S_MUL(*xp1, t[N4+i]); | ||||
|          yi = S_MUL(*xp1, t[i]) - S_MUL(*xp2, t[N4+i]); | ||||
|          yp[2*i] = yr; | ||||
|          yp[2*i+1] = yi; | ||||
|          xp1+=2*stride; | ||||
|          xp2-=2*stride; | ||||
|       } | ||||
|    } | ||||
| 
 | ||||
|    opus_ifft(st, (kiss_fft_cpx *)f, (kiss_fft_cpx*)(out+(overlap>>1)), arch); | ||||
| 
 | ||||
|    /* Post-rotate and de-shuffle from both ends of the buffer at once to make
 | ||||
|       it in-place. */ | ||||
|    { | ||||
|       kiss_fft_scalar * yp0 = out+(overlap>>1); | ||||
|       kiss_fft_scalar * yp1 = out+(overlap>>1)+N2-2; | ||||
|       const kiss_twiddle_scalar *t = &trig[0]; | ||||
|       /* Loop to (N4+1)>>1 to handle odd N4. When N4 is odd, the
 | ||||
|          middle pair will be computed twice. */ | ||||
|       for(i=0;i<(N4+1)>>1;i++) | ||||
|       { | ||||
|          kiss_fft_scalar re, im, yr, yi; | ||||
|          kiss_twiddle_scalar t0, t1; | ||||
|          re = yp0[0]; | ||||
|          im = yp0[1]; | ||||
|          t0 = t[i]; | ||||
|          t1 = t[N4+i]; | ||||
|          /* We'd scale up by 2 here, but instead it's done when mixing the windows */ | ||||
|          yr = S_MUL(re,t0) + S_MUL(im,t1); | ||||
|          yi = S_MUL(re,t1) - S_MUL(im,t0); | ||||
|          re = yp1[0]; | ||||
|          im = yp1[1]; | ||||
|          yp0[0] = yr; | ||||
|          yp1[1] = yi; | ||||
| 
 | ||||
|          t0 = t[(N4-i-1)]; | ||||
|          t1 = t[(N2-i-1)]; | ||||
|          /* We'd scale up by 2 here, but instead it's done when mixing the windows */ | ||||
|          yr = S_MUL(re,t0) + S_MUL(im,t1); | ||||
|          yi = S_MUL(re,t1) - S_MUL(im,t0); | ||||
|          yp1[0] = yr; | ||||
|          yp0[1] = yi; | ||||
|          yp0 += 2; | ||||
|          yp1 -= 2; | ||||
|       } | ||||
|    } | ||||
| 
 | ||||
|    /* Mirror on both sides for TDAC */ | ||||
|    { | ||||
|       kiss_fft_scalar * OPUS_RESTRICT xp1 = out+overlap-1; | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp1 = out; | ||||
|       const opus_val16 * OPUS_RESTRICT wp1 = window; | ||||
|       const opus_val16 * OPUS_RESTRICT wp2 = window+overlap-1; | ||||
| 
 | ||||
|       for(i = 0; i < overlap/2; i++) | ||||
|       { | ||||
|          kiss_fft_scalar x1, x2; | ||||
|          x1 = *xp1; | ||||
|          x2 = *yp1; | ||||
|          *yp1++ = MULT16_32_Q15(*wp2, x2) - MULT16_32_Q15(*wp1, x1); | ||||
|          *xp1-- = MULT16_32_Q15(*wp1, x2) + MULT16_32_Q15(*wp2, x1); | ||||
|          wp1++; | ||||
|          wp2--; | ||||
|       } | ||||
|    } | ||||
|    RESTORE_STACK; | ||||
| } | ||||
							
								
								
									
										211
									
								
								lib/rbcodec/codecs/libopus/celt/arm/celt_neon_intr.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										211
									
								
								lib/rbcodec/codecs/libopus/celt/arm/celt_neon_intr.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,211 @@ | |||
| /* Copyright (c) 2014-2015 Xiph.Org Foundation
 | ||||
|    Written by Viswanath Puttagunta */ | ||||
| /**
 | ||||
|    @file celt_neon_intr.c | ||||
|    @brief ARM Neon Intrinsic optimizations for celt | ||||
|  */ | ||||
| 
 | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <arm_neon.h> | ||||
| #include "../pitch.h" | ||||
| 
 | ||||
| #if defined(FIXED_POINT) | ||||
| void xcorr_kernel_neon_fixed(const opus_val16 * x, const opus_val16 * y, opus_val32 sum[4], int len) | ||||
| { | ||||
|    int j; | ||||
|    int32x4_t a = vld1q_s32(sum); | ||||
|    /* Load y[0...3] */ | ||||
|    /* This requires len>0 to always be valid (which we assert in the C code). */ | ||||
|    int16x4_t y0 = vld1_s16(y); | ||||
|    y += 4; | ||||
| 
 | ||||
|    for (j = 0; j + 8 <= len; j += 8) | ||||
|    { | ||||
|       /* Load x[0...7] */ | ||||
|       int16x8_t xx = vld1q_s16(x); | ||||
|       int16x4_t x0 = vget_low_s16(xx); | ||||
|       int16x4_t x4 = vget_high_s16(xx); | ||||
|       /* Load y[4...11] */ | ||||
|       int16x8_t yy = vld1q_s16(y); | ||||
|       int16x4_t y4 = vget_low_s16(yy); | ||||
|       int16x4_t y8 = vget_high_s16(yy); | ||||
|       int32x4_t a0 = vmlal_lane_s16(a, y0, x0, 0); | ||||
|       int32x4_t a1 = vmlal_lane_s16(a0, y4, x4, 0); | ||||
| 
 | ||||
|       int16x4_t y1 = vext_s16(y0, y4, 1); | ||||
|       int16x4_t y5 = vext_s16(y4, y8, 1); | ||||
|       int32x4_t a2 = vmlal_lane_s16(a1, y1, x0, 1); | ||||
|       int32x4_t a3 = vmlal_lane_s16(a2, y5, x4, 1); | ||||
| 
 | ||||
|       int16x4_t y2 = vext_s16(y0, y4, 2); | ||||
|       int16x4_t y6 = vext_s16(y4, y8, 2); | ||||
|       int32x4_t a4 = vmlal_lane_s16(a3, y2, x0, 2); | ||||
|       int32x4_t a5 = vmlal_lane_s16(a4, y6, x4, 2); | ||||
| 
 | ||||
|       int16x4_t y3 = vext_s16(y0, y4, 3); | ||||
|       int16x4_t y7 = vext_s16(y4, y8, 3); | ||||
|       int32x4_t a6 = vmlal_lane_s16(a5, y3, x0, 3); | ||||
|       int32x4_t a7 = vmlal_lane_s16(a6, y7, x4, 3); | ||||
| 
 | ||||
|       y0 = y8; | ||||
|       a = a7; | ||||
|       x += 8; | ||||
|       y += 8; | ||||
|    } | ||||
| 
 | ||||
|    for (; j < len; j++) | ||||
|    { | ||||
|       int16x4_t x0 = vld1_dup_s16(x);  /* load next x */ | ||||
|       int32x4_t a0 = vmlal_s16(a, y0, x0); | ||||
| 
 | ||||
|       int16x4_t y4 = vld1_dup_s16(y);  /* load next y */ | ||||
|       y0 = vext_s16(y0, y4, 1); | ||||
|       a = a0; | ||||
|       x++; | ||||
|       y++; | ||||
|    } | ||||
| 
 | ||||
|    vst1q_s32(sum, a); | ||||
| } | ||||
| 
 | ||||
| #else | ||||
| /*
 | ||||
|  * Function: xcorr_kernel_neon_float | ||||
|  * --------------------------------- | ||||
|  * Computes 4 correlation values and stores them in sum[4] | ||||
|  */ | ||||
| static void xcorr_kernel_neon_float(const float32_t *x, const float32_t *y, | ||||
|       float32_t sum[4], int len) { | ||||
|    float32x4_t YY[3]; | ||||
|    float32x4_t YEXT[3]; | ||||
|    float32x4_t XX[2]; | ||||
|    float32x2_t XX_2; | ||||
|    float32x4_t SUMM; | ||||
|    const float32_t *xi = x; | ||||
|    const float32_t *yi = y; | ||||
| 
 | ||||
|    celt_assert(len>0); | ||||
| 
 | ||||
|    YY[0] = vld1q_f32(yi); | ||||
|    SUMM = vdupq_n_f32(0); | ||||
| 
 | ||||
|    /* Consume 8 elements in x vector and 12 elements in y
 | ||||
|     * vector. However, the 12'th element never really gets | ||||
|     * touched in this loop. So, if len == 8, then we only | ||||
|     * must access y[0] to y[10]. y[11] must not be accessed | ||||
|     * hence make sure len > 8 and not len >= 8 | ||||
|     */ | ||||
|    while (len > 8) { | ||||
|       yi += 4; | ||||
|       YY[1] = vld1q_f32(yi); | ||||
|       yi += 4; | ||||
|       YY[2] = vld1q_f32(yi); | ||||
| 
 | ||||
|       XX[0] = vld1q_f32(xi); | ||||
|       xi += 4; | ||||
|       XX[1] = vld1q_f32(xi); | ||||
|       xi += 4; | ||||
| 
 | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YY[0], vget_low_f32(XX[0]), 0); | ||||
|       YEXT[0] = vextq_f32(YY[0], YY[1], 1); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[0], vget_low_f32(XX[0]), 1); | ||||
|       YEXT[1] = vextq_f32(YY[0], YY[1], 2); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[1], vget_high_f32(XX[0]), 0); | ||||
|       YEXT[2] = vextq_f32(YY[0], YY[1], 3); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[2], vget_high_f32(XX[0]), 1); | ||||
| 
 | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YY[1], vget_low_f32(XX[1]), 0); | ||||
|       YEXT[0] = vextq_f32(YY[1], YY[2], 1); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[0], vget_low_f32(XX[1]), 1); | ||||
|       YEXT[1] = vextq_f32(YY[1], YY[2], 2); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[1], vget_high_f32(XX[1]), 0); | ||||
|       YEXT[2] = vextq_f32(YY[1], YY[2], 3); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[2], vget_high_f32(XX[1]), 1); | ||||
| 
 | ||||
|       YY[0] = YY[2]; | ||||
|       len -= 8; | ||||
|    } | ||||
| 
 | ||||
|    /* Consume 4 elements in x vector and 8 elements in y
 | ||||
|     * vector. However, the 8'th element in y never really gets | ||||
|     * touched in this loop. So, if len == 4, then we only | ||||
|     * must access y[0] to y[6]. y[7] must not be accessed | ||||
|     * hence make sure len>4 and not len>=4 | ||||
|     */ | ||||
|    if (len > 4) { | ||||
|       yi += 4; | ||||
|       YY[1] = vld1q_f32(yi); | ||||
| 
 | ||||
|       XX[0] = vld1q_f32(xi); | ||||
|       xi += 4; | ||||
| 
 | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YY[0], vget_low_f32(XX[0]), 0); | ||||
|       YEXT[0] = vextq_f32(YY[0], YY[1], 1); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[0], vget_low_f32(XX[0]), 1); | ||||
|       YEXT[1] = vextq_f32(YY[0], YY[1], 2); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[1], vget_high_f32(XX[0]), 0); | ||||
|       YEXT[2] = vextq_f32(YY[0], YY[1], 3); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YEXT[2], vget_high_f32(XX[0]), 1); | ||||
| 
 | ||||
|       YY[0] = YY[1]; | ||||
|       len -= 4; | ||||
|    } | ||||
| 
 | ||||
|    while (--len > 0) { | ||||
|       XX_2 = vld1_dup_f32(xi++); | ||||
|       SUMM = vmlaq_lane_f32(SUMM, YY[0], XX_2, 0); | ||||
|       YY[0]= vld1q_f32(++yi); | ||||
|    } | ||||
| 
 | ||||
|    XX_2 = vld1_dup_f32(xi); | ||||
|    SUMM = vmlaq_lane_f32(SUMM, YY[0], XX_2, 0); | ||||
| 
 | ||||
|    vst1q_f32(sum, SUMM); | ||||
| } | ||||
| 
 | ||||
| void celt_pitch_xcorr_float_neon(const opus_val16 *_x, const opus_val16 *_y, | ||||
|                         opus_val32 *xcorr, int len, int max_pitch, int arch) { | ||||
|    int i; | ||||
|    (void)arch; | ||||
|    celt_assert(max_pitch > 0); | ||||
|    celt_sig_assert((((unsigned char *)_x-(unsigned char *)NULL)&3)==0); | ||||
| 
 | ||||
|    for (i = 0; i < (max_pitch-3); i += 4) { | ||||
|       xcorr_kernel_neon_float((const float32_t *)_x, (const float32_t *)_y+i, | ||||
|             (float32_t *)xcorr+i, len); | ||||
|    } | ||||
| 
 | ||||
|    /* In case max_pitch isn't a multiple of 4, do non-unrolled version. */ | ||||
|    for (; i < max_pitch; i++) { | ||||
|       xcorr[i] = celt_inner_prod_neon(_x, _y+i, len); | ||||
|    } | ||||
| } | ||||
| #endif | ||||
							
								
								
									
										551
									
								
								lib/rbcodec/codecs/libopus/celt/arm/celt_pitch_xcorr_arm.s
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										551
									
								
								lib/rbcodec/codecs/libopus/celt/arm/celt_pitch_xcorr_arm.s
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,551 @@ | |||
| ; Copyright (c) 2007-2008 CSIRO
 | ||||
| ; Copyright (c) 2007-2009 Xiph.Org Foundation
 | ||||
| ; Copyright (c) 2013      Parrot
 | ||||
| ; Written by Aurélien Zanelli
 | ||||
| ;
 | ||||
| ; Redistribution and use in source and binary forms, with or without
 | ||||
| ; modification, are permitted provided that the following conditions
 | ||||
| ; are met:
 | ||||
| ;
 | ||||
| ; - Redistributions of source code must retain the above copyright
 | ||||
| ; notice, this list of conditions and the following disclaimer.
 | ||||
| ;
 | ||||
| ; - Redistributions in binary form must reproduce the above copyright
 | ||||
| ; notice, this list of conditions and the following disclaimer in the
 | ||||
| ; documentation and/or other materials provided with the distribution.
 | ||||
| ;
 | ||||
| ; THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 | ||||
| ; ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 | ||||
| ; LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 | ||||
| ; A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
 | ||||
| ; OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
 | ||||
| ; EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
 | ||||
| ; PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
 | ||||
| ; PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
 | ||||
| ; LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
 | ||||
| ; NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 | ||||
| ; SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | ||||
| 
 | ||||
|   AREA  |.text|, CODE, READONLY | ||||
| 
 | ||||
|   GET    celt/arm/armopts.s | ||||
| 
 | ||||
| IF OPUS_ARM_MAY_HAVE_EDSP | ||||
|   EXPORT celt_pitch_xcorr_edsp | ||||
| ENDIF | ||||
| 
 | ||||
| IF OPUS_ARM_MAY_HAVE_NEON | ||||
|   EXPORT celt_pitch_xcorr_neon | ||||
| ENDIF | ||||
| 
 | ||||
| IF OPUS_ARM_MAY_HAVE_NEON | ||||
| 
 | ||||
| ; Compute sum[k]=sum(x[j]*y[j+k],j=0...len-1), k=0...3
 | ||||
| xcorr_kernel_neon PROC | ||||
| xcorr_kernel_neon_start | ||||
|   ; input:
 | ||||
|   ;   r3     = int         len
 | ||||
|   ;   r4     = opus_val16 *x
 | ||||
|   ;   r5     = opus_val16 *y
 | ||||
|   ;   q0     = opus_val32  sum[4]
 | ||||
|   ; output:
 | ||||
|   ;   q0     = opus_val32  sum[4]
 | ||||
|   ; preserved: r0-r3, r6-r11, d2, q4-q7, q9-q15
 | ||||
|   ; internal usage:
 | ||||
|   ;   r12 = int j
 | ||||
|   ;   d3  = y_3|y_2|y_1|y_0
 | ||||
|   ;   q2  = y_B|y_A|y_9|y_8|y_7|y_6|y_5|y_4
 | ||||
|   ;   q3  = x_7|x_6|x_5|x_4|x_3|x_2|x_1|x_0
 | ||||
|   ;   q8  = scratch
 | ||||
|   ;
 | ||||
|   ; Load y[0...3]
 | ||||
|   ; This requires len>0 to always be valid (which we assert in the C code).
 | ||||
|   VLD1.16      {d5}, [r5]! | ||||
|   SUBS         r12, r3, #8 | ||||
|   BLE xcorr_kernel_neon_process4 | ||||
| ; Process 8 samples at a time.
 | ||||
| ; This loop loads one y value more than we actually need. Therefore we have to
 | ||||
| ; stop as soon as there are 8 or fewer samples left (instead of 7), to avoid
 | ||||
| ; reading past the end of the array.
 | ||||
| xcorr_kernel_neon_process8 | ||||
|   ; This loop has 19 total instructions (10 cycles to issue, minimum), with
 | ||||
|   ; - 2 cycles of ARM insrtuctions,
 | ||||
|   ; - 10 cycles of load/store/byte permute instructions, and
 | ||||
|   ; - 9 cycles of data processing instructions.
 | ||||
|   ; On a Cortex A8, we dual-issue the maximum amount (9 cycles) between the
 | ||||
|   ; latter two categories, meaning the whole loop should run in 10 cycles per
 | ||||
|   ; iteration, barring cache misses.
 | ||||
|   ;
 | ||||
|   ; Load x[0...7]
 | ||||
|   VLD1.16      {d6, d7}, [r4]! | ||||
|   ; Unlike VMOV, VAND is a data processsing instruction (and doesn't get
 | ||||
|   ; assembled to VMOV, like VORR would), so it dual-issues with the prior VLD1.
 | ||||
|   VAND         d3, d5, d5 | ||||
|   SUBS         r12, r12, #8 | ||||
|   ; Load y[4...11]
 | ||||
|   VLD1.16      {d4, d5}, [r5]! | ||||
|   VMLAL.S16    q0, d3, d6[0] | ||||
|   VEXT.16      d16, d3, d4, #1 | ||||
|   VMLAL.S16    q0, d4, d7[0] | ||||
|   VEXT.16      d17, d4, d5, #1 | ||||
|   VMLAL.S16    q0, d16, d6[1] | ||||
|   VEXT.16      d16, d3, d4, #2 | ||||
|   VMLAL.S16    q0, d17, d7[1] | ||||
|   VEXT.16      d17, d4, d5, #2 | ||||
|   VMLAL.S16    q0, d16, d6[2] | ||||
|   VEXT.16      d16, d3, d4, #3 | ||||
|   VMLAL.S16    q0, d17, d7[2] | ||||
|   VEXT.16      d17, d4, d5, #3 | ||||
|   VMLAL.S16    q0, d16, d6[3] | ||||
|   VMLAL.S16    q0, d17, d7[3] | ||||
|   BGT xcorr_kernel_neon_process8 | ||||
| ; Process 4 samples here if we have > 4 left (still reading one extra y value).
 | ||||
| xcorr_kernel_neon_process4 | ||||
|   ADDS         r12, r12, #4 | ||||
|   BLE xcorr_kernel_neon_process2 | ||||
|   ; Load x[0...3]
 | ||||
|   VLD1.16      d6, [r4]! | ||||
|   ; Use VAND since it's a data processing instruction again.
 | ||||
|   VAND         d4, d5, d5 | ||||
|   SUB          r12, r12, #4 | ||||
|   ; Load y[4...7]
 | ||||
|   VLD1.16      d5, [r5]! | ||||
|   VMLAL.S16    q0, d4, d6[0] | ||||
|   VEXT.16      d16, d4, d5, #1 | ||||
|   VMLAL.S16    q0, d16, d6[1] | ||||
|   VEXT.16      d16, d4, d5, #2 | ||||
|   VMLAL.S16    q0, d16, d6[2] | ||||
|   VEXT.16      d16, d4, d5, #3 | ||||
|   VMLAL.S16    q0, d16, d6[3] | ||||
| ; Process 2 samples here if we have > 2 left (still reading one extra y value).
 | ||||
| xcorr_kernel_neon_process2 | ||||
|   ADDS         r12, r12, #2 | ||||
|   BLE xcorr_kernel_neon_process1 | ||||
|   ; Load x[0...1]
 | ||||
|   VLD2.16      {d6[],d7[]}, [r4]! | ||||
|   ; Use VAND since it's a data processing instruction again.
 | ||||
|   VAND         d4, d5, d5 | ||||
|   SUB          r12, r12, #2 | ||||
|   ; Load y[4...5]
 | ||||
|   VLD1.32      {d5[]}, [r5]! | ||||
|   VMLAL.S16    q0, d4, d6 | ||||
|   VEXT.16      d16, d4, d5, #1 | ||||
|   ; Replace bottom copy of {y5,y4} in d5 with {y3,y2} from d4, using VSRI
 | ||||
|   ; instead of VEXT, since it's a data-processing instruction.
 | ||||
|   VSRI.64      d5, d4, #32 | ||||
|   VMLAL.S16    q0, d16, d7 | ||||
| ; Process 1 sample using the extra y value we loaded above.
 | ||||
| xcorr_kernel_neon_process1 | ||||
|   ; Load next *x
 | ||||
|   VLD1.16      {d6[]}, [r4]! | ||||
|   ADDS         r12, r12, #1 | ||||
|   ; y[0...3] are left in d5 from prior iteration(s) (if any)
 | ||||
|   VMLAL.S16    q0, d5, d6 | ||||
|   MOVLE        pc, lr | ||||
| ; Now process 1 last sample, not reading ahead.
 | ||||
|   ; Load last *y
 | ||||
|   VLD1.16      {d4[]}, [r5]! | ||||
|   VSRI.64      d4, d5, #16 | ||||
|   ; Load last *x
 | ||||
|   VLD1.16      {d6[]}, [r4]! | ||||
|   VMLAL.S16    q0, d4, d6 | ||||
|   MOV          pc, lr | ||||
|   ENDP | ||||
| 
 | ||||
| ; opus_val32 celt_pitch_xcorr_neon(opus_val16 *_x, opus_val16 *_y,
 | ||||
| ;  opus_val32 *xcorr, int len, int max_pitch, int arch)
 | ||||
| celt_pitch_xcorr_neon PROC | ||||
|   ; input:
 | ||||
|   ;   r0  = opus_val16 *_x
 | ||||
|   ;   r1  = opus_val16 *_y
 | ||||
|   ;   r2  = opus_val32 *xcorr
 | ||||
|   ;   r3  = int         len
 | ||||
|   ; output:
 | ||||
|   ;   r0  = int         maxcorr
 | ||||
|   ; internal usage:
 | ||||
|   ;   r4  = opus_val16 *x (for xcorr_kernel_neon())
 | ||||
|   ;   r5  = opus_val16 *y (for xcorr_kernel_neon())
 | ||||
|   ;   r6  = int         max_pitch
 | ||||
|   ;   r12 = int         j
 | ||||
|   ;   q15 = int         maxcorr[4] (q15 is not used by xcorr_kernel_neon())
 | ||||
|   ; ignored:
 | ||||
|   ;         int         arch
 | ||||
|   STMFD        sp!, {r4-r6, lr} | ||||
|   LDR          r6, [sp, #16] | ||||
|   VMOV.S32     q15, #1 | ||||
|   ; if (max_pitch < 4) goto celt_pitch_xcorr_neon_process4_done
 | ||||
|   SUBS         r6, r6, #4 | ||||
|   BLT celt_pitch_xcorr_neon_process4_done | ||||
| celt_pitch_xcorr_neon_process4 | ||||
|   ; xcorr_kernel_neon parameters:
 | ||||
|   ; r3 = len, r4 = _x, r5 = _y, q0 = {0, 0, 0, 0}
 | ||||
|   MOV          r4, r0 | ||||
|   MOV          r5, r1 | ||||
|   VEOR         q0, q0, q0 | ||||
|   ; xcorr_kernel_neon only modifies r4, r5, r12, and q0...q3.
 | ||||
|   ; So we don't save/restore any other registers.
 | ||||
|   BL xcorr_kernel_neon_start | ||||
|   SUBS         r6, r6, #4 | ||||
|   VST1.32      {q0}, [r2]! | ||||
|   ; _y += 4
 | ||||
|   ADD          r1, r1, #8 | ||||
|   VMAX.S32     q15, q15, q0 | ||||
|   ; if (max_pitch < 4) goto celt_pitch_xcorr_neon_process4_done
 | ||||
|   BGE celt_pitch_xcorr_neon_process4 | ||||
| ; We have less than 4 sums left to compute.
 | ||||
| celt_pitch_xcorr_neon_process4_done | ||||
|   ADDS         r6, r6, #4 | ||||
|   ; Reduce maxcorr to a single value
 | ||||
|   VMAX.S32     d30, d30, d31 | ||||
|   VPMAX.S32    d30, d30, d30 | ||||
|   ; if (max_pitch <= 0) goto celt_pitch_xcorr_neon_done
 | ||||
|   BLE celt_pitch_xcorr_neon_done | ||||
| ; Now compute each remaining sum one at a time.
 | ||||
| celt_pitch_xcorr_neon_process_remaining | ||||
|   MOV          r4, r0 | ||||
|   MOV          r5, r1 | ||||
|   VMOV.I32     q0, #0 | ||||
|   SUBS         r12, r3, #8 | ||||
|   BLT celt_pitch_xcorr_neon_process_remaining4 | ||||
| ; Sum terms 8 at a time.
 | ||||
| celt_pitch_xcorr_neon_process_remaining_loop8 | ||||
|   ; Load x[0...7]
 | ||||
|   VLD1.16      {q1}, [r4]! | ||||
|   ; Load y[0...7]
 | ||||
|   VLD1.16      {q2}, [r5]! | ||||
|   SUBS         r12, r12, #8 | ||||
|   VMLAL.S16    q0, d4, d2 | ||||
|   VMLAL.S16    q0, d5, d3 | ||||
|   BGE celt_pitch_xcorr_neon_process_remaining_loop8 | ||||
| ; Sum terms 4 at a time.
 | ||||
| celt_pitch_xcorr_neon_process_remaining4 | ||||
|   ADDS         r12, r12, #4 | ||||
|   BLT celt_pitch_xcorr_neon_process_remaining4_done | ||||
|   ; Load x[0...3]
 | ||||
|   VLD1.16      {d2}, [r4]! | ||||
|   ; Load y[0...3]
 | ||||
|   VLD1.16      {d3}, [r5]! | ||||
|   SUB          r12, r12, #4 | ||||
|   VMLAL.S16    q0, d3, d2 | ||||
| celt_pitch_xcorr_neon_process_remaining4_done | ||||
|   ; Reduce the sum to a single value.
 | ||||
|   VADD.S32     d0, d0, d1 | ||||
|   VPADDL.S32   d0, d0 | ||||
|   ADDS         r12, r12, #4 | ||||
|   BLE celt_pitch_xcorr_neon_process_remaining_loop_done | ||||
| ; Sum terms 1 at a time.
 | ||||
| celt_pitch_xcorr_neon_process_remaining_loop1 | ||||
|   VLD1.16      {d2[]}, [r4]! | ||||
|   VLD1.16      {d3[]}, [r5]! | ||||
|   SUBS         r12, r12, #1 | ||||
|   VMLAL.S16    q0, d2, d3 | ||||
|   BGT celt_pitch_xcorr_neon_process_remaining_loop1 | ||||
| celt_pitch_xcorr_neon_process_remaining_loop_done | ||||
|   VST1.32      {d0[0]}, [r2]! | ||||
|   VMAX.S32     d30, d30, d0 | ||||
|   SUBS         r6, r6, #1 | ||||
|   ; _y++
 | ||||
|   ADD          r1, r1, #2 | ||||
|   ; if (--max_pitch > 0) goto celt_pitch_xcorr_neon_process_remaining
 | ||||
|   BGT celt_pitch_xcorr_neon_process_remaining | ||||
| celt_pitch_xcorr_neon_done | ||||
|   VMOV.32      r0, d30[0] | ||||
|   LDMFD        sp!, {r4-r6, pc} | ||||
|   ENDP | ||||
| 
 | ||||
| ENDIF | ||||
| 
 | ||||
| IF OPUS_ARM_MAY_HAVE_EDSP | ||||
| 
 | ||||
| ; This will get used on ARMv7 devices without NEON, so it has been optimized
 | ||||
| ; to take advantage of dual-issuing where possible.
 | ||||
| xcorr_kernel_edsp PROC | ||||
| xcorr_kernel_edsp_start | ||||
|   ; input:
 | ||||
|   ;   r3      = int         len
 | ||||
|   ;   r4      = opus_val16 *_x (must be 32-bit aligned)
 | ||||
|   ;   r5      = opus_val16 *_y (must be 32-bit aligned)
 | ||||
|   ;   r6...r9 = opus_val32  sum[4]
 | ||||
|   ; output:
 | ||||
|   ;   r6...r9 = opus_val32  sum[4]
 | ||||
|   ; preserved: r0-r5
 | ||||
|   ; internal usage
 | ||||
|   ;   r2      = int         j
 | ||||
|   ;   r12,r14 = opus_val16  x[4]
 | ||||
|   ;   r10,r11 = opus_val16  y[4]
 | ||||
|   STMFD        sp!, {r2,r4,r5,lr} | ||||
|   LDR          r10, [r5], #4      ; Load y[0...1]
 | ||||
|   SUBS         r2, r3, #4         ; j = len-4
 | ||||
|   LDR          r11, [r5], #4      ; Load y[2...3]
 | ||||
|   BLE xcorr_kernel_edsp_process4_done | ||||
|   LDR          r12, [r4], #4      ; Load x[0...1]
 | ||||
|   ; Stall
 | ||||
| xcorr_kernel_edsp_process4 | ||||
|   ; The multiplies must issue from pipeline 0, and can't dual-issue with each
 | ||||
|   ; other. Every other instruction here dual-issues with a multiply, and is
 | ||||
|   ; thus "free". There should be no stalls in the body of the loop.
 | ||||
|   SMLABB       r6, r12, r10, r6   ; sum[0] = MAC16_16(sum[0],x_0,y_0)
 | ||||
|   LDR          r14, [r4], #4      ; Load x[2...3]
 | ||||
|   SMLABT       r7, r12, r10, r7   ; sum[1] = MAC16_16(sum[1],x_0,y_1)
 | ||||
|   SUBS         r2, r2, #4         ; j-=4
 | ||||
|   SMLABB       r8, r12, r11, r8   ; sum[2] = MAC16_16(sum[2],x_0,y_2)
 | ||||
|   SMLABT       r9, r12, r11, r9   ; sum[3] = MAC16_16(sum[3],x_0,y_3)
 | ||||
|   SMLATT       r6, r12, r10, r6   ; sum[0] = MAC16_16(sum[0],x_1,y_1)
 | ||||
|   LDR          r10, [r5], #4      ; Load y[4...5]
 | ||||
|   SMLATB       r7, r12, r11, r7   ; sum[1] = MAC16_16(sum[1],x_1,y_2)
 | ||||
|   SMLATT       r8, r12, r11, r8   ; sum[2] = MAC16_16(sum[2],x_1,y_3)
 | ||||
|   SMLATB       r9, r12, r10, r9   ; sum[3] = MAC16_16(sum[3],x_1,y_4)
 | ||||
|   LDRGT        r12, [r4], #4      ; Load x[0...1]
 | ||||
|   SMLABB       r6, r14, r11, r6   ; sum[0] = MAC16_16(sum[0],x_2,y_2)
 | ||||
|   SMLABT       r7, r14, r11, r7   ; sum[1] = MAC16_16(sum[1],x_2,y_3)
 | ||||
|   SMLABB       r8, r14, r10, r8   ; sum[2] = MAC16_16(sum[2],x_2,y_4)
 | ||||
|   SMLABT       r9, r14, r10, r9   ; sum[3] = MAC16_16(sum[3],x_2,y_5)
 | ||||
|   SMLATT       r6, r14, r11, r6   ; sum[0] = MAC16_16(sum[0],x_3,y_3)
 | ||||
|   LDR          r11, [r5], #4      ; Load y[6...7]
 | ||||
|   SMLATB       r7, r14, r10, r7   ; sum[1] = MAC16_16(sum[1],x_3,y_4)
 | ||||
|   SMLATT       r8, r14, r10, r8   ; sum[2] = MAC16_16(sum[2],x_3,y_5)
 | ||||
|   SMLATB       r9, r14, r11, r9   ; sum[3] = MAC16_16(sum[3],x_3,y_6)
 | ||||
|   BGT xcorr_kernel_edsp_process4 | ||||
| xcorr_kernel_edsp_process4_done | ||||
|   ADDS         r2, r2, #4 | ||||
|   BLE xcorr_kernel_edsp_done | ||||
|   LDRH         r12, [r4], #2      ; r12 = *x++
 | ||||
|   SUBS         r2, r2, #1         ; j--
 | ||||
|   ; Stall
 | ||||
|   SMLABB       r6, r12, r10, r6   ; sum[0] = MAC16_16(sum[0],x,y_0)
 | ||||
|   LDRHGT       r14, [r4], #2      ; r14 = *x++
 | ||||
|   SMLABT       r7, r12, r10, r7   ; sum[1] = MAC16_16(sum[1],x,y_1)
 | ||||
|   SMLABB       r8, r12, r11, r8   ; sum[2] = MAC16_16(sum[2],x,y_2)
 | ||||
|   SMLABT       r9, r12, r11, r9   ; sum[3] = MAC16_16(sum[3],x,y_3)
 | ||||
|   BLE xcorr_kernel_edsp_done | ||||
|   SMLABT       r6, r14, r10, r6   ; sum[0] = MAC16_16(sum[0],x,y_1)
 | ||||
|   SUBS         r2, r2, #1         ; j--
 | ||||
|   SMLABB       r7, r14, r11, r7   ; sum[1] = MAC16_16(sum[1],x,y_2)
 | ||||
|   LDRH         r10, [r5], #2      ; r10 = y_4 = *y++
 | ||||
|   SMLABT       r8, r14, r11, r8   ; sum[2] = MAC16_16(sum[2],x,y_3)
 | ||||
|   LDRHGT       r12, [r4], #2      ; r12 = *x++
 | ||||
|   SMLABB       r9, r14, r10, r9   ; sum[3] = MAC16_16(sum[3],x,y_4)
 | ||||
|   BLE xcorr_kernel_edsp_done | ||||
|   SMLABB       r6, r12, r11, r6   ; sum[0] = MAC16_16(sum[0],tmp,y_2)
 | ||||
|   CMP          r2, #1             ; j--
 | ||||
|   SMLABT       r7, r12, r11, r7   ; sum[1] = MAC16_16(sum[1],tmp,y_3)
 | ||||
|   LDRH         r2, [r5], #2       ; r2 = y_5 = *y++
 | ||||
|   SMLABB       r8, r12, r10, r8   ; sum[2] = MAC16_16(sum[2],tmp,y_4)
 | ||||
|   LDRHGT       r14, [r4]          ; r14 = *x
 | ||||
|   SMLABB       r9, r12, r2, r9    ; sum[3] = MAC16_16(sum[3],tmp,y_5)
 | ||||
|   BLE xcorr_kernel_edsp_done | ||||
|   SMLABT       r6, r14, r11, r6   ; sum[0] = MAC16_16(sum[0],tmp,y_3)
 | ||||
|   LDRH         r11, [r5]          ; r11 = y_6 = *y
 | ||||
|   SMLABB       r7, r14, r10, r7   ; sum[1] = MAC16_16(sum[1],tmp,y_4)
 | ||||
|   SMLABB       r8, r14, r2, r8    ; sum[2] = MAC16_16(sum[2],tmp,y_5)
 | ||||
|   SMLABB       r9, r14, r11, r9   ; sum[3] = MAC16_16(sum[3],tmp,y_6)
 | ||||
| xcorr_kernel_edsp_done | ||||
|   LDMFD        sp!, {r2,r4,r5,pc} | ||||
|   ENDP | ||||
| 
 | ||||
| celt_pitch_xcorr_edsp PROC | ||||
|   ; input:
 | ||||
|   ;   r0  = opus_val16 *_x (must be 32-bit aligned)
 | ||||
|   ;   r1  = opus_val16 *_y (only needs to be 16-bit aligned)
 | ||||
|   ;   r2  = opus_val32 *xcorr
 | ||||
|   ;   r3  = int         len
 | ||||
|   ; output:
 | ||||
|   ;   r0  = maxcorr
 | ||||
|   ; internal usage
 | ||||
|   ;   r4  = opus_val16 *x
 | ||||
|   ;   r5  = opus_val16 *y
 | ||||
|   ;   r6  = opus_val32  sum0
 | ||||
|   ;   r7  = opus_val32  sum1
 | ||||
|   ;   r8  = opus_val32  sum2
 | ||||
|   ;   r9  = opus_val32  sum3
 | ||||
|   ;   r1  = int         max_pitch
 | ||||
|   ;   r12 = int         j
 | ||||
|   ; ignored:
 | ||||
|   ;         int         arch
 | ||||
|   STMFD        sp!, {r4-r11, lr} | ||||
|   MOV          r5, r1 | ||||
|   LDR          r1, [sp, #36] | ||||
|   MOV          r4, r0 | ||||
|   TST          r5, #3 | ||||
|   ; maxcorr = 1
 | ||||
|   MOV          r0, #1 | ||||
|   BEQ          celt_pitch_xcorr_edsp_process1u_done | ||||
| ; Compute one sum at the start to make y 32-bit aligned.
 | ||||
|   SUBS         r12, r3, #4 | ||||
|   ; r14 = sum = 0
 | ||||
|   MOV          r14, #0 | ||||
|   LDRH         r8, [r5], #2 | ||||
|   BLE celt_pitch_xcorr_edsp_process1u_loop4_done | ||||
|   LDR          r6, [r4], #4 | ||||
|   MOV          r8, r8, LSL #16 | ||||
| celt_pitch_xcorr_edsp_process1u_loop4 | ||||
|   LDR          r9, [r5], #4 | ||||
|   SMLABT       r14, r6, r8, r14     ; sum = MAC16_16(sum, x_0, y_0)
 | ||||
|   LDR          r7, [r4], #4 | ||||
|   SMLATB       r14, r6, r9, r14     ; sum = MAC16_16(sum, x_1, y_1)
 | ||||
|   LDR          r8, [r5], #4 | ||||
|   SMLABT       r14, r7, r9, r14     ; sum = MAC16_16(sum, x_2, y_2)
 | ||||
|   SUBS         r12, r12, #4         ; j-=4
 | ||||
|   SMLATB       r14, r7, r8, r14     ; sum = MAC16_16(sum, x_3, y_3)
 | ||||
|   LDRGT        r6, [r4], #4 | ||||
|   BGT celt_pitch_xcorr_edsp_process1u_loop4 | ||||
|   MOV          r8, r8, LSR #16 | ||||
| celt_pitch_xcorr_edsp_process1u_loop4_done | ||||
|   ADDS         r12, r12, #4 | ||||
| celt_pitch_xcorr_edsp_process1u_loop1 | ||||
|   LDRHGE       r6, [r4], #2 | ||||
|   ; Stall
 | ||||
|   SMLABBGE     r14, r6, r8, r14    ; sum = MAC16_16(sum, *x, *y)
 | ||||
|   SUBSGE       r12, r12, #1 | ||||
|   LDRHGT       r8, [r5], #2 | ||||
|   BGT celt_pitch_xcorr_edsp_process1u_loop1 | ||||
|   ; Restore _x
 | ||||
|   SUB          r4, r4, r3, LSL #1 | ||||
|   ; Restore and advance _y
 | ||||
|   SUB          r5, r5, r3, LSL #1 | ||||
|   ; maxcorr = max(maxcorr, sum)
 | ||||
|   CMP          r0, r14 | ||||
|   ADD          r5, r5, #2 | ||||
|   MOVLT        r0, r14 | ||||
|   SUBS         r1, r1, #1 | ||||
|   ; xcorr[i] = sum
 | ||||
|   STR          r14, [r2], #4 | ||||
|   BLE celt_pitch_xcorr_edsp_done | ||||
| celt_pitch_xcorr_edsp_process1u_done | ||||
|   ; if (max_pitch < 4) goto celt_pitch_xcorr_edsp_process2
 | ||||
|   SUBS         r1, r1, #4 | ||||
|   BLT celt_pitch_xcorr_edsp_process2 | ||||
| celt_pitch_xcorr_edsp_process4 | ||||
|   ; xcorr_kernel_edsp parameters:
 | ||||
|   ; r3 = len, r4 = _x, r5 = _y, r6...r9 = sum[4] = {0, 0, 0, 0}
 | ||||
|   MOV          r6, #0 | ||||
|   MOV          r7, #0 | ||||
|   MOV          r8, #0 | ||||
|   MOV          r9, #0 | ||||
|   BL xcorr_kernel_edsp_start  ; xcorr_kernel_edsp(_x, _y+i, xcorr+i, len)
 | ||||
|   ; maxcorr = max(maxcorr, sum0, sum1, sum2, sum3)
 | ||||
|   CMP          r0, r6 | ||||
|   ; _y+=4
 | ||||
|   ADD          r5, r5, #8 | ||||
|   MOVLT        r0, r6 | ||||
|   CMP          r0, r7 | ||||
|   MOVLT        r0, r7 | ||||
|   CMP          r0, r8 | ||||
|   MOVLT        r0, r8 | ||||
|   CMP          r0, r9 | ||||
|   MOVLT        r0, r9 | ||||
|   STMIA        r2!, {r6-r9} | ||||
|   SUBS         r1, r1, #4 | ||||
|   BGE celt_pitch_xcorr_edsp_process4 | ||||
| celt_pitch_xcorr_edsp_process2 | ||||
|   ADDS         r1, r1, #2 | ||||
|   BLT celt_pitch_xcorr_edsp_process1a | ||||
|   SUBS         r12, r3, #4 | ||||
|   ; {r10, r11} = {sum0, sum1} = {0, 0}
 | ||||
|   MOV          r10, #0 | ||||
|   MOV          r11, #0 | ||||
|   LDR          r8, [r5], #4 | ||||
|   BLE celt_pitch_xcorr_edsp_process2_loop_done | ||||
|   LDR          r6, [r4], #4 | ||||
|   LDR          r9, [r5], #4 | ||||
| celt_pitch_xcorr_edsp_process2_loop4 | ||||
|   SMLABB       r10, r6, r8, r10     ; sum0 = MAC16_16(sum0, x_0, y_0)
 | ||||
|   LDR          r7, [r4], #4 | ||||
|   SMLABT       r11, r6, r8, r11     ; sum1 = MAC16_16(sum1, x_0, y_1)
 | ||||
|   SUBS         r12, r12, #4         ; j-=4
 | ||||
|   SMLATT       r10, r6, r8, r10     ; sum0 = MAC16_16(sum0, x_1, y_1)
 | ||||
|   LDR          r8, [r5], #4 | ||||
|   SMLATB       r11, r6, r9, r11     ; sum1 = MAC16_16(sum1, x_1, y_2)
 | ||||
|   LDRGT        r6, [r4], #4 | ||||
|   SMLABB       r10, r7, r9, r10     ; sum0 = MAC16_16(sum0, x_2, y_2)
 | ||||
|   SMLABT       r11, r7, r9, r11     ; sum1 = MAC16_16(sum1, x_2, y_3)
 | ||||
|   SMLATT       r10, r7, r9, r10     ; sum0 = MAC16_16(sum0, x_3, y_3)
 | ||||
|   LDRGT        r9, [r5], #4 | ||||
|   SMLATB       r11, r7, r8, r11     ; sum1 = MAC16_16(sum1, x_3, y_4)
 | ||||
|   BGT celt_pitch_xcorr_edsp_process2_loop4 | ||||
| celt_pitch_xcorr_edsp_process2_loop_done | ||||
|   ADDS         r12, r12, #2 | ||||
|   BLE  celt_pitch_xcorr_edsp_process2_1 | ||||
|   LDR          r6, [r4], #4 | ||||
|   ; Stall
 | ||||
|   SMLABB       r10, r6, r8, r10     ; sum0 = MAC16_16(sum0, x_0, y_0)
 | ||||
|   LDR          r9, [r5], #4 | ||||
|   SMLABT       r11, r6, r8, r11     ; sum1 = MAC16_16(sum1, x_0, y_1)
 | ||||
|   SUB          r12, r12, #2 | ||||
|   SMLATT       r10, r6, r8, r10     ; sum0 = MAC16_16(sum0, x_1, y_1)
 | ||||
|   MOV          r8, r9 | ||||
|   SMLATB       r11, r6, r9, r11     ; sum1 = MAC16_16(sum1, x_1, y_2)
 | ||||
| celt_pitch_xcorr_edsp_process2_1 | ||||
|   LDRH         r6, [r4], #2 | ||||
|   ADDS         r12, r12, #1 | ||||
|   ; Stall
 | ||||
|   SMLABB       r10, r6, r8, r10     ; sum0 = MAC16_16(sum0, x_0, y_0)
 | ||||
|   LDRHGT       r7, [r4], #2 | ||||
|   SMLABT       r11, r6, r8, r11     ; sum1 = MAC16_16(sum1, x_0, y_1)
 | ||||
|   BLE celt_pitch_xcorr_edsp_process2_done | ||||
|   LDRH         r9, [r5], #2 | ||||
|   SMLABT       r10, r7, r8, r10     ; sum0 = MAC16_16(sum0, x_0, y_1)
 | ||||
|   SMLABB       r11, r7, r9, r11     ; sum1 = MAC16_16(sum1, x_0, y_2)
 | ||||
| celt_pitch_xcorr_edsp_process2_done | ||||
|   ; Restore _x
 | ||||
|   SUB          r4, r4, r3, LSL #1 | ||||
|   ; Restore and advance _y
 | ||||
|   SUB          r5, r5, r3, LSL #1 | ||||
|   ; maxcorr = max(maxcorr, sum0)
 | ||||
|   CMP          r0, r10 | ||||
|   ADD          r5, r5, #2 | ||||
|   MOVLT        r0, r10 | ||||
|   SUB          r1, r1, #2 | ||||
|   ; maxcorr = max(maxcorr, sum1)
 | ||||
|   CMP          r0, r11 | ||||
|   ; xcorr[i] = sum
 | ||||
|   STR          r10, [r2], #4 | ||||
|   MOVLT        r0, r11 | ||||
|   STR          r11, [r2], #4 | ||||
| celt_pitch_xcorr_edsp_process1a | ||||
|   ADDS         r1, r1, #1 | ||||
|   BLT celt_pitch_xcorr_edsp_done | ||||
|   SUBS         r12, r3, #4 | ||||
|   ; r14 = sum = 0
 | ||||
|   MOV          r14, #0 | ||||
|   BLT celt_pitch_xcorr_edsp_process1a_loop_done | ||||
|   LDR          r6, [r4], #4 | ||||
|   LDR          r8, [r5], #4 | ||||
|   LDR          r7, [r4], #4 | ||||
|   LDR          r9, [r5], #4 | ||||
| celt_pitch_xcorr_edsp_process1a_loop4 | ||||
|   SMLABB       r14, r6, r8, r14     ; sum = MAC16_16(sum, x_0, y_0)
 | ||||
|   SUBS         r12, r12, #4         ; j-=4
 | ||||
|   SMLATT       r14, r6, r8, r14     ; sum = MAC16_16(sum, x_1, y_1)
 | ||||
|   LDRGE        r6, [r4], #4 | ||||
|   SMLABB       r14, r7, r9, r14     ; sum = MAC16_16(sum, x_2, y_2)
 | ||||
|   LDRGE        r8, [r5], #4 | ||||
|   SMLATT       r14, r7, r9, r14     ; sum = MAC16_16(sum, x_3, y_3)
 | ||||
|   LDRGE        r7, [r4], #4 | ||||
|   LDRGE        r9, [r5], #4 | ||||
|   BGE celt_pitch_xcorr_edsp_process1a_loop4 | ||||
| celt_pitch_xcorr_edsp_process1a_loop_done | ||||
|   ADDS         r12, r12, #2 | ||||
|   LDRGE        r6, [r4], #4 | ||||
|   LDRGE        r8, [r5], #4 | ||||
|   ; Stall
 | ||||
|   SMLABBGE     r14, r6, r8, r14     ; sum = MAC16_16(sum, x_0, y_0)
 | ||||
|   SUBGE        r12, r12, #2 | ||||
|   SMLATTGE     r14, r6, r8, r14     ; sum = MAC16_16(sum, x_1, y_1)
 | ||||
|   ADDS         r12, r12, #1 | ||||
|   LDRHGE       r6, [r4], #2 | ||||
|   LDRHGE       r8, [r5], #2 | ||||
|   ; Stall
 | ||||
|   SMLABBGE     r14, r6, r8, r14     ; sum = MAC16_16(sum, *x, *y)
 | ||||
|   ; maxcorr = max(maxcorr, sum)
 | ||||
|   CMP          r0, r14 | ||||
|   ; xcorr[i] = sum
 | ||||
|   STR          r14, [r2], #4 | ||||
|   MOVLT        r0, r14 | ||||
| celt_pitch_xcorr_edsp_done | ||||
|   LDMFD        sp!, {r4-r11, pc} | ||||
|   ENDP | ||||
| 
 | ||||
| ENDIF | ||||
| 
 | ||||
| END | ||||
							
								
								
									
										71
									
								
								lib/rbcodec/codecs/libopus/celt/arm/fft_arm.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										71
									
								
								lib/rbcodec/codecs/libopus/celt/arm/fft_arm.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,71 @@ | |||
| /* Copyright (c) 2015 Xiph.Org Foundation
 | ||||
|    Written by Viswanath Puttagunta */ | ||||
| /**
 | ||||
|    @file fft_arm.h | ||||
|    @brief ARM Neon Intrinsic optimizations for fft using NE10 library | ||||
|  */ | ||||
| 
 | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| 
 | ||||
| #if !defined(FFT_ARM_H) | ||||
| #define FFT_ARM_H | ||||
| 
 | ||||
| #include "kiss_fft.h" | ||||
| 
 | ||||
| #if defined(HAVE_ARM_NE10) | ||||
| 
 | ||||
| int opus_fft_alloc_arm_neon(kiss_fft_state *st); | ||||
| void opus_fft_free_arm_neon(kiss_fft_state *st); | ||||
| 
 | ||||
| void opus_fft_neon(const kiss_fft_state *st, | ||||
|                    const kiss_fft_cpx *fin, | ||||
|                    kiss_fft_cpx *fout); | ||||
| 
 | ||||
| void opus_ifft_neon(const kiss_fft_state *st, | ||||
|                     const kiss_fft_cpx *fin, | ||||
|                     kiss_fft_cpx *fout); | ||||
| 
 | ||||
| #if !defined(OPUS_HAVE_RTCD) | ||||
| #define OVERRIDE_OPUS_FFT (1) | ||||
| 
 | ||||
| #define opus_fft_alloc_arch(_st, arch) \ | ||||
|    ((void)(arch), opus_fft_alloc_arm_neon(_st)) | ||||
| 
 | ||||
| #define opus_fft_free_arch(_st, arch) \ | ||||
|    ((void)(arch), opus_fft_free_arm_neon(_st)) | ||||
| 
 | ||||
| #define opus_fft(_st, _fin, _fout, arch) \ | ||||
|    ((void)(arch), opus_fft_neon(_st, _fin, _fout)) | ||||
| 
 | ||||
| #define opus_ifft(_st, _fin, _fout, arch) \ | ||||
|    ((void)(arch), opus_ifft_neon(_st, _fin, _fout)) | ||||
| 
 | ||||
| #endif /* OPUS_HAVE_RTCD */ | ||||
| 
 | ||||
| #endif /* HAVE_ARM_NE10 */ | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										35
									
								
								lib/rbcodec/codecs/libopus/celt/arm/fixed_arm64.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										35
									
								
								lib/rbcodec/codecs/libopus/celt/arm/fixed_arm64.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,35 @@ | |||
| /* Copyright (C) 2015 Vidyo */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef FIXED_ARM64_H | ||||
| #define FIXED_ARM64_H | ||||
| 
 | ||||
| #include <arm_neon.h> | ||||
| 
 | ||||
| #undef SIG2WORD16 | ||||
| #define SIG2WORD16(x) (vqmovns_s32(PSHR32((x), SIG_SHIFT))) | ||||
| 
 | ||||
| #endif | ||||
|  | @ -37,7 +37,7 @@ static OPUS_INLINE opus_val32 MULT16_32_Q16_armv4(opus_val16 a, opus_val32 b) | |||
|       "#MULT16_32_Q16\n\t" | ||||
|       "smull %0, %1, %2, %3\n\t" | ||||
|       : "=&r"(rd_lo), "=&r"(rd_hi) | ||||
|       : "%r"(b),"r"(a<<16) | ||||
|       : "%r"(b),"r"(SHL32(a,16)) | ||||
|   ); | ||||
|   return rd_hi; | ||||
| } | ||||
|  | @ -54,10 +54,10 @@ static OPUS_INLINE opus_val32 MULT16_32_Q15_armv4(opus_val16 a, opus_val32 b) | |||
|       "#MULT16_32_Q15\n\t" | ||||
|       "smull %0, %1, %2, %3\n\t" | ||||
|       : "=&r"(rd_lo), "=&r"(rd_hi) | ||||
|       : "%r"(b), "r"(a<<16) | ||||
|       : "%r"(b), "r"(SHL32(a,16)) | ||||
|   ); | ||||
|   /*We intentionally don't OR in the high bit of rd_lo for speed.*/ | ||||
|   return rd_hi<<1; | ||||
|   return SHL32(rd_hi,1); | ||||
| } | ||||
| #define MULT16_32_Q15(a, b) (MULT16_32_Q15_armv4(a, b)) | ||||
| 
 | ||||
|  |  | |||
|  | @ -59,7 +59,7 @@ static OPUS_INLINE opus_val32 MULT16_32_Q15_armv5e(opus_val16 a, opus_val32 b) | |||
|       : "=r"(res) | ||||
|       : "r"(b), "r"(a) | ||||
|   ); | ||||
|   return res<<1; | ||||
|   return SHL32(res,1); | ||||
| } | ||||
| #define MULT16_32_Q15(a, b) (MULT16_32_Q15_armv5e(a, b)) | ||||
| 
 | ||||
|  | @ -76,7 +76,7 @@ static OPUS_INLINE opus_val32 MAC16_32_Q15_armv5e(opus_val32 c, opus_val16 a, | |||
|       "#MAC16_32_Q15\n\t" | ||||
|       "smlawb %0, %1, %2, %3;\n" | ||||
|       : "=r"(res) | ||||
|       : "r"(b<<1), "r"(a), "r"(c) | ||||
|       : "r"(SHL32(b,1)), "r"(a), "r"(c) | ||||
|   ); | ||||
|   return res; | ||||
| } | ||||
|  |  | |||
							
								
								
									
										59
									
								
								lib/rbcodec/codecs/libopus/celt/arm/mdct_arm.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										59
									
								
								lib/rbcodec/codecs/libopus/celt/arm/mdct_arm.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,59 @@ | |||
| /* Copyright (c) 2015 Xiph.Org Foundation
 | ||||
|    Written by Viswanath Puttagunta */ | ||||
| /**
 | ||||
|    @file arm_mdct.h | ||||
|    @brief ARM Neon Intrinsic optimizations for mdct using NE10 library | ||||
|  */ | ||||
| 
 | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #if !defined(MDCT_ARM_H) | ||||
| #define MDCT_ARM_H | ||||
| 
 | ||||
| #include "mdct.h" | ||||
| 
 | ||||
| #if defined(HAVE_ARM_NE10) | ||||
| /** Compute a forward MDCT and scale by 4/N, trashes the input array */ | ||||
| void clt_mdct_forward_neon(const mdct_lookup *l, kiss_fft_scalar *in, | ||||
|                            kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|                            const opus_val16 *window, int overlap, | ||||
|                            int shift, int stride, int arch); | ||||
| 
 | ||||
| void clt_mdct_backward_neon(const mdct_lookup *l, kiss_fft_scalar *in, | ||||
|                             kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|                             const opus_val16 *window, int overlap, | ||||
|                             int shift, int stride, int arch); | ||||
| 
 | ||||
| #if !defined(OPUS_HAVE_RTCD) | ||||
| #define OVERRIDE_OPUS_MDCT (1) | ||||
| #define clt_mdct_forward(_l, _in, _out, _window, _int, _shift, _stride, _arch) \ | ||||
|       clt_mdct_forward_neon(_l, _in, _out, _window, _int, _shift, _stride, _arch) | ||||
| #define clt_mdct_backward(_l, _in, _out, _window, _int, _shift, _stride, _arch) \ | ||||
|       clt_mdct_backward_neon(_l, _in, _out, _window, _int, _shift, _stride, _arch) | ||||
| #endif /* OPUS_HAVE_RTCD */ | ||||
| #endif /* HAVE_ARM_NE10 */ | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										160
									
								
								lib/rbcodec/codecs/libopus/celt/arm/pitch_arm.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										160
									
								
								lib/rbcodec/codecs/libopus/celt/arm/pitch_arm.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,160 @@ | |||
| /* Copyright (c) 2010 Xiph.Org Foundation
 | ||||
|  * Copyright (c) 2013 Parrot */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #if !defined(PITCH_ARM_H) | ||||
| # define PITCH_ARM_H | ||||
| 
 | ||||
| # include "armcpu.h" | ||||
| 
 | ||||
| # if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
| opus_val32 celt_inner_prod_neon(const opus_val16 *x, const opus_val16 *y, int N); | ||||
| void dual_inner_prod_neon(const opus_val16 *x, const opus_val16 *y01, | ||||
|         const opus_val16 *y02, int N, opus_val32 *xy1, opus_val32 *xy2); | ||||
| 
 | ||||
| #  if !defined(OPUS_HAVE_RTCD) && defined(OPUS_ARM_PRESUME_NEON) | ||||
| #   define OVERRIDE_CELT_INNER_PROD (1) | ||||
| #   define OVERRIDE_DUAL_INNER_PROD (1) | ||||
| #   define celt_inner_prod(x, y, N, arch) ((void)(arch), PRESUME_NEON(celt_inner_prod)(x, y, N)) | ||||
| #   define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) ((void)(arch), PRESUME_NEON(dual_inner_prod)(x, y01, y02, N, xy1, xy2)) | ||||
| #  endif | ||||
| # endif | ||||
| 
 | ||||
| # if !defined(OVERRIDE_CELT_INNER_PROD) | ||||
| #  if defined(OPUS_HAVE_RTCD) && (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)) | ||||
| extern opus_val32 (*const CELT_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *x, const opus_val16 *y, int N); | ||||
| #   define OVERRIDE_CELT_INNER_PROD (1) | ||||
| #   define celt_inner_prod(x, y, N, arch) ((*CELT_INNER_PROD_IMPL[(arch)&OPUS_ARCHMASK])(x, y, N)) | ||||
| #  elif defined(OPUS_ARM_PRESUME_NEON_INTR) | ||||
| #   define OVERRIDE_CELT_INNER_PROD (1) | ||||
| #   define celt_inner_prod(x, y, N, arch) ((void)(arch), celt_inner_prod_neon(x, y, N)) | ||||
| #  endif | ||||
| # endif | ||||
| 
 | ||||
| # if !defined(OVERRIDE_DUAL_INNER_PROD) | ||||
| #  if defined(OPUS_HAVE_RTCD) && (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)) | ||||
| extern void (*const DUAL_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *x, | ||||
|         const opus_val16 *y01, const opus_val16 *y02, int N, opus_val32 *xy1, opus_val32 *xy2); | ||||
| #   define OVERRIDE_DUAL_INNER_PROD (1) | ||||
| #   define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) ((*DUAL_INNER_PROD_IMPL[(arch)&OPUS_ARCHMASK])(x, y01, y02, N, xy1, xy2)) | ||||
| #  elif defined(OPUS_ARM_PRESUME_NEON_INTR) | ||||
| #   define OVERRIDE_DUAL_INNER_PROD (1) | ||||
| #   define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) ((void)(arch), dual_inner_prod_neon(x, y01, y02, N, xy1, xy2)) | ||||
| #  endif | ||||
| # endif | ||||
| 
 | ||||
| # if defined(FIXED_POINT) | ||||
| 
 | ||||
| #  if defined(OPUS_ARM_MAY_HAVE_NEON) | ||||
| opus_val32 celt_pitch_xcorr_neon(const opus_val16 *_x, const opus_val16 *_y, | ||||
|     opus_val32 *xcorr, int len, int max_pitch, int arch); | ||||
| #  endif | ||||
| 
 | ||||
| #  if defined(OPUS_ARM_MAY_HAVE_MEDIA) | ||||
| #   define celt_pitch_xcorr_media MAY_HAVE_EDSP(celt_pitch_xcorr) | ||||
| #  endif | ||||
| 
 | ||||
| #  if defined(OPUS_ARM_MAY_HAVE_EDSP) | ||||
| opus_val32 celt_pitch_xcorr_edsp(const opus_val16 *_x, const opus_val16 *_y, | ||||
|     opus_val32 *xcorr, int len, int max_pitch, int arch); | ||||
| #  endif | ||||
| 
 | ||||
| #  if defined(OPUS_HAVE_RTCD) && \ | ||||
|     ((defined(OPUS_ARM_MAY_HAVE_NEON) && !defined(OPUS_ARM_PRESUME_NEON)) || \ | ||||
|      (defined(OPUS_ARM_MAY_HAVE_MEDIA) && !defined(OPUS_ARM_PRESUME_MEDIA)) || \ | ||||
|      (defined(OPUS_ARM_MAY_HAVE_EDSP) && !defined(OPUS_ARM_PRESUME_EDSP))) | ||||
| extern opus_val32 | ||||
| (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *, | ||||
|       const opus_val16 *, opus_val32 *, int, int, int); | ||||
| #   define OVERRIDE_PITCH_XCORR (1) | ||||
| #   define celt_pitch_xcorr(_x, _y, xcorr, len, max_pitch, arch) \ | ||||
|   ((*CELT_PITCH_XCORR_IMPL[(arch)&OPUS_ARCHMASK])(_x, _y, \ | ||||
|         xcorr, len, max_pitch, arch)) | ||||
| 
 | ||||
| #  elif defined(OPUS_ARM_PRESUME_EDSP) || \ | ||||
|     defined(OPUS_ARM_PRESUME_MEDIA) || \ | ||||
|     defined(OPUS_ARM_PRESUME_NEON) | ||||
| #   define OVERRIDE_PITCH_XCORR (1) | ||||
| #   define celt_pitch_xcorr (PRESUME_NEON(celt_pitch_xcorr)) | ||||
| 
 | ||||
| #  endif | ||||
| 
 | ||||
| #  if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
| void xcorr_kernel_neon_fixed( | ||||
|                     const opus_val16 *x, | ||||
|                     const opus_val16 *y, | ||||
|                     opus_val32       sum[4], | ||||
|                     int              len); | ||||
| #  endif | ||||
| 
 | ||||
| #  if defined(OPUS_HAVE_RTCD) && \ | ||||
|     (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)) | ||||
| 
 | ||||
| extern void (*const XCORR_KERNEL_IMPL[OPUS_ARCHMASK + 1])( | ||||
|                     const opus_val16 *x, | ||||
|                     const opus_val16 *y, | ||||
|                     opus_val32       sum[4], | ||||
|                     int              len); | ||||
| 
 | ||||
| #   define OVERRIDE_XCORR_KERNEL (1) | ||||
| #   define xcorr_kernel(x, y, sum, len, arch) \ | ||||
|      ((*XCORR_KERNEL_IMPL[(arch) & OPUS_ARCHMASK])(x, y, sum, len)) | ||||
| 
 | ||||
| #  elif defined(OPUS_ARM_PRESUME_NEON_INTR) | ||||
| #   define OVERRIDE_XCORR_KERNEL (1) | ||||
| #   define xcorr_kernel(x, y, sum, len, arch) \ | ||||
|       ((void)arch, xcorr_kernel_neon_fixed(x, y, sum, len)) | ||||
| 
 | ||||
| #  endif | ||||
| 
 | ||||
| #else /* Start !FIXED_POINT */ | ||||
| /* Float case */ | ||||
| #if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) | ||||
| void celt_pitch_xcorr_float_neon(const opus_val16 *_x, const opus_val16 *_y, | ||||
|                                  opus_val32 *xcorr, int len, int max_pitch, int arch); | ||||
| #endif | ||||
| 
 | ||||
| #  if defined(OPUS_HAVE_RTCD) && \ | ||||
|     (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)) | ||||
| extern void | ||||
| (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *, | ||||
|       const opus_val16 *, opus_val32 *, int, int, int); | ||||
| 
 | ||||
| #  define OVERRIDE_PITCH_XCORR (1) | ||||
| #  define celt_pitch_xcorr(_x, _y, xcorr, len, max_pitch, arch) \ | ||||
|   ((*CELT_PITCH_XCORR_IMPL[(arch)&OPUS_ARCHMASK])(_x, _y, \ | ||||
|         xcorr, len, max_pitch, arch)) | ||||
| 
 | ||||
| #  elif defined(OPUS_ARM_PRESUME_NEON_INTR) | ||||
| 
 | ||||
| #   define OVERRIDE_PITCH_XCORR (1) | ||||
| #   define celt_pitch_xcorr celt_pitch_xcorr_float_neon | ||||
| 
 | ||||
| #  endif | ||||
| 
 | ||||
| #endif /* end !FIXED_POINT */ | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										290
									
								
								lib/rbcodec/codecs/libopus/celt/arm/pitch_neon_intr.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										290
									
								
								lib/rbcodec/codecs/libopus/celt/arm/pitch_neon_intr.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,290 @@ | |||
| /***********************************************************************
 | ||||
| Copyright (c) 2017 Google Inc. | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions | ||||
| are met: | ||||
| - Redistributions of source code must retain the above copyright notice, | ||||
| this list of conditions and the following disclaimer. | ||||
| - Redistributions in binary form must reproduce the above copyright | ||||
| notice, this list of conditions and the following disclaimer in the | ||||
| documentation and/or other materials provided with the distribution. | ||||
| - Neither the name of Internet Society, IETF or IETF Trust, nor the | ||||
| names of specific contributors, may be used to endorse or promote | ||||
| products derived from this software without specific prior written | ||||
| permission. | ||||
| THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||
| AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||
| IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||
| ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE | ||||
| LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||
| CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||
| SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||
| INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||
| CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||
| ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||
| POSSIBILITY OF SUCH DAMAGE. | ||||
| ***********************************************************************/ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <arm_neon.h> | ||||
| #include "pitch.h" | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
| 
 | ||||
| opus_val32 celt_inner_prod_neon(const opus_val16 *x, const opus_val16 *y, int N) | ||||
| { | ||||
|     int i; | ||||
|     opus_val32 xy; | ||||
|     int16x8_t x_s16x8, y_s16x8; | ||||
|     int32x4_t xy_s32x4 = vdupq_n_s32(0); | ||||
|     int64x2_t xy_s64x2; | ||||
|     int64x1_t xy_s64x1; | ||||
| 
 | ||||
|     for (i = 0; i < N - 7; i += 8) { | ||||
|         x_s16x8  = vld1q_s16(&x[i]); | ||||
|         y_s16x8  = vld1q_s16(&y[i]); | ||||
|         xy_s32x4 = vmlal_s16(xy_s32x4, vget_low_s16 (x_s16x8), vget_low_s16 (y_s16x8)); | ||||
|         xy_s32x4 = vmlal_s16(xy_s32x4, vget_high_s16(x_s16x8), vget_high_s16(y_s16x8)); | ||||
|     } | ||||
| 
 | ||||
|     if (N - i >= 4) { | ||||
|         const int16x4_t x_s16x4 = vld1_s16(&x[i]); | ||||
|         const int16x4_t y_s16x4 = vld1_s16(&y[i]); | ||||
|         xy_s32x4 = vmlal_s16(xy_s32x4, x_s16x4, y_s16x4); | ||||
|         i += 4; | ||||
|     } | ||||
| 
 | ||||
|     xy_s64x2 = vpaddlq_s32(xy_s32x4); | ||||
|     xy_s64x1 = vadd_s64(vget_low_s64(xy_s64x2), vget_high_s64(xy_s64x2)); | ||||
|     xy       = vget_lane_s32(vreinterpret_s32_s64(xy_s64x1), 0); | ||||
| 
 | ||||
|     for (; i < N; i++) { | ||||
|         xy = MAC16_16(xy, x[i], y[i]); | ||||
|     } | ||||
| 
 | ||||
| #ifdef OPUS_CHECK_ASM | ||||
|     celt_assert(celt_inner_prod_c(x, y, N) == xy); | ||||
| #endif | ||||
| 
 | ||||
|     return xy; | ||||
| } | ||||
| 
 | ||||
| void dual_inner_prod_neon(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02, | ||||
|         int N, opus_val32 *xy1, opus_val32 *xy2) | ||||
| { | ||||
|     int i; | ||||
|     opus_val32 xy01, xy02; | ||||
|     int16x8_t x_s16x8, y01_s16x8, y02_s16x8; | ||||
|     int32x4_t xy01_s32x4 = vdupq_n_s32(0); | ||||
|     int32x4_t xy02_s32x4 = vdupq_n_s32(0); | ||||
|     int64x2_t xy01_s64x2, xy02_s64x2; | ||||
|     int64x1_t xy01_s64x1, xy02_s64x1; | ||||
| 
 | ||||
|     for (i = 0; i < N - 7; i += 8) { | ||||
|         x_s16x8    = vld1q_s16(&x[i]); | ||||
|         y01_s16x8  = vld1q_s16(&y01[i]); | ||||
|         y02_s16x8  = vld1q_s16(&y02[i]); | ||||
|         xy01_s32x4 = vmlal_s16(xy01_s32x4, vget_low_s16 (x_s16x8), vget_low_s16 (y01_s16x8)); | ||||
|         xy02_s32x4 = vmlal_s16(xy02_s32x4, vget_low_s16 (x_s16x8), vget_low_s16 (y02_s16x8)); | ||||
|         xy01_s32x4 = vmlal_s16(xy01_s32x4, vget_high_s16(x_s16x8), vget_high_s16(y01_s16x8)); | ||||
|         xy02_s32x4 = vmlal_s16(xy02_s32x4, vget_high_s16(x_s16x8), vget_high_s16(y02_s16x8)); | ||||
|     } | ||||
| 
 | ||||
|     if (N - i >= 4) { | ||||
|         const int16x4_t x_s16x4   = vld1_s16(&x[i]); | ||||
|         const int16x4_t y01_s16x4 = vld1_s16(&y01[i]); | ||||
|         const int16x4_t y02_s16x4 = vld1_s16(&y02[i]); | ||||
|         xy01_s32x4 = vmlal_s16(xy01_s32x4, x_s16x4, y01_s16x4); | ||||
|         xy02_s32x4 = vmlal_s16(xy02_s32x4, x_s16x4, y02_s16x4); | ||||
|         i += 4; | ||||
|     } | ||||
| 
 | ||||
|     xy01_s64x2 = vpaddlq_s32(xy01_s32x4); | ||||
|     xy02_s64x2 = vpaddlq_s32(xy02_s32x4); | ||||
|     xy01_s64x1 = vadd_s64(vget_low_s64(xy01_s64x2), vget_high_s64(xy01_s64x2)); | ||||
|     xy02_s64x1 = vadd_s64(vget_low_s64(xy02_s64x2), vget_high_s64(xy02_s64x2)); | ||||
|     xy01       = vget_lane_s32(vreinterpret_s32_s64(xy01_s64x1), 0); | ||||
|     xy02       = vget_lane_s32(vreinterpret_s32_s64(xy02_s64x1), 0); | ||||
| 
 | ||||
|     for (; i < N; i++) { | ||||
|         xy01 = MAC16_16(xy01, x[i], y01[i]); | ||||
|         xy02 = MAC16_16(xy02, x[i], y02[i]); | ||||
|     } | ||||
|     *xy1 = xy01; | ||||
|     *xy2 = xy02; | ||||
| 
 | ||||
| #ifdef OPUS_CHECK_ASM | ||||
|     { | ||||
|         opus_val32 xy1_c, xy2_c; | ||||
|         dual_inner_prod_c(x, y01, y02, N, &xy1_c, &xy2_c); | ||||
|         celt_assert(xy1_c == *xy1); | ||||
|         celt_assert(xy2_c == *xy2); | ||||
|     } | ||||
| #endif | ||||
| } | ||||
| 
 | ||||
| #else /* !FIXED_POINT */ | ||||
| 
 | ||||
| /* ========================================================================== */ | ||||
| 
 | ||||
| #ifdef OPUS_CHECK_ASM | ||||
| 
 | ||||
| /* This part of code simulates floating-point NEON operations. */ | ||||
| 
 | ||||
| /* celt_inner_prod_neon_float_c_simulation() simulates the floating-point   */ | ||||
| /* operations of celt_inner_prod_neon(), and both functions should have bit */ | ||||
| /* exact output.                                                            */ | ||||
| static opus_val32 celt_inner_prod_neon_float_c_simulation(const opus_val16 *x, const opus_val16 *y, int N) | ||||
| { | ||||
|    int i; | ||||
|    opus_val32 xy, xy0 = 0, xy1 = 0, xy2 = 0, xy3 = 0; | ||||
|    for (i = 0; i < N - 3; i += 4) { | ||||
|       xy0 = MAC16_16(xy0, x[i + 0], y[i + 0]); | ||||
|       xy1 = MAC16_16(xy1, x[i + 1], y[i + 1]); | ||||
|       xy2 = MAC16_16(xy2, x[i + 2], y[i + 2]); | ||||
|       xy3 = MAC16_16(xy3, x[i + 3], y[i + 3]); | ||||
|    } | ||||
|    xy0 += xy2; | ||||
|    xy1 += xy3; | ||||
|    xy = xy0 + xy1; | ||||
|    for (; i < N; i++) { | ||||
|       xy = MAC16_16(xy, x[i], y[i]); | ||||
|    } | ||||
|    return xy; | ||||
| } | ||||
| 
 | ||||
| /* dual_inner_prod_neon_float_c_simulation() simulates the floating-point   */ | ||||
| /* operations of dual_inner_prod_neon(), and both functions should have bit */ | ||||
| /* exact output.                                                            */ | ||||
| static void dual_inner_prod_neon_float_c_simulation(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02, | ||||
|       int N, opus_val32 *xy1, opus_val32 *xy2) | ||||
| { | ||||
|    int i; | ||||
|    opus_val32 xy01, xy02, xy01_0 = 0, xy01_1 = 0, xy01_2 = 0, xy01_3 = 0, xy02_0 = 0, xy02_1 = 0, xy02_2 = 0, xy02_3 = 0; | ||||
|    for (i = 0; i < N - 3; i += 4) { | ||||
|       xy01_0 = MAC16_16(xy01_0, x[i + 0], y01[i + 0]); | ||||
|       xy01_1 = MAC16_16(xy01_1, x[i + 1], y01[i + 1]); | ||||
|       xy01_2 = MAC16_16(xy01_2, x[i + 2], y01[i + 2]); | ||||
|       xy01_3 = MAC16_16(xy01_3, x[i + 3], y01[i + 3]); | ||||
|       xy02_0 = MAC16_16(xy02_0, x[i + 0], y02[i + 0]); | ||||
|       xy02_1 = MAC16_16(xy02_1, x[i + 1], y02[i + 1]); | ||||
|       xy02_2 = MAC16_16(xy02_2, x[i + 2], y02[i + 2]); | ||||
|       xy02_3 = MAC16_16(xy02_3, x[i + 3], y02[i + 3]); | ||||
|    } | ||||
|    xy01_0 += xy01_2; | ||||
|    xy02_0 += xy02_2; | ||||
|    xy01_1 += xy01_3; | ||||
|    xy02_1 += xy02_3; | ||||
|    xy01 = xy01_0 + xy01_1; | ||||
|    xy02 = xy02_0 + xy02_1; | ||||
|    for (; i < N; i++) { | ||||
|       xy01 = MAC16_16(xy01, x[i], y01[i]); | ||||
|       xy02 = MAC16_16(xy02, x[i], y02[i]); | ||||
|    } | ||||
|    *xy1 = xy01; | ||||
|    *xy2 = xy02; | ||||
| } | ||||
| 
 | ||||
| #endif /* OPUS_CHECK_ASM */ | ||||
| 
 | ||||
| /* ========================================================================== */ | ||||
| 
 | ||||
| opus_val32 celt_inner_prod_neon(const opus_val16 *x, const opus_val16 *y, int N) | ||||
| { | ||||
|     int i; | ||||
|     opus_val32 xy; | ||||
|     float32x4_t xy_f32x4 = vdupq_n_f32(0); | ||||
|     float32x2_t xy_f32x2; | ||||
| 
 | ||||
|     for (i = 0; i < N - 7; i += 8) { | ||||
|         float32x4_t x_f32x4, y_f32x4; | ||||
|         x_f32x4  = vld1q_f32(&x[i]); | ||||
|         y_f32x4  = vld1q_f32(&y[i]); | ||||
|         xy_f32x4 = vmlaq_f32(xy_f32x4, x_f32x4, y_f32x4); | ||||
|         x_f32x4  = vld1q_f32(&x[i + 4]); | ||||
|         y_f32x4  = vld1q_f32(&y[i + 4]); | ||||
|         xy_f32x4 = vmlaq_f32(xy_f32x4, x_f32x4, y_f32x4); | ||||
|     } | ||||
| 
 | ||||
|     if (N - i >= 4) { | ||||
|         const float32x4_t x_f32x4 = vld1q_f32(&x[i]); | ||||
|         const float32x4_t y_f32x4 = vld1q_f32(&y[i]); | ||||
|         xy_f32x4 = vmlaq_f32(xy_f32x4, x_f32x4, y_f32x4); | ||||
|         i += 4; | ||||
|     } | ||||
| 
 | ||||
|     xy_f32x2 = vadd_f32(vget_low_f32(xy_f32x4), vget_high_f32(xy_f32x4)); | ||||
|     xy_f32x2 = vpadd_f32(xy_f32x2, xy_f32x2); | ||||
|     xy       = vget_lane_f32(xy_f32x2, 0); | ||||
| 
 | ||||
|     for (; i < N; i++) { | ||||
|         xy = MAC16_16(xy, x[i], y[i]); | ||||
|     } | ||||
| 
 | ||||
| #ifdef OPUS_CHECK_ASM | ||||
|     celt_assert(ABS32(celt_inner_prod_neon_float_c_simulation(x, y, N) - xy) <= VERY_SMALL); | ||||
| #endif | ||||
| 
 | ||||
|     return xy; | ||||
| } | ||||
| 
 | ||||
| void dual_inner_prod_neon(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02, | ||||
|         int N, opus_val32 *xy1, opus_val32 *xy2) | ||||
| { | ||||
|     int i; | ||||
|     opus_val32 xy01, xy02; | ||||
|     float32x4_t xy01_f32x4 = vdupq_n_f32(0); | ||||
|     float32x4_t xy02_f32x4 = vdupq_n_f32(0); | ||||
|     float32x2_t xy01_f32x2, xy02_f32x2; | ||||
| 
 | ||||
|     for (i = 0; i < N - 7; i += 8) { | ||||
|         float32x4_t x_f32x4, y01_f32x4, y02_f32x4; | ||||
|         x_f32x4    = vld1q_f32(&x[i]); | ||||
|         y01_f32x4  = vld1q_f32(&y01[i]); | ||||
|         y02_f32x4  = vld1q_f32(&y02[i]); | ||||
|         xy01_f32x4 = vmlaq_f32(xy01_f32x4, x_f32x4, y01_f32x4); | ||||
|         xy02_f32x4 = vmlaq_f32(xy02_f32x4, x_f32x4, y02_f32x4); | ||||
|         x_f32x4    = vld1q_f32(&x[i + 4]); | ||||
|         y01_f32x4  = vld1q_f32(&y01[i + 4]); | ||||
|         y02_f32x4  = vld1q_f32(&y02[i + 4]); | ||||
|         xy01_f32x4 = vmlaq_f32(xy01_f32x4, x_f32x4, y01_f32x4); | ||||
|         xy02_f32x4 = vmlaq_f32(xy02_f32x4, x_f32x4, y02_f32x4); | ||||
|     } | ||||
| 
 | ||||
|     if (N - i >= 4) { | ||||
|         const float32x4_t x_f32x4   = vld1q_f32(&x[i]); | ||||
|         const float32x4_t y01_f32x4 = vld1q_f32(&y01[i]); | ||||
|         const float32x4_t y02_f32x4 = vld1q_f32(&y02[i]); | ||||
|         xy01_f32x4 = vmlaq_f32(xy01_f32x4, x_f32x4, y01_f32x4); | ||||
|         xy02_f32x4 = vmlaq_f32(xy02_f32x4, x_f32x4, y02_f32x4); | ||||
|         i += 4; | ||||
|     } | ||||
| 
 | ||||
|     xy01_f32x2 = vadd_f32(vget_low_f32(xy01_f32x4), vget_high_f32(xy01_f32x4)); | ||||
|     xy02_f32x2 = vadd_f32(vget_low_f32(xy02_f32x4), vget_high_f32(xy02_f32x4)); | ||||
|     xy01_f32x2 = vpadd_f32(xy01_f32x2, xy01_f32x2); | ||||
|     xy02_f32x2 = vpadd_f32(xy02_f32x2, xy02_f32x2); | ||||
|     xy01       = vget_lane_f32(xy01_f32x2, 0); | ||||
|     xy02       = vget_lane_f32(xy02_f32x2, 0); | ||||
| 
 | ||||
|     for (; i < N; i++) { | ||||
|         xy01 = MAC16_16(xy01, x[i], y01[i]); | ||||
|         xy02 = MAC16_16(xy02, x[i], y02[i]); | ||||
|     } | ||||
|     *xy1 = xy01; | ||||
|     *xy2 = xy02; | ||||
| 
 | ||||
| #ifdef OPUS_CHECK_ASM | ||||
|     { | ||||
|         opus_val32 xy1_c, xy2_c; | ||||
|         dual_inner_prod_neon_float_c_simulation(x, y01, y02, N, &xy1_c, &xy2_c); | ||||
|         celt_assert(ABS32(xy1_c - *xy1) <= VERY_SMALL); | ||||
|         celt_assert(ABS32(xy2_c - *xy2) <= VERY_SMALL); | ||||
|     } | ||||
| #endif | ||||
| } | ||||
| 
 | ||||
| #endif /* FIXED_POINT */ | ||||
|  | @ -65,19 +65,19 @@ opus_uint32 celt_lcg_rand(opus_uint32 seed) | |||
| 
 | ||||
| /* This is a cos() approximation designed to be bit-exact on any platform. Bit exactness
 | ||||
|    with this approximation is important because it has an impact on the bit allocation */ | ||||
| static opus_int16 bitexact_cos(opus_int16 x) | ||||
| opus_int16 bitexact_cos(opus_int16 x) | ||||
| { | ||||
|    opus_int32 tmp; | ||||
|    opus_int16 x2; | ||||
|    tmp = (4096+((opus_int32)(x)*(x)))>>13; | ||||
|    celt_assert(tmp<=32767); | ||||
|    celt_sig_assert(tmp<=32767); | ||||
|    x2 = tmp; | ||||
|    x2 = (32767-x2) + FRAC_MUL16(x2, (-7651 + FRAC_MUL16(x2, (8277 + FRAC_MUL16(-626, x2))))); | ||||
|    celt_assert(x2<=32766); | ||||
|    celt_sig_assert(x2<=32766); | ||||
|    return 1+x2; | ||||
| } | ||||
| 
 | ||||
| static int bitexact_log2tan(int isin,int icos) | ||||
| int bitexact_log2tan(int isin,int icos) | ||||
| { | ||||
|    int lc; | ||||
|    int ls; | ||||
|  | @ -90,13 +90,13 @@ static int bitexact_log2tan(int isin,int icos) | |||
|          -FRAC_MUL16(icos, FRAC_MUL16(icos, -2597) + 7932); | ||||
| } | ||||
| 
 | ||||
| #if 0 | ||||
| #ifdef FIXED_POINT | ||||
| /* Compute the amplitude (sqrt energy) in each of the bands */ | ||||
| void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *bandE, int end, int C, int LM) | ||||
| void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *bandE, int end, int C, int LM, int arch) | ||||
| { | ||||
|    int i, c, N; | ||||
|    const opus_int16 *eBands = m->eBands; | ||||
|    (void)arch; | ||||
|    N = m->shortMdctSize<<LM; | ||||
|    c=0; do { | ||||
|       for (i=0;i<end;i++) | ||||
|  | @ -156,7 +156,7 @@ void normalise_bands(const CELTMode *m, const celt_sig * OPUS_RESTRICT freq, cel | |||
| 
 | ||||
| #else /* FIXED_POINT */ | ||||
| /* Compute the amplitude (sqrt energy) in each of the bands */ | ||||
| void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *bandE, int end, int C, int LM) | ||||
| void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *bandE, int end, int C, int LM, int arch) | ||||
| { | ||||
|    int i, c, N; | ||||
|    const opus_int16 *eBands = m->eBands; | ||||
|  | @ -165,7 +165,7 @@ void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *band | |||
|       for (i=0;i<end;i++) | ||||
|       { | ||||
|          opus_val32 sum; | ||||
|          sum = 1e-27f + celt_inner_prod(&X[c*N+(eBands[i]<<LM)], &X[c*N+(eBands[i]<<LM)], (eBands[i+1]-eBands[i])<<LM); | ||||
|          sum = 1e-27f + celt_inner_prod(&X[c*N+(eBands[i]<<LM)], &X[c*N+(eBands[i]<<LM)], (eBands[i+1]-eBands[i])<<LM, arch); | ||||
|          bandE[i+c*m->nbEBands] = celt_sqrt(sum); | ||||
|          /*printf ("%f ", bandE[i+c*m->nbEBands]);*/ | ||||
|       } | ||||
|  | @ -191,7 +191,6 @@ void normalise_bands(const CELTMode *m, const celt_sig * OPUS_RESTRICT freq, cel | |||
| } | ||||
| 
 | ||||
| #endif /* FIXED_POINT */ | ||||
| #endif | ||||
| 
 | ||||
| /* De-normalise the energy to produce the synthesis from the unit-energy bands */ | ||||
| void denormalise_bands(const CELTMode *m, const celt_norm * OPUS_RESTRICT X, | ||||
|  | @ -226,9 +225,9 @@ void denormalise_bands(const CELTMode *m, const celt_norm * OPUS_RESTRICT X, | |||
| #endif | ||||
|       j=M*eBands[i]; | ||||
|       band_end = M*eBands[i+1]; | ||||
|       lg = ADD16(bandLogE[i], SHL16((opus_val16)eMeans[i],6)); | ||||
|       lg = SATURATE16(ADD32(bandLogE[i], SHL32((opus_val32)eMeans[i],6))); | ||||
| #ifndef FIXED_POINT | ||||
|       g = celt_exp2(lg); | ||||
|       g = celt_exp2(MIN32(32.f, lg)); | ||||
| #else | ||||
|       /* Handle the integer part of the log energy */ | ||||
|       shift = 16-(lg>>DB_SHIFT); | ||||
|  | @ -243,12 +242,12 @@ void denormalise_bands(const CELTMode *m, const celt_norm * OPUS_RESTRICT X, | |||
|       /* Handle extreme gains with negative shift. */ | ||||
|       if (shift<0) | ||||
|       { | ||||
|          /* For shift < -2 we'd be likely to overflow, so we're capping
 | ||||
|                the gain here. This shouldn't happen unless the bitstream is | ||||
|                already corrupted. */ | ||||
|          if (shift < -2) | ||||
|          /* For shift <= -2 and g > 16384 we'd be likely to overflow, so we're
 | ||||
|             capping the gain here, which is equivalent to a cap of 18 on lg. | ||||
|             This shouldn't trigger unless the bitstream is already corrupted. */ | ||||
|          if (shift <= -2) | ||||
|          { | ||||
|             g = 32767; | ||||
|             g = 16384; | ||||
|             shift = -2; | ||||
|          } | ||||
|          do { | ||||
|  | @ -268,7 +267,7 @@ void denormalise_bands(const CELTMode *m, const celt_norm * OPUS_RESTRICT X, | |||
| /* This prevents energy collapse for transients with multiple short MDCTs */ | ||||
| void anti_collapse(const CELTMode *m, celt_norm *X_, unsigned char *collapse_masks, int LM, int C, int size, | ||||
|       int start, int end, const opus_val16 *logE, const opus_val16 *prev1logE, | ||||
|       const opus_val16 *prev2logE, const int *pulses, opus_uint32 seed) | ||||
|       const opus_val16 *prev2logE, const int *pulses, opus_uint32 seed, int arch) | ||||
| { | ||||
|    int c, i, j, k; | ||||
|    for (i=start;i<end;i++) | ||||
|  | @ -283,7 +282,7 @@ void anti_collapse(const CELTMode *m, celt_norm *X_, unsigned char *collapse_mas | |||
| 
 | ||||
|       N0 = m->eBands[i+1]-m->eBands[i]; | ||||
|       /* depth in 1/8 bits */ | ||||
|       celt_assert(pulses[i]>=0); | ||||
|       celt_sig_assert(pulses[i]>=0); | ||||
|       depth = celt_udiv(1+pulses[i], (m->eBands[i+1]-m->eBands[i]))>>LM; | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
|  | @ -357,11 +356,35 @@ void anti_collapse(const CELTMode *m, celt_norm *X_, unsigned char *collapse_mas | |||
|          } | ||||
|          /* We just added some energy, so we need to renormalise */ | ||||
|          if (renormalize) | ||||
|             renormalise_vector(X, N0<<LM, Q15ONE); | ||||
|             renormalise_vector(X, N0<<LM, Q15ONE, arch); | ||||
|       } while (++c<C); | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| /* Compute the weights to use for optimizing normalized distortion across
 | ||||
|    channels. We use the amplitude to weight square distortion, which means | ||||
|    that we use the square root of the value we would have been using if we | ||||
|    wanted to minimize the MSE in the non-normalized domain. This roughly | ||||
|    corresponds to some quick-and-dirty perceptual experiments I ran to | ||||
|    measure inter-aural masking (there doesn't seem to be any published data | ||||
|    on the topic). */ | ||||
| static void compute_channel_weights(celt_ener Ex, celt_ener Ey, opus_val16 w[2]) | ||||
| { | ||||
|    celt_ener minE; | ||||
| #ifdef FIXED_POINT | ||||
|    int shift; | ||||
| #endif | ||||
|    minE = MIN32(Ex, Ey); | ||||
|    /* Adjustment to make the weights a bit more conservative. */ | ||||
|    Ex = ADD32(Ex, minE/3); | ||||
|    Ey = ADD32(Ey, minE/3); | ||||
| #ifdef FIXED_POINT | ||||
|    shift = celt_ilog2(EPSILON+MAX32(Ex, Ey))-14; | ||||
| #endif | ||||
|    w[0] = VSHR32(Ex, shift); | ||||
|    w[1] = VSHR32(Ey, shift); | ||||
| } | ||||
| 
 | ||||
| static void intensity_stereo(const CELTMode *m, celt_norm * OPUS_RESTRICT X, const celt_norm * OPUS_RESTRICT Y, const celt_ener *bandE, int bandID, int N) | ||||
| { | ||||
|    int i = bandID; | ||||
|  | @ -400,7 +423,7 @@ static void stereo_split(celt_norm * OPUS_RESTRICT X, celt_norm * OPUS_RESTRICT | |||
|    } | ||||
| } | ||||
| 
 | ||||
| static void stereo_merge(celt_norm * OPUS_RESTRICT X, celt_norm * OPUS_RESTRICT Y, opus_val16 mid, int N) | ||||
| static void stereo_merge(celt_norm * OPUS_RESTRICT X, celt_norm * OPUS_RESTRICT Y, opus_val16 mid, int N, int arch) | ||||
| { | ||||
|    int j; | ||||
|    opus_val32 xp=0, side=0; | ||||
|  | @ -412,11 +435,11 @@ static void stereo_merge(celt_norm * OPUS_RESTRICT X, celt_norm * OPUS_RESTRICT | |||
|    opus_val32 t, lgain, rgain; | ||||
| 
 | ||||
|    /* Compute the norm of X+Y and X-Y as |X|^2 + |Y|^2 +/- sum(xy) */ | ||||
|    dual_inner_prod(Y, X, Y, N, &xp, &side); | ||||
|    dual_inner_prod(Y, X, Y, N, &xp, &side, arch); | ||||
|    /* Compensating for the mid normalization */ | ||||
|    xp = MULT16_32_Q15(mid, xp); | ||||
|    /* mid and side are in Q15, not Q14 like X and Y */ | ||||
|    mid2 = SHR32(mid, 1); | ||||
|    mid2 = SHR16(mid, 1); | ||||
|    El = MULT16_16(mid2, mid2) + side - 2*xp; | ||||
|    Er = MULT16_16(mid2, mid2) + side + 2*xp; | ||||
|    if (Er < QCONST32(6e-4f, 28) || El < QCONST32(6e-4f, 28)) | ||||
|  | @ -452,11 +475,10 @@ static void stereo_merge(celt_norm * OPUS_RESTRICT X, celt_norm * OPUS_RESTRICT | |||
|    } | ||||
| } | ||||
| 
 | ||||
| #if 0 | ||||
| /* Decide whether we should spread the pulses in the current frame */ | ||||
| int spreading_decision(const CELTMode *m, const celt_norm *X, int *average, | ||||
|       int last_decision, int *hf_average, int *tapset_decision, int update_hf, | ||||
|       int end, int C, int M) | ||||
|       int end, int C, int M, const int *spread_weight) | ||||
| { | ||||
|    int i, c, N0; | ||||
|    int sum = 0, nbBands=0; | ||||
|  | @ -497,8 +519,8 @@ int spreading_decision(const CELTMode *m, const celt_norm *X, int *average, | |||
|          if (i>m->nbEBands-4) | ||||
|             hf_sum += celt_udiv(32*(tcount[1]+tcount[0]), N); | ||||
|          tmp = (2*tcount[2] >= N) + (2*tcount[1] >= N) + (2*tcount[0] >= N); | ||||
|          sum += tmp*256; | ||||
|          nbBands++; | ||||
|          sum += tmp*spread_weight[i]; | ||||
|          nbBands+=spread_weight[i]; | ||||
|       } | ||||
|    } while (++c<C); | ||||
| 
 | ||||
|  | @ -522,7 +544,7 @@ int spreading_decision(const CELTMode *m, const celt_norm *X, int *average, | |||
|    /*printf("%d %d %d\n", hf_sum, *hf_average, *tapset_decision);*/ | ||||
|    celt_assert(nbBands>0); /* end has to be non-zero */ | ||||
|    celt_assert(sum>=0); | ||||
|    sum = celt_udiv(sum, nbBands); | ||||
|    sum = celt_udiv((opus_int32)sum<<8, nbBands); | ||||
|    /* Recursive averaging */ | ||||
|    sum = (sum+*average)>>1; | ||||
|    *average = sum; | ||||
|  | @ -546,7 +568,6 @@ int spreading_decision(const CELTMode *m, const celt_norm *X, int *average, | |||
| #endif | ||||
|    return decision; | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| /* Indexing table for converting from natural Hadamard to ordery Hadamard
 | ||||
|    This is essentially a bit-reversed Gray, on top of which we've added | ||||
|  | @ -651,6 +672,7 @@ static int compute_qn(int N, int b, int offset, int pulse_cap, int stereo) | |||
| 
 | ||||
| struct band_ctx { | ||||
|    int encode; | ||||
|    int resynth; | ||||
|    const CELTMode *m; | ||||
|    int i; | ||||
|    int intensity; | ||||
|  | @ -660,6 +682,10 @@ struct band_ctx { | |||
|    opus_int32 remaining_bits; | ||||
|    const celt_ener *bandE; | ||||
|    opus_uint32 seed; | ||||
|    int arch; | ||||
|    int theta_round; | ||||
|    int disable_inv; | ||||
|    int avoid_split_noise; | ||||
| }; | ||||
| 
 | ||||
| struct split_ctx { | ||||
|  | @ -711,14 +737,41 @@ static void compute_theta(struct band_ctx *ctx, struct split_ctx *sctx, | |||
|          side and mid. With just that parameter, we can re-scale both | ||||
|          mid and side because we know that 1) they have unit norm and | ||||
|          2) they are orthogonal. */ | ||||
|       itheta = stereo_itheta(X, Y, stereo, N); | ||||
|       itheta = stereo_itheta(X, Y, stereo, N, ctx->arch); | ||||
|    } | ||||
|    tell = ec_tell_frac(ec); | ||||
|    if (qn!=1) | ||||
|    { | ||||
|       if (encode) | ||||
|          itheta = (itheta*qn+8192)>>14; | ||||
| 
 | ||||
|       { | ||||
|          if (!stereo || ctx->theta_round == 0) | ||||
|          { | ||||
|             itheta = (itheta*(opus_int32)qn+8192)>>14; | ||||
|             if (!stereo && ctx->avoid_split_noise && itheta > 0 && itheta < qn) | ||||
|             { | ||||
|                /* Check if the selected value of theta will cause the bit allocation
 | ||||
|                   to inject noise on one side. If so, make sure the energy of that side | ||||
|                   is zero. */ | ||||
|                int unquantized = celt_udiv((opus_int32)itheta*16384, qn); | ||||
|                imid = bitexact_cos((opus_int16)unquantized); | ||||
|                iside = bitexact_cos((opus_int16)(16384-unquantized)); | ||||
|                delta = FRAC_MUL16((N-1)<<7,bitexact_log2tan(iside,imid)); | ||||
|                if (delta > *b) | ||||
|                   itheta = qn; | ||||
|                else if (delta < -*b) | ||||
|                   itheta = 0; | ||||
|             } | ||||
|          } else { | ||||
|             int down; | ||||
|             /* Bias quantization towards itheta=0 and itheta=16384. */ | ||||
|             int bias = itheta > 8192 ? 32767/qn : -32767/qn; | ||||
|             down = IMIN(qn-1, IMAX(0, (itheta*(opus_int32)qn + bias)>>14)); | ||||
|             if (ctx->theta_round < 0) | ||||
|                itheta = down; | ||||
|             else | ||||
|                itheta = down+1; | ||||
|          } | ||||
|       } | ||||
|       /* Entropy coding of the angle. We use a uniform pdf for the
 | ||||
|          time split, a step for stereo, and a triangular one for the rest. */ | ||||
|       if (stereo && N>2) | ||||
|  | @ -796,7 +849,7 @@ static void compute_theta(struct band_ctx *ctx, struct split_ctx *sctx, | |||
|    } else if (stereo) { | ||||
|       if (encode) | ||||
|       { | ||||
|          inv = itheta > 8192; | ||||
|          inv = itheta > 8192 && !ctx->disable_inv; | ||||
|          if (inv) | ||||
|          { | ||||
|             int j; | ||||
|  | @ -813,6 +866,9 @@ static void compute_theta(struct band_ctx *ctx, struct split_ctx *sctx, | |||
|             inv = ec_dec_bit_logp(ec, 2); | ||||
|       } else | ||||
|          inv = 0; | ||||
|       /* inv flag override to avoid problems with downmixing. */ | ||||
|       if (ctx->disable_inv) | ||||
|          inv = 0; | ||||
|       itheta = 0; | ||||
|    } | ||||
|    qalloc = ec_tell_frac(ec) - tell; | ||||
|  | @ -848,11 +904,6 @@ static void compute_theta(struct band_ctx *ctx, struct split_ctx *sctx, | |||
| static unsigned quant_band_n1(struct band_ctx *ctx, celt_norm *X, celt_norm *Y, int b, | ||||
|       celt_norm *lowband_out) | ||||
| { | ||||
| #ifdef RESYNTH | ||||
|    int resynth = 1; | ||||
| #else | ||||
|    int resynth = !ctx->encode; | ||||
| #endif | ||||
|    int c; | ||||
|    int stereo; | ||||
|    celt_norm *x = X; | ||||
|  | @ -877,7 +928,7 @@ static unsigned quant_band_n1(struct band_ctx *ctx, celt_norm *X, celt_norm *Y, | |||
|          ctx->remaining_bits -= 1<<BITRES; | ||||
|          b-=1<<BITRES; | ||||
|       } | ||||
|       if (resynth) | ||||
|       if (ctx->resynth) | ||||
|          x[0] = sign ? -NORM_SCALING : NORM_SCALING; | ||||
|       x = Y; | ||||
|    } while (++c<1+stereo); | ||||
|  | @ -902,11 +953,6 @@ static unsigned quant_partition(struct band_ctx *ctx, celt_norm *X, | |||
|    int B0=B; | ||||
|    opus_val16 mid=0, side=0; | ||||
|    unsigned cm=0; | ||||
| #ifdef RESYNTH | ||||
|    int resynth = 1; | ||||
| #else | ||||
|    int resynth = !ctx->encode; | ||||
| #endif | ||||
|    celt_norm *Y=NULL; | ||||
|    int encode; | ||||
|    const CELTMode *m; | ||||
|  | @ -938,8 +984,7 @@ static unsigned quant_partition(struct band_ctx *ctx, celt_norm *X, | |||
|          fill = (fill&1)|(fill<<1); | ||||
|       B = (B+1)>>1; | ||||
| 
 | ||||
|       compute_theta(ctx, &sctx, X, Y, N, &b, B, B0, | ||||
|             LM, 0, &fill); | ||||
|       compute_theta(ctx, &sctx, X, Y, N, &b, B, B0, LM, 0, &fill); | ||||
|       imid = sctx.imid; | ||||
|       iside = sctx.iside; | ||||
|       delta = sctx.delta; | ||||
|  | @ -973,24 +1018,20 @@ static unsigned quant_partition(struct band_ctx *ctx, celt_norm *X, | |||
|       rebalance = ctx->remaining_bits; | ||||
|       if (mbits >= sbits) | ||||
|       { | ||||
|          cm = quant_partition(ctx, X, N, mbits, B, | ||||
|                lowband, LM, | ||||
|          cm = quant_partition(ctx, X, N, mbits, B, lowband, LM, | ||||
|                MULT16_16_P15(gain,mid), fill); | ||||
|          rebalance = mbits - (rebalance-ctx->remaining_bits); | ||||
|          if (rebalance > 3<<BITRES && itheta!=0) | ||||
|             sbits += rebalance - (3<<BITRES); | ||||
|          cm |= quant_partition(ctx, Y, N, sbits, B, | ||||
|                next_lowband2, LM, | ||||
|          cm |= quant_partition(ctx, Y, N, sbits, B, next_lowband2, LM, | ||||
|                MULT16_16_P15(gain,side), fill>>B)<<(B0>>1); | ||||
|       } else { | ||||
|          cm = quant_partition(ctx, Y, N, sbits, B, | ||||
|                next_lowband2, LM, | ||||
|          cm = quant_partition(ctx, Y, N, sbits, B, next_lowband2, LM, | ||||
|                MULT16_16_P15(gain,side), fill>>B)<<(B0>>1); | ||||
|          rebalance = sbits - (rebalance-ctx->remaining_bits); | ||||
|          if (rebalance > 3<<BITRES && itheta!=16384) | ||||
|             mbits += rebalance - (3<<BITRES); | ||||
|          cm |= quant_partition(ctx, X, N, mbits, B, | ||||
|                lowband, LM, | ||||
|          cm |= quant_partition(ctx, X, N, mbits, B, lowband, LM, | ||||
|                MULT16_16_P15(gain,mid), fill); | ||||
|       } | ||||
|    } else { | ||||
|  | @ -1015,18 +1056,14 @@ static unsigned quant_partition(struct band_ctx *ctx, celt_norm *X, | |||
|          /* Finally do the actual quantization */ | ||||
|          if (encode) | ||||
|          { | ||||
|             cm = alg_quant(X, N, K, spread, B, ec | ||||
| #ifdef RESYNTH | ||||
|                  , gain | ||||
| #endif | ||||
|                  ); | ||||
|             cm = alg_quant(X, N, K, spread, B, ec, gain, ctx->resynth, ctx->arch); | ||||
|          } else { | ||||
|             cm = alg_unquant(X, N, K, spread, B, ec, gain); | ||||
|          } | ||||
|       } else { | ||||
|          /* If there's no pulse, fill the band anyway */ | ||||
|          int j; | ||||
|          if (resynth) | ||||
|          if (ctx->resynth) | ||||
|          { | ||||
|             unsigned cm_mask; | ||||
|             /* B can be as large as 16, so this shift might overflow an int on a
 | ||||
|  | @ -1059,7 +1096,7 @@ static unsigned quant_partition(struct band_ctx *ctx, celt_norm *X, | |||
|                   } | ||||
|                   cm = fill; | ||||
|                } | ||||
|                renormalise_vector(X, N, gain); | ||||
|                renormalise_vector(X, N, gain, ctx->arch); | ||||
|             } | ||||
|          } | ||||
|       } | ||||
|  | @ -1083,11 +1120,6 @@ static unsigned quant_band(struct band_ctx *ctx, celt_norm *X, | |||
|    int recombine=0; | ||||
|    int longBlocks; | ||||
|    unsigned cm=0; | ||||
| #ifdef RESYNTH | ||||
|    int resynth = 1; | ||||
| #else | ||||
|    int resynth = !ctx->encode; | ||||
| #endif | ||||
|    int k; | ||||
|    int encode; | ||||
|    int tf_change; | ||||
|  | @ -1154,11 +1186,10 @@ static unsigned quant_band(struct band_ctx *ctx, celt_norm *X, | |||
|          deinterleave_hadamard(lowband, N_B>>recombine, B0<<recombine, longBlocks); | ||||
|    } | ||||
| 
 | ||||
|    cm = quant_partition(ctx, X, N, b, B, lowband, | ||||
|          LM, gain, fill); | ||||
|    cm = quant_partition(ctx, X, N, b, B, lowband, LM, gain, fill); | ||||
| 
 | ||||
|    /* This code is used by the decoder and by the resynthesis-enabled encoder */ | ||||
|    if (resynth) | ||||
|    if (ctx->resynth) | ||||
|    { | ||||
|       /* Undo the sample reorganization going from time order to frequency order */ | ||||
|       if (B0>1) | ||||
|  | @ -1211,11 +1242,6 @@ static unsigned quant_band_stereo(struct band_ctx *ctx, celt_norm *X, celt_norm | |||
|    int inv = 0; | ||||
|    opus_val16 mid=0, side=0; | ||||
|    unsigned cm=0; | ||||
| #ifdef RESYNTH | ||||
|    int resynth = 1; | ||||
| #else | ||||
|    int resynth = !ctx->encode; | ||||
| #endif | ||||
|    int mbits, sbits, delta; | ||||
|    int itheta; | ||||
|    int qalloc; | ||||
|  | @ -1235,8 +1261,7 @@ static unsigned quant_band_stereo(struct band_ctx *ctx, celt_norm *X, celt_norm | |||
| 
 | ||||
|    orig_fill = fill; | ||||
| 
 | ||||
|    compute_theta(ctx, &sctx, X, Y, N, &b, B, B, | ||||
|          LM, 1, &fill); | ||||
|    compute_theta(ctx, &sctx, X, Y, N, &b, B, B, LM, 1, &fill); | ||||
|    inv = sctx.inv; | ||||
|    imid = sctx.imid; | ||||
|    iside = sctx.iside; | ||||
|  | @ -1284,13 +1309,13 @@ static unsigned quant_band_stereo(struct band_ctx *ctx, celt_norm *X, celt_norm | |||
|       sign = 1-2*sign; | ||||
|       /* We use orig_fill here because we want to fold the side, but if
 | ||||
|          itheta==16384, we'll have cleared the low bits of fill. */ | ||||
|       cm = quant_band(ctx, x2, N, mbits, B, lowband, | ||||
|             LM, lowband_out, Q15ONE, lowband_scratch, orig_fill); | ||||
|       cm = quant_band(ctx, x2, N, mbits, B, lowband, LM, lowband_out, Q15ONE, | ||||
|             lowband_scratch, orig_fill); | ||||
|       /* We don't split N=2 bands, so cm is either 1 or 0 (for a fold-collapse),
 | ||||
|          and there's no need to worry about mixing with the other channel. */ | ||||
|       y2[0] = -sign*x2[1]; | ||||
|       y2[1] = sign*x2[0]; | ||||
|       if (resynth) | ||||
|       if (ctx->resynth) | ||||
|       { | ||||
|          celt_norm tmp; | ||||
|          X[0] = MULT16_16_Q15(mid, X[0]); | ||||
|  | @ -1317,41 +1342,35 @@ static unsigned quant_band_stereo(struct band_ctx *ctx, celt_norm *X, celt_norm | |||
|       { | ||||
|          /* In stereo mode, we do not apply a scaling to the mid because we need the normalized
 | ||||
|             mid for folding later. */ | ||||
|          cm = quant_band(ctx, X, N, mbits, B, | ||||
|                lowband, LM, lowband_out, | ||||
|                Q15ONE, lowband_scratch, fill); | ||||
|          cm = quant_band(ctx, X, N, mbits, B, lowband, LM, lowband_out, Q15ONE, | ||||
|                lowband_scratch, fill); | ||||
|          rebalance = mbits - (rebalance-ctx->remaining_bits); | ||||
|          if (rebalance > 3<<BITRES && itheta!=0) | ||||
|             sbits += rebalance - (3<<BITRES); | ||||
| 
 | ||||
|          /* For a stereo split, the high bits of fill are always zero, so no
 | ||||
|             folding will be done to the side. */ | ||||
|          cm |= quant_band(ctx, Y, N, sbits, B, | ||||
|                NULL, LM, NULL, | ||||
|                side, NULL, fill>>B); | ||||
|          cm |= quant_band(ctx, Y, N, sbits, B, NULL, LM, NULL, side, NULL, fill>>B); | ||||
|       } else { | ||||
|          /* For a stereo split, the high bits of fill are always zero, so no
 | ||||
|             folding will be done to the side. */ | ||||
|          cm = quant_band(ctx, Y, N, sbits, B, | ||||
|                NULL, LM, NULL, | ||||
|                side, NULL, fill>>B); | ||||
|          cm = quant_band(ctx, Y, N, sbits, B, NULL, LM, NULL, side, NULL, fill>>B); | ||||
|          rebalance = sbits - (rebalance-ctx->remaining_bits); | ||||
|          if (rebalance > 3<<BITRES && itheta!=16384) | ||||
|             mbits += rebalance - (3<<BITRES); | ||||
|          /* In stereo mode, we do not apply a scaling to the mid because we need the normalized
 | ||||
|             mid for folding later. */ | ||||
|          cm |= quant_band(ctx, X, N, mbits, B, | ||||
|                lowband, LM, lowband_out, | ||||
|                Q15ONE, lowband_scratch, fill); | ||||
|          cm |= quant_band(ctx, X, N, mbits, B, lowband, LM, lowband_out, Q15ONE, | ||||
|                lowband_scratch, fill); | ||||
|       } | ||||
|    } | ||||
| 
 | ||||
| 
 | ||||
|    /* This code is used by the decoder and by the resynthesis-enabled encoder */ | ||||
|    if (resynth) | ||||
|    if (ctx->resynth) | ||||
|    { | ||||
|       if (N!=2) | ||||
|          stereo_merge(X, Y, mid, N); | ||||
|          stereo_merge(X, Y, mid, N, ctx->arch); | ||||
|       if (inv) | ||||
|       { | ||||
|          int j; | ||||
|  | @ -1362,17 +1381,38 @@ static unsigned quant_band_stereo(struct band_ctx *ctx, celt_norm *X, celt_norm | |||
|    return cm; | ||||
| } | ||||
| 
 | ||||
| static void special_hybrid_folding(const CELTMode *m, celt_norm *norm, celt_norm *norm2, int start, int M, int dual_stereo) | ||||
| { | ||||
|    int n1, n2; | ||||
|    const opus_int16 * OPUS_RESTRICT eBands = m->eBands; | ||||
|    n1 = M*(eBands[start+1]-eBands[start]); | ||||
|    n2 = M*(eBands[start+2]-eBands[start+1]); | ||||
|    /* Duplicate enough of the first band folding data to be able to fold the second band.
 | ||||
|       Copies no data for CELT-only mode. */ | ||||
|    OPUS_COPY(&norm[n1], &norm[2*n1 - n2], n2-n1); | ||||
|    if (dual_stereo) | ||||
|       OPUS_COPY(&norm2[n1], &norm2[2*n1 - n2], n2-n1); | ||||
| } | ||||
| 
 | ||||
| void quant_all_bands(int encode, const CELTMode *m, int start, int end, | ||||
|       celt_norm *X_, celt_norm *Y_, unsigned char *collapse_masks, const celt_ener *bandE, int *pulses, | ||||
|       int shortBlocks, int spread, int dual_stereo, int intensity, int *tf_res, | ||||
|       opus_int32 total_bits, opus_int32 balance, ec_ctx *ec, int LM, int codedBands, opus_uint32 *seed) | ||||
|       celt_norm *X_, celt_norm *Y_, unsigned char *collapse_masks, | ||||
|       const celt_ener *bandE, int *pulses, int shortBlocks, int spread, | ||||
|       int dual_stereo, int intensity, int *tf_res, opus_int32 total_bits, | ||||
|       opus_int32 balance, ec_ctx *ec, int LM, int codedBands, | ||||
|       opus_uint32 *seed, int complexity, int arch, int disable_inv) | ||||
| { | ||||
|    int i; | ||||
|    opus_int32 remaining_bits; | ||||
|    const opus_int16 * OPUS_RESTRICT eBands = m->eBands; | ||||
|    celt_norm * OPUS_RESTRICT norm, * OPUS_RESTRICT norm2; | ||||
|    VARDECL(celt_norm, _norm); | ||||
|    VARDECL(celt_norm, _lowband_scratch); | ||||
|    VARDECL(celt_norm, X_save); | ||||
|    VARDECL(celt_norm, Y_save); | ||||
|    VARDECL(celt_norm, X_save2); | ||||
|    VARDECL(celt_norm, Y_save2); | ||||
|    VARDECL(celt_norm, norm_save2); | ||||
|    int resynth_alloc; | ||||
|    celt_norm *lowband_scratch; | ||||
|    int B; | ||||
|    int M; | ||||
|  | @ -1380,10 +1420,11 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
|    int update_lowband = 1; | ||||
|    int C = Y_ != NULL ? 2 : 1; | ||||
|    int norm_offset; | ||||
|    int theta_rdo = encode && Y_!=NULL && !dual_stereo && complexity>=8; | ||||
| #ifdef RESYNTH | ||||
|    int resynth = 1; | ||||
| #else | ||||
|    int resynth = !encode; | ||||
|    int resynth = !encode || theta_rdo; | ||||
| #endif | ||||
|    struct band_ctx ctx; | ||||
|    SAVE_STACK; | ||||
|  | @ -1396,9 +1437,24 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
|    ALLOC(_norm, C*(M*eBands[m->nbEBands-1]-norm_offset), celt_norm); | ||||
|    norm = _norm; | ||||
|    norm2 = norm + M*eBands[m->nbEBands-1]-norm_offset; | ||||
|    /* We can use the last band as scratch space because we don't need that
 | ||||
|       scratch space for the last band. */ | ||||
|    lowband_scratch = X_+M*eBands[m->nbEBands-1]; | ||||
| 
 | ||||
|    /* For decoding, we can use the last band as scratch space because we don't need that
 | ||||
|       scratch space for the last band and we don't care about the data there until we're | ||||
|       decoding the last band. */ | ||||
|    if (encode && resynth) | ||||
|       resynth_alloc = M*(eBands[m->nbEBands]-eBands[m->nbEBands-1]); | ||||
|    else | ||||
|       resynth_alloc = ALLOC_NONE; | ||||
|    ALLOC(_lowband_scratch, resynth_alloc, celt_norm); | ||||
|    if (encode && resynth) | ||||
|       lowband_scratch = _lowband_scratch; | ||||
|    else | ||||
|       lowband_scratch = X_+M*eBands[m->nbEBands-1]; | ||||
|    ALLOC(X_save, resynth_alloc, celt_norm); | ||||
|    ALLOC(Y_save, resynth_alloc, celt_norm); | ||||
|    ALLOC(X_save2, resynth_alloc, celt_norm); | ||||
|    ALLOC(Y_save2, resynth_alloc, celt_norm); | ||||
|    ALLOC(norm_save2, resynth_alloc, celt_norm); | ||||
| 
 | ||||
|    lowband_offset = 0; | ||||
|    ctx.bandE = bandE; | ||||
|  | @ -1408,6 +1464,12 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
|    ctx.m = m; | ||||
|    ctx.seed = *seed; | ||||
|    ctx.spread = spread; | ||||
|    ctx.arch = arch; | ||||
|    ctx.disable_inv = disable_inv; | ||||
|    ctx.resynth = resynth; | ||||
|    ctx.theta_round = 0; | ||||
|    /* Avoid injecting noise in the first band on transients. */ | ||||
|    ctx.avoid_split_noise = B > 1; | ||||
|    for (i=start;i<end;i++) | ||||
|    { | ||||
|       opus_int32 tell; | ||||
|  | @ -1430,6 +1492,7 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
|       else | ||||
|          Y = NULL; | ||||
|       N = M*eBands[i+1]-M*eBands[i]; | ||||
|       celt_assert(N > 0); | ||||
|       tell = ec_tell_frac(ec); | ||||
| 
 | ||||
|       /* Compute how many bits we want to allocate to this band */ | ||||
|  | @ -1445,8 +1508,15 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
|          b = 0; | ||||
|       } | ||||
| 
 | ||||
| #ifndef DISABLE_UPDATE_DRAFT | ||||
|       if (resynth && (M*eBands[i]-N >= M*eBands[start] || i==start+1) && (update_lowband || lowband_offset==0)) | ||||
|             lowband_offset = i; | ||||
|       if (i == start+1) | ||||
|          special_hybrid_folding(m, norm, norm2, start, M, dual_stereo); | ||||
| #else | ||||
|       if (resynth && M*eBands[i]-N >= M*eBands[start] && (update_lowband || lowband_offset==0)) | ||||
|             lowband_offset = i; | ||||
| #endif | ||||
| 
 | ||||
|       tf_change = tf_res[i]; | ||||
|       ctx.tf_change = tf_change; | ||||
|  | @ -1457,7 +1527,7 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
|             Y = norm; | ||||
|          lowband_scratch = NULL; | ||||
|       } | ||||
|       if (i==end-1) | ||||
|       if (last && !theta_rdo) | ||||
|          lowband_scratch = NULL; | ||||
| 
 | ||||
|       /* Get a conservative estimate of the collapse_mask's for the bands we're
 | ||||
|  | @ -1472,7 +1542,11 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
|          fold_start = lowband_offset; | ||||
|          while(M*eBands[--fold_start] > effective_lowband+norm_offset); | ||||
|          fold_end = lowband_offset-1; | ||||
| #ifndef DISABLE_UPDATE_DRAFT | ||||
|          while(++fold_end < i && M*eBands[fold_end] < effective_lowband+norm_offset+N); | ||||
| #else | ||||
|          while(M*eBands[++fold_end] < effective_lowband+norm_offset+N); | ||||
| #endif | ||||
|          x_cm = y_cm = 0; | ||||
|          fold_i = fold_start; do { | ||||
|            x_cm |= collapse_masks[fold_i*C+0]; | ||||
|  | @ -1505,13 +1579,79 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
|       } else { | ||||
|          if (Y!=NULL) | ||||
|          { | ||||
|             x_cm = quant_band_stereo(&ctx, X, Y, N, b, B, | ||||
|                   effective_lowband != -1 ? norm+effective_lowband : NULL, LM, | ||||
|                         last?NULL:norm+M*eBands[i]-norm_offset, lowband_scratch, x_cm|y_cm); | ||||
|             if (theta_rdo && i < intensity) | ||||
|             { | ||||
|                ec_ctx ec_save, ec_save2; | ||||
|                struct band_ctx ctx_save, ctx_save2; | ||||
|                opus_val32 dist0, dist1; | ||||
|                unsigned cm, cm2; | ||||
|                int nstart_bytes, nend_bytes, save_bytes; | ||||
|                unsigned char *bytes_buf; | ||||
|                unsigned char bytes_save[1275]; | ||||
|                opus_val16 w[2]; | ||||
|                compute_channel_weights(bandE[i], bandE[i+m->nbEBands], w); | ||||
|                /* Make a copy. */ | ||||
|                cm = x_cm|y_cm; | ||||
|                ec_save = *ec; | ||||
|                ctx_save = ctx; | ||||
|                OPUS_COPY(X_save, X, N); | ||||
|                OPUS_COPY(Y_save, Y, N); | ||||
|                /* Encode and round down. */ | ||||
|                ctx.theta_round = -1; | ||||
|                x_cm = quant_band_stereo(&ctx, X, Y, N, b, B, | ||||
|                      effective_lowband != -1 ? norm+effective_lowband : NULL, LM, | ||||
|                      last?NULL:norm+M*eBands[i]-norm_offset, lowband_scratch, cm); | ||||
|                dist0 = MULT16_32_Q15(w[0], celt_inner_prod(X_save, X, N, arch)) + MULT16_32_Q15(w[1], celt_inner_prod(Y_save, Y, N, arch)); | ||||
| 
 | ||||
|                /* Save first result. */ | ||||
|                cm2 = x_cm; | ||||
|                ec_save2 = *ec; | ||||
|                ctx_save2 = ctx; | ||||
|                OPUS_COPY(X_save2, X, N); | ||||
|                OPUS_COPY(Y_save2, Y, N); | ||||
|                if (!last) | ||||
|                   OPUS_COPY(norm_save2, norm+M*eBands[i]-norm_offset, N); | ||||
|                nstart_bytes = ec_save.offs; | ||||
|                nend_bytes = ec_save.storage; | ||||
|                bytes_buf = ec_save.buf+nstart_bytes; | ||||
|                save_bytes = nend_bytes-nstart_bytes; | ||||
|                OPUS_COPY(bytes_save, bytes_buf, save_bytes); | ||||
| 
 | ||||
|                /* Restore */ | ||||
|                *ec = ec_save; | ||||
|                ctx = ctx_save; | ||||
|                OPUS_COPY(X, X_save, N); | ||||
|                OPUS_COPY(Y, Y_save, N); | ||||
| #ifndef DISABLE_UPDATE_DRAFT | ||||
|                if (i == start+1) | ||||
|                   special_hybrid_folding(m, norm, norm2, start, M, dual_stereo); | ||||
| #endif | ||||
|                /* Encode and round up. */ | ||||
|                ctx.theta_round = 1; | ||||
|                x_cm = quant_band_stereo(&ctx, X, Y, N, b, B, | ||||
|                      effective_lowband != -1 ? norm+effective_lowband : NULL, LM, | ||||
|                      last?NULL:norm+M*eBands[i]-norm_offset, lowband_scratch, cm); | ||||
|                dist1 = MULT16_32_Q15(w[0], celt_inner_prod(X_save, X, N, arch)) + MULT16_32_Q15(w[1], celt_inner_prod(Y_save, Y, N, arch)); | ||||
|                if (dist0 >= dist1) { | ||||
|                   x_cm = cm2; | ||||
|                   *ec = ec_save2; | ||||
|                   ctx = ctx_save2; | ||||
|                   OPUS_COPY(X, X_save2, N); | ||||
|                   OPUS_COPY(Y, Y_save2, N); | ||||
|                   if (!last) | ||||
|                      OPUS_COPY(norm+M*eBands[i]-norm_offset, norm_save2, N); | ||||
|                   OPUS_COPY(bytes_buf, bytes_save, save_bytes); | ||||
|                } | ||||
|             } else { | ||||
|                ctx.theta_round = 0; | ||||
|                x_cm = quant_band_stereo(&ctx, X, Y, N, b, B, | ||||
|                      effective_lowband != -1 ? norm+effective_lowband : NULL, LM, | ||||
|                      last?NULL:norm+M*eBands[i]-norm_offset, lowband_scratch, x_cm|y_cm); | ||||
|             } | ||||
|          } else { | ||||
|             x_cm = quant_band(&ctx, X, N, b, B, | ||||
|                   effective_lowband != -1 ? norm+effective_lowband : NULL, LM, | ||||
|                         last?NULL:norm+M*eBands[i]-norm_offset, Q15ONE, lowband_scratch, x_cm|y_cm); | ||||
|                   last?NULL:norm+M*eBands[i]-norm_offset, Q15ONE, lowband_scratch, x_cm|y_cm); | ||||
|          } | ||||
|          y_cm = x_cm; | ||||
|       } | ||||
|  | @ -1521,6 +1661,9 @@ void quant_all_bands(int encode, const CELTMode *m, int start, int end, | |||
| 
 | ||||
|       /* Update the folding position only as long as we have 1 bit/sample depth. */ | ||||
|       update_lowband = b>(N<<BITRES); | ||||
|       /* We only need to avoid noise on a split for the first band. After that, we
 | ||||
|          have folding. */ | ||||
|       ctx.avoid_split_noise = 0; | ||||
|    } | ||||
|    *seed = ctx.seed; | ||||
| 
 | ||||
|  |  | |||
|  | @ -36,12 +36,15 @@ | |||
| #include "entdec.h" | ||||
| #include "rate.h" | ||||
| 
 | ||||
| opus_int16 bitexact_cos(opus_int16 x); | ||||
| int bitexact_log2tan(int isin,int icos); | ||||
| 
 | ||||
| /** Compute the amplitude (sqrt energy) in each of the bands
 | ||||
|  * @param m Mode data | ||||
|  * @param X Spectrum | ||||
|  * @param bandE Square root of the energy for each band (returned) | ||||
|  */ | ||||
| void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *bandE, int end, int C, int LM); | ||||
| void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *bandE, int end, int C, int LM, int arch); | ||||
| 
 | ||||
| /*void compute_noise_energies(const CELTMode *m, const celt_sig *X, const opus_val16 *tonality, celt_ener *bandE);*/ | ||||
| 
 | ||||
|  | @ -69,7 +72,7 @@ void denormalise_bands(const CELTMode *m, const celt_norm * OPUS_RESTRICT X, | |||
| 
 | ||||
| int spreading_decision(const CELTMode *m, const celt_norm *X, int *average, | ||||
|       int last_decision, int *hf_average, int *tapset_decision, int update_hf, | ||||
|       int end, int C, int M); | ||||
|       int end, int C, int M, const int *spread_weight); | ||||
| 
 | ||||
| #ifdef MEASURE_NORM_MSE | ||||
| void measure_norm_mse(const CELTMode *m, float *X, float *X0, float *bandE, float *bandE0, int M, int N, int C); | ||||
|  | @ -98,15 +101,20 @@ void haar1(celt_norm *X, int N0, int stride); | |||
|  * @param LM log2() of the number of 2.5 subframes in the frame | ||||
|  * @param codedBands Last band to receive bits + 1 | ||||
|  * @param seed Random generator seed | ||||
|  * @param arch Run-time architecture (see opus_select_arch()) | ||||
|  */ | ||||
| void quant_all_bands(int encode, const CELTMode *m, int start, int end, | ||||
|       celt_norm * X, celt_norm * Y, unsigned char *collapse_masks, const celt_ener *bandE, int *pulses, | ||||
|       int shortBlocks, int spread, int dual_stereo, int intensity, int *tf_res, | ||||
|       opus_int32 total_bits, opus_int32 balance, ec_ctx *ec, int M, int codedBands, opus_uint32 *seed); | ||||
|       celt_norm * X, celt_norm * Y, unsigned char *collapse_masks, | ||||
|       const celt_ener *bandE, int *pulses, int shortBlocks, int spread, | ||||
|       int dual_stereo, int intensity, int *tf_res, opus_int32 total_bits, | ||||
|       opus_int32 balance, ec_ctx *ec, int M, int codedBands, opus_uint32 *seed, | ||||
|       int complexity, int arch, int disable_inv); | ||||
| 
 | ||||
| void anti_collapse(const CELTMode *m, celt_norm *X_, unsigned char *collapse_masks, int LM, int C, int size, | ||||
|       int start, int end, const opus_val16 *logE, const opus_val16 *prev1logE, | ||||
|       const opus_val16 *prev2logE, const int *pulses, opus_uint32 seed); | ||||
| void anti_collapse(const CELTMode *m, celt_norm *X_, | ||||
|       unsigned char *collapse_masks, int LM, int C, int size, int start, | ||||
|       int end, const opus_val16 *logE, const opus_val16 *prev1logE, | ||||
|       const opus_val16 *prev2logE, const int *pulses, opus_uint32 seed, | ||||
|       int arch); | ||||
| 
 | ||||
| opus_uint32 celt_lcg_rand(opus_uint32 seed); | ||||
| 
 | ||||
|  |  | |||
|  | @ -89,10 +89,13 @@ int resampling_factor(opus_int32 rate) | |||
|    return ret; | ||||
| } | ||||
| 
 | ||||
| #ifndef OVERRIDE_COMB_FILTER_CONST | ||||
| #if !defined(OVERRIDE_COMB_FILTER_CONST) || defined(NON_STATIC_COMB_FILTER_CONST_C) | ||||
| /* This version should be faster on ARM */ | ||||
| #ifdef OPUS_ARM_ASM | ||||
| static void comb_filter_const(opus_val32 *y, opus_val32 *x, int T, int N, | ||||
| #ifndef NON_STATIC_COMB_FILTER_CONST_C | ||||
| static | ||||
| #endif | ||||
| void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N, | ||||
|       opus_val16 g10, opus_val16 g11, opus_val16 g12) | ||||
| { | ||||
|    opus_val32 x0, x1, x2, x3, x4; | ||||
|  | @ -108,26 +111,31 @@ static void comb_filter_const(opus_val32 *y, opus_val32 *x, int T, int N, | |||
|       t = MAC16_32_Q16(x[i], g10, x2); | ||||
|       t = MAC16_32_Q16(t, g11, ADD32(x1,x3)); | ||||
|       t = MAC16_32_Q16(t, g12, ADD32(x0,x4)); | ||||
|       t = SATURATE(t, SIG_SAT); | ||||
|       y[i] = t; | ||||
|       x4=SHL32(x[i-T+3],1); | ||||
|       t = MAC16_32_Q16(x[i+1], g10, x1); | ||||
|       t = MAC16_32_Q16(t, g11, ADD32(x0,x2)); | ||||
|       t = MAC16_32_Q16(t, g12, ADD32(x4,x3)); | ||||
|       t = SATURATE(t, SIG_SAT); | ||||
|       y[i+1] = t; | ||||
|       x3=SHL32(x[i-T+4],1); | ||||
|       t = MAC16_32_Q16(x[i+2], g10, x0); | ||||
|       t = MAC16_32_Q16(t, g11, ADD32(x4,x1)); | ||||
|       t = MAC16_32_Q16(t, g12, ADD32(x3,x2)); | ||||
|       t = SATURATE(t, SIG_SAT); | ||||
|       y[i+2] = t; | ||||
|       x2=SHL32(x[i-T+5],1); | ||||
|       t = MAC16_32_Q16(x[i+3], g10, x4); | ||||
|       t = MAC16_32_Q16(t, g11, ADD32(x3,x0)); | ||||
|       t = MAC16_32_Q16(t, g12, ADD32(x2,x1)); | ||||
|       t = SATURATE(t, SIG_SAT); | ||||
|       y[i+3] = t; | ||||
|       x1=SHL32(x[i-T+6],1); | ||||
|       t = MAC16_32_Q16(x[i+4], g10, x3); | ||||
|       t = MAC16_32_Q16(t, g11, ADD32(x2,x4)); | ||||
|       t = MAC16_32_Q16(t, g12, ADD32(x1,x0)); | ||||
|       t = SATURATE(t, SIG_SAT); | ||||
|       y[i+4] = t; | ||||
|    } | ||||
| #ifdef CUSTOM_MODES | ||||
|  | @ -138,6 +146,7 @@ static void comb_filter_const(opus_val32 *y, opus_val32 *x, int T, int N, | |||
|       t = MAC16_32_Q16(x[i], g10, x2); | ||||
|       t = MAC16_32_Q16(t, g11, ADD32(x1,x3)); | ||||
|       t = MAC16_32_Q16(t, g12, ADD32(x0,x4)); | ||||
|       t = SATURATE(t, SIG_SAT); | ||||
|       y[i] = t; | ||||
|       x4=x3; | ||||
|       x3=x2; | ||||
|  | @ -147,7 +156,10 @@ static void comb_filter_const(opus_val32 *y, opus_val32 *x, int T, int N, | |||
| #endif | ||||
| } | ||||
| #else | ||||
| static void comb_filter_const(opus_val32 *y, opus_val32 *x, int T, int N, | ||||
| #ifndef NON_STATIC_COMB_FILTER_CONST_C | ||||
| static | ||||
| #endif | ||||
| void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N, | ||||
|       opus_val16 g10, opus_val16 g11, opus_val16 g12) | ||||
| { | ||||
|    opus_val32 x0, x1, x2, x3, x4; | ||||
|  | @ -163,6 +175,7 @@ static void comb_filter_const(opus_val32 *y, opus_val32 *x, int T, int N, | |||
|                + MULT16_32_Q15(g10,x2) | ||||
|                + MULT16_32_Q15(g11,ADD32(x1,x3)) | ||||
|                + MULT16_32_Q15(g12,ADD32(x0,x4)); | ||||
|       y[i] = SATURATE(y[i], SIG_SAT); | ||||
|       x4=x3; | ||||
|       x3=x2; | ||||
|       x2=x1; | ||||
|  | @ -176,7 +189,7 @@ static void comb_filter_const(opus_val32 *y, opus_val32 *x, int T, int N, | |||
| #ifndef OVERRIDE_comb_filter | ||||
| void comb_filter(opus_val32 *y, opus_val32 *x, int T0, int T1, int N, | ||||
|       opus_val16 g0, opus_val16 g1, int tapset0, int tapset1, | ||||
|       const opus_val16 *window, int overlap) | ||||
|       const opus_val16 *window, int overlap, int arch) | ||||
| { | ||||
|    int i; | ||||
|    /* printf ("%d %d %f %f\n", T0, T1, g0, g1); */ | ||||
|  | @ -194,6 +207,10 @@ void comb_filter(opus_val32 *y, opus_val32 *x, int T0, int T1, int N, | |||
|          OPUS_MOVE(y, x, N); | ||||
|       return; | ||||
|    } | ||||
|    /* When the gain is zero, T0 and/or T1 is set to zero. We need
 | ||||
|       to have then be at least 2 to avoid processing garbage data. */ | ||||
|    T0 = IMAX(T0, COMBFILTER_MINPERIOD); | ||||
|    T1 = IMAX(T1, COMBFILTER_MINPERIOD); | ||||
|    g00 = MULT16_16_P15(g0, gains[tapset0][0]); | ||||
|    g01 = MULT16_16_P15(g0, gains[tapset0][1]); | ||||
|    g02 = MULT16_16_P15(g0, gains[tapset0][2]); | ||||
|  | @ -219,6 +236,7 @@ void comb_filter(opus_val32 *y, opus_val32 *x, int T0, int T1, int N, | |||
|                + MULT16_32_Q15(MULT16_16_Q15(f,g10),x2) | ||||
|                + MULT16_32_Q15(MULT16_16_Q15(f,g11),ADD32(x1,x3)) | ||||
|                + MULT16_32_Q15(MULT16_16_Q15(f,g12),ADD32(x0,x4)); | ||||
|       y[i] = SATURATE(y[i], SIG_SAT); | ||||
|       x4=x3; | ||||
|       x3=x2; | ||||
|       x2=x1; | ||||
|  | @ -234,15 +252,20 @@ void comb_filter(opus_val32 *y, opus_val32 *x, int T0, int T1, int N, | |||
|    } | ||||
| 
 | ||||
|    /* Compute the part with the constant filter. */ | ||||
|    comb_filter_const(y+i, x+i, T1, N-i, g10, g11, g12); | ||||
|    comb_filter_const(y+i, x+i, T1, N-i, g10, g11, g12, arch); | ||||
| } | ||||
| #endif /* OVERRIDE_comb_filter */ | ||||
| 
 | ||||
| /* TF change table. Positive values mean better frequency resolution (longer
 | ||||
|    effective window), whereas negative values mean better time resolution | ||||
|    (shorter effective window). The second index is computed as: | ||||
|    4*isTransient + 2*tf_select + per_band_flag */ | ||||
| const signed char tf_select_table[4][8] = { | ||||
|       {0, -1, 0, -1,    0,-1, 0,-1}, | ||||
|       {0, -1, 0, -2,    1, 0, 1,-1}, | ||||
|       {0, -2, 0, -3,    2, 0, 1,-1}, | ||||
|       {0, -2, 0, -3,    3, 0, 1,-1}, | ||||
|     /*isTransient=0     isTransient=1 */ | ||||
|       {0, -1, 0, -1,    0,-1, 0,-1}, /* 2.5 ms */ | ||||
|       {0, -1, 0, -2,    1, 0, 1,-1}, /* 5 ms */ | ||||
|       {0, -2, 0, -3,    2, 0, 1,-1}, /* 10 ms */ | ||||
|       {0, -2, 0, -3,    3, 0, 1,-1}, /* 20 ms */ | ||||
| }; | ||||
| 
 | ||||
| 
 | ||||
|  | @ -280,6 +303,9 @@ const char *opus_strerror(int error) | |||
| const char *opus_get_version_string(void) | ||||
| { | ||||
|     return "libopus " PACKAGE_VERSION | ||||
|     /* Applications may rely on the presence of this substring in the version
 | ||||
|        string to determine if they have a fixed-point or floating-point build | ||||
|        at runtime. */ | ||||
| #ifdef FIXED_POINT | ||||
|           "-fixed" | ||||
| #endif | ||||
|  |  | |||
|  | @ -50,6 +50,8 @@ extern "C" { | |||
| #define CELTDecoder OpusCustomDecoder | ||||
| #define CELTMode OpusCustomMode | ||||
| 
 | ||||
| #define LEAK_BANDS 19 | ||||
| 
 | ||||
| typedef struct { | ||||
|    int valid; | ||||
|    float tonality; | ||||
|  | @ -57,17 +59,27 @@ typedef struct { | |||
|    float noisiness; | ||||
|    float activity; | ||||
|    float music_prob; | ||||
|    int        bandwidth; | ||||
| }AnalysisInfo; | ||||
|    float music_prob_min; | ||||
|    float music_prob_max; | ||||
|    int   bandwidth; | ||||
|    float activity_probability; | ||||
|    float max_pitch_ratio; | ||||
|    /* Store as Q6 char to save space. */ | ||||
|    unsigned char leak_boost[LEAK_BANDS]; | ||||
| } AnalysisInfo; | ||||
| 
 | ||||
| typedef struct { | ||||
|    int signalType; | ||||
|    int offset; | ||||
| } SILKInfo; | ||||
| 
 | ||||
| #define __celt_check_mode_ptr_ptr(ptr) ((ptr) + ((ptr) - (const CELTMode**)(ptr))) | ||||
| 
 | ||||
| #define __celt_check_analysis_ptr(ptr) ((ptr) + ((ptr) - (const AnalysisInfo*)(ptr))) | ||||
| 
 | ||||
| /* Encoder/decoder Requests */ | ||||
| #define __celt_check_silkinfo_ptr(ptr) ((ptr) + ((ptr) - (const SILKInfo*)(ptr))) | ||||
| 
 | ||||
| /* Expose this option again when variable framesize actually works */ | ||||
| #define OPUS_FRAMESIZE_VARIABLE              5010 /**< Optimize the frame size dynamically */ | ||||
| /* Encoder/decoder Requests */ | ||||
| 
 | ||||
| 
 | ||||
| #define CELT_SET_PREDICTION_REQUEST    10002 | ||||
|  | @ -116,6 +128,9 @@ typedef struct { | |||
| #define OPUS_SET_ENERGY_MASK_REQUEST    10026 | ||||
| #define OPUS_SET_ENERGY_MASK(x) OPUS_SET_ENERGY_MASK_REQUEST, __opus_check_val16_ptr(x) | ||||
| 
 | ||||
| #define CELT_SET_SILK_INFO_REQUEST    10028 | ||||
| #define CELT_SET_SILK_INFO(x) CELT_SET_SILK_INFO_REQUEST, __celt_check_silkinfo_ptr(x) | ||||
| 
 | ||||
| /* Encoder stuff */ | ||||
| 
 | ||||
| int celt_encoder_get_size(int channels); | ||||
|  | @ -194,6 +209,13 @@ static OPUS_INLINE int fromOpus(unsigned char c) | |||
| 
 | ||||
| extern const signed char tf_select_table[4][8]; | ||||
| 
 | ||||
| #if defined(ENABLE_HARDENING) || defined(ENABLE_ASSERTIONS) | ||||
| void validate_celt_decoder(CELTDecoder *st); | ||||
| #define VALIDATE_CELT_DECODER(st) validate_celt_decoder(st) | ||||
| #else | ||||
| #define VALIDATE_CELT_DECODER(st) | ||||
| #endif | ||||
| 
 | ||||
| int resampling_factor(opus_int32 rate); | ||||
| 
 | ||||
| void celt_preemphasis(const opus_val16 * OPUS_RESTRICT pcmp, celt_sig * OPUS_RESTRICT inp, | ||||
|  | @ -201,7 +223,17 @@ void celt_preemphasis(const opus_val16 * OPUS_RESTRICT pcmp, celt_sig * OPUS_RES | |||
| 
 | ||||
| void comb_filter(opus_val32 *y, opus_val32 *x, int T0, int T1, int N, | ||||
|       opus_val16 g0, opus_val16 g1, int tapset0, int tapset1, | ||||
|       const opus_val16 *window, int overlap); | ||||
|       const opus_val16 *window, int overlap, int arch); | ||||
| 
 | ||||
| #ifdef NON_STATIC_COMB_FILTER_CONST_C | ||||
| void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N, | ||||
|                          opus_val16 g10, opus_val16 g11, opus_val16 g12); | ||||
| #endif | ||||
| 
 | ||||
| #ifndef OVERRIDE_COMB_FILTER_CONST | ||||
| # define comb_filter_const(y, x, T, N, g10, g11, g12, arch) \ | ||||
|     ((void)(arch),comb_filter_const_c(y, x, T, N, g10, g11, g12)) | ||||
| #endif | ||||
| 
 | ||||
| void init_caps(const CELTMode *m,int *cap,int LM,int C); | ||||
| 
 | ||||
|  |  | |||
|  | @ -51,6 +51,14 @@ | |||
| #include "celt_lpc.h" | ||||
| #include "vq.h" | ||||
| 
 | ||||
| /* The maximum pitch lag to allow in the pitch-based PLC. It's possible to save
 | ||||
|    CPU time in the PLC pitch search by making this smaller than MAX_PERIOD. The | ||||
|    current value corresponds to a pitch of 66.67 Hz. */ | ||||
| #define PLC_PITCH_LAG_MAX (720) | ||||
| /* The minimum pitch lag to allow in the pitch-based PLC. This corresponds to a
 | ||||
|    pitch of 480 Hz. */ | ||||
| #define PLC_PITCH_LAG_MIN (100) | ||||
| 
 | ||||
| #if defined(SMALL_FOOTPRINT) && defined(FIXED_POINT) | ||||
| #define NORM_ALIASING_HACK | ||||
| #endif | ||||
|  | @ -73,6 +81,7 @@ struct OpusCustomDecoder { | |||
|    int downsample; | ||||
|    int start, end; | ||||
|    int signalling; | ||||
|    int disable_inv; | ||||
|    int arch; | ||||
| 
 | ||||
|    /* Everything beyond this point gets cleared on a reset */ | ||||
|  | @ -82,6 +91,7 @@ struct OpusCustomDecoder { | |||
|    int error; | ||||
|    int last_pitch_index; | ||||
|    int loss_count; | ||||
|    int skip_plc; | ||||
|    int postfilter_period; | ||||
|    int postfilter_period_old; | ||||
|    opus_val16 postfilter_gain; | ||||
|  | @ -99,6 +109,38 @@ struct OpusCustomDecoder { | |||
|    /* opus_val16 backgroundLogE[], Size = 2*mode->nbEBands */ | ||||
| }; | ||||
| 
 | ||||
| #if defined(ENABLE_HARDENING) || defined(ENABLE_ASSERTIONS) | ||||
| /* Make basic checks on the CELT state to ensure we don't end
 | ||||
|    up writing all over memory. */ | ||||
| void validate_celt_decoder(CELTDecoder *st) | ||||
| { | ||||
| #ifndef CUSTOM_MODES | ||||
|    celt_assert(st->mode == opus_custom_mode_create(48000, 960, NULL)); | ||||
|    celt_assert(st->overlap == 120); | ||||
| #endif | ||||
|    celt_assert(st->channels == 1 || st->channels == 2); | ||||
|    celt_assert(st->stream_channels == 1 || st->stream_channels == 2); | ||||
|    celt_assert(st->downsample > 0); | ||||
|    celt_assert(st->start == 0 || st->start == 17); | ||||
|    celt_assert(st->start < st->end); | ||||
|    celt_assert(st->end <= 21); | ||||
| #ifdef OPUS_ARCHMASK | ||||
|    celt_assert(st->arch >= 0); | ||||
|    celt_assert(st->arch <= OPUS_ARCHMASK); | ||||
| #endif | ||||
|    celt_assert(st->last_pitch_index <= PLC_PITCH_LAG_MAX); | ||||
|    celt_assert(st->last_pitch_index >= PLC_PITCH_LAG_MIN || st->last_pitch_index == 0); | ||||
|    celt_assert(st->postfilter_period < MAX_PERIOD); | ||||
|    celt_assert(st->postfilter_period >= COMBFILTER_MINPERIOD || st->postfilter_period == 0); | ||||
|    celt_assert(st->postfilter_period_old < MAX_PERIOD); | ||||
|    celt_assert(st->postfilter_period_old >= COMBFILTER_MINPERIOD || st->postfilter_period_old == 0); | ||||
|    celt_assert(st->postfilter_tapset <= 2); | ||||
|    celt_assert(st->postfilter_tapset >= 0); | ||||
|    celt_assert(st->postfilter_tapset_old <= 2); | ||||
|    celt_assert(st->postfilter_tapset_old >= 0); | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| int celt_decoder_get_size(int channels) | ||||
| { | ||||
|    const CELTMode *mode = opus_custom_mode_create(48000, 960, NULL); | ||||
|  | @ -162,10 +204,13 @@ OPUS_CUSTOM_NOSTATIC int opus_custom_decoder_init(CELTDecoder *st, const CELTMod | |||
|    st->start = 0; | ||||
|    st->end = st->mode->effEBands; | ||||
|    st->signalling = 1; | ||||
| #ifndef DISABLE_UPDATE_DRAFT | ||||
|    st->disable_inv = channels == 1; | ||||
| #else | ||||
|    st->disable_inv = 0; | ||||
| #endif | ||||
|    st->arch = opus_select_arch(); | ||||
| 
 | ||||
|    st->loss_count = 0; | ||||
| 
 | ||||
|    opus_custom_decoder_ctl(st, OPUS_RESET_STATE); | ||||
| 
 | ||||
|    return OPUS_OK; | ||||
|  | @ -178,6 +223,36 @@ void opus_custom_decoder_destroy(CELTDecoder *st) | |||
| } | ||||
| #endif /* CUSTOM_MODES */ | ||||
| 
 | ||||
| #ifndef CUSTOM_MODES | ||||
| /* Special case for stereo with no downsampling and no accumulation. This is
 | ||||
|    quite common and we can make it faster by processing both channels in the | ||||
|    same loop, reducing overhead due to the dependency loop in the IIR filter. */ | ||||
| static void deemphasis_stereo_simple(celt_sig *in[], opus_val16 *pcm, int N, const opus_val16 coef0, | ||||
|       celt_sig *mem) | ||||
| { | ||||
|    celt_sig * OPUS_RESTRICT x0; | ||||
|    celt_sig * OPUS_RESTRICT x1; | ||||
|    celt_sig m0, m1; | ||||
|    int j; | ||||
|    x0=in[0]; | ||||
|    x1=in[1]; | ||||
|    m0 = mem[0]; | ||||
|    m1 = mem[1]; | ||||
|    for (j=0;j<N;j++) | ||||
|    { | ||||
|       celt_sig tmp0, tmp1; | ||||
|       /* Add VERY_SMALL to x[] first to reduce dependency chain. */ | ||||
|       tmp0 = x0[j] + VERY_SMALL + m0; | ||||
|       tmp1 = x1[j] + VERY_SMALL + m1; | ||||
|       m0 = MULT16_32_Q15(coef0, tmp0); | ||||
|       m1 = MULT16_32_Q15(coef0, tmp1); | ||||
|       pcm[2*j  ] = SCALEOUT(SIG2WORD16(tmp0)); | ||||
|       pcm[2*j+1] = SCALEOUT(SIG2WORD16(tmp1)); | ||||
|    } | ||||
|    mem[0] = m0; | ||||
|    mem[1] = m1; | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| #ifndef RESYNTH | ||||
| static | ||||
|  | @ -191,6 +266,14 @@ void deemphasis(celt_sig *in[], opus_val16 *pcm, int N, int C, int downsample, c | |||
|    opus_val16 coef0; | ||||
|    VARDECL(celt_sig, scratch); | ||||
|    SAVE_STACK; | ||||
| #ifndef CUSTOM_MODES | ||||
|    /* Short version for common case. */ | ||||
|    if (downsample == 1 && C == 2 && !accum) | ||||
|    { | ||||
|       deemphasis_stereo_simple(in, pcm, N, coef[0], mem); | ||||
|       return; | ||||
|    } | ||||
| #endif | ||||
| #ifndef FIXED_POINT | ||||
|    (void)accum; | ||||
|    celt_assert(accum==0); | ||||
|  | @ -226,7 +309,7 @@ void deemphasis(celt_sig *in[], opus_val16 *pcm, int N, int C, int downsample, c | |||
|          /* Shortcut for the standard (non-custom modes) case */ | ||||
|          for (j=0;j<N;j++) | ||||
|          { | ||||
|             celt_sig tmp = x[j] + m + VERY_SMALL; | ||||
|             celt_sig tmp = x[j] + VERY_SMALL + m; | ||||
|             m = MULT16_32_Q15(coef0, tmp); | ||||
|             scratch[j] = tmp; | ||||
|          } | ||||
|  | @ -247,7 +330,7 @@ void deemphasis(celt_sig *in[], opus_val16 *pcm, int N, int C, int downsample, c | |||
|          { | ||||
|             for (j=0;j<N;j++) | ||||
|             { | ||||
|                celt_sig tmp = x[j] + m + VERY_SMALL; | ||||
|                celt_sig tmp = x[j] + VERY_SMALL + m; | ||||
|                m = MULT16_32_Q15(coef0, tmp); | ||||
|                y[j*C] = SCALEOUT(SIG2WORD16(tmp)); | ||||
|             } | ||||
|  | @ -278,8 +361,9 @@ void deemphasis(celt_sig *in[], opus_val16 *pcm, int N, int C, int downsample, c | |||
| static | ||||
| #endif | ||||
| void celt_synthesis(const CELTMode *mode, celt_norm *X, celt_sig * out_syn[], | ||||
|       opus_val16 *oldBandE, int start, int effEnd, int C, int CC, int isTransient, | ||||
|       int LM, int downsample, int silence) | ||||
|                     opus_val16 *oldBandE, int start, int effEnd, int C, int CC, | ||||
|                     int isTransient, int LM, int downsample, | ||||
|                     int silence, int arch) | ||||
| { | ||||
|    int c, i; | ||||
|    int M; | ||||
|  | @ -319,9 +403,9 @@ void celt_synthesis(const CELTMode *mode, celt_norm *X, celt_sig * out_syn[], | |||
|       freq2 = out_syn[1]+overlap/2; | ||||
|       OPUS_COPY(freq2, freq, N); | ||||
|       for (b=0;b<B;b++) | ||||
|          clt_mdct_backward(&mode->mdct, &freq2[b], out_syn[0]+NB*b, mode->window, overlap, shift, B); | ||||
|          clt_mdct_backward(&mode->mdct, &freq2[b], out_syn[0]+NB*b, mode->window, overlap, shift, B, arch); | ||||
|       for (b=0;b<B;b++) | ||||
|          clt_mdct_backward(&mode->mdct, &freq[b], out_syn[1]+NB*b, mode->window, overlap, shift, B); | ||||
|          clt_mdct_backward(&mode->mdct, &freq[b], out_syn[1]+NB*b, mode->window, overlap, shift, B, arch); | ||||
|    } else if (CC==1&&C==2) | ||||
|    { | ||||
|       /* Downmixing a stereo stream to mono */ | ||||
|  | @ -333,18 +417,24 @@ void celt_synthesis(const CELTMode *mode, celt_norm *X, celt_sig * out_syn[], | |||
|       denormalise_bands(mode, X+N, freq2, oldBandE+nbEBands, start, effEnd, M, | ||||
|             downsample, silence); | ||||
|       for (i=0;i<N;i++) | ||||
|          freq[i] = HALF32(ADD32(freq[i],freq2[i])); | ||||
|          freq[i] = ADD32(HALF32(freq[i]), HALF32(freq2[i])); | ||||
|       for (b=0;b<B;b++) | ||||
|          clt_mdct_backward(&mode->mdct, &freq[b], out_syn[0]+NB*b, mode->window, overlap, shift, B); | ||||
|          clt_mdct_backward(&mode->mdct, &freq[b], out_syn[0]+NB*b, mode->window, overlap, shift, B, arch); | ||||
|    } else { | ||||
|       /* Normal case (mono or stereo) */ | ||||
|       c=0; do { | ||||
|          denormalise_bands(mode, X+c*N, freq, oldBandE+c*nbEBands, start, effEnd, M, | ||||
|                downsample, silence); | ||||
|          for (b=0;b<B;b++) | ||||
|             clt_mdct_backward(&mode->mdct, &freq[b], out_syn[c]+NB*b, mode->window, overlap, shift, B); | ||||
|             clt_mdct_backward(&mode->mdct, &freq[b], out_syn[c]+NB*b, mode->window, overlap, shift, B, arch); | ||||
|       } while (++c<CC); | ||||
|    } | ||||
|    /* Saturate IMDCT output so that we can't overflow in the pitch postfilter
 | ||||
|       or in the */ | ||||
|    c=0; do { | ||||
|       for (i=0;i<N;i++) | ||||
|          out_syn[c][i] = SATURATE(out_syn[c][i], SIG_SAT); | ||||
|    } while (++c<CC); | ||||
|    RESTORE_STACK; | ||||
| } | ||||
| 
 | ||||
|  | @ -387,14 +477,6 @@ static void tf_decode(int start, int end, int isTransient, int *tf_res, int LM, | |||
|    } | ||||
| } | ||||
| 
 | ||||
| /* The maximum pitch lag to allow in the pitch-based PLC. It's possible to save
 | ||||
|    CPU time in the PLC pitch search by making this smaller than MAX_PERIOD. The | ||||
|    current value corresponds to a pitch of 66.67 Hz. */ | ||||
| #define PLC_PITCH_LAG_MAX (720) | ||||
| /* The minimum pitch lag to allow in the pitch-based PLC. This corresponds to a
 | ||||
|    pitch of 480 Hz. */ | ||||
| #define PLC_PITCH_LAG_MIN (100) | ||||
| 
 | ||||
| static int celt_plc_pitch_search(celt_sig *decode_mem[2], int C, int arch) | ||||
| { | ||||
|    int pitch_index; | ||||
|  | @ -446,7 +528,7 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
| 
 | ||||
|    loss_count = st->loss_count; | ||||
|    start = st->start; | ||||
|    noise_based = loss_count >= 5 || start != 0; | ||||
|    noise_based = loss_count >= 5 || start != 0 || st->skip_plc; | ||||
|    if (noise_based) | ||||
|    { | ||||
|       /* Noise-based PLC/CNG */ | ||||
|  | @ -456,10 +538,9 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|       VARDECL(celt_norm, X); | ||||
| #endif | ||||
|       opus_uint32 seed; | ||||
|       opus_val16 *plcLogE; | ||||
|       int end; | ||||
|       int effEnd; | ||||
| 
 | ||||
|       opus_val16 decay; | ||||
|       end = st->end; | ||||
|       effEnd = IMAX(start, IMIN(end, mode->effEBands)); | ||||
| 
 | ||||
|  | @ -471,19 +552,13 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|       ALLOC(X, C*N, celt_norm);   /**< Interleaved normalised MDCTs */ | ||||
| #endif | ||||
| 
 | ||||
|       if (loss_count >= 5) | ||||
|          plcLogE = backgroundLogE; | ||||
|       else { | ||||
|          /* Energy decay */ | ||||
|          opus_val16 decay = loss_count==0 ? | ||||
|                QCONST16(1.5f, DB_SHIFT) : QCONST16(.5f, DB_SHIFT); | ||||
|          c=0; do | ||||
|          { | ||||
|             for (i=start;i<end;i++) | ||||
|                oldBandE[c*nbEBands+i] -= decay; | ||||
|          } while (++c<C); | ||||
|          plcLogE = oldBandE; | ||||
|       } | ||||
|       /* Energy decay */ | ||||
|       decay = loss_count==0 ? QCONST16(1.5f, DB_SHIFT) : QCONST16(.5f, DB_SHIFT); | ||||
|       c=0; do | ||||
|       { | ||||
|          for (i=start;i<end;i++) | ||||
|             oldBandE[c*nbEBands+i] = MAX16(backgroundLogE[c*nbEBands+i], oldBandE[c*nbEBands+i] - decay); | ||||
|       } while (++c<C); | ||||
|       seed = st->rng; | ||||
|       for (c=0;c<C;c++) | ||||
|       { | ||||
|  | @ -499,7 +574,7 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|                seed = celt_lcg_rand(seed); | ||||
|                X[boffs+j] = (celt_norm)((opus_int32)seed>>20); | ||||
|             } | ||||
|             renormalise_vector(X+boffs, blen, Q15ONE); | ||||
|             renormalise_vector(X+boffs, blen, Q15ONE, st->arch); | ||||
|          } | ||||
|       } | ||||
|       st->rng = seed; | ||||
|  | @ -509,14 +584,17 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|                DECODE_BUFFER_SIZE-N+(overlap>>1)); | ||||
|       } while (++c<C); | ||||
| 
 | ||||
|       celt_synthesis(mode, X, out_syn, plcLogE, start, effEnd, C, C, 0, LM, st->downsample, 0); | ||||
|       celt_synthesis(mode, X, out_syn, oldBandE, start, effEnd, C, C, 0, LM, st->downsample, 0, st->arch); | ||||
|    } else { | ||||
|       int exc_length; | ||||
|       /* Pitch-based PLC */ | ||||
|       const opus_val16 *window; | ||||
|       opus_val16 *exc; | ||||
|       opus_val16 fade = Q15ONE; | ||||
|       int pitch_index; | ||||
|       VARDECL(opus_val32, etmp); | ||||
|       VARDECL(opus_val16, exc); | ||||
|       VARDECL(opus_val16, _exc); | ||||
|       VARDECL(opus_val16, fir_tmp); | ||||
| 
 | ||||
|       if (loss_count == 0) | ||||
|       { | ||||
|  | @ -526,8 +604,14 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|          fade = QCONST16(.8f,15); | ||||
|       } | ||||
| 
 | ||||
|       /* We want the excitation for 2 pitch periods in order to look for a
 | ||||
|          decaying signal, but we can't get more than MAX_PERIOD. */ | ||||
|       exc_length = IMIN(2*pitch_index, MAX_PERIOD); | ||||
| 
 | ||||
|       ALLOC(etmp, overlap, opus_val32); | ||||
|       ALLOC(exc, MAX_PERIOD, opus_val16); | ||||
|       ALLOC(_exc, MAX_PERIOD+LPC_ORDER, opus_val16); | ||||
|       ALLOC(fir_tmp, exc_length, opus_val16); | ||||
|       exc = _exc+LPC_ORDER; | ||||
|       window = mode->window; | ||||
|       c=0; do { | ||||
|          opus_val16 decay; | ||||
|  | @ -536,13 +620,11 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|          celt_sig *buf; | ||||
|          int extrapolation_offset; | ||||
|          int extrapolation_len; | ||||
|          int exc_length; | ||||
|          int j; | ||||
| 
 | ||||
|          buf = decode_mem[c]; | ||||
|          for (i=0;i<MAX_PERIOD;i++) { | ||||
|             exc[i] = ROUND16(buf[DECODE_BUFFER_SIZE-MAX_PERIOD+i], SIG_SHIFT); | ||||
|          } | ||||
|          for (i=0;i<MAX_PERIOD+LPC_ORDER;i++) | ||||
|             exc[i-LPC_ORDER] = ROUND16(buf[DECODE_BUFFER_SIZE-MAX_PERIOD-LPC_ORDER+i], SIG_SHIFT); | ||||
| 
 | ||||
|          if (loss_count == 0) | ||||
|          { | ||||
|  | @ -568,22 +650,32 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
| #endif | ||||
|             } | ||||
|             _celt_lpc(lpc+c*LPC_ORDER, ac, LPC_ORDER); | ||||
| #ifdef FIXED_POINT | ||||
|          /* For fixed-point, apply bandwidth expansion until we can guarantee that
 | ||||
|             no overflow can happen in the IIR filter. This means: | ||||
|             32768*sum(abs(filter)) < 2^31 */ | ||||
|          while (1) { | ||||
|             opus_val16 tmp=Q15ONE; | ||||
|             opus_val32 sum=QCONST16(1., SIG_SHIFT); | ||||
|             for (i=0;i<LPC_ORDER;i++) | ||||
|                sum += ABS16(lpc[c*LPC_ORDER+i]); | ||||
|             if (sum < 65535) break; | ||||
|             for (i=0;i<LPC_ORDER;i++) | ||||
|             { | ||||
|                tmp = MULT16_16_Q15(QCONST16(.99f,15), tmp); | ||||
|                lpc[c*LPC_ORDER+i] = MULT16_16_Q15(lpc[c*LPC_ORDER+i], tmp); | ||||
|             } | ||||
|          } | ||||
| #endif | ||||
|          } | ||||
|          /* We want the excitation for 2 pitch periods in order to look for a
 | ||||
|             decaying signal, but we can't get more than MAX_PERIOD. */ | ||||
|          exc_length = IMIN(2*pitch_index, MAX_PERIOD); | ||||
|          /* Initialize the LPC history with the samples just before the start
 | ||||
|             of the region for which we're computing the excitation. */ | ||||
|          { | ||||
|             opus_val16 lpc_mem[LPC_ORDER]; | ||||
|             for (i=0;i<LPC_ORDER;i++) | ||||
|             { | ||||
|                lpc_mem[i] = | ||||
|                      ROUND16(buf[DECODE_BUFFER_SIZE-exc_length-1-i], SIG_SHIFT); | ||||
|             } | ||||
|             /* Compute the excitation for exc_length samples before the loss. */ | ||||
|             /* Compute the excitation for exc_length samples before the loss. We need the copy
 | ||||
|                because celt_fir() cannot filter in-place. */ | ||||
|             celt_fir(exc+MAX_PERIOD-exc_length, lpc+c*LPC_ORDER, | ||||
|                   exc+MAX_PERIOD-exc_length, exc_length, LPC_ORDER, lpc_mem); | ||||
|                   fir_tmp, exc_length, LPC_ORDER, st->arch); | ||||
|             OPUS_COPY(exc+MAX_PERIOD-exc_length, fir_tmp, exc_length); | ||||
|          } | ||||
| 
 | ||||
|          /* Check if the waveform is decaying, and if so how fast.
 | ||||
|  | @ -637,9 +729,8 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|             tmp = ROUND16( | ||||
|                   buf[DECODE_BUFFER_SIZE-MAX_PERIOD-N+extrapolation_offset+j], | ||||
|                   SIG_SHIFT); | ||||
|             S1 += SHR32(MULT16_16(tmp, tmp), 8); | ||||
|             S1 += SHR32(MULT16_16(tmp, tmp), 10); | ||||
|          } | ||||
| 
 | ||||
|          { | ||||
|             opus_val16 lpc_mem[LPC_ORDER]; | ||||
|             /* Copy the last decoded samples (prior to the overlap region) to
 | ||||
|  | @ -650,7 +741,11 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|                the signal domain. */ | ||||
|             celt_iir(buf+DECODE_BUFFER_SIZE-N, lpc+c*LPC_ORDER, | ||||
|                   buf+DECODE_BUFFER_SIZE-N, extrapolation_len, LPC_ORDER, | ||||
|                   lpc_mem); | ||||
|                   lpc_mem, st->arch); | ||||
| #ifdef FIXED_POINT | ||||
|             for (i=0; i < extrapolation_len; i++) | ||||
|                buf[DECODE_BUFFER_SIZE-N+i] = SATURATE(buf[DECODE_BUFFER_SIZE-N+i], SIG_SAT); | ||||
| #endif | ||||
|          } | ||||
| 
 | ||||
|          /* Check if the synthesis energy is higher than expected, which can
 | ||||
|  | @ -661,7 +756,7 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|             for (i=0;i<extrapolation_len;i++) | ||||
|             { | ||||
|                opus_val16 tmp = ROUND16(buf[DECODE_BUFFER_SIZE-N+i], SIG_SHIFT); | ||||
|                S2 += SHR32(MULT16_16(tmp, tmp), 8); | ||||
|                S2 += SHR32(MULT16_16(tmp, tmp), 10); | ||||
|             } | ||||
|             /* This checks for an "explosion" in the synthesis. */ | ||||
| #ifdef FIXED_POINT | ||||
|  | @ -698,7 +793,7 @@ static void celt_decode_lost(CELTDecoder * OPUS_RESTRICT st, int N, int LM) | |||
|          comb_filter(etmp, buf+DECODE_BUFFER_SIZE, | ||||
|               st->postfilter_period, st->postfilter_period, overlap, | ||||
|               -st->postfilter_gain, -st->postfilter_gain, | ||||
|               st->postfilter_tapset, st->postfilter_tapset, NULL, 0); | ||||
|               st->postfilter_tapset, st->postfilter_tapset, NULL, 0, st->arch); | ||||
| 
 | ||||
|          /* Simulate TDAC on the concealed audio so that it blends with the
 | ||||
|             MDCT of the next frame. */ | ||||
|  | @ -769,6 +864,7 @@ int celt_decode_with_ec(CELTDecoder * OPUS_RESTRICT st, const unsigned char *dat | |||
|    const opus_int16 *eBands; | ||||
|    ALLOC_STACK; | ||||
| 
 | ||||
|    VALIDATE_CELT_DECODER(st); | ||||
|    mode = st->mode; | ||||
|    nbEBands = mode->nbEBands; | ||||
|    overlap = mode->overlap; | ||||
|  | @ -838,6 +934,10 @@ int celt_decode_with_ec(CELTDecoder * OPUS_RESTRICT st, const unsigned char *dat | |||
|       return frame_size/st->downsample; | ||||
|    } | ||||
| 
 | ||||
|    /* Check if there are at least two packets received consecutively before
 | ||||
|     * turning on the pitch-based PLC */ | ||||
|    st->skip_plc = st->loss_count != 0; | ||||
| 
 | ||||
|    if (dec == NULL) | ||||
|    { | ||||
|       ec_dec_init(&_dec,(unsigned char*)data,len); | ||||
|  | @ -959,7 +1059,7 @@ int celt_decode_with_ec(CELTDecoder * OPUS_RESTRICT st, const unsigned char *dat | |||
|    ALLOC(pulses, nbEBands, int); | ||||
|    ALLOC(fine_priority, nbEBands, int); | ||||
| 
 | ||||
|    codedBands = compute_allocation(mode, start, end, offsets, cap, | ||||
|    codedBands = clt_compute_allocation(mode, start, end, offsets, cap, | ||||
|          alloc_trim, &intensity, &dual_stereo, bits, &balance, pulses, | ||||
|          fine_quant, fine_priority, C, LM, dec, 0, 0, 0); | ||||
| 
 | ||||
|  | @ -982,7 +1082,8 @@ int celt_decode_with_ec(CELTDecoder * OPUS_RESTRICT st, const unsigned char *dat | |||
| 
 | ||||
|    quant_all_bands(0, mode, start, end, X, C==2 ? X+N : NULL, collapse_masks, | ||||
|          NULL, pulses, shortBlocks, spread_decision, dual_stereo, intensity, tf_res, | ||||
|          len*(8<<BITRES)-anti_collapse_rsv, balance, dec, LM, codedBands, &st->rng); | ||||
|          len*(8<<BITRES)-anti_collapse_rsv, balance, dec, LM, codedBands, &st->rng, 0, | ||||
|          st->arch, st->disable_inv); | ||||
| 
 | ||||
|    if (anti_collapse_rsv > 0) | ||||
|    { | ||||
|  | @ -994,7 +1095,7 @@ int celt_decode_with_ec(CELTDecoder * OPUS_RESTRICT st, const unsigned char *dat | |||
| 
 | ||||
|    if (anti_collapse_on) | ||||
|       anti_collapse(mode, X, collapse_masks, LM, C, N, | ||||
|             start, end, oldBandE, oldLogE, oldLogE2, pulses, st->rng); | ||||
|             start, end, oldBandE, oldLogE, oldLogE2, pulses, st->rng, st->arch); | ||||
| 
 | ||||
|    if (silence) | ||||
|    { | ||||
|  | @ -1002,18 +1103,19 @@ int celt_decode_with_ec(CELTDecoder * OPUS_RESTRICT st, const unsigned char *dat | |||
|          oldBandE[i] = -QCONST16(28.f,DB_SHIFT); | ||||
|    } | ||||
| 
 | ||||
|    celt_synthesis(mode, X, out_syn, oldBandE, start, effEnd, C, CC, isTransient, LM, st->downsample, silence); | ||||
|    celt_synthesis(mode, X, out_syn, oldBandE, start, effEnd, | ||||
|                   C, CC, isTransient, LM, st->downsample, silence, st->arch); | ||||
| 
 | ||||
|    c=0; do { | ||||
|       st->postfilter_period=IMAX(st->postfilter_period, COMBFILTER_MINPERIOD); | ||||
|       st->postfilter_period_old=IMAX(st->postfilter_period_old, COMBFILTER_MINPERIOD); | ||||
|       comb_filter(out_syn[c], out_syn[c], st->postfilter_period_old, st->postfilter_period, mode->shortMdctSize, | ||||
|             st->postfilter_gain_old, st->postfilter_gain, st->postfilter_tapset_old, st->postfilter_tapset, | ||||
|             mode->window, overlap); | ||||
|             mode->window, overlap, st->arch); | ||||
|       if (LM!=0) | ||||
|          comb_filter(out_syn[c]+mode->shortMdctSize, out_syn[c]+mode->shortMdctSize, st->postfilter_period, postfilter_pitch, N-mode->shortMdctSize, | ||||
|                st->postfilter_gain, postfilter_gain, st->postfilter_tapset, postfilter_tapset, | ||||
|                mode->window, overlap); | ||||
|                mode->window, overlap, st->arch); | ||||
| 
 | ||||
|    } while (++c<CC); | ||||
|    st->postfilter_period_old = st->postfilter_period; | ||||
|  | @ -1035,10 +1137,18 @@ int celt_decode_with_ec(CELTDecoder * OPUS_RESTRICT st, const unsigned char *dat | |||
|    /* In case start or end were to change */ | ||||
|    if (!isTransient) | ||||
|    { | ||||
|       opus_val16 max_background_increase; | ||||
|       OPUS_COPY(oldLogE2, oldLogE, 2*nbEBands); | ||||
|       OPUS_COPY(oldLogE, oldBandE, 2*nbEBands); | ||||
|       /* In normal circumstances, we only allow the noise floor to increase by
 | ||||
|          up to 2.4 dB/second, but when we're in DTX, we allow up to 6 dB | ||||
|          increase for each update.*/ | ||||
|       if (st->loss_count < 10) | ||||
|          max_background_increase = M*QCONST16(0.001f,DB_SHIFT); | ||||
|       else | ||||
|          max_background_increase = QCONST16(1.f,DB_SHIFT); | ||||
|       for (i=0;i<2*nbEBands;i++) | ||||
|          backgroundLogE[i] = MIN16(backgroundLogE[i] + M*QCONST16(0.001f,DB_SHIFT), oldBandE[i]); | ||||
|          backgroundLogE[i] = MIN16(backgroundLogE[i] + max_background_increase, oldBandE[i]); | ||||
|    } else { | ||||
|       for (i=0;i<2*nbEBands;i++) | ||||
|          oldLogE[i] = MIN16(oldLogE[i], oldBandE[i]); | ||||
|  | @ -1195,6 +1305,7 @@ int opus_custom_decoder_ctl(CELTDecoder * OPUS_RESTRICT st, int request, ...) | |||
|                ((char*)&st->DECODER_RESET_START - (char*)st)); | ||||
|          for (i=0;i<2*st->mode->nbEBands;i++) | ||||
|             oldLogE[i]=oldLogE2[i]=-QCONST16(28.f,DB_SHIFT); | ||||
|          st->skip_plc = 1; | ||||
|       } | ||||
|       break; | ||||
|       case OPUS_GET_PITCH_REQUEST: | ||||
|  | @ -1227,6 +1338,26 @@ int opus_custom_decoder_ctl(CELTDecoder * OPUS_RESTRICT st, int request, ...) | |||
|          *value=st->rng; | ||||
|       } | ||||
|       break; | ||||
|       case OPUS_SET_PHASE_INVERSION_DISABLED_REQUEST: | ||||
|       { | ||||
|           opus_int32 value = va_arg(ap, opus_int32); | ||||
|           if(value<0 || value>1) | ||||
|           { | ||||
|              goto bad_arg; | ||||
|           } | ||||
|           st->disable_inv = value; | ||||
|       } | ||||
|       break; | ||||
|       case OPUS_GET_PHASE_INVERSION_DISABLED_REQUEST: | ||||
|       { | ||||
|           opus_int32 *value = va_arg(ap, opus_int32*); | ||||
|           if (!value) | ||||
|           { | ||||
|              goto bad_arg; | ||||
|           } | ||||
|           *value = st->disable_inv; | ||||
|       } | ||||
|       break; | ||||
|       default: | ||||
|          goto bad_request; | ||||
|    } | ||||
|  |  | |||
							
								
								
									
										2607
									
								
								lib/rbcodec/codecs/libopus/celt/celt_encoder.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										2607
									
								
								lib/rbcodec/codecs/libopus/celt/celt_encoder.c
									
										
									
									
									
										Normal file
									
								
							
										
											
												File diff suppressed because it is too large
												Load diff
											
										
									
								
							|  | @ -49,8 +49,7 @@ int          p | |||
|    float *lpc = _lpc; | ||||
| #endif | ||||
| 
 | ||||
|    for (i = 0; i < p; i++) | ||||
|       lpc[i] = 0; | ||||
|    OPUS_CLEAR(lpc, p); | ||||
|    if (ac[0] != 0) | ||||
|    { | ||||
|       for (i = 0; i < p; i++) { | ||||
|  | @ -88,56 +87,42 @@ int          p | |||
| #endif | ||||
| } | ||||
| 
 | ||||
| void celt_fir(const opus_val16 *_x, | ||||
| 
 | ||||
| void celt_fir_c( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *num, | ||||
|          opus_val16 *_y, | ||||
|          opus_val16 *y, | ||||
|          int N, | ||||
|          int ord, | ||||
|          opus_val16 *mem) | ||||
|          int arch) | ||||
| { | ||||
|    int i,j; | ||||
|    VARDECL(opus_val16, rnum); | ||||
|    VARDECL(opus_val16, x); | ||||
|    SAVE_STACK; | ||||
| 
 | ||||
|    celt_assert(x != y); | ||||
|    ALLOC(rnum, ord, opus_val16); | ||||
|    ALLOC(x, N+ord, opus_val16); | ||||
|    for(i=0;i<ord;i++) | ||||
|       rnum[i] = num[ord-i-1]; | ||||
|    for(i=0;i<ord;i++) | ||||
|       x[i] = mem[ord-i-1]; | ||||
|    for (i=0;i<N;i++) | ||||
|       x[i+ord]=_x[i]; | ||||
|    for(i=0;i<ord;i++) | ||||
|       mem[i] = _x[N-i-1]; | ||||
| #ifdef SMALL_FOOTPRINT | ||||
|    for (i=0;i<N;i++) | ||||
|    { | ||||
|       opus_val32 sum = SHL32(EXTEND32(_x[i]), SIG_SHIFT); | ||||
|       for (j=0;j<ord;j++) | ||||
|       { | ||||
|          sum = MAC16_16(sum,rnum[j],x[i+j]); | ||||
|       } | ||||
|       _y[i] = SATURATE16(PSHR32(sum, SIG_SHIFT)); | ||||
|    } | ||||
| #else | ||||
|    for (i=0;i<N-3;i+=4) | ||||
|    { | ||||
|       opus_val32 sum[4]={0,0,0,0}; | ||||
|       xcorr_kernel(rnum, x+i, sum, ord); | ||||
|       _y[i  ] = SATURATE16(ADD32(EXTEND32(_x[i  ]), PSHR32(sum[0], SIG_SHIFT))); | ||||
|       _y[i+1] = SATURATE16(ADD32(EXTEND32(_x[i+1]), PSHR32(sum[1], SIG_SHIFT))); | ||||
|       _y[i+2] = SATURATE16(ADD32(EXTEND32(_x[i+2]), PSHR32(sum[2], SIG_SHIFT))); | ||||
|       _y[i+3] = SATURATE16(ADD32(EXTEND32(_x[i+3]), PSHR32(sum[3], SIG_SHIFT))); | ||||
|       opus_val32 sum[4]; | ||||
|       sum[0] = SHL32(EXTEND32(x[i  ]), SIG_SHIFT); | ||||
|       sum[1] = SHL32(EXTEND32(x[i+1]), SIG_SHIFT); | ||||
|       sum[2] = SHL32(EXTEND32(x[i+2]), SIG_SHIFT); | ||||
|       sum[3] = SHL32(EXTEND32(x[i+3]), SIG_SHIFT); | ||||
|       xcorr_kernel(rnum, x+i-ord, sum, ord, arch); | ||||
|       y[i  ] = ROUND16(sum[0], SIG_SHIFT); | ||||
|       y[i+1] = ROUND16(sum[1], SIG_SHIFT); | ||||
|       y[i+2] = ROUND16(sum[2], SIG_SHIFT); | ||||
|       y[i+3] = ROUND16(sum[3], SIG_SHIFT); | ||||
|    } | ||||
|    for (;i<N;i++) | ||||
|    { | ||||
|       opus_val32 sum = 0; | ||||
|       opus_val32 sum = SHL32(EXTEND32(x[i]), SIG_SHIFT); | ||||
|       for (j=0;j<ord;j++) | ||||
|          sum = MAC16_16(sum,rnum[j],x[i+j]); | ||||
|       _y[i] = SATURATE16(ADD32(EXTEND32(_x[i]), PSHR32(sum, SIG_SHIFT))); | ||||
|          sum = MAC16_16(sum,rnum[j],x[i+j-ord]); | ||||
|       y[i] = ROUND16(sum, SIG_SHIFT); | ||||
|    } | ||||
| #endif | ||||
|    RESTORE_STACK; | ||||
| } | ||||
| 
 | ||||
|  | @ -146,10 +131,12 @@ void celt_iir(const opus_val32 *_x, | |||
|          opus_val32 *_y, | ||||
|          int N, | ||||
|          int ord, | ||||
|          opus_val16 *mem) | ||||
|          opus_val16 *mem, | ||||
|          int arch) | ||||
| { | ||||
| #ifdef SMALL_FOOTPRINT | ||||
|    int i,j; | ||||
|    (void)arch; | ||||
|    for (i=0;i<N;i++) | ||||
|    { | ||||
|       opus_val32 sum = _x[i]; | ||||
|  | @ -161,7 +148,7 @@ void celt_iir(const opus_val32 *_x, | |||
|       { | ||||
|          mem[j]=mem[j-1]; | ||||
|       } | ||||
|       mem[0] = ROUND16(sum,SIG_SHIFT); | ||||
|       mem[0] = SROUND16(sum, SIG_SHIFT); | ||||
|       _y[i] = sum; | ||||
|    } | ||||
| #else | ||||
|  | @ -187,23 +174,23 @@ void celt_iir(const opus_val32 *_x, | |||
|       sum[1]=_x[i+1]; | ||||
|       sum[2]=_x[i+2]; | ||||
|       sum[3]=_x[i+3]; | ||||
|       xcorr_kernel(rden, y+i, sum, ord); | ||||
|       xcorr_kernel(rden, y+i, sum, ord, arch); | ||||
| 
 | ||||
|       /* Patch up the result to compensate for the fact that this is an IIR */ | ||||
|       y[i+ord  ] = -ROUND16(sum[0],SIG_SHIFT); | ||||
|       y[i+ord  ] = -SROUND16(sum[0],SIG_SHIFT); | ||||
|       _y[i  ] = sum[0]; | ||||
|       sum[1] = MAC16_16(sum[1], y[i+ord  ], den[0]); | ||||
|       y[i+ord+1] = -ROUND16(sum[1],SIG_SHIFT); | ||||
|       y[i+ord+1] = -SROUND16(sum[1],SIG_SHIFT); | ||||
|       _y[i+1] = sum[1]; | ||||
|       sum[2] = MAC16_16(sum[2], y[i+ord+1], den[0]); | ||||
|       sum[2] = MAC16_16(sum[2], y[i+ord  ], den[1]); | ||||
|       y[i+ord+2] = -ROUND16(sum[2],SIG_SHIFT); | ||||
|       y[i+ord+2] = -SROUND16(sum[2],SIG_SHIFT); | ||||
|       _y[i+2] = sum[2]; | ||||
| 
 | ||||
|       sum[3] = MAC16_16(sum[3], y[i+ord+2], den[0]); | ||||
|       sum[3] = MAC16_16(sum[3], y[i+ord+1], den[1]); | ||||
|       sum[3] = MAC16_16(sum[3], y[i+ord  ], den[2]); | ||||
|       y[i+ord+3] = -ROUND16(sum[3],SIG_SHIFT); | ||||
|       y[i+ord+3] = -SROUND16(sum[3],SIG_SHIFT); | ||||
|       _y[i+3] = sum[3]; | ||||
|    } | ||||
|    for (;i<N;i++) | ||||
|  | @ -211,7 +198,7 @@ void celt_iir(const opus_val32 *_x, | |||
|       opus_val32 sum = _x[i]; | ||||
|       for (j=0;j<ord;j++) | ||||
|          sum -= MULT16_16(rden[j],y[i+j]); | ||||
|       y[i+ord] = ROUND16(sum,SIG_SHIFT); | ||||
|       y[i+ord] = SROUND16(sum,SIG_SHIFT); | ||||
|       _y[i] = sum; | ||||
|    } | ||||
|    for(i=0;i<ord;i++) | ||||
|  |  | |||
|  | @ -29,24 +29,36 @@ | |||
| #define PLC_H | ||||
| 
 | ||||
| #include "arch.h" | ||||
| #include "cpu_support.h" | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE4_1) | ||||
| #include "x86/celt_lpc_sse.h" | ||||
| #endif | ||||
| 
 | ||||
| #define LPC_ORDER 24 | ||||
| 
 | ||||
| void _celt_lpc(opus_val16 *_lpc, const opus_val32 *ac, int p); | ||||
| 
 | ||||
| void celt_fir(const opus_val16 *x, | ||||
| void celt_fir_c( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *num, | ||||
|          opus_val16 *y, | ||||
|          int N, | ||||
|          int ord, | ||||
|          opus_val16 *mem); | ||||
|          int arch); | ||||
| 
 | ||||
| #if !defined(OVERRIDE_CELT_FIR) | ||||
| #define celt_fir(x, num, y, N, ord, arch) \ | ||||
|     (celt_fir_c(x, num, y, N, ord, arch)) | ||||
| #endif | ||||
| 
 | ||||
| void celt_iir(const opus_val32 *x, | ||||
|          const opus_val16 *den, | ||||
|          opus_val32 *y, | ||||
|          int N, | ||||
|          int ord, | ||||
|          opus_val16 *mem); | ||||
|          opus_val16 *mem, | ||||
|          int arch); | ||||
| 
 | ||||
| int _celt_autocorr(const opus_val16 *x, opus_val32 *ac, | ||||
|          const opus_val16 *window, int overlap, int lag, int n, int arch); | ||||
|  |  | |||
|  | @ -31,7 +31,8 @@ | |||
| #include "opus_types.h" | ||||
| #include "opus_defines.h" | ||||
| 
 | ||||
| #if defined(OPUS_HAVE_RTCD) && defined(OPUS_ARM_ASM) | ||||
| #if defined(OPUS_HAVE_RTCD) && \ | ||||
|   (defined(OPUS_ARM_ASM) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR)) | ||||
| #include "arm/armcpu.h" | ||||
| 
 | ||||
| /* We currently support 4 ARM variants:
 | ||||
|  | @ -42,6 +43,22 @@ | |||
|  */ | ||||
| #define OPUS_ARCHMASK 3 | ||||
| 
 | ||||
| #elif (defined(OPUS_X86_MAY_HAVE_SSE) && !defined(OPUS_X86_PRESUME_SSE)) || \ | ||||
|   (defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(OPUS_X86_PRESUME_SSE2)) || \ | ||||
|   (defined(OPUS_X86_MAY_HAVE_SSE4_1) && !defined(OPUS_X86_PRESUME_SSE4_1)) || \ | ||||
|   (defined(OPUS_X86_MAY_HAVE_AVX) && !defined(OPUS_X86_PRESUME_AVX)) | ||||
| 
 | ||||
| #include "x86/x86cpu.h" | ||||
| /* We currently support 5 x86 variants:
 | ||||
|  * arch[0] -> non-sse | ||||
|  * arch[1] -> sse | ||||
|  * arch[2] -> sse2 | ||||
|  * arch[3] -> sse4.1 | ||||
|  * arch[4] -> avx | ||||
|  */ | ||||
| #define OPUS_ARCHMASK 7 | ||||
| int opus_select_arch(void); | ||||
| 
 | ||||
| #else | ||||
| #define OPUS_ARCHMASK 0 | ||||
| 
 | ||||
|  | @ -50,5 +67,4 @@ static OPUS_INLINE int opus_select_arch(void) | |||
|   return 0; | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
|  |  | |||
|  | @ -74,7 +74,7 @@ int log2_frac(opus_uint32 val, int frac) | |||
| /*Although derived separately, the pulse vector coding scheme is equivalent to
 | ||||
|    a Pyramid Vector Quantizer \cite{Fis86}. | ||||
|   Some additional notes about an early version appear at | ||||
|    http://people.xiph.org/~tterribe/notes/cwrs.html, but the codebook ordering
 | ||||
|    https://people.xiph.org/~tterribe/notes/cwrs.html, but the codebook ordering
 | ||||
|    and the definitions of some terms have evolved since that was written. | ||||
| 
 | ||||
|   The conversion from a pulse vector to an integer index (encoding) and back | ||||
|  | @ -210,7 +210,7 @@ int log2_frac(opus_uint32 val, int frac) | |||
| #if defined(CUSTOM_MODES) | ||||
| static const opus_uint32 CELT_PVQ_U_DATA[1488]={ | ||||
| #else | ||||
| static const opus_uint32 CELT_PVQ_U_DATA[1272] ICONST_ATTR ={ | ||||
| static const opus_uint32 CELT_PVQ_U_DATA[1272]={ | ||||
| #endif | ||||
|   /*N=0, K=0...176:*/ | ||||
|   1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
|  | @ -418,7 +418,7 @@ static const opus_uint32 *const CELT_PVQ_U_ROW[15]={ | |||
|   CELT_PVQ_U_DATA+1464,CELT_PVQ_U_DATA+1470,CELT_PVQ_U_DATA+1473 | ||||
| }; | ||||
| #else | ||||
| static const opus_uint32 *const CELT_PVQ_U_ROW[15] ICONST_ATTR ={ | ||||
| static const opus_uint32 *const CELT_PVQ_U_ROW[15]={ | ||||
|   CELT_PVQ_U_DATA+   0,CELT_PVQ_U_DATA+ 176,CELT_PVQ_U_DATA+ 351, | ||||
|   CELT_PVQ_U_DATA+ 525,CELT_PVQ_U_DATA+ 698,CELT_PVQ_U_DATA+ 870, | ||||
|   CELT_PVQ_U_DATA+1041,CELT_PVQ_U_DATA+1131,CELT_PVQ_U_DATA+1178, | ||||
|  | @ -482,7 +482,7 @@ static opus_val32 cwrsi(int _n,int _k,opus_uint32 _i,int *_y){ | |||
|       k0=_k; | ||||
|       q=row[_n]; | ||||
|       if(q>_i){ | ||||
|         celt_assert(p>q); | ||||
|         celt_sig_assert(p>q); | ||||
|         _k=_n; | ||||
|         do p=CELT_PVQ_U_ROW[--_k][_n]; | ||||
|         while(p>_i); | ||||
|  |  | |||
							
								
								
									
										32
									
								
								lib/rbcodec/codecs/libopus/celt/dump_modes/Makefile
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										32
									
								
								lib/rbcodec/codecs/libopus/celt/dump_modes/Makefile
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,32 @@ | |||
| 
 | ||||
| CFLAGS=-O2 -Wall -Wextra -DHAVE_CONFIG_H | ||||
| INCLUDES=-I. -I../ -I../.. -I../../include | ||||
| 
 | ||||
| SOURCES = dump_modes.c \
 | ||||
|           ../modes.c \
 | ||||
|           ../cwrs.c \
 | ||||
|           ../rate.c \
 | ||||
|           ../entcode.c \
 | ||||
|           ../entenc.c \
 | ||||
|           ../entdec.c \
 | ||||
|           ../mathops.c \
 | ||||
|           ../mdct.c \
 | ||||
|           ../kiss_fft.c | ||||
| 
 | ||||
| ifdef HAVE_ARM_NE10 | ||||
| CC = gcc | ||||
| CFLAGS += -mfpu=neon | ||||
| INCLUDES += -I$(NE10_INCDIR) -DHAVE_ARM_NE10 -DOPUS_ARM_PRESUME_NEON_INTR | ||||
| LIBS = -L$(NE10_LIBDIR) -lNE10 | ||||
| SOURCES += ../arm/celt_ne10_fft.c \
 | ||||
|            dump_modes_arm_ne10.c \
 | ||||
|            ../arm/armcpu.c | ||||
| endif | ||||
| 
 | ||||
| all: dump_modes | ||||
| 
 | ||||
| dump_modes: | ||||
| 	$(PREFIX)$(CC) $(CFLAGS) $(INCLUDES) -DCUSTOM_MODES_ONLY -DCUSTOM_MODES $(SOURCES) -o $@ $(LIBS) -lm | ||||
| 
 | ||||
| clean: | ||||
| 	rm -f dump_modes | ||||
							
								
								
									
										353
									
								
								lib/rbcodec/codecs/libopus/celt/dump_modes/dump_modes.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										353
									
								
								lib/rbcodec/codecs/libopus/celt/dump_modes/dump_modes.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,353 @@ | |||
| /* Copyright (c) 2008 CSIRO
 | ||||
|    Copyright (c) 2008-2009 Xiph.Org Foundation | ||||
|    Written by Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <stdlib.h> | ||||
| #include <stdio.h> | ||||
| #include "modes.h" | ||||
| #include "celt.h" | ||||
| #include "rate.h" | ||||
| #include "dump_modes_arch.h" | ||||
| 
 | ||||
| #define INT16 "%d" | ||||
| #define INT32 "%d" | ||||
| #define FLOAT "%#0.8gf" | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
| #define WORD16 INT16 | ||||
| #define WORD32 INT32 | ||||
| #else | ||||
| #define WORD16 FLOAT | ||||
| #define WORD32 FLOAT | ||||
| #endif | ||||
| 
 | ||||
| void dump_modes(FILE *file, CELTMode **modes, int nb_modes) | ||||
| { | ||||
|    int i, j, k; | ||||
|    int mdct_twiddles_size; | ||||
|    fprintf(file, "/* The contents of this file was automatically generated by dump_modes.c\n"); | ||||
|    fprintf(file, "   with arguments:"); | ||||
|    for (i=0;i<nb_modes;i++) | ||||
|    { | ||||
|       CELTMode *mode = modes[i]; | ||||
|       fprintf(file, " %d %d",mode->Fs,mode->shortMdctSize*mode->nbShortMdcts); | ||||
|    } | ||||
|    fprintf(file, "\n   It contains static definitions for some pre-defined modes. */\n"); | ||||
|    fprintf(file, "#include \"modes.h\"\n"); | ||||
|    fprintf(file, "#include \"rate.h\"\n"); | ||||
|    fprintf(file, "\n#ifdef HAVE_ARM_NE10\n"); | ||||
|    fprintf(file, "#define OVERRIDE_FFT 1\n"); | ||||
|    fprintf(file, "#include \"%s\"\n", ARM_NE10_ARCH_FILE_NAME); | ||||
|    fprintf(file, "#endif\n"); | ||||
| 
 | ||||
|    fprintf(file, "\n"); | ||||
| 
 | ||||
|    for (i=0;i<nb_modes;i++) | ||||
|    { | ||||
|       CELTMode *mode = modes[i]; | ||||
|       int mdctSize; | ||||
|       int standard, framerate; | ||||
| 
 | ||||
|       mdctSize = mode->shortMdctSize*mode->nbShortMdcts; | ||||
|       standard = (mode->Fs == 400*(opus_int32)mode->shortMdctSize); | ||||
|       framerate = mode->Fs/mode->shortMdctSize; | ||||
| 
 | ||||
|       if (!standard) | ||||
|       { | ||||
|          fprintf(file, "#ifndef DEF_EBANDS%d_%d\n", mode->Fs, mdctSize); | ||||
|          fprintf(file, "#define DEF_EBANDS%d_%d\n", mode->Fs, mdctSize); | ||||
|          fprintf (file, "static const opus_int16 eBands%d_%d[%d] = {\n", mode->Fs, mdctSize, mode->nbEBands+2); | ||||
|          for (j=0;j<mode->nbEBands+2;j++) | ||||
|             fprintf (file, "%d, ", mode->eBands[j]); | ||||
|          fprintf (file, "};\n"); | ||||
|          fprintf(file, "#endif\n"); | ||||
|          fprintf(file, "\n"); | ||||
|       } | ||||
| 
 | ||||
|       fprintf(file, "#ifndef DEF_WINDOW%d\n", mode->overlap); | ||||
|       fprintf(file, "#define DEF_WINDOW%d\n", mode->overlap); | ||||
|       fprintf (file, "static const opus_val16 window%d[%d] = {\n", mode->overlap, mode->overlap); | ||||
|       for (j=0;j<mode->overlap;j++) | ||||
|          fprintf (file, WORD16 ",%c", mode->window[j],(j+6)%5==0?'\n':' '); | ||||
|       fprintf (file, "};\n"); | ||||
|       fprintf(file, "#endif\n"); | ||||
|       fprintf(file, "\n"); | ||||
| 
 | ||||
|       if (!standard) | ||||
|       { | ||||
|          fprintf(file, "#ifndef DEF_ALLOC_VECTORS%d_%d\n", mode->Fs, mdctSize); | ||||
|          fprintf(file, "#define DEF_ALLOC_VECTORS%d_%d\n", mode->Fs, mdctSize); | ||||
|          fprintf (file, "static const unsigned char allocVectors%d_%d[%d] = {\n", mode->Fs, mdctSize, mode->nbEBands*mode->nbAllocVectors); | ||||
|          for (j=0;j<mode->nbAllocVectors;j++) | ||||
|          { | ||||
|             for (k=0;k<mode->nbEBands;k++) | ||||
|                fprintf (file, "%2d, ", mode->allocVectors[j*mode->nbEBands+k]); | ||||
|             fprintf (file, "\n"); | ||||
|          } | ||||
|          fprintf (file, "};\n"); | ||||
|          fprintf(file, "#endif\n"); | ||||
|          fprintf(file, "\n"); | ||||
|       } | ||||
| 
 | ||||
|       fprintf(file, "#ifndef DEF_LOGN%d\n", framerate); | ||||
|       fprintf(file, "#define DEF_LOGN%d\n", framerate); | ||||
|       fprintf (file, "static const opus_int16 logN%d[%d] = {\n", framerate, mode->nbEBands); | ||||
|       for (j=0;j<mode->nbEBands;j++) | ||||
|          fprintf (file, "%d, ", mode->logN[j]); | ||||
|       fprintf (file, "};\n"); | ||||
|       fprintf(file, "#endif\n"); | ||||
|       fprintf(file, "\n"); | ||||
| 
 | ||||
|       /* Pulse cache */ | ||||
|       fprintf(file, "#ifndef DEF_PULSE_CACHE%d\n", mode->Fs/mdctSize); | ||||
|       fprintf(file, "#define DEF_PULSE_CACHE%d\n", mode->Fs/mdctSize); | ||||
|       fprintf (file, "static const opus_int16 cache_index%d[%d] = {\n", mode->Fs/mdctSize, (mode->maxLM+2)*mode->nbEBands); | ||||
|       for (j=0;j<mode->nbEBands*(mode->maxLM+2);j++) | ||||
|          fprintf (file, "%d,%c", mode->cache.index[j],(j+16)%15==0?'\n':' '); | ||||
|       fprintf (file, "};\n"); | ||||
|       fprintf (file, "static const unsigned char cache_bits%d[%d] = {\n", mode->Fs/mdctSize, mode->cache.size); | ||||
|       for (j=0;j<mode->cache.size;j++) | ||||
|          fprintf (file, "%d,%c", mode->cache.bits[j],(j+16)%15==0?'\n':' '); | ||||
|       fprintf (file, "};\n"); | ||||
|       fprintf (file, "static const unsigned char cache_caps%d[%d] = {\n", mode->Fs/mdctSize, (mode->maxLM+1)*2*mode->nbEBands); | ||||
|       for (j=0;j<(mode->maxLM+1)*2*mode->nbEBands;j++) | ||||
|          fprintf (file, "%d,%c", mode->cache.caps[j],(j+16)%15==0?'\n':' '); | ||||
|       fprintf (file, "};\n"); | ||||
| 
 | ||||
|       fprintf(file, "#endif\n"); | ||||
|       fprintf(file, "\n"); | ||||
| 
 | ||||
|       /* FFT twiddles */ | ||||
|       fprintf(file, "#ifndef FFT_TWIDDLES%d_%d\n", mode->Fs, mdctSize); | ||||
|       fprintf(file, "#define FFT_TWIDDLES%d_%d\n", mode->Fs, mdctSize); | ||||
|       fprintf (file, "static const kiss_twiddle_cpx fft_twiddles%d_%d[%d] = {\n", | ||||
|             mode->Fs, mdctSize, mode->mdct.kfft[0]->nfft); | ||||
|       for (j=0;j<mode->mdct.kfft[0]->nfft;j++) | ||||
|          fprintf (file, "{" WORD16 ", " WORD16 "},%c", mode->mdct.kfft[0]->twiddles[j].r, mode->mdct.kfft[0]->twiddles[j].i,(j+3)%2==0?'\n':' '); | ||||
|       fprintf (file, "};\n"); | ||||
| 
 | ||||
| #ifdef OVERRIDE_FFT | ||||
|       dump_mode_arch(mode); | ||||
| #endif | ||||
|       /* FFT Bitrev tables */ | ||||
|       for (k=0;k<=mode->mdct.maxshift;k++) | ||||
|       { | ||||
|          fprintf(file, "#ifndef FFT_BITREV%d\n", mode->mdct.kfft[k]->nfft); | ||||
|          fprintf(file, "#define FFT_BITREV%d\n", mode->mdct.kfft[k]->nfft); | ||||
|          fprintf (file, "static const opus_int16 fft_bitrev%d[%d] = {\n", | ||||
|                mode->mdct.kfft[k]->nfft, mode->mdct.kfft[k]->nfft); | ||||
|          for (j=0;j<mode->mdct.kfft[k]->nfft;j++) | ||||
|             fprintf (file, "%d,%c", mode->mdct.kfft[k]->bitrev[j],(j+16)%15==0?'\n':' '); | ||||
|          fprintf (file, "};\n"); | ||||
| 
 | ||||
|          fprintf(file, "#endif\n"); | ||||
|          fprintf(file, "\n"); | ||||
|       } | ||||
| 
 | ||||
|       /* FFT States */ | ||||
|       for (k=0;k<=mode->mdct.maxshift;k++) | ||||
|       { | ||||
|          fprintf(file, "#ifndef FFT_STATE%d_%d_%d\n", mode->Fs, mdctSize, k); | ||||
|          fprintf(file, "#define FFT_STATE%d_%d_%d\n", mode->Fs, mdctSize, k); | ||||
|          fprintf (file, "static const kiss_fft_state fft_state%d_%d_%d = {\n", | ||||
|                mode->Fs, mdctSize, k); | ||||
|          fprintf (file, "%d,    /* nfft */\n", mode->mdct.kfft[k]->nfft); | ||||
|          fprintf (file, WORD16 ",    /* scale */\n", mode->mdct.kfft[k]->scale); | ||||
| #ifdef FIXED_POINT | ||||
|          fprintf (file, "%d,    /* scale_shift */\n", mode->mdct.kfft[k]->scale_shift); | ||||
| #endif | ||||
|          fprintf (file, "%d,    /* shift */\n", mode->mdct.kfft[k]->shift); | ||||
|          fprintf (file, "{"); | ||||
|          for (j=0;j<2*MAXFACTORS;j++) | ||||
|             fprintf (file, "%d, ", mode->mdct.kfft[k]->factors[j]); | ||||
|          fprintf (file, "},    /* factors */\n"); | ||||
|          fprintf (file, "fft_bitrev%d,    /* bitrev */\n", mode->mdct.kfft[k]->nfft); | ||||
|          fprintf (file, "fft_twiddles%d_%d,    /* bitrev */\n", mode->Fs, mdctSize); | ||||
| 
 | ||||
|          fprintf (file, "#ifdef OVERRIDE_FFT\n"); | ||||
|          fprintf (file, "(arch_fft_state *)&cfg_arch_%d,\n", mode->mdct.kfft[k]->nfft); | ||||
|          fprintf (file, "#else\n"); | ||||
|          fprintf (file, "NULL,\n"); | ||||
|          fprintf(file, "#endif\n"); | ||||
| 
 | ||||
|          fprintf (file, "};\n"); | ||||
| 
 | ||||
|          fprintf(file, "#endif\n"); | ||||
|          fprintf(file, "\n"); | ||||
|       } | ||||
| 
 | ||||
|       fprintf(file, "#endif\n"); | ||||
|       fprintf(file, "\n"); | ||||
| 
 | ||||
|       /* MDCT twiddles */ | ||||
|       mdct_twiddles_size = mode->mdct.n-(mode->mdct.n/2>>mode->mdct.maxshift); | ||||
|       fprintf(file, "#ifndef MDCT_TWIDDLES%d\n", mdctSize); | ||||
|       fprintf(file, "#define MDCT_TWIDDLES%d\n", mdctSize); | ||||
|       fprintf (file, "static const opus_val16 mdct_twiddles%d[%d] = {\n", | ||||
|             mdctSize, mdct_twiddles_size); | ||||
|       for (j=0;j<mdct_twiddles_size;j++) | ||||
|          fprintf (file, WORD16 ",%c", mode->mdct.trig[j],(j+6)%5==0?'\n':' '); | ||||
|       fprintf (file, "};\n"); | ||||
| 
 | ||||
|       fprintf(file, "#endif\n"); | ||||
|       fprintf(file, "\n"); | ||||
| 
 | ||||
| 
 | ||||
|       /* Print the actual mode data */ | ||||
|       fprintf(file, "static const CELTMode mode%d_%d_%d = {\n", mode->Fs, mdctSize, mode->overlap); | ||||
|       fprintf(file, INT32 ",    /* Fs */\n", mode->Fs); | ||||
|       fprintf(file, "%d,    /* overlap */\n", mode->overlap); | ||||
|       fprintf(file, "%d,    /* nbEBands */\n", mode->nbEBands); | ||||
|       fprintf(file, "%d,    /* effEBands */\n", mode->effEBands); | ||||
|       fprintf(file, "{"); | ||||
|       for (j=0;j<4;j++) | ||||
|          fprintf(file, WORD16 ", ", mode->preemph[j]); | ||||
|       fprintf(file, "},    /* preemph */\n"); | ||||
|       if (standard) | ||||
|          fprintf(file, "eband5ms,    /* eBands */\n"); | ||||
|       else | ||||
|          fprintf(file, "eBands%d_%d,    /* eBands */\n", mode->Fs, mdctSize); | ||||
| 
 | ||||
|       fprintf(file, "%d,    /* maxLM */\n", mode->maxLM); | ||||
|       fprintf(file, "%d,    /* nbShortMdcts */\n", mode->nbShortMdcts); | ||||
|       fprintf(file, "%d,    /* shortMdctSize */\n", mode->shortMdctSize); | ||||
| 
 | ||||
|       fprintf(file, "%d,    /* nbAllocVectors */\n", mode->nbAllocVectors); | ||||
|       if (standard) | ||||
|          fprintf(file, "band_allocation,    /* allocVectors */\n"); | ||||
|       else | ||||
|          fprintf(file, "allocVectors%d_%d,    /* allocVectors */\n", mode->Fs, mdctSize); | ||||
| 
 | ||||
|       fprintf(file, "logN%d,    /* logN */\n", framerate); | ||||
|       fprintf(file, "window%d,    /* window */\n", mode->overlap); | ||||
|       fprintf(file, "{%d, %d, {", mode->mdct.n, mode->mdct.maxshift); | ||||
|       for (k=0;k<=mode->mdct.maxshift;k++) | ||||
|          fprintf(file, "&fft_state%d_%d_%d, ", mode->Fs, mdctSize, k); | ||||
|       fprintf (file, "}, mdct_twiddles%d},    /* mdct */\n", mdctSize); | ||||
| 
 | ||||
|       fprintf(file, "{%d, cache_index%d, cache_bits%d, cache_caps%d},    /* cache */\n", | ||||
|             mode->cache.size, mode->Fs/mdctSize, mode->Fs/mdctSize, mode->Fs/mdctSize); | ||||
|       fprintf(file, "};\n"); | ||||
|    } | ||||
|    fprintf(file, "\n"); | ||||
|    fprintf(file, "/* List of all the available modes */\n"); | ||||
|    fprintf(file, "#define TOTAL_MODES %d\n", nb_modes); | ||||
|    fprintf(file, "static const CELTMode * const static_mode_list[TOTAL_MODES] = {\n"); | ||||
|    for (i=0;i<nb_modes;i++) | ||||
|    { | ||||
|       CELTMode *mode = modes[i]; | ||||
|       int mdctSize; | ||||
|       mdctSize = mode->shortMdctSize*mode->nbShortMdcts; | ||||
|       fprintf(file, "&mode%d_%d_%d,\n", mode->Fs, mdctSize, mode->overlap); | ||||
|    } | ||||
|    fprintf(file, "};\n"); | ||||
| } | ||||
| 
 | ||||
| void dump_header(FILE *file, CELTMode **modes, int nb_modes) | ||||
| { | ||||
|    int i; | ||||
|    int channels = 0; | ||||
|    int frame_size = 0; | ||||
|    int overlap = 0; | ||||
|    fprintf (file, "/* This header file is generated automatically*/\n"); | ||||
|    for (i=0;i<nb_modes;i++) | ||||
|    { | ||||
|       CELTMode *mode = modes[i]; | ||||
|       if (frame_size==0) | ||||
|          frame_size = mode->shortMdctSize*mode->nbShortMdcts; | ||||
|       else if (frame_size != mode->shortMdctSize*mode->nbShortMdcts) | ||||
|          frame_size = -1; | ||||
|       if (overlap==0) | ||||
|          overlap = mode->overlap; | ||||
|       else if (overlap != mode->overlap) | ||||
|          overlap = -1; | ||||
|    } | ||||
|    if (channels>0) | ||||
|    { | ||||
|       fprintf (file, "#define CHANNELS(mode) %d\n", channels); | ||||
|       if (channels==1) | ||||
|          fprintf (file, "#define DISABLE_STEREO\n"); | ||||
|    } | ||||
|    if (frame_size>0) | ||||
|    { | ||||
|       fprintf (file, "#define FRAMESIZE(mode) %d\n", frame_size); | ||||
|    } | ||||
|    if (overlap>0) | ||||
|    { | ||||
|       fprintf (file, "#define OVERLAP(mode) %d\n", overlap); | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
| #define BASENAME "static_modes_fixed" | ||||
| #else | ||||
| #define BASENAME "static_modes_float" | ||||
| #endif | ||||
| 
 | ||||
| int main(int argc, char **argv) | ||||
| { | ||||
|    int i, nb; | ||||
|    FILE *file; | ||||
|    CELTMode **m; | ||||
|    if (argc%2 != 1 || argc<3) | ||||
|    { | ||||
|       fprintf (stderr, "Usage: %s rate frame_size [rate frame_size] [rate frame_size]...\n",argv[0]); | ||||
|       return 1; | ||||
|    } | ||||
|    nb = (argc-1)/2; | ||||
|    m = malloc(nb*sizeof(CELTMode*)); | ||||
|    for (i=0;i<nb;i++) | ||||
|    { | ||||
|       int Fs, frame; | ||||
|       Fs      = atoi(argv[2*i+1]); | ||||
|       frame   = atoi(argv[2*i+2]); | ||||
|       m[i] = opus_custom_mode_create(Fs, frame, NULL); | ||||
|       if (m[i]==NULL) | ||||
|       { | ||||
|          fprintf(stderr,"Error creating mode with Fs=%s, frame_size=%s\n", | ||||
|                argv[2*i+1],argv[2*i+2]); | ||||
|          return EXIT_FAILURE; | ||||
|       } | ||||
|    } | ||||
|    file = fopen(BASENAME ".h", "w"); | ||||
| #ifdef OVERRIDE_FFT | ||||
|    dump_modes_arch_init(m, nb); | ||||
| #endif | ||||
|    dump_modes(file, m, nb); | ||||
|    fclose(file); | ||||
| #ifdef OVERRIDE_FFT | ||||
|    dump_modes_arch_finalize(); | ||||
| #endif | ||||
|    for (i=0;i<nb;i++) | ||||
|       opus_custom_mode_destroy(m[i]); | ||||
|    free(m); | ||||
|    return 0; | ||||
| } | ||||
							
								
								
									
										45
									
								
								lib/rbcodec/codecs/libopus/celt/dump_modes/dump_modes_arch.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										45
									
								
								lib/rbcodec/codecs/libopus/celt/dump_modes/dump_modes_arch.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,45 @@ | |||
| /* Copyright (c) 2015 Xiph.Org Foundation
 | ||||
|    Written by Viswanath Puttagunta */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef DUMP_MODE_ARCH_H | ||||
| #define DUMP_MODE_ARCH_H | ||||
| 
 | ||||
| void dump_modes_arch_init(); | ||||
| void dump_mode_arch(CELTMode *mode); | ||||
| void dump_modes_arch_finalize(); | ||||
| 
 | ||||
| #if !defined(FIXED_POINT) | ||||
| #define ARM_NE10_ARCH_FILE_NAME "static_modes_float_arm_ne10.h" | ||||
| #else | ||||
| #define ARM_NE10_ARCH_FILE_NAME "static_modes_fixed_arm_ne10.h" | ||||
| #endif | ||||
| 
 | ||||
| #if defined(HAVE_ARM_NE10) | ||||
| #define OVERRIDE_FFT (1) | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										152
									
								
								lib/rbcodec/codecs/libopus/celt/dump_modes/dump_modes_arm_ne10.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										152
									
								
								lib/rbcodec/codecs/libopus/celt/dump_modes/dump_modes_arm_ne10.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,152 @@ | |||
| /* Copyright (c) 2015 Xiph.Org Foundation
 | ||||
|    Written by Viswanath Puttagunta */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #if defined(HAVE_CONFIG_H) | ||||
| # include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <stdio.h> | ||||
| #include <stdlib.h> | ||||
| #include "modes.h" | ||||
| #include "dump_modes_arch.h" | ||||
| #include <NE10_dsp.h> | ||||
| 
 | ||||
| #if !defined(FIXED_POINT) | ||||
| # define NE10_FFT_CFG_TYPE_T ne10_fft_cfg_float32_t | ||||
| # define NE10_FFT_CPX_TYPE_T_STR "ne10_fft_cpx_float32_t" | ||||
| # define NE10_FFT_STATE_TYPE_T_STR "ne10_fft_state_float32_t" | ||||
| #else | ||||
| # define NE10_FFT_CFG_TYPE_T ne10_fft_cfg_int32_t | ||||
| # define NE10_FFT_CPX_TYPE_T_STR "ne10_fft_cpx_int32_t" | ||||
| # define NE10_FFT_STATE_TYPE_T_STR "ne10_fft_state_int32_t" | ||||
| #endif | ||||
| 
 | ||||
| static FILE *file; | ||||
| 
 | ||||
| void dump_modes_arch_init(CELTMode **modes, int nb_modes) | ||||
| { | ||||
|    int i; | ||||
| 
 | ||||
|    file = fopen(ARM_NE10_ARCH_FILE_NAME, "w"); | ||||
|    fprintf(file, "/* The contents of this file was automatically generated by\n"); | ||||
|    fprintf(file, " * dump_mode_arm_ne10.c with arguments:"); | ||||
|    for (i=0;i<nb_modes;i++) | ||||
|    { | ||||
|       CELTMode *mode = modes[i]; | ||||
|       fprintf(file, " %d %d",mode->Fs,mode->shortMdctSize*mode->nbShortMdcts); | ||||
|    } | ||||
|    fprintf(file, "\n * It contains static definitions for some pre-defined modes. */\n"); | ||||
|    fprintf(file, "#include <NE10_types.h>\n\n"); | ||||
| } | ||||
| 
 | ||||
| void dump_modes_arch_finalize() | ||||
| { | ||||
|    fclose(file); | ||||
| } | ||||
| 
 | ||||
| void dump_mode_arch(CELTMode *mode) | ||||
| { | ||||
|    int k, j; | ||||
|    int mdctSize; | ||||
| 
 | ||||
|    mdctSize = mode->shortMdctSize*mode->nbShortMdcts; | ||||
| 
 | ||||
|    fprintf(file, "#ifndef NE10_FFT_PARAMS%d_%d\n", mode->Fs, mdctSize); | ||||
|    fprintf(file, "#define NE10_FFT_PARAMS%d_%d\n", mode->Fs, mdctSize); | ||||
|    /* cfg->factors */ | ||||
|    for(k=0;k<=mode->mdct.maxshift;k++) { | ||||
|       NE10_FFT_CFG_TYPE_T cfg; | ||||
|       cfg = (NE10_FFT_CFG_TYPE_T)mode->mdct.kfft[k]->arch_fft->priv; | ||||
|       if (!cfg) | ||||
|          continue; | ||||
|       fprintf(file, "static const ne10_int32_t ne10_factors_%d[%d] = {\n", | ||||
|               mode->mdct.kfft[k]->nfft, (NE10_MAXFACTORS * 2)); | ||||
|       for(j=0;j<(NE10_MAXFACTORS * 2);j++) { | ||||
|          fprintf(file, "%d,%c", cfg->factors[j],(j+16)%15==0?'\n':' '); | ||||
|       } | ||||
|       fprintf (file, "};\n"); | ||||
|    } | ||||
| 
 | ||||
|    /* cfg->twiddles */ | ||||
|    for(k=0;k<=mode->mdct.maxshift;k++) { | ||||
|       NE10_FFT_CFG_TYPE_T cfg; | ||||
|       cfg = (NE10_FFT_CFG_TYPE_T)mode->mdct.kfft[k]->arch_fft->priv; | ||||
|       if (!cfg) | ||||
|          continue; | ||||
|       fprintf(file, "static const %s ne10_twiddles_%d[%d] = {\n", | ||||
|               NE10_FFT_CPX_TYPE_T_STR, mode->mdct.kfft[k]->nfft, | ||||
|               mode->mdct.kfft[k]->nfft); | ||||
|       for(j=0;j<mode->mdct.kfft[k]->nfft;j++) { | ||||
| #if !defined(FIXED_POINT) | ||||
|          fprintf(file, "{%#0.8gf,%#0.8gf},%c", | ||||
|                  cfg->twiddles[j].r, cfg->twiddles[j].i,(j+4)%3==0?'\n':' '); | ||||
| #else | ||||
|          fprintf(file, "{%d,%d},%c", | ||||
|                  cfg->twiddles[j].r, cfg->twiddles[j].i,(j+4)%3==0?'\n':' '); | ||||
| #endif | ||||
|       } | ||||
|       fprintf (file, "};\n"); | ||||
|    } | ||||
| 
 | ||||
|    for(k=0;k<=mode->mdct.maxshift;k++) { | ||||
|       NE10_FFT_CFG_TYPE_T cfg; | ||||
|       cfg = (NE10_FFT_CFG_TYPE_T)mode->mdct.kfft[k]->arch_fft->priv; | ||||
|       if (!cfg) { | ||||
|          fprintf(file, "/* Ne10 does not support scaled FFT for length = %d */\n", | ||||
|                  mode->mdct.kfft[k]->nfft); | ||||
|          fprintf(file, "static const arch_fft_state cfg_arch_%d = {\n", mode->mdct.kfft[k]->nfft); | ||||
|          fprintf(file, "0,\n"); | ||||
|          fprintf(file, "NULL\n"); | ||||
|          fprintf(file, "};\n"); | ||||
|          continue; | ||||
|       } | ||||
|       fprintf(file, "static const %s %s_%d = {\n", NE10_FFT_STATE_TYPE_T_STR, | ||||
|               NE10_FFT_STATE_TYPE_T_STR, mode->mdct.kfft[k]->nfft); | ||||
|       fprintf(file, "%d,\n", cfg->nfft); | ||||
|       fprintf(file, "(ne10_int32_t *)ne10_factors_%d,\n", mode->mdct.kfft[k]->nfft); | ||||
|       fprintf(file, "(%s *)ne10_twiddles_%d,\n", | ||||
|               NE10_FFT_CPX_TYPE_T_STR, mode->mdct.kfft[k]->nfft); | ||||
|       fprintf(file, "NULL,\n");  /* buffer */ | ||||
|       fprintf(file, "(%s *)&ne10_twiddles_%d[%d],\n", | ||||
|               NE10_FFT_CPX_TYPE_T_STR, mode->mdct.kfft[k]->nfft, cfg->nfft); | ||||
| #if !defined(FIXED_POINT) | ||||
|       fprintf(file, "/* is_forward_scaled = true */\n"); | ||||
|       fprintf(file, "(ne10_int32_t) 1,\n"); | ||||
|       fprintf(file, "/* is_backward_scaled = false */\n"); | ||||
|       fprintf(file, "(ne10_int32_t) 0,\n"); | ||||
| #endif | ||||
|       fprintf(file, "};\n"); | ||||
| 
 | ||||
|       fprintf(file, "static const arch_fft_state cfg_arch_%d = {\n", | ||||
|               mode->mdct.kfft[k]->nfft); | ||||
|       fprintf(file, "1,\n"); | ||||
|       fprintf(file, "(void *)&%s_%d,\n", | ||||
|               NE10_FFT_STATE_TYPE_T_STR, mode->mdct.kfft[k]->nfft); | ||||
|       fprintf(file, "};\n\n"); | ||||
|    } | ||||
|    fprintf(file, "#endif  /* end NE10_FFT_PARAMS%d_%d */\n", mode->Fs, mdctSize); | ||||
| } | ||||
|  | @ -116,7 +116,7 @@ opus_uint32 ec_tell_frac(ec_ctx *_this){ | |||
| 
 | ||||
| #ifdef USE_SMALL_DIV_TABLE | ||||
| /* Result of 2^32/(2*i+1), except for i=0. */ | ||||
| const opus_uint32 SMALL_DIV_TABLE[129] ICONST_ATTR = { | ||||
| const opus_uint32 SMALL_DIV_TABLE[129] = { | ||||
|    0xFFFFFFFF, 0x55555555, 0x33333333, 0x24924924, | ||||
|    0x1C71C71C, 0x1745D174, 0x13B13B13, 0x11111111, | ||||
|    0x0F0F0F0F, 0x0D79435E, 0x0C30C30C, 0x0B21642C, | ||||
|  |  | |||
|  | @ -122,7 +122,7 @@ opus_uint32 ec_tell_frac(ec_ctx *_this); | |||
| 
 | ||||
| /* Tested exhaustively for all n and for 1<=d<=256 */ | ||||
| static OPUS_INLINE opus_uint32 celt_udiv(opus_uint32 n, opus_uint32 d) { | ||||
|    celt_assert(d>0); | ||||
|    celt_sig_assert(d>0); | ||||
| #ifdef USE_SMALL_DIV_TABLE | ||||
|    if (d>256) | ||||
|       return n/d; | ||||
|  | @ -138,7 +138,7 @@ static OPUS_INLINE opus_uint32 celt_udiv(opus_uint32 n, opus_uint32 d) { | |||
| } | ||||
| 
 | ||||
| static OPUS_INLINE opus_int32 celt_sudiv(opus_int32 n, opus_int32 d) { | ||||
|    celt_assert(d>0); | ||||
|    celt_sig_assert(d>0); | ||||
| #ifdef USE_SMALL_DIV_TABLE | ||||
|    if (n<0) | ||||
|       return -(opus_int32)celt_udiv(-n, d); | ||||
|  |  | |||
|  | @ -85,7 +85,7 @@ int ec_dec_icdf(ec_dec *_this,const unsigned char *_icdf,unsigned _ftb); | |||
|   The bits must have been encoded with ec_enc_uint(). | ||||
|   No call to ec_dec_update() is necessary after this call. | ||||
|   _ft: The number of integers that can be decoded (one more than the max). | ||||
|        This must be at least one, and no more than 2**32-1. | ||||
|        This must be at least 2, and no more than 2**32-1. | ||||
|   Return: The decoded bits.*/ | ||||
| opus_uint32 ec_dec_uint(ec_dec *_this,opus_uint32 _ft); | ||||
| 
 | ||||
|  |  | |||
|  | @ -98,7 +98,7 @@ static void ec_enc_carry_out(ec_enc *_this,int _c){ | |||
|   else _this->ext++; | ||||
| } | ||||
| 
 | ||||
| static void ec_enc_normalize(ec_enc *_this){ | ||||
| static OPUS_INLINE void ec_enc_normalize(ec_enc *_this){ | ||||
|   /*If the range is too small, output some bits and rescale it.*/ | ||||
|   while(_this->rng<=EC_CODE_BOT){ | ||||
|     ec_enc_carry_out(_this,(int)(_this->val>>EC_CODE_SHIFT)); | ||||
|  |  | |||
|  | @ -67,7 +67,7 @@ void ec_enc_icdf(ec_enc *_this,int _s,const unsigned char *_icdf,unsigned _ftb); | |||
| /*Encodes a raw unsigned integer in the stream.
 | ||||
|   _fl: The integer to encode. | ||||
|   _ft: The number of integers that can be encoded (one more than the max). | ||||
|        This must be at least one, and no more than 2**32-1.*/ | ||||
|        This must be at least 2, and no more than 2**32-1.*/ | ||||
| void ec_enc_uint(ec_enc *_this,opus_uint32 _fl,opus_uint32 _ft); | ||||
| 
 | ||||
| /*Encodes a sequence of raw bits in the stream.
 | ||||
|  |  | |||
							
								
								
									
										79
									
								
								lib/rbcodec/codecs/libopus/celt/fixed_c5x.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										79
									
								
								lib/rbcodec/codecs/libopus/celt/fixed_c5x.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,79 @@ | |||
| /* Copyright (C) 2003 Jean-Marc Valin */ | ||||
| /**
 | ||||
|    @file fixed_c5x.h | ||||
|    @brief Fixed-point operations for the TI C5x DSP family | ||||
| */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef FIXED_C5X_H | ||||
| #define FIXED_C5X_H | ||||
| 
 | ||||
| #include "dsplib.h" | ||||
| 
 | ||||
| #undef IMUL32 | ||||
| static OPUS_INLINE long IMUL32(long i, long j) | ||||
| { | ||||
|    long ac0, ac1; | ||||
|    ac0 = _lmpy(i>>16,j); | ||||
|    ac1 = ac0 + _lmpy(i,j>>16); | ||||
|    return _lmpyu(i,j) + (ac1<<16); | ||||
| } | ||||
| 
 | ||||
| #undef MAX16 | ||||
| #define MAX16(a,b) _max(a,b) | ||||
| 
 | ||||
| #undef MIN16 | ||||
| #define MIN16(a,b) _min(a,b) | ||||
| 
 | ||||
| #undef MAX32 | ||||
| #define MAX32(a,b) _lmax(a,b) | ||||
| 
 | ||||
| #undef MIN32 | ||||
| #define MIN32(a,b) _lmin(a,b) | ||||
| 
 | ||||
| #undef VSHR32 | ||||
| #define VSHR32(a, shift) _lshl(a,-(shift)) | ||||
| 
 | ||||
| #undef MULT16_16_Q15 | ||||
| #define MULT16_16_Q15(a,b) (_smpy(a,b)) | ||||
| 
 | ||||
| #undef MULT16_16SU | ||||
| #define MULT16_16SU(a,b) _lmpysu(a,b) | ||||
| 
 | ||||
| #undef MULT_16_16 | ||||
| #define MULT_16_16(a,b) _lmpy(a,b) | ||||
| 
 | ||||
| /* FIXME: This is technically incorrect and is bound to cause problems. Is there any cleaner solution? */ | ||||
| #undef MULT16_32_Q15 | ||||
| #define MULT16_32_Q15(a,b) ADD32(SHL(MULT16_16((a),SHR((b),16)),1), SHR(MULT16_16SU((a),(b)),15)) | ||||
| 
 | ||||
| #define celt_ilog2(x) (30 - _lnorm(x)) | ||||
| #define OVERRIDE_CELT_ILOG2 | ||||
| 
 | ||||
| #define celt_maxabs16(x, len) MAX32(EXTEND32(maxval((DATA *)x, len)),-EXTEND32(minval((DATA *)x, len))) | ||||
| #define OVERRIDE_CELT_MAXABS16 | ||||
| 
 | ||||
| #endif /* FIXED_C5X_H */ | ||||
							
								
								
									
										70
									
								
								lib/rbcodec/codecs/libopus/celt/fixed_c6x.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										70
									
								
								lib/rbcodec/codecs/libopus/celt/fixed_c6x.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,70 @@ | |||
| /* Copyright (C) 2008 CSIRO */ | ||||
| /**
 | ||||
|    @file fixed_c6x.h | ||||
|    @brief Fixed-point operations for the TI C6x DSP family | ||||
| */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef FIXED_C6X_H | ||||
| #define FIXED_C6X_H | ||||
| 
 | ||||
| #undef MULT16_16SU | ||||
| #define MULT16_16SU(a,b) _mpysu(a,b) | ||||
| 
 | ||||
| #undef MULT_16_16 | ||||
| #define MULT_16_16(a,b) _mpy(a,b) | ||||
| 
 | ||||
| #define celt_ilog2(x) (30 - _norm(x)) | ||||
| #define OVERRIDE_CELT_ILOG2 | ||||
| 
 | ||||
| #undef MULT16_32_Q15 | ||||
| #define MULT16_32_Q15(a,b) (_mpylill(a, b) >> 15) | ||||
| 
 | ||||
| #if 0 | ||||
| #include "dsplib.h" | ||||
| 
 | ||||
| #undef MAX16 | ||||
| #define MAX16(a,b) _max(a,b) | ||||
| 
 | ||||
| #undef MIN16 | ||||
| #define MIN16(a,b) _min(a,b) | ||||
| 
 | ||||
| #undef MAX32 | ||||
| #define MAX32(a,b) _lmax(a,b) | ||||
| 
 | ||||
| #undef MIN32 | ||||
| #define MIN32(a,b) _lmin(a,b) | ||||
| 
 | ||||
| #undef VSHR32 | ||||
| #define VSHR32(a, shift) _lshl(a,-(shift)) | ||||
| 
 | ||||
| #undef MULT16_16_Q15 | ||||
| #define MULT16_16_Q15(a,b) (_smpy(a,b)) | ||||
| 
 | ||||
| #define celt_maxabs16(x, len) MAX32(EXTEND32(maxval((DATA *)x, len)),-EXTEND32(minval((DATA *)x, len))) | ||||
| #define OVERRIDE_CELT_MAXABS16 | ||||
| 
 | ||||
| #endif /* FIXED_C6X_H */ | ||||
							
								
								
									
										791
									
								
								lib/rbcodec/codecs/libopus/celt/fixed_debug.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										791
									
								
								lib/rbcodec/codecs/libopus/celt/fixed_debug.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,791 @@ | |||
| /* Copyright (C) 2003-2008 Jean-Marc Valin
 | ||||
|    Copyright (C) 2007-2012 Xiph.Org Foundation */ | ||||
| /**
 | ||||
|    @file fixed_debug.h | ||||
|    @brief Fixed-point operations with debugging | ||||
| */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef FIXED_DEBUG_H | ||||
| #define FIXED_DEBUG_H | ||||
| 
 | ||||
| #include <stdio.h> | ||||
| #include "opus_defines.h" | ||||
| 
 | ||||
| #ifdef CELT_C | ||||
| OPUS_EXPORT opus_int64 celt_mips=0; | ||||
| #else | ||||
| extern opus_int64 celt_mips; | ||||
| #endif | ||||
| 
 | ||||
| #define MULT16_16SU(a,b) ((opus_val32)(opus_val16)(a)*(opus_val32)(opus_uint16)(b)) | ||||
| #define MULT32_32_Q31(a,b) ADD32(ADD32(SHL32(MULT16_16(SHR32((a),16),SHR((b),16)),1), SHR32(MULT16_16SU(SHR32((a),16),((b)&0x0000ffff)),15)), SHR32(MULT16_16SU(SHR32((b),16),((a)&0x0000ffff)),15)) | ||||
| 
 | ||||
| /** 16x32 multiplication, followed by a 16-bit shift right. Results fits in 32 bits */ | ||||
| #define MULT16_32_Q16(a,b) ADD32(MULT16_16((a),SHR32((b),16)), SHR32(MULT16_16SU((a),((b)&0x0000ffff)),16)) | ||||
| 
 | ||||
| #define MULT16_32_P16(a,b) MULT16_32_PX(a,b,16) | ||||
| 
 | ||||
| #define QCONST16(x,bits) ((opus_val16)(.5+(x)*(((opus_val32)1)<<(bits)))) | ||||
| #define QCONST32(x,bits) ((opus_val32)(.5+(x)*(((opus_val32)1)<<(bits)))) | ||||
| 
 | ||||
| #define VERIFY_SHORT(x) ((x)<=32767&&(x)>=-32768) | ||||
| #define VERIFY_INT(x) ((x)<=2147483647LL&&(x)>=-2147483648LL) | ||||
| #define VERIFY_UINT(x) ((x)<=(2147483647LLU<<1)) | ||||
| 
 | ||||
| #define SHR(a,b) SHR32(a,b) | ||||
| #define PSHR(a,b) PSHR32(a,b) | ||||
| 
 | ||||
| /** Add two 32-bit values, ignore any overflows */ | ||||
| #define ADD32_ovflw(a,b) (celt_mips+=2,(opus_val32)((opus_uint32)(a)+(opus_uint32)(b))) | ||||
| /** Subtract two 32-bit values, ignore any overflows */ | ||||
| #define SUB32_ovflw(a,b) (celt_mips+=2,(opus_val32)((opus_uint32)(a)-(opus_uint32)(b))) | ||||
| /* Avoid MSVC warning C4146: unary minus operator applied to unsigned type */ | ||||
| /** Negate 32-bit value, ignore any overflows */ | ||||
| #define NEG32_ovflw(a) (celt_mips+=2,(opus_val32)(0-(opus_uint32)(a))) | ||||
| 
 | ||||
| static OPUS_INLINE short NEG16(int x) | ||||
| { | ||||
|    int res; | ||||
|    if (!VERIFY_SHORT(x)) | ||||
|    { | ||||
|       fprintf (stderr, "NEG16: input is not short: %d\n", (int)x); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = -x; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "NEG16: output is not short: %d\n", (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| static OPUS_INLINE int NEG32(opus_int64 x) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_INT(x)) | ||||
|    { | ||||
|       fprintf (stderr, "NEG16: input is not int: %d\n", (int)x); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = -x; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "NEG16: output is not int: %d\n", (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=2; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define EXTRACT16(x) EXTRACT16_(x, __FILE__, __LINE__) | ||||
| static OPUS_INLINE short EXTRACT16_(int x, char *file, int line) | ||||
| { | ||||
|    int res; | ||||
|    if (!VERIFY_SHORT(x)) | ||||
|    { | ||||
|       fprintf (stderr, "EXTRACT16: input is not short: %d in %s: line %d\n", x, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = x; | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define EXTEND32(x) EXTEND32_(x, __FILE__, __LINE__) | ||||
| static OPUS_INLINE int EXTEND32_(int x, char *file, int line) | ||||
| { | ||||
|    int res; | ||||
|    if (!VERIFY_SHORT(x)) | ||||
|    { | ||||
|       fprintf (stderr, "EXTEND32: input is not short: %d in %s: line %d\n", x, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = x; | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define SHR16(a, shift) SHR16_(a, shift, __FILE__, __LINE__) | ||||
| static OPUS_INLINE short SHR16_(int a, int shift, char *file, int line) | ||||
| { | ||||
|    int res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(shift)) | ||||
|    { | ||||
|       fprintf (stderr, "SHR16: inputs are not short: %d >> %d in %s: line %d\n", a, shift, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a>>shift; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "SHR16: output is not short: %d in %s: line %d\n", res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| #define SHL16(a, shift) SHL16_(a, shift, __FILE__, __LINE__) | ||||
| static OPUS_INLINE short SHL16_(int a, int shift, char *file, int line) | ||||
| { | ||||
|    int res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(shift)) | ||||
|    { | ||||
|       fprintf (stderr, "SHL16: inputs are not short: %d %d in %s: line %d\n", a, shift, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a<<shift; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "SHL16: output is not short: %d in %s: line %d\n", res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| static OPUS_INLINE int SHR32(opus_int64 a, int shift) | ||||
| { | ||||
|    opus_int64  res; | ||||
|    if (!VERIFY_INT(a) || !VERIFY_SHORT(shift)) | ||||
|    { | ||||
|       fprintf (stderr, "SHR32: inputs are not int: %d %d\n", (int)a, shift); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a>>shift; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "SHR32: output is not int: %d\n", (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=2; | ||||
|    return res; | ||||
| } | ||||
| #define SHL32(a, shift) SHL32_(a, shift, __FILE__, __LINE__) | ||||
| static OPUS_INLINE int SHL32_(opus_int64 a, int shift, char *file, int line) | ||||
| { | ||||
|    opus_int64  res; | ||||
|    if (!VERIFY_INT(a) || !VERIFY_SHORT(shift)) | ||||
|    { | ||||
|       fprintf (stderr, "SHL32: inputs are not int: %lld %d in %s: line %d\n", a, shift, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a<<shift; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "SHL32: output is not int: %lld<<%d = %lld in %s: line %d\n", a, shift, res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=2; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define PSHR32(a,shift) (celt_mips--,SHR32(ADD32((a),(((opus_val32)(1)<<((shift))>>1))),shift)) | ||||
| #define VSHR32(a, shift) (((shift)>0) ? SHR32(a, shift) : SHL32(a, -(shift))) | ||||
| 
 | ||||
| #define ROUND16(x,a) (celt_mips--,EXTRACT16(PSHR32((x),(a)))) | ||||
| #define SROUND16(x,a) (celt_mips--,EXTRACT16(SATURATE(PSHR32(x,a), 32767))); | ||||
| 
 | ||||
| #define HALF16(x)  (SHR16(x,1)) | ||||
| #define HALF32(x)  (SHR32(x,1)) | ||||
| 
 | ||||
| #define ADD16(a, b) ADD16_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE short ADD16_(int a, int b, char *file, int line) | ||||
| { | ||||
|    int res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "ADD16: inputs are not short: %d %d in %s: line %d\n", a, b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a+b; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "ADD16: output is not short: %d+%d=%d in %s: line %d\n", a,b,res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define SUB16(a, b) SUB16_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE short SUB16_(int a, int b, char *file, int line) | ||||
| { | ||||
|    int res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "SUB16: inputs are not short: %d %d in %s: line %d\n", a, b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a-b; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "SUB16: output is not short: %d in %s: line %d\n", res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define ADD32(a, b) ADD32_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE int ADD32_(opus_int64 a, opus_int64 b, char *file, int line) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_INT(a) || !VERIFY_INT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "ADD32: inputs are not int: %d %d in %s: line %d\n", (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a+b; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "ADD32: output is not int: %d in %s: line %d\n", (int)res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=2; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define SUB32(a, b) SUB32_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE int SUB32_(opus_int64 a, opus_int64 b, char *file, int line) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_INT(a) || !VERIFY_INT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "SUB32: inputs are not int: %d %d in %s: line %d\n", (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a-b; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "SUB32: output is not int: %d in %s: line %d\n", (int)res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=2; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #undef UADD32 | ||||
| #define UADD32(a, b) UADD32_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE unsigned int UADD32_(opus_uint64 a, opus_uint64 b, char *file, int line) | ||||
| { | ||||
|    opus_uint64 res; | ||||
|    if (!VERIFY_UINT(a) || !VERIFY_UINT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "UADD32: inputs are not uint32: %llu %llu in %s: line %d\n", a, b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a+b; | ||||
|    if (!VERIFY_UINT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "UADD32: output is not uint32: %llu in %s: line %d\n", res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=2; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #undef USUB32 | ||||
| #define USUB32(a, b) USUB32_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE unsigned int USUB32_(opus_uint64 a, opus_uint64 b, char *file, int line) | ||||
| { | ||||
|    opus_uint64 res; | ||||
|    if (!VERIFY_UINT(a) || !VERIFY_UINT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "USUB32: inputs are not uint32: %llu %llu in %s: line %d\n", a, b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    if (a<b) | ||||
|    { | ||||
|       fprintf (stderr, "USUB32: inputs underflow: %llu < %llu in %s: line %d\n", a, b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a-b; | ||||
|    if (!VERIFY_UINT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "USUB32: output is not uint32: %llu - %llu = %llu in %s: line %d\n", a, b, res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=2; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| /* result fits in 16 bits */ | ||||
| static OPUS_INLINE short MULT16_16_16(int a, int b) | ||||
| { | ||||
|    int res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_16: inputs are not short: %d %d\n", a, b); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a*b; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_16: output is not short: %d\n", res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define MULT16_16(a, b) MULT16_16_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE int MULT16_16_(int a, int b, char *file, int line) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16: inputs are not short: %d %d in %s: line %d\n", a, b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((opus_int64)a)*b; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16: output is not int: %d in %s: line %d\n", (int)res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips++; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define MAC16_16(c,a,b)     (celt_mips-=2,ADD32((c),MULT16_16((a),(b)))) | ||||
| 
 | ||||
| #define MULT16_32_QX(a, b, Q) MULT16_32_QX_(a, b, Q, __FILE__, __LINE__) | ||||
| static OPUS_INLINE int MULT16_32_QX_(int a, opus_int64 b, int Q, char *file, int line) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_INT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_32_Q%d: inputs are not short+int: %d %d in %s: line %d\n", Q, (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    if (ABS32(b)>=((opus_val32)(1)<<(15+Q))) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_32_Q%d: second operand too large: %d %d in %s: line %d\n", Q, (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = (((opus_int64)a)*(opus_int64)b) >> Q; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_32_Q%d: output is not int: %d*%d=%d in %s: line %d\n", Q, (int)a, (int)b,(int)res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    if (Q==15) | ||||
|       celt_mips+=3; | ||||
|    else | ||||
|       celt_mips+=4; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define MULT16_32_PX(a, b, Q) MULT16_32_PX_(a, b, Q, __FILE__, __LINE__) | ||||
| static OPUS_INLINE int MULT16_32_PX_(int a, opus_int64 b, int Q, char *file, int line) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_INT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_32_P%d: inputs are not short+int: %d %d in %s: line %d\n\n", Q, (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    if (ABS32(b)>=((opus_int64)(1)<<(15+Q))) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_32_Q%d: second operand too large: %d %d in %s: line %d\n\n", Q, (int)a, (int)b,file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((((opus_int64)a)*(opus_int64)b) + (((opus_val32)(1)<<Q)>>1))>> Q; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_32_P%d: output is not int: %d*%d=%d in %s: line %d\n\n", Q, (int)a, (int)b,(int)res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    if (Q==15) | ||||
|       celt_mips+=4; | ||||
|    else | ||||
|       celt_mips+=5; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define MULT16_32_Q15(a,b) MULT16_32_QX(a,b,15) | ||||
| #define MAC16_32_Q15(c,a,b) (celt_mips-=2,ADD32((c),MULT16_32_Q15((a),(b)))) | ||||
| #define MAC16_32_Q16(c,a,b) (celt_mips-=2,ADD32((c),MULT16_32_Q16((a),(b)))) | ||||
| 
 | ||||
| static OPUS_INLINE int SATURATE(int a, int b) | ||||
| { | ||||
|    if (a>b) | ||||
|       a=b; | ||||
|    if (a<-b) | ||||
|       a = -b; | ||||
|    celt_mips+=3; | ||||
|    return a; | ||||
| } | ||||
| 
 | ||||
| static OPUS_INLINE opus_int16 SATURATE16(opus_int32 a) | ||||
| { | ||||
|    celt_mips+=3; | ||||
|    if (a>32767) | ||||
|       return 32767; | ||||
|    else if (a<-32768) | ||||
|       return -32768; | ||||
|    else return a; | ||||
| } | ||||
| 
 | ||||
| static OPUS_INLINE int MULT16_16_Q11_32(int a, int b) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_Q11: inputs are not short: %d %d\n", a, b); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((opus_int64)a)*b; | ||||
|    res >>= 11; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_Q11: output is not short: %d*%d=%d\n", (int)a, (int)b, (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=3; | ||||
|    return res; | ||||
| } | ||||
| static OPUS_INLINE short MULT16_16_Q13(int a, int b) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_Q13: inputs are not short: %d %d\n", a, b); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((opus_int64)a)*b; | ||||
|    res >>= 13; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_Q13: output is not short: %d*%d=%d\n", a, b, (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=3; | ||||
|    return res; | ||||
| } | ||||
| static OPUS_INLINE short MULT16_16_Q14(int a, int b) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_Q14: inputs are not short: %d %d\n", a, b); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((opus_int64)a)*b; | ||||
|    res >>= 14; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_Q14: output is not short: %d\n", (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=3; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define MULT16_16_Q15(a, b) MULT16_16_Q15_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE short MULT16_16_Q15_(int a, int b, char *file, int line) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_Q15: inputs are not short: %d %d in %s: line %d\n", a, b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((opus_int64)a)*b; | ||||
|    res >>= 15; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_Q15: output is not short: %d in %s: line %d\n", (int)res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=1; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| static OPUS_INLINE short MULT16_16_P13(int a, int b) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P13: inputs are not short: %d %d\n", a, b); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((opus_int64)a)*b; | ||||
|    res += 4096; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P13: overflow: %d*%d=%d\n", a, b, (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res >>= 13; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P13: output is not short: %d*%d=%d\n", a, b, (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=4; | ||||
|    return res; | ||||
| } | ||||
| static OPUS_INLINE short MULT16_16_P14(int a, int b) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P14: inputs are not short: %d %d\n", a, b); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((opus_int64)a)*b; | ||||
|    res += 8192; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P14: overflow: %d*%d=%d\n", a, b, (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res >>= 14; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P14: output is not short: %d*%d=%d\n", a, b, (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=4; | ||||
|    return res; | ||||
| } | ||||
| static OPUS_INLINE short MULT16_16_P15(int a, int b) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (!VERIFY_SHORT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P15: inputs are not short: %d %d\n", a, b); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = ((opus_int64)a)*b; | ||||
|    res += 16384; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P15: overflow: %d*%d=%d\n", a, b, (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res >>= 15; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "MULT16_16_P15: output is not short: %d*%d=%d\n", a, b, (int)res); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=2; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define DIV32_16(a, b) DIV32_16_(a, b, __FILE__, __LINE__) | ||||
| 
 | ||||
| static OPUS_INLINE int DIV32_16_(opus_int64 a, opus_int64 b, char *file, int line) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (b==0) | ||||
|    { | ||||
|       fprintf(stderr, "DIV32_16: divide by zero: %d/%d in %s: line %d\n", (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|       return 0; | ||||
|    } | ||||
|    if (!VERIFY_INT(a) || !VERIFY_SHORT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "DIV32_16: inputs are not int/short: %d %d in %s: line %d\n", (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a/b; | ||||
|    if (!VERIFY_SHORT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "DIV32_16: output is not short: %d / %d = %d in %s: line %d\n", (int)a,(int)b,(int)res, file, line); | ||||
|       if (res>32767) | ||||
|          res = 32767; | ||||
|       if (res<-32768) | ||||
|          res = -32768; | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=35; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| #define DIV32(a, b) DIV32_(a, b, __FILE__, __LINE__) | ||||
| static OPUS_INLINE int DIV32_(opus_int64 a, opus_int64 b, char *file, int line) | ||||
| { | ||||
|    opus_int64 res; | ||||
|    if (b==0) | ||||
|    { | ||||
|       fprintf(stderr, "DIV32: divide by zero: %d/%d in %s: line %d\n", (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|       return 0; | ||||
|    } | ||||
| 
 | ||||
|    if (!VERIFY_INT(a) || !VERIFY_INT(b)) | ||||
|    { | ||||
|       fprintf (stderr, "DIV32: inputs are not int/short: %d %d in %s: line %d\n", (int)a, (int)b, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    res = a/b; | ||||
|    if (!VERIFY_INT(res)) | ||||
|    { | ||||
|       fprintf (stderr, "DIV32: output is not int: %d in %s: line %d\n", (int)res, file, line); | ||||
| #ifdef FIXED_DEBUG_ASSERT | ||||
|       celt_assert(0); | ||||
| #endif | ||||
|    } | ||||
|    celt_mips+=70; | ||||
|    return res; | ||||
| } | ||||
| 
 | ||||
| static OPUS_INLINE opus_val16 SIG2WORD16_generic(celt_sig x) | ||||
| { | ||||
|    x = PSHR32(x, SIG_SHIFT); | ||||
|    x = MAX32(x, -32768); | ||||
|    x = MIN32(x, 32767); | ||||
|    return EXTRACT16(x); | ||||
| } | ||||
| #define SIG2WORD16(x) (SIG2WORD16_generic(x)) | ||||
| 
 | ||||
| 
 | ||||
| #undef PRINT_MIPS | ||||
| #define PRINT_MIPS(file) do {fprintf (file, "total complexity = %llu MIPS\n", celt_mips);} while (0); | ||||
| 
 | ||||
| #endif | ||||
|  | @ -37,16 +37,32 @@ | |||
| #define MULT16_16SU(a,b) ((opus_val32)(opus_val16)(a)*(opus_val32)(opus_uint16)(b)) | ||||
| 
 | ||||
| /** 16x32 multiplication, followed by a 16-bit shift right. Results fits in 32 bits */ | ||||
| #if OPUS_FAST_INT64 | ||||
| #define MULT16_32_Q16(a,b) ((opus_val32)SHR((opus_int64)((opus_val16)(a))*(b),16)) | ||||
| #else | ||||
| #define MULT16_32_Q16(a,b) ADD32(MULT16_16((a),SHR((b),16)), SHR(MULT16_16SU((a),((b)&0x0000ffff)),16)) | ||||
| #endif | ||||
| 
 | ||||
| /** 16x32 multiplication, followed by a 16-bit shift right (round-to-nearest). Results fits in 32 bits */ | ||||
| #if OPUS_FAST_INT64 | ||||
| #define MULT16_32_P16(a,b) ((opus_val32)PSHR((opus_int64)((opus_val16)(a))*(b),16)) | ||||
| #else | ||||
| #define MULT16_32_P16(a,b) ADD32(MULT16_16((a),SHR((b),16)), PSHR(MULT16_16SU((a),((b)&0x0000ffff)),16)) | ||||
| #endif | ||||
| 
 | ||||
| /** 16x32 multiplication, followed by a 15-bit shift right. Results fits in 32 bits */ | ||||
| #if OPUS_FAST_INT64 | ||||
| #define MULT16_32_Q15(a,b) ((opus_val32)SHR((opus_int64)((opus_val16)(a))*(b),15)) | ||||
| #else | ||||
| #define MULT16_32_Q15(a,b) ADD32(SHL(MULT16_16((a),SHR((b),16)),1), SHR(MULT16_16SU((a),((b)&0x0000ffff)),15)) | ||||
| #endif | ||||
| 
 | ||||
| /** 32x32 multiplication, followed by a 31-bit shift right. Results fits in 32 bits */ | ||||
| #if OPUS_FAST_INT64 | ||||
| #define MULT32_32_Q31(a,b) ((opus_val32)SHR((opus_int64)(a)*(opus_int64)(b),31)) | ||||
| #else | ||||
| #define MULT32_32_Q31(a,b) ADD32(ADD32(SHL(MULT16_16(SHR((a),16),SHR((b),16)),1), SHR(MULT16_16SU(SHR((a),16),((b)&0x0000ffff)),15)), SHR(MULT16_16SU(SHR((b),16),((a)&0x0000ffff)),15)) | ||||
| #endif | ||||
| 
 | ||||
| /** Compile-time conversion of float constant to 16-bit value */ | ||||
| #define QCONST16(x,bits) ((opus_val16)(.5+(x)*(((opus_val32)1)<<(bits)))) | ||||
|  | @ -88,6 +104,9 @@ | |||
| 
 | ||||
| /** Shift by a and round-to-neareast 32-bit value. Result is a 16-bit value */ | ||||
| #define ROUND16(x,a) (EXTRACT16(PSHR32((x),(a)))) | ||||
| /** Shift by a and round-to-neareast 32-bit value. Result is a saturated 16-bit value */ | ||||
| #define SROUND16(x,a) EXTRACT16(SATURATE(PSHR32(x,a), 32767)); | ||||
| 
 | ||||
| /** Divide by two */ | ||||
| #define HALF16(x)  (SHR16(x,1)) | ||||
| #define HALF32(x)  (SHR32(x,1)) | ||||
|  | @ -101,6 +120,14 @@ | |||
| /** Subtract two 32-bit values */ | ||||
| #define SUB32(a,b) ((opus_val32)(a)-(opus_val32)(b)) | ||||
| 
 | ||||
| /** Add two 32-bit values, ignore any overflows */ | ||||
| #define ADD32_ovflw(a,b) ((opus_val32)((opus_uint32)(a)+(opus_uint32)(b))) | ||||
| /** Subtract two 32-bit values, ignore any overflows */ | ||||
| #define SUB32_ovflw(a,b) ((opus_val32)((opus_uint32)(a)-(opus_uint32)(b))) | ||||
| /* Avoid MSVC warning C4146: unary minus operator applied to unsigned type */ | ||||
| /** Negate 32-bit value, ignore any overflows */ | ||||
| #define NEG32_ovflw(a) ((opus_val32)(0-(opus_uint32)(a))) | ||||
| 
 | ||||
| /** 16x16 multiplication where the result fits in 16 bits */ | ||||
| #define MULT16_16_16(a,b)     ((((opus_val16)(a))*((opus_val16)(b)))) | ||||
| 
 | ||||
|  |  | |||
|  | @ -61,7 +61,13 @@ | |||
| **      the config.h file. | ||||
| */ | ||||
| 
 | ||||
| #if (HAVE_LRINTF) | ||||
| /* With GCC, when SSE is available, the fastest conversion is cvtss2si. */ | ||||
| #if defined(__GNUC__) && defined(__SSE__) | ||||
| 
 | ||||
| #include <xmmintrin.h> | ||||
| static OPUS_INLINE opus_int32 float2int(float x) {return _mm_cvt_ss2si(_mm_set_ss(x));} | ||||
| 
 | ||||
| #elif defined(HAVE_LRINTF) | ||||
| 
 | ||||
| /*      These defines enable functionality introduced with the 1999 ISO C
 | ||||
| **      standard. They must be defined before the inclusion of math.h to | ||||
|  | @ -90,21 +96,21 @@ | |||
| #include <math.h> | ||||
| #define float2int(x) lrint(x) | ||||
| 
 | ||||
| #elif (defined(_MSC_VER) && _MSC_VER >= 1400) && (defined (WIN64) || defined (_WIN64)) | ||||
| #elif (defined(_MSC_VER) && _MSC_VER >= 1400) && (defined(_M_X64) || (defined(_M_IX86_FP) && _M_IX86_FP >= 1)) | ||||
|         #include <xmmintrin.h> | ||||
| 
 | ||||
|         __inline long int float2int(float value) | ||||
|         static __inline long int float2int(float value) | ||||
|         { | ||||
|                 return _mm_cvtss_si32(_mm_load_ss(&value)); | ||||
|         } | ||||
| #elif (defined(_MSC_VER) && _MSC_VER >= 1400) && (defined (WIN32) || defined (_WIN32)) | ||||
| #elif (defined(_MSC_VER) && _MSC_VER >= 1400) && defined (_M_IX86) | ||||
|         #include <math.h> | ||||
| 
 | ||||
|         /*      Win32 doesn't seem to have these functions.
 | ||||
|         **      Therefore implement OPUS_INLINE versions of these functions here. | ||||
|         */ | ||||
| 
 | ||||
|         __inline long int | ||||
|         static __inline long int | ||||
|         float2int (float flt) | ||||
|         {       int intgr; | ||||
| 
 | ||||
|  |  | |||
|  | @ -82,8 +82,8 @@ static void kf_bfly2( | |||
|          C_SUB( Fout2[0] ,  Fout[0] , t ); | ||||
|          C_ADDTO( Fout[0] ,  t ); | ||||
| 
 | ||||
|          t.r = S_MUL(Fout2[1].r+Fout2[1].i, tw); | ||||
|          t.i = S_MUL(Fout2[1].i-Fout2[1].r, tw); | ||||
|          t.r = S_MUL(ADD32_ovflw(Fout2[1].r, Fout2[1].i), tw); | ||||
|          t.i = S_MUL(SUB32_ovflw(Fout2[1].i, Fout2[1].r), tw); | ||||
|          C_SUB( Fout2[1] ,  Fout[1] , t ); | ||||
|          C_ADDTO( Fout[1] ,  t ); | ||||
| 
 | ||||
|  | @ -92,8 +92,8 @@ static void kf_bfly2( | |||
|          C_SUB( Fout2[2] ,  Fout[2] , t ); | ||||
|          C_ADDTO( Fout[2] ,  t ); | ||||
| 
 | ||||
|          t.r = S_MUL(Fout2[3].i-Fout2[3].r, tw); | ||||
|          t.i = S_MUL(-Fout2[3].i-Fout2[3].r, tw); | ||||
|          t.r = S_MUL(SUB32_ovflw(Fout2[3].i, Fout2[3].r), tw); | ||||
|          t.i = S_MUL(NEG32_ovflw(ADD32_ovflw(Fout2[3].i, Fout2[3].r)), tw); | ||||
|          C_SUB( Fout2[3] ,  Fout[3] , t ); | ||||
|          C_ADDTO( Fout[3] ,  t ); | ||||
|          Fout += 8; | ||||
|  | @ -126,10 +126,10 @@ static void kf_bfly4( | |||
|          C_ADDTO( *Fout , scratch1 ); | ||||
|          C_SUB( scratch1 , Fout[1] , Fout[3] ); | ||||
| 
 | ||||
|          Fout[1].r = scratch0.r + scratch1.i; | ||||
|          Fout[1].i = scratch0.i - scratch1.r; | ||||
|          Fout[3].r = scratch0.r - scratch1.i; | ||||
|          Fout[3].i = scratch0.i + scratch1.r; | ||||
|          Fout[1].r = ADD32_ovflw(scratch0.r, scratch1.i); | ||||
|          Fout[1].i = SUB32_ovflw(scratch0.i, scratch1.r); | ||||
|          Fout[3].r = SUB32_ovflw(scratch0.r, scratch1.i); | ||||
|          Fout[3].i = ADD32_ovflw(scratch0.i, scratch1.r); | ||||
|          Fout+=4; | ||||
|       } | ||||
|    } else { | ||||
|  | @ -160,10 +160,10 @@ static void kf_bfly4( | |||
|             tw3 += fstride*3; | ||||
|             C_ADDTO( *Fout , scratch[3] ); | ||||
| 
 | ||||
|             Fout[m].r = scratch[5].r + scratch[4].i; | ||||
|             Fout[m].i = scratch[5].i - scratch[4].r; | ||||
|             Fout[m3].r = scratch[5].r - scratch[4].i; | ||||
|             Fout[m3].i = scratch[5].i + scratch[4].r; | ||||
|             Fout[m].r = ADD32_ovflw(scratch[5].r, scratch[4].i); | ||||
|             Fout[m].i = SUB32_ovflw(scratch[5].i, scratch[4].r); | ||||
|             Fout[m3].r = SUB32_ovflw(scratch[5].r, scratch[4].i); | ||||
|             Fout[m3].i = ADD32_ovflw(scratch[5].i, scratch[4].r); | ||||
|             ++Fout; | ||||
|          } | ||||
|       } | ||||
|  | @ -191,7 +191,7 @@ static void kf_bfly3( | |||
| 
 | ||||
|    kiss_fft_cpx * Fout_beg = Fout; | ||||
| #ifdef FIXED_POINT | ||||
|    epi3.r = -16384; | ||||
|    /*epi3.r = -16384;*/ /* Unused */ | ||||
|    epi3.i = -28378; | ||||
| #else | ||||
|    epi3 = st->twiddles[fstride*m]; | ||||
|  | @ -212,18 +212,18 @@ static void kf_bfly3( | |||
|          tw1 += fstride; | ||||
|          tw2 += fstride*2; | ||||
| 
 | ||||
|          Fout[m].r = Fout->r - HALF_OF(scratch[3].r); | ||||
|          Fout[m].i = Fout->i - HALF_OF(scratch[3].i); | ||||
|          Fout[m].r = SUB32_ovflw(Fout->r, HALF_OF(scratch[3].r)); | ||||
|          Fout[m].i = SUB32_ovflw(Fout->i, HALF_OF(scratch[3].i)); | ||||
| 
 | ||||
|          C_MULBYSCALAR( scratch[0] , epi3.i ); | ||||
| 
 | ||||
|          C_ADDTO(*Fout,scratch[3]); | ||||
| 
 | ||||
|          Fout[m2].r = Fout[m].r + scratch[0].i; | ||||
|          Fout[m2].i = Fout[m].i - scratch[0].r; | ||||
|          Fout[m2].r = ADD32_ovflw(Fout[m].r, scratch[0].i); | ||||
|          Fout[m2].i = SUB32_ovflw(Fout[m].i, scratch[0].r); | ||||
| 
 | ||||
|          Fout[m].r -= scratch[0].i; | ||||
|          Fout[m].i += scratch[0].r; | ||||
|          Fout[m].r = SUB32_ovflw(Fout[m].r, scratch[0].i); | ||||
|          Fout[m].i = ADD32_ovflw(Fout[m].i, scratch[0].r); | ||||
| 
 | ||||
|          ++Fout; | ||||
|       } while(--k); | ||||
|  | @ -282,22 +282,22 @@ static void kf_bfly5( | |||
|          C_ADD( scratch[8],scratch[2],scratch[3]); | ||||
|          C_SUB( scratch[9],scratch[2],scratch[3]); | ||||
| 
 | ||||
|          Fout0->r += scratch[7].r + scratch[8].r; | ||||
|          Fout0->i += scratch[7].i + scratch[8].i; | ||||
|          Fout0->r = ADD32_ovflw(Fout0->r, ADD32_ovflw(scratch[7].r, scratch[8].r)); | ||||
|          Fout0->i = ADD32_ovflw(Fout0->i, ADD32_ovflw(scratch[7].i, scratch[8].i)); | ||||
| 
 | ||||
|          scratch[5].r = scratch[0].r + S_MUL(scratch[7].r,ya.r) + S_MUL(scratch[8].r,yb.r); | ||||
|          scratch[5].i = scratch[0].i + S_MUL(scratch[7].i,ya.r) + S_MUL(scratch[8].i,yb.r); | ||||
|          scratch[5].r = ADD32_ovflw(scratch[0].r, ADD32_ovflw(S_MUL(scratch[7].r,ya.r), S_MUL(scratch[8].r,yb.r))); | ||||
|          scratch[5].i = ADD32_ovflw(scratch[0].i, ADD32_ovflw(S_MUL(scratch[7].i,ya.r), S_MUL(scratch[8].i,yb.r))); | ||||
| 
 | ||||
|          scratch[6].r =  S_MUL(scratch[10].i,ya.i) + S_MUL(scratch[9].i,yb.i); | ||||
|          scratch[6].i = -S_MUL(scratch[10].r,ya.i) - S_MUL(scratch[9].r,yb.i); | ||||
|          scratch[6].r =  ADD32_ovflw(S_MUL(scratch[10].i,ya.i), S_MUL(scratch[9].i,yb.i)); | ||||
|          scratch[6].i = NEG32_ovflw(ADD32_ovflw(S_MUL(scratch[10].r,ya.i), S_MUL(scratch[9].r,yb.i))); | ||||
| 
 | ||||
|          C_SUB(*Fout1,scratch[5],scratch[6]); | ||||
|          C_ADD(*Fout4,scratch[5],scratch[6]); | ||||
| 
 | ||||
|          scratch[11].r = scratch[0].r + S_MUL(scratch[7].r,yb.r) + S_MUL(scratch[8].r,ya.r); | ||||
|          scratch[11].i = scratch[0].i + S_MUL(scratch[7].i,yb.r) + S_MUL(scratch[8].i,ya.r); | ||||
|          scratch[12].r = - S_MUL(scratch[10].i,yb.i) + S_MUL(scratch[9].i,ya.i); | ||||
|          scratch[12].i = S_MUL(scratch[10].r,yb.i) - S_MUL(scratch[9].r,ya.i); | ||||
|          scratch[11].r = ADD32_ovflw(scratch[0].r, ADD32_ovflw(S_MUL(scratch[7].r,yb.r), S_MUL(scratch[8].r,ya.r))); | ||||
|          scratch[11].i = ADD32_ovflw(scratch[0].i, ADD32_ovflw(S_MUL(scratch[7].i,yb.r), S_MUL(scratch[8].i,ya.r))); | ||||
|          scratch[12].r = SUB32_ovflw(S_MUL(scratch[9].i,ya.i), S_MUL(scratch[10].i,yb.i)); | ||||
|          scratch[12].i = SUB32_ovflw(S_MUL(scratch[10].r,yb.i), S_MUL(scratch[9].r,ya.i)); | ||||
| 
 | ||||
|          C_ADD(*Fout2,scratch[11],scratch[12]); | ||||
|          C_SUB(*Fout3,scratch[11],scratch[12]); | ||||
|  | @ -423,13 +423,19 @@ static void compute_twiddles(kiss_twiddle_cpx *twiddles, int nfft) | |||
| #endif | ||||
| } | ||||
| 
 | ||||
| int opus_fft_alloc_arch_c(kiss_fft_state *st) { | ||||
|    (void)st; | ||||
|    return 0; | ||||
| } | ||||
| 
 | ||||
| /*
 | ||||
|  * | ||||
|  * Allocates all necessary storage space for the fft and ifft. | ||||
|  * The return value is a contiguous block of memory.  As such, | ||||
|  * It can be freed with free(). | ||||
|  * */ | ||||
| kiss_fft_state *opus_fft_alloc_twiddles(int nfft,void * mem,size_t * lenmem,  const kiss_fft_state *base) | ||||
| kiss_fft_state *opus_fft_alloc_twiddles(int nfft,void * mem,size_t * lenmem, | ||||
|                                         const kiss_fft_state *base, int arch) | ||||
| { | ||||
|     kiss_fft_state *st=NULL; | ||||
|     size_t memneeded = sizeof(struct kiss_fft_state); /* twiddle factors*/ | ||||
|  | @ -478,22 +484,31 @@ kiss_fft_state *opus_fft_alloc_twiddles(int nfft,void * mem,size_t * lenmem,  co | |||
|         if (st->bitrev==NULL) | ||||
|             goto fail; | ||||
|         compute_bitrev_table(0, bitrev, 1,1, st->factors,st); | ||||
| 
 | ||||
|         /* Initialize architecture specific fft parameters */ | ||||
|         if (opus_fft_alloc_arch(st, arch)) | ||||
|             goto fail; | ||||
|     } | ||||
|     return st; | ||||
| fail: | ||||
|     opus_fft_free(st); | ||||
|     opus_fft_free(st, arch); | ||||
|     return NULL; | ||||
| } | ||||
| 
 | ||||
| kiss_fft_state *opus_fft_alloc(int nfft,void * mem,size_t * lenmem ) | ||||
| kiss_fft_state *opus_fft_alloc(int nfft,void * mem,size_t * lenmem, int arch) | ||||
| { | ||||
|    return opus_fft_alloc_twiddles(nfft, mem, lenmem, NULL); | ||||
|    return opus_fft_alloc_twiddles(nfft, mem, lenmem, NULL, arch); | ||||
| } | ||||
| 
 | ||||
| void opus_fft_free(const kiss_fft_state *cfg) | ||||
| void opus_fft_free_arch_c(kiss_fft_state *st) { | ||||
|    (void)st; | ||||
| } | ||||
| 
 | ||||
| void opus_fft_free(const kiss_fft_state *cfg, int arch) | ||||
| { | ||||
|    if (cfg) | ||||
|    { | ||||
|       opus_fft_free_arch((kiss_fft_state *)cfg, arch); | ||||
|       opus_free((opus_int16*)cfg->bitrev); | ||||
|       if (cfg->shift < 0) | ||||
|          opus_free((kiss_twiddle_cpx*)cfg->twiddles); | ||||
|  | @ -551,8 +566,7 @@ void opus_fft_impl(const kiss_fft_state *st,kiss_fft_cpx *fout) | |||
|     } | ||||
| } | ||||
| 
 | ||||
| #if 0 | ||||
| void opus_fft(const kiss_fft_state *st,const kiss_fft_cpx *fin,kiss_fft_cpx *fout) | ||||
| void opus_fft_c(const kiss_fft_state *st,const kiss_fft_cpx *fin,kiss_fft_cpx *fout) | ||||
| { | ||||
|    int i; | ||||
|    opus_val16 scale; | ||||
|  | @ -573,11 +587,9 @@ void opus_fft(const kiss_fft_state *st,const kiss_fft_cpx *fin,kiss_fft_cpx *fou | |||
|    } | ||||
|    opus_fft_impl(st, fout); | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| 
 | ||||
| #ifdef TEST_UNIT_DFT_C | ||||
| void opus_ifft(const kiss_fft_state *st,const kiss_fft_cpx *fin,kiss_fft_cpx *fout) | ||||
| void opus_ifft_c(const kiss_fft_state *st,const kiss_fft_cpx *fin,kiss_fft_cpx *fout) | ||||
| { | ||||
|    int i; | ||||
|    celt_assert2 (fin != fout, "In-place FFT not supported"); | ||||
|  | @ -590,4 +602,3 @@ void opus_ifft(const kiss_fft_state *st,const kiss_fft_cpx *fin,kiss_fft_cpx *fo | |||
|    for (i=0;i<st->nfft;i++) | ||||
|       fout[i].i = -fout[i].i; | ||||
| } | ||||
| #endif | ||||
|  |  | |||
|  | @ -32,6 +32,7 @@ | |||
| #include <stdlib.h> | ||||
| #include <math.h> | ||||
| #include "arch.h" | ||||
| #include "cpu_support.h" | ||||
| 
 | ||||
| #ifdef __cplusplus | ||||
| extern "C" { | ||||
|  | @ -77,6 +78,11 @@ typedef struct { | |||
|  4*4*4*2 | ||||
|  */ | ||||
| 
 | ||||
| typedef struct arch_fft_state{ | ||||
|    int is_supported; | ||||
|    void *priv; | ||||
| } arch_fft_state; | ||||
| 
 | ||||
| typedef struct kiss_fft_state{ | ||||
|     int nfft; | ||||
|     opus_val16 scale; | ||||
|  | @ -87,8 +93,13 @@ typedef struct kiss_fft_state{ | |||
|     opus_int16 factors[2*MAXFACTORS]; | ||||
|     const opus_int16 *bitrev; | ||||
|     const kiss_twiddle_cpx *twiddles; | ||||
|     arch_fft_state *arch_fft; | ||||
| } kiss_fft_state; | ||||
| 
 | ||||
| #if defined(HAVE_ARM_NE10) | ||||
| #include "arm/fft_arm.h" | ||||
| #endif | ||||
| 
 | ||||
| /*typedef struct kiss_fft_state* kiss_fft_cfg;*/ | ||||
| 
 | ||||
| /**
 | ||||
|  | @ -114,9 +125,9 @@ typedef struct kiss_fft_state{ | |||
|  *      buffer size in *lenmem. | ||||
|  * */ | ||||
| 
 | ||||
| kiss_fft_state *opus_fft_alloc_twiddles(int nfft,void * mem,size_t * lenmem, const kiss_fft_state *base); | ||||
| kiss_fft_state *opus_fft_alloc_twiddles(int nfft,void * mem,size_t * lenmem, const kiss_fft_state *base, int arch); | ||||
| 
 | ||||
| kiss_fft_state *opus_fft_alloc(int nfft,void * mem,size_t * lenmem); | ||||
| kiss_fft_state *opus_fft_alloc(int nfft,void * mem,size_t * lenmem, int arch); | ||||
| 
 | ||||
| /**
 | ||||
|  * opus_fft(cfg,in_out_buf) | ||||
|  | @ -128,13 +139,59 @@ kiss_fft_state *opus_fft_alloc(int nfft,void * mem,size_t * lenmem); | |||
|  * Note that each element is complex and can be accessed like | ||||
|     f[k].r and f[k].i | ||||
|  * */ | ||||
| void opus_fft(const kiss_fft_state *cfg,const kiss_fft_cpx *fin,kiss_fft_cpx *fout); | ||||
| void opus_ifft(const kiss_fft_state *cfg,const kiss_fft_cpx *fin,kiss_fft_cpx *fout); | ||||
| void opus_fft_c(const kiss_fft_state *cfg,const kiss_fft_cpx *fin,kiss_fft_cpx *fout); | ||||
| void opus_ifft_c(const kiss_fft_state *cfg,const kiss_fft_cpx *fin,kiss_fft_cpx *fout); | ||||
| 
 | ||||
| void opus_fft_impl(const kiss_fft_state *st,kiss_fft_cpx *fout); | ||||
| void opus_ifft_impl(const kiss_fft_state *st,kiss_fft_cpx *fout); | ||||
| 
 | ||||
| void opus_fft_free(const kiss_fft_state *cfg); | ||||
| void opus_fft_free(const kiss_fft_state *cfg, int arch); | ||||
| 
 | ||||
| 
 | ||||
| void opus_fft_free_arch_c(kiss_fft_state *st); | ||||
| int opus_fft_alloc_arch_c(kiss_fft_state *st); | ||||
| 
 | ||||
| #if !defined(OVERRIDE_OPUS_FFT) | ||||
| /* Is run-time CPU detection enabled on this platform? */ | ||||
| #if defined(OPUS_HAVE_RTCD) && (defined(HAVE_ARM_NE10)) | ||||
| 
 | ||||
| extern int (*const OPUS_FFT_ALLOC_ARCH_IMPL[OPUS_ARCHMASK+1])( | ||||
|  kiss_fft_state *st); | ||||
| 
 | ||||
| #define opus_fft_alloc_arch(_st, arch) \ | ||||
|          ((*OPUS_FFT_ALLOC_ARCH_IMPL[(arch)&OPUS_ARCHMASK])(_st)) | ||||
| 
 | ||||
| extern void (*const OPUS_FFT_FREE_ARCH_IMPL[OPUS_ARCHMASK+1])( | ||||
|  kiss_fft_state *st); | ||||
| #define opus_fft_free_arch(_st, arch) \ | ||||
|          ((*OPUS_FFT_FREE_ARCH_IMPL[(arch)&OPUS_ARCHMASK])(_st)) | ||||
| 
 | ||||
| extern void (*const OPUS_FFT[OPUS_ARCHMASK+1])(const kiss_fft_state *cfg, | ||||
|  const kiss_fft_cpx *fin, kiss_fft_cpx *fout); | ||||
| #define opus_fft(_cfg, _fin, _fout, arch) \ | ||||
|    ((*OPUS_FFT[(arch)&OPUS_ARCHMASK])(_cfg, _fin, _fout)) | ||||
| 
 | ||||
| extern void (*const OPUS_IFFT[OPUS_ARCHMASK+1])(const kiss_fft_state *cfg, | ||||
|  const kiss_fft_cpx *fin, kiss_fft_cpx *fout); | ||||
| #define opus_ifft(_cfg, _fin, _fout, arch) \ | ||||
|    ((*OPUS_IFFT[(arch)&OPUS_ARCHMASK])(_cfg, _fin, _fout)) | ||||
| 
 | ||||
| #else /* else for if defined(OPUS_HAVE_RTCD) && (defined(HAVE_ARM_NE10)) */ | ||||
| 
 | ||||
| #define opus_fft_alloc_arch(_st, arch) \ | ||||
|          ((void)(arch), opus_fft_alloc_arch_c(_st)) | ||||
| 
 | ||||
| #define opus_fft_free_arch(_st, arch) \ | ||||
|          ((void)(arch), opus_fft_free_arch_c(_st)) | ||||
| 
 | ||||
| #define opus_fft(_cfg, _fin, _fout, arch) \ | ||||
|          ((void)(arch), opus_fft_c(_cfg, _fin, _fout)) | ||||
| 
 | ||||
| #define opus_ifft(_cfg, _fin, _fout, arch) \ | ||||
|          ((void)(arch), opus_ifft_c(_cfg, _fin, _fout)) | ||||
| 
 | ||||
| #endif /* end if defined(OPUS_HAVE_RTCD) && (defined(HAVE_ARM_NE10)) */ | ||||
| #endif /* end if !defined(OVERRIDE_OPUS_FFT) */ | ||||
| 
 | ||||
| #ifdef __cplusplus | ||||
| } | ||||
|  |  | |||
|  | @ -38,7 +38,8 @@ | |||
| #include "mathops.h" | ||||
| 
 | ||||
| /*Compute floor(sqrt(_val)) with exact arithmetic.
 | ||||
|   This has been tested on all possible 32-bit inputs.*/ | ||||
|   _val must be greater than 0. | ||||
|   This has been tested on all possible 32-bit inputs greater than 0.*/ | ||||
| unsigned isqrt32(opus_uint32 _val){ | ||||
|   unsigned b; | ||||
|   unsigned g; | ||||
|  | @ -164,7 +165,7 @@ opus_val16 celt_cos_norm(opus_val32 x) | |||
|       { | ||||
|          return _celt_cos_pi_2(EXTRACT16(x)); | ||||
|       } else { | ||||
|          return NEG32(_celt_cos_pi_2(EXTRACT16(65536-x))); | ||||
|          return NEG16(_celt_cos_pi_2(EXTRACT16(65536-x))); | ||||
|       } | ||||
|    } else { | ||||
|       if (x&0x0000ffff) | ||||
|  | @ -182,7 +183,7 @@ opus_val32 celt_rcp(opus_val32 x) | |||
|    int i; | ||||
|    opus_val16 n; | ||||
|    opus_val16 r; | ||||
|    celt_assert2(x>0, "celt_rcp() only defined for positive values"); | ||||
|    celt_sig_assert(x>0); | ||||
|    i = celt_ilog2(x); | ||||
|    /* n is Q15 with range [0,1). */ | ||||
|    n = VSHR32(x,i-15)-32768; | ||||
|  |  | |||
|  | @ -38,11 +38,48 @@ | |||
| #include "entcode.h" | ||||
| #include "os_support.h" | ||||
| 
 | ||||
| #define PI 3.141592653f | ||||
| 
 | ||||
| #ifndef ABS | ||||
| #define ABS(a)(((a) < 0) ? - (a) :(a)) | ||||
| #endif | ||||
| 
 | ||||
| /* Multiplies two 16-bit fractional values. Bit-exactness of this macro is important */ | ||||
| #define FRAC_MUL16(a,b) ((16384+((opus_int32)(opus_int16)(a)*(opus_int16)(b)))>>15) | ||||
| 
 | ||||
| unsigned isqrt32(opus_uint32 _val); | ||||
| 
 | ||||
| /* CELT doesn't need it for fixed-point, by analysis.c does. */ | ||||
| #if !defined(FIXED_POINT) || defined(ANALYSIS_C) | ||||
| #define cA 0.43157974f | ||||
| #define cB 0.67848403f | ||||
| #define cC 0.08595542f | ||||
| #define cE ((float)PI/2) | ||||
| static OPUS_INLINE float fast_atan2f(float y, float x) { | ||||
|    float x2, y2; | ||||
|    x2 = x*x; | ||||
|    y2 = y*y; | ||||
|    /* For very small values, we don't care about the answer, so
 | ||||
|       we can just return 0. */ | ||||
|    if (x2 + y2 < 1e-18f) | ||||
|    { | ||||
|       return 0; | ||||
|    } | ||||
|    if(x2<y2){ | ||||
|       float den = (y2 + cB*x2) * (y2 + cC*x2); | ||||
|       return -x*y*(y2 + cA*x2) / den + (y<0 ? -cE : cE); | ||||
|    }else{ | ||||
|       float den = (x2 + cB*y2) * (x2 + cC*y2); | ||||
|       return  x*y*(x2 + cA*y2) / den + (y<0 ? -cE : cE) - (x*y<0 ? -cE : cE); | ||||
|    } | ||||
| } | ||||
| #undef cA | ||||
| #undef cB | ||||
| #undef cC | ||||
| #undef cE | ||||
| #endif | ||||
| 
 | ||||
| 
 | ||||
| #ifndef OVERRIDE_CELT_MAXABS16 | ||||
| static OPUS_INLINE opus_val32 celt_maxabs16(const opus_val16 *x, int len) | ||||
| { | ||||
|  | @ -80,7 +117,6 @@ static OPUS_INLINE opus_val32 celt_maxabs32(const opus_val32 *x, int len) | |||
| 
 | ||||
| #ifndef FIXED_POINT | ||||
| 
 | ||||
| #define PI 3.141592653f | ||||
| #define celt_sqrt(x) ((float)sqrt(x)) | ||||
| #define celt_rsqrt(x) (1.f/celt_sqrt(x)) | ||||
| #define celt_rsqrt_norm(x) (celt_rsqrt(x)) | ||||
|  | @ -147,7 +183,7 @@ static OPUS_INLINE float celt_exp2(float x) | |||
| /** Integer log in base2. Undefined for zero and negative numbers */ | ||||
| static OPUS_INLINE opus_int16 celt_ilog2(opus_int32 x) | ||||
| { | ||||
|    celt_assert2(x>0, "celt_ilog2() only defined for strictly positive numbers"); | ||||
|    celt_sig_assert(x>0); | ||||
|    return EC_ILOG(x)-1; | ||||
| } | ||||
| #endif | ||||
|  |  | |||
|  | @ -60,7 +60,7 @@ | |||
| 
 | ||||
| #ifdef CUSTOM_MODES | ||||
| 
 | ||||
| int clt_mdct_init(mdct_lookup *l,int N, int maxshift) | ||||
| int clt_mdct_init(mdct_lookup *l,int N, int maxshift, int arch) | ||||
| { | ||||
|    int i; | ||||
|    kiss_twiddle_scalar *trig; | ||||
|  | @ -71,9 +71,9 @@ int clt_mdct_init(mdct_lookup *l,int N, int maxshift) | |||
|    for (i=0;i<=maxshift;i++) | ||||
|    { | ||||
|       if (i==0) | ||||
|          l->kfft[i] = opus_fft_alloc(N>>2>>i, 0, 0); | ||||
|          l->kfft[i] = opus_fft_alloc(N>>2>>i, 0, 0, arch); | ||||
|       else | ||||
|          l->kfft[i] = opus_fft_alloc_twiddles(N>>2>>i, 0, 0, l->kfft[0]); | ||||
|          l->kfft[i] = opus_fft_alloc_twiddles(N>>2>>i, 0, 0, l->kfft[0], arch); | ||||
| #ifndef ENABLE_TI_DSPLIB55 | ||||
|       if (l->kfft[i]==NULL) | ||||
|          return 0; | ||||
|  | @ -104,21 +104,20 @@ int clt_mdct_init(mdct_lookup *l,int N, int maxshift) | |||
|    return 1; | ||||
| } | ||||
| 
 | ||||
| void clt_mdct_clear(mdct_lookup *l) | ||||
| void clt_mdct_clear(mdct_lookup *l, int arch) | ||||
| { | ||||
|    int i; | ||||
|    for (i=0;i<=l->maxshift;i++) | ||||
|       opus_fft_free(l->kfft[i]); | ||||
|       opus_fft_free(l->kfft[i], arch); | ||||
|    opus_free((kiss_twiddle_scalar*)l->trig); | ||||
| } | ||||
| 
 | ||||
| #endif /* CUSTOM_MODES */ | ||||
| 
 | ||||
| #if 0 | ||||
| /* Forward MDCT trashes the input array */ | ||||
| #ifndef OVERRIDE_clt_mdct_forward | ||||
| void clt_mdct_forward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|       const opus_val16 *window, int overlap, int shift, int stride) | ||||
| void clt_mdct_forward_c(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|       const opus_val16 *window, int overlap, int shift, int stride, int arch) | ||||
| { | ||||
|    int i; | ||||
|    int N, N2, N4; | ||||
|  | @ -133,6 +132,7 @@ void clt_mdct_forward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scalar | |||
|    int scale_shift = st->scale_shift-1; | ||||
| #endif | ||||
|    SAVE_STACK; | ||||
|    (void)arch; | ||||
|    scale = st->scale; | ||||
| 
 | ||||
|    N = l->n; | ||||
|  | @ -237,15 +237,15 @@ void clt_mdct_forward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scalar | |||
|    RESTORE_STACK; | ||||
| } | ||||
| #endif /* OVERRIDE_clt_mdct_forward */ | ||||
| #endif | ||||
| 
 | ||||
| #ifndef OVERRIDE_clt_mdct_backward | ||||
| void clt_mdct_backward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|       const opus_val16 * OPUS_RESTRICT window, int overlap, int shift, int stride) | ||||
| void clt_mdct_backward_c(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|       const opus_val16 * OPUS_RESTRICT window, int overlap, int shift, int stride, int arch) | ||||
| { | ||||
|    int i; | ||||
|    int N, N2, N4; | ||||
|    const kiss_twiddle_scalar *trig; | ||||
|    (void) arch; | ||||
| 
 | ||||
|    N = l->n; | ||||
|    trig = l->trig; | ||||
|  | @ -270,8 +270,8 @@ void clt_mdct_backward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scala | |||
|          int rev; | ||||
|          kiss_fft_scalar yr, yi; | ||||
|          rev = *bitrev++; | ||||
|          yr = S_MUL(*xp2, t[i]) + S_MUL(*xp1, t[N4+i]); | ||||
|          yi = S_MUL(*xp1, t[i]) - S_MUL(*xp2, t[N4+i]); | ||||
|          yr = ADD32_ovflw(S_MUL(*xp2, t[i]), S_MUL(*xp1, t[N4+i])); | ||||
|          yi = SUB32_ovflw(S_MUL(*xp1, t[i]), S_MUL(*xp2, t[N4+i])); | ||||
|          /* We swap real and imag because we use an FFT instead of an IFFT. */ | ||||
|          yp[2*rev+1] = yr; | ||||
|          yp[2*rev] = yi; | ||||
|  | @ -301,8 +301,8 @@ void clt_mdct_backward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scala | |||
|          t0 = t[i]; | ||||
|          t1 = t[N4+i]; | ||||
|          /* We'd scale up by 2 here, but instead it's done when mixing the windows */ | ||||
|          yr = S_MUL(re,t0) + S_MUL(im,t1); | ||||
|          yi = S_MUL(re,t1) - S_MUL(im,t0); | ||||
|          yr = ADD32_ovflw(S_MUL(re,t0), S_MUL(im,t1)); | ||||
|          yi = SUB32_ovflw(S_MUL(re,t1), S_MUL(im,t0)); | ||||
|          /* We swap real and imag because we're using an FFT instead of an IFFT. */ | ||||
|          re = yp1[1]; | ||||
|          im = yp1[0]; | ||||
|  | @ -312,8 +312,8 @@ void clt_mdct_backward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scala | |||
|          t0 = t[(N4-i-1)]; | ||||
|          t1 = t[(N2-i-1)]; | ||||
|          /* We'd scale up by 2 here, but instead it's done when mixing the windows */ | ||||
|          yr = S_MUL(re,t0) + S_MUL(im,t1); | ||||
|          yi = S_MUL(re,t1) - S_MUL(im,t0); | ||||
|          yr = ADD32_ovflw(S_MUL(re,t0), S_MUL(im,t1)); | ||||
|          yi = SUB32_ovflw(S_MUL(re,t1), S_MUL(im,t0)); | ||||
|          yp1[0] = yr; | ||||
|          yp0[1] = yi; | ||||
|          yp0 += 2; | ||||
|  | @ -333,8 +333,8 @@ void clt_mdct_backward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scala | |||
|          kiss_fft_scalar x1, x2; | ||||
|          x1 = *xp1; | ||||
|          x2 = *yp1; | ||||
|          *yp1++ = MULT16_32_Q15(*wp2, x2) - MULT16_32_Q15(*wp1, x1); | ||||
|          *xp1-- = MULT16_32_Q15(*wp1, x2) + MULT16_32_Q15(*wp2, x1); | ||||
|          *yp1++ = SUB32_ovflw(MULT16_32_Q15(*wp2, x2), MULT16_32_Q15(*wp1, x1)); | ||||
|          *xp1-- = ADD32_ovflw(MULT16_32_Q15(*wp1, x2), MULT16_32_Q15(*wp2, x1)); | ||||
|          wp1++; | ||||
|          wp2--; | ||||
|       } | ||||
|  |  | |||
|  | @ -53,18 +53,60 @@ typedef struct { | |||
|    const kiss_twiddle_scalar * OPUS_RESTRICT trig; | ||||
| } mdct_lookup; | ||||
| 
 | ||||
| int clt_mdct_init(mdct_lookup *l,int N, int maxshift); | ||||
| void clt_mdct_clear(mdct_lookup *l); | ||||
| #if defined(HAVE_ARM_NE10) | ||||
| #include "arm/mdct_arm.h" | ||||
| #endif | ||||
| 
 | ||||
| 
 | ||||
| int clt_mdct_init(mdct_lookup *l,int N, int maxshift, int arch); | ||||
| void clt_mdct_clear(mdct_lookup *l, int arch); | ||||
| 
 | ||||
| /** Compute a forward MDCT and scale by 4/N, trashes the input array */ | ||||
| void clt_mdct_forward(const mdct_lookup *l, kiss_fft_scalar *in, | ||||
|       kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|       const opus_val16 *window, int overlap, int shift, int stride); | ||||
| void clt_mdct_forward_c(const mdct_lookup *l, kiss_fft_scalar *in, | ||||
|                         kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|                         const opus_val16 *window, int overlap, | ||||
|                         int shift, int stride, int arch); | ||||
| 
 | ||||
| /** Compute a backward MDCT (no scaling) and performs weighted overlap-add
 | ||||
|     (scales implicitly by 1/2) */ | ||||
| void clt_mdct_backward(const mdct_lookup *l, kiss_fft_scalar *in, | ||||
| void clt_mdct_backward_c(const mdct_lookup *l, kiss_fft_scalar *in, | ||||
|       kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|       const opus_val16 * OPUS_RESTRICT window, int overlap, int shift, int stride); | ||||
|       const opus_val16 * OPUS_RESTRICT window, | ||||
|       int overlap, int shift, int stride, int arch); | ||||
| 
 | ||||
| #if !defined(OVERRIDE_OPUS_MDCT) | ||||
| /* Is run-time CPU detection enabled on this platform? */ | ||||
| #if defined(OPUS_HAVE_RTCD) && defined(HAVE_ARM_NE10) | ||||
| 
 | ||||
| extern void (*const CLT_MDCT_FORWARD_IMPL[OPUS_ARCHMASK+1])( | ||||
|       const mdct_lookup *l, kiss_fft_scalar *in, | ||||
|       kiss_fft_scalar * OPUS_RESTRICT out, const opus_val16 *window, | ||||
|       int overlap, int shift, int stride, int arch); | ||||
| 
 | ||||
| #define clt_mdct_forward(_l, _in, _out, _window, _overlap, _shift, _stride, _arch) \ | ||||
|    ((*CLT_MDCT_FORWARD_IMPL[(arch)&OPUS_ARCHMASK])(_l, _in, _out, \ | ||||
|                                                    _window, _overlap, _shift, \ | ||||
|                                                    _stride, _arch)) | ||||
| 
 | ||||
| extern void (*const CLT_MDCT_BACKWARD_IMPL[OPUS_ARCHMASK+1])( | ||||
|       const mdct_lookup *l, kiss_fft_scalar *in, | ||||
|       kiss_fft_scalar * OPUS_RESTRICT out, const opus_val16 *window, | ||||
|       int overlap, int shift, int stride, int arch); | ||||
| 
 | ||||
| #define clt_mdct_backward(_l, _in, _out, _window, _overlap, _shift, _stride, _arch) \ | ||||
|    (*CLT_MDCT_BACKWARD_IMPL[(arch)&OPUS_ARCHMASK])(_l, _in, _out, \ | ||||
|                                                    _window, _overlap, _shift, \ | ||||
|                                                    _stride, _arch) | ||||
| 
 | ||||
| #else /* if defined(OPUS_HAVE_RTCD) && defined(HAVE_ARM_NE10) */ | ||||
| 
 | ||||
| #define clt_mdct_forward(_l, _in, _out, _window, _overlap, _shift, _stride, _arch) \ | ||||
|    clt_mdct_forward_c(_l, _in, _out, _window, _overlap, _shift, _stride, _arch) | ||||
| 
 | ||||
| #define clt_mdct_backward(_l, _in, _out, _window, _overlap, _shift, _stride, _arch) \ | ||||
|    clt_mdct_backward_c(_l, _in, _out, _window, _overlap, _shift, _stride, _arch) | ||||
| 
 | ||||
| #endif /* end if defined(OPUS_HAVE_RTCD) && defined(HAVE_ARM_NE10) && !defined(FIXED_POINT) */ | ||||
| #endif /* end if !defined(OVERRIDE_OPUS_MDCT) */ | ||||
| 
 | ||||
| #endif | ||||
|  |  | |||
							
								
								
									
										151
									
								
								lib/rbcodec/codecs/libopus/celt/mips/celt_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										151
									
								
								lib/rbcodec/codecs/libopus/celt/mips/celt_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,151 @@ | |||
| /* Copyright (c) 2007-2008 CSIRO
 | ||||
|    Copyright (c) 2007-2010 Xiph.Org Foundation | ||||
|    Copyright (c) 2008 Gregory Maxwell | ||||
|    Written by Jean-Marc Valin and Gregory Maxwell */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef __CELT_MIPSR1_H__ | ||||
| #define __CELT_MIPSR1_H__ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #define CELT_C | ||||
| 
 | ||||
| #include "os_support.h" | ||||
| #include "mdct.h" | ||||
| #include <math.h> | ||||
| #include "celt.h" | ||||
| #include "pitch.h" | ||||
| #include "bands.h" | ||||
| #include "modes.h" | ||||
| #include "entcode.h" | ||||
| #include "quant_bands.h" | ||||
| #include "rate.h" | ||||
| #include "stack_alloc.h" | ||||
| #include "mathops.h" | ||||
| #include "float_cast.h" | ||||
| #include <stdarg.h> | ||||
| #include "celt_lpc.h" | ||||
| #include "vq.h" | ||||
| 
 | ||||
| #define OVERRIDE_comb_filter | ||||
| void comb_filter(opus_val32 *y, opus_val32 *x, int T0, int T1, int N, | ||||
|       opus_val16 g0, opus_val16 g1, int tapset0, int tapset1, | ||||
|       const opus_val16 *window, int overlap, int arch) | ||||
| { | ||||
|    int i; | ||||
|    opus_val32 x0, x1, x2, x3, x4; | ||||
| 
 | ||||
|    (void)arch; | ||||
| 
 | ||||
|    /* printf ("%d %d %f %f\n", T0, T1, g0, g1); */ | ||||
|    opus_val16 g00, g01, g02, g10, g11, g12; | ||||
|    static const opus_val16 gains[3][3] = { | ||||
|          {QCONST16(0.3066406250f, 15), QCONST16(0.2170410156f, 15), QCONST16(0.1296386719f, 15)}, | ||||
|          {QCONST16(0.4638671875f, 15), QCONST16(0.2680664062f, 15), QCONST16(0.f, 15)}, | ||||
|          {QCONST16(0.7998046875f, 15), QCONST16(0.1000976562f, 15), QCONST16(0.f, 15)}}; | ||||
| 
 | ||||
|    if (g0==0 && g1==0) | ||||
|    { | ||||
|       /* OPT: Happens to work without the OPUS_MOVE(), but only because the current encoder already copies x to y */ | ||||
|       if (x!=y) | ||||
|          OPUS_MOVE(y, x, N); | ||||
|       return; | ||||
|    } | ||||
| 
 | ||||
|    g00 = MULT16_16_P15(g0, gains[tapset0][0]); | ||||
|    g01 = MULT16_16_P15(g0, gains[tapset0][1]); | ||||
|    g02 = MULT16_16_P15(g0, gains[tapset0][2]); | ||||
|    g10 = MULT16_16_P15(g1, gains[tapset1][0]); | ||||
|    g11 = MULT16_16_P15(g1, gains[tapset1][1]); | ||||
|    g12 = MULT16_16_P15(g1, gains[tapset1][2]); | ||||
|    x1 = x[-T1+1]; | ||||
|    x2 = x[-T1  ]; | ||||
|    x3 = x[-T1-1]; | ||||
|    x4 = x[-T1-2]; | ||||
|    /* If the filter didn't change, we don't need the overlap */ | ||||
|    if (g0==g1 && T0==T1 && tapset0==tapset1) | ||||
|       overlap=0; | ||||
| 
 | ||||
|    for (i=0;i<overlap;i++) | ||||
|    { | ||||
|       opus_val16 f; | ||||
|       opus_val32 res; | ||||
|       f = MULT16_16_Q15(window[i],window[i]); | ||||
|       x0= x[i-T1+2]; | ||||
| 
 | ||||
|       asm volatile("MULT $ac1, %0, %1" : : "r" ((int)MULT16_16_Q15((Q15ONE-f),g00)), "r" ((int)x[i-T0])); | ||||
| 
 | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)MULT16_16_Q15((Q15ONE-f),g01)), "r" ((int)ADD32(x[i-T0-1],x[i-T0+1]))); | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)MULT16_16_Q15((Q15ONE-f),g02)), "r" ((int)ADD32(x[i-T0-2],x[i-T0+2]))); | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)MULT16_16_Q15(f,g10)), "r" ((int)x2)); | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)MULT16_16_Q15(f,g11)), "r" ((int)ADD32(x3,x1))); | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)MULT16_16_Q15(f,g12)), "r" ((int)ADD32(x4,x0))); | ||||
| 
 | ||||
|       asm volatile("EXTR.W %0,$ac1, %1" : "=r" (res): "i" (15)); | ||||
| 
 | ||||
|       y[i] = x[i] + res; | ||||
| 
 | ||||
|       x4=x3; | ||||
|       x3=x2; | ||||
|       x2=x1; | ||||
|       x1=x0; | ||||
|    } | ||||
| 
 | ||||
|    x4 = x[i-T1-2]; | ||||
|    x3 = x[i-T1-1]; | ||||
|    x2 = x[i-T1]; | ||||
|    x1 = x[i-T1+1]; | ||||
| 
 | ||||
|    if (g1==0) | ||||
|    { | ||||
|       /* OPT: Happens to work without the OPUS_MOVE(), but only because the current encoder already copies x to y */ | ||||
|       if (x!=y) | ||||
|          OPUS_MOVE(y+overlap, x+overlap, N-overlap); | ||||
|       return; | ||||
|    } | ||||
| 
 | ||||
|    for (i=overlap;i<N;i++) | ||||
|    { | ||||
|       opus_val32 res; | ||||
|       x0=x[i-T1+2]; | ||||
| 
 | ||||
|       asm volatile("MULT $ac1, %0, %1" : : "r" ((int)g10), "r" ((int)x2)); | ||||
| 
 | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)g11), "r" ((int)ADD32(x3,x1))); | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)g12), "r" ((int)ADD32(x4,x0))); | ||||
|       asm volatile("EXTR.W %0,$ac1, %1" : "=r" (res): "i" (15)); | ||||
|       y[i] = x[i] + res; | ||||
|       x4=x3; | ||||
|       x3=x2; | ||||
|       x2=x1; | ||||
|       x1=x0; | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| #endif /* __CELT_MIPSR1_H__ */ | ||||
							
								
								
									
										126
									
								
								lib/rbcodec/codecs/libopus/celt/mips/fixed_generic_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										126
									
								
								lib/rbcodec/codecs/libopus/celt/mips/fixed_generic_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,126 @@ | |||
| /* Copyright (C) 2007-2009 Xiph.Org Foundation
 | ||||
|    Copyright (C) 2003-2008 Jean-Marc Valin | ||||
|    Copyright (C) 2007-2008 CSIRO */ | ||||
| /**
 | ||||
|    @file fixed_generic.h | ||||
|    @brief Generic fixed-point operations | ||||
| */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef CELT_FIXED_GENERIC_MIPSR1_H | ||||
| #define CELT_FIXED_GENERIC_MIPSR1_H | ||||
| 
 | ||||
| #undef MULT16_32_Q15_ADD | ||||
| static inline int MULT16_32_Q15_ADD(int a, int b, int c, int d) { | ||||
|     int m; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a), "r" ((int)b)); | ||||
|     asm volatile("madd $ac1, %0, %1" : : "r" ((int)c), "r" ((int)d)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m): "i" (15)); | ||||
|     return m; | ||||
| } | ||||
| 
 | ||||
| #undef MULT16_32_Q15_SUB | ||||
| static inline int MULT16_32_Q15_SUB(int a, int b, int c, int d) { | ||||
|     int m; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a), "r" ((int)b)); | ||||
|     asm volatile("msub $ac1, %0, %1" : : "r" ((int)c), "r" ((int)d)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m): "i" (15)); | ||||
|     return m; | ||||
| } | ||||
| 
 | ||||
| #undef MULT16_16_Q15_ADD | ||||
| static inline int MULT16_16_Q15_ADD(int a, int b, int c, int d) { | ||||
|     int m; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a), "r" ((int)b)); | ||||
|     asm volatile("madd $ac1, %0, %1" : : "r" ((int)c), "r" ((int)d)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m): "i" (15)); | ||||
|     return m; | ||||
| } | ||||
| 
 | ||||
| #undef MULT16_16_Q15_SUB | ||||
| static inline int MULT16_16_Q15_SUB(int a, int b, int c, int d) { | ||||
|     int m; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a), "r" ((int)b)); | ||||
|     asm volatile("msub $ac1, %0, %1" : : "r" ((int)c), "r" ((int)d)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m): "i" (15)); | ||||
|     return m; | ||||
| } | ||||
| 
 | ||||
| 
 | ||||
| #undef MULT16_32_Q16 | ||||
| static inline int MULT16_32_Q16(int a, int b) | ||||
| { | ||||
|     int c; | ||||
|     asm volatile("MULT $ac1,%0, %1" : : "r" (a), "r" (b)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (c): "i" (16)); | ||||
|     return c; | ||||
| } | ||||
| 
 | ||||
| #undef MULT16_32_P16 | ||||
| static inline int MULT16_32_P16(int a, int b) | ||||
| { | ||||
|     int c; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" (a), "r" (b)); | ||||
|     asm volatile("EXTR_R.W %0,$ac1, %1" : "=r" (c): "i" (16)); | ||||
|     return c; | ||||
| } | ||||
| 
 | ||||
| #undef MULT16_32_Q15 | ||||
| static inline int MULT16_32_Q15(int a, int b) | ||||
| { | ||||
|     int c; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" (a), "r" (b)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (c): "i" (15)); | ||||
|     return c; | ||||
| } | ||||
| 
 | ||||
| #undef MULT32_32_Q31 | ||||
| static inline int MULT32_32_Q31(int a, int b) | ||||
| { | ||||
|     int r; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" (a), "r" (b)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (r): "i" (31)); | ||||
|     return r; | ||||
| } | ||||
| 
 | ||||
| #undef PSHR32 | ||||
| static inline int PSHR32(int a, int shift) | ||||
| { | ||||
|     int r; | ||||
|     asm volatile ("SHRAV_R.W %0, %1, %2" :"=r" (r): "r" (a), "r" (shift)); | ||||
|     return r; | ||||
| } | ||||
| 
 | ||||
| #undef MULT16_16_P15 | ||||
| static inline int MULT16_16_P15(int a, int b) | ||||
| { | ||||
|     int r; | ||||
|     asm volatile ("mul %0, %1, %2" :"=r" (r): "r" (a), "r" (b)); | ||||
|     asm volatile ("SHRA_R.W %0, %1, %2" : "+r" (r):  "0" (r), "i"(15)); | ||||
|     return r; | ||||
| } | ||||
| 
 | ||||
| #endif /* CELT_FIXED_GENERIC_MIPSR1_H */ | ||||
							
								
								
									
										167
									
								
								lib/rbcodec/codecs/libopus/celt/mips/kiss_fft_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										167
									
								
								lib/rbcodec/codecs/libopus/celt/mips/kiss_fft_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,167 @@ | |||
| /*Copyright (c) 2013, Xiph.Org Foundation and contributors.
 | ||||
| 
 | ||||
|   All rights reserved. | ||||
| 
 | ||||
|   Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions are met: | ||||
| 
 | ||||
|     * Redistributions of source code must retain the above copyright notice, | ||||
|        this list of conditions and the following disclaimer. | ||||
|     * Redistributions in binary form must reproduce the above copyright notice, | ||||
|        this list of conditions and the following disclaimer in the | ||||
|        documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||
|   AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||
|   IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||
|   ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE | ||||
|   LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||
|   CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||
|   SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||
|   INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||
|   CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||
|   ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||
|   POSSIBILITY OF SUCH DAMAGE.*/ | ||||
| 
 | ||||
| #ifndef KISS_FFT_MIPSR1_H | ||||
| #define KISS_FFT_MIPSR1_H | ||||
| 
 | ||||
| #if !defined(KISS_FFT_GUTS_H) | ||||
| #error "This file should only be included from _kiss_fft_guts.h" | ||||
| #endif | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
| 
 | ||||
| #define S_MUL_ADD(a, b, c, d) (S_MUL(a,b)+S_MUL(c,d)) | ||||
| #define S_MUL_SUB(a, b, c, d) (S_MUL(a,b)-S_MUL(c,d)) | ||||
| 
 | ||||
| #undef S_MUL_ADD | ||||
| static inline int S_MUL_ADD(int a, int b, int c, int d) { | ||||
|     int m; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a), "r" ((int)b)); | ||||
|     asm volatile("madd $ac1, %0, %1" : : "r" ((int)c), "r" ((int)d)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m): "i" (15)); | ||||
|     return m; | ||||
| } | ||||
| 
 | ||||
| #undef S_MUL_SUB | ||||
| static inline int S_MUL_SUB(int a, int b, int c, int d) { | ||||
|     int m; | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a), "r" ((int)b)); | ||||
|     asm volatile("msub $ac1, %0, %1" : : "r" ((int)c), "r" ((int)d)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m): "i" (15)); | ||||
|     return m; | ||||
| } | ||||
| 
 | ||||
| #undef C_MUL | ||||
| #   define C_MUL(m,a,b) (m=C_MUL_fun(a,b)) | ||||
| static inline kiss_fft_cpx C_MUL_fun(kiss_fft_cpx a, kiss_twiddle_cpx b) { | ||||
|     kiss_fft_cpx m; | ||||
| 
 | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a.r), "r" ((int)b.r)); | ||||
|     asm volatile("msub $ac1, %0, %1" : : "r" ((int)a.i), "r" ((int)b.i)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m.r): "i" (15)); | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a.r), "r" ((int)b.i)); | ||||
|     asm volatile("madd $ac1, %0, %1" : : "r" ((int)a.i), "r" ((int)b.r)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m.i): "i" (15)); | ||||
| 
 | ||||
|     return m; | ||||
| } | ||||
| #undef C_MULC | ||||
| #   define C_MULC(m,a,b) (m=C_MULC_fun(a,b)) | ||||
| static inline kiss_fft_cpx C_MULC_fun(kiss_fft_cpx a, kiss_twiddle_cpx b) { | ||||
|     kiss_fft_cpx m; | ||||
| 
 | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a.r), "r" ((int)b.r)); | ||||
|     asm volatile("madd $ac1, %0, %1" : : "r" ((int)a.i), "r" ((int)b.i)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m.r): "i" (15)); | ||||
|     asm volatile("MULT $ac1, %0, %1" : : "r" ((int)a.i), "r" ((int)b.r)); | ||||
|     asm volatile("msub $ac1, %0, %1" : : "r" ((int)a.r), "r" ((int)b.i)); | ||||
|     asm volatile("EXTR.W %0,$ac1, %1" : "=r" (m.i): "i" (15)); | ||||
| 
 | ||||
|     return m; | ||||
| } | ||||
| 
 | ||||
| #endif /* FIXED_POINT */ | ||||
| 
 | ||||
| #define OVERRIDE_kf_bfly5 | ||||
| static void kf_bfly5( | ||||
|                      kiss_fft_cpx * Fout, | ||||
|                      const size_t fstride, | ||||
|                      const kiss_fft_state *st, | ||||
|                      int m, | ||||
|                      int N, | ||||
|                      int mm | ||||
|                     ) | ||||
| { | ||||
|    kiss_fft_cpx *Fout0,*Fout1,*Fout2,*Fout3,*Fout4; | ||||
|    int i, u; | ||||
|    kiss_fft_cpx scratch[13]; | ||||
| 
 | ||||
|    const kiss_twiddle_cpx *tw; | ||||
|    kiss_twiddle_cpx ya,yb; | ||||
|    kiss_fft_cpx * Fout_beg = Fout; | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
|    ya.r = 10126; | ||||
|    ya.i = -31164; | ||||
|    yb.r = -26510; | ||||
|    yb.i = -19261; | ||||
| #else | ||||
|    ya = st->twiddles[fstride*m]; | ||||
|    yb = st->twiddles[fstride*2*m]; | ||||
| #endif | ||||
| 
 | ||||
|    tw=st->twiddles; | ||||
| 
 | ||||
|    for (i=0;i<N;i++) | ||||
|    { | ||||
|       Fout = Fout_beg + i*mm; | ||||
|       Fout0=Fout; | ||||
|       Fout1=Fout0+m; | ||||
|       Fout2=Fout0+2*m; | ||||
|       Fout3=Fout0+3*m; | ||||
|       Fout4=Fout0+4*m; | ||||
| 
 | ||||
|       /* For non-custom modes, m is guaranteed to be a multiple of 4. */ | ||||
|       for ( u=0; u<m; ++u ) { | ||||
|          scratch[0] = *Fout0; | ||||
| 
 | ||||
| 
 | ||||
|          C_MUL(scratch[1] ,*Fout1, tw[u*fstride]); | ||||
|          C_MUL(scratch[2] ,*Fout2, tw[2*u*fstride]); | ||||
|          C_MUL(scratch[3] ,*Fout3, tw[3*u*fstride]); | ||||
|          C_MUL(scratch[4] ,*Fout4, tw[4*u*fstride]); | ||||
| 
 | ||||
|          C_ADD( scratch[7],scratch[1],scratch[4]); | ||||
|          C_SUB( scratch[10],scratch[1],scratch[4]); | ||||
|          C_ADD( scratch[8],scratch[2],scratch[3]); | ||||
|          C_SUB( scratch[9],scratch[2],scratch[3]); | ||||
| 
 | ||||
|          Fout0->r += scratch[7].r + scratch[8].r; | ||||
|          Fout0->i += scratch[7].i + scratch[8].i; | ||||
|          scratch[5].r = scratch[0].r + S_MUL_ADD(scratch[7].r,ya.r,scratch[8].r,yb.r); | ||||
|          scratch[5].i = scratch[0].i + S_MUL_ADD(scratch[7].i,ya.r,scratch[8].i,yb.r); | ||||
| 
 | ||||
|          scratch[6].r =  S_MUL_ADD(scratch[10].i,ya.i,scratch[9].i,yb.i); | ||||
|          scratch[6].i =  -S_MUL_ADD(scratch[10].r,ya.i,scratch[9].r,yb.i); | ||||
| 
 | ||||
|          C_SUB(*Fout1,scratch[5],scratch[6]); | ||||
|          C_ADD(*Fout4,scratch[5],scratch[6]); | ||||
| 
 | ||||
|          scratch[11].r = scratch[0].r + S_MUL_ADD(scratch[7].r,yb.r,scratch[8].r,ya.r); | ||||
|          scratch[11].i = scratch[0].i + S_MUL_ADD(scratch[7].i,yb.r,scratch[8].i,ya.r); | ||||
| 
 | ||||
|          scratch[12].r =  S_MUL_SUB(scratch[9].i,ya.i,scratch[10].i,yb.i); | ||||
|          scratch[12].i =  S_MUL_SUB(scratch[10].r,yb.i,scratch[9].r,ya.i); | ||||
| 
 | ||||
|          C_ADD(*Fout2,scratch[11],scratch[12]); | ||||
|          C_SUB(*Fout3,scratch[11],scratch[12]); | ||||
| 
 | ||||
|          ++Fout0;++Fout1;++Fout2;++Fout3;++Fout4; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| 
 | ||||
| #endif /* KISS_FFT_MIPSR1_H */ | ||||
							
								
								
									
										288
									
								
								lib/rbcodec/codecs/libopus/celt/mips/mdct_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										288
									
								
								lib/rbcodec/codecs/libopus/celt/mips/mdct_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,288 @@ | |||
| /* Copyright (c) 2007-2008 CSIRO
 | ||||
|    Copyright (c) 2007-2008 Xiph.Org Foundation | ||||
|    Written by Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| /* This is a simple MDCT implementation that uses a N/4 complex FFT
 | ||||
|    to do most of the work. It should be relatively straightforward to | ||||
|    plug in pretty much and FFT here. | ||||
| 
 | ||||
|    This replaces the Vorbis FFT (and uses the exact same API), which | ||||
|    was a bit too messy and that was ending up duplicating code | ||||
|    (might as well use the same FFT everywhere). | ||||
| 
 | ||||
|    The algorithm is similar to (and inspired from) Fabrice Bellard's | ||||
|    MDCT implementation in FFMPEG, but has differences in signs, ordering | ||||
|    and scaling in many places. | ||||
| */ | ||||
| #ifndef __MDCT_MIPSR1_H__ | ||||
| #define __MDCT_MIPSR1_H__ | ||||
| 
 | ||||
| #ifndef SKIP_CONFIG_H | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| #endif | ||||
| 
 | ||||
| #include "mdct.h" | ||||
| #include "kiss_fft.h" | ||||
| #include "_kiss_fft_guts.h" | ||||
| #include <math.h> | ||||
| #include "os_support.h" | ||||
| #include "mathops.h" | ||||
| #include "stack_alloc.h" | ||||
| 
 | ||||
| /* Forward MDCT trashes the input array */ | ||||
| #define OVERRIDE_clt_mdct_forward | ||||
| void clt_mdct_forward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|       const opus_val16 *window, int overlap, int shift, int stride, int arch) | ||||
| { | ||||
|    int i; | ||||
|    int N, N2, N4; | ||||
|    VARDECL(kiss_fft_scalar, f); | ||||
|    VARDECL(kiss_fft_cpx, f2); | ||||
|    const kiss_fft_state *st = l->kfft[shift]; | ||||
|    const kiss_twiddle_scalar *trig; | ||||
|    opus_val16 scale; | ||||
| #ifdef FIXED_POINT | ||||
|    /* Allows us to scale with MULT16_32_Q16(), which is faster than
 | ||||
|       MULT16_32_Q15() on ARM. */ | ||||
|    int scale_shift = st->scale_shift-1; | ||||
| #endif | ||||
| 
 | ||||
|     (void)arch; | ||||
| 
 | ||||
|    SAVE_STACK; | ||||
|    scale = st->scale; | ||||
| 
 | ||||
|    N = l->n; | ||||
|    trig = l->trig; | ||||
|    for (i=0;i<shift;i++) | ||||
|    { | ||||
|       N >>= 1; | ||||
|       trig += N; | ||||
|    } | ||||
|    N2 = N>>1; | ||||
|    N4 = N>>2; | ||||
| 
 | ||||
|    ALLOC(f, N2, kiss_fft_scalar); | ||||
|    ALLOC(f2, N4, kiss_fft_cpx); | ||||
| 
 | ||||
|    /* Consider the input to be composed of four blocks: [a, b, c, d] */ | ||||
|    /* Window, shuffle, fold */ | ||||
|    { | ||||
|       /* Temp pointers to make it really clear to the compiler what we're doing */ | ||||
|       const kiss_fft_scalar * OPUS_RESTRICT xp1 = in+(overlap>>1); | ||||
|       const kiss_fft_scalar * OPUS_RESTRICT xp2 = in+N2-1+(overlap>>1); | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp = f; | ||||
|       const opus_val16 * OPUS_RESTRICT wp1 = window+(overlap>>1); | ||||
|       const opus_val16 * OPUS_RESTRICT wp2 = window+(overlap>>1)-1; | ||||
|       for(i=0;i<((overlap+3)>>2);i++) | ||||
|       { | ||||
|          /* Real part arranged as -d-cR, Imag part arranged as -b+aR*/ | ||||
|           *yp++ = S_MUL_ADD(*wp2, xp1[N2],*wp1,*xp2); | ||||
|           *yp++ = S_MUL_SUB(*wp1, *xp1,*wp2, xp2[-N2]); | ||||
|          xp1+=2; | ||||
|          xp2-=2; | ||||
|          wp1+=2; | ||||
|          wp2-=2; | ||||
|       } | ||||
|       wp1 = window; | ||||
|       wp2 = window+overlap-1; | ||||
|       for(;i<N4-((overlap+3)>>2);i++) | ||||
|       { | ||||
|          /* Real part arranged as a-bR, Imag part arranged as -c-dR */ | ||||
|          *yp++ = *xp2; | ||||
|          *yp++ = *xp1; | ||||
|          xp1+=2; | ||||
|          xp2-=2; | ||||
|       } | ||||
|       for(;i<N4;i++) | ||||
|       { | ||||
|          /* Real part arranged as a-bR, Imag part arranged as -c-dR */ | ||||
|           *yp++ =  S_MUL_SUB(*wp2, *xp2, *wp1, xp1[-N2]); | ||||
|           *yp++ = S_MUL_ADD(*wp2, *xp1, *wp1, xp2[N2]); | ||||
|          xp1+=2; | ||||
|          xp2-=2; | ||||
|          wp1+=2; | ||||
|          wp2-=2; | ||||
|       } | ||||
|    } | ||||
|    /* Pre-rotation */ | ||||
|    { | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp = f; | ||||
|       const kiss_twiddle_scalar *t = &trig[0]; | ||||
|       for(i=0;i<N4;i++) | ||||
|       { | ||||
|          kiss_fft_cpx yc; | ||||
|          kiss_twiddle_scalar t0, t1; | ||||
|          kiss_fft_scalar re, im, yr, yi; | ||||
|          t0 = t[i]; | ||||
|          t1 = t[N4+i]; | ||||
|          re = *yp++; | ||||
|          im = *yp++; | ||||
| 
 | ||||
|          yr = S_MUL_SUB(re,t0,im,t1); | ||||
|          yi = S_MUL_ADD(im,t0,re,t1); | ||||
| 
 | ||||
|          yc.r = yr; | ||||
|          yc.i = yi; | ||||
|          yc.r = PSHR32(MULT16_32_Q16(scale, yc.r), scale_shift); | ||||
|          yc.i = PSHR32(MULT16_32_Q16(scale, yc.i), scale_shift); | ||||
|          f2[st->bitrev[i]] = yc; | ||||
|       } | ||||
|    } | ||||
| 
 | ||||
|    /* N/4 complex FFT, does not downscale anymore */ | ||||
|    opus_fft_impl(st, f2); | ||||
| 
 | ||||
|    /* Post-rotate */ | ||||
|    { | ||||
|       /* Temp pointers to make it really clear to the compiler what we're doing */ | ||||
|       const kiss_fft_cpx * OPUS_RESTRICT fp = f2; | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp1 = out; | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp2 = out+stride*(N2-1); | ||||
|       const kiss_twiddle_scalar *t = &trig[0]; | ||||
|       /* Temp pointers to make it really clear to the compiler what we're doing */ | ||||
|       for(i=0;i<N4;i++) | ||||
|       { | ||||
|          kiss_fft_scalar yr, yi; | ||||
|          yr = S_MUL_SUB(fp->i,t[N4+i] , fp->r,t[i]); | ||||
|          yi = S_MUL_ADD(fp->r,t[N4+i] ,fp->i,t[i]); | ||||
|          *yp1 = yr; | ||||
|          *yp2 = yi; | ||||
|          fp++; | ||||
|          yp1 += 2*stride; | ||||
|          yp2 -= 2*stride; | ||||
|       } | ||||
|    } | ||||
|    RESTORE_STACK; | ||||
| } | ||||
| 
 | ||||
| #define OVERRIDE_clt_mdct_backward | ||||
| void clt_mdct_backward(const mdct_lookup *l, kiss_fft_scalar *in, kiss_fft_scalar * OPUS_RESTRICT out, | ||||
|       const opus_val16 * OPUS_RESTRICT window, int overlap, int shift, int stride, int arch) | ||||
| { | ||||
|    int i; | ||||
|    int N, N2, N4; | ||||
|    const kiss_twiddle_scalar *trig; | ||||
| 
 | ||||
|     (void)arch; | ||||
| 
 | ||||
|    N = l->n; | ||||
|    trig = l->trig; | ||||
|    for (i=0;i<shift;i++) | ||||
|    { | ||||
|       N >>= 1; | ||||
|       trig += N; | ||||
|    } | ||||
|    N2 = N>>1; | ||||
|    N4 = N>>2; | ||||
| 
 | ||||
|    /* Pre-rotate */ | ||||
|    { | ||||
|       /* Temp pointers to make it really clear to the compiler what we're doing */ | ||||
|       const kiss_fft_scalar * OPUS_RESTRICT xp1 = in; | ||||
|       const kiss_fft_scalar * OPUS_RESTRICT xp2 = in+stride*(N2-1); | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp = out+(overlap>>1); | ||||
|       const kiss_twiddle_scalar * OPUS_RESTRICT t = &trig[0]; | ||||
|       const opus_int16 * OPUS_RESTRICT bitrev = l->kfft[shift]->bitrev; | ||||
|       for(i=0;i<N4;i++) | ||||
|       { | ||||
|          int rev; | ||||
|          kiss_fft_scalar yr, yi; | ||||
|          rev = *bitrev++; | ||||
|          yr = S_MUL_ADD(*xp2, t[i] , *xp1, t[N4+i]); | ||||
|          yi = S_MUL_SUB(*xp1, t[i] , *xp2, t[N4+i]); | ||||
|          /* We swap real and imag because we use an FFT instead of an IFFT. */ | ||||
|          yp[2*rev+1] = yr; | ||||
|          yp[2*rev] = yi; | ||||
|          /* Storing the pre-rotation directly in the bitrev order. */ | ||||
|          xp1+=2*stride; | ||||
|          xp2-=2*stride; | ||||
|       } | ||||
|    } | ||||
| 
 | ||||
|    opus_fft_impl(l->kfft[shift], (kiss_fft_cpx*)(out+(overlap>>1))); | ||||
| 
 | ||||
|    /* Post-rotate and de-shuffle from both ends of the buffer at once to make
 | ||||
|       it in-place. */ | ||||
|    { | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp0 = out+(overlap>>1); | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp1 = out+(overlap>>1)+N2-2; | ||||
|       const kiss_twiddle_scalar *t = &trig[0]; | ||||
|       /* Loop to (N4+1)>>1 to handle odd N4. When N4 is odd, the
 | ||||
|          middle pair will be computed twice. */ | ||||
|       for(i=0;i<(N4+1)>>1;i++) | ||||
|       { | ||||
|          kiss_fft_scalar re, im, yr, yi; | ||||
|          kiss_twiddle_scalar t0, t1; | ||||
|          /* We swap real and imag because we're using an FFT instead of an IFFT. */ | ||||
|          re = yp0[1]; | ||||
|          im = yp0[0]; | ||||
|          t0 = t[i]; | ||||
|          t1 = t[N4+i]; | ||||
|          /* We'd scale up by 2 here, but instead it's done when mixing the windows */ | ||||
|          yr = S_MUL_ADD(re,t0 , im,t1); | ||||
|          yi = S_MUL_SUB(re,t1 , im,t0); | ||||
|          /* We swap real and imag because we're using an FFT instead of an IFFT. */ | ||||
|          re = yp1[1]; | ||||
|          im = yp1[0]; | ||||
|          yp0[0] = yr; | ||||
|          yp1[1] = yi; | ||||
| 
 | ||||
|          t0 = t[(N4-i-1)]; | ||||
|          t1 = t[(N2-i-1)]; | ||||
|          /* We'd scale up by 2 here, but instead it's done when mixing the windows */ | ||||
|          yr = S_MUL_ADD(re,t0,im,t1); | ||||
|          yi = S_MUL_SUB(re,t1,im,t0); | ||||
|          yp1[0] = yr; | ||||
|          yp0[1] = yi; | ||||
|          yp0 += 2; | ||||
|          yp1 -= 2; | ||||
|       } | ||||
|    } | ||||
| 
 | ||||
|    /* Mirror on both sides for TDAC */ | ||||
|    { | ||||
|       kiss_fft_scalar * OPUS_RESTRICT xp1 = out+overlap-1; | ||||
|       kiss_fft_scalar * OPUS_RESTRICT yp1 = out; | ||||
|       const opus_val16 * OPUS_RESTRICT wp1 = window; | ||||
|       const opus_val16 * OPUS_RESTRICT wp2 = window+overlap-1; | ||||
| 
 | ||||
|       for(i = 0; i < overlap/2; i++) | ||||
|       { | ||||
|          kiss_fft_scalar x1, x2; | ||||
|          x1 = *xp1; | ||||
|          x2 = *yp1; | ||||
|          *yp1++ = MULT16_32_Q15(*wp2, x2) - MULT16_32_Q15(*wp1, x1); | ||||
|          *xp1-- = MULT16_32_Q15(*wp1, x2) + MULT16_32_Q15(*wp2, x1); | ||||
|          wp1++; | ||||
|          wp2--; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| #endif /* __MDCT_MIPSR1_H__ */ | ||||
							
								
								
									
										161
									
								
								lib/rbcodec/codecs/libopus/celt/mips/pitch_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										161
									
								
								lib/rbcodec/codecs/libopus/celt/mips/pitch_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,161 @@ | |||
| /* Copyright (c) 2007-2008 CSIRO
 | ||||
|    Copyright (c) 2007-2009 Xiph.Org Foundation | ||||
|    Written by Jean-Marc Valin */ | ||||
| /**
 | ||||
|    @file pitch.h | ||||
|    @brief Pitch analysis | ||||
|  */ | ||||
| 
 | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef PITCH_MIPSR1_H | ||||
| #define PITCH_MIPSR1_H | ||||
| 
 | ||||
| #define OVERRIDE_DUAL_INNER_PROD | ||||
| static inline void dual_inner_prod(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02, | ||||
|       int N, opus_val32 *xy1, opus_val32 *xy2, int arch) | ||||
| { | ||||
|    int j; | ||||
|    opus_val32 xy01=0; | ||||
|    opus_val32 xy02=0; | ||||
| 
 | ||||
|    (void)arch; | ||||
| 
 | ||||
|    asm volatile("MULT $ac1, $0, $0"); | ||||
|    asm volatile("MULT $ac2, $0, $0"); | ||||
|    /* Compute the norm of X+Y and X-Y as |X|^2 + |Y|^2 +/- sum(xy) */ | ||||
|    for (j=0;j<N;j++) | ||||
|    { | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)x[j]), "r" ((int)y01[j])); | ||||
|       asm volatile("MADD $ac2, %0, %1" : : "r" ((int)x[j]), "r" ((int)y02[j])); | ||||
|       ++j; | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" ((int)x[j]), "r" ((int)y01[j])); | ||||
|       asm volatile("MADD $ac2, %0, %1" : : "r" ((int)x[j]), "r" ((int)y02[j])); | ||||
|    } | ||||
|    asm volatile ("mflo %0, $ac1": "=r"(xy01)); | ||||
|    asm volatile ("mflo %0, $ac2": "=r"(xy02)); | ||||
|    *xy1 = xy01; | ||||
|    *xy2 = xy02; | ||||
| } | ||||
| 
 | ||||
| static inline void xcorr_kernel_mips(const opus_val16 * x, | ||||
|       const opus_val16 * y, opus_val32 sum[4], int len) | ||||
| { | ||||
|    int j; | ||||
|    opus_val16 y_0, y_1, y_2, y_3; | ||||
| 
 | ||||
|     opus_int64 sum_0, sum_1, sum_2, sum_3; | ||||
|     sum_0 =  (opus_int64)sum[0]; | ||||
|     sum_1 =  (opus_int64)sum[1]; | ||||
|     sum_2 =  (opus_int64)sum[2]; | ||||
|     sum_3 =  (opus_int64)sum[3]; | ||||
| 
 | ||||
|     y_3=0; /* gcc doesn't realize that y_3 can't be used uninitialized */ | ||||
|     y_0=*y++; | ||||
|     y_1=*y++; | ||||
|     y_2=*y++; | ||||
|     for (j=0;j<len-3;j+=4) | ||||
|     { | ||||
|         opus_val16 tmp; | ||||
|         tmp = *x++; | ||||
|         y_3=*y++; | ||||
| 
 | ||||
|         sum_0 = __builtin_mips_madd( sum_0, tmp, y_0); | ||||
|         sum_1 = __builtin_mips_madd( sum_1, tmp, y_1); | ||||
|         sum_2 = __builtin_mips_madd( sum_2, tmp, y_2); | ||||
|         sum_3 = __builtin_mips_madd( sum_3, tmp, y_3); | ||||
| 
 | ||||
|         tmp=*x++; | ||||
|         y_0=*y++; | ||||
| 
 | ||||
|         sum_0 = __builtin_mips_madd( sum_0, tmp, y_1 ); | ||||
|         sum_1 = __builtin_mips_madd( sum_1, tmp, y_2 ); | ||||
|         sum_2 = __builtin_mips_madd( sum_2, tmp, y_3); | ||||
|         sum_3 = __builtin_mips_madd( sum_3, tmp, y_0); | ||||
| 
 | ||||
|        tmp=*x++; | ||||
|        y_1=*y++; | ||||
| 
 | ||||
|        sum_0 = __builtin_mips_madd( sum_0, tmp, y_2 ); | ||||
|        sum_1 = __builtin_mips_madd( sum_1, tmp, y_3 ); | ||||
|        sum_2 = __builtin_mips_madd( sum_2, tmp, y_0); | ||||
|        sum_3 = __builtin_mips_madd( sum_3, tmp, y_1); | ||||
| 
 | ||||
| 
 | ||||
|       tmp=*x++; | ||||
|       y_2=*y++; | ||||
| 
 | ||||
|        sum_0 = __builtin_mips_madd( sum_0, tmp, y_3 ); | ||||
|        sum_1 = __builtin_mips_madd( sum_1, tmp, y_0 ); | ||||
|        sum_2 = __builtin_mips_madd( sum_2, tmp, y_1); | ||||
|        sum_3 = __builtin_mips_madd( sum_3, tmp, y_2); | ||||
| 
 | ||||
|    } | ||||
|    if (j++<len) | ||||
|    { | ||||
|       opus_val16 tmp = *x++; | ||||
|       y_3=*y++; | ||||
| 
 | ||||
|        sum_0 = __builtin_mips_madd( sum_0, tmp, y_0 ); | ||||
|        sum_1 = __builtin_mips_madd( sum_1, tmp, y_1 ); | ||||
|        sum_2 = __builtin_mips_madd( sum_2, tmp, y_2); | ||||
|        sum_3 = __builtin_mips_madd( sum_3, tmp, y_3); | ||||
|    } | ||||
| 
 | ||||
|    if (j++<len) | ||||
|    { | ||||
|       opus_val16 tmp=*x++; | ||||
|       y_0=*y++; | ||||
| 
 | ||||
|       sum_0 = __builtin_mips_madd( sum_0, tmp, y_1 ); | ||||
|       sum_1 = __builtin_mips_madd( sum_1, tmp, y_2 ); | ||||
|       sum_2 = __builtin_mips_madd( sum_2, tmp, y_3); | ||||
|       sum_3 = __builtin_mips_madd( sum_3, tmp, y_0); | ||||
|    } | ||||
| 
 | ||||
|    if (j<len) | ||||
|    { | ||||
|       opus_val16 tmp=*x++; | ||||
|       y_1=*y++; | ||||
| 
 | ||||
|        sum_0 = __builtin_mips_madd( sum_0, tmp, y_2 ); | ||||
|        sum_1 = __builtin_mips_madd( sum_1, tmp, y_3 ); | ||||
|        sum_2 = __builtin_mips_madd( sum_2, tmp, y_0); | ||||
|        sum_3 = __builtin_mips_madd( sum_3, tmp, y_1); | ||||
| 
 | ||||
|    } | ||||
| 
 | ||||
|    sum[0] = (opus_val32)sum_0; | ||||
|    sum[1] = (opus_val32)sum_1; | ||||
|    sum[2] = (opus_val32)sum_2; | ||||
|    sum[3] = (opus_val32)sum_3; | ||||
| } | ||||
| 
 | ||||
| #define OVERRIDE_XCORR_KERNEL | ||||
| #define xcorr_kernel(x, y, sum, len, arch) \ | ||||
|     ((void)(arch), xcorr_kernel_mips(x, y, sum, len)) | ||||
| 
 | ||||
| #endif /* PITCH_MIPSR1_H */ | ||||
							
								
								
									
										122
									
								
								lib/rbcodec/codecs/libopus/celt/mips/vq_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										122
									
								
								lib/rbcodec/codecs/libopus/celt/mips/vq_mipsr1.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,122 @@ | |||
| /* Copyright (c) 2007-2008 CSIRO
 | ||||
|    Copyright (c) 2007-2009 Xiph.Org Foundation | ||||
|    Written by Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef __VQ_MIPSR1_H__ | ||||
| #define __VQ_MIPSR1_H__ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include "mathops.h" | ||||
| #include "arch.h" | ||||
| 
 | ||||
| static void renormalise_vector_mips(celt_norm *X, int N, opus_val16 gain, int arch); | ||||
| 
 | ||||
| #define OVERRIDE_vq_exp_rotation1 | ||||
| static void exp_rotation1(celt_norm *X, int len, int stride, opus_val16 c, opus_val16 s) | ||||
| { | ||||
|    int i; | ||||
|    opus_val16 ms; | ||||
|    celt_norm *Xptr; | ||||
|    Xptr = X; | ||||
|    ms = NEG16(s); | ||||
|    for (i=0;i<len-stride;i++) | ||||
|    { | ||||
|       celt_norm x1, x2; | ||||
|       x1 = Xptr[0]; | ||||
|       x2 = Xptr[stride]; | ||||
|       Xptr[stride] = EXTRACT16(PSHR32(MAC16_16(MULT16_16(c, x2),  s, x1), 15)); | ||||
|       *Xptr++      = EXTRACT16(PSHR32(MAC16_16(MULT16_16(c, x1), ms, x2), 15)); | ||||
|    } | ||||
|    Xptr = &X[len-2*stride-1]; | ||||
|    for (i=len-2*stride-1;i>=0;i--) | ||||
|    { | ||||
|       celt_norm x1, x2; | ||||
|       x1 = Xptr[0]; | ||||
|       x2 = Xptr[stride]; | ||||
|       Xptr[stride] = EXTRACT16(PSHR32(MAC16_16(MULT16_16(c, x2),  s, x1), 15)); | ||||
|       *Xptr--      = EXTRACT16(PSHR32(MAC16_16(MULT16_16(c, x1), ms, x2), 15)); | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| #define OVERRIDE_renormalise_vector | ||||
| 
 | ||||
| #define renormalise_vector(X, N, gain, arch) \ | ||||
|  (renormalise_vector_mips(X, N, gain, arch)) | ||||
| 
 | ||||
| void renormalise_vector_mips(celt_norm *X, int N, opus_val16 gain, int arch) | ||||
| { | ||||
|    int i; | ||||
| #ifdef FIXED_POINT | ||||
|    int k; | ||||
| #endif | ||||
|    opus_val32 E = EPSILON; | ||||
|    opus_val16 g; | ||||
|    opus_val32 t; | ||||
|    celt_norm *xptr = X; | ||||
|    int X0, X1; | ||||
| 
 | ||||
|    (void)arch; | ||||
| 
 | ||||
|    asm volatile("mult $ac1, $0, $0"); | ||||
|    asm volatile("MTLO %0, $ac1" : :"r" (E)); | ||||
|    /*if(N %4)
 | ||||
|        printf("error");*/ | ||||
|    for (i=0;i<N-2;i+=2) | ||||
|    { | ||||
|       X0 = (int)*xptr++; | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" (X0), "r" (X0)); | ||||
| 
 | ||||
|       X1 = (int)*xptr++; | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" (X1), "r" (X1)); | ||||
|    } | ||||
| 
 | ||||
|    for (;i<N;i++) | ||||
|    { | ||||
|       X0 = (int)*xptr++; | ||||
|       asm volatile("MADD $ac1, %0, %1" : : "r" (X0), "r" (X0)); | ||||
|    } | ||||
| 
 | ||||
|    asm volatile("MFLO %0, $ac1" : "=r" (E)); | ||||
| #ifdef FIXED_POINT | ||||
|    k = celt_ilog2(E)>>1; | ||||
| #endif | ||||
|    t = VSHR32(E, 2*(k-7)); | ||||
|    g = MULT16_16_P15(celt_rsqrt_norm(t),gain); | ||||
| 
 | ||||
|    xptr = X; | ||||
|    for (i=0;i<N;i++) | ||||
|    { | ||||
|       *xptr = EXTRACT16(PSHR32(MULT16_16(g, *xptr), k+1)); | ||||
|       xptr++; | ||||
|    } | ||||
|    /*return celt_sqrt(E);*/ | ||||
| } | ||||
| 
 | ||||
| #endif /* __VQ_MIPSR1_H__ */ | ||||
|  | @ -37,6 +37,7 @@ | |||
| #include "os_support.h" | ||||
| #include "stack_alloc.h" | ||||
| #include "quant_bands.h" | ||||
| #include "cpu_support.h" | ||||
| 
 | ||||
| static const opus_int16 eband5ms[] = { | ||||
| /*0  200 400 600 800  1k 1.2 1.4 1.6  2k 2.4 2.8 3.2  4k 4.8 5.6 6.8  8k 9.6 12k 15.6 */ | ||||
|  | @ -229,6 +230,7 @@ CELTMode *opus_custom_mode_create(opus_int32 Fs, int frame_size, int *error) | |||
|    opus_val16 *window; | ||||
|    opus_int16 *logN; | ||||
|    int LM; | ||||
|    int arch = opus_select_arch(); | ||||
|    ALLOC_STACK; | ||||
| #if !defined(VAR_ARRAYS) && !defined(USE_ALLOCA) | ||||
|    if (global_stack==NULL) | ||||
|  | @ -389,7 +391,7 @@ CELTMode *opus_custom_mode_create(opus_int32 Fs, int frame_size, int *error) | |||
|    compute_pulse_cache(mode, mode->maxLM); | ||||
| 
 | ||||
|    if (clt_mdct_init(&mode->mdct, 2*mode->shortMdctSize*mode->nbShortMdcts, | ||||
|            mode->maxLM) == 0) | ||||
|            mode->maxLM, arch) == 0) | ||||
|       goto failure; | ||||
| 
 | ||||
|    if (error) | ||||
|  | @ -408,6 +410,8 @@ failure: | |||
| #ifdef CUSTOM_MODES | ||||
| void opus_custom_mode_destroy(CELTMode *mode) | ||||
| { | ||||
|    int arch = opus_select_arch(); | ||||
| 
 | ||||
|    if (mode == NULL) | ||||
|       return; | ||||
| #ifndef CUSTOM_MODES_ONLY | ||||
|  | @ -423,7 +427,7 @@ void opus_custom_mode_destroy(CELTMode *mode) | |||
|    } | ||||
| #endif /* CUSTOM_MODES_ONLY */ | ||||
|    opus_free((opus_int16*)mode->eBands); | ||||
|    opus_free((opus_int16*)mode->allocVectors); | ||||
|    opus_free((unsigned char*)mode->allocVectors); | ||||
| 
 | ||||
|    opus_free((opus_val16*)mode->window); | ||||
|    opus_free((opus_int16*)mode->logN); | ||||
|  | @ -431,7 +435,7 @@ void opus_custom_mode_destroy(CELTMode *mode) | |||
|    opus_free((opus_int16*)mode->cache.index); | ||||
|    opus_free((unsigned char*)mode->cache.bits); | ||||
|    opus_free((unsigned char*)mode->cache.caps); | ||||
|    clt_mdct_clear(&mode->mdct); | ||||
|    clt_mdct_clear(&mode->mdct, arch); | ||||
| 
 | ||||
|    opus_free((CELTMode *)mode); | ||||
| } | ||||
|  |  | |||
							
								
								
									
										210
									
								
								lib/rbcodec/codecs/libopus/celt/opus_custom_demo.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										210
									
								
								lib/rbcodec/codecs/libopus/celt/opus_custom_demo.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,210 @@ | |||
| /* Copyright (c) 2007-2008 CSIRO
 | ||||
|    Copyright (c) 2007-2009 Xiph.Org Foundation | ||||
|    Written by Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include "opus_custom.h" | ||||
| #include "arch.h" | ||||
| #include <stdio.h> | ||||
| #include <stdlib.h> | ||||
| #include <math.h> | ||||
| #include <string.h> | ||||
| 
 | ||||
| #define MAX_PACKET 1275 | ||||
| 
 | ||||
| int main(int argc, char *argv[]) | ||||
| { | ||||
|    int err; | ||||
|    char *inFile, *outFile; | ||||
|    FILE *fin, *fout; | ||||
|    OpusCustomMode *mode=NULL; | ||||
|    OpusCustomEncoder *enc; | ||||
|    OpusCustomDecoder *dec; | ||||
|    int len; | ||||
|    opus_int32 frame_size, channels, rate; | ||||
|    int bytes_per_packet; | ||||
|    unsigned char data[MAX_PACKET]; | ||||
|    int complexity; | ||||
| #if !(defined (FIXED_POINT) && !defined(CUSTOM_MODES)) && defined(RESYNTH) | ||||
|    int i; | ||||
|    double rmsd = 0; | ||||
| #endif | ||||
|    int count = 0; | ||||
|    opus_int32 skip; | ||||
|    opus_int16 *in, *out; | ||||
|    if (argc != 9 && argc != 8 && argc != 7) | ||||
|    { | ||||
|       fprintf (stderr, "Usage: test_opus_custom <rate> <channels> <frame size> " | ||||
|                " <bytes per packet> [<complexity> [packet loss rate]] " | ||||
|                "<input> <output>\n"); | ||||
|       return 1; | ||||
|    } | ||||
| 
 | ||||
|    rate = (opus_int32)atol(argv[1]); | ||||
|    channels = atoi(argv[2]); | ||||
|    frame_size = atoi(argv[3]); | ||||
|    mode = opus_custom_mode_create(rate, frame_size, NULL); | ||||
|    if (mode == NULL) | ||||
|    { | ||||
|       fprintf(stderr, "failed to create a mode\n"); | ||||
|       return 1; | ||||
|    } | ||||
| 
 | ||||
|    bytes_per_packet = atoi(argv[4]); | ||||
|    if (bytes_per_packet < 0 || bytes_per_packet > MAX_PACKET) | ||||
|    { | ||||
|       fprintf (stderr, "bytes per packet must be between 0 and %d\n", | ||||
|                         MAX_PACKET); | ||||
|       return 1; | ||||
|    } | ||||
| 
 | ||||
|    inFile = argv[argc-2]; | ||||
|    fin = fopen(inFile, "rb"); | ||||
|    if (!fin) | ||||
|    { | ||||
|       fprintf (stderr, "Could not open input file %s\n", argv[argc-2]); | ||||
|       return 1; | ||||
|    } | ||||
|    outFile = argv[argc-1]; | ||||
|    fout = fopen(outFile, "wb+"); | ||||
|    if (!fout) | ||||
|    { | ||||
|       fprintf (stderr, "Could not open output file %s\n", argv[argc-1]); | ||||
|       fclose(fin); | ||||
|       return 1; | ||||
|    } | ||||
| 
 | ||||
|    enc = opus_custom_encoder_create(mode, channels, &err); | ||||
|    if (err != 0) | ||||
|    { | ||||
|       fprintf(stderr, "Failed to create the encoder: %s\n", opus_strerror(err)); | ||||
|       fclose(fin); | ||||
|       fclose(fout); | ||||
|       return 1; | ||||
|    } | ||||
|    dec = opus_custom_decoder_create(mode, channels, &err); | ||||
|    if (err != 0) | ||||
|    { | ||||
|       fprintf(stderr, "Failed to create the decoder: %s\n", opus_strerror(err)); | ||||
|       fclose(fin); | ||||
|       fclose(fout); | ||||
|       return 1; | ||||
|    } | ||||
|    opus_custom_decoder_ctl(dec, OPUS_GET_LOOKAHEAD(&skip)); | ||||
| 
 | ||||
|    if (argc>7) | ||||
|    { | ||||
|       complexity=atoi(argv[5]); | ||||
|       opus_custom_encoder_ctl(enc,OPUS_SET_COMPLEXITY(complexity)); | ||||
|    } | ||||
| 
 | ||||
|    in = (opus_int16*)malloc(frame_size*channels*sizeof(opus_int16)); | ||||
|    out = (opus_int16*)malloc(frame_size*channels*sizeof(opus_int16)); | ||||
| 
 | ||||
|    while (!feof(fin)) | ||||
|    { | ||||
|       int ret; | ||||
|       err = fread(in, sizeof(short), frame_size*channels, fin); | ||||
|       if (feof(fin)) | ||||
|          break; | ||||
|       len = opus_custom_encode(enc, in, frame_size, data, bytes_per_packet); | ||||
|       if (len <= 0) | ||||
|          fprintf (stderr, "opus_custom_encode() failed: %s\n", opus_strerror(len)); | ||||
| 
 | ||||
|       /* This is for simulating bit errors */ | ||||
| #if 0 | ||||
|       int errors = 0; | ||||
|       int eid = 0; | ||||
|       /* This simulates random bit error */ | ||||
|       for (i=0;i<len*8;i++) | ||||
|       { | ||||
|          if (rand()%atoi(argv[8])==0) | ||||
|          { | ||||
|             if (i<64) | ||||
|             { | ||||
|                errors++; | ||||
|                eid = i; | ||||
|             } | ||||
|             data[i/8] ^= 1<<(7-(i%8)); | ||||
|          } | ||||
|       } | ||||
|       if (errors == 1) | ||||
|          data[eid/8] ^= 1<<(7-(eid%8)); | ||||
|       else if (errors%2 == 1) | ||||
|          data[rand()%8] ^= 1<<rand()%8; | ||||
| #endif | ||||
| 
 | ||||
| #if 1 /* Set to zero to use the encoder's output instead */ | ||||
|       /* This is to simulate packet loss */ | ||||
|       if (argc==9 && rand()%1000<atoi(argv[argc-3])) | ||||
|       /*if (errors && (errors%2==0))*/ | ||||
|          ret = opus_custom_decode(dec, NULL, len, out, frame_size); | ||||
|       else | ||||
|          ret = opus_custom_decode(dec, data, len, out, frame_size); | ||||
|       if (ret < 0) | ||||
|          fprintf(stderr, "opus_custom_decode() failed: %s\n", opus_strerror(ret)); | ||||
| #else | ||||
|       for (i=0;i<ret*channels;i++) | ||||
|          out[i] = in[i]; | ||||
| #endif | ||||
| #if !(defined (FIXED_POINT) && !defined(CUSTOM_MODES)) && defined(RESYNTH) | ||||
|       for (i=0;i<ret*channels;i++) | ||||
|       { | ||||
|          rmsd += (in[i]-out[i])*1.0*(in[i]-out[i]); | ||||
|          /*out[i] -= in[i];*/ | ||||
|       } | ||||
| #endif | ||||
|       count++; | ||||
|       fwrite(out+skip*channels, sizeof(short), (ret-skip)*channels, fout); | ||||
|       skip = 0; | ||||
|    } | ||||
|    PRINT_MIPS(stderr); | ||||
| 
 | ||||
|    opus_custom_encoder_destroy(enc); | ||||
|    opus_custom_decoder_destroy(dec); | ||||
|    fclose(fin); | ||||
|    fclose(fout); | ||||
|    opus_custom_mode_destroy(mode); | ||||
|    free(in); | ||||
|    free(out); | ||||
| #if !(defined (FIXED_POINT) && !defined(CUSTOM_MODES)) && defined(RESYNTH) | ||||
|    if (rmsd > 0) | ||||
|    { | ||||
|       rmsd = sqrt(rmsd/(1.0*frame_size*channels*count)); | ||||
|       fprintf (stderr, "Error: encoder doesn't match decoder\n"); | ||||
|       fprintf (stderr, "RMS mismatch is %f\n", rmsd); | ||||
|       return 1; | ||||
|    } else { | ||||
|       fprintf (stderr, "Encoder matches decoder!!\n"); | ||||
|    } | ||||
| #endif | ||||
|    return 0; | ||||
| } | ||||
| 
 | ||||
|  | @ -67,18 +67,18 @@ static OPUS_INLINE void opus_free (void *ptr) | |||
| } | ||||
| #endif | ||||
| 
 | ||||
| /** Copy n bytes of memory from src to dst. The 0* term provides compile-time type checking  */ | ||||
| /** Copy n elements from src to dst. The 0* term provides compile-time type checking  */ | ||||
| #ifndef OVERRIDE_OPUS_COPY | ||||
| #define OPUS_COPY(dst, src, n) (memcpy((dst), (src), (n)*sizeof(*(dst)) + 0*((dst)-(src)) )) | ||||
| #endif | ||||
| 
 | ||||
| /** Copy n bytes of memory from src to dst, allowing overlapping regions. The 0* term
 | ||||
| /** Copy n elements from src to dst, allowing overlapping regions. The 0* term
 | ||||
|     provides compile-time type checking */ | ||||
| #ifndef OVERRIDE_OPUS_MOVE | ||||
| #define OPUS_MOVE(dst, src, n) (memmove((dst), (src), (n)*sizeof(*(dst)) + 0*((dst)-(src)) )) | ||||
| #endif | ||||
| 
 | ||||
| /** Set n elements of dst to zero, starting at address s */ | ||||
| /** Set n elements of dst to zero */ | ||||
| #ifndef OVERRIDE_OPUS_CLEAR | ||||
| #define OPUS_CLEAR(dst, n) (memset((dst), 0, (n)*sizeof(*(dst)))) | ||||
| #endif | ||||
|  |  | |||
|  | @ -102,11 +102,9 @@ static void find_best_pitch(opus_val32 *xcorr, opus_val16 *y, int len, | |||
|    } | ||||
| } | ||||
| 
 | ||||
| static void celt_fir5(const opus_val16 *x, | ||||
| static void celt_fir5(opus_val16 *x, | ||||
|          const opus_val16 *num, | ||||
|          opus_val16 *y, | ||||
|          int N, | ||||
|          opus_val16 *mem) | ||||
|          int N) | ||||
| { | ||||
|    int i; | ||||
|    opus_val16 num0, num1, num2, num3, num4; | ||||
|  | @ -116,11 +114,11 @@ static void celt_fir5(const opus_val16 *x, | |||
|    num2=num[2]; | ||||
|    num3=num[3]; | ||||
|    num4=num[4]; | ||||
|    mem0=mem[0]; | ||||
|    mem1=mem[1]; | ||||
|    mem2=mem[2]; | ||||
|    mem3=mem[3]; | ||||
|    mem4=mem[4]; | ||||
|    mem0=0; | ||||
|    mem1=0; | ||||
|    mem2=0; | ||||
|    mem3=0; | ||||
|    mem4=0; | ||||
|    for (i=0;i<N;i++) | ||||
|    { | ||||
|       opus_val32 sum = SHL32(EXTEND32(x[i]), SIG_SHIFT); | ||||
|  | @ -134,13 +132,8 @@ static void celt_fir5(const opus_val16 *x, | |||
|       mem2 = mem1; | ||||
|       mem1 = mem0; | ||||
|       mem0 = x[i]; | ||||
|       y[i] = ROUND16(sum, SIG_SHIFT); | ||||
|       x[i] = ROUND16(sum, SIG_SHIFT); | ||||
|    } | ||||
|    mem[0]=mem0; | ||||
|    mem[1]=mem1; | ||||
|    mem[2]=mem2; | ||||
|    mem[3]=mem3; | ||||
|    mem[4]=mem4; | ||||
| } | ||||
| 
 | ||||
| 
 | ||||
|  | @ -150,7 +143,7 @@ void pitch_downsample(celt_sig * OPUS_RESTRICT x[], opus_val16 * OPUS_RESTRICT x | |||
|    int i; | ||||
|    opus_val32 ac[5]; | ||||
|    opus_val16 tmp=Q15ONE; | ||||
|    opus_val16 lpc[4], mem[5]={0,0,0,0,0}; | ||||
|    opus_val16 lpc[4]; | ||||
|    opus_val16 lpc2[5]; | ||||
|    opus_val16 c1 = QCONST16(.8f,15); | ||||
| #ifdef FIXED_POINT | ||||
|  | @ -211,28 +204,33 @@ void pitch_downsample(celt_sig * OPUS_RESTRICT x[], opus_val16 * OPUS_RESTRICT x | |||
|    lpc2[2] = lpc[2] + MULT16_16_Q15(c1,lpc[1]); | ||||
|    lpc2[3] = lpc[3] + MULT16_16_Q15(c1,lpc[2]); | ||||
|    lpc2[4] = MULT16_16_Q15(c1,lpc[3]); | ||||
|    celt_fir5(x_lp, lpc2, x_lp, len>>1, mem); | ||||
|    celt_fir5(x_lp, lpc2, len>>1); | ||||
| } | ||||
| 
 | ||||
| #if 0 /* This is a simple version of the pitch correlation that should work
 | ||||
|          well on DSPs like Blackfin and TI C5x/C6x */ | ||||
| 
 | ||||
| /* Pure C implementation. */ | ||||
| #ifdef FIXED_POINT | ||||
| opus_val32 | ||||
| #else | ||||
| void | ||||
| #endif | ||||
| celt_pitch_xcorr(opus_val16 *x, opus_val16 *y, opus_val32 *xcorr, int len, int max_pitch) | ||||
| celt_pitch_xcorr_c(const opus_val16 *_x, const opus_val16 *_y, | ||||
|       opus_val32 *xcorr, int len, int max_pitch, int arch) | ||||
| { | ||||
| 
 | ||||
| #if 0 /* This is a simple version of the pitch correlation that should work
 | ||||
|          well on DSPs like Blackfin and TI C5x/C6x */ | ||||
|    int i, j; | ||||
| #ifdef FIXED_POINT | ||||
|    opus_val32 maxcorr=1; | ||||
| #endif | ||||
| #if !defined(OVERRIDE_PITCH_XCORR) | ||||
|    (void)arch; | ||||
| #endif | ||||
|    for (i=0;i<max_pitch;i++) | ||||
|    { | ||||
|       opus_val32 sum = 0; | ||||
|       for (j=0;j<len;j++) | ||||
|          sum = MAC16_16(sum, x[j],y[i+j]); | ||||
|          sum = MAC16_16(sum, _x[j], _y[i+j]); | ||||
|       xcorr[i] = sum; | ||||
| #ifdef FIXED_POINT | ||||
|       maxcorr = MAX32(maxcorr, sum); | ||||
|  | @ -241,17 +239,8 @@ celt_pitch_xcorr(opus_val16 *x, opus_val16 *y, opus_val32 *xcorr, int len, int m | |||
| #ifdef FIXED_POINT | ||||
|    return maxcorr; | ||||
| #endif | ||||
| } | ||||
| 
 | ||||
| #else /* Unrolled version of the pitch correlation -- runs faster on x86 and ARM */ | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
| opus_val32 | ||||
| #else | ||||
| void | ||||
| #endif | ||||
| celt_pitch_xcorr_c(const opus_val16 *_x, const opus_val16 *_y, opus_val32 *xcorr, int len, int max_pitch) | ||||
| { | ||||
|    int i; | ||||
|    /*The EDSP version requires that max_pitch is at least 1, and that _x is
 | ||||
|       32-bit aligned. | ||||
|  | @ -260,11 +249,11 @@ celt_pitch_xcorr_c(const opus_val16 *_x, const opus_val16 *_y, opus_val32 *xcorr | |||
|    opus_val32 maxcorr=1; | ||||
| #endif | ||||
|    celt_assert(max_pitch>0); | ||||
|    celt_assert((((unsigned char *)_x-(unsigned char *)NULL)&3)==0); | ||||
|    celt_sig_assert((((unsigned char *)_x-(unsigned char *)NULL)&3)==0); | ||||
|    for (i=0;i<max_pitch-3;i+=4) | ||||
|    { | ||||
|       opus_val32 sum[4]={0,0,0,0}; | ||||
|       xcorr_kernel(_x, _y+i, sum, len); | ||||
|       xcorr_kernel(_x, _y+i, sum, len, arch); | ||||
|       xcorr[i]=sum[0]; | ||||
|       xcorr[i+1]=sum[1]; | ||||
|       xcorr[i+2]=sum[2]; | ||||
|  | @ -280,7 +269,7 @@ celt_pitch_xcorr_c(const opus_val16 *_x, const opus_val16 *_y, opus_val32 *xcorr | |||
|    for (;i<max_pitch;i++) | ||||
|    { | ||||
|       opus_val32 sum; | ||||
|       sum = celt_inner_prod(_x, _y+i, len); | ||||
|       sum = celt_inner_prod(_x, _y+i, len, arch); | ||||
|       xcorr[i] = sum; | ||||
| #ifdef FIXED_POINT | ||||
|       maxcorr = MAX32(maxcorr, sum); | ||||
|  | @ -289,9 +278,9 @@ celt_pitch_xcorr_c(const opus_val16 *_x, const opus_val16 *_y, opus_val32 *xcorr | |||
| #ifdef FIXED_POINT | ||||
|    return maxcorr; | ||||
| #endif | ||||
| #endif | ||||
| } | ||||
| 
 | ||||
| #endif | ||||
| void pitch_search(const opus_val16 * OPUS_RESTRICT x_lp, opus_val16 * OPUS_RESTRICT y, | ||||
|                   int len, int max_pitch, int *pitch, int arch) | ||||
| { | ||||
|  | @ -369,7 +358,7 @@ void pitch_search(const opus_val16 * OPUS_RESTRICT x_lp, opus_val16 * OPUS_RESTR | |||
|       for (j=0;j<len>>1;j++) | ||||
|          sum += SHR32(MULT16_16(x_lp[j],y[i+j]), shift); | ||||
| #else | ||||
|       sum = celt_inner_prod(x_lp, y+i, len>>1); | ||||
|       sum = celt_inner_prod(x_lp, y+i, len>>1, arch); | ||||
| #endif | ||||
|       xcorr[i] = MAX32(-1, sum); | ||||
| #ifdef FIXED_POINT | ||||
|  | @ -403,10 +392,44 @@ void pitch_search(const opus_val16 * OPUS_RESTRICT x_lp, opus_val16 * OPUS_RESTR | |||
|    RESTORE_STACK; | ||||
| } | ||||
| 
 | ||||
| #if 0 | ||||
| #ifdef FIXED_POINT | ||||
| static opus_val16 compute_pitch_gain(opus_val32 xy, opus_val32 xx, opus_val32 yy) | ||||
| { | ||||
|    opus_val32 x2y2; | ||||
|    int sx, sy, shift; | ||||
|    opus_val32 g; | ||||
|    opus_val16 den; | ||||
|    if (xy == 0 || xx == 0 || yy == 0) | ||||
|       return 0; | ||||
|    sx = celt_ilog2(xx)-14; | ||||
|    sy = celt_ilog2(yy)-14; | ||||
|    shift = sx + sy; | ||||
|    x2y2 = SHR32(MULT16_16(VSHR32(xx, sx), VSHR32(yy, sy)), 14); | ||||
|    if (shift & 1) { | ||||
|       if (x2y2 < 32768) | ||||
|       { | ||||
|          x2y2 <<= 1; | ||||
|          shift--; | ||||
|       } else { | ||||
|          x2y2 >>= 1; | ||||
|          shift++; | ||||
|       } | ||||
|    } | ||||
|    den = celt_rsqrt_norm(x2y2); | ||||
|    g = MULT16_32_Q15(den, xy); | ||||
|    g = VSHR32(g, (shift>>1)-1); | ||||
|    return EXTRACT16(MIN32(g, Q15ONE)); | ||||
| } | ||||
| #else | ||||
| static opus_val16 compute_pitch_gain(opus_val32 xy, opus_val32 xx, opus_val32 yy) | ||||
| { | ||||
|    return xy/celt_sqrt(1+xx*yy); | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| static const int second_check[16] = {0, 0, 3, 2, 3, 2, 5, 2, 3, 2, 3, 2, 5, 2, 3, 2}; | ||||
| opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod, | ||||
|       int N, int *T0_, int prev_period, opus_val16 prev_gain) | ||||
|       int N, int *T0_, int prev_period, opus_val16 prev_gain, int arch) | ||||
| { | ||||
|    int k, i, T, T0; | ||||
|    opus_val16 g, g0; | ||||
|  | @ -431,7 +454,7 @@ opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod, | |||
| 
 | ||||
|    T = T0 = *T0_; | ||||
|    ALLOC(yy_lookup, maxperiod+1, opus_val32); | ||||
|    dual_inner_prod(x, x, x-T0, N, &xx, &xy); | ||||
|    dual_inner_prod(x, x, x-T0, N, &xx, &xy, arch); | ||||
|    yy_lookup[0] = xx; | ||||
|    yy=xx; | ||||
|    for (i=1;i<=maxperiod;i++) | ||||
|  | @ -442,18 +465,7 @@ opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod, | |||
|    yy = yy_lookup[T0]; | ||||
|    best_xy = xy; | ||||
|    best_yy = yy; | ||||
| #ifdef FIXED_POINT | ||||
|       { | ||||
|          opus_val32 x2y2; | ||||
|          int sh, t; | ||||
|          x2y2 = 1+HALF32(MULT32_32_Q31(xx,yy)); | ||||
|          sh = celt_ilog2(x2y2)>>1; | ||||
|          t = VSHR32(x2y2, 2*(sh-7)); | ||||
|          g = g0 = VSHR32(MULT16_32_Q15(celt_rsqrt_norm(t), xy),sh+1); | ||||
|       } | ||||
| #else | ||||
|       g = g0 = xy/celt_sqrt(1+xx*yy); | ||||
| #endif | ||||
|    g = g0 = compute_pitch_gain(xy, xx, yy); | ||||
|    /* Look for any pitch at T/k */ | ||||
|    for (k=2;k<=15;k++) | ||||
|    { | ||||
|  | @ -475,25 +487,14 @@ opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod, | |||
|       { | ||||
|          T1b = celt_udiv(2*second_check[k]*T0+k, 2*k); | ||||
|       } | ||||
|       dual_inner_prod(x, &x[-T1], &x[-T1b], N, &xy, &xy2); | ||||
|       xy += xy2; | ||||
|       yy = yy_lookup[T1] + yy_lookup[T1b]; | ||||
| #ifdef FIXED_POINT | ||||
|       { | ||||
|          opus_val32 x2y2; | ||||
|          int sh, t; | ||||
|          x2y2 = 1+MULT32_32_Q31(xx,yy); | ||||
|          sh = celt_ilog2(x2y2)>>1; | ||||
|          t = VSHR32(x2y2, 2*(sh-7)); | ||||
|          g1 = VSHR32(MULT16_32_Q15(celt_rsqrt_norm(t), xy),sh+1); | ||||
|       } | ||||
| #else | ||||
|       g1 = xy/celt_sqrt(1+2.f*xx*1.f*yy); | ||||
| #endif | ||||
|       dual_inner_prod(x, &x[-T1], &x[-T1b], N, &xy, &xy2, arch); | ||||
|       xy = HALF32(xy + xy2); | ||||
|       yy = HALF32(yy_lookup[T1] + yy_lookup[T1b]); | ||||
|       g1 = compute_pitch_gain(xy, xx, yy); | ||||
|       if (abs(T1-prev_period)<=1) | ||||
|          cont = prev_gain; | ||||
|       else if (abs(T1-prev_period)<=2 && 5*k*k < T0) | ||||
|          cont = HALF32(prev_gain); | ||||
|          cont = HALF16(prev_gain); | ||||
|       else | ||||
|          cont = 0; | ||||
|       thresh = MAX16(QCONST16(.3f,15), MULT16_16_Q15(QCONST16(.7f,15),g0)-cont); | ||||
|  | @ -518,7 +519,7 @@ opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod, | |||
|       pg = SHR32(frac_div32(best_xy,best_yy+1),16); | ||||
| 
 | ||||
|    for (k=0;k<3;k++) | ||||
|       xcorr[k] = celt_inner_prod(x, x-(T+k-1), N); | ||||
|       xcorr[k] = celt_inner_prod(x, x-(T+k-1), N, arch); | ||||
|    if ((xcorr[2]-xcorr[0]) > MULT16_32_Q15(QCONST16(.7f,15),xcorr[1]-xcorr[0])) | ||||
|       offset = 1; | ||||
|    else if ((xcorr[0]-xcorr[2]) > MULT16_32_Q15(QCONST16(.7f,15),xcorr[1]-xcorr[2])) | ||||
|  | @ -534,4 +535,3 @@ opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod, | |||
|    RESTORE_STACK; | ||||
|    return pg; | ||||
| } | ||||
| #endif | ||||
|  |  | |||
|  | @ -37,7 +37,8 @@ | |||
| #include "modes.h" | ||||
| #include "cpu_support.h" | ||||
| 
 | ||||
| #if defined(__SSE__) && !defined(FIXED_POINT) | ||||
| #if (defined(OPUS_X86_MAY_HAVE_SSE) && !defined(FIXED_POINT)) \ | ||||
|   || ((defined(OPUS_X86_MAY_HAVE_SSE4_1) || defined(OPUS_X86_MAY_HAVE_SSE2)) && defined(FIXED_POINT)) | ||||
| #include "x86/pitch_sse.h" | ||||
| #endif | ||||
| 
 | ||||
|  | @ -45,8 +46,8 @@ | |||
| #include "mips/pitch_mipsr1.h" | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_ARM_ASM) && defined(FIXED_POINT) | ||||
| //# include "arm/pitch_arm.h"
 | ||||
| #if (defined(OPUS_ARM_ASM) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR)) | ||||
| # include "arm/pitch_arm.h" | ||||
| #endif | ||||
| 
 | ||||
| void pitch_downsample(celt_sig * OPUS_RESTRICT x[], opus_val16 * OPUS_RESTRICT x_lp, | ||||
|  | @ -56,12 +57,12 @@ void pitch_search(const opus_val16 * OPUS_RESTRICT x_lp, opus_val16 * OPUS_RESTR | |||
|                   int len, int max_pitch, int *pitch, int arch); | ||||
| 
 | ||||
| opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod, | ||||
|       int N, int *T0, int prev_period, opus_val16 prev_gain); | ||||
|       int N, int *T0, int prev_period, opus_val16 prev_gain, int arch); | ||||
| 
 | ||||
| 
 | ||||
| /* OPT: This is the kernel you really want to optimize. It gets used a lot
 | ||||
|    by the prefilter and by the PLC. */ | ||||
| #ifndef OVERRIDE_XCORR_KERNEL | ||||
| static OPUS_INLINE void xcorr_kernel(const opus_val16 * x, const opus_val16 * y, opus_val32 sum[4], int len) | ||||
| static OPUS_INLINE void xcorr_kernel_c(const opus_val16 * x, const opus_val16 * y, opus_val32 sum[4], int len) | ||||
| { | ||||
|    int j; | ||||
|    opus_val16 y_0, y_1, y_2, y_3; | ||||
|  | @ -126,10 +127,14 @@ static OPUS_INLINE void xcorr_kernel(const opus_val16 * x, const opus_val16 * y, | |||
|       sum[3] = MAC16_16(sum[3],tmp,y_1); | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| #ifndef OVERRIDE_XCORR_KERNEL | ||||
| #define xcorr_kernel(x, y, sum, len, arch) \ | ||||
|     ((void)(arch),xcorr_kernel_c(x, y, sum, len)) | ||||
| #endif /* OVERRIDE_XCORR_KERNEL */ | ||||
| 
 | ||||
| #ifndef OVERRIDE_DUAL_INNER_PROD | ||||
| static OPUS_INLINE void dual_inner_prod(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02, | ||||
| 
 | ||||
| static OPUS_INLINE void dual_inner_prod_c(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02, | ||||
|       int N, opus_val32 *xy1, opus_val32 *xy2) | ||||
| { | ||||
|    int i; | ||||
|  | @ -143,11 +148,16 @@ static OPUS_INLINE void dual_inner_prod(const opus_val16 *x, const opus_val16 *y | |||
|    *xy1 = xy01; | ||||
|    *xy2 = xy02; | ||||
| } | ||||
| 
 | ||||
| #ifndef OVERRIDE_DUAL_INNER_PROD | ||||
| # define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) \ | ||||
|     ((void)(arch),dual_inner_prod_c(x, y01, y02, N, xy1, xy2)) | ||||
| #endif | ||||
| 
 | ||||
| #ifndef OVERRIDE_CELT_INNER_PROD | ||||
| static OPUS_INLINE opus_val32 celt_inner_prod(const opus_val16 *x, const opus_val16 *y, | ||||
|       int N) | ||||
| /*We make sure a C version is always available for cases where the overhead of
 | ||||
|   vectorization and passing around an arch flag aren't worth it.*/ | ||||
| static OPUS_INLINE opus_val32 celt_inner_prod_c(const opus_val16 *x, | ||||
|       const opus_val16 *y, int N) | ||||
| { | ||||
|    int i; | ||||
|    opus_val32 xy=0; | ||||
|  | @ -155,35 +165,28 @@ static OPUS_INLINE opus_val32 celt_inner_prod(const opus_val16 *x, const opus_va | |||
|       xy = MAC16_16(xy, x[i], y[i]); | ||||
|    return xy; | ||||
| } | ||||
| 
 | ||||
| #if !defined(OVERRIDE_CELT_INNER_PROD) | ||||
| # define celt_inner_prod(x, y, N, arch) \ | ||||
|     ((void)(arch),celt_inner_prod_c(x, y, N)) | ||||
| #endif | ||||
| 
 | ||||
| #ifdef NON_STATIC_COMB_FILTER_CONST_C | ||||
| void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N, | ||||
|      opus_val16 g10, opus_val16 g11, opus_val16 g12); | ||||
| #endif | ||||
| 
 | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
| opus_val32 | ||||
| #else | ||||
| void | ||||
| #endif | ||||
| celt_pitch_xcorr_c(const opus_val16 *_x, const opus_val16 *_y, | ||||
|       opus_val32 *xcorr, int len, int max_pitch); | ||||
|       opus_val32 *xcorr, int len, int max_pitch, int arch); | ||||
| 
 | ||||
| #if !defined(OVERRIDE_PITCH_XCORR) | ||||
| /*Is run-time CPU detection enabled on this platform?*/ | ||||
| # if defined(OPUS_HAVE_RTCD) | ||||
| extern | ||||
| #  if defined(FIXED_POINT) | ||||
| opus_val32 | ||||
| #  else | ||||
| void | ||||
| #  endif | ||||
| (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *, | ||||
|       const opus_val16 *, opus_val32 *, int, int); | ||||
| 
 | ||||
| #  define celt_pitch_xcorr(_x, _y, xcorr, len, max_pitch, arch) \ | ||||
|   ((*CELT_PITCH_XCORR_IMPL[(arch)&OPUS_ARCHMASK])(_x, _y, \ | ||||
|         xcorr, len, max_pitch)) | ||||
| # else | ||||
| #  define celt_pitch_xcorr(_x, _y, xcorr, len, max_pitch, arch) \ | ||||
|   ((void)(arch),celt_pitch_xcorr_c(_x, _y, xcorr, len, max_pitch)) | ||||
| # endif | ||||
| #ifndef OVERRIDE_PITCH_XCORR | ||||
| # define celt_pitch_xcorr celt_pitch_xcorr_c | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
|  |  | |||
|  | @ -292,7 +292,7 @@ void quant_coarse_energy(const CELTMode *m, int start, int end, int effEnd, | |||
| #endif | ||||
|    } | ||||
|    if (lfe) | ||||
|       max_decay=3; | ||||
|       max_decay = QCONST16(3.f,DB_SHIFT); | ||||
|    enc_start_state = *enc; | ||||
| 
 | ||||
|    ALLOC(oldEBands_intra, C*m->nbEBands, opus_val16); | ||||
|  | @ -418,6 +418,7 @@ void quant_energy_finalise(const CELTMode *m, int start, int end, opus_val16 *ol | |||
|             offset = (q2-.5f)*(1<<(14-fine_quant[i]-1))*(1.f/16384); | ||||
| #endif | ||||
|             oldEBands[i+c*m->nbEBands] += offset; | ||||
|             error[i+c*m->nbEBands] -= offset; | ||||
|             bits_left--; | ||||
|          } while (++c < C); | ||||
|       } | ||||
|  | @ -456,7 +457,7 @@ void unquant_coarse_energy(const CELTMode *m, int start, int end, opus_val16 *ol | |||
|          /* It would be better to express this invariant as a
 | ||||
|             test on C at function entry, but that isn't enough | ||||
|             to make the static analyzer happy. */ | ||||
|          celt_assert(c<2); | ||||
|          celt_sig_assert(c<2); | ||||
|          tell = ec_tell(dec); | ||||
|          if(budget-tell>=15) | ||||
|          { | ||||
|  | @ -547,9 +548,15 @@ void amp2Log2(const CELTMode *m, int effEnd, int end, | |||
|    c=0; | ||||
|    do { | ||||
|       for (i=0;i<effEnd;i++) | ||||
|       { | ||||
|          bandLogE[i+c*m->nbEBands] = | ||||
|                celt_log2(SHL32(bandE[i+c*m->nbEBands],2)) | ||||
|                celt_log2(bandE[i+c*m->nbEBands]) | ||||
|                - SHL16((opus_val16)eMeans[i],6); | ||||
| #ifdef FIXED_POINT | ||||
|          /* Compensate for bandE[] being Q12 but celt_log2() taking a Q14 input. */ | ||||
|          bandLogE[i+c*m->nbEBands] += QCONST16(2.f, DB_SHIFT); | ||||
| #endif | ||||
|       } | ||||
|       for (i=effEnd;i<end;i++) | ||||
|          bandLogE[c*m->nbEBands+i] = -QCONST16(14.f,DB_SHIFT); | ||||
|    } while (++c < C); | ||||
|  |  | |||
|  | @ -131,7 +131,7 @@ void compute_pulse_cache(CELTMode *m, int LM) | |||
|    for (i=0;i<nbEntries;i++) | ||||
|    { | ||||
|       unsigned char *ptr = bits+entryI[i]; | ||||
|       opus_int16 tmp[MAX_PULSES+1]; | ||||
|       opus_int16 tmp[CELT_MAX_PULSES+1]; | ||||
|       get_required_bits(tmp, entryN[i], get_pulses(entryK[i]), BITRES); | ||||
|       for (j=1;j<=entryK[i];j++) | ||||
|          ptr[j] = tmp[get_pulses(j)]-1; | ||||
|  | @ -296,7 +296,7 @@ static OPUS_INLINE int interp_bits2pulses(const CELTMode *m, int start, int end, | |||
|    done = 0; | ||||
|    for (j=end;j-->start;) | ||||
|    { | ||||
|       int tmp = bits1[j] + (lo*bits2[j]>>ALLOC_STEPS); | ||||
|       int tmp = bits1[j] + ((opus_int32)lo*bits2[j]>>ALLOC_STEPS); | ||||
|       if (tmp < thresh[j] && !done) | ||||
|       { | ||||
|          if (tmp >= alloc_floor) | ||||
|  | @ -348,12 +348,17 @@ static OPUS_INLINE int interp_bits2pulses(const CELTMode *m, int start, int end, | |||
|             /*This if() block is the only part of the allocation function that
 | ||||
|                is not a mandatory part of the bitstream: any bands we choose to | ||||
|                skip here must be explicitly signaled.*/ | ||||
|             /*Choose a threshold with some hysteresis to keep bands from
 | ||||
|                fluctuating in and out.*/ | ||||
|             int depth_threshold; | ||||
|             /*We choose a threshold with some hysteresis to keep bands from
 | ||||
|                fluctuating in and out, but we try not to fold below a certain point. */ | ||||
|             if (codedBands > 17) | ||||
|                depth_threshold = j<prev ? 7 : 9; | ||||
|             else | ||||
|                depth_threshold = 0; | ||||
| #ifdef FUZZING | ||||
|             if ((rand()&0x1) == 0) | ||||
| #else | ||||
|             if (codedBands<=start+2 || (band_bits > ((j<prev?7:9)*band_width<<LM<<BITRES)>>4 && j<=signalBandwidth)) | ||||
|             if (codedBands<=start+2 || (band_bits > (depth_threshold*band_width<<LM<<BITRES)>>4 && j<=signalBandwidth)) | ||||
| #endif | ||||
|             { | ||||
|                ec_enc_bit_logp(ec, 1, 1); | ||||
|  | @ -524,7 +529,7 @@ static OPUS_INLINE int interp_bits2pulses(const CELTMode *m, int start, int end, | |||
|    return codedBands; | ||||
| } | ||||
| 
 | ||||
| int compute_allocation(const CELTMode *m, int start, int end, const int *offsets, const int *cap, int alloc_trim, int *intensity, int *dual_stereo, | ||||
| int clt_compute_allocation(const CELTMode *m, int start, int end, const int *offsets, const int *cap, int alloc_trim, int *intensity, int *dual_stereo, | ||||
|       opus_int32 total, opus_int32 *balance, int *pulses, int *ebits, int *fine_priority, int C, int LM, ec_ctx *ec, int encode, int prev, int signalBandwidth) | ||||
| { | ||||
|    int lo, hi, len, j; | ||||
|  |  | |||
|  | @ -32,7 +32,7 @@ | |||
| #define MAX_PSEUDO 40 | ||||
| #define LOG_MAX_PSEUDO 6 | ||||
| 
 | ||||
| #define MAX_PULSES 128 | ||||
| #define CELT_MAX_PULSES 128 | ||||
| 
 | ||||
| #define MAX_FINE_BITS 8 | ||||
| 
 | ||||
|  | @ -95,7 +95,7 @@ static OPUS_INLINE int pulses2bits(const CELTMode *m, int band, int LM, int puls | |||
|  @param pulses Number of pulses per band (returned) | ||||
|  @return Total number of bits allocated | ||||
| */ | ||||
| int compute_allocation(const CELTMode *m, int start, int end, const int *offsets, const int *cap, int alloc_trim, int *intensity, int *dual_stero, | ||||
| int clt_compute_allocation(const CELTMode *m, int start, int end, const int *offsets, const int *cap, int alloc_trim, int *intensity, int *dual_stero, | ||||
|       opus_int32 total, opus_int32 *balance, int *pulses, int *ebits, int *fine_priority, int C, int LM, ec_ctx *ec, int encode, int prev, int signalBandwidth); | ||||
| 
 | ||||
| #endif | ||||
|  |  | |||
|  | @ -4,9 +4,14 @@ | |||
| #include "modes.h" | ||||
| #include "rate.h" | ||||
| 
 | ||||
| #ifdef HAVE_ARM_NE10 | ||||
| #define OVERRIDE_FFT 1 | ||||
| #include "static_modes_fixed_arm_ne10.h" | ||||
| #endif | ||||
| 
 | ||||
| #ifndef DEF_WINDOW120 | ||||
| #define DEF_WINDOW120 | ||||
| static const opus_val16 window120[120] ICONST_ATTR = { | ||||
| static const opus_val16 window120[120] = { | ||||
| 2, 20, 55, 108, 178, | ||||
| 266, 372, 494, 635, 792, | ||||
| 966, 1157, 1365, 1590, 1831, | ||||
|  | @ -36,13 +41,13 @@ static const opus_val16 window120[120] ICONST_ATTR = { | |||
| 
 | ||||
| #ifndef DEF_LOGN400 | ||||
| #define DEF_LOGN400 | ||||
| static const opus_int16 logN400[21] ICONST_ATTR = { | ||||
| static const opus_int16 logN400[21] = { | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 8, 8, 8, 8, 16, 16, 16, 21, 21, 24, 29, 34, 36, }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef DEF_PULSE_CACHE50 | ||||
| #define DEF_PULSE_CACHE50 | ||||
| static const opus_int16 cache_index50[105] ICONST_ATTR = { | ||||
| static const opus_int16 cache_index50[105] = { | ||||
| -1, -1, -1, -1, -1, -1, -1, -1, 0, 0, 0, 0, 41, 41, 41, | ||||
| 82, 82, 123, 164, 200, 222, 0, 0, 0, 0, 0, 0, 0, 0, 41, | ||||
| 41, 41, 41, 123, 123, 123, 164, 164, 240, 266, 283, 295, 41, 41, 41, | ||||
|  | @ -51,7 +56,7 @@ static const opus_int16 cache_index50[105] ICONST_ATTR = { | |||
| 305, 305, 305, 318, 318, 343, 351, 358, 364, 240, 240, 240, 240, 240, 240, | ||||
| 240, 240, 305, 305, 305, 305, 343, 343, 343, 351, 351, 370, 376, 382, 387, | ||||
| }; | ||||
| static const unsigned char cache_bits50[392] ICONST_ATTR = { | ||||
| static const unsigned char cache_bits50[392] = { | ||||
| 40, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, | ||||
| 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, | ||||
| 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 40, 15, 23, 28, | ||||
|  | @ -79,7 +84,7 @@ static const unsigned char cache_bits50[392] ICONST_ATTR = { | |||
| 106, 151, 192, 231, 5, 59, 111, 158, 202, 243, 5, 55, 103, 147, 187, | ||||
| 224, 5, 60, 113, 161, 206, 248, 4, 65, 122, 175, 224, 4, 67, 127, | ||||
| 182, 234, }; | ||||
| static const unsigned char cache_caps50[168] ICONST_ATTR = { | ||||
| static const unsigned char cache_caps50[168] = { | ||||
| 224, 224, 224, 224, 224, 224, 224, 224, 160, 160, 160, 160, 185, 185, 185, | ||||
| 178, 178, 168, 134, 61, 37, 224, 224, 224, 224, 224, 224, 224, 224, 240, | ||||
| 240, 240, 240, 207, 207, 207, 198, 198, 183, 144, 66, 40, 160, 160, 160, | ||||
|  | @ -96,7 +101,7 @@ static const unsigned char cache_caps50[168] ICONST_ATTR = { | |||
| 
 | ||||
| #ifndef FFT_TWIDDLES48000_960 | ||||
| #define FFT_TWIDDLES48000_960 | ||||
| static const kiss_twiddle_cpx fft_twiddles48000_960[480] ICONST_ATTR = { | ||||
| static const kiss_twiddle_cpx fft_twiddles48000_960[480] = { | ||||
| {32767, 0}, {32766, -429}, | ||||
| {32757, -858}, {32743, -1287}, | ||||
| {32724, -1715}, {32698, -2143}, | ||||
|  | @ -424,53 +429,73 @@ static const opus_int16 fft_bitrev60[60] = { | |||
| 
 | ||||
| #ifndef FFT_STATE48000_960_0 | ||||
| #define FFT_STATE48000_960_0 | ||||
| static const kiss_fft_state fft_state48000_960_0 ICONST_ATTR = { | ||||
| static const kiss_fft_state fft_state48000_960_0 = { | ||||
| 480,    /* nfft */ | ||||
| 17476,	/* scale */ | ||||
| 17476,    /* scale */ | ||||
| 8,      /* scale_shift */ | ||||
| -1,     /* shift */ | ||||
| {5, 96, 3, 32, 4, 8, 2, 4, 4, 1, 0, 0, 0, 0, 0, 0, },	/* factors */ | ||||
| {5, 96, 3, 32, 4, 8, 2, 4, 4, 1, 0, 0, 0, 0, 0, 0, },    /* factors */ | ||||
| fft_bitrev480,  /* bitrev */ | ||||
| fft_twiddles48000_960,  /* bitrev */ | ||||
| #ifdef OVERRIDE_FFT | ||||
| (arch_fft_state *)&cfg_arch_480, | ||||
| #else | ||||
| NULL, | ||||
| #endif | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_STATE48000_960_1 | ||||
| #define FFT_STATE48000_960_1 | ||||
| static const kiss_fft_state fft_state48000_960_1 ICONST_ATTR = { | ||||
| static const kiss_fft_state fft_state48000_960_1 = { | ||||
| 240,    /* nfft */ | ||||
| 17476,	/* scale */ | ||||
| 17476,    /* scale */ | ||||
| 7,      /* scale_shift */ | ||||
| 1,      /* shift */ | ||||
| {5, 48, 3, 16, 4, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, },	/* factors */ | ||||
| {5, 48, 3, 16, 4, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, },    /* factors */ | ||||
| fft_bitrev240,  /* bitrev */ | ||||
| fft_twiddles48000_960,  /* bitrev */ | ||||
| #ifdef OVERRIDE_FFT | ||||
| (arch_fft_state *)&cfg_arch_240, | ||||
| #else | ||||
| NULL, | ||||
| #endif | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_STATE48000_960_2 | ||||
| #define FFT_STATE48000_960_2 | ||||
| static const kiss_fft_state fft_state48000_960_2 ICONST_ATTR = { | ||||
| static const kiss_fft_state fft_state48000_960_2 = { | ||||
| 120,    /* nfft */ | ||||
| 17476,	/* scale */ | ||||
| 17476,    /* scale */ | ||||
| 6,      /* scale_shift */ | ||||
| 2,      /* shift */ | ||||
| {5, 24, 3, 8, 2, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, },	/* factors */ | ||||
| {5, 24, 3, 8, 2, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, },    /* factors */ | ||||
| fft_bitrev120,  /* bitrev */ | ||||
| fft_twiddles48000_960,  /* bitrev */ | ||||
| #ifdef OVERRIDE_FFT | ||||
| (arch_fft_state *)&cfg_arch_120, | ||||
| #else | ||||
| NULL, | ||||
| #endif | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_STATE48000_960_3 | ||||
| #define FFT_STATE48000_960_3 | ||||
| static const kiss_fft_state fft_state48000_960_3 ICONST_ATTR = { | ||||
| static const kiss_fft_state fft_state48000_960_3 = { | ||||
| 60,     /* nfft */ | ||||
| 17476,	/* scale */ | ||||
| 17476,    /* scale */ | ||||
| 5,      /* scale_shift */ | ||||
| 3,      /* shift */ | ||||
| {5, 12, 3, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, },	/* factors */ | ||||
| {5, 12, 3, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, },    /* factors */ | ||||
| fft_bitrev60,   /* bitrev */ | ||||
| fft_twiddles48000_960,  /* bitrev */ | ||||
| #ifdef OVERRIDE_FFT | ||||
| (arch_fft_state *)&cfg_arch_60, | ||||
| #else | ||||
| NULL, | ||||
| #endif | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
|  | @ -478,7 +503,7 @@ fft_twiddles48000_960,  /* bitrev */ | |||
| 
 | ||||
| #ifndef MDCT_TWIDDLES960 | ||||
| #define MDCT_TWIDDLES960 | ||||
| static const opus_val16 mdct_twiddles960[1800] ICONST_ATTR = { | ||||
| static const opus_val16 mdct_twiddles960[1800] = { | ||||
| 32767, 32767, 32767, 32766, 32765, | ||||
| 32763, 32761, 32759, 32756, 32753, | ||||
| 32750, 32746, 32742, 32738, 32733, | ||||
|  | @ -842,7 +867,7 @@ static const opus_val16 mdct_twiddles960[1800] ICONST_ATTR = { | |||
| }; | ||||
| #endif | ||||
| 
 | ||||
| static const CELTMode mode48000_960_120 ICONST_ATTR = { | ||||
| static const CELTMode mode48000_960_120 = { | ||||
| 48000,  /* Fs */ | ||||
| 120,    /* overlap */ | ||||
| 21,     /* nbEBands */ | ||||
|  |  | |||
							
								
								
									
										388
									
								
								lib/rbcodec/codecs/libopus/celt/static_modes_fixed_arm_ne10.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										388
									
								
								lib/rbcodec/codecs/libopus/celt/static_modes_fixed_arm_ne10.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,388 @@ | |||
| /* The contents of this file was automatically generated by
 | ||||
|  * dump_mode_arm_ne10.c with arguments: 48000 960 | ||||
|  * It contains static definitions for some pre-defined modes. */ | ||||
| #include <NE10_types.h> | ||||
| 
 | ||||
| #ifndef NE10_FFT_PARAMS48000_960 | ||||
| #define NE10_FFT_PARAMS48000_960 | ||||
| static const ne10_int32_t ne10_factors_480[64] = { | ||||
| 4, 40, 4, 30, 2, 15, 5, 3, 3, 1, 1, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, }; | ||||
| static const ne10_int32_t ne10_factors_240[64] = { | ||||
| 3, 20, 4, 15, 5, 3, 3, 1, 1, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, }; | ||||
| static const ne10_int32_t ne10_factors_120[64] = { | ||||
| 3, 10, 2, 15, 5, 3, 3, 1, 1, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, }; | ||||
| static const ne10_int32_t ne10_factors_60[64] = { | ||||
| 2, 5, 5, 3, 3, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, }; | ||||
| static const ne10_fft_cpx_int32_t ne10_twiddles_480[480] = { | ||||
| {0,0}, {2147483647,0}, {2147483647,0}, | ||||
| {2147483647,0}, {1961823921,-873460313}, {1436946998,-1595891394}, | ||||
| {2147483647,0}, {1436946998,-1595891394}, {-224473265,-2135719496}, | ||||
| {2147483647,0}, {663608871,-2042378339}, {-1737350854,-1262259096}, | ||||
| {2147483647,0}, {-224473265,-2135719496}, {-2100555935,446487152}, | ||||
| {2147483647,0}, {2100555974,-446486968}, {1961823921,-873460313}, | ||||
| {1737350743,-1262259248}, {1436946998,-1595891394}, {1073741769,-1859775424}, | ||||
| {663608871,-2042378339}, {224473078,-2135719516}, {-224473265,-2135719496}, | ||||
| {-663609049,-2042378281}, {-1073741932,-1859775330}, {-1436947137,-1595891268}, | ||||
| {-1737350854,-1262259096}, {-1961823997,-873460141}, {-2100556013,-446486785}, | ||||
| {2147483647,0}, {2144540595,-112390613}, {2135719506,-224473172}, | ||||
| {2121044558,-335940465}, {2100555974,-446486968}, {2074309912,-555809682}, | ||||
| {2042378310,-663608960}, {2004848691,-769589332}, {1961823921,-873460313}, | ||||
| {1913421927,-974937199}, {1859775377,-1073741851}, {1801031311,-1169603450}, | ||||
| {1737350743,-1262259248}, {1668908218,-1351455280}, {1595891331,-1436947067}, | ||||
| {1518500216,-1518500282}, {1436946998,-1595891394}, {1351455207,-1668908277}, | ||||
| {1262259172,-1737350799}, {1169603371,-1801031362}, {1073741769,-1859775424}, | ||||
| {974937230,-1913421912}, {873460227,-1961823959}, {769589125,-2004848771}, | ||||
| {663608871,-2042378339}, {555809715,-2074309903}, {446486876,-2100555994}, | ||||
| {335940246,-2121044593}, {224473078,-2135719516}, {112390647,-2144540593}, | ||||
| {2147483647,0}, {2135719506,-224473172}, {2100555974,-446486968}, | ||||
| {2042378310,-663608960}, {1961823921,-873460313}, {1859775377,-1073741851}, | ||||
| {1737350743,-1262259248}, {1595891331,-1436947067}, {1436946998,-1595891394}, | ||||
| {1262259172,-1737350799}, {1073741769,-1859775424}, {873460227,-1961823959}, | ||||
| {663608871,-2042378339}, {446486876,-2100555994}, {224473078,-2135719516}, | ||||
| {-94,-2147483647}, {-224473265,-2135719496}, {-446487060,-2100555955}, | ||||
| {-663609049,-2042378281}, {-873460398,-1961823883}, {-1073741932,-1859775330}, | ||||
| {-1262259116,-1737350839}, {-1436947137,-1595891268}, {-1595891628,-1436946738}, | ||||
| {-1737350854,-1262259096}, {-1859775343,-1073741910}, {-1961823997,-873460141}, | ||||
| {-2042378447,-663608538}, {-2100556013,-446486785}, {-2135719499,-224473240}, | ||||
| {2147483647,0}, {2121044558,-335940465}, {2042378310,-663608960}, | ||||
| {1913421927,-974937199}, {1737350743,-1262259248}, {1518500216,-1518500282}, | ||||
| {1262259172,-1737350799}, {974937230,-1913421912}, {663608871,-2042378339}, | ||||
| {335940246,-2121044593}, {-94,-2147483647}, {-335940431,-2121044564}, | ||||
| {-663609049,-2042378281}, {-974937397,-1913421827}, {-1262259116,-1737350839}, | ||||
| {-1518500258,-1518500240}, {-1737350854,-1262259096}, {-1913422071,-974936918}, | ||||
| {-2042378447,-663608538}, {-2121044568,-335940406}, {-2147483647,188}, | ||||
| {-2121044509,335940777}, {-2042378331,663608895}, {-1913421900,974937252}, | ||||
| {-1737350633,1262259400}, {-1518499993,1518500506}, {-1262258813,1737351059}, | ||||
| {-974936606,1913422229}, {-663609179,2042378239}, {-335940566,2121044542}, | ||||
| {2147483647,0}, {2147299667,-28109693}, {2146747758,-56214570}, | ||||
| {2145828015,-84309815}, {2144540595,-112390613}, {2142885719,-140452154}, | ||||
| {2140863671,-168489630}, {2138474797,-196498235}, {2135719506,-224473172}, | ||||
| {2132598271,-252409646}, {2129111626,-280302871}, {2125260168,-308148068}, | ||||
| {2121044558,-335940465}, {2116465518,-363675300}, {2111523833,-391347822}, | ||||
| {2106220349,-418953288}, {2100555974,-446486968}, {2094531681,-473944146}, | ||||
| {2088148500,-501320115}, {2081407525,-528610186}, {2074309912,-555809682}, | ||||
| {2066856885,-582913912}, {2059049696,-609918325}, {2050889698,-636818231}, | ||||
| {2042378310,-663608960}, {2033516972,-690285983}, {2024307180,-716844791}, | ||||
| {2014750533,-743280770}, {2004848691,-769589332}, {1994603329,-795766029}, | ||||
| {1984016179,-821806435}, {1973089077,-847706028}, {1961823921,-873460313}, | ||||
| {1950222618,-899064934}, {1938287127,-924515564}, {1926019520,-949807783}, | ||||
| {1913421927,-974937199}, {1900496481,-999899565}, {1887245364,-1024690661}, | ||||
| {1873670877,-1049306180}, {1859775377,-1073741851}, {1845561215,-1097993541}, | ||||
| {1831030826,-1122057097}, {1816186632,-1145928502}, {1801031311,-1169603450}, | ||||
| {1785567394,-1193077993}, {1769797456,-1216348214}, {1753724345,-1239409914}, | ||||
| {1737350743,-1262259248}, {1720679456,-1284892300}, {1703713340,-1307305194}, | ||||
| {1686455222,-1329494189}, {1668908218,-1351455280}, {1651075255,-1373184807}, | ||||
| {1632959307,-1394679144}, {1614563642,-1415934412}, {1595891331,-1436947067}, | ||||
| {1576945572,-1457713510}, {1557729613,-1478230181}, {1538246655,-1498493658}, | ||||
| {1518500216,-1518500282}, {1498493590,-1538246721}, {1478230113,-1557729677}, | ||||
| {1457713441,-1576945636}, {1436946998,-1595891394}, {1415934341,-1614563704}, | ||||
| {1394679073,-1632959368}, {1373184735,-1651075315}, {1351455207,-1668908277}, | ||||
| {1329494115,-1686455280}, {1307305120,-1703713397}, {1284892225,-1720679512}, | ||||
| {1262259172,-1737350799}, {1239409837,-1753724400}, {1216348136,-1769797510}, | ||||
| {1193077915,-1785567446}, {1169603371,-1801031362}, {1145928423,-1816186682}, | ||||
| {1122057017,-1831030875}, {1097993571,-1845561197}, {1073741769,-1859775424}, | ||||
| {1049305987,-1873670985}, {1024690635,-1887245378}, {999899482,-1900496524}, | ||||
| {974937230,-1913421912}, {949807699,-1926019561}, {924515422,-1938287195}, | ||||
| {899064965,-1950222603}, {873460227,-1961823959}, {847705824,-1973089164}, | ||||
| {821806407,-1984016190}, {795765941,-1994603364}, {769589125,-2004848771}, | ||||
| {743280682,-2014750566}, {716844642,-2024307233}, {690286016,-2033516961}, | ||||
| {663608871,-2042378339}, {636818019,-2050889764}, {609918296,-2059049705}, | ||||
| {582913822,-2066856911}, {555809715,-2074309903}, {528610126,-2081407540}, | ||||
| {501319962,-2088148536}, {473944148,-2094531680}, {446486876,-2100555994}, | ||||
| {418953102,-2106220386}, {391347792,-2111523838}, {363675176,-2116465540}, | ||||
| {335940246,-2121044593}, {308148006,-2125260177}, {280302715,-2129111646}, | ||||
| {252409648,-2132598271}, {224473078,-2135719516}, {196498046,-2138474814}, | ||||
| {168489600,-2140863674}, {140452029,-2142885728}, {112390647,-2144540593}, | ||||
| {84309753,-2145828017}, {56214412,-2146747762}, {28109695,-2147299667}, | ||||
| {2147483647,0}, {2146747758,-56214570}, {2144540595,-112390613}, | ||||
| {2140863671,-168489630}, {2135719506,-224473172}, {2129111626,-280302871}, | ||||
| {2121044558,-335940465}, {2111523833,-391347822}, {2100555974,-446486968}, | ||||
| {2088148500,-501320115}, {2074309912,-555809682}, {2059049696,-609918325}, | ||||
| {2042378310,-663608960}, {2024307180,-716844791}, {2004848691,-769589332}, | ||||
| {1984016179,-821806435}, {1961823921,-873460313}, {1938287127,-924515564}, | ||||
| {1913421927,-974937199}, {1887245364,-1024690661}, {1859775377,-1073741851}, | ||||
| {1831030826,-1122057097}, {1801031311,-1169603450}, {1769797456,-1216348214}, | ||||
| {1737350743,-1262259248}, {1703713340,-1307305194}, {1668908218,-1351455280}, | ||||
| {1632959307,-1394679144}, {1595891331,-1436947067}, {1557729613,-1478230181}, | ||||
| {1518500216,-1518500282}, {1478230113,-1557729677}, {1436946998,-1595891394}, | ||||
| {1394679073,-1632959368}, {1351455207,-1668908277}, {1307305120,-1703713397}, | ||||
| {1262259172,-1737350799}, {1216348136,-1769797510}, {1169603371,-1801031362}, | ||||
| {1122057017,-1831030875}, {1073741769,-1859775424}, {1024690635,-1887245378}, | ||||
| {974937230,-1913421912}, {924515422,-1938287195}, {873460227,-1961823959}, | ||||
| {821806407,-1984016190}, {769589125,-2004848771}, {716844642,-2024307233}, | ||||
| {663608871,-2042378339}, {609918296,-2059049705}, {555809715,-2074309903}, | ||||
| {501319962,-2088148536}, {446486876,-2100555994}, {391347792,-2111523838}, | ||||
| {335940246,-2121044593}, {280302715,-2129111646}, {224473078,-2135719516}, | ||||
| {168489600,-2140863674}, {112390647,-2144540593}, {56214412,-2146747762}, | ||||
| {-94,-2147483647}, {-56214600,-2146747757}, {-112390835,-2144540584}, | ||||
| {-168489787,-2140863659}, {-224473265,-2135719496}, {-280302901,-2129111622}, | ||||
| {-335940431,-2121044564}, {-391347977,-2111523804}, {-446487060,-2100555955}, | ||||
| {-501320144,-2088148493}, {-555809896,-2074309855}, {-609918476,-2059049651}, | ||||
| {-663609049,-2042378281}, {-716844819,-2024307170}, {-769589300,-2004848703}, | ||||
| {-821806581,-1984016118}, {-873460398,-1961823883}, {-924515591,-1938287114}, | ||||
| {-974937397,-1913421827}, {-1024690575,-1887245411}, {-1073741932,-1859775330}, | ||||
| {-1122057395,-1831030643}, {-1169603421,-1801031330}, {-1216348291,-1769797403}, | ||||
| {-1262259116,-1737350839}, {-1307305268,-1703713283}, {-1351455453,-1668908078}, | ||||
| {-1394679021,-1632959413}, {-1436947137,-1595891268}, {-1478230435,-1557729372}, | ||||
| {-1518500258,-1518500240}, {-1557729742,-1478230045}, {-1595891628,-1436946738}, | ||||
| {-1632959429,-1394679001}, {-1668908417,-1351455035}, {-1703713298,-1307305248}, | ||||
| {-1737350854,-1262259096}, {-1769797708,-1216347848}, {-1801031344,-1169603400}, | ||||
| {-1831030924,-1122056937}, {-1859775343,-1073741910}, {-1887245423,-1024690552}, | ||||
| {-1913422071,-974936918}, {-1938287125,-924515568}, {-1961823997,-873460141}, | ||||
| {-1984016324,-821806084}, {-2004848713,-769589276}, {-2024307264,-716844553}, | ||||
| {-2042378447,-663608538}, {-2059049731,-609918206}, {-2074309994,-555809377}, | ||||
| {-2088148499,-501320119}, {-2100556013,-446486785}, {-2111523902,-391347448}, | ||||
| {-2121044568,-335940406}, {-2129111659,-280302621}, {-2135719499,-224473240}, | ||||
| {-2140863681,-168489506}, {-2144540612,-112390298}, {-2146747758,-56214574}, | ||||
| {2147483647,0}, {2145828015,-84309815}, {2140863671,-168489630}, | ||||
| {2132598271,-252409646}, {2121044558,-335940465}, {2106220349,-418953288}, | ||||
| {2088148500,-501320115}, {2066856885,-582913912}, {2042378310,-663608960}, | ||||
| {2014750533,-743280770}, {1984016179,-821806435}, {1950222618,-899064934}, | ||||
| {1913421927,-974937199}, {1873670877,-1049306180}, {1831030826,-1122057097}, | ||||
| {1785567394,-1193077993}, {1737350743,-1262259248}, {1686455222,-1329494189}, | ||||
| {1632959307,-1394679144}, {1576945572,-1457713510}, {1518500216,-1518500282}, | ||||
| {1457713441,-1576945636}, {1394679073,-1632959368}, {1329494115,-1686455280}, | ||||
| {1262259172,-1737350799}, {1193077915,-1785567446}, {1122057017,-1831030875}, | ||||
| {1049305987,-1873670985}, {974937230,-1913421912}, {899064965,-1950222603}, | ||||
| {821806407,-1984016190}, {743280682,-2014750566}, {663608871,-2042378339}, | ||||
| {582913822,-2066856911}, {501319962,-2088148536}, {418953102,-2106220386}, | ||||
| {335940246,-2121044593}, {252409648,-2132598271}, {168489600,-2140863674}, | ||||
| {84309753,-2145828017}, {-94,-2147483647}, {-84309940,-2145828010}, | ||||
| {-168489787,-2140863659}, {-252409834,-2132598249}, {-335940431,-2121044564}, | ||||
| {-418953286,-2106220349}, {-501320144,-2088148493}, {-582914003,-2066856860}, | ||||
| {-663609049,-2042378281}, {-743280858,-2014750501}, {-821806581,-1984016118}, | ||||
| {-899065136,-1950222525}, {-974937397,-1913421827}, {-1049306374,-1873670768}, | ||||
| {-1122057395,-1831030643}, {-1193078284,-1785567199}, {-1262259116,-1737350839}, | ||||
| {-1329494061,-1686455323}, {-1394679021,-1632959413}, {-1457713485,-1576945595}, | ||||
| {-1518500258,-1518500240}, {-1576945613,-1457713466}, {-1632959429,-1394679001}, | ||||
| {-1686455338,-1329494041}, {-1737350854,-1262259096}, {-1785567498,-1193077837}, | ||||
| {-1831030924,-1122056937}, {-1873671031,-1049305905}, {-1913422071,-974936918}, | ||||
| {-1950222750,-899064648}, {-1984016324,-821806084}, {-2014750687,-743280354}, | ||||
| {-2042378447,-663608538}, {-2066856867,-582913978}, {-2088148499,-501320119}, | ||||
| {-2106220354,-418953261}, {-2121044568,-335940406}, {-2132598282,-252409555}, | ||||
| {-2140863681,-168489506}, {-2145828021,-84309659}, {-2147483647,188}, | ||||
| {-2145828006,84310034}, {-2140863651,168489881}, {-2132598237,252409928}, | ||||
| {-2121044509,335940777}, {-2106220281,418953629}, {-2088148411,501320484}, | ||||
| {-2066856765,582914339}, {-2042378331,663608895}, {-2014750557,743280706}, | ||||
| {-1984016181,821806431}, {-1950222593,899064989}, {-1913421900,974937252}, | ||||
| {-1873670848,1049306232}, {-1831030728,1122057257}, {-1785567289,1193078149}, | ||||
| {-1737350633,1262259400}, {-1686455106,1329494336}, {-1632959185,1394679287}, | ||||
| {-1576945358,1457713742}, {-1518499993,1518500506}, {-1457713209,1576945850}, | ||||
| {-1394678735,1632959656}, {-1329493766,1686455555}, {-1262258813,1737351059}, | ||||
| {-1193077546,1785567692}, {-1122056638,1831031107}, {-1049305599,1873671202}, | ||||
| {-974936606,1913422229}, {-899064330,1950222896}, {-821805761,1984016458}, | ||||
| {-743280025,2014750808}, {-663609179,2042378239}, {-582914134,2066856823}, | ||||
| {-501320277,2088148461}, {-418953420,2106220322}, {-335940566,2121044542}, | ||||
| {-252409716,2132598263}, {-168489668,2140863668}, {-84309821,2145828015}, | ||||
| }; | ||||
| static const ne10_fft_cpx_int32_t ne10_twiddles_240[240] = { | ||||
| {0,0}, {2147483647,0}, {2147483647,0}, | ||||
| {2147483647,0}, {1961823921,-873460313}, {1436946998,-1595891394}, | ||||
| {2147483647,0}, {1436946998,-1595891394}, {-224473265,-2135719496}, | ||||
| {2147483647,0}, {663608871,-2042378339}, {-1737350854,-1262259096}, | ||||
| {2147483647,0}, {-224473265,-2135719496}, {-2100555935,446487152}, | ||||
| {2147483647,0}, {2135719506,-224473172}, {2100555974,-446486968}, | ||||
| {2042378310,-663608960}, {1961823921,-873460313}, {1859775377,-1073741851}, | ||||
| {1737350743,-1262259248}, {1595891331,-1436947067}, {1436946998,-1595891394}, | ||||
| {1262259172,-1737350799}, {1073741769,-1859775424}, {873460227,-1961823959}, | ||||
| {663608871,-2042378339}, {446486876,-2100555994}, {224473078,-2135719516}, | ||||
| {2147483647,0}, {2100555974,-446486968}, {1961823921,-873460313}, | ||||
| {1737350743,-1262259248}, {1436946998,-1595891394}, {1073741769,-1859775424}, | ||||
| {663608871,-2042378339}, {224473078,-2135719516}, {-224473265,-2135719496}, | ||||
| {-663609049,-2042378281}, {-1073741932,-1859775330}, {-1436947137,-1595891268}, | ||||
| {-1737350854,-1262259096}, {-1961823997,-873460141}, {-2100556013,-446486785}, | ||||
| {2147483647,0}, {2042378310,-663608960}, {1737350743,-1262259248}, | ||||
| {1262259172,-1737350799}, {663608871,-2042378339}, {-94,-2147483647}, | ||||
| {-663609049,-2042378281}, {-1262259116,-1737350839}, {-1737350854,-1262259096}, | ||||
| {-2042378447,-663608538}, {-2147483647,188}, {-2042378331,663608895}, | ||||
| {-1737350633,1262259400}, {-1262258813,1737351059}, {-663609179,2042378239}, | ||||
| {2147483647,0}, {2146747758,-56214570}, {2144540595,-112390613}, | ||||
| {2140863671,-168489630}, {2135719506,-224473172}, {2129111626,-280302871}, | ||||
| {2121044558,-335940465}, {2111523833,-391347822}, {2100555974,-446486968}, | ||||
| {2088148500,-501320115}, {2074309912,-555809682}, {2059049696,-609918325}, | ||||
| {2042378310,-663608960}, {2024307180,-716844791}, {2004848691,-769589332}, | ||||
| {1984016179,-821806435}, {1961823921,-873460313}, {1938287127,-924515564}, | ||||
| {1913421927,-974937199}, {1887245364,-1024690661}, {1859775377,-1073741851}, | ||||
| {1831030826,-1122057097}, {1801031311,-1169603450}, {1769797456,-1216348214}, | ||||
| {1737350743,-1262259248}, {1703713340,-1307305194}, {1668908218,-1351455280}, | ||||
| {1632959307,-1394679144}, {1595891331,-1436947067}, {1557729613,-1478230181}, | ||||
| {1518500216,-1518500282}, {1478230113,-1557729677}, {1436946998,-1595891394}, | ||||
| {1394679073,-1632959368}, {1351455207,-1668908277}, {1307305120,-1703713397}, | ||||
| {1262259172,-1737350799}, {1216348136,-1769797510}, {1169603371,-1801031362}, | ||||
| {1122057017,-1831030875}, {1073741769,-1859775424}, {1024690635,-1887245378}, | ||||
| {974937230,-1913421912}, {924515422,-1938287195}, {873460227,-1961823959}, | ||||
| {821806407,-1984016190}, {769589125,-2004848771}, {716844642,-2024307233}, | ||||
| {663608871,-2042378339}, {609918296,-2059049705}, {555809715,-2074309903}, | ||||
| {501319962,-2088148536}, {446486876,-2100555994}, {391347792,-2111523838}, | ||||
| {335940246,-2121044593}, {280302715,-2129111646}, {224473078,-2135719516}, | ||||
| {168489600,-2140863674}, {112390647,-2144540593}, {56214412,-2146747762}, | ||||
| {2147483647,0}, {2144540595,-112390613}, {2135719506,-224473172}, | ||||
| {2121044558,-335940465}, {2100555974,-446486968}, {2074309912,-555809682}, | ||||
| {2042378310,-663608960}, {2004848691,-769589332}, {1961823921,-873460313}, | ||||
| {1913421927,-974937199}, {1859775377,-1073741851}, {1801031311,-1169603450}, | ||||
| {1737350743,-1262259248}, {1668908218,-1351455280}, {1595891331,-1436947067}, | ||||
| {1518500216,-1518500282}, {1436946998,-1595891394}, {1351455207,-1668908277}, | ||||
| {1262259172,-1737350799}, {1169603371,-1801031362}, {1073741769,-1859775424}, | ||||
| {974937230,-1913421912}, {873460227,-1961823959}, {769589125,-2004848771}, | ||||
| {663608871,-2042378339}, {555809715,-2074309903}, {446486876,-2100555994}, | ||||
| {335940246,-2121044593}, {224473078,-2135719516}, {112390647,-2144540593}, | ||||
| {-94,-2147483647}, {-112390835,-2144540584}, {-224473265,-2135719496}, | ||||
| {-335940431,-2121044564}, {-446487060,-2100555955}, {-555809896,-2074309855}, | ||||
| {-663609049,-2042378281}, {-769589300,-2004848703}, {-873460398,-1961823883}, | ||||
| {-974937397,-1913421827}, {-1073741932,-1859775330}, {-1169603421,-1801031330}, | ||||
| {-1262259116,-1737350839}, {-1351455453,-1668908078}, {-1436947137,-1595891268}, | ||||
| {-1518500258,-1518500240}, {-1595891628,-1436946738}, {-1668908417,-1351455035}, | ||||
| {-1737350854,-1262259096}, {-1801031344,-1169603400}, {-1859775343,-1073741910}, | ||||
| {-1913422071,-974936918}, {-1961823997,-873460141}, {-2004848713,-769589276}, | ||||
| {-2042378447,-663608538}, {-2074309994,-555809377}, {-2100556013,-446486785}, | ||||
| {-2121044568,-335940406}, {-2135719499,-224473240}, {-2144540612,-112390298}, | ||||
| {2147483647,0}, {2140863671,-168489630}, {2121044558,-335940465}, | ||||
| {2088148500,-501320115}, {2042378310,-663608960}, {1984016179,-821806435}, | ||||
| {1913421927,-974937199}, {1831030826,-1122057097}, {1737350743,-1262259248}, | ||||
| {1632959307,-1394679144}, {1518500216,-1518500282}, {1394679073,-1632959368}, | ||||
| {1262259172,-1737350799}, {1122057017,-1831030875}, {974937230,-1913421912}, | ||||
| {821806407,-1984016190}, {663608871,-2042378339}, {501319962,-2088148536}, | ||||
| {335940246,-2121044593}, {168489600,-2140863674}, {-94,-2147483647}, | ||||
| {-168489787,-2140863659}, {-335940431,-2121044564}, {-501320144,-2088148493}, | ||||
| {-663609049,-2042378281}, {-821806581,-1984016118}, {-974937397,-1913421827}, | ||||
| {-1122057395,-1831030643}, {-1262259116,-1737350839}, {-1394679021,-1632959413}, | ||||
| {-1518500258,-1518500240}, {-1632959429,-1394679001}, {-1737350854,-1262259096}, | ||||
| {-1831030924,-1122056937}, {-1913422071,-974936918}, {-1984016324,-821806084}, | ||||
| {-2042378447,-663608538}, {-2088148499,-501320119}, {-2121044568,-335940406}, | ||||
| {-2140863681,-168489506}, {-2147483647,188}, {-2140863651,168489881}, | ||||
| {-2121044509,335940777}, {-2088148411,501320484}, {-2042378331,663608895}, | ||||
| {-1984016181,821806431}, {-1913421900,974937252}, {-1831030728,1122057257}, | ||||
| {-1737350633,1262259400}, {-1632959185,1394679287}, {-1518499993,1518500506}, | ||||
| {-1394678735,1632959656}, {-1262258813,1737351059}, {-1122056638,1831031107}, | ||||
| {-974936606,1913422229}, {-821805761,1984016458}, {-663609179,2042378239}, | ||||
| {-501320277,2088148461}, {-335940566,2121044542}, {-168489668,2140863668}, | ||||
| }; | ||||
| static const ne10_fft_cpx_int32_t ne10_twiddles_120[120] = { | ||||
| {0,0}, {2147483647,0}, {2147483647,0}, | ||||
| {2147483647,0}, {1961823921,-873460313}, {1436946998,-1595891394}, | ||||
| {2147483647,0}, {1436946998,-1595891394}, {-224473265,-2135719496}, | ||||
| {2147483647,0}, {663608871,-2042378339}, {-1737350854,-1262259096}, | ||||
| {2147483647,0}, {-224473265,-2135719496}, {-2100555935,446487152}, | ||||
| {2147483647,0}, {2100555974,-446486968}, {1961823921,-873460313}, | ||||
| {1737350743,-1262259248}, {1436946998,-1595891394}, {1073741769,-1859775424}, | ||||
| {663608871,-2042378339}, {224473078,-2135719516}, {-224473265,-2135719496}, | ||||
| {-663609049,-2042378281}, {-1073741932,-1859775330}, {-1436947137,-1595891268}, | ||||
| {-1737350854,-1262259096}, {-1961823997,-873460141}, {-2100556013,-446486785}, | ||||
| {2147483647,0}, {2144540595,-112390613}, {2135719506,-224473172}, | ||||
| {2121044558,-335940465}, {2100555974,-446486968}, {2074309912,-555809682}, | ||||
| {2042378310,-663608960}, {2004848691,-769589332}, {1961823921,-873460313}, | ||||
| {1913421927,-974937199}, {1859775377,-1073741851}, {1801031311,-1169603450}, | ||||
| {1737350743,-1262259248}, {1668908218,-1351455280}, {1595891331,-1436947067}, | ||||
| {1518500216,-1518500282}, {1436946998,-1595891394}, {1351455207,-1668908277}, | ||||
| {1262259172,-1737350799}, {1169603371,-1801031362}, {1073741769,-1859775424}, | ||||
| {974937230,-1913421912}, {873460227,-1961823959}, {769589125,-2004848771}, | ||||
| {663608871,-2042378339}, {555809715,-2074309903}, {446486876,-2100555994}, | ||||
| {335940246,-2121044593}, {224473078,-2135719516}, {112390647,-2144540593}, | ||||
| {2147483647,0}, {2135719506,-224473172}, {2100555974,-446486968}, | ||||
| {2042378310,-663608960}, {1961823921,-873460313}, {1859775377,-1073741851}, | ||||
| {1737350743,-1262259248}, {1595891331,-1436947067}, {1436946998,-1595891394}, | ||||
| {1262259172,-1737350799}, {1073741769,-1859775424}, {873460227,-1961823959}, | ||||
| {663608871,-2042378339}, {446486876,-2100555994}, {224473078,-2135719516}, | ||||
| {-94,-2147483647}, {-224473265,-2135719496}, {-446487060,-2100555955}, | ||||
| {-663609049,-2042378281}, {-873460398,-1961823883}, {-1073741932,-1859775330}, | ||||
| {-1262259116,-1737350839}, {-1436947137,-1595891268}, {-1595891628,-1436946738}, | ||||
| {-1737350854,-1262259096}, {-1859775343,-1073741910}, {-1961823997,-873460141}, | ||||
| {-2042378447,-663608538}, {-2100556013,-446486785}, {-2135719499,-224473240}, | ||||
| {2147483647,0}, {2121044558,-335940465}, {2042378310,-663608960}, | ||||
| {1913421927,-974937199}, {1737350743,-1262259248}, {1518500216,-1518500282}, | ||||
| {1262259172,-1737350799}, {974937230,-1913421912}, {663608871,-2042378339}, | ||||
| {335940246,-2121044593}, {-94,-2147483647}, {-335940431,-2121044564}, | ||||
| {-663609049,-2042378281}, {-974937397,-1913421827}, {-1262259116,-1737350839}, | ||||
| {-1518500258,-1518500240}, {-1737350854,-1262259096}, {-1913422071,-974936918}, | ||||
| {-2042378447,-663608538}, {-2121044568,-335940406}, {-2147483647,188}, | ||||
| {-2121044509,335940777}, {-2042378331,663608895}, {-1913421900,974937252}, | ||||
| {-1737350633,1262259400}, {-1518499993,1518500506}, {-1262258813,1737351059}, | ||||
| {-974936606,1913422229}, {-663609179,2042378239}, {-335940566,2121044542}, | ||||
| }; | ||||
| static const ne10_fft_cpx_int32_t ne10_twiddles_60[60] = { | ||||
| {0,0}, {2147483647,0}, {2147483647,0}, | ||||
| {2147483647,0}, {1961823921,-873460313}, {1436946998,-1595891394}, | ||||
| {2147483647,0}, {1436946998,-1595891394}, {-224473265,-2135719496}, | ||||
| {2147483647,0}, {663608871,-2042378339}, {-1737350854,-1262259096}, | ||||
| {2147483647,0}, {-224473265,-2135719496}, {-2100555935,446487152}, | ||||
| {2147483647,0}, {2135719506,-224473172}, {2100555974,-446486968}, | ||||
| {2042378310,-663608960}, {1961823921,-873460313}, {1859775377,-1073741851}, | ||||
| {1737350743,-1262259248}, {1595891331,-1436947067}, {1436946998,-1595891394}, | ||||
| {1262259172,-1737350799}, {1073741769,-1859775424}, {873460227,-1961823959}, | ||||
| {663608871,-2042378339}, {446486876,-2100555994}, {224473078,-2135719516}, | ||||
| {2147483647,0}, {2100555974,-446486968}, {1961823921,-873460313}, | ||||
| {1737350743,-1262259248}, {1436946998,-1595891394}, {1073741769,-1859775424}, | ||||
| {663608871,-2042378339}, {224473078,-2135719516}, {-224473265,-2135719496}, | ||||
| {-663609049,-2042378281}, {-1073741932,-1859775330}, {-1436947137,-1595891268}, | ||||
| {-1737350854,-1262259096}, {-1961823997,-873460141}, {-2100556013,-446486785}, | ||||
| {2147483647,0}, {2042378310,-663608960}, {1737350743,-1262259248}, | ||||
| {1262259172,-1737350799}, {663608871,-2042378339}, {-94,-2147483647}, | ||||
| {-663609049,-2042378281}, {-1262259116,-1737350839}, {-1737350854,-1262259096}, | ||||
| {-2042378447,-663608538}, {-2147483647,188}, {-2042378331,663608895}, | ||||
| {-1737350633,1262259400}, {-1262258813,1737351059}, {-663609179,2042378239}, | ||||
| }; | ||||
| static const ne10_fft_state_int32_t ne10_fft_state_int32_t_480 = { | ||||
| 120, | ||||
| (ne10_int32_t *)ne10_factors_480, | ||||
| (ne10_fft_cpx_int32_t *)ne10_twiddles_480, | ||||
| NULL, | ||||
| (ne10_fft_cpx_int32_t *)&ne10_twiddles_480[120], | ||||
| }; | ||||
| static const arch_fft_state cfg_arch_480 = { | ||||
| 1, | ||||
| (void *)&ne10_fft_state_int32_t_480, | ||||
| }; | ||||
| 
 | ||||
| static const ne10_fft_state_int32_t ne10_fft_state_int32_t_240 = { | ||||
| 60, | ||||
| (ne10_int32_t *)ne10_factors_240, | ||||
| (ne10_fft_cpx_int32_t *)ne10_twiddles_240, | ||||
| NULL, | ||||
| (ne10_fft_cpx_int32_t *)&ne10_twiddles_240[60], | ||||
| }; | ||||
| static const arch_fft_state cfg_arch_240 = { | ||||
| 1, | ||||
| (void *)&ne10_fft_state_int32_t_240, | ||||
| }; | ||||
| 
 | ||||
| static const ne10_fft_state_int32_t ne10_fft_state_int32_t_120 = { | ||||
| 30, | ||||
| (ne10_int32_t *)ne10_factors_120, | ||||
| (ne10_fft_cpx_int32_t *)ne10_twiddles_120, | ||||
| NULL, | ||||
| (ne10_fft_cpx_int32_t *)&ne10_twiddles_120[30], | ||||
| }; | ||||
| static const arch_fft_state cfg_arch_120 = { | ||||
| 1, | ||||
| (void *)&ne10_fft_state_int32_t_120, | ||||
| }; | ||||
| 
 | ||||
| static const ne10_fft_state_int32_t ne10_fft_state_int32_t_60 = { | ||||
| 15, | ||||
| (ne10_int32_t *)ne10_factors_60, | ||||
| (ne10_fft_cpx_int32_t *)ne10_twiddles_60, | ||||
| NULL, | ||||
| (ne10_fft_cpx_int32_t *)&ne10_twiddles_60[15], | ||||
| }; | ||||
| static const arch_fft_state cfg_arch_60 = { | ||||
| 1, | ||||
| (void *)&ne10_fft_state_int32_t_60, | ||||
| }; | ||||
| 
 | ||||
| #endif  /* end NE10_FFT_PARAMS48000_960 */ | ||||
							
								
								
									
										888
									
								
								lib/rbcodec/codecs/libopus/celt/static_modes_float.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										888
									
								
								lib/rbcodec/codecs/libopus/celt/static_modes_float.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,888 @@ | |||
| /* The contents of this file was automatically generated by dump_modes.c
 | ||||
|    with arguments: 48000 960 | ||||
|    It contains static definitions for some pre-defined modes. */ | ||||
| #include "modes.h" | ||||
| #include "rate.h" | ||||
| 
 | ||||
| #ifdef HAVE_ARM_NE10 | ||||
| #define OVERRIDE_FFT 1 | ||||
| #include "static_modes_float_arm_ne10.h" | ||||
| #endif | ||||
| 
 | ||||
| #ifndef DEF_WINDOW120 | ||||
| #define DEF_WINDOW120 | ||||
| static const opus_val16 window120[120] = { | ||||
| 6.7286966e-05f, 0.00060551348f, 0.0016815970f, 0.0032947962f, 0.0054439943f, | ||||
| 0.0081276923f, 0.011344001f, 0.015090633f, 0.019364886f, 0.024163635f, | ||||
| 0.029483315f, 0.035319905f, 0.041668911f, 0.048525347f, 0.055883718f, | ||||
| 0.063737999f, 0.072081616f, 0.080907428f, 0.090207705f, 0.099974111f, | ||||
| 0.11019769f, 0.12086883f, 0.13197729f, 0.14351214f, 0.15546177f, | ||||
| 0.16781389f, 0.18055550f, 0.19367290f, 0.20715171f, 0.22097682f, | ||||
| 0.23513243f, 0.24960208f, 0.26436860f, 0.27941419f, 0.29472040f, | ||||
| 0.31026818f, 0.32603788f, 0.34200931f, 0.35816177f, 0.37447407f, | ||||
| 0.39092462f, 0.40749142f, 0.42415215f, 0.44088423f, 0.45766484f, | ||||
| 0.47447104f, 0.49127978f, 0.50806798f, 0.52481261f, 0.54149077f, | ||||
| 0.55807973f, 0.57455701f, 0.59090049f, 0.60708841f, 0.62309951f, | ||||
| 0.63891306f, 0.65450896f, 0.66986776f, 0.68497077f, 0.69980010f, | ||||
| 0.71433873f, 0.72857055f, 0.74248043f, 0.75605424f, 0.76927895f, | ||||
| 0.78214257f, 0.79463430f, 0.80674445f, 0.81846456f, 0.82978733f, | ||||
| 0.84070669f, 0.85121779f, 0.86131698f, 0.87100183f, 0.88027111f, | ||||
| 0.88912479f, 0.89756398f, 0.90559094f, 0.91320904f, 0.92042270f, | ||||
| 0.92723738f, 0.93365955f, 0.93969656f, 0.94535671f, 0.95064907f, | ||||
| 0.95558353f, 0.96017067f, 0.96442171f, 0.96834849f, 0.97196334f, | ||||
| 0.97527906f, 0.97830883f, 0.98106616f, 0.98356480f, 0.98581869f, | ||||
| 0.98784191f, 0.98964856f, 0.99125274f, 0.99266849f, 0.99390969f, | ||||
| 0.99499004f, 0.99592297f, 0.99672162f, 0.99739874f, 0.99796667f, | ||||
| 0.99843728f, 0.99882195f, 0.99913147f, 0.99937606f, 0.99956527f, | ||||
| 0.99970802f, 0.99981248f, 0.99988613f, 0.99993565f, 0.99996697f, | ||||
| 0.99998518f, 0.99999457f, 0.99999859f, 0.99999982f, 1.0000000f, | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef DEF_LOGN400 | ||||
| #define DEF_LOGN400 | ||||
| static const opus_int16 logN400[21] = { | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 8, 8, 8, 8, 16, 16, 16, 21, 21, 24, 29, 34, 36, }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef DEF_PULSE_CACHE50 | ||||
| #define DEF_PULSE_CACHE50 | ||||
| static const opus_int16 cache_index50[105] = { | ||||
| -1, -1, -1, -1, -1, -1, -1, -1, 0, 0, 0, 0, 41, 41, 41, | ||||
| 82, 82, 123, 164, 200, 222, 0, 0, 0, 0, 0, 0, 0, 0, 41, | ||||
| 41, 41, 41, 123, 123, 123, 164, 164, 240, 266, 283, 295, 41, 41, 41, | ||||
| 41, 41, 41, 41, 41, 123, 123, 123, 123, 240, 240, 240, 266, 266, 305, | ||||
| 318, 328, 336, 123, 123, 123, 123, 123, 123, 123, 123, 240, 240, 240, 240, | ||||
| 305, 305, 305, 318, 318, 343, 351, 358, 364, 240, 240, 240, 240, 240, 240, | ||||
| 240, 240, 305, 305, 305, 305, 343, 343, 343, 351, 351, 370, 376, 382, 387, | ||||
| }; | ||||
| static const unsigned char cache_bits50[392] = { | ||||
| 40, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, | ||||
| 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, | ||||
| 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 40, 15, 23, 28, | ||||
| 31, 34, 36, 38, 39, 41, 42, 43, 44, 45, 46, 47, 47, 49, 50, | ||||
| 51, 52, 53, 54, 55, 55, 57, 58, 59, 60, 61, 62, 63, 63, 65, | ||||
| 66, 67, 68, 69, 70, 71, 71, 40, 20, 33, 41, 48, 53, 57, 61, | ||||
| 64, 66, 69, 71, 73, 75, 76, 78, 80, 82, 85, 87, 89, 91, 92, | ||||
| 94, 96, 98, 101, 103, 105, 107, 108, 110, 112, 114, 117, 119, 121, 123, | ||||
| 124, 126, 128, 40, 23, 39, 51, 60, 67, 73, 79, 83, 87, 91, 94, | ||||
| 97, 100, 102, 105, 107, 111, 115, 118, 121, 124, 126, 129, 131, 135, 139, | ||||
| 142, 145, 148, 150, 153, 155, 159, 163, 166, 169, 172, 174, 177, 179, 35, | ||||
| 28, 49, 65, 78, 89, 99, 107, 114, 120, 126, 132, 136, 141, 145, 149, | ||||
| 153, 159, 165, 171, 176, 180, 185, 189, 192, 199, 205, 211, 216, 220, 225, | ||||
| 229, 232, 239, 245, 251, 21, 33, 58, 79, 97, 112, 125, 137, 148, 157, | ||||
| 166, 174, 182, 189, 195, 201, 207, 217, 227, 235, 243, 251, 17, 35, 63, | ||||
| 86, 106, 123, 139, 152, 165, 177, 187, 197, 206, 214, 222, 230, 237, 250, | ||||
| 25, 31, 55, 75, 91, 105, 117, 128, 138, 146, 154, 161, 168, 174, 180, | ||||
| 185, 190, 200, 208, 215, 222, 229, 235, 240, 245, 255, 16, 36, 65, 89, | ||||
| 110, 128, 144, 159, 173, 185, 196, 207, 217, 226, 234, 242, 250, 11, 41, | ||||
| 74, 103, 128, 151, 172, 191, 209, 225, 241, 255, 9, 43, 79, 110, 138, | ||||
| 163, 186, 207, 227, 246, 12, 39, 71, 99, 123, 144, 164, 182, 198, 214, | ||||
| 228, 241, 253, 9, 44, 81, 113, 142, 168, 192, 214, 235, 255, 7, 49, | ||||
| 90, 127, 160, 191, 220, 247, 6, 51, 95, 134, 170, 203, 234, 7, 47, | ||||
| 87, 123, 155, 184, 212, 237, 6, 52, 97, 137, 174, 208, 240, 5, 57, | ||||
| 106, 151, 192, 231, 5, 59, 111, 158, 202, 243, 5, 55, 103, 147, 187, | ||||
| 224, 5, 60, 113, 161, 206, 248, 4, 65, 122, 175, 224, 4, 67, 127, | ||||
| 182, 234, }; | ||||
| static const unsigned char cache_caps50[168] = { | ||||
| 224, 224, 224, 224, 224, 224, 224, 224, 160, 160, 160, 160, 185, 185, 185, | ||||
| 178, 178, 168, 134, 61, 37, 224, 224, 224, 224, 224, 224, 224, 224, 240, | ||||
| 240, 240, 240, 207, 207, 207, 198, 198, 183, 144, 66, 40, 160, 160, 160, | ||||
| 160, 160, 160, 160, 160, 185, 185, 185, 185, 193, 193, 193, 183, 183, 172, | ||||
| 138, 64, 38, 240, 240, 240, 240, 240, 240, 240, 240, 207, 207, 207, 207, | ||||
| 204, 204, 204, 193, 193, 180, 143, 66, 40, 185, 185, 185, 185, 185, 185, | ||||
| 185, 185, 193, 193, 193, 193, 193, 193, 193, 183, 183, 172, 138, 65, 39, | ||||
| 207, 207, 207, 207, 207, 207, 207, 207, 204, 204, 204, 204, 201, 201, 201, | ||||
| 188, 188, 176, 141, 66, 40, 193, 193, 193, 193, 193, 193, 193, 193, 193, | ||||
| 193, 193, 193, 194, 194, 194, 184, 184, 173, 139, 65, 39, 204, 204, 204, | ||||
| 204, 204, 204, 204, 204, 201, 201, 201, 201, 198, 198, 198, 187, 187, 175, | ||||
| 140, 66, 40, }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_TWIDDLES48000_960 | ||||
| #define FFT_TWIDDLES48000_960 | ||||
| static const kiss_twiddle_cpx fft_twiddles48000_960[480] = { | ||||
| {1.0000000f, -0.0000000f}, {0.99991433f, -0.013089596f}, | ||||
| {0.99965732f, -0.026176948f}, {0.99922904f, -0.039259816f}, | ||||
| {0.99862953f, -0.052335956f}, {0.99785892f, -0.065403129f}, | ||||
| {0.99691733f, -0.078459096f}, {0.99580493f, -0.091501619f}, | ||||
| {0.99452190f, -0.10452846f}, {0.99306846f, -0.11753740f}, | ||||
| {0.99144486f, -0.13052619f}, {0.98965139f, -0.14349262f}, | ||||
| {0.98768834f, -0.15643447f}, {0.98555606f, -0.16934950f}, | ||||
| {0.98325491f, -0.18223553f}, {0.98078528f, -0.19509032f}, | ||||
| {0.97814760f, -0.20791169f}, {0.97534232f, -0.22069744f}, | ||||
| {0.97236992f, -0.23344536f}, {0.96923091f, -0.24615329f}, | ||||
| {0.96592583f, -0.25881905f}, {0.96245524f, -0.27144045f}, | ||||
| {0.95881973f, -0.28401534f}, {0.95501994f, -0.29654157f}, | ||||
| {0.95105652f, -0.30901699f}, {0.94693013f, -0.32143947f}, | ||||
| {0.94264149f, -0.33380686f}, {0.93819134f, -0.34611706f}, | ||||
| {0.93358043f, -0.35836795f}, {0.92880955f, -0.37055744f}, | ||||
| {0.92387953f, -0.38268343f}, {0.91879121f, -0.39474386f}, | ||||
| {0.91354546f, -0.40673664f}, {0.90814317f, -0.41865974f}, | ||||
| {0.90258528f, -0.43051110f}, {0.89687274f, -0.44228869f}, | ||||
| {0.89100652f, -0.45399050f}, {0.88498764f, -0.46561452f}, | ||||
| {0.87881711f, -0.47715876f}, {0.87249601f, -0.48862124f}, | ||||
| {0.86602540f, -0.50000000f}, {0.85940641f, -0.51129309f}, | ||||
| {0.85264016f, -0.52249856f}, {0.84572782f, -0.53361452f}, | ||||
| {0.83867057f, -0.54463904f}, {0.83146961f, -0.55557023f}, | ||||
| {0.82412619f, -0.56640624f}, {0.81664156f, -0.57714519f}, | ||||
| {0.80901699f, -0.58778525f}, {0.80125381f, -0.59832460f}, | ||||
| {0.79335334f, -0.60876143f}, {0.78531693f, -0.61909395f}, | ||||
| {0.77714596f, -0.62932039f}, {0.76884183f, -0.63943900f}, | ||||
| {0.76040597f, -0.64944805f}, {0.75183981f, -0.65934582f}, | ||||
| {0.74314483f, -0.66913061f}, {0.73432251f, -0.67880075f}, | ||||
| {0.72537437f, -0.68835458f}, {0.71630194f, -0.69779046f}, | ||||
| {0.70710678f, -0.70710678f}, {0.69779046f, -0.71630194f}, | ||||
| {0.68835458f, -0.72537437f}, {0.67880075f, -0.73432251f}, | ||||
| {0.66913061f, -0.74314483f}, {0.65934582f, -0.75183981f}, | ||||
| {0.64944805f, -0.76040597f}, {0.63943900f, -0.76884183f}, | ||||
| {0.62932039f, -0.77714596f}, {0.61909395f, -0.78531693f}, | ||||
| {0.60876143f, -0.79335334f}, {0.59832460f, -0.80125381f}, | ||||
| {0.58778525f, -0.80901699f}, {0.57714519f, -0.81664156f}, | ||||
| {0.56640624f, -0.82412619f}, {0.55557023f, -0.83146961f}, | ||||
| {0.54463904f, -0.83867057f}, {0.53361452f, -0.84572782f}, | ||||
| {0.52249856f, -0.85264016f}, {0.51129309f, -0.85940641f}, | ||||
| {0.50000000f, -0.86602540f}, {0.48862124f, -0.87249601f}, | ||||
| {0.47715876f, -0.87881711f}, {0.46561452f, -0.88498764f}, | ||||
| {0.45399050f, -0.89100652f}, {0.44228869f, -0.89687274f}, | ||||
| {0.43051110f, -0.90258528f}, {0.41865974f, -0.90814317f}, | ||||
| {0.40673664f, -0.91354546f}, {0.39474386f, -0.91879121f}, | ||||
| {0.38268343f, -0.92387953f}, {0.37055744f, -0.92880955f}, | ||||
| {0.35836795f, -0.93358043f}, {0.34611706f, -0.93819134f}, | ||||
| {0.33380686f, -0.94264149f}, {0.32143947f, -0.94693013f}, | ||||
| {0.30901699f, -0.95105652f}, {0.29654157f, -0.95501994f}, | ||||
| {0.28401534f, -0.95881973f}, {0.27144045f, -0.96245524f}, | ||||
| {0.25881905f, -0.96592583f}, {0.24615329f, -0.96923091f}, | ||||
| {0.23344536f, -0.97236992f}, {0.22069744f, -0.97534232f}, | ||||
| {0.20791169f, -0.97814760f}, {0.19509032f, -0.98078528f}, | ||||
| {0.18223553f, -0.98325491f}, {0.16934950f, -0.98555606f}, | ||||
| {0.15643447f, -0.98768834f}, {0.14349262f, -0.98965139f}, | ||||
| {0.13052619f, -0.99144486f}, {0.11753740f, -0.99306846f}, | ||||
| {0.10452846f, -0.99452190f}, {0.091501619f, -0.99580493f}, | ||||
| {0.078459096f, -0.99691733f}, {0.065403129f, -0.99785892f}, | ||||
| {0.052335956f, -0.99862953f}, {0.039259816f, -0.99922904f}, | ||||
| {0.026176948f, -0.99965732f}, {0.013089596f, -0.99991433f}, | ||||
| {6.1230318e-17f, -1.0000000f}, {-0.013089596f, -0.99991433f}, | ||||
| {-0.026176948f, -0.99965732f}, {-0.039259816f, -0.99922904f}, | ||||
| {-0.052335956f, -0.99862953f}, {-0.065403129f, -0.99785892f}, | ||||
| {-0.078459096f, -0.99691733f}, {-0.091501619f, -0.99580493f}, | ||||
| {-0.10452846f, -0.99452190f}, {-0.11753740f, -0.99306846f}, | ||||
| {-0.13052619f, -0.99144486f}, {-0.14349262f, -0.98965139f}, | ||||
| {-0.15643447f, -0.98768834f}, {-0.16934950f, -0.98555606f}, | ||||
| {-0.18223553f, -0.98325491f}, {-0.19509032f, -0.98078528f}, | ||||
| {-0.20791169f, -0.97814760f}, {-0.22069744f, -0.97534232f}, | ||||
| {-0.23344536f, -0.97236992f}, {-0.24615329f, -0.96923091f}, | ||||
| {-0.25881905f, -0.96592583f}, {-0.27144045f, -0.96245524f}, | ||||
| {-0.28401534f, -0.95881973f}, {-0.29654157f, -0.95501994f}, | ||||
| {-0.30901699f, -0.95105652f}, {-0.32143947f, -0.94693013f}, | ||||
| {-0.33380686f, -0.94264149f}, {-0.34611706f, -0.93819134f}, | ||||
| {-0.35836795f, -0.93358043f}, {-0.37055744f, -0.92880955f}, | ||||
| {-0.38268343f, -0.92387953f}, {-0.39474386f, -0.91879121f}, | ||||
| {-0.40673664f, -0.91354546f}, {-0.41865974f, -0.90814317f}, | ||||
| {-0.43051110f, -0.90258528f}, {-0.44228869f, -0.89687274f}, | ||||
| {-0.45399050f, -0.89100652f}, {-0.46561452f, -0.88498764f}, | ||||
| {-0.47715876f, -0.87881711f}, {-0.48862124f, -0.87249601f}, | ||||
| {-0.50000000f, -0.86602540f}, {-0.51129309f, -0.85940641f}, | ||||
| {-0.52249856f, -0.85264016f}, {-0.53361452f, -0.84572782f}, | ||||
| {-0.54463904f, -0.83867057f}, {-0.55557023f, -0.83146961f}, | ||||
| {-0.56640624f, -0.82412619f}, {-0.57714519f, -0.81664156f}, | ||||
| {-0.58778525f, -0.80901699f}, {-0.59832460f, -0.80125381f}, | ||||
| {-0.60876143f, -0.79335334f}, {-0.61909395f, -0.78531693f}, | ||||
| {-0.62932039f, -0.77714596f}, {-0.63943900f, -0.76884183f}, | ||||
| {-0.64944805f, -0.76040597f}, {-0.65934582f, -0.75183981f}, | ||||
| {-0.66913061f, -0.74314483f}, {-0.67880075f, -0.73432251f}, | ||||
| {-0.68835458f, -0.72537437f}, {-0.69779046f, -0.71630194f}, | ||||
| {-0.70710678f, -0.70710678f}, {-0.71630194f, -0.69779046f}, | ||||
| {-0.72537437f, -0.68835458f}, {-0.73432251f, -0.67880075f}, | ||||
| {-0.74314483f, -0.66913061f}, {-0.75183981f, -0.65934582f}, | ||||
| {-0.76040597f, -0.64944805f}, {-0.76884183f, -0.63943900f}, | ||||
| {-0.77714596f, -0.62932039f}, {-0.78531693f, -0.61909395f}, | ||||
| {-0.79335334f, -0.60876143f}, {-0.80125381f, -0.59832460f}, | ||||
| {-0.80901699f, -0.58778525f}, {-0.81664156f, -0.57714519f}, | ||||
| {-0.82412619f, -0.56640624f}, {-0.83146961f, -0.55557023f}, | ||||
| {-0.83867057f, -0.54463904f}, {-0.84572782f, -0.53361452f}, | ||||
| {-0.85264016f, -0.52249856f}, {-0.85940641f, -0.51129309f}, | ||||
| {-0.86602540f, -0.50000000f}, {-0.87249601f, -0.48862124f}, | ||||
| {-0.87881711f, -0.47715876f}, {-0.88498764f, -0.46561452f}, | ||||
| {-0.89100652f, -0.45399050f}, {-0.89687274f, -0.44228869f}, | ||||
| {-0.90258528f, -0.43051110f}, {-0.90814317f, -0.41865974f}, | ||||
| {-0.91354546f, -0.40673664f}, {-0.91879121f, -0.39474386f}, | ||||
| {-0.92387953f, -0.38268343f}, {-0.92880955f, -0.37055744f}, | ||||
| {-0.93358043f, -0.35836795f}, {-0.93819134f, -0.34611706f}, | ||||
| {-0.94264149f, -0.33380686f}, {-0.94693013f, -0.32143947f}, | ||||
| {-0.95105652f, -0.30901699f}, {-0.95501994f, -0.29654157f}, | ||||
| {-0.95881973f, -0.28401534f}, {-0.96245524f, -0.27144045f}, | ||||
| {-0.96592583f, -0.25881905f}, {-0.96923091f, -0.24615329f}, | ||||
| {-0.97236992f, -0.23344536f}, {-0.97534232f, -0.22069744f}, | ||||
| {-0.97814760f, -0.20791169f}, {-0.98078528f, -0.19509032f}, | ||||
| {-0.98325491f, -0.18223553f}, {-0.98555606f, -0.16934950f}, | ||||
| {-0.98768834f, -0.15643447f}, {-0.98965139f, -0.14349262f}, | ||||
| {-0.99144486f, -0.13052619f}, {-0.99306846f, -0.11753740f}, | ||||
| {-0.99452190f, -0.10452846f}, {-0.99580493f, -0.091501619f}, | ||||
| {-0.99691733f, -0.078459096f}, {-0.99785892f, -0.065403129f}, | ||||
| {-0.99862953f, -0.052335956f}, {-0.99922904f, -0.039259816f}, | ||||
| {-0.99965732f, -0.026176948f}, {-0.99991433f, -0.013089596f}, | ||||
| {-1.0000000f, -1.2246064e-16f}, {-0.99991433f, 0.013089596f}, | ||||
| {-0.99965732f, 0.026176948f}, {-0.99922904f, 0.039259816f}, | ||||
| {-0.99862953f, 0.052335956f}, {-0.99785892f, 0.065403129f}, | ||||
| {-0.99691733f, 0.078459096f}, {-0.99580493f, 0.091501619f}, | ||||
| {-0.99452190f, 0.10452846f}, {-0.99306846f, 0.11753740f}, | ||||
| {-0.99144486f, 0.13052619f}, {-0.98965139f, 0.14349262f}, | ||||
| {-0.98768834f, 0.15643447f}, {-0.98555606f, 0.16934950f}, | ||||
| {-0.98325491f, 0.18223553f}, {-0.98078528f, 0.19509032f}, | ||||
| {-0.97814760f, 0.20791169f}, {-0.97534232f, 0.22069744f}, | ||||
| {-0.97236992f, 0.23344536f}, {-0.96923091f, 0.24615329f}, | ||||
| {-0.96592583f, 0.25881905f}, {-0.96245524f, 0.27144045f}, | ||||
| {-0.95881973f, 0.28401534f}, {-0.95501994f, 0.29654157f}, | ||||
| {-0.95105652f, 0.30901699f}, {-0.94693013f, 0.32143947f}, | ||||
| {-0.94264149f, 0.33380686f}, {-0.93819134f, 0.34611706f}, | ||||
| {-0.93358043f, 0.35836795f}, {-0.92880955f, 0.37055744f}, | ||||
| {-0.92387953f, 0.38268343f}, {-0.91879121f, 0.39474386f}, | ||||
| {-0.91354546f, 0.40673664f}, {-0.90814317f, 0.41865974f}, | ||||
| {-0.90258528f, 0.43051110f}, {-0.89687274f, 0.44228869f}, | ||||
| {-0.89100652f, 0.45399050f}, {-0.88498764f, 0.46561452f}, | ||||
| {-0.87881711f, 0.47715876f}, {-0.87249601f, 0.48862124f}, | ||||
| {-0.86602540f, 0.50000000f}, {-0.85940641f, 0.51129309f}, | ||||
| {-0.85264016f, 0.52249856f}, {-0.84572782f, 0.53361452f}, | ||||
| {-0.83867057f, 0.54463904f}, {-0.83146961f, 0.55557023f}, | ||||
| {-0.82412619f, 0.56640624f}, {-0.81664156f, 0.57714519f}, | ||||
| {-0.80901699f, 0.58778525f}, {-0.80125381f, 0.59832460f}, | ||||
| {-0.79335334f, 0.60876143f}, {-0.78531693f, 0.61909395f}, | ||||
| {-0.77714596f, 0.62932039f}, {-0.76884183f, 0.63943900f}, | ||||
| {-0.76040597f, 0.64944805f}, {-0.75183981f, 0.65934582f}, | ||||
| {-0.74314483f, 0.66913061f}, {-0.73432251f, 0.67880075f}, | ||||
| {-0.72537437f, 0.68835458f}, {-0.71630194f, 0.69779046f}, | ||||
| {-0.70710678f, 0.70710678f}, {-0.69779046f, 0.71630194f}, | ||||
| {-0.68835458f, 0.72537437f}, {-0.67880075f, 0.73432251f}, | ||||
| {-0.66913061f, 0.74314483f}, {-0.65934582f, 0.75183981f}, | ||||
| {-0.64944805f, 0.76040597f}, {-0.63943900f, 0.76884183f}, | ||||
| {-0.62932039f, 0.77714596f}, {-0.61909395f, 0.78531693f}, | ||||
| {-0.60876143f, 0.79335334f}, {-0.59832460f, 0.80125381f}, | ||||
| {-0.58778525f, 0.80901699f}, {-0.57714519f, 0.81664156f}, | ||||
| {-0.56640624f, 0.82412619f}, {-0.55557023f, 0.83146961f}, | ||||
| {-0.54463904f, 0.83867057f}, {-0.53361452f, 0.84572782f}, | ||||
| {-0.52249856f, 0.85264016f}, {-0.51129309f, 0.85940641f}, | ||||
| {-0.50000000f, 0.86602540f}, {-0.48862124f, 0.87249601f}, | ||||
| {-0.47715876f, 0.87881711f}, {-0.46561452f, 0.88498764f}, | ||||
| {-0.45399050f, 0.89100652f}, {-0.44228869f, 0.89687274f}, | ||||
| {-0.43051110f, 0.90258528f}, {-0.41865974f, 0.90814317f}, | ||||
| {-0.40673664f, 0.91354546f}, {-0.39474386f, 0.91879121f}, | ||||
| {-0.38268343f, 0.92387953f}, {-0.37055744f, 0.92880955f}, | ||||
| {-0.35836795f, 0.93358043f}, {-0.34611706f, 0.93819134f}, | ||||
| {-0.33380686f, 0.94264149f}, {-0.32143947f, 0.94693013f}, | ||||
| {-0.30901699f, 0.95105652f}, {-0.29654157f, 0.95501994f}, | ||||
| {-0.28401534f, 0.95881973f}, {-0.27144045f, 0.96245524f}, | ||||
| {-0.25881905f, 0.96592583f}, {-0.24615329f, 0.96923091f}, | ||||
| {-0.23344536f, 0.97236992f}, {-0.22069744f, 0.97534232f}, | ||||
| {-0.20791169f, 0.97814760f}, {-0.19509032f, 0.98078528f}, | ||||
| {-0.18223553f, 0.98325491f}, {-0.16934950f, 0.98555606f}, | ||||
| {-0.15643447f, 0.98768834f}, {-0.14349262f, 0.98965139f}, | ||||
| {-0.13052619f, 0.99144486f}, {-0.11753740f, 0.99306846f}, | ||||
| {-0.10452846f, 0.99452190f}, {-0.091501619f, 0.99580493f}, | ||||
| {-0.078459096f, 0.99691733f}, {-0.065403129f, 0.99785892f}, | ||||
| {-0.052335956f, 0.99862953f}, {-0.039259816f, 0.99922904f}, | ||||
| {-0.026176948f, 0.99965732f}, {-0.013089596f, 0.99991433f}, | ||||
| {-1.8369095e-16f, 1.0000000f}, {0.013089596f, 0.99991433f}, | ||||
| {0.026176948f, 0.99965732f}, {0.039259816f, 0.99922904f}, | ||||
| {0.052335956f, 0.99862953f}, {0.065403129f, 0.99785892f}, | ||||
| {0.078459096f, 0.99691733f}, {0.091501619f, 0.99580493f}, | ||||
| {0.10452846f, 0.99452190f}, {0.11753740f, 0.99306846f}, | ||||
| {0.13052619f, 0.99144486f}, {0.14349262f, 0.98965139f}, | ||||
| {0.15643447f, 0.98768834f}, {0.16934950f, 0.98555606f}, | ||||
| {0.18223553f, 0.98325491f}, {0.19509032f, 0.98078528f}, | ||||
| {0.20791169f, 0.97814760f}, {0.22069744f, 0.97534232f}, | ||||
| {0.23344536f, 0.97236992f}, {0.24615329f, 0.96923091f}, | ||||
| {0.25881905f, 0.96592583f}, {0.27144045f, 0.96245524f}, | ||||
| {0.28401534f, 0.95881973f}, {0.29654157f, 0.95501994f}, | ||||
| {0.30901699f, 0.95105652f}, {0.32143947f, 0.94693013f}, | ||||
| {0.33380686f, 0.94264149f}, {0.34611706f, 0.93819134f}, | ||||
| {0.35836795f, 0.93358043f}, {0.37055744f, 0.92880955f}, | ||||
| {0.38268343f, 0.92387953f}, {0.39474386f, 0.91879121f}, | ||||
| {0.40673664f, 0.91354546f}, {0.41865974f, 0.90814317f}, | ||||
| {0.43051110f, 0.90258528f}, {0.44228869f, 0.89687274f}, | ||||
| {0.45399050f, 0.89100652f}, {0.46561452f, 0.88498764f}, | ||||
| {0.47715876f, 0.87881711f}, {0.48862124f, 0.87249601f}, | ||||
| {0.50000000f, 0.86602540f}, {0.51129309f, 0.85940641f}, | ||||
| {0.52249856f, 0.85264016f}, {0.53361452f, 0.84572782f}, | ||||
| {0.54463904f, 0.83867057f}, {0.55557023f, 0.83146961f}, | ||||
| {0.56640624f, 0.82412619f}, {0.57714519f, 0.81664156f}, | ||||
| {0.58778525f, 0.80901699f}, {0.59832460f, 0.80125381f}, | ||||
| {0.60876143f, 0.79335334f}, {0.61909395f, 0.78531693f}, | ||||
| {0.62932039f, 0.77714596f}, {0.63943900f, 0.76884183f}, | ||||
| {0.64944805f, 0.76040597f}, {0.65934582f, 0.75183981f}, | ||||
| {0.66913061f, 0.74314483f}, {0.67880075f, 0.73432251f}, | ||||
| {0.68835458f, 0.72537437f}, {0.69779046f, 0.71630194f}, | ||||
| {0.70710678f, 0.70710678f}, {0.71630194f, 0.69779046f}, | ||||
| {0.72537437f, 0.68835458f}, {0.73432251f, 0.67880075f}, | ||||
| {0.74314483f, 0.66913061f}, {0.75183981f, 0.65934582f}, | ||||
| {0.76040597f, 0.64944805f}, {0.76884183f, 0.63943900f}, | ||||
| {0.77714596f, 0.62932039f}, {0.78531693f, 0.61909395f}, | ||||
| {0.79335334f, 0.60876143f}, {0.80125381f, 0.59832460f}, | ||||
| {0.80901699f, 0.58778525f}, {0.81664156f, 0.57714519f}, | ||||
| {0.82412619f, 0.56640624f}, {0.83146961f, 0.55557023f}, | ||||
| {0.83867057f, 0.54463904f}, {0.84572782f, 0.53361452f}, | ||||
| {0.85264016f, 0.52249856f}, {0.85940641f, 0.51129309f}, | ||||
| {0.86602540f, 0.50000000f}, {0.87249601f, 0.48862124f}, | ||||
| {0.87881711f, 0.47715876f}, {0.88498764f, 0.46561452f}, | ||||
| {0.89100652f, 0.45399050f}, {0.89687274f, 0.44228869f}, | ||||
| {0.90258528f, 0.43051110f}, {0.90814317f, 0.41865974f}, | ||||
| {0.91354546f, 0.40673664f}, {0.91879121f, 0.39474386f}, | ||||
| {0.92387953f, 0.38268343f}, {0.92880955f, 0.37055744f}, | ||||
| {0.93358043f, 0.35836795f}, {0.93819134f, 0.34611706f}, | ||||
| {0.94264149f, 0.33380686f}, {0.94693013f, 0.32143947f}, | ||||
| {0.95105652f, 0.30901699f}, {0.95501994f, 0.29654157f}, | ||||
| {0.95881973f, 0.28401534f}, {0.96245524f, 0.27144045f}, | ||||
| {0.96592583f, 0.25881905f}, {0.96923091f, 0.24615329f}, | ||||
| {0.97236992f, 0.23344536f}, {0.97534232f, 0.22069744f}, | ||||
| {0.97814760f, 0.20791169f}, {0.98078528f, 0.19509032f}, | ||||
| {0.98325491f, 0.18223553f}, {0.98555606f, 0.16934950f}, | ||||
| {0.98768834f, 0.15643447f}, {0.98965139f, 0.14349262f}, | ||||
| {0.99144486f, 0.13052619f}, {0.99306846f, 0.11753740f}, | ||||
| {0.99452190f, 0.10452846f}, {0.99580493f, 0.091501619f}, | ||||
| {0.99691733f, 0.078459096f}, {0.99785892f, 0.065403129f}, | ||||
| {0.99862953f, 0.052335956f}, {0.99922904f, 0.039259816f}, | ||||
| {0.99965732f, 0.026176948f}, {0.99991433f, 0.013089596f}, | ||||
| }; | ||||
| #ifndef FFT_BITREV480 | ||||
| #define FFT_BITREV480 | ||||
| static const opus_int16 fft_bitrev480[480] = { | ||||
| 0, 96, 192, 288, 384, 32, 128, 224, 320, 416, 64, 160, 256, 352, 448, | ||||
| 8, 104, 200, 296, 392, 40, 136, 232, 328, 424, 72, 168, 264, 360, 456, | ||||
| 16, 112, 208, 304, 400, 48, 144, 240, 336, 432, 80, 176, 272, 368, 464, | ||||
| 24, 120, 216, 312, 408, 56, 152, 248, 344, 440, 88, 184, 280, 376, 472, | ||||
| 4, 100, 196, 292, 388, 36, 132, 228, 324, 420, 68, 164, 260, 356, 452, | ||||
| 12, 108, 204, 300, 396, 44, 140, 236, 332, 428, 76, 172, 268, 364, 460, | ||||
| 20, 116, 212, 308, 404, 52, 148, 244, 340, 436, 84, 180, 276, 372, 468, | ||||
| 28, 124, 220, 316, 412, 60, 156, 252, 348, 444, 92, 188, 284, 380, 476, | ||||
| 1, 97, 193, 289, 385, 33, 129, 225, 321, 417, 65, 161, 257, 353, 449, | ||||
| 9, 105, 201, 297, 393, 41, 137, 233, 329, 425, 73, 169, 265, 361, 457, | ||||
| 17, 113, 209, 305, 401, 49, 145, 241, 337, 433, 81, 177, 273, 369, 465, | ||||
| 25, 121, 217, 313, 409, 57, 153, 249, 345, 441, 89, 185, 281, 377, 473, | ||||
| 5, 101, 197, 293, 389, 37, 133, 229, 325, 421, 69, 165, 261, 357, 453, | ||||
| 13, 109, 205, 301, 397, 45, 141, 237, 333, 429, 77, 173, 269, 365, 461, | ||||
| 21, 117, 213, 309, 405, 53, 149, 245, 341, 437, 85, 181, 277, 373, 469, | ||||
| 29, 125, 221, 317, 413, 61, 157, 253, 349, 445, 93, 189, 285, 381, 477, | ||||
| 2, 98, 194, 290, 386, 34, 130, 226, 322, 418, 66, 162, 258, 354, 450, | ||||
| 10, 106, 202, 298, 394, 42, 138, 234, 330, 426, 74, 170, 266, 362, 458, | ||||
| 18, 114, 210, 306, 402, 50, 146, 242, 338, 434, 82, 178, 274, 370, 466, | ||||
| 26, 122, 218, 314, 410, 58, 154, 250, 346, 442, 90, 186, 282, 378, 474, | ||||
| 6, 102, 198, 294, 390, 38, 134, 230, 326, 422, 70, 166, 262, 358, 454, | ||||
| 14, 110, 206, 302, 398, 46, 142, 238, 334, 430, 78, 174, 270, 366, 462, | ||||
| 22, 118, 214, 310, 406, 54, 150, 246, 342, 438, 86, 182, 278, 374, 470, | ||||
| 30, 126, 222, 318, 414, 62, 158, 254, 350, 446, 94, 190, 286, 382, 478, | ||||
| 3, 99, 195, 291, 387, 35, 131, 227, 323, 419, 67, 163, 259, 355, 451, | ||||
| 11, 107, 203, 299, 395, 43, 139, 235, 331, 427, 75, 171, 267, 363, 459, | ||||
| 19, 115, 211, 307, 403, 51, 147, 243, 339, 435, 83, 179, 275, 371, 467, | ||||
| 27, 123, 219, 315, 411, 59, 155, 251, 347, 443, 91, 187, 283, 379, 475, | ||||
| 7, 103, 199, 295, 391, 39, 135, 231, 327, 423, 71, 167, 263, 359, 455, | ||||
| 15, 111, 207, 303, 399, 47, 143, 239, 335, 431, 79, 175, 271, 367, 463, | ||||
| 23, 119, 215, 311, 407, 55, 151, 247, 343, 439, 87, 183, 279, 375, 471, | ||||
| 31, 127, 223, 319, 415, 63, 159, 255, 351, 447, 95, 191, 287, 383, 479, | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_BITREV240 | ||||
| #define FFT_BITREV240 | ||||
| static const opus_int16 fft_bitrev240[240] = { | ||||
| 0, 48, 96, 144, 192, 16, 64, 112, 160, 208, 32, 80, 128, 176, 224, | ||||
| 4, 52, 100, 148, 196, 20, 68, 116, 164, 212, 36, 84, 132, 180, 228, | ||||
| 8, 56, 104, 152, 200, 24, 72, 120, 168, 216, 40, 88, 136, 184, 232, | ||||
| 12, 60, 108, 156, 204, 28, 76, 124, 172, 220, 44, 92, 140, 188, 236, | ||||
| 1, 49, 97, 145, 193, 17, 65, 113, 161, 209, 33, 81, 129, 177, 225, | ||||
| 5, 53, 101, 149, 197, 21, 69, 117, 165, 213, 37, 85, 133, 181, 229, | ||||
| 9, 57, 105, 153, 201, 25, 73, 121, 169, 217, 41, 89, 137, 185, 233, | ||||
| 13, 61, 109, 157, 205, 29, 77, 125, 173, 221, 45, 93, 141, 189, 237, | ||||
| 2, 50, 98, 146, 194, 18, 66, 114, 162, 210, 34, 82, 130, 178, 226, | ||||
| 6, 54, 102, 150, 198, 22, 70, 118, 166, 214, 38, 86, 134, 182, 230, | ||||
| 10, 58, 106, 154, 202, 26, 74, 122, 170, 218, 42, 90, 138, 186, 234, | ||||
| 14, 62, 110, 158, 206, 30, 78, 126, 174, 222, 46, 94, 142, 190, 238, | ||||
| 3, 51, 99, 147, 195, 19, 67, 115, 163, 211, 35, 83, 131, 179, 227, | ||||
| 7, 55, 103, 151, 199, 23, 71, 119, 167, 215, 39, 87, 135, 183, 231, | ||||
| 11, 59, 107, 155, 203, 27, 75, 123, 171, 219, 43, 91, 139, 187, 235, | ||||
| 15, 63, 111, 159, 207, 31, 79, 127, 175, 223, 47, 95, 143, 191, 239, | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_BITREV120 | ||||
| #define FFT_BITREV120 | ||||
| static const opus_int16 fft_bitrev120[120] = { | ||||
| 0, 24, 48, 72, 96, 8, 32, 56, 80, 104, 16, 40, 64, 88, 112, | ||||
| 4, 28, 52, 76, 100, 12, 36, 60, 84, 108, 20, 44, 68, 92, 116, | ||||
| 1, 25, 49, 73, 97, 9, 33, 57, 81, 105, 17, 41, 65, 89, 113, | ||||
| 5, 29, 53, 77, 101, 13, 37, 61, 85, 109, 21, 45, 69, 93, 117, | ||||
| 2, 26, 50, 74, 98, 10, 34, 58, 82, 106, 18, 42, 66, 90, 114, | ||||
| 6, 30, 54, 78, 102, 14, 38, 62, 86, 110, 22, 46, 70, 94, 118, | ||||
| 3, 27, 51, 75, 99, 11, 35, 59, 83, 107, 19, 43, 67, 91, 115, | ||||
| 7, 31, 55, 79, 103, 15, 39, 63, 87, 111, 23, 47, 71, 95, 119, | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_BITREV60 | ||||
| #define FFT_BITREV60 | ||||
| static const opus_int16 fft_bitrev60[60] = { | ||||
| 0, 12, 24, 36, 48, 4, 16, 28, 40, 52, 8, 20, 32, 44, 56, | ||||
| 1, 13, 25, 37, 49, 5, 17, 29, 41, 53, 9, 21, 33, 45, 57, | ||||
| 2, 14, 26, 38, 50, 6, 18, 30, 42, 54, 10, 22, 34, 46, 58, | ||||
| 3, 15, 27, 39, 51, 7, 19, 31, 43, 55, 11, 23, 35, 47, 59, | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_STATE48000_960_0 | ||||
| #define FFT_STATE48000_960_0 | ||||
| static const kiss_fft_state fft_state48000_960_0 = { | ||||
| 480,    /* nfft */ | ||||
| 0.002083333f,   /* scale */ | ||||
| -1,     /* shift */ | ||||
| {5, 96, 3, 32, 4, 8, 2, 4, 4, 1, 0, 0, 0, 0, 0, 0, },   /* factors */ | ||||
| fft_bitrev480,  /* bitrev */ | ||||
| fft_twiddles48000_960,  /* bitrev */ | ||||
| #ifdef OVERRIDE_FFT | ||||
| (arch_fft_state *)&cfg_arch_480, | ||||
| #else | ||||
| NULL, | ||||
| #endif | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_STATE48000_960_1 | ||||
| #define FFT_STATE48000_960_1 | ||||
| static const kiss_fft_state fft_state48000_960_1 = { | ||||
| 240,    /* nfft */ | ||||
| 0.004166667f,   /* scale */ | ||||
| 1,      /* shift */ | ||||
| {5, 48, 3, 16, 4, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, },    /* factors */ | ||||
| fft_bitrev240,  /* bitrev */ | ||||
| fft_twiddles48000_960,  /* bitrev */ | ||||
| #ifdef OVERRIDE_FFT | ||||
| (arch_fft_state *)&cfg_arch_240, | ||||
| #else | ||||
| NULL, | ||||
| #endif | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_STATE48000_960_2 | ||||
| #define FFT_STATE48000_960_2 | ||||
| static const kiss_fft_state fft_state48000_960_2 = { | ||||
| 120,    /* nfft */ | ||||
| 0.008333333f,   /* scale */ | ||||
| 2,      /* shift */ | ||||
| {5, 24, 3, 8, 2, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, },    /* factors */ | ||||
| fft_bitrev120,  /* bitrev */ | ||||
| fft_twiddles48000_960,  /* bitrev */ | ||||
| #ifdef OVERRIDE_FFT | ||||
| (arch_fft_state *)&cfg_arch_120, | ||||
| #else | ||||
| NULL, | ||||
| #endif | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #ifndef FFT_STATE48000_960_3 | ||||
| #define FFT_STATE48000_960_3 | ||||
| static const kiss_fft_state fft_state48000_960_3 = { | ||||
| 60,     /* nfft */ | ||||
| 0.016666667f,   /* scale */ | ||||
| 3,      /* shift */ | ||||
| {5, 12, 3, 4, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, },    /* factors */ | ||||
| fft_bitrev60,   /* bitrev */ | ||||
| fft_twiddles48000_960,  /* bitrev */ | ||||
| #ifdef OVERRIDE_FFT | ||||
| (arch_fft_state *)&cfg_arch_60, | ||||
| #else | ||||
| NULL, | ||||
| #endif | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| #ifndef MDCT_TWIDDLES960 | ||||
| #define MDCT_TWIDDLES960 | ||||
| static const opus_val16 mdct_twiddles960[1800] = { | ||||
| 0.99999994f, 0.99999321f, 0.99997580f, 0.99994773f, 0.99990886f, | ||||
| 0.99985933f, 0.99979913f, 0.99972820f, 0.99964654f, 0.99955416f, | ||||
| 0.99945110f, 0.99933738f, 0.99921292f, 0.99907774f, 0.99893188f, | ||||
| 0.99877530f, 0.99860805f, 0.99843007f, 0.99824142f, 0.99804211f, | ||||
| 0.99783206f, 0.99761140f, 0.99737996f, 0.99713790f, 0.99688518f, | ||||
| 0.99662173f, 0.99634761f, 0.99606287f, 0.99576741f, 0.99546129f, | ||||
| 0.99514455f, 0.99481714f, 0.99447906f, 0.99413031f, 0.99377096f, | ||||
| 0.99340093f, 0.99302030f, 0.99262899f, 0.99222708f, 0.99181455f, | ||||
| 0.99139136f, 0.99095762f, 0.99051321f, 0.99005818f, 0.98959261f, | ||||
| 0.98911643f, 0.98862964f, 0.98813224f, 0.98762429f, 0.98710573f, | ||||
| 0.98657662f, 0.98603696f, 0.98548669f, 0.98492593f, 0.98435456f, | ||||
| 0.98377270f, 0.98318028f, 0.98257732f, 0.98196387f, 0.98133987f, | ||||
| 0.98070538f, 0.98006040f, 0.97940493f, 0.97873890f, 0.97806245f, | ||||
| 0.97737551f, 0.97667813f, 0.97597027f, 0.97525197f, 0.97452319f, | ||||
| 0.97378403f, 0.97303438f, 0.97227436f, 0.97150391f, 0.97072303f, | ||||
| 0.96993178f, 0.96913016f, 0.96831810f, 0.96749574f, 0.96666300f, | ||||
| 0.96581990f, 0.96496642f, 0.96410263f, 0.96322852f, 0.96234411f, | ||||
| 0.96144938f, 0.96054435f, 0.95962906f, 0.95870346f, 0.95776761f, | ||||
| 0.95682150f, 0.95586514f, 0.95489854f, 0.95392174f, 0.95293468f, | ||||
| 0.95193744f, 0.95093000f, 0.94991243f, 0.94888461f, 0.94784665f, | ||||
| 0.94679856f, 0.94574034f, 0.94467193f, 0.94359344f, 0.94250488f, | ||||
| 0.94140619f, 0.94029742f, 0.93917859f, 0.93804967f, 0.93691075f, | ||||
| 0.93576175f, 0.93460274f, 0.93343377f, 0.93225473f, 0.93106574f, | ||||
| 0.92986679f, 0.92865789f, 0.92743903f, 0.92621022f, 0.92497152f, | ||||
| 0.92372292f, 0.92246443f, 0.92119598f, 0.91991776f, 0.91862965f, | ||||
| 0.91733170f, 0.91602397f, 0.91470635f, 0.91337901f, 0.91204184f, | ||||
| 0.91069490f, 0.90933824f, 0.90797186f, 0.90659571f, 0.90520984f, | ||||
| 0.90381432f, 0.90240908f, 0.90099424f, 0.89956969f, 0.89813554f, | ||||
| 0.89669174f, 0.89523834f, 0.89377540f, 0.89230281f, 0.89082074f, | ||||
| 0.88932908f, 0.88782793f, 0.88631725f, 0.88479710f, 0.88326746f, | ||||
| 0.88172835f, 0.88017982f, 0.87862182f, 0.87705445f, 0.87547767f, | ||||
| 0.87389153f, 0.87229604f, 0.87069118f, 0.86907703f, 0.86745358f, | ||||
| 0.86582077f, 0.86417878f, 0.86252749f, 0.86086690f, 0.85919720f, | ||||
| 0.85751826f, 0.85583007f, 0.85413277f, 0.85242635f, 0.85071075f, | ||||
| 0.84898609f, 0.84725231f, 0.84550947f, 0.84375757f, 0.84199661f, | ||||
| 0.84022665f, 0.83844769f, 0.83665979f, 0.83486289f, 0.83305705f, | ||||
| 0.83124226f, 0.82941860f, 0.82758605f, 0.82574469f, 0.82389444f, | ||||
| 0.82203537f, 0.82016748f, 0.81829083f, 0.81640542f, 0.81451124f, | ||||
| 0.81260836f, 0.81069672f, 0.80877650f, 0.80684757f, 0.80490994f, | ||||
| 0.80296379f, 0.80100900f, 0.79904562f, 0.79707366f, 0.79509324f, | ||||
| 0.79310423f, 0.79110676f, 0.78910083f, 0.78708643f, 0.78506362f, | ||||
| 0.78303236f, 0.78099275f, 0.77894479f, 0.77688843f, 0.77482378f, | ||||
| 0.77275085f, 0.77066964f, 0.76858020f, 0.76648247f, 0.76437658f, | ||||
| 0.76226246f, 0.76014024f, 0.75800985f, 0.75587130f, 0.75372469f, | ||||
| 0.75157005f, 0.74940729f, 0.74723655f, 0.74505776f, 0.74287105f, | ||||
| 0.74067634f, 0.73847371f, 0.73626316f, 0.73404479f, 0.73181850f, | ||||
| 0.72958434f, 0.72734243f, 0.72509271f, 0.72283524f, 0.72057003f, | ||||
| 0.71829706f, 0.71601641f, 0.71372813f, 0.71143216f, 0.70912862f, | ||||
| 0.70681745f, 0.70449871f, 0.70217246f, 0.69983864f, 0.69749737f, | ||||
| 0.69514859f, 0.69279242f, 0.69042879f, 0.68805778f, 0.68567938f, | ||||
| 0.68329364f, 0.68090063f, 0.67850029f, 0.67609268f, 0.67367786f, | ||||
| 0.67125577f, 0.66882652f, 0.66639012f, 0.66394657f, 0.66149592f, | ||||
| 0.65903819f, 0.65657341f, 0.65410155f, 0.65162271f, 0.64913690f, | ||||
| 0.64664418f, 0.64414448f, 0.64163786f, 0.63912445f, 0.63660413f, | ||||
| 0.63407701f, 0.63154310f, 0.62900239f, 0.62645501f, 0.62390089f, | ||||
| 0.62134010f, 0.61877263f, 0.61619854f, 0.61361790f, 0.61103064f, | ||||
| 0.60843682f, 0.60583651f, 0.60322970f, 0.60061646f, 0.59799677f, | ||||
| 0.59537065f, 0.59273821f, 0.59009939f, 0.58745426f, 0.58480281f, | ||||
| 0.58214509f, 0.57948118f, 0.57681108f, 0.57413477f, 0.57145232f, | ||||
| 0.56876373f, 0.56606907f, 0.56336832f, 0.56066155f, 0.55794877f, | ||||
| 0.55523002f, 0.55250537f, 0.54977477f, 0.54703826f, 0.54429591f, | ||||
| 0.54154772f, 0.53879374f, 0.53603399f, 0.53326851f, 0.53049731f, | ||||
| 0.52772039f, 0.52493787f, 0.52214974f, 0.51935595f, 0.51655668f, | ||||
| 0.51375180f, 0.51094145f, 0.50812566f, 0.50530440f, 0.50247771f, | ||||
| 0.49964568f, 0.49680826f, 0.49396557f, 0.49111754f, 0.48826426f, | ||||
| 0.48540577f, 0.48254207f, 0.47967321f, 0.47679919f, 0.47392011f, | ||||
| 0.47103590f, 0.46814668f, 0.46525243f, 0.46235323f, 0.45944905f, | ||||
| 0.45653993f, 0.45362595f, 0.45070711f, 0.44778344f, 0.44485497f, | ||||
| 0.44192174f, 0.43898380f, 0.43604112f, 0.43309379f, 0.43014181f, | ||||
| 0.42718524f, 0.42422408f, 0.42125839f, 0.41828820f, 0.41531351f, | ||||
| 0.41233435f, 0.40935081f, 0.40636289f, 0.40337059f, 0.40037400f, | ||||
| 0.39737311f, 0.39436796f, 0.39135858f, 0.38834500f, 0.38532731f, | ||||
| 0.38230544f, 0.37927949f, 0.37624949f, 0.37321547f, 0.37017745f, | ||||
| 0.36713544f, 0.36408952f, 0.36103970f, 0.35798600f, 0.35492846f, | ||||
| 0.35186714f, 0.34880206f, 0.34573323f, 0.34266070f, 0.33958447f, | ||||
| 0.33650464f, 0.33342120f, 0.33033419f, 0.32724363f, 0.32414958f, | ||||
| 0.32105204f, 0.31795108f, 0.31484672f, 0.31173897f, 0.30862790f, | ||||
| 0.30551350f, 0.30239585f, 0.29927495f, 0.29615086f, 0.29302359f, | ||||
| 0.28989318f, 0.28675964f, 0.28362307f, 0.28048345f, 0.27734083f, | ||||
| 0.27419522f, 0.27104670f, 0.26789525f, 0.26474094f, 0.26158381f, | ||||
| 0.25842386f, 0.25526115f, 0.25209570f, 0.24892756f, 0.24575676f, | ||||
| 0.24258332f, 0.23940729f, 0.23622867f, 0.23304754f, 0.22986393f, | ||||
| 0.22667783f, 0.22348931f, 0.22029841f, 0.21710514f, 0.21390954f, | ||||
| 0.21071166f, 0.20751151f, 0.20430915f, 0.20110460f, 0.19789790f, | ||||
| 0.19468907f, 0.19147816f, 0.18826519f, 0.18505022f, 0.18183327f, | ||||
| 0.17861435f, 0.17539354f, 0.17217083f, 0.16894630f, 0.16571994f, | ||||
| 0.16249183f, 0.15926196f, 0.15603039f, 0.15279715f, 0.14956227f, | ||||
| 0.14632578f, 0.14308774f, 0.13984816f, 0.13660708f, 0.13336454f, | ||||
| 0.13012058f, 0.12687522f, 0.12362850f, 0.12038045f, 0.11713112f, | ||||
| 0.11388054f, 0.11062872f, 0.10737573f, 0.10412160f, 0.10086634f, | ||||
| 0.097609997f, 0.094352618f, 0.091094226f, 0.087834857f, 0.084574550f, | ||||
| 0.081313334f, 0.078051247f, 0.074788325f, 0.071524605f, 0.068260118f, | ||||
| 0.064994894f, 0.061728980f, 0.058462404f, 0.055195201f, 0.051927410f, | ||||
| 0.048659060f, 0.045390189f, 0.042120833f, 0.038851023f, 0.035580799f, | ||||
| 0.032310195f, 0.029039243f, 0.025767982f, 0.022496443f, 0.019224664f, | ||||
| 0.015952680f, 0.012680525f, 0.0094082337f, 0.0061358409f, 0.0028633832f, | ||||
| -0.00040910527f, -0.0036815894f, -0.0069540343f, -0.010226404f, -0.013498665f, | ||||
| -0.016770782f, -0.020042717f, -0.023314439f, -0.026585912f, -0.029857099f, | ||||
| -0.033127967f, -0.036398482f, -0.039668605f, -0.042938303f, -0.046207540f, | ||||
| -0.049476285f, -0.052744497f, -0.056012146f, -0.059279196f, -0.062545612f, | ||||
| -0.065811358f, -0.069076397f, -0.072340697f, -0.075604223f, -0.078866936f, | ||||
| -0.082128808f, -0.085389800f, -0.088649876f, -0.091909006f, -0.095167145f, | ||||
| -0.098424271f, -0.10168034f, -0.10493532f, -0.10818918f, -0.11144188f, | ||||
| -0.11469338f, -0.11794366f, -0.12119267f, -0.12444039f, -0.12768677f, | ||||
| -0.13093179f, -0.13417540f, -0.13741758f, -0.14065829f, -0.14389749f, | ||||
| -0.14713514f, -0.15037122f, -0.15360570f, -0.15683852f, -0.16006967f, | ||||
| -0.16329910f, -0.16652679f, -0.16975269f, -0.17297678f, -0.17619900f, | ||||
| -0.17941935f, -0.18263777f, -0.18585424f, -0.18906870f, -0.19228116f, | ||||
| -0.19549155f, -0.19869985f, -0.20190603f, -0.20511003f, -0.20831184f, | ||||
| -0.21151142f, -0.21470875f, -0.21790376f, -0.22109644f, -0.22428675f, | ||||
| -0.22747467f, -0.23066014f, -0.23384315f, -0.23702365f, -0.24020162f, | ||||
| -0.24337701f, -0.24654980f, -0.24971995f, -0.25288740f, -0.25605217f, | ||||
| -0.25921419f, -0.26237345f, -0.26552987f, -0.26868346f, -0.27183419f, | ||||
| -0.27498198f, -0.27812684f, -0.28126872f, -0.28440759f, -0.28754342f, | ||||
| -0.29067615f, -0.29380578f, -0.29693225f, -0.30005556f, -0.30317566f, | ||||
| -0.30629250f, -0.30940607f, -0.31251630f, -0.31562322f, -0.31872672f, | ||||
| -0.32182685f, -0.32492352f, -0.32801670f, -0.33110636f, -0.33419248f, | ||||
| -0.33727503f, -0.34035397f, -0.34342924f, -0.34650084f, -0.34956875f, | ||||
| -0.35263291f, -0.35569328f, -0.35874987f, -0.36180258f, -0.36485144f, | ||||
| -0.36789638f, -0.37093741f, -0.37397444f, -0.37700745f, -0.38003644f, | ||||
| -0.38306138f, -0.38608220f, -0.38909888f, -0.39211139f, -0.39511973f, | ||||
| -0.39812380f, -0.40112361f, -0.40411916f, -0.40711036f, -0.41009718f, | ||||
| -0.41307965f, -0.41605768f, -0.41903123f, -0.42200032f, -0.42496487f, | ||||
| -0.42792490f, -0.43088034f, -0.43383113f, -0.43677729f, -0.43971881f, | ||||
| -0.44265559f, -0.44558764f, -0.44851488f, -0.45143735f, -0.45435500f, | ||||
| -0.45726776f, -0.46017563f, -0.46307856f, -0.46597654f, -0.46886954f, | ||||
| -0.47175750f, -0.47464043f, -0.47751826f, -0.48039100f, -0.48325855f, | ||||
| -0.48612097f, -0.48897815f, -0.49183011f, -0.49467680f, -0.49751821f, | ||||
| -0.50035429f, -0.50318497f, -0.50601029f, -0.50883019f, -0.51164466f, | ||||
| -0.51445359f, -0.51725709f, -0.52005500f, -0.52284735f, -0.52563411f, | ||||
| -0.52841520f, -0.53119069f, -0.53396046f, -0.53672451f, -0.53948283f, | ||||
| -0.54223537f, -0.54498214f, -0.54772300f, -0.55045801f, -0.55318713f, | ||||
| -0.55591035f, -0.55862761f, -0.56133890f, -0.56404412f, -0.56674337f, | ||||
| -0.56943649f, -0.57212353f, -0.57480448f, -0.57747924f, -0.58014780f, | ||||
| -0.58281022f, -0.58546633f, -0.58811617f, -0.59075975f, -0.59339696f, | ||||
| -0.59602785f, -0.59865236f, -0.60127044f, -0.60388207f, -0.60648727f, | ||||
| -0.60908598f, -0.61167812f, -0.61426371f, -0.61684275f, -0.61941516f, | ||||
| -0.62198097f, -0.62454009f, -0.62709254f, -0.62963831f, -0.63217729f, | ||||
| -0.63470948f, -0.63723493f, -0.63975352f, -0.64226526f, -0.64477009f, | ||||
| -0.64726806f, -0.64975911f, -0.65224314f, -0.65472025f, -0.65719032f, | ||||
| -0.65965337f, -0.66210932f, -0.66455823f, -0.66700000f, -0.66943461f, | ||||
| -0.67186207f, -0.67428231f, -0.67669535f, -0.67910111f, -0.68149966f, | ||||
| -0.68389088f, -0.68627477f, -0.68865126f, -0.69102043f, -0.69338220f, | ||||
| -0.69573659f, -0.69808346f, -0.70042288f, -0.70275480f, -0.70507920f, | ||||
| -0.70739603f, -0.70970529f, -0.71200693f, -0.71430099f, -0.71658736f, | ||||
| -0.71886611f, -0.72113711f, -0.72340041f, -0.72565591f, -0.72790372f, | ||||
| -0.73014367f, -0.73237586f, -0.73460019f, -0.73681659f, -0.73902518f, | ||||
| -0.74122584f, -0.74341851f, -0.74560326f, -0.74778003f, -0.74994880f, | ||||
| -0.75210953f, -0.75426215f, -0.75640678f, -0.75854325f, -0.76067162f, | ||||
| -0.76279181f, -0.76490390f, -0.76700771f, -0.76910341f, -0.77119076f, | ||||
| -0.77326995f, -0.77534080f, -0.77740335f, -0.77945763f, -0.78150350f, | ||||
| -0.78354102f, -0.78557014f, -0.78759086f, -0.78960317f, -0.79160696f, | ||||
| -0.79360235f, -0.79558921f, -0.79756755f, -0.79953730f, -0.80149853f, | ||||
| -0.80345118f, -0.80539525f, -0.80733067f, -0.80925739f, -0.81117553f, | ||||
| -0.81308490f, -0.81498563f, -0.81687760f, -0.81876087f, -0.82063532f, | ||||
| -0.82250100f, -0.82435787f, -0.82620591f, -0.82804507f, -0.82987541f, | ||||
| -0.83169687f, -0.83350939f, -0.83531296f, -0.83710766f, -0.83889335f, | ||||
| -0.84067005f, -0.84243774f, -0.84419644f, -0.84594607f, -0.84768665f, | ||||
| -0.84941816f, -0.85114056f, -0.85285389f, -0.85455805f, -0.85625303f, | ||||
| -0.85793889f, -0.85961550f, -0.86128294f, -0.86294121f, -0.86459017f, | ||||
| -0.86622989f, -0.86786032f, -0.86948150f, -0.87109333f, -0.87269586f, | ||||
| -0.87428904f, -0.87587279f, -0.87744725f, -0.87901229f, -0.88056785f, | ||||
| -0.88211405f, -0.88365078f, -0.88517809f, -0.88669586f, -0.88820416f, | ||||
| -0.88970292f, -0.89119220f, -0.89267188f, -0.89414203f, -0.89560264f, | ||||
| -0.89705360f, -0.89849502f, -0.89992678f, -0.90134889f, -0.90276134f, | ||||
| -0.90416414f, -0.90555727f, -0.90694070f, -0.90831441f, -0.90967834f, | ||||
| -0.91103262f, -0.91237706f, -0.91371179f, -0.91503674f, -0.91635185f, | ||||
| -0.91765714f, -0.91895264f, -0.92023826f, -0.92151409f, -0.92277998f, | ||||
| -0.92403603f, -0.92528218f, -0.92651838f, -0.92774469f, -0.92896110f, | ||||
| -0.93016750f, -0.93136400f, -0.93255049f, -0.93372697f, -0.93489349f, | ||||
| -0.93604994f, -0.93719643f, -0.93833286f, -0.93945926f, -0.94057560f, | ||||
| -0.94168180f, -0.94277799f, -0.94386405f, -0.94494003f, -0.94600588f, | ||||
| -0.94706154f, -0.94810712f, -0.94914252f, -0.95016778f, -0.95118284f, | ||||
| -0.95218778f, -0.95318246f, -0.95416695f, -0.95514119f, -0.95610523f, | ||||
| -0.95705903f, -0.95800257f, -0.95893586f, -0.95985889f, -0.96077162f, | ||||
| -0.96167403f, -0.96256620f, -0.96344805f, -0.96431959f, -0.96518075f, | ||||
| -0.96603161f, -0.96687216f, -0.96770233f, -0.96852213f, -0.96933156f, | ||||
| -0.97013056f, -0.97091925f, -0.97169751f, -0.97246534f, -0.97322279f, | ||||
| -0.97396982f, -0.97470641f, -0.97543252f, -0.97614825f, -0.97685349f, | ||||
| -0.97754824f, -0.97823256f, -0.97890645f, -0.97956979f, -0.98022264f, | ||||
| -0.98086500f, -0.98149687f, -0.98211825f, -0.98272908f, -0.98332942f, | ||||
| -0.98391914f, -0.98449844f, -0.98506713f, -0.98562527f, -0.98617285f, | ||||
| -0.98670989f, -0.98723638f, -0.98775226f, -0.98825759f, -0.98875231f, | ||||
| -0.98923647f, -0.98971003f, -0.99017298f, -0.99062532f, -0.99106705f, | ||||
| -0.99149817f, -0.99191868f, -0.99232858f, -0.99272782f, -0.99311644f, | ||||
| -0.99349445f, -0.99386179f, -0.99421853f, -0.99456459f, -0.99489999f, | ||||
| -0.99522477f, -0.99553883f, -0.99584228f, -0.99613506f, -0.99641716f, | ||||
| -0.99668860f, -0.99694937f, -0.99719942f, -0.99743885f, -0.99766755f, | ||||
| -0.99788558f, -0.99809295f, -0.99828959f, -0.99847561f, -0.99865085f, | ||||
| -0.99881548f, -0.99896932f, -0.99911255f, -0.99924499f, -0.99936682f, | ||||
| -0.99947786f, -0.99957830f, -0.99966794f, -0.99974692f, -0.99981517f, | ||||
| -0.99987274f, -0.99991959f, -0.99995571f, -0.99998116f, -0.99999589f, | ||||
| 0.99999964f, 0.99997288f, 0.99990326f, 0.99979085f, 0.99963558f, | ||||
| 0.99943751f, 0.99919659f, 0.99891287f, 0.99858636f, 0.99821711f, | ||||
| 0.99780506f, 0.99735034f, 0.99685282f, 0.99631262f, 0.99572974f, | ||||
| 0.99510419f, 0.99443603f, 0.99372530f, 0.99297196f, 0.99217612f, | ||||
| 0.99133772f, 0.99045694f, 0.98953366f, 0.98856801f, 0.98756003f, | ||||
| 0.98650974f, 0.98541719f, 0.98428243f, 0.98310548f, 0.98188645f, | ||||
| 0.98062533f, 0.97932225f, 0.97797716f, 0.97659022f, 0.97516143f, | ||||
| 0.97369087f, 0.97217858f, 0.97062469f, 0.96902919f, 0.96739221f, | ||||
| 0.96571374f, 0.96399397f, 0.96223283f, 0.96043050f, 0.95858705f, | ||||
| 0.95670253f, 0.95477700f, 0.95281059f, 0.95080340f, 0.94875544f, | ||||
| 0.94666684f, 0.94453770f, 0.94236809f, 0.94015813f, 0.93790787f, | ||||
| 0.93561745f, 0.93328691f, 0.93091643f, 0.92850608f, 0.92605597f, | ||||
| 0.92356616f, 0.92103678f, 0.91846794f, 0.91585976f, 0.91321236f, | ||||
| 0.91052586f, 0.90780038f, 0.90503591f, 0.90223277f, 0.89939094f, | ||||
| 0.89651060f, 0.89359182f, 0.89063478f, 0.88763964f, 0.88460642f, | ||||
| 0.88153529f, 0.87842643f, 0.87527996f, 0.87209594f, 0.86887461f, | ||||
| 0.86561602f, 0.86232042f, 0.85898781f, 0.85561842f, 0.85221243f, | ||||
| 0.84876984f, 0.84529096f, 0.84177583f, 0.83822471f, 0.83463764f, | ||||
| 0.83101481f, 0.82735640f, 0.82366252f, 0.81993335f, 0.81616908f, | ||||
| 0.81236988f, 0.80853581f, 0.80466717f, 0.80076402f, 0.79682660f, | ||||
| 0.79285502f, 0.78884947f, 0.78481019f, 0.78073722f, 0.77663082f, | ||||
| 0.77249116f, 0.76831841f, 0.76411277f, 0.75987434f, 0.75560343f, | ||||
| 0.75130010f, 0.74696463f, 0.74259710f, 0.73819780f, 0.73376691f, | ||||
| 0.72930455f, 0.72481096f, 0.72028631f, 0.71573079f, 0.71114463f, | ||||
| 0.70652801f, 0.70188117f, 0.69720417f, 0.69249737f, 0.68776089f, | ||||
| 0.68299496f, 0.67819971f, 0.67337549f, 0.66852236f, 0.66364062f, | ||||
| 0.65873051f, 0.65379208f, 0.64882571f, 0.64383155f, 0.63880974f, | ||||
| 0.63376063f, 0.62868434f, 0.62358117f, 0.61845124f, 0.61329484f, | ||||
| 0.60811216f, 0.60290343f, 0.59766883f, 0.59240872f, 0.58712316f, | ||||
| 0.58181250f, 0.57647687f, 0.57111657f, 0.56573176f, 0.56032276f, | ||||
| 0.55488980f, 0.54943299f, 0.54395270f, 0.53844911f, 0.53292239f, | ||||
| 0.52737290f, 0.52180082f, 0.51620632f, 0.51058978f, 0.50495136f, | ||||
| 0.49929130f, 0.49360985f, 0.48790723f, 0.48218375f, 0.47643960f, | ||||
| 0.47067502f, 0.46489030f, 0.45908567f, 0.45326138f, 0.44741765f, | ||||
| 0.44155475f, 0.43567297f, 0.42977250f, 0.42385364f, 0.41791660f, | ||||
| 0.41196167f, 0.40598908f, 0.39999911f, 0.39399201f, 0.38796803f, | ||||
| 0.38192743f, 0.37587047f, 0.36979741f, 0.36370850f, 0.35760403f, | ||||
| 0.35148421f, 0.34534934f, 0.33919969f, 0.33303553f, 0.32685706f, | ||||
| 0.32066461f, 0.31445843f, 0.30823877f, 0.30200592f, 0.29576012f, | ||||
| 0.28950164f, 0.28323078f, 0.27694780f, 0.27065292f, 0.26434645f, | ||||
| 0.25802869f, 0.25169984f, 0.24536023f, 0.23901010f, 0.23264973f, | ||||
| 0.22627939f, 0.21989937f, 0.21350993f, 0.20711134f, 0.20070387f, | ||||
| 0.19428782f, 0.18786344f, 0.18143101f, 0.17499080f, 0.16854310f, | ||||
| 0.16208819f, 0.15562633f, 0.14915779f, 0.14268288f, 0.13620184f, | ||||
| 0.12971498f, 0.12322257f, 0.11672486f, 0.11022217f, 0.10371475f, | ||||
| 0.097202882f, 0.090686858f, 0.084166944f, 0.077643424f, 0.071116582f, | ||||
| 0.064586692f, 0.058054037f, 0.051518895f, 0.044981543f, 0.038442269f, | ||||
| 0.031901345f, 0.025359053f, 0.018815678f, 0.012271495f, 0.0057267868f, | ||||
| -0.00081816671f, -0.0073630852f, -0.013907688f, -0.020451695f, -0.026994826f, | ||||
| -0.033536803f, -0.040077340f, -0.046616159f, -0.053152986f, -0.059687532f, | ||||
| -0.066219524f, -0.072748676f, -0.079274714f, -0.085797355f, -0.092316322f, | ||||
| -0.098831341f, -0.10534211f, -0.11184838f, -0.11834986f, -0.12484626f, | ||||
| -0.13133731f, -0.13782275f, -0.14430228f, -0.15077563f, -0.15724251f, | ||||
| -0.16370267f, -0.17015581f, -0.17660165f, -0.18303993f, -0.18947038f, | ||||
| -0.19589271f, -0.20230664f, -0.20871192f, -0.21510825f, -0.22149536f, | ||||
| -0.22787298f, -0.23424086f, -0.24059868f, -0.24694622f, -0.25328314f, | ||||
| -0.25960925f, -0.26592422f, -0.27222782f, -0.27851975f, -0.28479972f, | ||||
| -0.29106751f, -0.29732284f, -0.30356544f, -0.30979502f, -0.31601134f, | ||||
| -0.32221413f, -0.32840309f, -0.33457801f, -0.34073856f, -0.34688455f, | ||||
| -0.35301566f, -0.35913166f, -0.36523229f, -0.37131724f, -0.37738630f, | ||||
| -0.38343921f, -0.38947567f, -0.39549544f, -0.40149832f, -0.40748394f, | ||||
| -0.41345215f, -0.41940263f, -0.42533514f, -0.43124944f, -0.43714526f, | ||||
| -0.44302234f, -0.44888046f, -0.45471936f, -0.46053877f, -0.46633846f, | ||||
| -0.47211814f, -0.47787762f, -0.48361665f, -0.48933494f, -0.49503228f, | ||||
| -0.50070840f, -0.50636309f, -0.51199609f, -0.51760709f, -0.52319598f, | ||||
| -0.52876246f, -0.53430629f, -0.53982723f, -0.54532504f, -0.55079949f, | ||||
| -0.55625033f, -0.56167740f, -0.56708032f, -0.57245898f, -0.57781315f, | ||||
| -0.58314258f, -0.58844697f, -0.59372622f, -0.59897995f, -0.60420811f, | ||||
| -0.60941035f, -0.61458647f, -0.61973625f, -0.62485951f, -0.62995601f, | ||||
| -0.63502556f, -0.64006782f, -0.64508271f, -0.65007001f, -0.65502942f, | ||||
| -0.65996075f, -0.66486382f, -0.66973841f, -0.67458433f, -0.67940134f, | ||||
| -0.68418926f, -0.68894786f, -0.69367695f, -0.69837630f, -0.70304573f, | ||||
| -0.70768511f, -0.71229410f, -0.71687263f, -0.72142041f, -0.72593731f, | ||||
| -0.73042315f, -0.73487765f, -0.73930067f, -0.74369204f, -0.74805158f, | ||||
| -0.75237900f, -0.75667429f, -0.76093709f, -0.76516730f, -0.76936477f, | ||||
| -0.77352923f, -0.77766061f, -0.78175867f, -0.78582323f, -0.78985411f, | ||||
| -0.79385114f, -0.79781419f, -0.80174309f, -0.80563760f, -0.80949765f, | ||||
| -0.81332302f, -0.81711352f, -0.82086903f, -0.82458937f, -0.82827437f, | ||||
| -0.83192390f, -0.83553779f, -0.83911592f, -0.84265804f, -0.84616417f, | ||||
| -0.84963393f, -0.85306740f, -0.85646427f, -0.85982448f, -0.86314780f, | ||||
| -0.86643422f, -0.86968350f, -0.87289548f, -0.87607014f, -0.87920725f, | ||||
| -0.88230664f, -0.88536829f, -0.88839203f, -0.89137769f, -0.89432514f, | ||||
| -0.89723432f, -0.90010506f, -0.90293723f, -0.90573072f, -0.90848541f, | ||||
| -0.91120118f, -0.91387796f, -0.91651553f, -0.91911387f, -0.92167282f, | ||||
| -0.92419231f, -0.92667222f, -0.92911243f, -0.93151283f, -0.93387336f, | ||||
| -0.93619382f, -0.93847424f, -0.94071442f, -0.94291431f, -0.94507378f, | ||||
| -0.94719279f, -0.94927126f, -0.95130903f, -0.95330608f, -0.95526224f, | ||||
| -0.95717752f, -0.95905179f, -0.96088499f, -0.96267700f, -0.96442777f, | ||||
| -0.96613729f, -0.96780539f, -0.96943200f, -0.97101706f, -0.97256058f, | ||||
| -0.97406244f, -0.97552258f, -0.97694093f, -0.97831738f, -0.97965199f, | ||||
| -0.98094457f, -0.98219514f, -0.98340368f, -0.98457009f, -0.98569429f, | ||||
| -0.98677629f, -0.98781598f, -0.98881340f, -0.98976845f, -0.99068111f, | ||||
| -0.99155134f, -0.99237907f, -0.99316430f, -0.99390697f, -0.99460709f, | ||||
| -0.99526459f, -0.99587947f, -0.99645168f, -0.99698120f, -0.99746799f, | ||||
| -0.99791211f, -0.99831343f, -0.99867201f, -0.99898779f, -0.99926084f, | ||||
| -0.99949104f, -0.99967843f, -0.99982297f, -0.99992472f, -0.99998361f, | ||||
| 0.99999869f, 0.99989158f, 0.99961317f, 0.99916345f, 0.99854255f, | ||||
| 0.99775058f, 0.99678761f, 0.99565387f, 0.99434954f, 0.99287480f, | ||||
| 0.99122995f, 0.98941529f, 0.98743105f, 0.98527765f, 0.98295540f, | ||||
| 0.98046476f, 0.97780609f, 0.97497988f, 0.97198665f, 0.96882683f, | ||||
| 0.96550101f, 0.96200979f, 0.95835376f, 0.95453346f, 0.95054960f, | ||||
| 0.94640291f, 0.94209403f, 0.93762374f, 0.93299282f, 0.92820197f, | ||||
| 0.92325211f, 0.91814411f, 0.91287869f, 0.90745693f, 0.90187967f, | ||||
| 0.89614785f, 0.89026248f, 0.88422459f, 0.87803519f, 0.87169534f, | ||||
| 0.86520612f, 0.85856867f, 0.85178405f, 0.84485358f, 0.83777827f, | ||||
| 0.83055943f, 0.82319832f, 0.81569612f, 0.80805415f, 0.80027372f, | ||||
| 0.79235619f, 0.78430289f, 0.77611518f, 0.76779449f, 0.75934225f, | ||||
| 0.75075996f, 0.74204898f, 0.73321080f, 0.72424710f, 0.71515924f, | ||||
| 0.70594883f, 0.69661748f, 0.68716675f, 0.67759830f, 0.66791373f, | ||||
| 0.65811473f, 0.64820296f, 0.63818014f, 0.62804794f, 0.61780810f, | ||||
| 0.60746247f, 0.59701276f, 0.58646071f, 0.57580817f, 0.56505698f, | ||||
| 0.55420899f, 0.54326600f, 0.53222996f, 0.52110273f, 0.50988621f, | ||||
| 0.49858227f, 0.48719296f, 0.47572014f, 0.46416581f, 0.45253196f, | ||||
| 0.44082057f, 0.42903364f, 0.41717321f, 0.40524128f, 0.39323992f, | ||||
| 0.38117120f, 0.36903715f, 0.35683987f, 0.34458145f, 0.33226398f, | ||||
| 0.31988961f, 0.30746040f, 0.29497850f, 0.28244606f, 0.26986524f, | ||||
| 0.25723818f, 0.24456702f, 0.23185398f, 0.21910121f, 0.20631088f, | ||||
| 0.19348522f, 0.18062639f, 0.16773662f, 0.15481812f, 0.14187308f, | ||||
| 0.12890373f, 0.11591230f, 0.10290100f, 0.089872077f, 0.076827750f, | ||||
| 0.063770257f, 0.050701842f, 0.037624735f, 0.024541186f, 0.011453429f, | ||||
| -0.0016362892f, -0.014725727f, -0.027812643f, -0.040894791f, -0.053969935f, | ||||
| -0.067035832f, -0.080090240f, -0.093130924f, -0.10615565f, -0.11916219f, | ||||
| -0.13214831f, -0.14511178f, -0.15805040f, -0.17096193f, -0.18384418f, | ||||
| -0.19669491f, -0.20951195f, -0.22229309f, -0.23503613f, -0.24773891f, | ||||
| -0.26039925f, -0.27301496f, -0.28558388f, -0.29810387f, -0.31057280f, | ||||
| -0.32298848f, -0.33534884f, -0.34765175f, -0.35989508f, -0.37207675f, | ||||
| -0.38419467f, -0.39624676f, -0.40823093f, -0.42014518f, -0.43198743f, | ||||
| -0.44375566f, -0.45544785f, -0.46706200f, -0.47859612f, -0.49004826f, | ||||
| -0.50141639f, -0.51269865f, -0.52389306f, -0.53499764f, -0.54601061f, | ||||
| -0.55693001f, -0.56775403f, -0.57848072f, -0.58910829f, -0.59963489f, | ||||
| -0.61005878f, -0.62037814f, -0.63059121f, -0.64069623f, -0.65069145f, | ||||
| -0.66057515f, -0.67034572f, -0.68000144f, -0.68954057f, -0.69896162f, | ||||
| -0.70826286f, -0.71744281f, -0.72649974f, -0.73543227f, -0.74423873f, | ||||
| -0.75291771f, -0.76146764f, -0.76988715f, -0.77817470f, -0.78632891f, | ||||
| -0.79434842f, -0.80223179f, -0.80997771f, -0.81758487f, -0.82505190f, | ||||
| -0.83237761f, -0.83956063f, -0.84659988f, -0.85349399f, -0.86024189f, | ||||
| -0.86684239f, -0.87329435f, -0.87959671f, -0.88574833f, -0.89174819f, | ||||
| -0.89759529f, -0.90328854f, -0.90882701f, -0.91420978f, -0.91943592f, | ||||
| -0.92450452f, -0.92941469f, -0.93416560f, -0.93875647f, -0.94318646f, | ||||
| -0.94745487f, -0.95156091f, -0.95550388f, -0.95928317f, -0.96289814f, | ||||
| -0.96634805f, -0.96963239f, -0.97275060f, -0.97570217f, -0.97848648f, | ||||
| -0.98110318f, -0.98355180f, -0.98583186f, -0.98794299f, -0.98988485f, | ||||
| -0.99165714f, -0.99325943f, -0.99469161f, -0.99595332f, -0.99704438f, | ||||
| -0.99796462f, -0.99871385f, -0.99929196f, -0.99969882f, -0.99993443f, | ||||
| 0.99999464f, 0.99956632f, 0.99845290f, 0.99665523f, 0.99417448f, | ||||
| 0.99101239f, 0.98717111f, 0.98265326f, 0.97746199f, 0.97160077f, | ||||
| 0.96507365f, 0.95788515f, 0.95004016f, 0.94154406f, 0.93240267f, | ||||
| 0.92262226f, 0.91220951f, 0.90117162f, 0.88951606f, 0.87725091f, | ||||
| 0.86438453f, 0.85092574f, 0.83688372f, 0.82226819f, 0.80708915f, | ||||
| 0.79135692f, 0.77508235f, 0.75827658f, 0.74095112f, 0.72311783f, | ||||
| 0.70478898f, 0.68597710f, 0.66669506f, 0.64695615f, 0.62677377f, | ||||
| 0.60616189f, 0.58513457f, 0.56370622f, 0.54189157f, 0.51970547f, | ||||
| 0.49716324f, 0.47428027f, 0.45107225f, 0.42755505f, 0.40374488f, | ||||
| 0.37965798f, 0.35531086f, 0.33072025f, 0.30590299f, 0.28087607f, | ||||
| 0.25565663f, 0.23026201f, 0.20470956f, 0.17901683f, 0.15320139f, | ||||
| 0.12728097f, 0.10127331f, 0.075196236f, 0.049067631f, 0.022905400f, | ||||
| -0.0032725304f, -0.029448219f, -0.055603724f, -0.081721120f, -0.10778251f, | ||||
| -0.13377003f, -0.15966587f, -0.18545228f, -0.21111161f, -0.23662624f, | ||||
| -0.26197869f, -0.28715160f, -0.31212771f, -0.33688989f, -0.36142120f, | ||||
| -0.38570482f, -0.40972409f, -0.43346253f, -0.45690393f, -0.48003218f, | ||||
| -0.50283146f, -0.52528608f, -0.54738069f, -0.56910020f, -0.59042966f, | ||||
| -0.61135447f, -0.63186026f, -0.65193301f, -0.67155898f, -0.69072473f, | ||||
| -0.70941705f, -0.72762316f, -0.74533063f, -0.76252723f, -0.77920127f, | ||||
| -0.79534131f, -0.81093621f, -0.82597536f, -0.84044844f, -0.85434550f, | ||||
| -0.86765707f, -0.88037395f, -0.89248747f, -0.90398932f, -0.91487163f, | ||||
| -0.92512697f, -0.93474823f, -0.94372886f, -0.95206273f, -0.95974404f, | ||||
| -0.96676767f, -0.97312868f, -0.97882277f, -0.98384601f, -0.98819500f, | ||||
| -0.99186671f, -0.99485862f, -0.99716878f, -0.99879545f, -0.99973762f, | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| static const CELTMode mode48000_960_120 = { | ||||
| 48000,  /* Fs */ | ||||
| 120,    /* overlap */ | ||||
| 21,     /* nbEBands */ | ||||
| 21,     /* effEBands */ | ||||
| {0.85000610f, 0.0000000f, 1.0000000f, 1.0000000f, },    /* preemph */ | ||||
| eband5ms,       /* eBands */ | ||||
| 3,      /* maxLM */ | ||||
| 8,      /* nbShortMdcts */ | ||||
| 120,    /* shortMdctSize */ | ||||
| 11,     /* nbAllocVectors */ | ||||
| band_allocation,        /* allocVectors */ | ||||
| logN400,        /* logN */ | ||||
| window120,      /* window */ | ||||
| {1920, 3, {&fft_state48000_960_0, &fft_state48000_960_1, &fft_state48000_960_2, &fft_state48000_960_3, }, mdct_twiddles960},    /* mdct */ | ||||
| {392, cache_index50, cache_bits50, cache_caps50},       /* cache */ | ||||
| }; | ||||
| 
 | ||||
| /* List of all the available modes */ | ||||
| #define TOTAL_MODES 1 | ||||
| static const CELTMode * const static_mode_list[TOTAL_MODES] = { | ||||
| &mode48000_960_120, | ||||
| }; | ||||
							
								
								
									
										404
									
								
								lib/rbcodec/codecs/libopus/celt/static_modes_float_arm_ne10.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										404
									
								
								lib/rbcodec/codecs/libopus/celt/static_modes_float_arm_ne10.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,404 @@ | |||
| /* The contents of this file was automatically generated by
 | ||||
|  * dump_mode_arm_ne10.c with arguments: 48000 960 | ||||
|  * It contains static definitions for some pre-defined modes. */ | ||||
| #include <NE10_types.h> | ||||
| 
 | ||||
| #ifndef NE10_FFT_PARAMS48000_960 | ||||
| #define NE10_FFT_PARAMS48000_960 | ||||
| static const ne10_int32_t ne10_factors_480[64] = { | ||||
| 4, 40, 4, 30, 2, 15, 5, 3, 3, 1, 1, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, }; | ||||
| static const ne10_int32_t ne10_factors_240[64] = { | ||||
| 3, 20, 4, 15, 5, 3, 3, 1, 1, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, }; | ||||
| static const ne10_int32_t ne10_factors_120[64] = { | ||||
| 3, 10, 2, 15, 5, 3, 3, 1, 1, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, }; | ||||
| static const ne10_int32_t ne10_factors_60[64] = { | ||||
| 2, 5, 5, 3, 3, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||
| 0, 0, 0, 0, }; | ||||
| static const ne10_fft_cpx_float32_t ne10_twiddles_480[480] = { | ||||
| {1.0000000f,0.0000000f}, {1.0000000f,-0.0000000f}, {1.0000000f,-0.0000000f}, | ||||
| {1.0000000f,-0.0000000f}, {0.91354543f,-0.40673664f}, {0.66913056f,-0.74314487f}, | ||||
| {1.0000000f,-0.0000000f}, {0.66913056f,-0.74314487f}, {-0.10452851f,-0.99452192f}, | ||||
| {1.0000000f,-0.0000000f}, {0.30901697f,-0.95105654f}, {-0.80901700f,-0.58778518f}, | ||||
| {1.0000000f,-0.0000000f}, {-0.10452851f,-0.99452192f}, {-0.97814757f,0.20791179f}, | ||||
| {1.0000000f,-0.0000000f}, {0.97814763f,-0.20791170f}, {0.91354543f,-0.40673664f}, | ||||
| {0.80901700f,-0.58778524f}, {0.66913056f,-0.74314487f}, {0.49999997f,-0.86602545f}, | ||||
| {0.30901697f,-0.95105654f}, {0.10452842f,-0.99452192f}, {-0.10452851f,-0.99452192f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.50000006f,-0.86602533f}, {-0.66913068f,-0.74314475f}, | ||||
| {-0.80901700f,-0.58778518f}, {-0.91354549f,-0.40673658f}, {-0.97814763f,-0.20791161f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99862951f,-0.052335959f}, {0.99452192f,-0.10452846f}, | ||||
| {0.98768836f,-0.15643448f}, {0.97814763f,-0.20791170f}, {0.96592581f,-0.25881904f}, | ||||
| {0.95105648f,-0.30901700f}, {0.93358040f,-0.35836795f}, {0.91354543f,-0.40673664f}, | ||||
| {0.89100653f,-0.45399052f}, {0.86602545f,-0.50000000f}, {0.83867055f,-0.54463905f}, | ||||
| {0.80901700f,-0.58778524f}, {0.77714598f,-0.62932038f}, {0.74314475f,-0.66913062f}, | ||||
| {0.70710677f,-0.70710683f}, {0.66913056f,-0.74314487f}, {0.62932038f,-0.77714598f}, | ||||
| {0.58778524f,-0.80901700f}, {0.54463899f,-0.83867055f}, {0.49999997f,-0.86602545f}, | ||||
| {0.45399052f,-0.89100653f}, {0.40673661f,-0.91354549f}, {0.35836786f,-0.93358046f}, | ||||
| {0.30901697f,-0.95105654f}, {0.25881907f,-0.96592581f}, {0.20791166f,-0.97814763f}, | ||||
| {0.15643437f,-0.98768836f}, {0.10452842f,-0.99452192f}, {0.052335974f,-0.99862951f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99452192f,-0.10452846f}, {0.97814763f,-0.20791170f}, | ||||
| {0.95105648f,-0.30901700f}, {0.91354543f,-0.40673664f}, {0.86602545f,-0.50000000f}, | ||||
| {0.80901700f,-0.58778524f}, {0.74314475f,-0.66913062f}, {0.66913056f,-0.74314487f}, | ||||
| {0.58778524f,-0.80901700f}, {0.49999997f,-0.86602545f}, {0.40673661f,-0.91354549f}, | ||||
| {0.30901697f,-0.95105654f}, {0.20791166f,-0.97814763f}, {0.10452842f,-0.99452192f}, | ||||
| {-4.3711388e-08f,-1.0000000f}, {-0.10452851f,-0.99452192f}, {-0.20791174f,-0.97814757f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.40673670f,-0.91354543f}, {-0.50000006f,-0.86602533f}, | ||||
| {-0.58778518f,-0.80901700f}, {-0.66913068f,-0.74314475f}, {-0.74314493f,-0.66913044f}, | ||||
| {-0.80901700f,-0.58778518f}, {-0.86602539f,-0.50000006f}, {-0.91354549f,-0.40673658f}, | ||||
| {-0.95105654f,-0.30901679f}, {-0.97814763f,-0.20791161f}, {-0.99452192f,-0.10452849f}, | ||||
| {1.0000000f,-0.0000000f}, {0.98768836f,-0.15643448f}, {0.95105648f,-0.30901700f}, | ||||
| {0.89100653f,-0.45399052f}, {0.80901700f,-0.58778524f}, {0.70710677f,-0.70710683f}, | ||||
| {0.58778524f,-0.80901700f}, {0.45399052f,-0.89100653f}, {0.30901697f,-0.95105654f}, | ||||
| {0.15643437f,-0.98768836f}, {-4.3711388e-08f,-1.0000000f}, {-0.15643445f,-0.98768836f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.45399061f,-0.89100647f}, {-0.58778518f,-0.80901700f}, | ||||
| {-0.70710677f,-0.70710677f}, {-0.80901700f,-0.58778518f}, {-0.89100659f,-0.45399037f}, | ||||
| {-0.95105654f,-0.30901679f}, {-0.98768836f,-0.15643445f}, {-1.0000000f,8.7422777e-08f}, | ||||
| {-0.98768830f,0.15643461f}, {-0.95105654f,0.30901697f}, {-0.89100653f,0.45399055f}, | ||||
| {-0.80901694f,0.58778536f}, {-0.70710665f,0.70710689f}, {-0.58778507f,0.80901712f}, | ||||
| {-0.45399022f,0.89100665f}, {-0.30901709f,0.95105648f}, {-0.15643452f,0.98768830f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99991435f,-0.013089596f}, {0.99965733f,-0.026176950f}, | ||||
| {0.99922901f,-0.039259817f}, {0.99862951f,-0.052335959f}, {0.99785894f,-0.065403134f}, | ||||
| {0.99691731f,-0.078459099f}, {0.99580491f,-0.091501623f}, {0.99452192f,-0.10452846f}, | ||||
| {0.99306846f,-0.11753740f}, {0.99144489f,-0.13052620f}, {0.98965138f,-0.14349262f}, | ||||
| {0.98768836f,-0.15643448f}, {0.98555607f,-0.16934951f}, {0.98325491f,-0.18223552f}, | ||||
| {0.98078525f,-0.19509032f}, {0.97814763f,-0.20791170f}, {0.97534233f,-0.22069745f}, | ||||
| {0.97236991f,-0.23344538f}, {0.96923089f,-0.24615330f}, {0.96592581f,-0.25881904f}, | ||||
| {0.96245521f,-0.27144045f}, {0.95881975f,-0.28401536f}, {0.95501995f,-0.29654160f}, | ||||
| {0.95105648f,-0.30901700f}, {0.94693011f,-0.32143945f}, {0.94264150f,-0.33380687f}, | ||||
| {0.93819129f,-0.34611708f}, {0.93358040f,-0.35836795f}, {0.92880952f,-0.37055743f}, | ||||
| {0.92387956f,-0.38268346f}, {0.91879117f,-0.39474389f}, {0.91354543f,-0.40673664f}, | ||||
| {0.90814316f,-0.41865975f}, {0.90258527f,-0.43051112f}, {0.89687270f,-0.44228873f}, | ||||
| {0.89100653f,-0.45399052f}, {0.88498765f,-0.46561453f}, {0.87881708f,-0.47715878f}, | ||||
| {0.87249601f,-0.48862126f}, {0.86602545f,-0.50000000f}, {0.85940641f,-0.51129311f}, | ||||
| {0.85264015f,-0.52249855f}, {0.84572786f,-0.53361452f}, {0.83867055f,-0.54463905f}, | ||||
| {0.83146960f,-0.55557024f}, {0.82412618f,-0.56640625f}, {0.81664151f,-0.57714522f}, | ||||
| {0.80901700f,-0.58778524f}, {0.80125380f,-0.59832460f}, {0.79335332f,-0.60876143f}, | ||||
| {0.78531694f,-0.61909395f}, {0.77714598f,-0.62932038f}, {0.76884180f,-0.63943899f}, | ||||
| {0.76040596f,-0.64944810f}, {0.75183982f,-0.65934587f}, {0.74314475f,-0.66913062f}, | ||||
| {0.73432249f,-0.67880076f}, {0.72537434f,-0.68835455f}, {0.71630192f,-0.69779050f}, | ||||
| {0.70710677f,-0.70710683f}, {0.69779044f,-0.71630198f}, {0.68835455f,-0.72537440f}, | ||||
| {0.67880070f,-0.73432255f}, {0.66913056f,-0.74314487f}, {0.65934581f,-0.75183982f}, | ||||
| {0.64944804f,-0.76040596f}, {0.63943899f,-0.76884186f}, {0.62932038f,-0.77714598f}, | ||||
| {0.61909395f,-0.78531694f}, {0.60876137f,-0.79335338f}, {0.59832460f,-0.80125386f}, | ||||
| {0.58778524f,-0.80901700f}, {0.57714516f,-0.81664151f}, {0.56640625f,-0.82412618f}, | ||||
| {0.55557019f,-0.83146960f}, {0.54463899f,-0.83867055f}, {0.53361452f,-0.84572786f}, | ||||
| {0.52249849f,-0.85264015f}, {0.51129311f,-0.85940641f}, {0.49999997f,-0.86602545f}, | ||||
| {0.48862118f,-0.87249601f}, {0.47715876f,-0.87881708f}, {0.46561447f,-0.88498765f}, | ||||
| {0.45399052f,-0.89100653f}, {0.44228867f,-0.89687276f}, {0.43051103f,-0.90258533f}, | ||||
| {0.41865975f,-0.90814316f}, {0.40673661f,-0.91354549f}, {0.39474380f,-0.91879129f}, | ||||
| {0.38268343f,-0.92387956f}, {0.37055740f,-0.92880958f}, {0.35836786f,-0.93358046f}, | ||||
| {0.34611705f,-0.93819135f}, {0.33380681f,-0.94264150f}, {0.32143947f,-0.94693011f}, | ||||
| {0.30901697f,-0.95105654f}, {0.29654151f,-0.95501995f}, {0.28401533f,-0.95881975f}, | ||||
| {0.27144039f,-0.96245527f}, {0.25881907f,-0.96592581f}, {0.24615327f,-0.96923089f}, | ||||
| {0.23344530f,-0.97236991f}, {0.22069745f,-0.97534233f}, {0.20791166f,-0.97814763f}, | ||||
| {0.19509023f,-0.98078531f}, {0.18223552f,-0.98325491f}, {0.16934945f,-0.98555607f}, | ||||
| {0.15643437f,-0.98768836f}, {0.14349259f,-0.98965138f}, {0.13052613f,-0.99144489f}, | ||||
| {0.11753740f,-0.99306846f}, {0.10452842f,-0.99452192f}, {0.091501534f,-0.99580491f}, | ||||
| {0.078459084f,-0.99691731f}, {0.065403074f,-0.99785894f}, {0.052335974f,-0.99862951f}, | ||||
| {0.039259788f,-0.99922901f}, {0.026176875f,-0.99965733f}, {0.013089597f,-0.99991435f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99965733f,-0.026176950f}, {0.99862951f,-0.052335959f}, | ||||
| {0.99691731f,-0.078459099f}, {0.99452192f,-0.10452846f}, {0.99144489f,-0.13052620f}, | ||||
| {0.98768836f,-0.15643448f}, {0.98325491f,-0.18223552f}, {0.97814763f,-0.20791170f}, | ||||
| {0.97236991f,-0.23344538f}, {0.96592581f,-0.25881904f}, {0.95881975f,-0.28401536f}, | ||||
| {0.95105648f,-0.30901700f}, {0.94264150f,-0.33380687f}, {0.93358040f,-0.35836795f}, | ||||
| {0.92387956f,-0.38268346f}, {0.91354543f,-0.40673664f}, {0.90258527f,-0.43051112f}, | ||||
| {0.89100653f,-0.45399052f}, {0.87881708f,-0.47715878f}, {0.86602545f,-0.50000000f}, | ||||
| {0.85264015f,-0.52249855f}, {0.83867055f,-0.54463905f}, {0.82412618f,-0.56640625f}, | ||||
| {0.80901700f,-0.58778524f}, {0.79335332f,-0.60876143f}, {0.77714598f,-0.62932038f}, | ||||
| {0.76040596f,-0.64944810f}, {0.74314475f,-0.66913062f}, {0.72537434f,-0.68835455f}, | ||||
| {0.70710677f,-0.70710683f}, {0.68835455f,-0.72537440f}, {0.66913056f,-0.74314487f}, | ||||
| {0.64944804f,-0.76040596f}, {0.62932038f,-0.77714598f}, {0.60876137f,-0.79335338f}, | ||||
| {0.58778524f,-0.80901700f}, {0.56640625f,-0.82412618f}, {0.54463899f,-0.83867055f}, | ||||
| {0.52249849f,-0.85264015f}, {0.49999997f,-0.86602545f}, {0.47715876f,-0.87881708f}, | ||||
| {0.45399052f,-0.89100653f}, {0.43051103f,-0.90258533f}, {0.40673661f,-0.91354549f}, | ||||
| {0.38268343f,-0.92387956f}, {0.35836786f,-0.93358046f}, {0.33380681f,-0.94264150f}, | ||||
| {0.30901697f,-0.95105654f}, {0.28401533f,-0.95881975f}, {0.25881907f,-0.96592581f}, | ||||
| {0.23344530f,-0.97236991f}, {0.20791166f,-0.97814763f}, {0.18223552f,-0.98325491f}, | ||||
| {0.15643437f,-0.98768836f}, {0.13052613f,-0.99144489f}, {0.10452842f,-0.99452192f}, | ||||
| {0.078459084f,-0.99691731f}, {0.052335974f,-0.99862951f}, {0.026176875f,-0.99965733f}, | ||||
| {-4.3711388e-08f,-1.0000000f}, {-0.026176963f,-0.99965733f}, {-0.052336060f,-0.99862951f}, | ||||
| {-0.078459173f,-0.99691731f}, {-0.10452851f,-0.99452192f}, {-0.13052621f,-0.99144489f}, | ||||
| {-0.15643445f,-0.98768836f}, {-0.18223560f,-0.98325491f}, {-0.20791174f,-0.97814757f}, | ||||
| {-0.23344538f,-0.97236991f}, {-0.25881916f,-0.96592581f}, {-0.28401542f,-0.95881969f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.33380687f,-0.94264150f}, {-0.35836795f,-0.93358040f}, | ||||
| {-0.38268352f,-0.92387950f}, {-0.40673670f,-0.91354543f}, {-0.43051112f,-0.90258527f}, | ||||
| {-0.45399061f,-0.89100647f}, {-0.47715873f,-0.87881708f}, {-0.50000006f,-0.86602533f}, | ||||
| {-0.52249867f,-0.85264009f}, {-0.54463905f,-0.83867055f}, {-0.56640631f,-0.82412612f}, | ||||
| {-0.58778518f,-0.80901700f}, {-0.60876143f,-0.79335332f}, {-0.62932050f,-0.77714586f}, | ||||
| {-0.64944804f,-0.76040596f}, {-0.66913068f,-0.74314475f}, {-0.68835467f,-0.72537428f}, | ||||
| {-0.70710677f,-0.70710677f}, {-0.72537446f,-0.68835449f}, {-0.74314493f,-0.66913044f}, | ||||
| {-0.76040596f,-0.64944804f}, {-0.77714604f,-0.62932026f}, {-0.79335332f,-0.60876143f}, | ||||
| {-0.80901700f,-0.58778518f}, {-0.82412624f,-0.56640613f}, {-0.83867055f,-0.54463899f}, | ||||
| {-0.85264021f,-0.52249849f}, {-0.86602539f,-0.50000006f}, {-0.87881714f,-0.47715873f}, | ||||
| {-0.89100659f,-0.45399037f}, {-0.90258527f,-0.43051112f}, {-0.91354549f,-0.40673658f}, | ||||
| {-0.92387956f,-0.38268328f}, {-0.93358040f,-0.35836792f}, {-0.94264150f,-0.33380675f}, | ||||
| {-0.95105654f,-0.30901679f}, {-0.95881975f,-0.28401530f}, {-0.96592587f,-0.25881892f}, | ||||
| {-0.97236991f,-0.23344538f}, {-0.97814763f,-0.20791161f}, {-0.98325491f,-0.18223536f}, | ||||
| {-0.98768836f,-0.15643445f}, {-0.99144489f,-0.13052608f}, {-0.99452192f,-0.10452849f}, | ||||
| {-0.99691737f,-0.078459039f}, {-0.99862957f,-0.052335810f}, {-0.99965733f,-0.026176952f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99922901f,-0.039259817f}, {0.99691731f,-0.078459099f}, | ||||
| {0.99306846f,-0.11753740f}, {0.98768836f,-0.15643448f}, {0.98078525f,-0.19509032f}, | ||||
| {0.97236991f,-0.23344538f}, {0.96245521f,-0.27144045f}, {0.95105648f,-0.30901700f}, | ||||
| {0.93819129f,-0.34611708f}, {0.92387956f,-0.38268346f}, {0.90814316f,-0.41865975f}, | ||||
| {0.89100653f,-0.45399052f}, {0.87249601f,-0.48862126f}, {0.85264015f,-0.52249855f}, | ||||
| {0.83146960f,-0.55557024f}, {0.80901700f,-0.58778524f}, {0.78531694f,-0.61909395f}, | ||||
| {0.76040596f,-0.64944810f}, {0.73432249f,-0.67880076f}, {0.70710677f,-0.70710683f}, | ||||
| {0.67880070f,-0.73432255f}, {0.64944804f,-0.76040596f}, {0.61909395f,-0.78531694f}, | ||||
| {0.58778524f,-0.80901700f}, {0.55557019f,-0.83146960f}, {0.52249849f,-0.85264015f}, | ||||
| {0.48862118f,-0.87249601f}, {0.45399052f,-0.89100653f}, {0.41865975f,-0.90814316f}, | ||||
| {0.38268343f,-0.92387956f}, {0.34611705f,-0.93819135f}, {0.30901697f,-0.95105654f}, | ||||
| {0.27144039f,-0.96245527f}, {0.23344530f,-0.97236991f}, {0.19509023f,-0.98078531f}, | ||||
| {0.15643437f,-0.98768836f}, {0.11753740f,-0.99306846f}, {0.078459084f,-0.99691731f}, | ||||
| {0.039259788f,-0.99922901f}, {-4.3711388e-08f,-1.0000000f}, {-0.039259877f,-0.99922901f}, | ||||
| {-0.078459173f,-0.99691731f}, {-0.11753749f,-0.99306846f}, {-0.15643445f,-0.98768836f}, | ||||
| {-0.19509032f,-0.98078525f}, {-0.23344538f,-0.97236991f}, {-0.27144048f,-0.96245521f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.34611711f,-0.93819129f}, {-0.38268352f,-0.92387950f}, | ||||
| {-0.41865984f,-0.90814310f}, {-0.45399061f,-0.89100647f}, {-0.48862135f,-0.87249595f}, | ||||
| {-0.52249867f,-0.85264009f}, {-0.55557036f,-0.83146954f}, {-0.58778518f,-0.80901700f}, | ||||
| {-0.61909389f,-0.78531694f}, {-0.64944804f,-0.76040596f}, {-0.67880076f,-0.73432249f}, | ||||
| {-0.70710677f,-0.70710677f}, {-0.73432249f,-0.67880070f}, {-0.76040596f,-0.64944804f}, | ||||
| {-0.78531694f,-0.61909389f}, {-0.80901700f,-0.58778518f}, {-0.83146966f,-0.55557019f}, | ||||
| {-0.85264021f,-0.52249849f}, {-0.87249607f,-0.48862115f}, {-0.89100659f,-0.45399037f}, | ||||
| {-0.90814322f,-0.41865960f}, {-0.92387956f,-0.38268328f}, {-0.93819135f,-0.34611690f}, | ||||
| {-0.95105654f,-0.30901679f}, {-0.96245521f,-0.27144048f}, {-0.97236991f,-0.23344538f}, | ||||
| {-0.98078531f,-0.19509031f}, {-0.98768836f,-0.15643445f}, {-0.99306846f,-0.11753736f}, | ||||
| {-0.99691737f,-0.078459039f}, {-0.99922901f,-0.039259743f}, {-1.0000000f,8.7422777e-08f}, | ||||
| {-0.99922901f,0.039259918f}, {-0.99691731f,0.078459218f}, {-0.99306846f,0.11753753f}, | ||||
| {-0.98768830f,0.15643461f}, {-0.98078525f,0.19509049f}, {-0.97236985f,0.23344554f}, | ||||
| {-0.96245515f,0.27144065f}, {-0.95105654f,0.30901697f}, {-0.93819135f,0.34611705f}, | ||||
| {-0.92387956f,0.38268346f}, {-0.90814316f,0.41865975f}, {-0.89100653f,0.45399055f}, | ||||
| {-0.87249601f,0.48862129f}, {-0.85264015f,0.52249861f}, {-0.83146960f,0.55557030f}, | ||||
| {-0.80901694f,0.58778536f}, {-0.78531688f,0.61909401f}, {-0.76040590f,0.64944816f}, | ||||
| {-0.73432243f,0.67880082f}, {-0.70710665f,0.70710689f}, {-0.67880058f,0.73432261f}, | ||||
| {-0.64944792f,0.76040608f}, {-0.61909378f,0.78531706f}, {-0.58778507f,0.80901712f}, | ||||
| {-0.55557001f,0.83146977f}, {-0.52249837f,0.85264033f}, {-0.48862100f,0.87249613f}, | ||||
| {-0.45399022f,0.89100665f}, {-0.41865945f,0.90814328f}, {-0.38268313f,0.92387968f}, | ||||
| {-0.34611672f,0.93819147f}, {-0.30901709f,0.95105648f}, {-0.27144054f,0.96245521f}, | ||||
| {-0.23344545f,0.97236991f}, {-0.19509038f,0.98078525f}, {-0.15643452f,0.98768830f}, | ||||
| {-0.11753743f,0.99306846f}, {-0.078459114f,0.99691731f}, {-0.039259821f,0.99922901f}, | ||||
| }; | ||||
| static const ne10_fft_cpx_float32_t ne10_twiddles_240[240] = { | ||||
| {1.0000000f,0.0000000f}, {1.0000000f,-0.0000000f}, {1.0000000f,-0.0000000f}, | ||||
| {1.0000000f,-0.0000000f}, {0.91354543f,-0.40673664f}, {0.66913056f,-0.74314487f}, | ||||
| {1.0000000f,-0.0000000f}, {0.66913056f,-0.74314487f}, {-0.10452851f,-0.99452192f}, | ||||
| {1.0000000f,-0.0000000f}, {0.30901697f,-0.95105654f}, {-0.80901700f,-0.58778518f}, | ||||
| {1.0000000f,-0.0000000f}, {-0.10452851f,-0.99452192f}, {-0.97814757f,0.20791179f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99452192f,-0.10452846f}, {0.97814763f,-0.20791170f}, | ||||
| {0.95105648f,-0.30901700f}, {0.91354543f,-0.40673664f}, {0.86602545f,-0.50000000f}, | ||||
| {0.80901700f,-0.58778524f}, {0.74314475f,-0.66913062f}, {0.66913056f,-0.74314487f}, | ||||
| {0.58778524f,-0.80901700f}, {0.49999997f,-0.86602545f}, {0.40673661f,-0.91354549f}, | ||||
| {0.30901697f,-0.95105654f}, {0.20791166f,-0.97814763f}, {0.10452842f,-0.99452192f}, | ||||
| {1.0000000f,-0.0000000f}, {0.97814763f,-0.20791170f}, {0.91354543f,-0.40673664f}, | ||||
| {0.80901700f,-0.58778524f}, {0.66913056f,-0.74314487f}, {0.49999997f,-0.86602545f}, | ||||
| {0.30901697f,-0.95105654f}, {0.10452842f,-0.99452192f}, {-0.10452851f,-0.99452192f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.50000006f,-0.86602533f}, {-0.66913068f,-0.74314475f}, | ||||
| {-0.80901700f,-0.58778518f}, {-0.91354549f,-0.40673658f}, {-0.97814763f,-0.20791161f}, | ||||
| {1.0000000f,-0.0000000f}, {0.95105648f,-0.30901700f}, {0.80901700f,-0.58778524f}, | ||||
| {0.58778524f,-0.80901700f}, {0.30901697f,-0.95105654f}, {-4.3711388e-08f,-1.0000000f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.58778518f,-0.80901700f}, {-0.80901700f,-0.58778518f}, | ||||
| {-0.95105654f,-0.30901679f}, {-1.0000000f,8.7422777e-08f}, {-0.95105654f,0.30901697f}, | ||||
| {-0.80901694f,0.58778536f}, {-0.58778507f,0.80901712f}, {-0.30901709f,0.95105648f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99965733f,-0.026176950f}, {0.99862951f,-0.052335959f}, | ||||
| {0.99691731f,-0.078459099f}, {0.99452192f,-0.10452846f}, {0.99144489f,-0.13052620f}, | ||||
| {0.98768836f,-0.15643448f}, {0.98325491f,-0.18223552f}, {0.97814763f,-0.20791170f}, | ||||
| {0.97236991f,-0.23344538f}, {0.96592581f,-0.25881904f}, {0.95881975f,-0.28401536f}, | ||||
| {0.95105648f,-0.30901700f}, {0.94264150f,-0.33380687f}, {0.93358040f,-0.35836795f}, | ||||
| {0.92387956f,-0.38268346f}, {0.91354543f,-0.40673664f}, {0.90258527f,-0.43051112f}, | ||||
| {0.89100653f,-0.45399052f}, {0.87881708f,-0.47715878f}, {0.86602545f,-0.50000000f}, | ||||
| {0.85264015f,-0.52249855f}, {0.83867055f,-0.54463905f}, {0.82412618f,-0.56640625f}, | ||||
| {0.80901700f,-0.58778524f}, {0.79335332f,-0.60876143f}, {0.77714598f,-0.62932038f}, | ||||
| {0.76040596f,-0.64944810f}, {0.74314475f,-0.66913062f}, {0.72537434f,-0.68835455f}, | ||||
| {0.70710677f,-0.70710683f}, {0.68835455f,-0.72537440f}, {0.66913056f,-0.74314487f}, | ||||
| {0.64944804f,-0.76040596f}, {0.62932038f,-0.77714598f}, {0.60876137f,-0.79335338f}, | ||||
| {0.58778524f,-0.80901700f}, {0.56640625f,-0.82412618f}, {0.54463899f,-0.83867055f}, | ||||
| {0.52249849f,-0.85264015f}, {0.49999997f,-0.86602545f}, {0.47715876f,-0.87881708f}, | ||||
| {0.45399052f,-0.89100653f}, {0.43051103f,-0.90258533f}, {0.40673661f,-0.91354549f}, | ||||
| {0.38268343f,-0.92387956f}, {0.35836786f,-0.93358046f}, {0.33380681f,-0.94264150f}, | ||||
| {0.30901697f,-0.95105654f}, {0.28401533f,-0.95881975f}, {0.25881907f,-0.96592581f}, | ||||
| {0.23344530f,-0.97236991f}, {0.20791166f,-0.97814763f}, {0.18223552f,-0.98325491f}, | ||||
| {0.15643437f,-0.98768836f}, {0.13052613f,-0.99144489f}, {0.10452842f,-0.99452192f}, | ||||
| {0.078459084f,-0.99691731f}, {0.052335974f,-0.99862951f}, {0.026176875f,-0.99965733f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99862951f,-0.052335959f}, {0.99452192f,-0.10452846f}, | ||||
| {0.98768836f,-0.15643448f}, {0.97814763f,-0.20791170f}, {0.96592581f,-0.25881904f}, | ||||
| {0.95105648f,-0.30901700f}, {0.93358040f,-0.35836795f}, {0.91354543f,-0.40673664f}, | ||||
| {0.89100653f,-0.45399052f}, {0.86602545f,-0.50000000f}, {0.83867055f,-0.54463905f}, | ||||
| {0.80901700f,-0.58778524f}, {0.77714598f,-0.62932038f}, {0.74314475f,-0.66913062f}, | ||||
| {0.70710677f,-0.70710683f}, {0.66913056f,-0.74314487f}, {0.62932038f,-0.77714598f}, | ||||
| {0.58778524f,-0.80901700f}, {0.54463899f,-0.83867055f}, {0.49999997f,-0.86602545f}, | ||||
| {0.45399052f,-0.89100653f}, {0.40673661f,-0.91354549f}, {0.35836786f,-0.93358046f}, | ||||
| {0.30901697f,-0.95105654f}, {0.25881907f,-0.96592581f}, {0.20791166f,-0.97814763f}, | ||||
| {0.15643437f,-0.98768836f}, {0.10452842f,-0.99452192f}, {0.052335974f,-0.99862951f}, | ||||
| {-4.3711388e-08f,-1.0000000f}, {-0.052336060f,-0.99862951f}, {-0.10452851f,-0.99452192f}, | ||||
| {-0.15643445f,-0.98768836f}, {-0.20791174f,-0.97814757f}, {-0.25881916f,-0.96592581f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.35836795f,-0.93358040f}, {-0.40673670f,-0.91354543f}, | ||||
| {-0.45399061f,-0.89100647f}, {-0.50000006f,-0.86602533f}, {-0.54463905f,-0.83867055f}, | ||||
| {-0.58778518f,-0.80901700f}, {-0.62932050f,-0.77714586f}, {-0.66913068f,-0.74314475f}, | ||||
| {-0.70710677f,-0.70710677f}, {-0.74314493f,-0.66913044f}, {-0.77714604f,-0.62932026f}, | ||||
| {-0.80901700f,-0.58778518f}, {-0.83867055f,-0.54463899f}, {-0.86602539f,-0.50000006f}, | ||||
| {-0.89100659f,-0.45399037f}, {-0.91354549f,-0.40673658f}, {-0.93358040f,-0.35836792f}, | ||||
| {-0.95105654f,-0.30901679f}, {-0.96592587f,-0.25881892f}, {-0.97814763f,-0.20791161f}, | ||||
| {-0.98768836f,-0.15643445f}, {-0.99452192f,-0.10452849f}, {-0.99862957f,-0.052335810f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99691731f,-0.078459099f}, {0.98768836f,-0.15643448f}, | ||||
| {0.97236991f,-0.23344538f}, {0.95105648f,-0.30901700f}, {0.92387956f,-0.38268346f}, | ||||
| {0.89100653f,-0.45399052f}, {0.85264015f,-0.52249855f}, {0.80901700f,-0.58778524f}, | ||||
| {0.76040596f,-0.64944810f}, {0.70710677f,-0.70710683f}, {0.64944804f,-0.76040596f}, | ||||
| {0.58778524f,-0.80901700f}, {0.52249849f,-0.85264015f}, {0.45399052f,-0.89100653f}, | ||||
| {0.38268343f,-0.92387956f}, {0.30901697f,-0.95105654f}, {0.23344530f,-0.97236991f}, | ||||
| {0.15643437f,-0.98768836f}, {0.078459084f,-0.99691731f}, {-4.3711388e-08f,-1.0000000f}, | ||||
| {-0.078459173f,-0.99691731f}, {-0.15643445f,-0.98768836f}, {-0.23344538f,-0.97236991f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.38268352f,-0.92387950f}, {-0.45399061f,-0.89100647f}, | ||||
| {-0.52249867f,-0.85264009f}, {-0.58778518f,-0.80901700f}, {-0.64944804f,-0.76040596f}, | ||||
| {-0.70710677f,-0.70710677f}, {-0.76040596f,-0.64944804f}, {-0.80901700f,-0.58778518f}, | ||||
| {-0.85264021f,-0.52249849f}, {-0.89100659f,-0.45399037f}, {-0.92387956f,-0.38268328f}, | ||||
| {-0.95105654f,-0.30901679f}, {-0.97236991f,-0.23344538f}, {-0.98768836f,-0.15643445f}, | ||||
| {-0.99691737f,-0.078459039f}, {-1.0000000f,8.7422777e-08f}, {-0.99691731f,0.078459218f}, | ||||
| {-0.98768830f,0.15643461f}, {-0.97236985f,0.23344554f}, {-0.95105654f,0.30901697f}, | ||||
| {-0.92387956f,0.38268346f}, {-0.89100653f,0.45399055f}, {-0.85264015f,0.52249861f}, | ||||
| {-0.80901694f,0.58778536f}, {-0.76040590f,0.64944816f}, {-0.70710665f,0.70710689f}, | ||||
| {-0.64944792f,0.76040608f}, {-0.58778507f,0.80901712f}, {-0.52249837f,0.85264033f}, | ||||
| {-0.45399022f,0.89100665f}, {-0.38268313f,0.92387968f}, {-0.30901709f,0.95105648f}, | ||||
| {-0.23344545f,0.97236991f}, {-0.15643452f,0.98768830f}, {-0.078459114f,0.99691731f}, | ||||
| }; | ||||
| static const ne10_fft_cpx_float32_t ne10_twiddles_120[120] = { | ||||
| {1.0000000f,0.0000000f}, {1.0000000f,-0.0000000f}, {1.0000000f,-0.0000000f}, | ||||
| {1.0000000f,-0.0000000f}, {0.91354543f,-0.40673664f}, {0.66913056f,-0.74314487f}, | ||||
| {1.0000000f,-0.0000000f}, {0.66913056f,-0.74314487f}, {-0.10452851f,-0.99452192f}, | ||||
| {1.0000000f,-0.0000000f}, {0.30901697f,-0.95105654f}, {-0.80901700f,-0.58778518f}, | ||||
| {1.0000000f,-0.0000000f}, {-0.10452851f,-0.99452192f}, {-0.97814757f,0.20791179f}, | ||||
| {1.0000000f,-0.0000000f}, {0.97814763f,-0.20791170f}, {0.91354543f,-0.40673664f}, | ||||
| {0.80901700f,-0.58778524f}, {0.66913056f,-0.74314487f}, {0.49999997f,-0.86602545f}, | ||||
| {0.30901697f,-0.95105654f}, {0.10452842f,-0.99452192f}, {-0.10452851f,-0.99452192f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.50000006f,-0.86602533f}, {-0.66913068f,-0.74314475f}, | ||||
| {-0.80901700f,-0.58778518f}, {-0.91354549f,-0.40673658f}, {-0.97814763f,-0.20791161f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99862951f,-0.052335959f}, {0.99452192f,-0.10452846f}, | ||||
| {0.98768836f,-0.15643448f}, {0.97814763f,-0.20791170f}, {0.96592581f,-0.25881904f}, | ||||
| {0.95105648f,-0.30901700f}, {0.93358040f,-0.35836795f}, {0.91354543f,-0.40673664f}, | ||||
| {0.89100653f,-0.45399052f}, {0.86602545f,-0.50000000f}, {0.83867055f,-0.54463905f}, | ||||
| {0.80901700f,-0.58778524f}, {0.77714598f,-0.62932038f}, {0.74314475f,-0.66913062f}, | ||||
| {0.70710677f,-0.70710683f}, {0.66913056f,-0.74314487f}, {0.62932038f,-0.77714598f}, | ||||
| {0.58778524f,-0.80901700f}, {0.54463899f,-0.83867055f}, {0.49999997f,-0.86602545f}, | ||||
| {0.45399052f,-0.89100653f}, {0.40673661f,-0.91354549f}, {0.35836786f,-0.93358046f}, | ||||
| {0.30901697f,-0.95105654f}, {0.25881907f,-0.96592581f}, {0.20791166f,-0.97814763f}, | ||||
| {0.15643437f,-0.98768836f}, {0.10452842f,-0.99452192f}, {0.052335974f,-0.99862951f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99452192f,-0.10452846f}, {0.97814763f,-0.20791170f}, | ||||
| {0.95105648f,-0.30901700f}, {0.91354543f,-0.40673664f}, {0.86602545f,-0.50000000f}, | ||||
| {0.80901700f,-0.58778524f}, {0.74314475f,-0.66913062f}, {0.66913056f,-0.74314487f}, | ||||
| {0.58778524f,-0.80901700f}, {0.49999997f,-0.86602545f}, {0.40673661f,-0.91354549f}, | ||||
| {0.30901697f,-0.95105654f}, {0.20791166f,-0.97814763f}, {0.10452842f,-0.99452192f}, | ||||
| {-4.3711388e-08f,-1.0000000f}, {-0.10452851f,-0.99452192f}, {-0.20791174f,-0.97814757f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.40673670f,-0.91354543f}, {-0.50000006f,-0.86602533f}, | ||||
| {-0.58778518f,-0.80901700f}, {-0.66913068f,-0.74314475f}, {-0.74314493f,-0.66913044f}, | ||||
| {-0.80901700f,-0.58778518f}, {-0.86602539f,-0.50000006f}, {-0.91354549f,-0.40673658f}, | ||||
| {-0.95105654f,-0.30901679f}, {-0.97814763f,-0.20791161f}, {-0.99452192f,-0.10452849f}, | ||||
| {1.0000000f,-0.0000000f}, {0.98768836f,-0.15643448f}, {0.95105648f,-0.30901700f}, | ||||
| {0.89100653f,-0.45399052f}, {0.80901700f,-0.58778524f}, {0.70710677f,-0.70710683f}, | ||||
| {0.58778524f,-0.80901700f}, {0.45399052f,-0.89100653f}, {0.30901697f,-0.95105654f}, | ||||
| {0.15643437f,-0.98768836f}, {-4.3711388e-08f,-1.0000000f}, {-0.15643445f,-0.98768836f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.45399061f,-0.89100647f}, {-0.58778518f,-0.80901700f}, | ||||
| {-0.70710677f,-0.70710677f}, {-0.80901700f,-0.58778518f}, {-0.89100659f,-0.45399037f}, | ||||
| {-0.95105654f,-0.30901679f}, {-0.98768836f,-0.15643445f}, {-1.0000000f,8.7422777e-08f}, | ||||
| {-0.98768830f,0.15643461f}, {-0.95105654f,0.30901697f}, {-0.89100653f,0.45399055f}, | ||||
| {-0.80901694f,0.58778536f}, {-0.70710665f,0.70710689f}, {-0.58778507f,0.80901712f}, | ||||
| {-0.45399022f,0.89100665f}, {-0.30901709f,0.95105648f}, {-0.15643452f,0.98768830f}, | ||||
| }; | ||||
| static const ne10_fft_cpx_float32_t ne10_twiddles_60[60] = { | ||||
| {1.0000000f,0.0000000f}, {1.0000000f,-0.0000000f}, {1.0000000f,-0.0000000f}, | ||||
| {1.0000000f,-0.0000000f}, {0.91354543f,-0.40673664f}, {0.66913056f,-0.74314487f}, | ||||
| {1.0000000f,-0.0000000f}, {0.66913056f,-0.74314487f}, {-0.10452851f,-0.99452192f}, | ||||
| {1.0000000f,-0.0000000f}, {0.30901697f,-0.95105654f}, {-0.80901700f,-0.58778518f}, | ||||
| {1.0000000f,-0.0000000f}, {-0.10452851f,-0.99452192f}, {-0.97814757f,0.20791179f}, | ||||
| {1.0000000f,-0.0000000f}, {0.99452192f,-0.10452846f}, {0.97814763f,-0.20791170f}, | ||||
| {0.95105648f,-0.30901700f}, {0.91354543f,-0.40673664f}, {0.86602545f,-0.50000000f}, | ||||
| {0.80901700f,-0.58778524f}, {0.74314475f,-0.66913062f}, {0.66913056f,-0.74314487f}, | ||||
| {0.58778524f,-0.80901700f}, {0.49999997f,-0.86602545f}, {0.40673661f,-0.91354549f}, | ||||
| {0.30901697f,-0.95105654f}, {0.20791166f,-0.97814763f}, {0.10452842f,-0.99452192f}, | ||||
| {1.0000000f,-0.0000000f}, {0.97814763f,-0.20791170f}, {0.91354543f,-0.40673664f}, | ||||
| {0.80901700f,-0.58778524f}, {0.66913056f,-0.74314487f}, {0.49999997f,-0.86602545f}, | ||||
| {0.30901697f,-0.95105654f}, {0.10452842f,-0.99452192f}, {-0.10452851f,-0.99452192f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.50000006f,-0.86602533f}, {-0.66913068f,-0.74314475f}, | ||||
| {-0.80901700f,-0.58778518f}, {-0.91354549f,-0.40673658f}, {-0.97814763f,-0.20791161f}, | ||||
| {1.0000000f,-0.0000000f}, {0.95105648f,-0.30901700f}, {0.80901700f,-0.58778524f}, | ||||
| {0.58778524f,-0.80901700f}, {0.30901697f,-0.95105654f}, {-4.3711388e-08f,-1.0000000f}, | ||||
| {-0.30901703f,-0.95105648f}, {-0.58778518f,-0.80901700f}, {-0.80901700f,-0.58778518f}, | ||||
| {-0.95105654f,-0.30901679f}, {-1.0000000f,8.7422777e-08f}, {-0.95105654f,0.30901697f}, | ||||
| {-0.80901694f,0.58778536f}, {-0.58778507f,0.80901712f}, {-0.30901709f,0.95105648f}, | ||||
| }; | ||||
| static const ne10_fft_state_float32_t ne10_fft_state_float32_t_480 = { | ||||
| 120, | ||||
| (ne10_int32_t *)ne10_factors_480, | ||||
| (ne10_fft_cpx_float32_t *)ne10_twiddles_480, | ||||
| NULL, | ||||
| (ne10_fft_cpx_float32_t *)&ne10_twiddles_480[120], | ||||
| /* is_forward_scaled = true */ | ||||
| (ne10_int32_t) 1, | ||||
| /* is_backward_scaled = false */ | ||||
| (ne10_int32_t) 0, | ||||
| }; | ||||
| static const arch_fft_state cfg_arch_480 = { | ||||
| 1, | ||||
| (void *)&ne10_fft_state_float32_t_480, | ||||
| }; | ||||
| 
 | ||||
| static const ne10_fft_state_float32_t ne10_fft_state_float32_t_240 = { | ||||
| 60, | ||||
| (ne10_int32_t *)ne10_factors_240, | ||||
| (ne10_fft_cpx_float32_t *)ne10_twiddles_240, | ||||
| NULL, | ||||
| (ne10_fft_cpx_float32_t *)&ne10_twiddles_240[60], | ||||
| /* is_forward_scaled = true */ | ||||
| (ne10_int32_t) 1, | ||||
| /* is_backward_scaled = false */ | ||||
| (ne10_int32_t) 0, | ||||
| }; | ||||
| static const arch_fft_state cfg_arch_240 = { | ||||
| 1, | ||||
| (void *)&ne10_fft_state_float32_t_240, | ||||
| }; | ||||
| 
 | ||||
| static const ne10_fft_state_float32_t ne10_fft_state_float32_t_120 = { | ||||
| 30, | ||||
| (ne10_int32_t *)ne10_factors_120, | ||||
| (ne10_fft_cpx_float32_t *)ne10_twiddles_120, | ||||
| NULL, | ||||
| (ne10_fft_cpx_float32_t *)&ne10_twiddles_120[30], | ||||
| /* is_forward_scaled = true */ | ||||
| (ne10_int32_t) 1, | ||||
| /* is_backward_scaled = false */ | ||||
| (ne10_int32_t) 0, | ||||
| }; | ||||
| static const arch_fft_state cfg_arch_120 = { | ||||
| 1, | ||||
| (void *)&ne10_fft_state_float32_t_120, | ||||
| }; | ||||
| 
 | ||||
| static const ne10_fft_state_float32_t ne10_fft_state_float32_t_60 = { | ||||
| 15, | ||||
| (ne10_int32_t *)ne10_factors_60, | ||||
| (ne10_fft_cpx_float32_t *)ne10_twiddles_60, | ||||
| NULL, | ||||
| (ne10_fft_cpx_float32_t *)&ne10_twiddles_60[15], | ||||
| /* is_forward_scaled = true */ | ||||
| (ne10_int32_t) 1, | ||||
| /* is_backward_scaled = false */ | ||||
| (ne10_int32_t) 0, | ||||
| }; | ||||
| static const arch_fft_state cfg_arch_60 = { | ||||
| 1, | ||||
| (void *)&ne10_fft_state_float32_t_60, | ||||
| }; | ||||
| 
 | ||||
| #endif  /* end NE10_FFT_PARAMS48000_960 */ | ||||
							
								
								
									
										161
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_cwrs32.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										161
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_cwrs32.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,161 @@ | |||
| /* Copyright (c) 2008-2011 Xiph.Org Foundation, Mozilla Corporation,
 | ||||
|                            Gregory Maxwell | ||||
|    Written by Jean-Marc Valin, Gregory Maxwell, and Timothy B. Terriberry */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <stdio.h> | ||||
| #include <string.h> | ||||
| 
 | ||||
| #ifndef CUSTOM_MODES | ||||
| #define CUSTOM_MODES | ||||
| #else | ||||
| #define TEST_CUSTOM_MODES | ||||
| #endif | ||||
| 
 | ||||
| #define CELT_C | ||||
| #include "stack_alloc.h" | ||||
| #include "entenc.c" | ||||
| #include "entdec.c" | ||||
| #include "entcode.c" | ||||
| #include "cwrs.c" | ||||
| #include "mathops.c" | ||||
| #include "rate.h" | ||||
| 
 | ||||
| #define NMAX (240) | ||||
| #define KMAX (128) | ||||
| 
 | ||||
| #ifdef TEST_CUSTOM_MODES | ||||
| 
 | ||||
| #define NDIMS (44) | ||||
| static const int pn[NDIMS]={ | ||||
|    2,   3,   4,   5,   6,   7,   8,   9,  10, | ||||
|   11,  12,  13,  14,  15,  16,  18,  20,  22, | ||||
|   24,  26,  28,  30,  32,  36,  40,  44,  48, | ||||
|   52,  56,  60,  64,  72,  80,  88,  96, 104, | ||||
|  112, 120, 128, 144, 160, 176, 192, 208 | ||||
| }; | ||||
| static const int pkmax[NDIMS]={ | ||||
|  128, 128, 128, 128,  88,  52,  36,  26,  22, | ||||
|   18,  16,  15,  13,  12,  12,  11,  10,   9, | ||||
|    9,   8,   8,   7,   7,   7,   7,   6,   6, | ||||
|    6,   6,   6,   5,   5,   5,   5,   5,   5, | ||||
|    4,   4,   4,   4,   4,   4,   4,   4 | ||||
| }; | ||||
| 
 | ||||
| #else /* TEST_CUSTOM_MODES */ | ||||
| 
 | ||||
| #define NDIMS (22) | ||||
| static const int pn[NDIMS]={ | ||||
|    2,   3,   4,   6,   8,   9,  11,  12,  16, | ||||
|   18,  22,  24,  32,  36,  44,  48,  64,  72, | ||||
|   88,  96, 144, 176 | ||||
| }; | ||||
| static const int pkmax[NDIMS]={ | ||||
|  128, 128, 128,  88,  36,  26,  18,  16,  12, | ||||
|   11,   9,   9,   7,   7,   6,   6,   5,   5, | ||||
|    5,   5,   4,   4 | ||||
| }; | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| int main(void){ | ||||
|   int t; | ||||
|   int n; | ||||
|   ALLOC_STACK; | ||||
|   for(t=0;t<NDIMS;t++){ | ||||
|     int pseudo; | ||||
|     n=pn[t]; | ||||
|     for(pseudo=1;pseudo<41;pseudo++) | ||||
|     { | ||||
|       int k; | ||||
| #if defined(SMALL_FOOTPRINT) | ||||
|       opus_uint32 uu[KMAX+2U]; | ||||
| #endif | ||||
|       opus_uint32 inc; | ||||
|       opus_uint32 nc; | ||||
|       opus_uint32 i; | ||||
|       k=get_pulses(pseudo); | ||||
|       if (k>pkmax[t])break; | ||||
|       printf("Testing CWRS with N=%i, K=%i...\n",n,k); | ||||
| #if defined(SMALL_FOOTPRINT) | ||||
|       nc=ncwrs_urow(n,k,uu); | ||||
| #else | ||||
|       nc=CELT_PVQ_V(n,k); | ||||
| #endif | ||||
|       inc=nc/20000; | ||||
|       if(inc<1)inc=1; | ||||
|       for(i=0;i<nc;i+=inc){ | ||||
| #if defined(SMALL_FOOTPRINT) | ||||
|         opus_uint32 u[KMAX+2U]; | ||||
| #endif | ||||
|         int         y[NMAX]; | ||||
|         int         sy; | ||||
|         opus_uint32 v; | ||||
|         opus_uint32 ii; | ||||
|         int         j; | ||||
| #if defined(SMALL_FOOTPRINT) | ||||
|         memcpy(u,uu,(k+2U)*sizeof(*u)); | ||||
|         cwrsi(n,k,i,y,u); | ||||
| #else | ||||
|         cwrsi(n,k,i,y); | ||||
| #endif | ||||
|         sy=0; | ||||
|         for(j=0;j<n;j++)sy+=abs(y[j]); | ||||
|         if(sy!=k){ | ||||
|           fprintf(stderr,"N=%d Pulse count mismatch in cwrsi (%d!=%d).\n", | ||||
|            n,sy,k); | ||||
|           return 99; | ||||
|         } | ||||
|         /*printf("%6u of %u:",i,nc);
 | ||||
|         for(j=0;j<n;j++)printf(" %+3i",y[j]); | ||||
|         printf(" ->");*/ | ||||
| #if defined(SMALL_FOOTPRINT) | ||||
|         ii=icwrs(n,k,&v,y,u); | ||||
| #else | ||||
|         ii=icwrs(n,y); | ||||
|         v=CELT_PVQ_V(n,k); | ||||
| #endif | ||||
|         if(ii!=i){ | ||||
|           fprintf(stderr,"Combination-index mismatch (%lu!=%lu).\n", | ||||
|            (long)ii,(long)i); | ||||
|           return 1; | ||||
|         } | ||||
|         if(v!=nc){ | ||||
|           fprintf(stderr,"Combination count mismatch (%lu!=%lu).\n", | ||||
|            (long)v,(long)nc); | ||||
|           return 2; | ||||
|         } | ||||
|         /*printf(" %6u\n",i);*/ | ||||
|       } | ||||
|       /*printf("\n");*/ | ||||
|     } | ||||
|   } | ||||
|   return 0; | ||||
| } | ||||
							
								
								
									
										179
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_dft.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										179
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_dft.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,179 @@ | |||
| /* Copyright (c) 2008 Xiph.Org Foundation
 | ||||
|    Written by Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <stdio.h> | ||||
| 
 | ||||
| #include "stack_alloc.h" | ||||
| #include "kiss_fft.h" | ||||
| #include "mathops.h" | ||||
| #include "modes.h" | ||||
| 
 | ||||
| #ifndef M_PI | ||||
| #define M_PI 3.141592653 | ||||
| #endif | ||||
| 
 | ||||
| int ret = 0; | ||||
| 
 | ||||
| void check(kiss_fft_cpx  * in,kiss_fft_cpx  * out,int nfft,int isinverse) | ||||
| { | ||||
|     int bin,k; | ||||
|     double errpow=0,sigpow=0, snr; | ||||
| 
 | ||||
|     for (bin=0;bin<nfft;++bin) { | ||||
|         double ansr = 0; | ||||
|         double ansi = 0; | ||||
|         double difr; | ||||
|         double difi; | ||||
| 
 | ||||
|         for (k=0;k<nfft;++k) { | ||||
|             double phase = -2*M_PI*bin*k/nfft; | ||||
|             double re = cos(phase); | ||||
|             double im = sin(phase); | ||||
|             if (isinverse) | ||||
|                 im = -im; | ||||
| 
 | ||||
|             if (!isinverse) | ||||
|             { | ||||
|                re /= nfft; | ||||
|                im /= nfft; | ||||
|             } | ||||
| 
 | ||||
|             ansr += in[k].r * re - in[k].i * im; | ||||
|             ansi += in[k].r * im + in[k].i * re; | ||||
|         } | ||||
|         /*printf ("%d %d ", (int)ansr, (int)ansi);*/ | ||||
|         difr = ansr - out[bin].r; | ||||
|         difi = ansi - out[bin].i; | ||||
|         errpow += difr*difr + difi*difi; | ||||
|         sigpow += ansr*ansr+ansi*ansi; | ||||
|     } | ||||
|     snr = 10*log10(sigpow/errpow); | ||||
|     printf("nfft=%d inverse=%d,snr = %f\n",nfft,isinverse,snr ); | ||||
|     if (snr<60) { | ||||
|        printf( "** poor snr: %f ** \n", snr); | ||||
|        ret = 1; | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| void test1d(int nfft,int isinverse,int arch) | ||||
| { | ||||
|     size_t buflen = sizeof(kiss_fft_cpx)*nfft; | ||||
|     kiss_fft_cpx *in; | ||||
|     kiss_fft_cpx *out; | ||||
|     int k; | ||||
| #ifdef CUSTOM_MODES | ||||
|     kiss_fft_state *cfg = opus_fft_alloc(nfft,0,0,arch); | ||||
| #else | ||||
|     int id; | ||||
|     const kiss_fft_state *cfg; | ||||
|     CELTMode *mode = opus_custom_mode_create(48000, 960, NULL); | ||||
|     if (nfft == 480) id = 0; | ||||
|     else if (nfft == 240) id = 1; | ||||
|     else if (nfft == 120) id = 2; | ||||
|     else if (nfft == 60) id = 3; | ||||
|     else return; | ||||
|     cfg = mode->mdct.kfft[id]; | ||||
| #endif | ||||
| 
 | ||||
|     in = (kiss_fft_cpx*)malloc(buflen); | ||||
|     out = (kiss_fft_cpx*)malloc(buflen); | ||||
| 
 | ||||
|     for (k=0;k<nfft;++k) { | ||||
|         in[k].r = (rand() % 32767) - 16384; | ||||
|         in[k].i = (rand() % 32767) - 16384; | ||||
|     } | ||||
| 
 | ||||
|     for (k=0;k<nfft;++k) { | ||||
|        in[k].r *= 32768; | ||||
|        in[k].i *= 32768; | ||||
|     } | ||||
| 
 | ||||
|     if (isinverse) | ||||
|     { | ||||
|        for (k=0;k<nfft;++k) { | ||||
|           in[k].r /= nfft; | ||||
|           in[k].i /= nfft; | ||||
|        } | ||||
|     } | ||||
| 
 | ||||
|     /*for (k=0;k<nfft;++k) printf("%d %d ", in[k].r, in[k].i);printf("\n");*/ | ||||
| 
 | ||||
|     if (isinverse) | ||||
|        opus_ifft(cfg,in,out, arch); | ||||
|     else | ||||
|        opus_fft(cfg,in,out, arch); | ||||
| 
 | ||||
|     /*for (k=0;k<nfft;++k) printf("%d %d ", out[k].r, out[k].i);printf("\n");*/ | ||||
| 
 | ||||
|     check(in,out,nfft,isinverse); | ||||
| 
 | ||||
|     free(in); | ||||
|     free(out); | ||||
| #ifdef CUSTOM_MODES | ||||
|     opus_fft_free(cfg, arch); | ||||
| #endif | ||||
| } | ||||
| 
 | ||||
| int main(int argc,char ** argv) | ||||
| { | ||||
|     ALLOC_STACK; | ||||
|     int arch = opus_select_arch(); | ||||
| 
 | ||||
|     if (argc>1) { | ||||
|         int k; | ||||
|         for (k=1;k<argc;++k) { | ||||
|             test1d(atoi(argv[k]),0,arch); | ||||
|             test1d(atoi(argv[k]),1,arch); | ||||
|         } | ||||
|     }else{ | ||||
|         test1d(32,0,arch); | ||||
|         test1d(32,1,arch); | ||||
|         test1d(128,0,arch); | ||||
|         test1d(128,1,arch); | ||||
|         test1d(256,0,arch); | ||||
|         test1d(256,1,arch); | ||||
| #ifndef RADIX_TWO_ONLY | ||||
|         test1d(36,0,arch); | ||||
|         test1d(36,1,arch); | ||||
|         test1d(50,0,arch); | ||||
|         test1d(50,1,arch); | ||||
|         test1d(60,0,arch); | ||||
|         test1d(60,1,arch); | ||||
|         test1d(120,0,arch); | ||||
|         test1d(120,1,arch); | ||||
|         test1d(240,0,arch); | ||||
|         test1d(240,1,arch); | ||||
|         test1d(480,0,arch); | ||||
|         test1d(480,1,arch); | ||||
| #endif | ||||
|     } | ||||
|     return ret; | ||||
| } | ||||
							
								
								
									
										383
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_entropy.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										383
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_entropy.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,383 @@ | |||
| /* Copyright (c) 2007-2011 Xiph.Org Foundation, Mozilla Corporation,
 | ||||
|                            Gregory Maxwell | ||||
|    Written by Jean-Marc Valin, Gregory Maxwell, and Timothy B. Terriberry */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <stdlib.h> | ||||
| #include <stdio.h> | ||||
| #include <math.h> | ||||
| #include <time.h> | ||||
| #define CELT_C | ||||
| #include "entcode.h" | ||||
| #include "entenc.h" | ||||
| #include "entdec.h" | ||||
| #include <string.h> | ||||
| 
 | ||||
| #include "entenc.c" | ||||
| #include "entdec.c" | ||||
| #include "entcode.c" | ||||
| 
 | ||||
| #ifndef M_LOG2E | ||||
| # define M_LOG2E    1.4426950408889634074 | ||||
| #endif | ||||
| #define DATA_SIZE 10000000 | ||||
| #define DATA_SIZE2 10000 | ||||
| 
 | ||||
| int main(int _argc,char **_argv){ | ||||
|   ec_enc         enc; | ||||
|   ec_dec         dec; | ||||
|   long           nbits; | ||||
|   long           nbits2; | ||||
|   double         entropy; | ||||
|   int            ft; | ||||
|   int            ftb; | ||||
|   int            sz; | ||||
|   int            i; | ||||
|   int            ret; | ||||
|   unsigned int   sym; | ||||
|   unsigned int   seed; | ||||
|   unsigned char *ptr; | ||||
|   const char    *env_seed; | ||||
|   ret=0; | ||||
|   entropy=0; | ||||
|   if (_argc > 2) { | ||||
|     fprintf(stderr, "Usage: %s [<seed>]\n", _argv[0]); | ||||
|     return 1; | ||||
|   } | ||||
|   env_seed = getenv("SEED"); | ||||
|   if (_argc > 1) | ||||
|     seed = atoi(_argv[1]); | ||||
|   else if (env_seed) | ||||
|     seed = atoi(env_seed); | ||||
|   else | ||||
|     seed = time(NULL); | ||||
|   /*Testing encoding of raw bit values.*/ | ||||
|   ptr = (unsigned char *)malloc(DATA_SIZE); | ||||
|   ec_enc_init(&enc,ptr, DATA_SIZE); | ||||
|   for(ft=2;ft<1024;ft++){ | ||||
|     for(i=0;i<ft;i++){ | ||||
|       entropy+=log(ft)*M_LOG2E; | ||||
|       ec_enc_uint(&enc,i,ft); | ||||
|     } | ||||
|   } | ||||
|   /*Testing encoding of raw bit values.*/ | ||||
|   for(ftb=1;ftb<16;ftb++){ | ||||
|     for(i=0;i<(1<<ftb);i++){ | ||||
|       entropy+=ftb; | ||||
|       nbits=ec_tell(&enc); | ||||
|       ec_enc_bits(&enc,i,ftb); | ||||
|       nbits2=ec_tell(&enc); | ||||
|       if(nbits2-nbits!=ftb){ | ||||
|         fprintf(stderr,"Used %li bits to encode %i bits directly.\n", | ||||
|          nbits2-nbits,ftb); | ||||
|         ret=-1; | ||||
|       } | ||||
|     } | ||||
|   } | ||||
|   nbits=ec_tell_frac(&enc); | ||||
|   ec_enc_done(&enc); | ||||
|   fprintf(stderr, | ||||
|    "Encoded %0.2lf bits of entropy to %0.2lf bits (%0.3lf%% wasted).\n", | ||||
|    entropy,ldexp(nbits,-3),100*(nbits-ldexp(entropy,3))/nbits); | ||||
|   fprintf(stderr,"Packed to %li bytes.\n",(long)ec_range_bytes(&enc)); | ||||
|   ec_dec_init(&dec,ptr,DATA_SIZE); | ||||
|   for(ft=2;ft<1024;ft++){ | ||||
|     for(i=0;i<ft;i++){ | ||||
|       sym=ec_dec_uint(&dec,ft); | ||||
|       if(sym!=(unsigned)i){ | ||||
|         fprintf(stderr,"Decoded %i instead of %i with ft of %i.\n",sym,i,ft); | ||||
|         ret=-1; | ||||
|       } | ||||
|     } | ||||
|   } | ||||
|   for(ftb=1;ftb<16;ftb++){ | ||||
|     for(i=0;i<(1<<ftb);i++){ | ||||
|       sym=ec_dec_bits(&dec,ftb); | ||||
|       if(sym!=(unsigned)i){ | ||||
|         fprintf(stderr,"Decoded %i instead of %i with ftb of %i.\n",sym,i,ftb); | ||||
|         ret=-1; | ||||
|       } | ||||
|     } | ||||
|   } | ||||
|   nbits2=ec_tell_frac(&dec); | ||||
|   if(nbits!=nbits2){ | ||||
|     fprintf(stderr, | ||||
|      "Reported number of bits used was %0.2lf, should be %0.2lf.\n", | ||||
|      ldexp(nbits2,-3),ldexp(nbits,-3)); | ||||
|     ret=-1; | ||||
|   } | ||||
|   /*Testing an encoder bust prefers range coder data over raw bits.
 | ||||
|     This isn't a general guarantee, will only work for data that is buffered in | ||||
|      the encoder state and not yet stored in the user buffer, and should never | ||||
|      get used in practice. | ||||
|     It's mostly here for code coverage completeness.*/ | ||||
|   /*Start with a 16-bit buffer.*/ | ||||
|   ec_enc_init(&enc,ptr,2); | ||||
|   /*Write 7 raw bits.*/ | ||||
|   ec_enc_bits(&enc,0x55,7); | ||||
|   /*Write 12.3 bits of range coder data.*/ | ||||
|   ec_enc_uint(&enc,1,2); | ||||
|   ec_enc_uint(&enc,1,3); | ||||
|   ec_enc_uint(&enc,1,4); | ||||
|   ec_enc_uint(&enc,1,5); | ||||
|   ec_enc_uint(&enc,2,6); | ||||
|   ec_enc_uint(&enc,6,7); | ||||
|   ec_enc_done(&enc); | ||||
|   ec_dec_init(&dec,ptr,2); | ||||
|   if(!enc.error | ||||
|    /*The raw bits should have been overwritten by the range coder data.*/ | ||||
|    ||ec_dec_bits(&dec,7)!=0x05 | ||||
|    /*And all the range coder data should have been encoded correctly.*/ | ||||
|    ||ec_dec_uint(&dec,2)!=1 | ||||
|    ||ec_dec_uint(&dec,3)!=1 | ||||
|    ||ec_dec_uint(&dec,4)!=1 | ||||
|    ||ec_dec_uint(&dec,5)!=1 | ||||
|    ||ec_dec_uint(&dec,6)!=2 | ||||
|    ||ec_dec_uint(&dec,7)!=6){ | ||||
|     fprintf(stderr,"Encoder bust overwrote range coder data with raw bits.\n"); | ||||
|     ret=-1; | ||||
|   } | ||||
|   srand(seed); | ||||
|   fprintf(stderr,"Testing random streams... Random seed: %u (%.4X)\n", seed, rand() % 65536); | ||||
|   for(i=0;i<409600;i++){ | ||||
|     unsigned *data; | ||||
|     unsigned *tell; | ||||
|     unsigned tell_bits; | ||||
|     int       j; | ||||
|     int zeros; | ||||
|     ft=rand()/((RAND_MAX>>(rand()%11U))+1U)+10; | ||||
|     sz=rand()/((RAND_MAX>>(rand()%9U))+1U); | ||||
|     data=(unsigned *)malloc(sz*sizeof(*data)); | ||||
|     tell=(unsigned *)malloc((sz+1)*sizeof(*tell)); | ||||
|     ec_enc_init(&enc,ptr,DATA_SIZE2); | ||||
|     zeros = rand()%13==0; | ||||
|     tell[0]=ec_tell_frac(&enc); | ||||
|     for(j=0;j<sz;j++){ | ||||
|       if (zeros) | ||||
|         data[j]=0; | ||||
|       else | ||||
|         data[j]=rand()%ft; | ||||
|       ec_enc_uint(&enc,data[j],ft); | ||||
|       tell[j+1]=ec_tell_frac(&enc); | ||||
|     } | ||||
|     if (rand()%2==0) | ||||
|       while(ec_tell(&enc)%8 != 0) | ||||
|         ec_enc_uint(&enc, rand()%2, 2); | ||||
|     tell_bits = ec_tell(&enc); | ||||
|     ec_enc_done(&enc); | ||||
|     if(tell_bits!=(unsigned)ec_tell(&enc)){ | ||||
|       fprintf(stderr,"ec_tell() changed after ec_enc_done(): %i instead of %i (Random seed: %u)\n", | ||||
|        ec_tell(&enc),tell_bits,seed); | ||||
|       ret=-1; | ||||
|     } | ||||
|     if ((tell_bits+7)/8 < ec_range_bytes(&enc)) | ||||
|     { | ||||
|       fprintf (stderr, "ec_tell() lied, there's %i bytes instead of %d (Random seed: %u)\n", | ||||
|                ec_range_bytes(&enc), (tell_bits+7)/8,seed); | ||||
|       ret=-1; | ||||
|     } | ||||
|     ec_dec_init(&dec,ptr,DATA_SIZE2); | ||||
|     if(ec_tell_frac(&dec)!=tell[0]){ | ||||
|       fprintf(stderr, | ||||
|        "Tell mismatch between encoder and decoder at symbol %i: %i instead of %i (Random seed: %u).\n", | ||||
|        0,ec_tell_frac(&dec),tell[0],seed); | ||||
|     } | ||||
|     for(j=0;j<sz;j++){ | ||||
|       sym=ec_dec_uint(&dec,ft); | ||||
|       if(sym!=data[j]){ | ||||
|         fprintf(stderr, | ||||
|          "Decoded %i instead of %i with ft of %i at position %i of %i (Random seed: %u).\n", | ||||
|          sym,data[j],ft,j,sz,seed); | ||||
|         ret=-1; | ||||
|       } | ||||
|       if(ec_tell_frac(&dec)!=tell[j+1]){ | ||||
|         fprintf(stderr, | ||||
|          "Tell mismatch between encoder and decoder at symbol %i: %i instead of %i (Random seed: %u).\n", | ||||
|          j+1,ec_tell_frac(&dec),tell[j+1],seed); | ||||
|       } | ||||
|     } | ||||
|     free(tell); | ||||
|     free(data); | ||||
|   } | ||||
|   /*Test compatibility between multiple different encode/decode routines.*/ | ||||
|   for(i=0;i<409600;i++){ | ||||
|     unsigned *logp1; | ||||
|     unsigned *data; | ||||
|     unsigned *tell; | ||||
|     unsigned *enc_method; | ||||
|     int       j; | ||||
|     sz=rand()/((RAND_MAX>>(rand()%9U))+1U); | ||||
|     logp1=(unsigned *)malloc(sz*sizeof(*logp1)); | ||||
|     data=(unsigned *)malloc(sz*sizeof(*data)); | ||||
|     tell=(unsigned *)malloc((sz+1)*sizeof(*tell)); | ||||
|     enc_method=(unsigned *)malloc(sz*sizeof(*enc_method)); | ||||
|     ec_enc_init(&enc,ptr,DATA_SIZE2); | ||||
|     tell[0]=ec_tell_frac(&enc); | ||||
|     for(j=0;j<sz;j++){ | ||||
|       data[j]=rand()/((RAND_MAX>>1)+1); | ||||
|       logp1[j]=(rand()%15)+1; | ||||
|       enc_method[j]=rand()/((RAND_MAX>>2)+1); | ||||
|       switch(enc_method[j]){ | ||||
|         case 0:{ | ||||
|           ec_encode(&enc,data[j]?(1<<logp1[j])-1:0, | ||||
|            (1<<logp1[j])-(data[j]?0:1),1<<logp1[j]); | ||||
|         }break; | ||||
|         case 1:{ | ||||
|           ec_encode_bin(&enc,data[j]?(1<<logp1[j])-1:0, | ||||
|            (1<<logp1[j])-(data[j]?0:1),logp1[j]); | ||||
|         }break; | ||||
|         case 2:{ | ||||
|           ec_enc_bit_logp(&enc,data[j],logp1[j]); | ||||
|         }break; | ||||
|         case 3:{ | ||||
|           unsigned char icdf[2]; | ||||
|           icdf[0]=1; | ||||
|           icdf[1]=0; | ||||
|           ec_enc_icdf(&enc,data[j],icdf,logp1[j]); | ||||
|         }break; | ||||
|       } | ||||
|       tell[j+1]=ec_tell_frac(&enc); | ||||
|     } | ||||
|     ec_enc_done(&enc); | ||||
|     if((ec_tell(&enc)+7U)/8U<ec_range_bytes(&enc)){ | ||||
|       fprintf(stderr,"tell() lied, there's %i bytes instead of %d (Random seed: %u)\n", | ||||
|        ec_range_bytes(&enc),(ec_tell(&enc)+7)/8,seed); | ||||
|       ret=-1; | ||||
|     } | ||||
|     ec_dec_init(&dec,ptr,DATA_SIZE2); | ||||
|     if(ec_tell_frac(&dec)!=tell[0]){ | ||||
|       fprintf(stderr, | ||||
|        "Tell mismatch between encoder and decoder at symbol %i: %i instead of %i (Random seed: %u).\n", | ||||
|        0,ec_tell_frac(&dec),tell[0],seed); | ||||
|     } | ||||
|     for(j=0;j<sz;j++){ | ||||
|       int fs; | ||||
|       int dec_method; | ||||
|       dec_method=rand()/((RAND_MAX>>2)+1); | ||||
|       switch(dec_method){ | ||||
|         case 0:{ | ||||
|           fs=ec_decode(&dec,1<<logp1[j]); | ||||
|           sym=fs>=(1<<logp1[j])-1; | ||||
|           ec_dec_update(&dec,sym?(1<<logp1[j])-1:0, | ||||
|            (1<<logp1[j])-(sym?0:1),1<<logp1[j]); | ||||
|         }break; | ||||
|         case 1:{ | ||||
|           fs=ec_decode_bin(&dec,logp1[j]); | ||||
|           sym=fs>=(1<<logp1[j])-1; | ||||
|           ec_dec_update(&dec,sym?(1<<logp1[j])-1:0, | ||||
|            (1<<logp1[j])-(sym?0:1),1<<logp1[j]); | ||||
|         }break; | ||||
|         case 2:{ | ||||
|           sym=ec_dec_bit_logp(&dec,logp1[j]); | ||||
|         }break; | ||||
|         case 3:{ | ||||
|           unsigned char icdf[2]; | ||||
|           icdf[0]=1; | ||||
|           icdf[1]=0; | ||||
|           sym=ec_dec_icdf(&dec,icdf,logp1[j]); | ||||
|         }break; | ||||
|       } | ||||
|       if(sym!=data[j]){ | ||||
|         fprintf(stderr, | ||||
|          "Decoded %i instead of %i with logp1 of %i at position %i of %i (Random seed: %u).\n", | ||||
|          sym,data[j],logp1[j],j,sz,seed); | ||||
|         fprintf(stderr,"Encoding method: %i, decoding method: %i\n", | ||||
|          enc_method[j],dec_method); | ||||
|         ret=-1; | ||||
|       } | ||||
|       if(ec_tell_frac(&dec)!=tell[j+1]){ | ||||
|         fprintf(stderr, | ||||
|          "Tell mismatch between encoder and decoder at symbol %i: %i instead of %i (Random seed: %u).\n", | ||||
|          j+1,ec_tell_frac(&dec),tell[j+1],seed); | ||||
|       } | ||||
|     } | ||||
|     free(enc_method); | ||||
|     free(tell); | ||||
|     free(data); | ||||
|     free(logp1); | ||||
|   } | ||||
|   ec_enc_init(&enc,ptr,DATA_SIZE2); | ||||
|   ec_enc_bit_logp(&enc,0,1); | ||||
|   ec_enc_bit_logp(&enc,0,1); | ||||
|   ec_enc_bit_logp(&enc,0,1); | ||||
|   ec_enc_bit_logp(&enc,0,1); | ||||
|   ec_enc_bit_logp(&enc,0,2); | ||||
|   ec_enc_patch_initial_bits(&enc,3,2); | ||||
|   if(enc.error){ | ||||
|     fprintf(stderr,"patch_initial_bits failed"); | ||||
|     ret=-1; | ||||
|   } | ||||
|   ec_enc_patch_initial_bits(&enc,0,5); | ||||
|   if(!enc.error){ | ||||
|     fprintf(stderr,"patch_initial_bits didn't fail when it should have"); | ||||
|     ret=-1; | ||||
|   } | ||||
|   ec_enc_done(&enc); | ||||
|   if(ec_range_bytes(&enc)!=1||ptr[0]!=192){ | ||||
|     fprintf(stderr,"Got %d when expecting 192 for patch_initial_bits",ptr[0]); | ||||
|     ret=-1; | ||||
|   } | ||||
|   ec_enc_init(&enc,ptr,DATA_SIZE2); | ||||
|   ec_enc_bit_logp(&enc,0,1); | ||||
|   ec_enc_bit_logp(&enc,0,1); | ||||
|   ec_enc_bit_logp(&enc,1,6); | ||||
|   ec_enc_bit_logp(&enc,0,2); | ||||
|   ec_enc_patch_initial_bits(&enc,0,2); | ||||
|   if(enc.error){ | ||||
|     fprintf(stderr,"patch_initial_bits failed"); | ||||
|     ret=-1; | ||||
|   } | ||||
|   ec_enc_done(&enc); | ||||
|   if(ec_range_bytes(&enc)!=2||ptr[0]!=63){ | ||||
|     fprintf(stderr,"Got %d when expecting 63 for patch_initial_bits",ptr[0]); | ||||
|     ret=-1; | ||||
|   } | ||||
|   ec_enc_init(&enc,ptr,2); | ||||
|   ec_enc_bit_logp(&enc,0,2); | ||||
|   for(i=0;i<48;i++){ | ||||
|     ec_enc_bits(&enc,0,1); | ||||
|   } | ||||
|   ec_enc_done(&enc); | ||||
|   if(!enc.error){ | ||||
|     fprintf(stderr,"Raw bits overfill didn't fail when it should have"); | ||||
|     ret=-1; | ||||
|   } | ||||
|   ec_enc_init(&enc,ptr,2); | ||||
|   for(i=0;i<17;i++){ | ||||
|     ec_enc_bits(&enc,0,1); | ||||
|   } | ||||
|   ec_enc_done(&enc); | ||||
|   if(!enc.error){ | ||||
|     fprintf(stderr,"17 raw bits encoded in two bytes"); | ||||
|     ret=-1; | ||||
|   } | ||||
|   free(ptr); | ||||
|   return ret; | ||||
| } | ||||
							
								
								
									
										93
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_laplace.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										93
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_laplace.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,93 @@ | |||
| /* Copyright (c) 2008-2011 Xiph.Org Foundation, Mozilla Corporation
 | ||||
|    Written by Jean-Marc Valin and Timothy B. Terriberry */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <stdio.h> | ||||
| #include <stdlib.h> | ||||
| #define CELT_C | ||||
| #include "laplace.h" | ||||
| #include "stack_alloc.h" | ||||
| 
 | ||||
| #include "entenc.c" | ||||
| #include "entdec.c" | ||||
| #include "entcode.c" | ||||
| #include "laplace.c" | ||||
| 
 | ||||
| #define DATA_SIZE 40000 | ||||
| 
 | ||||
| int ec_laplace_get_start_freq(int decay) | ||||
| { | ||||
|    opus_uint32 ft = 32768 - LAPLACE_MINP*(2*LAPLACE_NMIN+1); | ||||
|    int fs = (ft*(16384-decay))/(16384+decay); | ||||
|    return fs+LAPLACE_MINP; | ||||
| } | ||||
| 
 | ||||
| int main(void) | ||||
| { | ||||
|    int i; | ||||
|    int ret = 0; | ||||
|    ec_enc enc; | ||||
|    ec_dec dec; | ||||
|    unsigned char *ptr; | ||||
|    int val[10000], decay[10000]; | ||||
|    ALLOC_STACK; | ||||
|    ptr = (unsigned char *)malloc(DATA_SIZE); | ||||
|    ec_enc_init(&enc,ptr,DATA_SIZE); | ||||
| 
 | ||||
|    val[0] = 3; decay[0] = 6000; | ||||
|    val[1] = 0; decay[1] = 5800; | ||||
|    val[2] = -1; decay[2] = 5600; | ||||
|    for (i=3;i<10000;i++) | ||||
|    { | ||||
|       val[i] = rand()%15-7; | ||||
|       decay[i] = rand()%11000+5000; | ||||
|    } | ||||
|    for (i=0;i<10000;i++) | ||||
|       ec_laplace_encode(&enc, &val[i], | ||||
|             ec_laplace_get_start_freq(decay[i]), decay[i]); | ||||
| 
 | ||||
|    ec_enc_done(&enc); | ||||
| 
 | ||||
|    ec_dec_init(&dec,ec_get_buffer(&enc),ec_range_bytes(&enc)); | ||||
| 
 | ||||
|    for (i=0;i<10000;i++) | ||||
|    { | ||||
|       int d = ec_laplace_decode(&dec, | ||||
|             ec_laplace_get_start_freq(decay[i]), decay[i]); | ||||
|       if (d != val[i]) | ||||
|       { | ||||
|          fprintf (stderr, "Got %d instead of %d\n", d, val[i]); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| 
 | ||||
|    free(ptr); | ||||
|    return ret; | ||||
| } | ||||
							
								
								
									
										266
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_mathops.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										266
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_mathops.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,266 @@ | |||
| /* Copyright (c) 2008-2011 Xiph.Org Foundation, Mozilla Corporation,
 | ||||
|                            Gregory Maxwell | ||||
|    Written by Jean-Marc Valin, Gregory Maxwell, and Timothy B. Terriberry */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #ifndef CUSTOM_MODES | ||||
| #define CUSTOM_MODES | ||||
| #endif | ||||
| 
 | ||||
| #include <stdio.h> | ||||
| #include <math.h> | ||||
| #include "mathops.h" | ||||
| #include "bands.h" | ||||
| 
 | ||||
| #ifdef FIXED_POINT | ||||
| #define WORD "%d" | ||||
| #else | ||||
| #define WORD "%f" | ||||
| #endif | ||||
| 
 | ||||
| int ret = 0; | ||||
| 
 | ||||
| void testdiv(void) | ||||
| { | ||||
|    opus_int32 i; | ||||
|    for (i=1;i<=327670;i++) | ||||
|    { | ||||
|       double prod; | ||||
|       opus_val32 val; | ||||
|       val = celt_rcp(i); | ||||
| #ifdef FIXED_POINT | ||||
|       prod = (1./32768./65526.)*val*i; | ||||
| #else | ||||
|       prod = val*i; | ||||
| #endif | ||||
|       if (fabs(prod-1) > .00025) | ||||
|       { | ||||
|          fprintf (stderr, "div failed: 1/%d="WORD" (product = %f)\n", i, val, prod); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| void testsqrt(void) | ||||
| { | ||||
|    opus_int32 i; | ||||
|    for (i=1;i<=1000000000;i++) | ||||
|    { | ||||
|       double ratio; | ||||
|       opus_val16 val; | ||||
|       val = celt_sqrt(i); | ||||
|       ratio = val/sqrt(i); | ||||
|       if (fabs(ratio - 1) > .0005 && fabs(val-sqrt(i)) > 2) | ||||
|       { | ||||
|          fprintf (stderr, "sqrt failed: sqrt(%d)="WORD" (ratio = %f)\n", i, val, ratio); | ||||
|          ret = 1; | ||||
|       } | ||||
|       i+= i>>10; | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| void testbitexactcos(void) | ||||
| { | ||||
|    int i; | ||||
|    opus_int32 min_d,max_d,last,chk; | ||||
|    chk=max_d=0; | ||||
|    last=min_d=32767; | ||||
|    for(i=64;i<=16320;i++) | ||||
|    { | ||||
|       opus_int32 d; | ||||
|       opus_int32 q=bitexact_cos(i); | ||||
|       chk ^= q*i; | ||||
|       d = last - q; | ||||
|       if (d>max_d)max_d=d; | ||||
|       if (d<min_d)min_d=d; | ||||
|       last = q; | ||||
|    } | ||||
|    if ((chk!=89408644)||(max_d!=5)||(min_d!=0)||(bitexact_cos(64)!=32767)|| | ||||
|        (bitexact_cos(16320)!=200)||(bitexact_cos(8192)!=23171)) | ||||
|    { | ||||
|       fprintf (stderr, "bitexact_cos failed\n"); | ||||
|       ret = 1; | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| void testbitexactlog2tan(void) | ||||
| { | ||||
|    int i,fail; | ||||
|    opus_int32 min_d,max_d,last,chk; | ||||
|    fail=chk=max_d=0; | ||||
|    last=min_d=15059; | ||||
|    for(i=64;i<8193;i++) | ||||
|    { | ||||
|       opus_int32 d; | ||||
|       opus_int32 mid=bitexact_cos(i); | ||||
|       opus_int32 side=bitexact_cos(16384-i); | ||||
|       opus_int32 q=bitexact_log2tan(mid,side); | ||||
|       chk ^= q*i; | ||||
|       d = last - q; | ||||
|       if (q!=-1*bitexact_log2tan(side,mid)) | ||||
|         fail = 1; | ||||
|       if (d>max_d)max_d=d; | ||||
|       if (d<min_d)min_d=d; | ||||
|       last = q; | ||||
|    } | ||||
|    if ((chk!=15821257)||(max_d!=61)||(min_d!=-2)||fail|| | ||||
|        (bitexact_log2tan(32767,200)!=15059)||(bitexact_log2tan(30274,12540)!=2611)|| | ||||
|        (bitexact_log2tan(23171,23171)!=0)) | ||||
|    { | ||||
|       fprintf (stderr, "bitexact_log2tan failed\n"); | ||||
|       ret = 1; | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| #ifndef FIXED_POINT | ||||
| void testlog2(void) | ||||
| { | ||||
|    float x; | ||||
|    for (x=0.001;x<1677700.0;x+=(x/8.0)) | ||||
|    { | ||||
|       float error = fabs((1.442695040888963387*log(x))-celt_log2(x)); | ||||
|       if (error>0.0009) | ||||
|       { | ||||
|          fprintf (stderr, "celt_log2 failed: fabs((1.442695040888963387*log(x))-celt_log2(x))>0.001 (x = %f, error = %f)\n", x,error); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| void testexp2(void) | ||||
| { | ||||
|    float x; | ||||
|    for (x=-11.0;x<24.0;x+=0.0007) | ||||
|    { | ||||
|       float error = fabs(x-(1.442695040888963387*log(celt_exp2(x)))); | ||||
|       if (error>0.0002) | ||||
|       { | ||||
|          fprintf (stderr, "celt_exp2 failed: fabs(x-(1.442695040888963387*log(celt_exp2(x))))>0.0005 (x = %f, error = %f)\n", x,error); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| void testexp2log2(void) | ||||
| { | ||||
|    float x; | ||||
|    for (x=-11.0;x<24.0;x+=0.0007) | ||||
|    { | ||||
|       float error = fabs(x-(celt_log2(celt_exp2(x)))); | ||||
|       if (error>0.001) | ||||
|       { | ||||
|          fprintf (stderr, "celt_log2/celt_exp2 failed: fabs(x-(celt_log2(celt_exp2(x))))>0.001 (x = %f, error = %f)\n", x,error); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| #else | ||||
| void testlog2(void) | ||||
| { | ||||
|    opus_val32 x; | ||||
|    for (x=8;x<1073741824;x+=(x>>3)) | ||||
|    { | ||||
|       float error = fabs((1.442695040888963387*log(x/16384.0))-celt_log2(x)/1024.0); | ||||
|       if (error>0.003) | ||||
|       { | ||||
|          fprintf (stderr, "celt_log2 failed: x = %ld, error = %f\n", (long)x,error); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| void testexp2(void) | ||||
| { | ||||
|    opus_val16 x; | ||||
|    for (x=-32768;x<15360;x++) | ||||
|    { | ||||
|       float error1 = fabs(x/1024.0-(1.442695040888963387*log(celt_exp2(x)/65536.0))); | ||||
|       float error2 = fabs(exp(0.6931471805599453094*x/1024.0)-celt_exp2(x)/65536.0); | ||||
|       if (error1>0.0002&&error2>0.00004) | ||||
|       { | ||||
|          fprintf (stderr, "celt_exp2 failed: x = "WORD", error1 = %f, error2 = %f\n", x,error1,error2); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| void testexp2log2(void) | ||||
| { | ||||
|    opus_val32 x; | ||||
|    for (x=8;x<65536;x+=(x>>3)) | ||||
|    { | ||||
|       float error = fabs(x-0.25*celt_exp2(celt_log2(x)))/16384; | ||||
|       if (error>0.004) | ||||
|       { | ||||
|          fprintf (stderr, "celt_log2/celt_exp2 failed: fabs(x-(celt_exp2(celt_log2(x))))>0.001 (x = %ld, error = %f)\n", (long)x,error); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| void testilog2(void) | ||||
| { | ||||
|    opus_val32 x; | ||||
|    for (x=1;x<=268435455;x+=127) | ||||
|    { | ||||
|       opus_val32 lg; | ||||
|       opus_val32 y; | ||||
| 
 | ||||
|       lg = celt_ilog2(x); | ||||
|       if (lg<0 || lg>=31) | ||||
|       { | ||||
|          printf("celt_ilog2 failed: 0<=celt_ilog2(x)<31 (x = %d, celt_ilog2(x) = %d)\n",x,lg); | ||||
|          ret = 1; | ||||
|       } | ||||
|       y = 1<<lg; | ||||
| 
 | ||||
|       if (x<y || (x>>1)>=y) | ||||
|       { | ||||
|          printf("celt_ilog2 failed: 2**celt_ilog2(x)<=x<2**(celt_ilog2(x)+1) (x = %d, 2**celt_ilog2(x) = %d)\n",x,y); | ||||
|          ret = 1; | ||||
|       } | ||||
|    } | ||||
| } | ||||
| #endif | ||||
| 
 | ||||
| int main(void) | ||||
| { | ||||
|    testbitexactcos(); | ||||
|    testbitexactlog2tan(); | ||||
|    testdiv(); | ||||
|    testsqrt(); | ||||
|    testlog2(); | ||||
|    testexp2(); | ||||
|    testexp2log2(); | ||||
| #ifdef FIXED_POINT | ||||
|    testilog2(); | ||||
| #endif | ||||
|    return ret; | ||||
| } | ||||
							
								
								
									
										227
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_mdct.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										227
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_mdct.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,227 @@ | |||
| /* Copyright (c) 2008-2011 Xiph.Org Foundation
 | ||||
|    Written by Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <stdio.h> | ||||
| 
 | ||||
| #include "mdct.h" | ||||
| #include "stack_alloc.h" | ||||
| #include "kiss_fft.h" | ||||
| #include "mdct.h" | ||||
| #include "modes.h" | ||||
| 
 | ||||
| #ifndef M_PI | ||||
| #define M_PI 3.141592653 | ||||
| #endif | ||||
| 
 | ||||
| int ret = 0; | ||||
| void check(kiss_fft_scalar  * in,kiss_fft_scalar  * out,int nfft,int isinverse) | ||||
| { | ||||
|     int bin,k; | ||||
|     double errpow=0,sigpow=0; | ||||
|     double snr; | ||||
|     for (bin=0;bin<nfft/2;++bin) { | ||||
|         double ansr = 0; | ||||
|         double difr; | ||||
| 
 | ||||
|         for (k=0;k<nfft;++k) { | ||||
|            double phase = 2*M_PI*(k+.5+.25*nfft)*(bin+.5)/nfft; | ||||
|            double re = cos(phase); | ||||
| 
 | ||||
|            re /= nfft/4; | ||||
| 
 | ||||
|            ansr += in[k] * re; | ||||
|         } | ||||
|         /*printf ("%f %f\n", ansr, out[bin]);*/ | ||||
|         difr = ansr - out[bin]; | ||||
|         errpow += difr*difr; | ||||
|         sigpow += ansr*ansr; | ||||
|     } | ||||
|     snr = 10*log10(sigpow/errpow); | ||||
|     printf("nfft=%d inverse=%d,snr = %f\n",nfft,isinverse,snr ); | ||||
|     if (snr<60) { | ||||
|        printf( "** poor snr: %f **\n", snr); | ||||
|        ret = 1; | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| void check_inv(kiss_fft_scalar  * in,kiss_fft_scalar  * out,int nfft,int isinverse) | ||||
| { | ||||
|    int bin,k; | ||||
|    double errpow=0,sigpow=0; | ||||
|    double snr; | ||||
|    for (bin=0;bin<nfft;++bin) { | ||||
|       double ansr = 0; | ||||
|       double difr; | ||||
| 
 | ||||
|       for (k=0;k<nfft/2;++k) { | ||||
|          double phase = 2*M_PI*(bin+.5+.25*nfft)*(k+.5)/nfft; | ||||
|          double re = cos(phase); | ||||
| 
 | ||||
|          /*re *= 2;*/ | ||||
| 
 | ||||
|          ansr += in[k] * re; | ||||
|       } | ||||
|       /*printf ("%f %f\n", ansr, out[bin]);*/ | ||||
|       difr = ansr - out[bin]; | ||||
|       errpow += difr*difr; | ||||
|       sigpow += ansr*ansr; | ||||
|    } | ||||
|    snr = 10*log10(sigpow/errpow); | ||||
|    printf("nfft=%d inverse=%d,snr = %f\n",nfft,isinverse,snr ); | ||||
|    if (snr<60) { | ||||
|       printf( "** poor snr: %f **\n", snr); | ||||
|       ret = 1; | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| 
 | ||||
| void test1d(int nfft,int isinverse,int arch) | ||||
| { | ||||
|     size_t buflen = sizeof(kiss_fft_scalar)*nfft; | ||||
|     kiss_fft_scalar *in; | ||||
|     kiss_fft_scalar *in_copy; | ||||
|     kiss_fft_scalar *out; | ||||
|     opus_val16 *window; | ||||
|     int k; | ||||
| 
 | ||||
| #ifdef CUSTOM_MODES | ||||
|     int shift = 0; | ||||
|     const mdct_lookup *cfg; | ||||
|     mdct_lookup _cfg; | ||||
|     clt_mdct_init(&_cfg, nfft, 0, arch); | ||||
|     cfg = &_cfg; | ||||
| #else | ||||
|     int shift; | ||||
|     const mdct_lookup *cfg; | ||||
|     CELTMode *mode = opus_custom_mode_create(48000, 960, NULL); | ||||
|     if (nfft == 1920) shift = 0; | ||||
|     else if (nfft == 960) shift = 1; | ||||
|     else if (nfft == 480) shift = 2; | ||||
|     else if (nfft == 240) shift = 3; | ||||
|     else return; | ||||
|     cfg = &mode->mdct; | ||||
| #endif | ||||
| 
 | ||||
|     in = (kiss_fft_scalar*)malloc(buflen); | ||||
|     in_copy = (kiss_fft_scalar*)malloc(buflen); | ||||
|     out = (kiss_fft_scalar*)malloc(buflen); | ||||
|     window = (opus_val16*)malloc(sizeof(opus_val16)*nfft/2); | ||||
| 
 | ||||
|     for (k=0;k<nfft;++k) { | ||||
|         in[k] = (rand() % 32768) - 16384; | ||||
|     } | ||||
| 
 | ||||
|     for (k=0;k<nfft/2;++k) { | ||||
|        window[k] = Q15ONE; | ||||
|     } | ||||
|     for (k=0;k<nfft;++k) { | ||||
|        in[k] *= 32768; | ||||
|     } | ||||
| 
 | ||||
|     if (isinverse) | ||||
|     { | ||||
|        for (k=0;k<nfft;++k) { | ||||
|           in[k] /= nfft; | ||||
|        } | ||||
|     } | ||||
| 
 | ||||
|     for (k=0;k<nfft;++k) | ||||
|        in_copy[k] = in[k]; | ||||
|     /*for (k=0;k<nfft;++k) printf("%d %d ", in[k].r, in[k].i);printf("\n");*/ | ||||
| 
 | ||||
|     if (isinverse) | ||||
|     { | ||||
|        for (k=0;k<nfft;++k) | ||||
|           out[k] = 0; | ||||
|        clt_mdct_backward(cfg,in,out, window, nfft/2, shift, 1, arch); | ||||
|        /* apply TDAC because clt_mdct_backward() no longer does that */ | ||||
|        for (k=0;k<nfft/4;++k) | ||||
|           out[nfft-k-1] = out[nfft/2+k]; | ||||
|        check_inv(in,out,nfft,isinverse); | ||||
|     } else { | ||||
|        clt_mdct_forward(cfg,in,out,window, nfft/2, shift, 1, arch); | ||||
|        check(in_copy,out,nfft,isinverse); | ||||
|     } | ||||
|     /*for (k=0;k<nfft;++k) printf("%d %d ", out[k].r, out[k].i);printf("\n");*/ | ||||
| 
 | ||||
| 
 | ||||
|     free(in); | ||||
|     free(in_copy); | ||||
|     free(out); | ||||
|     free(window); | ||||
| #ifdef CUSTOM_MODES | ||||
|     clt_mdct_clear(&_cfg, arch); | ||||
| #endif | ||||
| } | ||||
| 
 | ||||
| int main(int argc,char ** argv) | ||||
| { | ||||
|     ALLOC_STACK; | ||||
|     int arch = opus_select_arch(); | ||||
| 
 | ||||
|     if (argc>1) { | ||||
|         int k; | ||||
|         for (k=1;k<argc;++k) { | ||||
|             test1d(atoi(argv[k]),0,arch); | ||||
|             test1d(atoi(argv[k]),1,arch); | ||||
|         } | ||||
|     }else{ | ||||
|         test1d(32,0,arch); | ||||
|         test1d(32,1,arch); | ||||
|         test1d(256,0,arch); | ||||
|         test1d(256,1,arch); | ||||
|         test1d(512,0,arch); | ||||
|         test1d(512,1,arch); | ||||
|         test1d(1024,0,arch); | ||||
|         test1d(1024,1,arch); | ||||
|         test1d(2048,0,arch); | ||||
|         test1d(2048,1,arch); | ||||
| #ifndef RADIX_TWO_ONLY | ||||
|         test1d(36,0,arch); | ||||
|         test1d(36,1,arch); | ||||
|         test1d(40,0,arch); | ||||
|         test1d(40,1,arch); | ||||
|         test1d(60,0,arch); | ||||
|         test1d(60,1,arch); | ||||
|         test1d(120,0,arch); | ||||
|         test1d(120,1,arch); | ||||
|         test1d(240,0,arch); | ||||
|         test1d(240,1,arch); | ||||
|         test1d(480,0,arch); | ||||
|         test1d(480,1,arch); | ||||
|         test1d(960,0,arch); | ||||
|         test1d(960,1,arch); | ||||
|         test1d(1920,0,arch); | ||||
|         test1d(1920,1,arch); | ||||
| #endif | ||||
|     } | ||||
|     return ret; | ||||
| } | ||||
							
								
								
									
										86
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_rotation.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										86
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_rotation.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,86 @@ | |||
| /* Copyright (c) 2008-2011 Xiph.Org Foundation
 | ||||
|    Written by Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #ifndef CUSTOM_MODES | ||||
| #define CUSTOM_MODES | ||||
| #endif | ||||
| 
 | ||||
| #include <stdio.h> | ||||
| #include <stdlib.h> | ||||
| #include "vq.h" | ||||
| #include "bands.h" | ||||
| #include "stack_alloc.h" | ||||
| #include <math.h> | ||||
| 
 | ||||
| 
 | ||||
| #define MAX_SIZE 100 | ||||
| 
 | ||||
| int ret=0; | ||||
| void test_rotation(int N, int K) | ||||
| { | ||||
|    int i; | ||||
|    double err = 0, ener = 0, snr, snr0; | ||||
|    opus_val16 x0[MAX_SIZE]; | ||||
|    opus_val16 x1[MAX_SIZE]; | ||||
|    for (i=0;i<N;i++) | ||||
|       x1[i] = x0[i] = rand()%32767-16384; | ||||
|    exp_rotation(x1, N, 1, 1, K, SPREAD_NORMAL); | ||||
|    for (i=0;i<N;i++) | ||||
|    { | ||||
|       err += (x0[i]-(double)x1[i])*(x0[i]-(double)x1[i]); | ||||
|       ener += x0[i]*(double)x0[i]; | ||||
|    } | ||||
|    snr0 = 20*log10(ener/err); | ||||
|    err = ener = 0; | ||||
|    exp_rotation(x1, N, -1, 1, K, SPREAD_NORMAL); | ||||
|    for (i=0;i<N;i++) | ||||
|    { | ||||
|       err += (x0[i]-(double)x1[i])*(x0[i]-(double)x1[i]); | ||||
|       ener += x0[i]*(double)x0[i]; | ||||
|    } | ||||
|    snr = 20*log10(ener/err); | ||||
|    printf ("SNR for size %d (%d pulses) is %f (was %f without inverse)\n", N, K, snr, snr0); | ||||
|    if (snr < 60 || snr0 > 20) | ||||
|    { | ||||
|       fprintf(stderr, "FAIL!\n"); | ||||
|       ret = 1; | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| int main(void) | ||||
| { | ||||
|    ALLOC_STACK; | ||||
|    test_rotation(15, 3); | ||||
|    test_rotation(23, 5); | ||||
|    test_rotation(50, 3); | ||||
|    test_rotation(80, 1); | ||||
|    return ret; | ||||
| } | ||||
							
								
								
									
										50
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_types.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										50
									
								
								lib/rbcodec/codecs/libopus/celt/tests/test_unit_types.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,50 @@ | |||
| /* Copyright (c) 2008-2011 Xiph.Org Foundation
 | ||||
|    Written by Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include "opus_types.h" | ||||
| #include <stdio.h> | ||||
| 
 | ||||
| int main(void) | ||||
| { | ||||
|    opus_int16 i = 1; | ||||
|    i <<= 14; | ||||
|    if (i>>14 != 1) | ||||
|    { | ||||
|       fprintf(stderr, "opus_int16 isn't 16 bits\n"); | ||||
|       return 1; | ||||
|    } | ||||
|    if (sizeof(opus_int16)*2 != sizeof(opus_int32)) | ||||
|    { | ||||
|       fprintf(stderr, "16*2 != 32\n"); | ||||
|       return 1; | ||||
|    } | ||||
|    return 0; | ||||
| } | ||||
|  | @ -39,10 +39,6 @@ | |||
| #include "rate.h" | ||||
| #include "pitch.h" | ||||
| 
 | ||||
| #if defined(MIPSr1_ASM) | ||||
| #include "mips/vq_mipsr1.h" | ||||
| #endif | ||||
| 
 | ||||
| #ifndef OVERRIDE_vq_exp_rotation1 | ||||
| static void exp_rotation1(celt_norm *X, int len, int stride, opus_val16 c, opus_val16 s) | ||||
| { | ||||
|  | @ -71,7 +67,7 @@ static void exp_rotation1(celt_norm *X, int len, int stride, opus_val16 c, opus_ | |||
| } | ||||
| #endif /* OVERRIDE_vq_exp_rotation1 */ | ||||
| 
 | ||||
| static void exp_rotation(celt_norm *X, int len, int dir, int stride, int K, int spread) | ||||
| void exp_rotation(celt_norm *X, int len, int dir, int stride, int K, int spread) | ||||
| { | ||||
|    static const int SPREAD_FACTOR[3]={15,10,5}; | ||||
|    int i; | ||||
|  | @ -162,42 +158,27 @@ static unsigned extract_collapse_mask(int *iy, int N, int B) | |||
|    return collapse_mask; | ||||
| } | ||||
| 
 | ||||
| unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc | ||||
| #ifdef RESYNTH | ||||
|    , opus_val16 gain | ||||
| #endif | ||||
|    ) | ||||
| opus_val16 op_pvq_search_c(celt_norm *X, int *iy, int K, int N, int arch) | ||||
| { | ||||
|    VARDECL(celt_norm, y); | ||||
|    VARDECL(int, iy); | ||||
|    VARDECL(opus_val16, signx); | ||||
|    VARDECL(int, signx); | ||||
|    int i, j; | ||||
|    opus_val16 s; | ||||
|    int pulsesLeft; | ||||
|    opus_val32 sum; | ||||
|    opus_val32 xy; | ||||
|    opus_val16 yy; | ||||
|    unsigned collapse_mask; | ||||
|    SAVE_STACK; | ||||
| 
 | ||||
|    celt_assert2(K>0, "alg_quant() needs at least one pulse"); | ||||
|    celt_assert2(N>1, "alg_quant() needs at least two dimensions"); | ||||
| 
 | ||||
|    (void)arch; | ||||
|    ALLOC(y, N, celt_norm); | ||||
|    ALLOC(iy, N, int); | ||||
|    ALLOC(signx, N, opus_val16); | ||||
| 
 | ||||
|    exp_rotation(X, N, 1, B, K, spread); | ||||
|    ALLOC(signx, N, int); | ||||
| 
 | ||||
|    /* Get rid of the sign */ | ||||
|    sum = 0; | ||||
|    j=0; do { | ||||
|       if (X[j]>0) | ||||
|          signx[j]=1; | ||||
|       else { | ||||
|          signx[j]=-1; | ||||
|          X[j]=-X[j]; | ||||
|       } | ||||
|       signx[j] = X[j]<0; | ||||
|       /* OPT: Make sure the compiler doesn't use a branch on ABS16(). */ | ||||
|       X[j] = ABS16(X[j]); | ||||
|       iy[j] = 0; | ||||
|       y[j] = 0; | ||||
|    } while (++j<N); | ||||
|  | @ -229,7 +210,12 @@ unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc | |||
|          while (++j<N); | ||||
|          sum = QCONST16(1.f,14); | ||||
|       } | ||||
|       rcp = EXTRACT16(MULT16_32_Q16(K-1, celt_rcp(sum))); | ||||
| #ifdef FIXED_POINT | ||||
|       rcp = EXTRACT16(MULT16_32_Q16(K, celt_rcp(sum))); | ||||
| #else | ||||
|       /* Using K+e with e < 1 guarantees we cannot get more than K pulses. */ | ||||
|       rcp = EXTRACT16(MULT16_32_Q16(K+0.8f, celt_rcp(sum))); | ||||
| #endif | ||||
|       j=0; do { | ||||
| #ifdef FIXED_POINT | ||||
|          /* It's really important to round *towards zero* here */ | ||||
|  | @ -244,12 +230,12 @@ unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc | |||
|          pulsesLeft -= iy[j]; | ||||
|       }  while (++j<N); | ||||
|    } | ||||
|    celt_assert2(pulsesLeft>=1, "Allocated too many pulses in the quick pass"); | ||||
|    celt_sig_assert(pulsesLeft>=0); | ||||
| 
 | ||||
|    /* This should never happen, but just in case it does (e.g. on silence)
 | ||||
|       we fill the first bin with pulses. */ | ||||
| #ifdef FIXED_POINT_DEBUG | ||||
|    celt_assert2(pulsesLeft<=N+3, "Not enough pulses in the quick pass"); | ||||
|    celt_sig_assert(pulsesLeft<=N+3); | ||||
| #endif | ||||
|    if (pulsesLeft > N+3) | ||||
|    { | ||||
|  | @ -260,12 +246,12 @@ unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc | |||
|       pulsesLeft=0; | ||||
|    } | ||||
| 
 | ||||
|    s = 1; | ||||
|    for (i=0;i<pulsesLeft;i++) | ||||
|    { | ||||
|       opus_val16 Rxy, Ryy; | ||||
|       int best_id; | ||||
|       opus_val32 best_num = -VERY_LARGE16; | ||||
|       opus_val16 best_den = 0; | ||||
|       opus_val32 best_num; | ||||
|       opus_val16 best_den; | ||||
| #ifdef FIXED_POINT | ||||
|       int rshift; | ||||
| #endif | ||||
|  | @ -275,10 +261,23 @@ unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc | |||
|       best_id = 0; | ||||
|       /* The squared magnitude term gets added anyway, so we might as well
 | ||||
|          add it outside the loop */ | ||||
|       yy = ADD32(yy, 1); | ||||
|       j=0; | ||||
|       yy = ADD16(yy, 1); | ||||
| 
 | ||||
|       /* Calculations for position 0 are out of the loop, in part to reduce
 | ||||
|          mispredicted branches (since the if condition is usually false) | ||||
|          in the loop. */ | ||||
|       /* Temporary sums of the new pulse(s) */ | ||||
|       Rxy = EXTRACT16(SHR32(ADD32(xy, EXTEND32(X[0])),rshift)); | ||||
|       /* We're multiplying y[j] by two so we don't have to do it here */ | ||||
|       Ryy = ADD16(yy, y[0]); | ||||
| 
 | ||||
|       /* Approximate score: we maximise Rxy/sqrt(Ryy) (we're guaranteed that
 | ||||
|          Rxy is positive because the sign is pre-computed) */ | ||||
|       Rxy = MULT16_16_Q15(Rxy,Rxy); | ||||
|       best_den = Ryy; | ||||
|       best_num = Rxy; | ||||
|       j=1; | ||||
|       do { | ||||
|          opus_val16 Rxy, Ryy; | ||||
|          /* Temporary sums of the new pulse(s) */ | ||||
|          Rxy = EXTRACT16(SHR32(ADD32(xy, EXTEND32(X[j])),rshift)); | ||||
|          /* We're multiplying y[j] by two so we don't have to do it here */ | ||||
|  | @ -289,8 +288,11 @@ unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc | |||
|          Rxy = MULT16_16_Q15(Rxy,Rxy); | ||||
|          /* The idea is to check for num/den >= best_num/best_den, but that way
 | ||||
|             we can do it without any division */ | ||||
|          /* OPT: Make sure to use conditional moves here */ | ||||
|          if (MULT16_16(best_den, Rxy) > MULT16_16(Ryy, best_num)) | ||||
|          /* OPT: It's not clear whether a cmov is faster than a branch here
 | ||||
|             since the condition is more often false than true and using | ||||
|             a cmov introduces data dependencies across iterations. The optimal | ||||
|             choice may be architecture-dependent. */ | ||||
|          if (opus_unlikely(MULT16_16(best_den, Rxy) > MULT16_16(Ryy, best_num))) | ||||
|          { | ||||
|             best_den = Ryy; | ||||
|             best_num = Rxy; | ||||
|  | @ -305,23 +307,47 @@ unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc | |||
| 
 | ||||
|       /* Only now that we've made the final choice, update y/iy */ | ||||
|       /* Multiplying y[j] by 2 so we don't have to do it everywhere else */ | ||||
|       y[best_id] += 2*s; | ||||
|       y[best_id] += 2; | ||||
|       iy[best_id]++; | ||||
|    } | ||||
| 
 | ||||
|    /* Put the original sign back */ | ||||
|    j=0; | ||||
|    do { | ||||
|       X[j] = MULT16_16(signx[j],X[j]); | ||||
|       if (signx[j] < 0) | ||||
|          iy[j] = -iy[j]; | ||||
|       /*iy[j] = signx[j] ? -iy[j] : iy[j];*/ | ||||
|       /* OPT: The is more likely to be compiled without a branch than the code above
 | ||||
|          but has the same performance otherwise. */ | ||||
|       iy[j] = (iy[j]^-signx[j]) + signx[j]; | ||||
|    } while (++j<N); | ||||
|    RESTORE_STACK; | ||||
|    return yy; | ||||
| } | ||||
| 
 | ||||
| unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc, | ||||
|       opus_val16 gain, int resynth, int arch) | ||||
| { | ||||
|    VARDECL(int, iy); | ||||
|    opus_val16 yy; | ||||
|    unsigned collapse_mask; | ||||
|    SAVE_STACK; | ||||
| 
 | ||||
|    celt_assert2(K>0, "alg_quant() needs at least one pulse"); | ||||
|    celt_assert2(N>1, "alg_quant() needs at least two dimensions"); | ||||
| 
 | ||||
|    /* Covers vectorization by up to 4. */ | ||||
|    ALLOC(iy, N+3, int); | ||||
| 
 | ||||
|    exp_rotation(X, N, 1, B, K, spread); | ||||
| 
 | ||||
|    yy = op_pvq_search(X, iy, K, N, arch); | ||||
| 
 | ||||
|    encode_pulses(iy, N, K, enc); | ||||
| 
 | ||||
| #ifdef RESYNTH | ||||
|    normalise_residual(iy, X, N, yy, gain); | ||||
|    exp_rotation(X, N, -1, B, K, spread); | ||||
| #endif | ||||
|    if (resynth) | ||||
|    { | ||||
|       normalise_residual(iy, X, N, yy, gain); | ||||
|       exp_rotation(X, N, -1, B, K, spread); | ||||
|    } | ||||
| 
 | ||||
|    collapse_mask = extract_collapse_mask(iy, N, B); | ||||
|    RESTORE_STACK; | ||||
|  | @ -350,7 +376,7 @@ unsigned alg_unquant(celt_norm *X, int N, int K, int spread, int B, | |||
| } | ||||
| 
 | ||||
| #ifndef OVERRIDE_renormalise_vector | ||||
| void renormalise_vector(celt_norm *X, int N, opus_val16 gain) | ||||
| void renormalise_vector(celt_norm *X, int N, opus_val16 gain, int arch) | ||||
| { | ||||
|    int i; | ||||
| #ifdef FIXED_POINT | ||||
|  | @ -360,7 +386,7 @@ void renormalise_vector(celt_norm *X, int N, opus_val16 gain) | |||
|    opus_val16 g; | ||||
|    opus_val32 t; | ||||
|    celt_norm *xptr; | ||||
|    E = EPSILON + celt_inner_prod(X, X, N); | ||||
|    E = EPSILON + celt_inner_prod(X, X, N, arch); | ||||
| #ifdef FIXED_POINT | ||||
|    k = celt_ilog2(E)>>1; | ||||
| #endif | ||||
|  | @ -377,7 +403,7 @@ void renormalise_vector(celt_norm *X, int N, opus_val16 gain) | |||
| } | ||||
| #endif /* OVERRIDE_renormalise_vector */ | ||||
| 
 | ||||
| int stereo_itheta(const celt_norm *X, const celt_norm *Y, int stereo, int N) | ||||
| int stereo_itheta(const celt_norm *X, const celt_norm *Y, int stereo, int N, int arch) | ||||
| { | ||||
|    int i; | ||||
|    int itheta; | ||||
|  | @ -396,8 +422,8 @@ int stereo_itheta(const celt_norm *X, const celt_norm *Y, int stereo, int N) | |||
|          Eside = MAC16_16(Eside, s, s); | ||||
|       } | ||||
|    } else { | ||||
|       Emid += celt_inner_prod(X, X, N); | ||||
|       Eside += celt_inner_prod(Y, Y, N); | ||||
|       Emid += celt_inner_prod(X, X, N, arch); | ||||
|       Eside += celt_inner_prod(Y, Y, N, arch); | ||||
|    } | ||||
|    mid = celt_sqrt(Emid); | ||||
|    side = celt_sqrt(Eside); | ||||
|  | @ -405,7 +431,7 @@ int stereo_itheta(const celt_norm *X, const celt_norm *Y, int stereo, int N) | |||
|    /* 0.63662 = 2/pi */ | ||||
|    itheta = MULT16_16_Q15(QCONST16(0.63662f,15),celt_atan2p(side, mid)); | ||||
| #else | ||||
|    itheta = (int)floor(.5f+16384*0.63662f*atan2(side,mid)); | ||||
|    itheta = (int)floor(.5f+16384*0.63662f*fast_atan2f(side,mid)); | ||||
| #endif | ||||
| 
 | ||||
|    return itheta; | ||||
|  |  | |||
|  | @ -37,6 +37,23 @@ | |||
| #include "entdec.h" | ||||
| #include "modes.h" | ||||
| 
 | ||||
| #if (defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(FIXED_POINT)) | ||||
| #include "x86/vq_sse.h" | ||||
| #endif | ||||
| 
 | ||||
| #if defined(MIPSr1_ASM) | ||||
| #include "mips/vq_mipsr1.h" | ||||
| #endif | ||||
| 
 | ||||
| void exp_rotation(celt_norm *X, int len, int dir, int stride, int K, int spread); | ||||
| 
 | ||||
| opus_val16 op_pvq_search_c(celt_norm *X, int *iy, int K, int N, int arch); | ||||
| 
 | ||||
| #if !defined(OVERRIDE_OP_PVQ_SEARCH) | ||||
| #define op_pvq_search(x, iy, K, N, arch) \ | ||||
|     (op_pvq_search_c(x, iy, K, N, arch)) | ||||
| #endif | ||||
| 
 | ||||
| /** Algebraic pulse-vector quantiser. The signal x is replaced by the sum of
 | ||||
|   * the pitch and a combination of pulses such that its norm is still equal | ||||
|   * to 1. This is the function that will typically require the most CPU. | ||||
|  | @ -46,12 +63,8 @@ | |||
|  * @param enc Entropy encoder state | ||||
|  * @ret A mask indicating which blocks in the band received pulses | ||||
| */ | ||||
| unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, | ||||
|       ec_enc *enc | ||||
| #ifdef RESYNTH | ||||
|       , opus_val16 gain | ||||
| #endif | ||||
|       ); | ||||
| unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, ec_enc *enc, | ||||
|       opus_val16 gain, int resynth, int arch); | ||||
| 
 | ||||
| /** Algebraic pulse decoder
 | ||||
|  * @param X Decoded normalised spectrum (returned) | ||||
|  | @ -63,8 +76,8 @@ unsigned alg_quant(celt_norm *X, int N, int K, int spread, int B, | |||
| unsigned alg_unquant(celt_norm *X, int N, int K, int spread, int B, | ||||
|       ec_dec *dec, opus_val16 gain); | ||||
| 
 | ||||
| void renormalise_vector(celt_norm *X, int N, opus_val16 gain); | ||||
| void renormalise_vector(celt_norm *X, int N, opus_val16 gain, int arch); | ||||
| 
 | ||||
| int stereo_itheta(const celt_norm *X, const celt_norm *Y, int stereo, int N); | ||||
| int stereo_itheta(const celt_norm *X, const celt_norm *Y, int stereo, int N, int arch); | ||||
| 
 | ||||
| #endif /* VQ_H */ | ||||
|  |  | |||
							
								
								
									
										66
									
								
								lib/rbcodec/codecs/libopus/celt/x86/celt_lpc_sse.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										66
									
								
								lib/rbcodec/codecs/libopus/celt/x86/celt_lpc_sse.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,66 @@ | |||
| /* Copyright (c) 2014, Cisco Systems, INC
 | ||||
|    Written by XiangMingZhu WeiZhou MinPeng YanWang | ||||
| 
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef CELT_LPC_SSE_H | ||||
| #define CELT_LPC_SSE_H | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE4_1) && defined(FIXED_POINT) | ||||
| #define OVERRIDE_CELT_FIR | ||||
| 
 | ||||
| void celt_fir_sse4_1( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *num, | ||||
|          opus_val16 *y, | ||||
|          int N, | ||||
|          int ord, | ||||
|          int arch); | ||||
| 
 | ||||
| #if defined(OPUS_X86_PRESUME_SSE4_1) | ||||
| #define celt_fir(x, num, y, N, ord, arch) \ | ||||
|     ((void)arch, celt_fir_sse4_1(x, num, y, N, ord, arch)) | ||||
| 
 | ||||
| #else | ||||
| 
 | ||||
| extern void (*const CELT_FIR_IMPL[OPUS_ARCHMASK + 1])( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *num, | ||||
|          opus_val16 *y, | ||||
|          int N, | ||||
|          int ord, | ||||
|          int arch); | ||||
| 
 | ||||
| #  define celt_fir(x, num, y, N, ord, arch) \ | ||||
|     ((*CELT_FIR_IMPL[(arch) & OPUS_ARCHMASK])(x, num, y, N, ord, arch)) | ||||
| 
 | ||||
| #endif | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										89
									
								
								lib/rbcodec/codecs/libopus/celt/x86/celt_lpc_sse4_1.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										89
									
								
								lib/rbcodec/codecs/libopus/celt/x86/celt_lpc_sse4_1.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,89 @@ | |||
| /* Copyright (c) 2014, Cisco Systems, INC
 | ||||
|    Written by XiangMingZhu WeiZhou MinPeng YanWang | ||||
| 
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <xmmintrin.h> | ||||
| #include <emmintrin.h> | ||||
| #include <smmintrin.h> | ||||
| #include "celt_lpc.h" | ||||
| #include "stack_alloc.h" | ||||
| #include "mathops.h" | ||||
| #include "pitch.h" | ||||
| #include "x86cpu.h" | ||||
| 
 | ||||
| #if defined(FIXED_POINT) | ||||
| 
 | ||||
| void celt_fir_sse4_1(const opus_val16 *x, | ||||
|          const opus_val16 *num, | ||||
|          opus_val16 *y, | ||||
|          int N, | ||||
|          int ord, | ||||
|          int arch) | ||||
| { | ||||
|     int i,j; | ||||
|     VARDECL(opus_val16, rnum); | ||||
| 
 | ||||
|     __m128i vecNoA; | ||||
|     opus_int32 noA ; | ||||
|     SAVE_STACK; | ||||
| 
 | ||||
|    ALLOC(rnum, ord, opus_val16); | ||||
|    for(i=0;i<ord;i++) | ||||
|       rnum[i] = num[ord-i-1]; | ||||
|    noA = EXTEND32(1) << SIG_SHIFT >> 1; | ||||
|    vecNoA = _mm_set_epi32(noA, noA, noA, noA); | ||||
| 
 | ||||
|    for (i=0;i<N-3;i+=4) | ||||
|    { | ||||
|       opus_val32 sums[4] = {0}; | ||||
|       __m128i vecSum, vecX; | ||||
| 
 | ||||
|       xcorr_kernel(rnum, x+i-ord, sums, ord, arch); | ||||
| 
 | ||||
|       vecSum = _mm_loadu_si128((__m128i *)sums); | ||||
|       vecSum = _mm_add_epi32(vecSum, vecNoA); | ||||
|       vecSum = _mm_srai_epi32(vecSum, SIG_SHIFT); | ||||
|       vecX = OP_CVTEPI16_EPI32_M64(x + i); | ||||
|       vecSum = _mm_add_epi32(vecSum, vecX); | ||||
|       vecSum = _mm_packs_epi32(vecSum, vecSum); | ||||
|       _mm_storel_epi64((__m128i *)(y + i), vecSum); | ||||
|    } | ||||
|    for (;i<N;i++) | ||||
|    { | ||||
|       opus_val32 sum = 0; | ||||
|       for (j=0;j<ord;j++) | ||||
|          sum = MAC16_16(sum, rnum[j], x[i+j-ord]); | ||||
|       y[i] = SATURATE16(ADD32(EXTEND32(x[i]), PSHR32(sum, SIG_SHIFT))); | ||||
|    } | ||||
| 
 | ||||
|    RESTORE_STACK; | ||||
| } | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										185
									
								
								lib/rbcodec/codecs/libopus/celt/x86/pitch_sse.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										185
									
								
								lib/rbcodec/codecs/libopus/celt/x86/pitch_sse.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,185 @@ | |||
| /* Copyright (c) 2014, Cisco Systems, INC
 | ||||
|    Written by XiangMingZhu WeiZhou MinPeng YanWang | ||||
| 
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include "macros.h" | ||||
| #include "celt_lpc.h" | ||||
| #include "stack_alloc.h" | ||||
| #include "mathops.h" | ||||
| #include "pitch.h" | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE) && !defined(FIXED_POINT) | ||||
| 
 | ||||
| #include <xmmintrin.h> | ||||
| #include "arch.h" | ||||
| 
 | ||||
| void xcorr_kernel_sse(const opus_val16 *x, const opus_val16 *y, opus_val32 sum[4], int len) | ||||
| { | ||||
|    int j; | ||||
|    __m128 xsum1, xsum2; | ||||
|    xsum1 = _mm_loadu_ps(sum); | ||||
|    xsum2 = _mm_setzero_ps(); | ||||
| 
 | ||||
|    for (j = 0; j < len-3; j += 4) | ||||
|    { | ||||
|       __m128 x0 = _mm_loadu_ps(x+j); | ||||
|       __m128 yj = _mm_loadu_ps(y+j); | ||||
|       __m128 y3 = _mm_loadu_ps(y+j+3); | ||||
| 
 | ||||
|       xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(_mm_shuffle_ps(x0,x0,0x00),yj)); | ||||
|       xsum2 = _mm_add_ps(xsum2,_mm_mul_ps(_mm_shuffle_ps(x0,x0,0x55), | ||||
|                                           _mm_shuffle_ps(yj,y3,0x49))); | ||||
|       xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(_mm_shuffle_ps(x0,x0,0xaa), | ||||
|                                           _mm_shuffle_ps(yj,y3,0x9e))); | ||||
|       xsum2 = _mm_add_ps(xsum2,_mm_mul_ps(_mm_shuffle_ps(x0,x0,0xff),y3)); | ||||
|    } | ||||
|    if (j < len) | ||||
|    { | ||||
|       xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); | ||||
|       if (++j < len) | ||||
|       { | ||||
|          xsum2 = _mm_add_ps(xsum2,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); | ||||
|          if (++j < len) | ||||
|          { | ||||
|             xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); | ||||
|          } | ||||
|       } | ||||
|    } | ||||
|    _mm_storeu_ps(sum,_mm_add_ps(xsum1,xsum2)); | ||||
| } | ||||
| 
 | ||||
| 
 | ||||
| void dual_inner_prod_sse(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02, | ||||
|       int N, opus_val32 *xy1, opus_val32 *xy2) | ||||
| { | ||||
|    int i; | ||||
|    __m128 xsum1, xsum2; | ||||
|    xsum1 = _mm_setzero_ps(); | ||||
|    xsum2 = _mm_setzero_ps(); | ||||
|    for (i=0;i<N-3;i+=4) | ||||
|    { | ||||
|       __m128 xi = _mm_loadu_ps(x+i); | ||||
|       __m128 y1i = _mm_loadu_ps(y01+i); | ||||
|       __m128 y2i = _mm_loadu_ps(y02+i); | ||||
|       xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(xi, y1i)); | ||||
|       xsum2 = _mm_add_ps(xsum2,_mm_mul_ps(xi, y2i)); | ||||
|    } | ||||
|    /* Horizontal sum */ | ||||
|    xsum1 = _mm_add_ps(xsum1, _mm_movehl_ps(xsum1, xsum1)); | ||||
|    xsum1 = _mm_add_ss(xsum1, _mm_shuffle_ps(xsum1, xsum1, 0x55)); | ||||
|    _mm_store_ss(xy1, xsum1); | ||||
|    xsum2 = _mm_add_ps(xsum2, _mm_movehl_ps(xsum2, xsum2)); | ||||
|    xsum2 = _mm_add_ss(xsum2, _mm_shuffle_ps(xsum2, xsum2, 0x55)); | ||||
|    _mm_store_ss(xy2, xsum2); | ||||
|    for (;i<N;i++) | ||||
|    { | ||||
|       *xy1 = MAC16_16(*xy1, x[i], y01[i]); | ||||
|       *xy2 = MAC16_16(*xy2, x[i], y02[i]); | ||||
|    } | ||||
| } | ||||
| 
 | ||||
| opus_val32 celt_inner_prod_sse(const opus_val16 *x, const opus_val16 *y, | ||||
|       int N) | ||||
| { | ||||
|    int i; | ||||
|    float xy; | ||||
|    __m128 sum; | ||||
|    sum = _mm_setzero_ps(); | ||||
|    /* FIXME: We should probably go 8-way and use 2 sums. */ | ||||
|    for (i=0;i<N-3;i+=4) | ||||
|    { | ||||
|       __m128 xi = _mm_loadu_ps(x+i); | ||||
|       __m128 yi = _mm_loadu_ps(y+i); | ||||
|       sum = _mm_add_ps(sum,_mm_mul_ps(xi, yi)); | ||||
|    } | ||||
|    /* Horizontal sum */ | ||||
|    sum = _mm_add_ps(sum, _mm_movehl_ps(sum, sum)); | ||||
|    sum = _mm_add_ss(sum, _mm_shuffle_ps(sum, sum, 0x55)); | ||||
|    _mm_store_ss(&xy, sum); | ||||
|    for (;i<N;i++) | ||||
|    { | ||||
|       xy = MAC16_16(xy, x[i], y[i]); | ||||
|    } | ||||
|    return xy; | ||||
| } | ||||
| 
 | ||||
| void comb_filter_const_sse(opus_val32 *y, opus_val32 *x, int T, int N, | ||||
|       opus_val16 g10, opus_val16 g11, opus_val16 g12) | ||||
| { | ||||
|    int i; | ||||
|    __m128 x0v; | ||||
|    __m128 g10v, g11v, g12v; | ||||
|    g10v = _mm_load1_ps(&g10); | ||||
|    g11v = _mm_load1_ps(&g11); | ||||
|    g12v = _mm_load1_ps(&g12); | ||||
|    x0v = _mm_loadu_ps(&x[-T-2]); | ||||
|    for (i=0;i<N-3;i+=4) | ||||
|    { | ||||
|       __m128 yi, yi2, x1v, x2v, x3v, x4v; | ||||
|       const opus_val32 *xp = &x[i-T-2]; | ||||
|       yi = _mm_loadu_ps(x+i); | ||||
|       x4v = _mm_loadu_ps(xp+4); | ||||
| #if 0 | ||||
|       /* Slower version with all loads */ | ||||
|       x1v = _mm_loadu_ps(xp+1); | ||||
|       x2v = _mm_loadu_ps(xp+2); | ||||
|       x3v = _mm_loadu_ps(xp+3); | ||||
| #else | ||||
|       x2v = _mm_shuffle_ps(x0v, x4v, 0x4e); | ||||
|       x1v = _mm_shuffle_ps(x0v, x2v, 0x99); | ||||
|       x3v = _mm_shuffle_ps(x2v, x4v, 0x99); | ||||
| #endif | ||||
| 
 | ||||
|       yi = _mm_add_ps(yi, _mm_mul_ps(g10v,x2v)); | ||||
| #if 0 /* Set to 1 to make it bit-exact with the non-SSE version */
 | ||||
|       yi = _mm_add_ps(yi, _mm_mul_ps(g11v,_mm_add_ps(x3v,x1v))); | ||||
|       yi = _mm_add_ps(yi, _mm_mul_ps(g12v,_mm_add_ps(x4v,x0v))); | ||||
| #else | ||||
|       /* Use partial sums */ | ||||
|       yi2 = _mm_add_ps(_mm_mul_ps(g11v,_mm_add_ps(x3v,x1v)), | ||||
|                        _mm_mul_ps(g12v,_mm_add_ps(x4v,x0v))); | ||||
|       yi = _mm_add_ps(yi, yi2); | ||||
| #endif | ||||
|       x0v=x4v; | ||||
|       _mm_storeu_ps(y+i, yi); | ||||
|    } | ||||
| #ifdef CUSTOM_MODES | ||||
|    for (;i<N;i++) | ||||
|    { | ||||
|       y[i] = x[i] | ||||
|                + MULT16_32_Q15(g10,x[i-T]) | ||||
|                + MULT16_32_Q15(g11,ADD32(x[i-T+1],x[i-T-1])) | ||||
|                + MULT16_32_Q15(g12,ADD32(x[i-T+2],x[i-T-2])); | ||||
|    } | ||||
| #endif | ||||
| } | ||||
| 
 | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										192
									
								
								lib/rbcodec/codecs/libopus/celt/x86/pitch_sse.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										192
									
								
								lib/rbcodec/codecs/libopus/celt/x86/pitch_sse.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,192 @@ | |||
| /* Copyright (c) 2013 Jean-Marc Valin and John Ridges
 | ||||
|    Copyright (c) 2014, Cisco Systems, INC MingXiang WeiZhou MinPeng YanWang*/ | ||||
| /**
 | ||||
|    @file pitch_sse.h | ||||
|    @brief Pitch analysis | ||||
|  */ | ||||
| 
 | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef PITCH_SSE_H | ||||
| #define PITCH_SSE_H | ||||
| 
 | ||||
| #if defined(HAVE_CONFIG_H) | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE4_1) && defined(FIXED_POINT) | ||||
| void xcorr_kernel_sse4_1( | ||||
|                     const opus_int16 *x, | ||||
|                     const opus_int16 *y, | ||||
|                     opus_val32       sum[4], | ||||
|                     int              len); | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE) && !defined(FIXED_POINT) | ||||
| void xcorr_kernel_sse( | ||||
|                     const opus_val16 *x, | ||||
|                     const opus_val16 *y, | ||||
|                     opus_val32       sum[4], | ||||
|                     int              len); | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_PRESUME_SSE4_1) && defined(FIXED_POINT) | ||||
| #define OVERRIDE_XCORR_KERNEL | ||||
| #define xcorr_kernel(x, y, sum, len, arch) \ | ||||
|     ((void)arch, xcorr_kernel_sse4_1(x, y, sum, len)) | ||||
| 
 | ||||
| #elif defined(OPUS_X86_PRESUME_SSE) && !defined(FIXED_POINT) | ||||
| #define OVERRIDE_XCORR_KERNEL | ||||
| #define xcorr_kernel(x, y, sum, len, arch) \ | ||||
|     ((void)arch, xcorr_kernel_sse(x, y, sum, len)) | ||||
| 
 | ||||
| #elif (defined(OPUS_X86_MAY_HAVE_SSE4_1) && defined(FIXED_POINT)) || (defined(OPUS_X86_MAY_HAVE_SSE) && !defined(FIXED_POINT)) | ||||
| 
 | ||||
| extern void (*const XCORR_KERNEL_IMPL[OPUS_ARCHMASK + 1])( | ||||
|                     const opus_val16 *x, | ||||
|                     const opus_val16 *y, | ||||
|                     opus_val32       sum[4], | ||||
|                     int              len); | ||||
| 
 | ||||
| #define OVERRIDE_XCORR_KERNEL | ||||
| #define xcorr_kernel(x, y, sum, len, arch) \ | ||||
|     ((*XCORR_KERNEL_IMPL[(arch) & OPUS_ARCHMASK])(x, y, sum, len)) | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE4_1) && defined(FIXED_POINT) | ||||
| opus_val32 celt_inner_prod_sse4_1( | ||||
|     const opus_int16 *x, | ||||
|     const opus_int16 *y, | ||||
|     int               N); | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE2) && defined(FIXED_POINT) | ||||
| opus_val32 celt_inner_prod_sse2( | ||||
|     const opus_int16 *x, | ||||
|     const opus_int16 *y, | ||||
|     int               N); | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(FIXED_POINT) | ||||
| opus_val32 celt_inner_prod_sse( | ||||
|     const opus_val16 *x, | ||||
|     const opus_val16 *y, | ||||
|     int               N); | ||||
| #endif | ||||
| 
 | ||||
| 
 | ||||
| #if defined(OPUS_X86_PRESUME_SSE4_1) && defined(FIXED_POINT) | ||||
| #define OVERRIDE_CELT_INNER_PROD | ||||
| #define celt_inner_prod(x, y, N, arch) \ | ||||
|     ((void)arch, celt_inner_prod_sse4_1(x, y, N)) | ||||
| 
 | ||||
| #elif defined(OPUS_X86_PRESUME_SSE2) && defined(FIXED_POINT) && !defined(OPUS_X86_MAY_HAVE_SSE4_1) | ||||
| #define OVERRIDE_CELT_INNER_PROD | ||||
| #define celt_inner_prod(x, y, N, arch) \ | ||||
|     ((void)arch, celt_inner_prod_sse2(x, y, N)) | ||||
| 
 | ||||
| #elif defined(OPUS_X86_PRESUME_SSE) && !defined(FIXED_POINT) | ||||
| #define OVERRIDE_CELT_INNER_PROD | ||||
| #define celt_inner_prod(x, y, N, arch) \ | ||||
|     ((void)arch, celt_inner_prod_sse(x, y, N)) | ||||
| 
 | ||||
| 
 | ||||
| #elif ((defined(OPUS_X86_MAY_HAVE_SSE4_1) || defined(OPUS_X86_MAY_HAVE_SSE2)) && defined(FIXED_POINT)) || \ | ||||
|     (defined(OPUS_X86_MAY_HAVE_SSE) && !defined(FIXED_POINT)) | ||||
| 
 | ||||
| extern opus_val32 (*const CELT_INNER_PROD_IMPL[OPUS_ARCHMASK + 1])( | ||||
|                     const opus_val16 *x, | ||||
|                     const opus_val16 *y, | ||||
|                     int               N); | ||||
| 
 | ||||
| #define OVERRIDE_CELT_INNER_PROD | ||||
| #define celt_inner_prod(x, y, N, arch) \ | ||||
|     ((*CELT_INNER_PROD_IMPL[(arch) & OPUS_ARCHMASK])(x, y, N)) | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE) && !defined(FIXED_POINT) | ||||
| 
 | ||||
| #define OVERRIDE_DUAL_INNER_PROD | ||||
| #define OVERRIDE_COMB_FILTER_CONST | ||||
| 
 | ||||
| #undef dual_inner_prod | ||||
| #undef comb_filter_const | ||||
| 
 | ||||
| void dual_inner_prod_sse(const opus_val16 *x, | ||||
|     const opus_val16 *y01, | ||||
|     const opus_val16 *y02, | ||||
|     int               N, | ||||
|     opus_val32       *xy1, | ||||
|     opus_val32       *xy2); | ||||
| 
 | ||||
| void comb_filter_const_sse(opus_val32 *y, | ||||
|     opus_val32 *x, | ||||
|     int         T, | ||||
|     int         N, | ||||
|     opus_val16  g10, | ||||
|     opus_val16  g11, | ||||
|     opus_val16  g12); | ||||
| 
 | ||||
| 
 | ||||
| #if defined(OPUS_X86_PRESUME_SSE) | ||||
| # define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) \ | ||||
|     ((void)(arch),dual_inner_prod_sse(x, y01, y02, N, xy1, xy2)) | ||||
| 
 | ||||
| # define comb_filter_const(y, x, T, N, g10, g11, g12, arch) \ | ||||
|     ((void)(arch),comb_filter_const_sse(y, x, T, N, g10, g11, g12)) | ||||
| #else | ||||
| 
 | ||||
| extern void (*const DUAL_INNER_PROD_IMPL[OPUS_ARCHMASK + 1])( | ||||
|               const opus_val16 *x, | ||||
|               const opus_val16 *y01, | ||||
|               const opus_val16 *y02, | ||||
|               int               N, | ||||
|               opus_val32       *xy1, | ||||
|               opus_val32       *xy2); | ||||
| 
 | ||||
| #define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) \ | ||||
|     ((*DUAL_INNER_PROD_IMPL[(arch) & OPUS_ARCHMASK])(x, y01, y02, N, xy1, xy2)) | ||||
| 
 | ||||
| extern void (*const COMB_FILTER_CONST_IMPL[OPUS_ARCHMASK + 1])( | ||||
|               opus_val32 *y, | ||||
|               opus_val32 *x, | ||||
|               int         T, | ||||
|               int         N, | ||||
|               opus_val16  g10, | ||||
|               opus_val16  g11, | ||||
|               opus_val16  g12); | ||||
| 
 | ||||
| #define comb_filter_const(y, x, T, N, g10, g11, g12, arch) \ | ||||
|     ((*COMB_FILTER_CONST_IMPL[(arch) & OPUS_ARCHMASK])(y, x, T, N, g10, g11, g12)) | ||||
| 
 | ||||
| #define NON_STATIC_COMB_FILTER_CONST_C | ||||
| 
 | ||||
| #endif | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										95
									
								
								lib/rbcodec/codecs/libopus/celt/x86/pitch_sse2.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										95
									
								
								lib/rbcodec/codecs/libopus/celt/x86/pitch_sse2.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,95 @@ | |||
| /* Copyright (c) 2014, Cisco Systems, INC
 | ||||
|    Written by XiangMingZhu WeiZhou MinPeng YanWang | ||||
| 
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <xmmintrin.h> | ||||
| #include <emmintrin.h> | ||||
| 
 | ||||
| #include "macros.h" | ||||
| #include "celt_lpc.h" | ||||
| #include "stack_alloc.h" | ||||
| #include "mathops.h" | ||||
| #include "pitch.h" | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE2) && defined(FIXED_POINT) | ||||
| opus_val32 celt_inner_prod_sse2(const opus_val16 *x, const opus_val16 *y, | ||||
|       int N) | ||||
| { | ||||
|     opus_int  i, dataSize16; | ||||
|     opus_int32 sum; | ||||
| 
 | ||||
|     __m128i inVec1_76543210, inVec1_FEDCBA98, acc1; | ||||
|     __m128i inVec2_76543210, inVec2_FEDCBA98, acc2; | ||||
| 
 | ||||
|     sum = 0; | ||||
|     dataSize16 = N & ~15; | ||||
| 
 | ||||
|     acc1 = _mm_setzero_si128(); | ||||
|     acc2 = _mm_setzero_si128(); | ||||
| 
 | ||||
|     for (i=0;i<dataSize16;i+=16) | ||||
|     { | ||||
|         inVec1_76543210 = _mm_loadu_si128((__m128i *)(&x[i + 0])); | ||||
|         inVec2_76543210 = _mm_loadu_si128((__m128i *)(&y[i + 0])); | ||||
| 
 | ||||
|         inVec1_FEDCBA98 = _mm_loadu_si128((__m128i *)(&x[i + 8])); | ||||
|         inVec2_FEDCBA98 = _mm_loadu_si128((__m128i *)(&y[i + 8])); | ||||
| 
 | ||||
|         inVec1_76543210 = _mm_madd_epi16(inVec1_76543210, inVec2_76543210); | ||||
|         inVec1_FEDCBA98 = _mm_madd_epi16(inVec1_FEDCBA98, inVec2_FEDCBA98); | ||||
| 
 | ||||
|         acc1 = _mm_add_epi32(acc1, inVec1_76543210); | ||||
|         acc2 = _mm_add_epi32(acc2, inVec1_FEDCBA98); | ||||
|     } | ||||
| 
 | ||||
|     acc1 = _mm_add_epi32( acc1, acc2 ); | ||||
| 
 | ||||
|     if (N - i >= 8) | ||||
|     { | ||||
|         inVec1_76543210 = _mm_loadu_si128((__m128i *)(&x[i + 0])); | ||||
|         inVec2_76543210 = _mm_loadu_si128((__m128i *)(&y[i + 0])); | ||||
| 
 | ||||
|         inVec1_76543210 = _mm_madd_epi16(inVec1_76543210, inVec2_76543210); | ||||
| 
 | ||||
|         acc1 = _mm_add_epi32(acc1, inVec1_76543210); | ||||
|         i += 8; | ||||
|     } | ||||
| 
 | ||||
|     acc1 = _mm_add_epi32(acc1, _mm_unpackhi_epi64( acc1, acc1)); | ||||
|     acc1 = _mm_add_epi32(acc1, _mm_shufflelo_epi16( acc1, 0x0E)); | ||||
|     sum += _mm_cvtsi128_si32(acc1); | ||||
| 
 | ||||
|     for (;i<N;i++) { | ||||
|         sum = silk_SMLABB(sum, x[i], y[i]); | ||||
|     } | ||||
| 
 | ||||
|     return sum; | ||||
| } | ||||
| #endif | ||||
							
								
								
									
										195
									
								
								lib/rbcodec/codecs/libopus/celt/x86/pitch_sse4_1.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										195
									
								
								lib/rbcodec/codecs/libopus/celt/x86/pitch_sse4_1.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,195 @@ | |||
| /* Copyright (c) 2014, Cisco Systems, INC
 | ||||
|    Written by XiangMingZhu WeiZhou MinPeng YanWang | ||||
| 
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <xmmintrin.h> | ||||
| #include <emmintrin.h> | ||||
| 
 | ||||
| #include "macros.h" | ||||
| #include "celt_lpc.h" | ||||
| #include "stack_alloc.h" | ||||
| #include "mathops.h" | ||||
| #include "pitch.h" | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE4_1) && defined(FIXED_POINT) | ||||
| #include <smmintrin.h> | ||||
| #include "x86cpu.h" | ||||
| 
 | ||||
| opus_val32 celt_inner_prod_sse4_1(const opus_val16 *x, const opus_val16 *y, | ||||
|       int N) | ||||
| { | ||||
|     opus_int  i, dataSize16; | ||||
|     opus_int32 sum; | ||||
|     __m128i inVec1_76543210, inVec1_FEDCBA98, acc1; | ||||
|     __m128i inVec2_76543210, inVec2_FEDCBA98, acc2; | ||||
|     __m128i inVec1_3210, inVec2_3210; | ||||
| 
 | ||||
|     sum = 0; | ||||
|     dataSize16 = N & ~15; | ||||
| 
 | ||||
|     acc1 = _mm_setzero_si128(); | ||||
|     acc2 = _mm_setzero_si128(); | ||||
| 
 | ||||
|     for (i=0;i<dataSize16;i+=16) { | ||||
|         inVec1_76543210 = _mm_loadu_si128((__m128i *)(&x[i + 0])); | ||||
|         inVec2_76543210 = _mm_loadu_si128((__m128i *)(&y[i + 0])); | ||||
| 
 | ||||
|         inVec1_FEDCBA98 = _mm_loadu_si128((__m128i *)(&x[i + 8])); | ||||
|         inVec2_FEDCBA98 = _mm_loadu_si128((__m128i *)(&y[i + 8])); | ||||
| 
 | ||||
|         inVec1_76543210 = _mm_madd_epi16(inVec1_76543210, inVec2_76543210); | ||||
|         inVec1_FEDCBA98 = _mm_madd_epi16(inVec1_FEDCBA98, inVec2_FEDCBA98); | ||||
| 
 | ||||
|         acc1 = _mm_add_epi32(acc1, inVec1_76543210); | ||||
|         acc2 = _mm_add_epi32(acc2, inVec1_FEDCBA98); | ||||
|     } | ||||
| 
 | ||||
|     acc1 = _mm_add_epi32(acc1, acc2); | ||||
| 
 | ||||
|     if (N - i >= 8) | ||||
|     { | ||||
|         inVec1_76543210 = _mm_loadu_si128((__m128i *)(&x[i + 0])); | ||||
|         inVec2_76543210 = _mm_loadu_si128((__m128i *)(&y[i + 0])); | ||||
| 
 | ||||
|         inVec1_76543210 = _mm_madd_epi16(inVec1_76543210, inVec2_76543210); | ||||
| 
 | ||||
|         acc1 = _mm_add_epi32(acc1, inVec1_76543210); | ||||
|         i += 8; | ||||
|     } | ||||
| 
 | ||||
|     if (N - i >= 4) | ||||
|     { | ||||
|         inVec1_3210 = OP_CVTEPI16_EPI32_M64(&x[i + 0]); | ||||
|         inVec2_3210 = OP_CVTEPI16_EPI32_M64(&y[i + 0]); | ||||
| 
 | ||||
|         inVec1_3210 = _mm_mullo_epi32(inVec1_3210, inVec2_3210); | ||||
| 
 | ||||
|         acc1 = _mm_add_epi32(acc1, inVec1_3210); | ||||
|         i += 4; | ||||
|     } | ||||
| 
 | ||||
|     acc1 = _mm_add_epi32(acc1, _mm_unpackhi_epi64(acc1, acc1)); | ||||
|     acc1 = _mm_add_epi32(acc1, _mm_shufflelo_epi16(acc1, 0x0E)); | ||||
| 
 | ||||
|     sum += _mm_cvtsi128_si32(acc1); | ||||
| 
 | ||||
|     for (;i<N;i++) | ||||
|     { | ||||
|         sum = silk_SMLABB(sum, x[i], y[i]); | ||||
|     } | ||||
| 
 | ||||
|     return sum; | ||||
| } | ||||
| 
 | ||||
| void xcorr_kernel_sse4_1(const opus_val16 * x, const opus_val16 * y, opus_val32 sum[ 4 ], int len) | ||||
| { | ||||
|     int j; | ||||
| 
 | ||||
|     __m128i vecX, vecX0, vecX1, vecX2, vecX3; | ||||
|     __m128i vecY0, vecY1, vecY2, vecY3; | ||||
|     __m128i sum0, sum1, sum2, sum3, vecSum; | ||||
|     __m128i initSum; | ||||
| 
 | ||||
|     celt_assert(len >= 3); | ||||
| 
 | ||||
|     sum0 = _mm_setzero_si128(); | ||||
|     sum1 = _mm_setzero_si128(); | ||||
|     sum2 = _mm_setzero_si128(); | ||||
|     sum3 = _mm_setzero_si128(); | ||||
| 
 | ||||
|     for (j=0;j<(len-7);j+=8) | ||||
|     { | ||||
|         vecX = _mm_loadu_si128((__m128i *)(&x[j + 0])); | ||||
|         vecY0 = _mm_loadu_si128((__m128i *)(&y[j + 0])); | ||||
|         vecY1 = _mm_loadu_si128((__m128i *)(&y[j + 1])); | ||||
|         vecY2 = _mm_loadu_si128((__m128i *)(&y[j + 2])); | ||||
|         vecY3 = _mm_loadu_si128((__m128i *)(&y[j + 3])); | ||||
| 
 | ||||
|         sum0 = _mm_add_epi32(sum0, _mm_madd_epi16(vecX, vecY0)); | ||||
|         sum1 = _mm_add_epi32(sum1, _mm_madd_epi16(vecX, vecY1)); | ||||
|         sum2 = _mm_add_epi32(sum2, _mm_madd_epi16(vecX, vecY2)); | ||||
|         sum3 = _mm_add_epi32(sum3, _mm_madd_epi16(vecX, vecY3)); | ||||
|     } | ||||
| 
 | ||||
|     sum0 = _mm_add_epi32(sum0, _mm_unpackhi_epi64( sum0, sum0)); | ||||
|     sum0 = _mm_add_epi32(sum0, _mm_shufflelo_epi16( sum0, 0x0E)); | ||||
| 
 | ||||
|     sum1 = _mm_add_epi32(sum1, _mm_unpackhi_epi64( sum1, sum1)); | ||||
|     sum1 = _mm_add_epi32(sum1, _mm_shufflelo_epi16( sum1, 0x0E)); | ||||
| 
 | ||||
|     sum2 = _mm_add_epi32(sum2, _mm_unpackhi_epi64( sum2, sum2)); | ||||
|     sum2 = _mm_add_epi32(sum2, _mm_shufflelo_epi16( sum2, 0x0E)); | ||||
| 
 | ||||
|     sum3 = _mm_add_epi32(sum3, _mm_unpackhi_epi64( sum3, sum3)); | ||||
|     sum3 = _mm_add_epi32(sum3, _mm_shufflelo_epi16( sum3, 0x0E)); | ||||
| 
 | ||||
|     vecSum = _mm_unpacklo_epi64(_mm_unpacklo_epi32(sum0, sum1), | ||||
|           _mm_unpacklo_epi32(sum2, sum3)); | ||||
| 
 | ||||
|     for (;j<(len-3);j+=4) | ||||
|     { | ||||
|         vecX = OP_CVTEPI16_EPI32_M64(&x[j + 0]); | ||||
|         vecX0 = _mm_shuffle_epi32(vecX, 0x00); | ||||
|         vecX1 = _mm_shuffle_epi32(vecX, 0x55); | ||||
|         vecX2 = _mm_shuffle_epi32(vecX, 0xaa); | ||||
|         vecX3 = _mm_shuffle_epi32(vecX, 0xff); | ||||
| 
 | ||||
|         vecY0 = OP_CVTEPI16_EPI32_M64(&y[j + 0]); | ||||
|         vecY1 = OP_CVTEPI16_EPI32_M64(&y[j + 1]); | ||||
|         vecY2 = OP_CVTEPI16_EPI32_M64(&y[j + 2]); | ||||
|         vecY3 = OP_CVTEPI16_EPI32_M64(&y[j + 3]); | ||||
| 
 | ||||
|         sum0 = _mm_mullo_epi32(vecX0, vecY0); | ||||
|         sum1 = _mm_mullo_epi32(vecX1, vecY1); | ||||
|         sum2 = _mm_mullo_epi32(vecX2, vecY2); | ||||
|         sum3 = _mm_mullo_epi32(vecX3, vecY3); | ||||
| 
 | ||||
|         sum0 = _mm_add_epi32(sum0, sum1); | ||||
|         sum2 = _mm_add_epi32(sum2, sum3); | ||||
|         vecSum = _mm_add_epi32(vecSum, sum0); | ||||
|         vecSum = _mm_add_epi32(vecSum, sum2); | ||||
|     } | ||||
| 
 | ||||
|     for (;j<len;j++) | ||||
|     { | ||||
|         vecX = OP_CVTEPI16_EPI32_M64(&x[j + 0]); | ||||
|         vecX0 = _mm_shuffle_epi32(vecX, 0x00); | ||||
| 
 | ||||
|         vecY0 = OP_CVTEPI16_EPI32_M64(&y[j + 0]); | ||||
| 
 | ||||
|         sum0 = _mm_mullo_epi32(vecX0, vecY0); | ||||
|         vecSum = _mm_add_epi32(vecSum, sum0); | ||||
|     } | ||||
| 
 | ||||
|     initSum = _mm_loadu_si128((__m128i *)(&sum[0])); | ||||
|     initSum = _mm_add_epi32(initSum, vecSum); | ||||
|     _mm_storeu_si128((__m128i *)sum, initSum); | ||||
| } | ||||
| #endif | ||||
							
								
								
									
										50
									
								
								lib/rbcodec/codecs/libopus/celt/x86/vq_sse.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										50
									
								
								lib/rbcodec/codecs/libopus/celt/x86/vq_sse.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,50 @@ | |||
| /* Copyright (c) 2016  Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifndef VQ_SSE_H | ||||
| #define VQ_SSE_H | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(FIXED_POINT) | ||||
| #define OVERRIDE_OP_PVQ_SEARCH | ||||
| 
 | ||||
| opus_val16 op_pvq_search_sse2(celt_norm *_X, int *iy, int K, int N, int arch); | ||||
| 
 | ||||
| #if defined(OPUS_X86_PRESUME_SSE2) | ||||
| #define op_pvq_search(x, iy, K, N, arch) \ | ||||
|     (op_pvq_search_sse2(x, iy, K, N, arch)) | ||||
| 
 | ||||
| #else | ||||
| 
 | ||||
| extern opus_val16 (*const OP_PVQ_SEARCH_IMPL[OPUS_ARCHMASK + 1])( | ||||
|       celt_norm *_X, int *iy, int K, int N, int arch); | ||||
| 
 | ||||
| #  define op_pvq_search(X, iy, K, N, arch) \ | ||||
|     ((*OP_PVQ_SEARCH_IMPL[(arch) & OPUS_ARCHMASK])(X, iy, K, N, arch)) | ||||
| 
 | ||||
| #endif | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										217
									
								
								lib/rbcodec/codecs/libopus/celt/x86/vq_sse2.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										217
									
								
								lib/rbcodec/codecs/libopus/celt/x86/vq_sse2.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,217 @@ | |||
| /* Copyright (c) 2007-2008 CSIRO
 | ||||
|    Copyright (c) 2007-2009 Xiph.Org Foundation | ||||
|    Copyright (c) 2007-2016 Jean-Marc Valin */ | ||||
| /*
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include <xmmintrin.h> | ||||
| #include <emmintrin.h> | ||||
| #include "celt_lpc.h" | ||||
| #include "stack_alloc.h" | ||||
| #include "mathops.h" | ||||
| #include "vq.h" | ||||
| #include "x86cpu.h" | ||||
| 
 | ||||
| 
 | ||||
| #ifndef FIXED_POINT | ||||
| 
 | ||||
| opus_val16 op_pvq_search_sse2(celt_norm *_X, int *iy, int K, int N, int arch) | ||||
| { | ||||
|    int i, j; | ||||
|    int pulsesLeft; | ||||
|    float xy, yy; | ||||
|    VARDECL(celt_norm, y); | ||||
|    VARDECL(celt_norm, X); | ||||
|    VARDECL(float, signy); | ||||
|    __m128 signmask; | ||||
|    __m128 sums; | ||||
|    __m128i fours; | ||||
|    SAVE_STACK; | ||||
| 
 | ||||
|    (void)arch; | ||||
|    /* All bits set to zero, except for the sign bit. */ | ||||
|    signmask = _mm_set_ps1(-0.f); | ||||
|    fours = _mm_set_epi32(4, 4, 4, 4); | ||||
|    ALLOC(y, N+3, celt_norm); | ||||
|    ALLOC(X, N+3, celt_norm); | ||||
|    ALLOC(signy, N+3, float); | ||||
| 
 | ||||
|    OPUS_COPY(X, _X, N); | ||||
|    X[N] = X[N+1] = X[N+2] = 0; | ||||
|    sums = _mm_setzero_ps(); | ||||
|    for (j=0;j<N;j+=4) | ||||
|    { | ||||
|       __m128 x4, s4; | ||||
|       x4 = _mm_loadu_ps(&X[j]); | ||||
|       s4 = _mm_cmplt_ps(x4, _mm_setzero_ps()); | ||||
|       /* Get rid of the sign */ | ||||
|       x4 = _mm_andnot_ps(signmask, x4); | ||||
|       sums = _mm_add_ps(sums, x4); | ||||
|       /* Clear y and iy in case we don't do the projection. */ | ||||
|       _mm_storeu_ps(&y[j], _mm_setzero_ps()); | ||||
|       _mm_storeu_si128((__m128i*)&iy[j], _mm_setzero_si128()); | ||||
|       _mm_storeu_ps(&X[j], x4); | ||||
|       _mm_storeu_ps(&signy[j], s4); | ||||
|    } | ||||
|    sums = _mm_add_ps(sums, _mm_shuffle_ps(sums, sums, _MM_SHUFFLE(1, 0, 3, 2))); | ||||
|    sums = _mm_add_ps(sums, _mm_shuffle_ps(sums, sums, _MM_SHUFFLE(2, 3, 0, 1))); | ||||
| 
 | ||||
|    xy = yy = 0; | ||||
| 
 | ||||
|    pulsesLeft = K; | ||||
| 
 | ||||
|    /* Do a pre-search by projecting on the pyramid */ | ||||
|    if (K > (N>>1)) | ||||
|    { | ||||
|       __m128i pulses_sum; | ||||
|       __m128 yy4, xy4; | ||||
|       __m128 rcp4; | ||||
|       opus_val32 sum = _mm_cvtss_f32(sums); | ||||
|       /* If X is too small, just replace it with a pulse at 0 */ | ||||
|       /* Prevents infinities and NaNs from causing too many pulses
 | ||||
|          to be allocated. 64 is an approximation of infinity here. */ | ||||
|       if (!(sum > EPSILON && sum < 64)) | ||||
|       { | ||||
|          X[0] = QCONST16(1.f,14); | ||||
|          j=1; do | ||||
|             X[j]=0; | ||||
|          while (++j<N); | ||||
|          sums = _mm_set_ps1(1.f); | ||||
|       } | ||||
|       /* Using K+e with e < 1 guarantees we cannot get more than K pulses. */ | ||||
|       rcp4 = _mm_mul_ps(_mm_set_ps1((float)(K+.8)), _mm_rcp_ps(sums)); | ||||
|       xy4 = yy4 = _mm_setzero_ps(); | ||||
|       pulses_sum = _mm_setzero_si128(); | ||||
|       for (j=0;j<N;j+=4) | ||||
|       { | ||||
|          __m128 rx4, x4, y4; | ||||
|          __m128i iy4; | ||||
|          x4 = _mm_loadu_ps(&X[j]); | ||||
|          rx4 = _mm_mul_ps(x4, rcp4); | ||||
|          iy4 = _mm_cvttps_epi32(rx4); | ||||
|          pulses_sum = _mm_add_epi32(pulses_sum, iy4); | ||||
|          _mm_storeu_si128((__m128i*)&iy[j], iy4); | ||||
|          y4 = _mm_cvtepi32_ps(iy4); | ||||
|          xy4 = _mm_add_ps(xy4, _mm_mul_ps(x4, y4)); | ||||
|          yy4 = _mm_add_ps(yy4, _mm_mul_ps(y4, y4)); | ||||
|          /* double the y[] vector so we don't have to do it in the search loop. */ | ||||
|          _mm_storeu_ps(&y[j], _mm_add_ps(y4, y4)); | ||||
|       } | ||||
|       pulses_sum = _mm_add_epi32(pulses_sum, _mm_shuffle_epi32(pulses_sum, _MM_SHUFFLE(1, 0, 3, 2))); | ||||
|       pulses_sum = _mm_add_epi32(pulses_sum, _mm_shuffle_epi32(pulses_sum, _MM_SHUFFLE(2, 3, 0, 1))); | ||||
|       pulsesLeft -= _mm_cvtsi128_si32(pulses_sum); | ||||
|       xy4 = _mm_add_ps(xy4, _mm_shuffle_ps(xy4, xy4, _MM_SHUFFLE(1, 0, 3, 2))); | ||||
|       xy4 = _mm_add_ps(xy4, _mm_shuffle_ps(xy4, xy4, _MM_SHUFFLE(2, 3, 0, 1))); | ||||
|       xy = _mm_cvtss_f32(xy4); | ||||
|       yy4 = _mm_add_ps(yy4, _mm_shuffle_ps(yy4, yy4, _MM_SHUFFLE(1, 0, 3, 2))); | ||||
|       yy4 = _mm_add_ps(yy4, _mm_shuffle_ps(yy4, yy4, _MM_SHUFFLE(2, 3, 0, 1))); | ||||
|       yy = _mm_cvtss_f32(yy4); | ||||
|    } | ||||
|    X[N] = X[N+1] = X[N+2] = -100; | ||||
|    y[N] = y[N+1] = y[N+2] = 100; | ||||
|    celt_sig_assert(pulsesLeft>=0); | ||||
| 
 | ||||
|    /* This should never happen, but just in case it does (e.g. on silence)
 | ||||
|       we fill the first bin with pulses. */ | ||||
|    if (pulsesLeft > N+3) | ||||
|    { | ||||
|       opus_val16 tmp = (opus_val16)pulsesLeft; | ||||
|       yy = MAC16_16(yy, tmp, tmp); | ||||
|       yy = MAC16_16(yy, tmp, y[0]); | ||||
|       iy[0] += pulsesLeft; | ||||
|       pulsesLeft=0; | ||||
|    } | ||||
| 
 | ||||
|    for (i=0;i<pulsesLeft;i++) | ||||
|    { | ||||
|       int best_id; | ||||
|       __m128 xy4, yy4; | ||||
|       __m128 max, max2; | ||||
|       __m128i count; | ||||
|       __m128i pos; | ||||
|       /* The squared magnitude term gets added anyway, so we might as well
 | ||||
|          add it outside the loop */ | ||||
|       yy = ADD16(yy, 1); | ||||
|       xy4 = _mm_load1_ps(&xy); | ||||
|       yy4 = _mm_load1_ps(&yy); | ||||
|       max = _mm_setzero_ps(); | ||||
|       pos = _mm_setzero_si128(); | ||||
|       count = _mm_set_epi32(3, 2, 1, 0); | ||||
|       for (j=0;j<N;j+=4) | ||||
|       { | ||||
|          __m128 x4, y4, r4; | ||||
|          x4 = _mm_loadu_ps(&X[j]); | ||||
|          y4 = _mm_loadu_ps(&y[j]); | ||||
|          x4 = _mm_add_ps(x4, xy4); | ||||
|          y4 = _mm_add_ps(y4, yy4); | ||||
|          y4 = _mm_rsqrt_ps(y4); | ||||
|          r4 = _mm_mul_ps(x4, y4); | ||||
|          /* Update the index of the max. */ | ||||
|          pos = _mm_max_epi16(pos, _mm_and_si128(count, _mm_castps_si128(_mm_cmpgt_ps(r4, max)))); | ||||
|          /* Update the max. */ | ||||
|          max = _mm_max_ps(max, r4); | ||||
|          /* Update the indices (+4) */ | ||||
|          count = _mm_add_epi32(count, fours); | ||||
|       } | ||||
|       /* Horizontal max */ | ||||
|       max2 = _mm_max_ps(max, _mm_shuffle_ps(max, max, _MM_SHUFFLE(1, 0, 3, 2))); | ||||
|       max2 = _mm_max_ps(max2, _mm_shuffle_ps(max2, max2, _MM_SHUFFLE(2, 3, 0, 1))); | ||||
|       /* Now that max2 contains the max at all positions, look at which value(s) of the
 | ||||
|          partial max is equal to the global max. */ | ||||
|       pos = _mm_and_si128(pos, _mm_castps_si128(_mm_cmpeq_ps(max, max2))); | ||||
|       pos = _mm_max_epi16(pos, _mm_unpackhi_epi64(pos, pos)); | ||||
|       pos = _mm_max_epi16(pos, _mm_shufflelo_epi16(pos, _MM_SHUFFLE(1, 0, 3, 2))); | ||||
|       best_id = _mm_cvtsi128_si32(pos); | ||||
| 
 | ||||
|       /* Updating the sums of the new pulse(s) */ | ||||
|       xy = ADD32(xy, EXTEND32(X[best_id])); | ||||
|       /* We're multiplying y[j] by two so we don't have to do it here */ | ||||
|       yy = ADD16(yy, y[best_id]); | ||||
| 
 | ||||
|       /* Only now that we've made the final choice, update y/iy */ | ||||
|       /* Multiplying y[j] by 2 so we don't have to do it everywhere else */ | ||||
|       y[best_id] += 2; | ||||
|       iy[best_id]++; | ||||
|    } | ||||
| 
 | ||||
|    /* Put the original sign back */ | ||||
|    for (j=0;j<N;j+=4) | ||||
|    { | ||||
|       __m128i y4; | ||||
|       __m128i s4; | ||||
|       y4 = _mm_loadu_si128((__m128i*)&iy[j]); | ||||
|       s4 = _mm_castps_si128(_mm_loadu_ps(&signy[j])); | ||||
|       y4 = _mm_xor_si128(_mm_add_epi32(y4, s4), s4); | ||||
|       _mm_storeu_si128((__m128i*)&iy[j], y4); | ||||
|    } | ||||
|    RESTORE_STACK; | ||||
|    return yy; | ||||
| } | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										167
									
								
								lib/rbcodec/codecs/libopus/celt/x86/x86_celt_map.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										167
									
								
								lib/rbcodec/codecs/libopus/celt/x86/x86_celt_map.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,167 @@ | |||
| /* Copyright (c) 2014, Cisco Systems, INC
 | ||||
|    Written by XiangMingZhu WeiZhou MinPeng YanWang | ||||
| 
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #if defined(HAVE_CONFIG_H) | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include "x86/x86cpu.h" | ||||
| #include "celt_lpc.h" | ||||
| #include "pitch.h" | ||||
| #include "pitch_sse.h" | ||||
| #include "vq.h" | ||||
| 
 | ||||
| #if defined(OPUS_HAVE_RTCD) | ||||
| 
 | ||||
| # if defined(FIXED_POINT) | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE4_1) && !defined(OPUS_X86_PRESUME_SSE4_1) | ||||
| 
 | ||||
| void (*const CELT_FIR_IMPL[OPUS_ARCHMASK + 1])( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *num, | ||||
|          opus_val16       *y, | ||||
|          int              N, | ||||
|          int              ord, | ||||
|          int              arch | ||||
| ) = { | ||||
|   celt_fir_c,                /* non-sse */ | ||||
|   celt_fir_c, | ||||
|   celt_fir_c, | ||||
|   MAY_HAVE_SSE4_1(celt_fir), /* sse4.1  */ | ||||
|   MAY_HAVE_SSE4_1(celt_fir)  /* avx  */ | ||||
| }; | ||||
| 
 | ||||
| void (*const XCORR_KERNEL_IMPL[OPUS_ARCHMASK + 1])( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *y, | ||||
|          opus_val32       sum[4], | ||||
|          int              len | ||||
| ) = { | ||||
|   xcorr_kernel_c,                /* non-sse */ | ||||
|   xcorr_kernel_c, | ||||
|   xcorr_kernel_c, | ||||
|   MAY_HAVE_SSE4_1(xcorr_kernel), /* sse4.1  */ | ||||
|   MAY_HAVE_SSE4_1(xcorr_kernel)  /* avx  */ | ||||
| }; | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| #if (defined(OPUS_X86_MAY_HAVE_SSE4_1) && !defined(OPUS_X86_PRESUME_SSE4_1)) ||  \ | ||||
|  (!defined(OPUS_X86_MAY_HAVE_SSE_4_1) && defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(OPUS_X86_PRESUME_SSE2)) | ||||
| 
 | ||||
| opus_val32 (*const CELT_INNER_PROD_IMPL[OPUS_ARCHMASK + 1])( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *y, | ||||
|          int              N | ||||
| ) = { | ||||
|   celt_inner_prod_c,                /* non-sse */ | ||||
|   celt_inner_prod_c, | ||||
|   MAY_HAVE_SSE2(celt_inner_prod), | ||||
|   MAY_HAVE_SSE4_1(celt_inner_prod), /* sse4.1  */ | ||||
|   MAY_HAVE_SSE4_1(celt_inner_prod)  /* avx  */ | ||||
| }; | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| # else | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE) && !defined(OPUS_X86_PRESUME_SSE) | ||||
| 
 | ||||
| void (*const XCORR_KERNEL_IMPL[OPUS_ARCHMASK + 1])( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *y, | ||||
|          opus_val32       sum[4], | ||||
|          int              len | ||||
| ) = { | ||||
|   xcorr_kernel_c,                /* non-sse */ | ||||
|   MAY_HAVE_SSE(xcorr_kernel), | ||||
|   MAY_HAVE_SSE(xcorr_kernel), | ||||
|   MAY_HAVE_SSE(xcorr_kernel), | ||||
|   MAY_HAVE_SSE(xcorr_kernel) | ||||
| }; | ||||
| 
 | ||||
| opus_val32 (*const CELT_INNER_PROD_IMPL[OPUS_ARCHMASK + 1])( | ||||
|          const opus_val16 *x, | ||||
|          const opus_val16 *y, | ||||
|          int              N | ||||
| ) = { | ||||
|   celt_inner_prod_c,                /* non-sse */ | ||||
|   MAY_HAVE_SSE(celt_inner_prod), | ||||
|   MAY_HAVE_SSE(celt_inner_prod), | ||||
|   MAY_HAVE_SSE(celt_inner_prod), | ||||
|   MAY_HAVE_SSE(celt_inner_prod) | ||||
| }; | ||||
| 
 | ||||
| void (*const DUAL_INNER_PROD_IMPL[OPUS_ARCHMASK + 1])( | ||||
|                     const opus_val16 *x, | ||||
|                     const opus_val16 *y01, | ||||
|                     const opus_val16 *y02, | ||||
|                     int               N, | ||||
|                     opus_val32       *xy1, | ||||
|                     opus_val32       *xy2 | ||||
| ) = { | ||||
|   dual_inner_prod_c,                /* non-sse */ | ||||
|   MAY_HAVE_SSE(dual_inner_prod), | ||||
|   MAY_HAVE_SSE(dual_inner_prod), | ||||
|   MAY_HAVE_SSE(dual_inner_prod), | ||||
|   MAY_HAVE_SSE(dual_inner_prod) | ||||
| }; | ||||
| 
 | ||||
| void (*const COMB_FILTER_CONST_IMPL[OPUS_ARCHMASK + 1])( | ||||
|               opus_val32 *y, | ||||
|               opus_val32 *x, | ||||
|               int         T, | ||||
|               int         N, | ||||
|               opus_val16  g10, | ||||
|               opus_val16  g11, | ||||
|               opus_val16  g12 | ||||
| ) = { | ||||
|   comb_filter_const_c,                /* non-sse */ | ||||
|   MAY_HAVE_SSE(comb_filter_const), | ||||
|   MAY_HAVE_SSE(comb_filter_const), | ||||
|   MAY_HAVE_SSE(comb_filter_const), | ||||
|   MAY_HAVE_SSE(comb_filter_const) | ||||
| }; | ||||
| 
 | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| #if defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(OPUS_X86_PRESUME_SSE2) | ||||
| opus_val16 (*const OP_PVQ_SEARCH_IMPL[OPUS_ARCHMASK + 1])( | ||||
|       celt_norm *_X, int *iy, int K, int N, int arch | ||||
| ) = { | ||||
|   op_pvq_search_c,                /* non-sse */ | ||||
|   op_pvq_search_c, | ||||
|   MAY_HAVE_SSE2(op_pvq_search), | ||||
|   MAY_HAVE_SSE2(op_pvq_search), | ||||
|   MAY_HAVE_SSE2(op_pvq_search) | ||||
| }; | ||||
| #endif | ||||
| 
 | ||||
| #endif | ||||
| #endif | ||||
							
								
								
									
										157
									
								
								lib/rbcodec/codecs/libopus/celt/x86/x86cpu.c
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										157
									
								
								lib/rbcodec/codecs/libopus/celt/x86/x86cpu.c
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,157 @@ | |||
| /* Copyright (c) 2014, Cisco Systems, INC
 | ||||
|    Written by XiangMingZhu WeiZhou MinPeng YanWang | ||||
| 
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #ifdef HAVE_CONFIG_H | ||||
| #include "config.h" | ||||
| #endif | ||||
| 
 | ||||
| #include "cpu_support.h" | ||||
| #include "macros.h" | ||||
| #include "main.h" | ||||
| #include "pitch.h" | ||||
| #include "x86cpu.h" | ||||
| 
 | ||||
| #if (defined(OPUS_X86_MAY_HAVE_SSE) && !defined(OPUS_X86_PRESUME_SSE)) || \ | ||||
|   (defined(OPUS_X86_MAY_HAVE_SSE2) && !defined(OPUS_X86_PRESUME_SSE2)) || \ | ||||
|   (defined(OPUS_X86_MAY_HAVE_SSE4_1) && !defined(OPUS_X86_PRESUME_SSE4_1)) || \ | ||||
|   (defined(OPUS_X86_MAY_HAVE_AVX) && !defined(OPUS_X86_PRESUME_AVX)) | ||||
| 
 | ||||
| 
 | ||||
| #if defined(_MSC_VER) | ||||
| 
 | ||||
| #include <intrin.h> | ||||
| static _inline void cpuid(unsigned int CPUInfo[4], unsigned int InfoType) | ||||
| { | ||||
|     __cpuid((int*)CPUInfo, InfoType); | ||||
| } | ||||
| 
 | ||||
| #else | ||||
| 
 | ||||
| #if defined(CPU_INFO_BY_C) | ||||
| #include <cpuid.h> | ||||
| #endif | ||||
| 
 | ||||
| static void cpuid(unsigned int CPUInfo[4], unsigned int InfoType) | ||||
| { | ||||
| #if defined(CPU_INFO_BY_ASM) | ||||
| #if defined(__i386__) && defined(__PIC__) | ||||
| /* %ebx is PIC register in 32-bit, so mustn't clobber it. */ | ||||
|     __asm__ __volatile__ ( | ||||
|         "xchg %%ebx, %1\n" | ||||
|         "cpuid\n" | ||||
|         "xchg %%ebx, %1\n": | ||||
|         "=a" (CPUInfo[0]), | ||||
|         "=r" (CPUInfo[1]), | ||||
|         "=c" (CPUInfo[2]), | ||||
|         "=d" (CPUInfo[3]) : | ||||
|         "0" (InfoType) | ||||
|     ); | ||||
| #else | ||||
|     __asm__ __volatile__ ( | ||||
|         "cpuid": | ||||
|         "=a" (CPUInfo[0]), | ||||
|         "=b" (CPUInfo[1]), | ||||
|         "=c" (CPUInfo[2]), | ||||
|         "=d" (CPUInfo[3]) : | ||||
|         "0" (InfoType) | ||||
|     ); | ||||
| #endif | ||||
| #elif defined(CPU_INFO_BY_C) | ||||
|     __get_cpuid(InfoType, &(CPUInfo[0]), &(CPUInfo[1]), &(CPUInfo[2]), &(CPUInfo[3])); | ||||
| #endif | ||||
| } | ||||
| 
 | ||||
| #endif | ||||
| 
 | ||||
| typedef struct CPU_Feature{ | ||||
|     /*  SIMD: 128-bit */ | ||||
|     int HW_SSE; | ||||
|     int HW_SSE2; | ||||
|     int HW_SSE41; | ||||
|     /*  SIMD: 256-bit */ | ||||
|     int HW_AVX; | ||||
| } CPU_Feature; | ||||
| 
 | ||||
| static void opus_cpu_feature_check(CPU_Feature *cpu_feature) | ||||
| { | ||||
|     unsigned int info[4] = {0}; | ||||
|     unsigned int nIds = 0; | ||||
| 
 | ||||
|     cpuid(info, 0); | ||||
|     nIds = info[0]; | ||||
| 
 | ||||
|     if (nIds >= 1){ | ||||
|         cpuid(info, 1); | ||||
|         cpu_feature->HW_SSE = (info[3] & (1 << 25)) != 0; | ||||
|         cpu_feature->HW_SSE2 = (info[3] & (1 << 26)) != 0; | ||||
|         cpu_feature->HW_SSE41 = (info[2] & (1 << 19)) != 0; | ||||
|         cpu_feature->HW_AVX = (info[2] & (1 << 28)) != 0; | ||||
|     } | ||||
|     else { | ||||
|         cpu_feature->HW_SSE = 0; | ||||
|         cpu_feature->HW_SSE2 = 0; | ||||
|         cpu_feature->HW_SSE41 = 0; | ||||
|         cpu_feature->HW_AVX = 0; | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| int opus_select_arch(void) | ||||
| { | ||||
|     CPU_Feature cpu_feature; | ||||
|     int arch; | ||||
| 
 | ||||
|     opus_cpu_feature_check(&cpu_feature); | ||||
| 
 | ||||
|     arch = 0; | ||||
|     if (!cpu_feature.HW_SSE) | ||||
|     { | ||||
|        return arch; | ||||
|     } | ||||
|     arch++; | ||||
| 
 | ||||
|     if (!cpu_feature.HW_SSE2) | ||||
|     { | ||||
|        return arch; | ||||
|     } | ||||
|     arch++; | ||||
| 
 | ||||
|     if (!cpu_feature.HW_SSE41) | ||||
|     { | ||||
|         return arch; | ||||
|     } | ||||
|     arch++; | ||||
| 
 | ||||
|     if (!cpu_feature.HW_AVX) | ||||
|     { | ||||
|         return arch; | ||||
|     } | ||||
|     arch++; | ||||
| 
 | ||||
|     return arch; | ||||
| } | ||||
| 
 | ||||
| #endif | ||||
							
								
								
									
										95
									
								
								lib/rbcodec/codecs/libopus/celt/x86/x86cpu.h
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										95
									
								
								lib/rbcodec/codecs/libopus/celt/x86/x86cpu.h
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,95 @@ | |||
| /* Copyright (c) 2014, Cisco Systems, INC
 | ||||
|    Written by XiangMingZhu WeiZhou MinPeng YanWang | ||||
| 
 | ||||
|    Redistribution and use in source and binary forms, with or without | ||||
|    modification, are permitted provided that the following conditions | ||||
|    are met: | ||||
| 
 | ||||
|    - Redistributions of source code must retain the above copyright | ||||
|    notice, this list of conditions and the following disclaimer. | ||||
| 
 | ||||
|    - Redistributions in binary form must reproduce the above copyright | ||||
|    notice, this list of conditions and the following disclaimer in the | ||||
|    documentation and/or other materials provided with the distribution. | ||||
| 
 | ||||
|    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | ||||
|    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | ||||
|    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | ||||
|    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER | ||||
|    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | ||||
|    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | ||||
|    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | ||||
|    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF | ||||
|    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING | ||||
|    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
|    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| */ | ||||
| 
 | ||||
| #if !defined(X86CPU_H) | ||||
| # define X86CPU_H | ||||
| 
 | ||||
| # if defined(OPUS_X86_MAY_HAVE_SSE) | ||||
| #  define MAY_HAVE_SSE(name) name ## _sse | ||||
| # else | ||||
| #  define MAY_HAVE_SSE(name) name ## _c | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_X86_MAY_HAVE_SSE2) | ||||
| #  define MAY_HAVE_SSE2(name) name ## _sse2 | ||||
| # else | ||||
| #  define MAY_HAVE_SSE2(name) name ## _c | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_X86_MAY_HAVE_SSE4_1) | ||||
| #  define MAY_HAVE_SSE4_1(name) name ## _sse4_1 | ||||
| # else | ||||
| #  define MAY_HAVE_SSE4_1(name) name ## _c | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_X86_MAY_HAVE_AVX) | ||||
| #  define MAY_HAVE_AVX(name) name ## _avx | ||||
| # else | ||||
| #  define MAY_HAVE_AVX(name) name ## _c | ||||
| # endif | ||||
| 
 | ||||
| # if defined(OPUS_HAVE_RTCD) | ||||
| int opus_select_arch(void); | ||||
| # endif | ||||
| 
 | ||||
| /*gcc appears to emit MOVDQA's to load the argument of an _mm_cvtepi8_epi32()
 | ||||
|   or _mm_cvtepi16_epi32() when optimizations are disabled, even though the | ||||
|   actual PMOVSXWD instruction takes an m32 or m64. Unlike a normal memory | ||||
|   reference, these require 16-byte alignment and load a full 16 bytes (instead | ||||
|   of 4 or 8), possibly reading out of bounds. | ||||
| 
 | ||||
|   We can insert an explicit MOVD or MOVQ using _mm_cvtsi32_si128() or | ||||
|   _mm_loadl_epi64(), which should have the same semantics as an m32 or m64 | ||||
|   reference in the PMOVSXWD instruction itself, but gcc is not smart enough to | ||||
|   optimize this out when optimizations ARE enabled. | ||||
| 
 | ||||
|   Clang, in contrast, requires us to do this always for _mm_cvtepi8_epi32 | ||||
|   (which is fair, since technically the compiler is always allowed to do the | ||||
|   dereference before invoking the function implementing the intrinsic). | ||||
|   However, it is smart enough to eliminate the extra MOVD instruction. | ||||
|   For _mm_cvtepi16_epi32, it does the right thing, though does *not* optimize out | ||||
|   the extra MOVQ if it's specified explicitly */ | ||||
| 
 | ||||
| # if defined(__clang__) || !defined(__OPTIMIZE__) | ||||
| #  define OP_CVTEPI8_EPI32_M32(x) \ | ||||
|  (_mm_cvtepi8_epi32(_mm_cvtsi32_si128(*(int *)(x)))) | ||||
| # else | ||||
| #  define OP_CVTEPI8_EPI32_M32(x) \ | ||||
|  (_mm_cvtepi8_epi32(*(__m128i *)(x))) | ||||
| #endif | ||||
| 
 | ||||
| /* similar reasoning about the instruction sequence as in the 32-bit macro above,
 | ||||
|  */ | ||||
| # if defined(__clang__) || !defined(__OPTIMIZE__) | ||||
| #  define OP_CVTEPI16_EPI32_M64(x) \ | ||||
|  (_mm_cvtepi16_epi32(_mm_loadl_epi64((__m128i *)(x)))) | ||||
| # else | ||||
| #  define OP_CVTEPI16_EPI32_M64(x) \ | ||||
|  (_mm_cvtepi16_epi32(*(__m128i *)(x))) | ||||
| # endif | ||||
| 
 | ||||
| #endif | ||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue