forked from len0rd/rockbox
Extend av_log2 in codeclib into a generic for scanning for set bits, which can provide either log2 or leading-zero-count output, and can force mapping 0 input to 0 output if needed (otherwise 0 input produces undefined result). Replace av_log2 in lib/codeclib.h, floor_log2 and wl_min_lzc in libfaad/common.c and common.h, and count_leading_zeros in libalac/alac.c with macros using bs_generic.
git-svn-id: svn://svn.rockbox.org/rockbox/trunk@23903 a1c6a512-1295-4272-9138-f99709370657
This commit is contained in:
parent
3683bb67db
commit
85aad9b397
6 changed files with 96 additions and 141 deletions
|
@ -33,6 +33,15 @@ unsigned char* mp3buf; // The actual MP3 buffer from Rockbox
|
||||||
unsigned char* mallocbuf; // 512K from the start of MP3 buffer
|
unsigned char* mallocbuf; // 512K from the start of MP3 buffer
|
||||||
unsigned char* filebuf; // The rest of the MP3 buffer
|
unsigned char* filebuf; // The rest of the MP3 buffer
|
||||||
|
|
||||||
|
unsigned bs_log2(unsigned x)
|
||||||
|
{ return bs_generic(x, BS_LOG2); }
|
||||||
|
unsigned bs_log2_0(unsigned x)
|
||||||
|
{ return bs_generic(x, BS_LOG2|BS_0_0); }
|
||||||
|
unsigned bs_clz(unsigned x)
|
||||||
|
{ return bs_generic(x, BS_CLZ); }
|
||||||
|
unsigned bs_clz_0(unsigned x)
|
||||||
|
{ return bs_generic(x, BS_CLZ|BS_0_0); }
|
||||||
|
|
||||||
int codec_init(void)
|
int codec_init(void)
|
||||||
{
|
{
|
||||||
mem_ptr = 0;
|
mem_ptr = 0;
|
||||||
|
@ -139,7 +148,7 @@ void qsort(void *base, size_t nmemb, size_t size,
|
||||||
}
|
}
|
||||||
|
|
||||||
/* From ffmpeg - libavutil/common.h */
|
/* From ffmpeg - libavutil/common.h */
|
||||||
const uint8_t ff_log2_tab[256] ICONST_ATTR = {
|
const uint8_t bs_log2_tab[256] ICONST_ATTR = {
|
||||||
0,0,1,1,2,2,2,2,3,3,3,3,3,3,3,3,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,
|
0,0,1,1,2,2,2,2,3,3,3,3,3,3,3,3,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,
|
||||||
5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,
|
5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,
|
||||||
6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,
|
6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,
|
||||||
|
@ -150,6 +159,17 @@ const uint8_t ff_log2_tab[256] ICONST_ATTR = {
|
||||||
7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7
|
7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7
|
||||||
};
|
};
|
||||||
|
|
||||||
|
const uint8_t bs_clz_tab[256] ICONST_ATTR = {
|
||||||
|
8,7,6,6,5,5,5,5,4,4,4,4,4,4,4,4,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,
|
||||||
|
2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
|
||||||
|
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
|
||||||
|
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
|
||||||
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
|
||||||
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
|
||||||
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
|
||||||
|
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
|
||||||
|
};
|
||||||
|
|
||||||
#ifdef RB_PROFILE
|
#ifdef RB_PROFILE
|
||||||
void __cyg_profile_func_enter(void *this_fn, void *call_site) {
|
void __cyg_profile_func_enter(void *this_fn, void *call_site) {
|
||||||
#ifdef CPU_COLDFIRE
|
#ifdef CPU_COLDFIRE
|
||||||
|
|
|
@ -74,45 +74,80 @@ unsigned udiv32_arm(unsigned a, unsigned b);
|
||||||
#define UDIV32(a, b) (a / b)
|
#define UDIV32(a, b) (a / b)
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
#if !defined(CPU_ARM) || ARM_ARCH < 5
|
||||||
|
/* From libavutil/common.h */
|
||||||
|
extern const uint8_t bs_log2_tab[256] ICONST_ATTR;
|
||||||
|
extern const uint8_t bs_clz_tab[256] ICONST_ATTR;
|
||||||
|
#endif
|
||||||
|
|
||||||
|
#define BS_LOG2 0 /* default personality, equivalent floor(log2(x)) */
|
||||||
|
#define BS_CLZ 1 /* alternate personality, Count Leading Zeros */
|
||||||
|
#define BS_SHORT 2 /* input guaranteed not to exceed 16 bits */
|
||||||
|
#define BS_0_0 4 /* guarantee mapping of 0 input to 0 output */
|
||||||
|
|
||||||
|
/* Generic bit-scanning function, used to wrap platform CLZ instruction or
|
||||||
|
scan-and-lookup code, and to provide control over output for 0 inputs. */
|
||||||
|
static inline unsigned int bs_generic(unsigned int v, int mode)
|
||||||
|
{
|
||||||
|
#if defined(CPU_ARM) && ARM_ARCH >= 5
|
||||||
|
unsigned int r = __builtin_clz(v);
|
||||||
|
if (mode & BS_CLZ)
|
||||||
|
{
|
||||||
|
if (mode & BS_0_0)
|
||||||
|
r &= 31;
|
||||||
|
} else {
|
||||||
|
r = 31 - r;
|
||||||
|
/* If mode is constant, this is a single conditional instruction */
|
||||||
|
if (mode & BS_0_0 && (signed)r < 0)
|
||||||
|
r += 1;
|
||||||
|
}
|
||||||
|
#else
|
||||||
|
const uint8_t *bs_tab;
|
||||||
|
unsigned int r;
|
||||||
|
unsigned int n = v;
|
||||||
|
int inc;
|
||||||
|
/* Set up table, increment, and initial result value based on
|
||||||
|
personality. */
|
||||||
|
if (mode & BS_CLZ)
|
||||||
|
{
|
||||||
|
bs_tab = bs_clz_tab;
|
||||||
|
r = 24;
|
||||||
|
inc = -16;
|
||||||
|
} else {
|
||||||
|
bs_tab = bs_log2_tab;
|
||||||
|
r = 0;
|
||||||
|
inc = 16;
|
||||||
|
}
|
||||||
|
if (!(mode & BS_SHORT) && n >= 0x10000) {
|
||||||
|
n >>= 16;
|
||||||
|
r += inc;
|
||||||
|
}
|
||||||
|
if (n > 0xff) {
|
||||||
|
n >>= 8;
|
||||||
|
r += inc / 2;
|
||||||
|
}
|
||||||
|
#ifdef CPU_COLDFIRE
|
||||||
|
/* The high 24 bits of n are guaranteed empty after the above, so a
|
||||||
|
superfluous ext.b instruction can be saved by loading the LUT value over
|
||||||
|
n with asm */
|
||||||
|
asm volatile (
|
||||||
|
"move.b (%1,%0.l),%0"
|
||||||
|
: "+d" (n)
|
||||||
|
: "a" (bs_tab)
|
||||||
|
);
|
||||||
|
#else
|
||||||
|
n = bs_tab[n];
|
||||||
|
#endif
|
||||||
|
r += n;
|
||||||
|
if (mode & BS_CLZ && mode & BS_0_0 && v == 0)
|
||||||
|
r = 0;
|
||||||
|
#endif
|
||||||
|
return r;
|
||||||
|
}
|
||||||
|
|
||||||
/* TODO figure out if we really need to care about calculating
|
/* TODO figure out if we really need to care about calculating
|
||||||
av_log2(0) */
|
av_log2(0) */
|
||||||
#if defined(CPU_ARM) && ARM_ARCH >= 6
|
#define av_log2(v) bs_generic(v, BS_0_0)
|
||||||
static inline unsigned int av_log2(uint32_t v)
|
|
||||||
{
|
|
||||||
unsigned int r;
|
|
||||||
asm volatile("clz %[r], %[v]\n\t" /* count leading zeroes */
|
|
||||||
"rsb %[r], %[r], #31\n\t" /* r = 31 - leading zeroes */
|
|
||||||
"usat %[r], #5, %[r]\n\t" /* unsigned saturate r so -1 -> 0 */
|
|
||||||
:[r] "=r" (r) : [v] "r" (v));
|
|
||||||
return(r);
|
|
||||||
}
|
|
||||||
#elif defined(CPU_ARM) && ARM_ARCH >= 5
|
|
||||||
static inline unsigned int av_log2(uint32_t v)
|
|
||||||
{
|
|
||||||
return v ? 31 - __builtin_clz(v) : 0;
|
|
||||||
}
|
|
||||||
#else /* CPU_ARM */
|
|
||||||
/* From libavutil/common.h */
|
|
||||||
extern const uint8_t ff_log2_tab[256] ICONST_ATTR;
|
|
||||||
|
|
||||||
static inline unsigned int av_log2(unsigned int v)
|
|
||||||
{
|
|
||||||
int n;
|
|
||||||
|
|
||||||
n = 0;
|
|
||||||
if (v & 0xffff0000) {
|
|
||||||
v >>= 16;
|
|
||||||
n += 16;
|
|
||||||
}
|
|
||||||
if (v & 0xff00) {
|
|
||||||
v >>= 8;
|
|
||||||
n += 8;
|
|
||||||
}
|
|
||||||
n += ff_log2_tab[v];
|
|
||||||
|
|
||||||
return n;
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
|
|
||||||
/* Various codec helper functions */
|
/* Various codec helper functions */
|
||||||
|
|
||||||
|
|
|
@ -166,46 +166,7 @@ static inline void unreadbits(alac_file *alac, int bits)
|
||||||
alac->input_buffer_bitaccumulator *= -1;
|
alac->input_buffer_bitaccumulator *= -1;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* ARMv5+ has a clz instruction equivalent to our function.
|
#define count_leading_zeros(x) bs_generic(x, BS_CLZ|BS_SHORT)
|
||||||
*/
|
|
||||||
#if (defined(CPU_ARM) && (ARM_ARCH > 4))
|
|
||||||
static inline int count_leading_zeros(uint32_t v)
|
|
||||||
{
|
|
||||||
return __builtin_clz(v);
|
|
||||||
}
|
|
||||||
#else
|
|
||||||
|
|
||||||
static const unsigned char bittab[16] ICONST_ATTR = {
|
|
||||||
0, 1, 2, 2, 3, 3, 3, 3, 4, 4, 4, 4, 4, 4, 4, 4
|
|
||||||
};
|
|
||||||
|
|
||||||
static inline int count_leading_zeros(int input)
|
|
||||||
{
|
|
||||||
int output = 32;
|
|
||||||
|
|
||||||
#if 0
|
|
||||||
/* Experimentation has shown that the following test is always false,
|
|
||||||
so we don't bother to perform it. */
|
|
||||||
if (input & 0xffff0000)
|
|
||||||
{
|
|
||||||
input >>= 16;
|
|
||||||
output -= 16;
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
if (input & 0xff00)
|
|
||||||
{
|
|
||||||
input >>= 8;
|
|
||||||
output -= 8;
|
|
||||||
}
|
|
||||||
if (input & 0xf0)
|
|
||||||
{
|
|
||||||
input >>= 4;
|
|
||||||
output -= 4;
|
|
||||||
}
|
|
||||||
output -= bittab[input];
|
|
||||||
return output;
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
|
|
||||||
void basterdised_rice_decompress(alac_file *alac,
|
void basterdised_rice_decompress(alac_file *alac,
|
||||||
int32_t *output_buffer,
|
int32_t *output_buffer,
|
||||||
|
|
|
@ -241,58 +241,7 @@ uint32_t random_int(void)
|
||||||
return (__r1 = (t3 >> 1) | t1 ) ^ (__r2 = (t4 + t4) | t2 );
|
return (__r1 = (t3 >> 1) | t1 ) ^ (__r2 = (t4 + t4) | t2 );
|
||||||
}
|
}
|
||||||
|
|
||||||
uint32_t ones32(uint32_t x)
|
#define floor_log2(x) bs_generic(x, BS_LOG2)
|
||||||
{
|
|
||||||
x -= ((x >> 1) & 0x55555555);
|
|
||||||
x = (((x >> 2) & 0x33333333) + (x & 0x33333333));
|
|
||||||
x = (((x >> 4) + x) & 0x0f0f0f0f);
|
|
||||||
x += (x >> 8);
|
|
||||||
x += (x >> 16);
|
|
||||||
|
|
||||||
return (x & 0x0000003f);
|
|
||||||
}
|
|
||||||
|
|
||||||
uint32_t floor_log2(uint32_t x)
|
|
||||||
{
|
|
||||||
#if 1
|
|
||||||
x |= (x >> 1);
|
|
||||||
x |= (x >> 2);
|
|
||||||
x |= (x >> 4);
|
|
||||||
x |= (x >> 8);
|
|
||||||
x |= (x >> 16);
|
|
||||||
|
|
||||||
return (ones32(x) - 1);
|
|
||||||
#else
|
|
||||||
uint32_t count = 0;
|
|
||||||
|
|
||||||
while (x >>= 1)
|
|
||||||
count++;
|
|
||||||
|
|
||||||
return count;
|
|
||||||
#endif
|
|
||||||
}
|
|
||||||
|
|
||||||
/* returns position of first bit that is not 0 from msb,
|
|
||||||
* starting count at lsb */
|
|
||||||
uint32_t wl_min_lzc(uint32_t x)
|
|
||||||
{
|
|
||||||
#if 1
|
|
||||||
x |= (x >> 1);
|
|
||||||
x |= (x >> 2);
|
|
||||||
x |= (x >> 4);
|
|
||||||
x |= (x >> 8);
|
|
||||||
x |= (x >> 16);
|
|
||||||
|
|
||||||
return (ones32(x));
|
|
||||||
#else
|
|
||||||
uint32_t count = 0;
|
|
||||||
|
|
||||||
while (x >>= 1)
|
|
||||||
count++;
|
|
||||||
|
|
||||||
return (count + 1);
|
|
||||||
#endif
|
|
||||||
}
|
|
||||||
|
|
||||||
#ifdef FIXED_POINT
|
#ifdef FIXED_POINT
|
||||||
|
|
||||||
|
|
|
@ -399,9 +399,7 @@ typedef real_t complex_t[2];
|
||||||
/* common functions */
|
/* common functions */
|
||||||
uint8_t cpu_has_sse(void);
|
uint8_t cpu_has_sse(void);
|
||||||
uint32_t random_int(void);
|
uint32_t random_int(void);
|
||||||
uint32_t ones32(uint32_t x);
|
#define wl_min_lzc(x) bs_generic(x, BS_LOG2|BS_0_0)
|
||||||
uint32_t floor_log2(uint32_t x);
|
|
||||||
uint32_t wl_min_lzc(uint32_t x);
|
|
||||||
#ifdef FIXED_POINT
|
#ifdef FIXED_POINT
|
||||||
#define LOG2_MIN_INF REAL_CONST(-10000)
|
#define LOG2_MIN_INF REAL_CONST(-10000)
|
||||||
int32_t log2_int(uint32_t val);
|
int32_t log2_int(uint32_t val);
|
||||||
|
|
|
@ -222,10 +222,6 @@ static void auto_correlation(sbr_info *sbr, acorr_coef *ac,
|
||||||
|
|
||||||
exp = wl_min_lzc(mask);
|
exp = wl_min_lzc(mask);
|
||||||
|
|
||||||
/* improves accuracy */
|
|
||||||
if (exp > 0)
|
|
||||||
exp -= 1;
|
|
||||||
|
|
||||||
for (j = offset; j < len + offset; j++)
|
for (j = offset; j < len + offset; j++)
|
||||||
{
|
{
|
||||||
real_t buf_j = ((QMF_RE(buffer[j][bd])+(1<<(exp-1)))>>exp);
|
real_t buf_j = ((QMF_RE(buffer[j][bd])+(1<<(exp-1)))>>exp);
|
||||||
|
@ -292,10 +288,6 @@ static void auto_correlation(sbr_info *sbr, acorr_coef *ac, qmf_t buffer[MAX_NTS
|
||||||
}
|
}
|
||||||
|
|
||||||
exp = wl_min_lzc(mask);
|
exp = wl_min_lzc(mask);
|
||||||
|
|
||||||
/* improves accuracy */
|
|
||||||
if (exp > 0)
|
|
||||||
exp -= 1;
|
|
||||||
|
|
||||||
pow2_to_exp = 1<<(exp-1);
|
pow2_to_exp = 1<<(exp-1);
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue