1
0
Fork 0
forked from len0rd/rockbox

Extend av_log2 in codeclib into a generic bit-scanning function, bs_generic, which scans for set bits and can provide either log2 or leading-zero-count output, and which can force a 0 input to map to a 0 output if needed (otherwise a 0 input produces an undefined result). Replace av_log2 in lib/codeclib.h, floor_log2 and wl_min_lzc in libfaad/common.c and common.h, and count_leading_zeros in libalac/alac.c with macros using bs_generic.

git-svn-id: svn://svn.rockbox.org/rockbox/trunk@23903 a1c6a512-1295-4272-9138-f99709370657
This commit is contained in:
Andrew Mahone 2009-12-09 02:24:45 +00:00
parent 3683bb67db
commit 85aad9b397
6 changed files with 96 additions and 141 deletions

View file

@ -33,6 +33,15 @@ unsigned char* mp3buf; // The actual MP3 buffer from Rockbox
unsigned char* mallocbuf; // 512K from the start of MP3 buffer unsigned char* mallocbuf; // 512K from the start of MP3 buffer
unsigned char* filebuf; // The rest of the MP3 buffer unsigned char* filebuf; // The rest of the MP3 buffer
/* Non-inline entry point for bs_generic() in BS_LOG2 mode.  BS_0_0 is not
   requested, so the result for x == 0 is not guaranteed. */
unsigned bs_log2(unsigned x)
{
    const unsigned result = bs_generic(x, BS_LOG2);

    return result;
}
/* Non-inline entry point for bs_generic() in BS_LOG2 mode with BS_0_0 set,
   i.e. an input of 0 is mapped to an output of 0. */
unsigned bs_log2_0(unsigned x)
{
    const unsigned result = bs_generic(x, BS_LOG2|BS_0_0);

    return result;
}
/* Non-inline entry point for bs_generic() in BS_CLZ (count leading zeros)
   mode.  BS_0_0 is not requested, so the result for x == 0 is not
   guaranteed. */
unsigned bs_clz(unsigned x)
{
    const unsigned result = bs_generic(x, BS_CLZ);

    return result;
}
/* Non-inline entry point for bs_generic() in BS_CLZ (count leading zeros)
   mode with BS_0_0 set, i.e. an input of 0 is mapped to an output of 0. */
unsigned bs_clz_0(unsigned x)
{
    const unsigned result = bs_generic(x, BS_CLZ|BS_0_0);

    return result;
}
int codec_init(void) int codec_init(void)
{ {
mem_ptr = 0; mem_ptr = 0;
@ -139,7 +148,7 @@ void qsort(void *base, size_t nmemb, size_t size,
} }
/* From ffmpeg - libavutil/common.h */ /* From ffmpeg - libavutil/common.h */
const uint8_t ff_log2_tab[256] ICONST_ATTR = { const uint8_t bs_log2_tab[256] ICONST_ATTR = {
0,0,1,1,2,2,2,2,3,3,3,3,3,3,3,3,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4, 0,0,1,1,2,2,2,2,3,3,3,3,3,3,3,3,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,
5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5, 5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,
6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6, 6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,6,
@ -150,6 +159,17 @@ const uint8_t ff_log2_tab[256] ICONST_ATTR = {
7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7 7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7
}; };
/* Leading-zero lookup table: bs_clz_tab[i] is the number of leading zero
   bits in the 8-bit value i (8 for i == 0, 0 for i >= 128).  Indexed by
   bs_generic() with the most significant non-zero byte of its input when
   BS_CLZ is selected on the table-driven path. */
const uint8_t bs_clz_tab[256] ICONST_ATTR = {
8,7,6,6,5,5,5,5,4,4,4,4,4,4,4,4,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,
2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
};
#ifdef RB_PROFILE #ifdef RB_PROFILE
void __cyg_profile_func_enter(void *this_fn, void *call_site) { void __cyg_profile_func_enter(void *this_fn, void *call_site) {
#ifdef CPU_COLDFIRE #ifdef CPU_COLDFIRE

View file

@ -74,45 +74,80 @@ unsigned udiv32_arm(unsigned a, unsigned b);
#define UDIV32(a, b) (a / b) #define UDIV32(a, b) (a / b)
#endif #endif
#if !defined(CPU_ARM) || ARM_ARCH < 5
/* 256-entry byte lookup tables read by the table-driven branch of
   bs_generic().  They are not declared on ARMv5 and later, where
   bs_generic() uses __builtin_clz() instead.  bs_log2_tab is the table
   taken from libavutil/common.h. */
extern const uint8_t bs_log2_tab[256] ICONST_ATTR;
extern const uint8_t bs_clz_tab[256] ICONST_ATTR;
#endif
/* Mode flags for bs_generic(); combine them with bitwise OR.  BS_LOG2 is 0,
   so it is the mode in effect whenever BS_CLZ is not set.  BS_SHORT is only
   tested by the table-driven implementation. */
#define BS_LOG2 0 /* default personality, equivalent floor(log2(x)) */
#define BS_CLZ 1 /* alternate personality, Count Leading Zeros */
#define BS_SHORT 2 /* input guaranteed not to exceed 16 bits */
#define BS_0_0 4 /* guarantee mapping of 0 input to 0 output */
/* Generic bit-scanning function, used to wrap platform CLZ instruction or
   scan-and-lookup code, and to provide control over output for 0 inputs.

   v    - value to scan.
   mode - bitwise OR of BS_* flags:
            BS_LOG2   (default) return floor(log2(v));
            BS_CLZ    return the number of leading zero bits of v, taken as
                      a 32-bit value;
            BS_SHORT  caller guarantees v fits in 16 bits, which lets the
                      table-driven path skip the upper-half test (not
                      consulted on the CLZ-instruction path);
            BS_0_0    return 0 when v is 0.

   Without BS_0_0 the result for v == 0 is unspecified and differs between
   the two implementations below. */
static inline unsigned int bs_generic(unsigned int v, int mode)
{
    unsigned int r;

    /* __builtin_clz(0) has an undefined result, so the guaranteed 0 -> 0
       mapping is produced here instead of being derived from the builtin's
       return value.  The table-driven path already yielded 0 for this case,
       so its results are unchanged.  With a constant mode that lacks BS_0_0
       this test should fold away. */
    if ((mode & BS_0_0) && v == 0)
        return 0;

#if defined(CPU_ARM) && ARM_ARCH >= 5
    r = __builtin_clz(v);
    if (!(mode & BS_CLZ))
        r = 31 - r;
#else
    {
        const uint8_t *bs_tab;
        unsigned int n = v;
        int inc;

        /* Set up table, increment, and initial result value based on
           personality. */
        if (mode & BS_CLZ) {
            bs_tab = bs_clz_tab;
            r = 24;
            inc = -16;
        } else {
            bs_tab = bs_log2_tab;
            r = 0;
            inc = 16;
        }
        /* Narrow n down to its most significant non-zero byte, adjusting
           the running result by 16 and then 8 bit positions. */
        if (!(mode & BS_SHORT) && n >= 0x10000) {
            n >>= 16;
            r += inc;
        }
        if (n > 0xff) {
            n >>= 8;
            r += inc / 2;
        }
#ifdef CPU_COLDFIRE
        /* The high 24 bits of n are guaranteed empty after the above, so a
           superfluous ext.b instruction can be saved by loading the LUT
           value over n with asm */
        asm volatile (
            "move.b (%1,%0.l),%0"
            : "+d" (n)
            : "a" (bs_tab)
        );
#else
        n = bs_tab[n];
#endif
        r += n;
    }
#endif
    return r;
}
/* TODO figure out if we really need to care about calculating /* TODO figure out if we really need to care about calculating
av_log2(0) */ av_log2(0) */
#if defined(CPU_ARM) && ARM_ARCH >= 6 #define av_log2(v) bs_generic(v, BS_0_0)
/* av_log2 variant selected for ARM with ARM_ARCH >= 6: computes
   31 - clz(v) in inline assembly, then saturates the result to an unsigned
   5-bit range so that the -1 produced for v == 0 becomes 0.
   Returns the value left in r by that sequence. */
static inline unsigned int av_log2(uint32_t v)
{
unsigned int r;
asm volatile("clz %[r], %[v]\n\t" /* count leading zeroes */
"rsb %[r], %[r], #31\n\t" /* r = 31 - leading zeroes */
"usat %[r], #5, %[r]\n\t" /* unsigned saturate r so -1 -> 0 */
:[r] "=r" (r) : [v] "r" (v));
return(r);
}
#elif defined(CPU_ARM) && ARM_ARCH >= 5
/* av_log2 variant built on the compiler's count-leading-zeros builtin:
   returns 31 - clz(v) for non-zero v, and 0 for v == 0 (the builtin is
   never called with 0). */
static inline unsigned int av_log2(uint32_t v)
{
    if (v == 0)
        return 0;

    return 31 - __builtin_clz(v);
}
#else /* CPU_ARM */
/* From libavutil/common.h */
extern const uint8_t ff_log2_tab[256] ICONST_ATTR;
/* Table-driven av_log2: reduce v to its most significant non-zero byte,
   counting the bit positions skipped, then add the ff_log2_tab entry for
   that byte. */
static inline unsigned int av_log2(unsigned int v)
{
    int bits = 0;

    /* Anything in the upper half-word?  Then the answer is at least 16. */
    if ((v & 0xffff0000) != 0) {
        bits += 16;
        v >>= 16;
    }
    /* Anything in the upper byte of what remains?  Then add 8 more. */
    if ((v & 0xff00) != 0) {
        bits += 8;
        v >>= 8;
    }

    return bits + ff_log2_tab[v];
}
#endif
/* Various codec helper functions */ /* Various codec helper functions */

View file

@ -166,46 +166,7 @@ static inline void unreadbits(alac_file *alac, int bits)
alac->input_buffer_bitaccumulator *= -1; alac->input_buffer_bitaccumulator *= -1;
} }
/* ARMv5+ has a clz instruction equivalent to our function. #define count_leading_zeros(x) bs_generic(x, BS_CLZ|BS_SHORT)
*/
#if (defined(CPU_ARM) && (ARM_ARCH > 4))
/* Returns the number of leading zero bits in v, as reported by the
   compiler's count-leading-zeros builtin. */
static inline int count_leading_zeros(uint32_t v)
{
    const int zeros = __builtin_clz(v);

    return zeros;
}
#else
/* bittab[i] is the number of significant bits in the 4-bit value i
   (0 for i == 0, 4 for i >= 8).  Subtracted from the running count in the
   table-driven count_leading_zeros(). */
static const unsigned char bittab[16] ICONST_ATTR = {
0, 1, 2, 2, 3, 3, 3, 3, 4, 4, 4, 4, 4, 4, 4, 4
};
/* Table-driven leading-zero count.  Starts from 32 and subtracts the bit
   positions occupied by input: 8 if the second byte is non-zero, 4 if the
   upper nibble of the remaining byte is non-zero, and finally the bittab
   entry for the remaining nibble.

   The upper 16 bits are deliberately not examined: experimentation has
   shown that (input & 0xffff0000) is always false for the values passed
   in, so that test is not performed. */
static inline int count_leading_zeros(int input)
{
    int zeros = 32;

    if ((input & 0xff00) != 0) {
        zeros -= 8;
        input >>= 8;
    }
    if ((input & 0xf0) != 0) {
        zeros -= 4;
        input >>= 4;
    }

    return zeros - bittab[input];
}
#endif
void basterdised_rice_decompress(alac_file *alac, void basterdised_rice_decompress(alac_file *alac,
int32_t *output_buffer, int32_t *output_buffer,

View file

@ -241,58 +241,7 @@ uint32_t random_int(void)
return (__r1 = (t3 >> 1) | t1 ) ^ (__r2 = (t4 + t4) | t2 ); return (__r1 = (t3 >> 1) | t1 ) ^ (__r2 = (t4 + t4) | t2 );
} }
uint32_t ones32(uint32_t x) #define floor_log2(x) bs_generic(x, BS_LOG2)
{
x -= ((x >> 1) & 0x55555555);
x = (((x >> 2) & 0x33333333) + (x & 0x33333333));
x = (((x >> 4) + x) & 0x0f0f0f0f);
x += (x >> 8);
x += (x >> 16);
return (x & 0x0000003f);
}
/* Active branch: copy the highest set bit of x into every lower bit
   position, count the set bits with ones32(), and subtract one.  For
   x == 0 the count is 0, so the unsigned subtraction wraps around.
   The disabled branch counts right shifts until x becomes 0. */
uint32_t floor_log2(uint32_t x)
{
#if 1
    unsigned shift;

    /* Shift amounts 1, 2, 4, 8, 16 smear the top bit downwards. */
    for (shift = 1; shift <= 16; shift <<= 1)
        x |= x >> shift;

    return ones32(x) - 1;
#else
    uint32_t count = 0;

    for (x >>= 1; x != 0; x >>= 1)
        count++;

    return count;
#endif
}
/* Returns the position of the most significant set bit of x, counting
 * upwards from 1 at the least significant bit.  In the active branch an
 * input of 0 yields 0.  The bits below the top set bit are filled in first
 * so that ones32() can simply count them. */
uint32_t wl_min_lzc(uint32_t x)
{
#if 1
    unsigned shift;

    /* Shift amounts 1, 2, 4, 8, 16 smear the top bit downwards. */
    for (shift = 1; shift <= 16; shift <<= 1)
        x |= x >> shift;

    return ones32(x);
#else
    uint32_t count = 0;

    for (x >>= 1; x != 0; x >>= 1)
        count++;

    return count + 1;
#endif
}
#ifdef FIXED_POINT #ifdef FIXED_POINT

View file

@ -399,9 +399,7 @@ typedef real_t complex_t[2];
/* common functions */ /* common functions */
uint8_t cpu_has_sse(void); uint8_t cpu_has_sse(void);
uint32_t random_int(void); uint32_t random_int(void);
uint32_t ones32(uint32_t x); #define wl_min_lzc(x) bs_generic(x, BS_LOG2|BS_0_0)
uint32_t floor_log2(uint32_t x);
uint32_t wl_min_lzc(uint32_t x);
#ifdef FIXED_POINT #ifdef FIXED_POINT
#define LOG2_MIN_INF REAL_CONST(-10000) #define LOG2_MIN_INF REAL_CONST(-10000)
int32_t log2_int(uint32_t val); int32_t log2_int(uint32_t val);

View file

@ -222,10 +222,6 @@ static void auto_correlation(sbr_info *sbr, acorr_coef *ac,
exp = wl_min_lzc(mask); exp = wl_min_lzc(mask);
/* improves accuracy */
if (exp > 0)
exp -= 1;
for (j = offset; j < len + offset; j++) for (j = offset; j < len + offset; j++)
{ {
real_t buf_j = ((QMF_RE(buffer[j][bd])+(1<<(exp-1)))>>exp); real_t buf_j = ((QMF_RE(buffer[j][bd])+(1<<(exp-1)))>>exp);
@ -292,10 +288,6 @@ static void auto_correlation(sbr_info *sbr, acorr_coef *ac, qmf_t buffer[MAX_NTS
} }
exp = wl_min_lzc(mask); exp = wl_min_lzc(mask);
/* improves accuracy */
if (exp > 0)
exp -= 1;
pow2_to_exp = 1<<(exp-1); pow2_to_exp = 1<<(exp-1);