1
0
Fork 0
forked from len0rd/rockbox

Submit next part of FS#11498. Unroll loop for minor speedup of libwmapro on ARM (1%).

git-svn-id: svn://svn.rockbox.org/rockbox/trunk@27595 a1c6a512-1295-4272-9138-f99709370657
This commit is contained in:
Andree Buschmann 2010-07-28 18:15:53 +00:00
parent f0aac62dd5
commit 8cc8bb9bde

View file

@ -218,13 +218,13 @@ static inline void vector_fixmul_window(int32_t *dst, const int32_t *src0,
dst += len; dst += len;
win += len; win += len;
src0+= len; src0+= len;
for(i=-len, j=len-1; i<0; i++, j--) { for(i=-len, j=len-1; i<0; i++, j--) {
int32_t s0 = src0[i]; int32_t s0 = src0[i]; /* s0 = src0[ 0 ... len-1] */
int32_t s1 = src1[j]; int32_t s1 = src1[j]; /* s1 = src1[2*len-1 ... len] */
int32_t wi = -win[i]; int32_t wi = -win[i]; /* wi = -win[ 0 ... len-1] */
int32_t wj = -win[j]; int32_t wj = -win[j]; /* wj = -win[2*len-1 ... len] */
dst[i] = fixmul31(s0, wj) - fixmul31(s1, wi); dst[i] = fixmul31(s0, wj) - fixmul31(s1, wi); /* dst[ 0 ... len-1] */
dst[j] = fixmul31(s0, wi) + fixmul31(s1, wj); dst[j] = fixmul31(s0, wi) + fixmul31(s1, wj); /* dst[2*len-1 ... len] */
} }
} }
#endif #endif
@ -232,9 +232,15 @@ static inline void vector_fixmul_window(int32_t *dst, const int32_t *src0,
static inline void vector_fixmul_scalar(int32_t *dst, const int32_t *src, static inline void vector_fixmul_scalar(int32_t *dst, const int32_t *src,
int32_t mul, int len) int32_t mul, int len)
{ {
/* len is _always_ a multiple of 4, because len is the difference of sfb's
* which themselves are always a multiple of 4. */
int i; int i;
for(i=0; i<len; i++) for (i=0; i<len; i+=4) {
dst[i] = fixmul24(src[i], mul); dst[i ] = fixmul24(src[i ], mul);
dst[i+1] = fixmul24(src[i+1], mul);
dst[i+2] = fixmul24(src[i+2], mul);
dst[i+3] = fixmul24(src[i+3], mul);
}
} }
static inline int av_clip(int a, int amin, int amax) static inline int av_clip(int a, int amin, int amax)