forked from len0rd/rockbox
		
	swr/swl instructions used for word aligning were wrong. This made memset() terribly broken. I can't imagine how it went uncaught for soooo long. Spotted by Solomon Peachy. I run unit tests for alignments 0,1,2,3 size 1, 2, 3, 4, 5, 63, 64, 65, 127, 128, 129; and fill pattern 0x00 and other (since 0 is special case in this implementation). Change-Id: I513a10734335fe97734c10ab5a6c3e3fb3f4687a
		
			
				
	
	
		
			130 lines
		
	
	
	
		
			3.9 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
			
		
		
	
	
			130 lines
		
	
	
	
		
			3.9 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
| /***************************************************************************
 | |
|  *             __________               __   ___.
 | |
|  *   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
 | |
|  *   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
 | |
|  *   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
 | |
|  *   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
 | |
|  *                     \/            \/     \/    \/            \/
 | |
|  * $Id$
 | |
|  *
 | |
|  * This file was originally part of the Linux/MIPS GNU C Library
 | |
|  * Copyright (C) 1998 by Ralf Baechle
 | |
|  * Adapted for Rockbox by Maurus Cuelenaere, 2009
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or
 | |
|  * modify it under the terms of the GNU General Public License
 | |
|  * as published by the Free Software Foundation; either version 2
 | |
|  * of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
 | |
|  * KIND, either express or implied.
 | |
|  *
 | |
|  ****************************************************************************/
 | |
| 
 | |
| #include "config.h"
 | |
| #include "mips.h"
 | |
| 
 | |
| #define FILL64(dst, offset, val)      \
 | |
|     sw  val, (offset + 0x00)(dst);    \
 | |
|     sw  val, (offset + 0x04)(dst);    \
 | |
|     sw  val, (offset + 0x08)(dst);    \
 | |
|     sw  val, (offset + 0x0c)(dst);    \
 | |
|     sw  val, (offset + 0x10)(dst);    \
 | |
|     sw  val, (offset + 0x14)(dst);    \
 | |
|     sw  val, (offset + 0x18)(dst);    \
 | |
|     sw  val, (offset + 0x1c)(dst);    \
 | |
|     sw  val, (offset + 0x20)(dst);    \
 | |
|     sw  val, (offset + 0x24)(dst);    \
 | |
|     sw  val, (offset + 0x28)(dst);    \
 | |
|     sw  val, (offset + 0x2c)(dst);    \
 | |
|     sw  val, (offset + 0x30)(dst);    \
 | |
|     sw  val, (offset + 0x34)(dst);    \
 | |
|     sw  val, (offset + 0x38)(dst);    \
 | |
|     sw  val, (offset + 0x3c)(dst);
 | |
| 
 | |
| #define FILL    64
 | |
| #define F_FILL  FILL64
 | |
| 
 | |
| #ifdef ROCKBOX_BIG_ENDIAN
 | |
| # define SWHI   swl                /* high part is left in big-endian        */
 | |
| # define SWLO   swr
 | |
| #else
 | |
| # define SWHI   swr                /* high part is right in little-endian    */
 | |
| # define SWLO   swl
 | |
| #endif
 | |
| 
 | |
| /*
 | |
|  * memset(void *s, int c, size_t n)
 | |
|  *
 | |
|  * a0: start of area to clear
 | |
|  * a1: char to fill with
 | |
|  * a2: size of area to clear
 | |
|  */
 | |
|     .section   .icode, "ax", %progbits
 | |
| 
 | |
|     .global    memset
 | |
|     .type      memset, %function
 | |
|     
 | |
|     .set       noreorder
 | |
|     .align     5
 | |
| memset:
 | |
|     beqz    a1, 1f
 | |
|     move    v0, a0                /* result */
 | |
| 
 | |
|     andi    a1, 0xff              /* spread fillword */
 | |
|     sll     t1, a1, 8
 | |
|     or      a1, t1
 | |
|     sll     t1, a1, 16
 | |
|     or      a1, t1
 | |
| 1:
 | |
| 
 | |
|     sltiu   t0, a2, 4             /* very small region? */
 | |
|     bnez    t0, small_memset
 | |
|     andi    t0, a0, 3             /* aligned? */
 | |
| 
 | |
|     beqz    t0, 1f
 | |
|     subu    t0, 4                 /* alignment in bytes */
 | |
| 
 | |
|     SWHI    a1, (a0)              /* make word aligned */
 | |
|     subu    a0, t0                /* word align ptr */
 | |
|     addu    a2, t0                /* correct size */
 | |
| 
 | |
| 1:  ori     t1, a2, (FILL-1)      /* # of full blocks */
 | |
|     xori    t1, (FILL-1)
 | |
|     beqz    t1, memset_partial    /* no block to fill */
 | |
|     andi    t0, a2, (FILL-4)
 | |
| 
 | |
|     addu    t1, a0                /* end address */
 | |
|     .set    reorder
 | |
| 1:  addiu   a0, FILL
 | |
|     F_FILL( a0, -FILL, a1 )
 | |
|     bne     t1, a0, 1b
 | |
|     .set    noreorder
 | |
| 
 | |
| memset_partial:
 | |
|     la      t1, 2f                /* where to start */
 | |
|     subu    t1, t0
 | |
|     jr      t1
 | |
|     addu    a0, t0                /* dest ptr */
 | |
| 
 | |
|     F_FILL( a0, -FILL, a1 )       /* ... but first do words ... */
 | |
| 2:  andi    a2, 3                 /* 0 <= n <= 3 to go */
 | |
| 
 | |
|     beqz    a2, 1f
 | |
|     addu    a0, a2                /* What's left */
 | |
|     SWLO    a1, -1(a0)
 | |
| 1:  jr      ra
 | |
|     move    a2, zero
 | |
| 
 | |
| small_memset:
 | |
|     beqz    a2, 2f
 | |
|     addu    t1, a0, a2
 | |
| 
 | |
| 1:  addiu   a0, 1                 /* fill bytewise */
 | |
|     bne     t1, a0, 1b
 | |
|     sb      a1, -1(a0)
 | |
| 
 | |
| 2:  jr      ra                    /* done */
 | |
|     move    a2, zero
 | |
| 
 | |
|     .set       reorder
 |