/* linux/arch/arm/lib/memset.S */

/*
 *  linux/arch/arm/lib/memset.S
 *
 *  Copyright (C) 1995-2000 Russell King
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 *  ASM optimised string functions
 */
#include <linux/linkage.h>
#include <asm/assembler.h>

	.text
	.align	5

/*
 * void *memset(void *s, int c, size_t n)
 *
 * In:   r0 = s   destination pointer (any alignment)
 *       r1 = c   fill value; only the low 8 bits are used
 *       r2 = n   number of bytes to set
 * Out:  r0 = s   returned unmodified, as the C memset() contract requires
 *
 * Scratch: r1, r2, r3, ip and the flags are modified.  r8/lr (and r4-r7
 * in the cache-line variant) are used as extra fill registers, but they
 * are saved on the stack and restored before returning.
 *
 * r0 must not be used as the running store pointer: callers - and the
 * compiler - are entitled to assume that memset() hands back its first
 * argument in r0.  All stores therefore go through ip.
 */
ENTRY(memset)
	and	r1, r1, #255		@ cast c to unsigned char
	ands	r3, r0, #3		@ 1 unaligned?
	mov	ip, r0			@ ip walks the buffer, r0 is preserved
	bne	6f			@ 1 fix up alignment out of line
/*
 * we know that the pointer in ip is aligned to a word boundary.
 * Replicate the fill byte into all four byte lanes of r1 and r3.
 */
1:	orr	r1, r1, r1, lsl #8
	orr	r1, r1, r1, lsl #16
	mov	r3, r1
	cmp	r2, #16
	blt	4f			@ fewer than 16 bytes: go to the tail

#if ! CALGN(1)+0

/*
 * We need 2 extra registers for this loop - use r8 and the LR.  Both
 * are saved here and restored before leaving this section.
 */
	stmfd	sp!, {r8, lr}
	mov	r8, r1
	mov	lr, r1

2:	subs	r2, r2, #64
	stmgeia	ip!, {r1, r3, r8, lr}	@ 64 bytes at a time.
	stmgeia	ip!, {r1, r3, r8, lr}
	stmgeia	ip!, {r1, r3, r8, lr}
	stmgeia	ip!, {r1, r3, r8, lr}
	bgt	2b
	ldmeqfd	sp!, {r8, pc}		@ Now <64 bytes to go.
/*
 * No need to correct the count; we're only testing bits from now on
 * (subtracting 64 leaves the low six bits of r2 unchanged).
 */
	tst	r2, #32
	stmneia	ip!, {r1, r3, r8, lr}
	stmneia	ip!, {r1, r3, r8, lr}
	tst	r2, #16
	stmneia	ip!, {r1, r3, r8, lr}
	ldmfd	sp!, {r8, lr}

#else

/*
 * This version aligns the destination pointer in order to write
 * whole cache lines at once.
 */

	stmfd	sp!, {r4-r8, lr}
	mov	r4, r1
	mov	r5, r1
	mov	r6, r1
	mov	r7, r1
	mov	r8, r1
	mov	lr, r1

	cmp	r2, #96			@ only worth aligning for > 96 bytes
	tstgt	ip, #31			@ ... and if not already 32-byte aligned
	ble	3f

	and	r8, ip, #31
	rsb	r8, r8, #32		@ r8 = bytes up to the next 32-byte boundary
	sub	r2, r2, r8
	movs	r8, r8, lsl #(32 - 4)	@ C = bit 4 (16 bytes), N = bit 3 (8 bytes)
	stmcsia	ip!, {r4, r5, r6, r7}
	stmmiia	ip!, {r4, r5}
	tst	r8, #(1 << 30)		@ bit 2 (4 bytes) now sits in bit 30
	mov	r8, r1			@ r8 becomes a fill register again
	strne	r1, [ip], #4

3:	subs	r2, r2, #64
	stmgeia	ip!, {r1, r3-r8, lr}	@ 2 x 32 bytes per iteration
	stmgeia	ip!, {r1, r3-r8, lr}
	bgt	3b
	ldmeqfd	sp!, {r4-r8, pc}	@ exactly done: restore and return

	tst	r2, #32
	stmneia	ip!, {r1, r3-r8, lr}
	tst	r2, #16
	stmneia	ip!, {r4-r7}
	ldmfd	sp!, {r4-r8, lr}

#endif

4:	tst	r2, #8
	stmneia	ip!, {r1, r3}
	tst	r2, #4
	strne	r1, [ip], #4
/*
 * When we get here, we've got less than 4 bytes to set.  We
 * may have an unaligned pointer as well.
 */
5:	tst	r2, #2
	strneb	r1, [ip], #1
	strneb	r1, [ip], #1
	tst	r2, #1
	strneb	r1, [ip], #1
	mov	pc, lr

/*
 * Unaligned destination: r3 = ip & 3 (1..3).  Store 4 - r3 bytes to
 * reach a word boundary, adjust the count and rejoin the aligned path.
 * If fewer than 4 bytes were requested, go straight to the byte tail;
 * the low two bits of r2 are unaffected by the subtraction of 4.
 */
6:	subs	r2, r2, #4		@ 1 do we have enough
	blt	5b			@ 1 bytes to align with?
	cmp	r3, #2			@ 1
	strltb	r1, [ip], #1		@ 1
	strleb	r1, [ip], #1		@ 1
	strb	r1, [ip], #1		@ 1
	add	r2, r2, r3		@ 1 (r2 = r2 - (4 - r3))
	b	1b			@ pointer aligned, length adjusted
ENDPROC(memset)
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 00:20:36 +02:00			`/*`
			`* linux/arch/arm/lib/memset.S`
			`*`
			`* Copyright (C) 1995-2000 Russell King`
			`*`
			`* This program is free software; you can redistribute it and/or modify`
			`* it under the terms of the GNU General Public License version 2 as`
			`* published by the Free Software Foundation.`
			`*`
			`* ASM optimised string functions`
			`*/`
			`#include <linux/linkage.h>`
			`#include <asm/assembler.h>`

			`.text`
			`.align 5`
			`.word 0`

			`1: subs r2, r2, #4 @ 1 do we have enough`
			`blt 5f @ 1 bytes to align with?`
			`cmp r3, #2 @ 1`
			`strltb r1, [r0], #1 @ 1`
			`strleb r1, [r0], #1 @ 1`
			`strb r1, [r0], #1 @ 1`
			`add r2, r2, r3 @ 1 (r2 = r2 - (4 - r3))`
			`/*`
			`* The pointer is now aligned and the length is adjusted. Try doing the`
[ARM] remove memzero() As suggested by Andrew Morton, remove memzero() - it's not supported on other architectures so use of it is a potential build breaking bug. Since the compiler optimizes memset(x,0,n) to __memzero() perfectly well, we don't miss out on the underlying benefits of memzero(). Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk> 2008-10-27 12:24:09 +01:00			`* memset again.`
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 00:20:36 +02:00			`*/`

			`ENTRY(memset)`
			`ands r3, r0, #3 @ 1 unaligned?`
			`bne 1b @ 1`
			`/*`
			`* we know that the pointer in r0 is aligned to a word boundary.`
			`*/`
			`orr r1, r1, r1, lsl #8`
			`orr r1, r1, r1, lsl #16`
			`mov r3, r1`
			`cmp r2, #16`
			`blt 4f`
[ARM] cache align memset and memzero This is a natural extension following the previous patch. Non Feroceon based targets are unchanged. Signed-off-by: Nicolas Pitre <nico@marvell.com> Signed-off-by: Lennert Buytenhek <buytenh@marvell.com> 2008-04-12 03:04:28 +02:00
			`#if ! CALGN(1)+0`

Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 00:20:36 +02:00			`/*`
			`* We need an extra register for this loop - save the return address and`
			`* use the LR`
			`*/`
			`str lr, [sp, #-4]!`
			`mov ip, r1`
			`mov lr, r1`

			`2: subs r2, r2, #64`
			`stmgeia r0!, {r1, r3, ip, lr} @ 64 bytes at a time.`
			`stmgeia r0!, {r1, r3, ip, lr}`
			`stmgeia r0!, {r1, r3, ip, lr}`
			`stmgeia r0!, {r1, r3, ip, lr}`
			`bgt 2b`
[ARM] Remove LOADREGS macro As for RETINSTR, LOADREGS is a left-over from the 26-bit days. Remove it. Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk> 2006-06-25 12:23:45 +02:00			`ldmeqfd sp!, {pc} @ Now <64 bytes to go.`
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 00:20:36 +02:00			`/*`
			`* No need to correct the count; we're only testing bits from now on`
			`*/`
			`tst r2, #32`
			`stmneia r0!, {r1, r3, ip, lr}`
			`stmneia r0!, {r1, r3, ip, lr}`
			`tst r2, #16`
			`stmneia r0!, {r1, r3, ip, lr}`
			`ldr lr, [sp], #4`

[ARM] cache align memset and memzero This is a natural extension following the previous patch. Non Feroceon based targets are unchanged. Signed-off-by: Nicolas Pitre <nico@marvell.com> Signed-off-by: Lennert Buytenhek <buytenh@marvell.com> 2008-04-12 03:04:28 +02:00			`#else`

			`/*`
			`* This version aligns the destination pointer in order to write`
			`* whole cache lines at once.`
			`*/`

			`stmfd sp!, {r4-r7, lr}`
			`mov r4, r1`
			`mov r5, r1`
			`mov r6, r1`
			`mov r7, r1`
			`mov ip, r1`
			`mov lr, r1`

			`cmp r2, #96`
			`tstgt r0, #31`
			`ble 3f`

			`and ip, r0, #31`
			`rsb ip, ip, #32`
			`sub r2, r2, ip`
			`movs ip, ip, lsl #(32 - 4)`
			`stmcsia r0!, {r4, r5, r6, r7}`
			`stmmiia r0!, {r4, r5}`
			`tst ip, #(1 << 30)`
			`mov ip, r1`
			`strne r1, [r0], #4`

			`3: subs r2, r2, #64`
			`stmgeia r0!, {r1, r3-r7, ip, lr}`
			`stmgeia r0!, {r1, r3-r7, ip, lr}`
			`bgt 3b`
			`ldmeqfd sp!, {r4-r7, pc}`

			`tst r2, #32`
			`stmneia r0!, {r1, r3-r7, ip, lr}`
			`tst r2, #16`
			`stmneia r0!, {r4-r7}`
			`ldmfd sp!, {r4-r7, lr}`

			`#endif`

Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 00:20:36 +02:00			`4: tst r2, #8`
			`stmneia r0!, {r1, r3}`
			`tst r2, #4`
			`strne r1, [r0], #4`
			`/*`
			`* When we get here, we've got less than 4 bytes to zero. We`
			`* may have an unaligned pointer as well.`
			`*/`
			`5: tst r2, #2`
			`strneb r1, [r0], #1`
			`strneb r1, [r0], #1`
			`tst r2, #1`
			`strneb r1, [r0], #1`
[ARM] Remove RETINSTR macro RETINSTR is a left-over from the days when we had 26-bit and 32-bit CPU support integrated into the same tree. Since this is no longer the case, we can now remove RETINSTR. Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk> 2006-06-25 12:17:23 +02:00			`mov pc, lr`
[ARM] 5227/1: Add the ENDPROC declarations to the .S files This declaration specifies the "function" type and size for various assembly functions, mainly needed for generating the correct branch instructions in Thumb-2. Signed-off-by: Catalin Marinas <catalin.marinas@arm.com> Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk> 2008-08-28 12:22:32 +02:00			`ENDPROC(memset)`