/* xref: /minix3/common/lib/libc/arch/sparc/string/bzero.S (revision b6cbf7203b080219de306404f8022a65b7884f33) */
/*	$NetBSD: bzero.S,v 1.1 2005/12/20 19:28:50 christos Exp $	*/

/*
 * Copyright (c) 1992, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * This software was developed by the Computer Systems Engineering group
 * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
 * contributed to Berkeley.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * from: Header: bzero.s,v 1.1 92/06/25 12:52:46 torek Exp
 */

/*
 * ENTRY() and RCSID() used in this file are expected to come from
 * <machine/asm.h>.  The identification string below is only emitted
 * when LIBC_SCCS is defined and lint is not; the old Berkeley SCCS
 * string is kept for reference but permanently compiled out.
 */
#include <machine/asm.h>
#if defined(LIBC_SCCS) && !defined(lint)
#if 0
	.asciz "@(#)bzero.s	8.1 (Berkeley) 6/4/93"
#else
	RCSID("$NetBSD: bzero.S,v 1.1 2005/12/20 19:28:50 christos Exp $")
#endif
#endif  /* LIBC_SCCS and not lint */

/*
 * We should unroll the loop, but at the moment this would
 * gain nothing since the `std' instructions are what limit us.
 */

#ifdef MEMSET
/*
 * void *
 * memset(void *addr, int pattern, size_t len)
 *
 * Store the low byte of pattern into len consecutive bytes starting
 * at addr, and return addr.
 *
 *	In:	%o0 = addr, %o1 = pattern, %o2 = len
 *	Out:	%o0 = addr as passed in
 *	Uses:	%o1 = len (after the argument shuffle),
 *		%o2:%o3 = fill value replicated into all 8 bytes,
 *		%o5 = scratch, %g1 = saved addr, integer condition codes
 *
 * The body below contains no save/restore and returns with retl.
 *
 * NOTE(review): every length test in this routine is a signed branch
 * (bge), so a len with its top bit set is treated as negative and
 * nothing is stored.  Confirm that no caller depends on such lengths.
 */
ENTRY(memset)
	! %o0 = addr, %o1 = pattern, %o2 = len
	/*
	 * Expand the byte pattern to fill 64 bits in an even-aligned
	 * register pair; shuffle arguments to match those of bzero.
	 */
	and	%o1, 0xff, %o3		! o3 = pattern & 0xff
	mov	%o2, %o1		! shuffle argument: o1 = len
	sll	%o3, 8, %o2
	or	%o2, %o3, %o2		! o2 = byte replicated twice
	mov	%o0, %g1		! save original pointer
	sll	%o2, 16, %o3
	or	%o2, %o3, %o2		! o2 = byte replicated four times
	! Optimize a common case: addr and len are both multiples of 8.
	or	%o0, %o1, %o5
	btst	7, %o5			! ((addr | len) & 7) != 0?
	bnz	1f			! if so, cannot optimize
	 mov	%o2, %o3		! in any case, complete pat expansion
#else
/*
 * void
 * bzero(void *addr, size_t len)
 *
 * Store zero into len consecutive bytes starting at addr.
 *
 *	In:	%o0 = addr, %o1 = len
 *	Uses:	%o2:%o3 = zero register pair, %o5 = scratch,
 *		integer condition codes; %o0 is advanced on the
 *		long (Lstd) path
 *
 * The body below contains no save/restore and returns with retl.
 *
 * NOTE(review): every length test in this routine is a signed branch
 * (bge), so a len with its top bit set is treated as negative and
 * nothing is stored.  Confirm that no caller depends on such lengths.
 */
ENTRY(bzero)
	! %o0 = addr, %o1 = len

	clr	%o2
	! Optimize a common case: addr and len are both multiples of 8.
	or	%o0, %o1, %o5
	btst	7, %o5			! ((addr | len) & 7) != 0?
	bnz	1f			! if so, cannot optimize
	 clr	%o3			! in any case, we want o3=0
#endif

	/*
	 * `Good' operands, can just store doubles.
	 *
	 * The stores are indexed by [%o0 + %o1] and walk from the end of
	 * the buffer back toward addr, so %o0 is never modified here and
	 * still holds the value memset has to return.  The branch is
	 * annulled: the std in its delay slot executes only while the
	 * branch is taken.
	 */
0:
	deccc	8, %o1			! while ((len -= 8) >= 0)
	bge,a	0b
	 std	%o2, [%o0 + %o1]	!	*(quad *)(addr + len) = 0;
	retl
	 nop

	/*
	 * Either the address is unaligned, or the count is not a
	 * multiple of 8, or both.  We will have to align the address
	 * in order to use anything `better' than stb.
	 */
1:
	cmp	%o1, 15			! len >= 15?
	bge,a	Lstd			! yes, use std
	 btst	1, %o0			! (but first check alignment)

	/*
	 * Not enough to bother: do byte-at-a-time loop.  As in the
	 * doubleword loop above, the store is indexed and %o0 is left
	 * untouched.
	 */
2:
	deccc	%o1			! while (--len >= 0)
	bge,a	2b
	 stb	%o2, [%o0 + %o1]	!	addr[len] = 0;
	retl
	 nop

Lstd:
	/*
	 * There are at least 15 bytes to zero.
	 * We may have to zero some initial stuff to align
	 * the address.
	 *
	 * On entry the condition codes hold the result of the
	 * `btst 1, %o0' executed in the delay slot of the branch that
	 * got us here.  Each step below tests the next alignment bit
	 * either in the (annulled) delay slot of its branch or at the
	 * end of its fall-through code, so the following branch sees
	 * the right flags on both paths.  At most 1 + 2 + 4 = 7 bytes
	 * are consumed here, so at least 8 remain for the first std.
	 */
	bz,a	1f			! if (addr & 1) {
	 btst	2, %o0
	stb	%o2, [%o0]		!	*addr = 0;
	inc	%o0			!	addr++;
	dec	%o1			!	len--;
	btst	2, %o0			! }
1:
	bz,a	1f			! if (addr & 2) {
	 btst	4, %o0
	sth	%o2, [%o0]		!	*(short *)addr = 0;
	inc	2, %o0			!	addr += 2;
	dec	2, %o1			!	len -= 2;
	btst	4, %o0			! }
1:
	bz	1f			! if (addr & 4) {
	 dec	8, %o1			! (not annulled: always bias len by -8)
	st	%o2, [%o0]		!	*(int *)addr = 0;
	inc	4, %o0			!	addr += 4;
	dec	4, %o1			!	len -= 4;
					! }
	/*
	 * Address is double word aligned; len is 8 less than
	 * the number of bytes remaining (i.e., len is 0 if
	 * the remaining count is 8, 1 if it is 9, etc.).
	 *
	 * The std in the delay slot of the annulled branch is the
	 * store for the next iteration; it is skipped when the loop
	 * exits.
	 */
1:
	std	%o2, [%o0]		! do {
2:					!	*(quad *)addr = 0;
	inc	8, %o0			!	addr += 8;
	deccc	8, %o1			! } while ((len -= 8) >= 0);
	bge,a	2b
	 std	%o2, [%o0]

	/*
	 * Len is in [-8..-1] where -8 => done, -7 => 1 byte to zero,
	 * -6 => two bytes, etc.  Mop up this remainder, if any.
	 *
	 * The low three bits of len give the remaining byte count.
	 * Each test for the next bit sits in a non-annulled delay slot,
	 * and the inc between test and branch does not touch the
	 * condition codes.
	 */
	btst	4, %o1
	bz	1f			! if (len & 4) {
	 btst	2, %o1
	st	%o2, [%o0]		!	*(int *)addr = 0;
	inc	4, %o0			!	addr += 4;
1:
	bz	1f			! if (len & 2) {
	 btst	1, %o1
	sth	%o2, [%o0]		!	*(short *)addr = 0;
	inc	2, %o0			!	addr += 2;
1:
	bnz,a	1f			! if (len & 1)
	 stb	%o2, [%o0]		!	*addr = 0;
1:
	retl
#ifdef MEMSET
	 mov	%g1, %o0		! restore original pointer
#else
	 nop
#endif