/*	$NetBSD: bzero.S,v 1.1 2005/12/20 19:28:50 christos Exp $	*/

/*
 * Copyright (c) 1992, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * This software was developed by the Computer Systems Engineering group
 * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
 * contributed to Berkeley.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 * from: Header: bzero.s,v 1.1 92/06/25 12:52:46 torek Exp
 */

#include <machine/asm.h>
#if defined(LIBC_SCCS) && !defined(lint)
#if 0
	.asciz "@(#)bzero.s 8.1 (Berkeley) 6/4/93"
#else
	RCSID("$NetBSD: bzero.S,v 1.1 2005/12/20 19:28:50 christos Exp $")
#endif
#endif  /* LIBC_SCCS and not lint */

/*
 * We should unroll the loop, but at the moment this would
 * gain nothing since the `std' instructions are what limits us.
 */

/*
 * This file builds memset() when MEMSET is defined and bzero() otherwise.
 * Each entry point only sets up the state below and then falls into the
 * code shared after the #endif:
 *
 *	%o0	 = addr
 *	%o1	 = len
 *	%o2:%o3	 = 64-bit fill value (pattern byte replicated; 0 for bzero)
 *
 * %o5 is used as scratch.  The memset build additionally keeps the
 * original addr in %g1; the slow path advances %o0 and reloads it from
 * %g1 on return, while the two short paths never modify %o0, so memset
 * returns addr on every path.
 *
 * len is tested with signed branches (bge), so a length with the top
 * bit set is treated as negative and nothing is stored.
 *
 * Instructions indented by one extra space sit in a branch delay slot.
 * With a plain branch the slot always executes; with the annul form
 * (",a") of a conditional branch it executes only if the branch is taken.
 */

#ifdef MEMSET
/*
 * void *
 * memset(void *addr, int pattern, size_t len)
 */
ENTRY(memset)
	! %o0 = addr, %o1 = pattern, %o2 = len
	/*
	 * Expand the byte pattern to fill 64 bits in an even-aligned
	 * register pair; shuffle arguments to match those of bzero.
	 */
	and	%o1, 0xff, %o3
	mov	%o2, %o1		! shuffle argument
	sll	%o3, 8, %o2
	or	%o2, %o3, %o2		! %o2 = pattern in low 16 bits
	mov	%o0, %g1		! save original pointer
	sll	%o2, 16, %o3
	or	%o2, %o3, %o2		! %o2 = pattern in all 32 bits
	! Optimize a common case: addr and len are both multiples of 8.
	or	%o0, %o1, %o5
	btst	7, %o5			! ((addr | len) & 7) != 0?
	bnz	1f			! if so, cannot optimize
	 mov	%o2, %o3		! in any case, complete pat expansion
#else
/*
 * void
 * bzero(void *addr, size_t len)
 */
ENTRY(bzero)
	! %o0 = addr, %o1 = len

	clr	%o2
	! Optimize a common case: addr and len are both multiples of 8.
	or	%o0, %o1, %o5
	btst	7, %o5			! ((addr | len) & 7) != 0?
	bnz	1f			! if so, cannot optimize
	 clr	%o3			! in any case, we want o3=0
#endif

	/*
	 * `Good' operands, can just store doubles.
	 * The buffer is filled from the end towards the start, indexing
	 * with len, so %o0 is left untouched.
	 */
0:
	deccc	8, %o1			! while ((len -= 8) >= 0)
	bge,a	0b
	 std	%o2, [%o0 + %o1]	!	*(quad *)(addr + len) = 0;
	retl
	 nop

	/*
	 * Either the address is unaligned, or the count is not a
	 * multiple of 8, or both.  We will have to align the address
	 * in order to use anything `better' than stb.
	 */
1:
	cmp	%o1, 15			! len >= 15?
	bge,a	Lstd			! yes, use std
	 btst	1, %o0			! (but first check alignment)

	! not enough to bother: do byte-at-a-time loop.
	! This also fills from the end, leaving %o0 untouched.
2:
	deccc	%o1			! while (--len >= 0)
	bge,a	2b
	 stb	%o2, [%o0 + %o1]	!	addr[len] = 0;
	retl
	 nop

Lstd:
	/*
	 * There are at least 15 bytes to zero.
	 * We may have to zero some initial stuff to align
	 * the address.
	 * Each step below enters with the condition codes already set
	 * by the btst for its own alignment bit, and sets them for the
	 * next step on both the taken and the fall-through path.
	 */
	bz,a	1f			! if (addr & 1) {
	 btst	2, %o0
	stb	%o2, [%o0]		!	*addr = 0;
	inc	%o0			!	addr++;
	dec	%o1			!	len--;
	btst	2, %o0			! }
1:
	bz,a	1f			! if (addr & 2) {
	 btst	4, %o0
	sth	%o2, [%o0]		!	*(short *)addr = 0;
	inc	2, %o0			!	addr += 2;
	dec	2, %o1			!	len -= 2;
	btst	4, %o0			! }
1:
	bz	1f			! if (addr & 4) {
	 dec	8, %o1			! (always executed: bias len by -8)
	st	%o2, [%o0]		!	*(int *)addr = 0;
	inc	4, %o0			!	addr += 4;
	dec	4, %o1			!	len -= 4;
					! }
	/*
	 * Address is double word aligned; len is 8 less than
	 * the number of bytes remaining (i.e., len is 0 if
	 * the remaining count is 8, 1 if it is 9, etc.).
	 */
1:
	std	%o2, [%o0]		! do {
2:					!	*(quad *)addr = 0;
	inc	8, %o0			!	addr += 8;
	deccc	8, %o1			! } while ((len -= 8) >= 0);
	bge,a	2b
	 std	%o2, [%o0]

	/*
	 * Len is in [-8..-1] where -8 => done, -7 => 1 byte to zero,
	 * -6 => two bytes, etc.  Mop up this remainder, if any.
	 * The low three bits of len equal the number of bytes left.
	 * Each btst in a delay slot sets the condition codes for the
	 * following step; the stores in between do not change them.
	 */
	btst	4, %o1
	bz	1f			! if (len & 4) {
	 btst	2, %o1
	st	%o2, [%o0]		!	*(int *)addr = 0;
	inc	4, %o0			!	addr += 4;
1:
	bz	1f			! if (len & 2) {
	 btst	1, %o1
	sth	%o2, [%o0]		!	*(short *)addr = 0;
	inc	2, %o0			!	addr += 2;
1:
	bnz,a	1f			! if (len & 1)
	 stb	%o2, [%o0]		!	*addr = 0;
1:
	retl
#ifdef MEMSET
	 mov	%g1, %o0		! restore original pointer
#else
	 nop
#endif