/*	$NetBSD: bzero.S,v 1.4 2008/04/28 20:22:57 martin Exp $ */

/*-
 * Copyright (c) 2006 The NetBSD Foundation, Inc.
 * All rights reserved.
 *
 * This code is derived from software contributed to The NetBSD Foundation
 * by Ross Harvey.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#include <machine/asm.h>

/*
 * bzero / memset for 64-bit PowerPC.
 *
 * bzero entry:   r3 = destination, r4 = length.
 *                Rewrites its arguments into the memset layout and
 *                falls through into memset.
 * memset entry:  r3 = destination, r4 = fill value (only the low 8 bits
 *                are used), r5 = length in bytes.
 *
 * r3 is never written, so the destination pointer is still in r3 on
 * return.
 *
 * Registers written: r0, r4, r5, r9, r10, r11, CTR, CR0, CR7.
 *
 * Strategy:
 *   - length <= 7, or destination not 8-byte aligned: the whole buffer
 *     is filled one byte at a time.
 *   - otherwise: the fill byte is replicated into all 8 bytes of r0,
 *     then stored 32 bytes per iteration, then 8 bytes per iteration,
 *     and any remaining 1..7 bytes go through the byte loop.
 */

        .file   "bzero.c"
ENTRY(bzero)
        mr      5, 4            # translate to memset signature: r5 = length
        li      4, 0            # add missing memset param: fill value 0
ENTRY(memset)
        cmpldi  7, 5, 7         # only optimize if len >= 8 (unsigned compare)
        mr      9, 3            # r9 = byte-store cursor
        ble     7, .Lmemset_bytes_check
        rldicl. 0, 3, 0, 61     # r0 = dst & 7; only optimize if aligned
        beq     0, .Lmemset_dwords
.Lmemset_bytes_check:
        cmpdi   7, 5, 0
        beqlr   7               # nothing to do for len == 0
.Lmemset_bytes_setup:
        mtctr   5               # CTR = number of bytes to store
        rldicl  0, 4, 0, 56     # r0 = fill value & 0xff
        .p2align 4,, 15
.Lmemset_bytes_loop:
        stb     0, 0(9)         # byte-at-a-time loop
        addi    9, 9, 1
        bdnz    .Lmemset_bytes_loop
        blr                     # done
.Lmemset_dwords:
        rldicl  4, 4, 0, 56     # construct parallel store: r4 = fill & 0xff
        cmpldi  7, 5, 31        # CR7 is consumed by the ble below
        mr      10, 3           # r10 = doubleword-store cursor
        sldi    0, 4, 8
        or      0, 0, 4         # r0 = fill byte in low 2 bytes
        sldi    9, 0, 16
        or      0, 0, 9         # r0 = fill byte in low 4 bytes
        sldi    11, 0, 32
        or      0, 0, 11        # r0 = fill byte in all 8 bytes
        ble     7, .Lmemset_dwords8     # len <= 31: skip the 32-byte loop
        addi    9, 5, -32
        srdi    9, 9, 5
        addi    9, 9, 1         # r9 = ((len - 32) >> 5) + 1 iterations
        mtctr   9
        .p2align 4,, 15
.Lmemset_loop32:
        std     0, 0(10)        # four 8-byte stores: 32 bytes per iteration
        std     0, 8(10)
        addi    5, 5, -32       # schedule count decrement
        std     0, 16(10)
        std     0, 24(10)
        addi    10, 10, 32
        bdnz    .Lmemset_loop32
        cmpldi  7, 5, 7
        ble     7, .Lmemset_tail        # fewer than 8 bytes remain
.Lmemset_dwords8:
        addi    9, 5, -8
        srdi    9, 9, 3
        addi    9, 9, 1         # r9 = ((remaining - 8) >> 3) + 1 iterations
        mtctr   9
        .p2align 4,, 15
.Lmemset_loop8:
        std     0, 0(10)        # one 8-byte store per iteration, not unrolled
        addi    5, 5, -8
        addi    10, 10, 8
        bdnz    .Lmemset_loop8
.Lmemset_tail:
        cmpdi   7, 5, 0
        mr      9, 10           # hand the cursor over to the byte loop
        bne     7, .Lmemset_bytes_setup # 1..7 trailing bytes remain
        blr
        /*
         * NOTE(review): the 12 zero bytes below look like a traceback
         * table left over from compiler output - confirm before changing.
         */
        .long   0
        .byte   0, 0, 0, 0, 0, 0, 0, 0
        .size   .memset, .-.memset