xref: /minix3/lib/libc/arch/powerpc64/string/bzero.S (revision 2fe8fb192fe7e8720e3e7a77f928da545e872a6a)
/*	$NetBSD: bzero.S,v 1.4 2008/04/28 20:22:57 martin Exp $	*/

/*-
 * Copyright (c) 2006 The NetBSD Foundation, Inc.
 * All rights reserved.
 *
 * This code is derived from software contributed to The NetBSD Foundation
 * by Ross Harvey.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING,  BUT NOT LIMITED
 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
 * BE LIABLE FOR ANY DIRECT, INDIRECT,  INCIDENTAL,  SPECIAL,  EXEMPLARY,  OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,  PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,  OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY,  OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */
31*2fe8fb19SBen Gras
32*2fe8fb19SBen Gras#include	<machine/asm.h>
33*2fe8fb19SBen Gras
34*2fe8fb19SBen Gras	.file	"bzero.c"
/*
 * bzero(dst, len) and memset(dst, c, len) for 64-bit PowerPC.
 *
 * Register roles, as used by the code below:
 *   r3   dst; never written, so it still holds dst on return
 *   r4   fill value; only the low 8 bits are ever stored
 *   r5   number of bytes still to be written
 *   r0   value being stored (one byte, or that byte replicated 8 times)
 *   r9   cursor for the byte loop, also scratch
 *   r10  cursor for the doubleword loops
 *   r11  scratch
 *   cr0, cr7 and ctr are used as well.
 *
 * Strategy: when len > 7 and dst is 8-byte aligned, store 32 bytes per
 * iteration, then 8 bytes per iteration, then finish byte by byte.
 * Every other case (short or unaligned) uses the byte loop only.
 *
 * bzero only rearranges its arguments and falls through into memset.
 */
ENTRY(bzero)
	mr	5, 4		# len moves into the memset count register
	li	4, 0		# fill value is zero
ENTRY(memset)
	mr	9, 3		# r9 = byte-loop cursor
	cmpldi	7, 5, 7
	ble	7, .Lmemset_bytewise	# len <= 7: byte loop only
	clrldi.	0, 3, 61	# r0 = dst & 7, result recorded in cr0
	beq	0, .Lmemset_aligned	# aligned: take the doubleword path
.Lmemset_bytewise:
	cmpdi	7, 5, 0
	beqlr	7		# len == 0: return before loading ctr
.Lmemset_byte_setup:
	clrldi	0, 4, 56	# r0 = low byte of the fill value
	mtctr	5		# one iteration per remaining byte
	.p2align 4,, 15
.Lmemset_byte_loop:
	stb	0, 0(9)
	addi	9, 9, 1
	bdnz	.Lmemset_byte_loop
	blr
.Lmemset_aligned:
	clrldi	4, 4, 56	# keep only the fill byte in r4
	mr	10, 3		# r10 = doubleword cursor
	sldi	0, 4, 8
	or	0, 0, 4		# fill byte replicated to 2 bytes
	sldi	9, 0, 16
	or	0, 0, 9		# ... to 4 bytes
	sldi	11, 0, 32
	or	0, 0, 11	# ... to all 8 bytes of r0
	cmpldi	7, 5, 31
	ble	7, .Lmemset_dwords	# len <= 31: skip the 32-byte loop
	addi	9, 5, -32
	srdi	9, 9, 5
	addi	9, 9, 1		# iterations = len / 32
	mtctr	9
	.p2align 4,, 15
.Lmemset_block_loop:
	std	0, 0(10)	# four doublewords per pass
	std	0, 8(10)
	std	0, 16(10)
	std	0, 24(10)
	addi	10, 10, 32
	addi	5, 5, -32	# r5 tracks the bytes still left
	bdnz	.Lmemset_block_loop
	cmpldi	7, 5, 7
	ble	7, .Lmemset_tail	# less than one doubleword left
.Lmemset_dwords:
	addi	9, 5, -8
	srdi	9, 9, 3
	addi	9, 9, 1		# iterations = remaining / 8
	mtctr	9
	.p2align 4,, 15
.Lmemset_dword_loop:
	std	0, 0(10)	# one doubleword per pass
	addi	10, 10, 8
	addi	5, 5, -8
	bdnz	.Lmemset_dword_loop
.Lmemset_tail:
	mr	9, 10		# hand the cursor over to the byte loop
	cmpdi	7, 5, 0
	bne	7, .Lmemset_byte_setup	# 1..7 bytes left: finish bytewise
	blr
	.long	0
	.byte	0, 0, 0, 0, 0, 0, 0, 0
	.size	.memset, .-.memset
101