xref: /minix3/common/lib/libc/arch/or1k/string/memcmp.S (revision 0a6a1f1d05b60e214de2f05a7310ddd1f0e590e7)
1/* $NetBSD: memcmp.S,v 1.1 2014/09/03 19:34:25 matt Exp $ */
2
3/*-
4 * Copyright (c) 2014 The NetBSD Foundation, Inc.
5 * All rights reserved.
6 *
7 * This code is derived from software contributed to The NetBSD Foundation
8 * by Matt Thomas of 3am Software Foundry.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 *    notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 *    notice, this list of conditions and the following disclaimer in the
17 *    documentation and/or other materials provided with the distribution.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
20 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
21 * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
23 * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 * POSSIBILITY OF SUCH DAMAGE.
30 */
31
/*
 * int memcmp(const char *s1, const char *s2, size_t n);
 *
 * Compare the first n bytes of s1 and s2, each byte taken as an
 * unsigned char:
 *
 *	for (; n-- != 0; s1++, s2++) {
 *		if (*s1 < *s2)
 *			return -1;
 *		if (*s1 > *s2)
 *			return 1;
 *	}
 *	return 0;
 *
 * Return:	1 if the first differing byte is larger in s1,
 *		-1 if it is smaller in s1, 0 if all n bytes are equal.
 *
 * ==========================================================================
 */
49
50#include <machine/asm.h>
51
52        .text
53        .align 4
/* LINTSTUB: Func: int memcmp(const void *, const void *, size_t) */
/*
 * memcmp for OpenRISC 1000.
 *
 * In:		r3 = s1, r4 = s2, r5 = n (byte count)
 * Out:		r11 = 0 if the n bytes are equal,
 *		      1 if the first differing byte is larger in s1,
 *		     -1 if the first differing byte is larger in s2
 * Scratch:	r6, r7, r15, r17 (r3, r4 and r5 are modified as well)
 *
 * Every branch/jump is followed by a delay-slot instruction that executes
 * whether or not the branch is taken; slots that do useful work are marked
 * "(delay slot)".
 *
 * The word and halfword paths shift leading bytes out to the left and
 * trailing bytes out to the right, i.e. they assume the first byte in memory
 * is the most significant byte of a loaded word (big-endian).  Under that
 * assumption an unsigned compare of two loaded chunks orders them exactly
 * like a byte-by-byte compare.
 *
 * The word path may read up to 3 bytes before s1/s2 and up to 3 bytes past
 * the end, but only inside aligned words that also contain valid bytes.
 *
 * NOTE(review): length tests use signed compares, so n > INT_MAX is not
 * handled by this routine.
 */
ENTRY(memcmp)

	/*
	 * Check count passed in R5. If zero, return 0; otherwise continue.
	 */
	l.sfeqi	r5, 0			/* nothing to compare?		*/
	l.bf	.Lret_0			/*   yes, return equality	*/
	l.nop

#ifdef _KERNEL
	l.sfeqi	r5, 6			/* exactly six bytes?		*/
	l.bf	.Lsixbyte_compare	/*   yes, use the 6-byte path	*/
	l.nop
#endif

	l.sfgesi r5, 7			/* at least seven bytes?	*/
	l.bnf	.Lbyte_compare		/*   no, just compare by bytes	*/
	l.nop

	l.xor	r6, r3, r4		/* check alignment compatibility */
	l.andi	r6, r6, 3		/* only care about the two bits */
	l.sfeqi	r6, 0			/* same alignment? */
	l.bnf	.Lmisaligned		/*   no, avoid alignment errors */
	l.nop

	/*
	 * At this point, we know we read the data via word accesses.
	 */

	l.andi	r7, r3, 3		/* check alignment		*/
	l.sfeqi	r7, 0			/* word aligned?		*/
	l.bf	.Lword_loop		/*   yes, go load the words	*/
	l.nop

	/*
	 * Both pointers are off by the same r7 (1..3) bytes.  Round them
	 * down to a word boundary, account for the extra leading bytes in
	 * the count, and shift those bytes out of the first pair of words.
	 */
	l.sub	r3, r3, r7		/* align string 1		*/
	l.sub	r4, r4, r7		/* align string 2		*/
	l.add	r5, r5, r7		/* pad length			*/

	l.lwz	r15, 0(r3)		/* load word from s1		*/
	l.lwz	r17, 0(r4)		/* load word from s2		*/

	l.slli	r7, r7, 3		/* bytes to bits		*/
	l.sll	r15, r15, r7		/* shift away leading bytes	*/
	l.sll	r17, r17, r7		/* shift away leading bytes	*/
	l.j	.Lword_compare		/* now we can compare them	*/
	l.nop

	/*
	 * Invariant: r5 >= 5 whenever a pair of words is compared at
	 * .Lword_compare, so all four bytes of each word are inside the
	 * range being compared.
	 */
.Lword_loop:
	l.lwz	r15, 0(r3)		/* load s1 word			*/
	l.lwz	r17, 0(r4)		/* load s2 word			*/
.Lword_compare:
	l.sfeq	r15, r17		/* compare s1 and s2 words	*/
	l.bnf	.Lall_done		/*   different? we're done	*/
	l.addi	r3, r3, 4		/* (delay slot) advance s1	*/

	l.addi	r4, r4, 4		/* advance s2 one word		*/
	l.addi	r5, r5, -4		/* decrement one word		*/
	l.sfgtsi r5, 4			/* more than a word left?	*/
	l.bf	.Lword_loop		/*    yes, loop around		*/
	l.nop

	/*
	 * 1..4 bytes remain (r5 was >= 5 before the decrement, so it can
	 * not be 0 here).  Load the final pair of words and shift the
	 * (4 - r5) bytes that lie past the end out to the right.
	 */
	l.lwz	r15, 0(r3)		/* load final s1 word		*/
	l.lwz	r17, 0(r4)		/* load final s2 word		*/
	l.sub	r7, r0, r5		/* r7 = -remaining		*/
	l.andi	r7, r7, 3		/* bytes past the end (0..3)	*/
	l.slli	r7, r7, 3		/* bytes to bits		*/
	l.srl	r15, r15, r7		/* discard extra s1 bytes	*/
	l.srl	r17, r17, r7		/* discard extra s2 bytes	*/

	l.sfeq	r17, r15		/* compare result		*/
	l.bnf	.Lall_done		/*   different? work out sign	*/
	l.nop
.Lret_0:
	l.addi	r11, r0, 0		/* return 0: equal		*/
	l.jr	lr
	l.nop

/*
 * The two strings don't have the same word alignment.
 */
.Lmisaligned:
	l.sfeqi	r6, 2			/* check for halfword alignment */
	l.bnf	.Lbyte_compare		/*   no, compare by bytes	*/
	l.nop
	l.andi	r7, r3, 1		/* is s1 on an odd address?	*/
	l.sfeqi	r7, 0
	l.bf	.Lhalfword_loop		/*   no, already halfword aligned */
	l.nop
	/*
	 * Odd start: back both pointers up by one byte and pad the count
	 * so the shared "+2 / -2" step below consumes exactly the one
	 * leading byte compared here.
	 */
	l.addi	r5, r5, 1
	l.addi	r3, r3, -1
	l.addi	r4, r4, -1
	l.lbz	r15, 1(r3)		/* leading s1 byte		*/
	l.lbz	r17, 1(r4)		/* leading s2 byte		*/
	l.j	.Lhalfword_compare
	l.nop
.Lhalfword_loop:
	l.lhz	r15, 0(r3)		/* load s1 halfword		*/
	l.lhz	r17, 0(r4)		/* load s2 halfword		*/
.Lhalfword_compare:
	l.sfeq	r15, r17		/* compare s1 and s2 chunks	*/
	l.bnf	.Lall_done		/*   different? we're done	*/
	l.nop
	l.addi	r3, r3, 2		/* advance s1 one halfword	*/
	l.addi	r4, r4, 2		/* advance s2 one halfword	*/
	l.addi	r5, r5, -2		/* decrement one halfword	*/
	l.sfgesi r5, 2			/* at least a halfword left?	*/
	l.bf	.Lhalfword_loop		/*   yes, loop around		*/
	l.nop
	/* 0 or 1 byte left: fall through to the byte loop */

.Lbyte_compare:
	l.addi	r5, r5, -1		/* one byte fewer to go		*/
	l.sfgesi r5, 0			/* was there a byte left?	*/
	l.bnf	.Lret_0			/*   no, everything matched	*/
	l.nop
	l.lbz	r15, 0(r3)		/* load s1 byte			*/
	l.lbz	r17, 0(r4)		/* load s2 byte			*/
	l.addi	r3, r3, 1		/* advance s1 one byte		*/
	l.addi	r4, r4, 1		/* advance s2 one byte		*/
	l.sfeq	r15, r17		/* compare s1 and s2 bytes	*/
	l.bf	.Lbyte_compare		/*   same? keep going		*/
	l.nop

	/*
	 * r15 (from s1) and r17 (from s2) differ.  Compare them as
	 * unsigned values: a signed subtraction would give the wrong sign
	 * for full words that differ by 2^31 or more.
	 */
.Lall_done:
	l.sfltu	r15, r17		/* s1 chunk below s2 chunk?	*/
	l.bf	.Lret_less		/*   yes, return -1		*/
	l.addi	r11, r0, 1		/* (delay slot) assume s1 > s2	*/
	l.jr	lr
	l.nop
.Lret_less:
	l.addi	r11, r0, -1		/* s1 < s2			*/
	l.jr	lr
	l.nop

#ifdef _KERNEL
	/*
	 * Exactly six bytes: if both pointers are halfword aligned,
	 * compare three halfwords; otherwise use the byte loop.
	 */
.Lsixbyte_compare:
	l.or	r7, r3, r4		/* combine low address bits	*/
	l.andi	r7, r7, 1		/* either pointer odd?		*/
	l.sfeqi	r7, 0
	l.bnf	.Lbyte_compare		/*   yes, compare by bytes	*/
	l.nop
	l.lhz	r15, 0(r3)		/* bytes 0-1			*/
	l.lhz	r17, 0(r4)
	l.sfeq	r15, r17
	l.bnf	.Lall_done
	l.nop
	l.lhz	r15, 2(r3)		/* bytes 2-3			*/
	l.lhz	r17, 2(r4)
	l.sfeq	r15, r17
	l.bnf	.Lall_done
	l.nop
	l.lhz	r15, 4(r3)		/* bytes 4-5			*/
	l.lhz	r17, 4(r4)
	l.sfeq	r15, r17
	l.bnf	.Lall_done
	l.nop
	l.addi	r11, r0, 0		/* return 0: equal		*/
	l.jr	lr
	l.nop
#endif
END(memcmp)
214