xref: /dflybsd-src/lib/libc/string/strcoll.c (revision 84bfc1a1b84f23538385f60e555d3723a9c81c33)
1 /*
2  * Copyright 2010 Nexenta Systems, Inc.  All rights reserved.
3  * Copyright (c) 1995 Alex Tatmanjants <alex@elvisti.kiev.ua>
4  *		at Electronni Visti IA, Kiev, Ukraine.
5  *			All rights reserved.
6  *
7  * Copyright (c) 2011 The FreeBSD Foundation
8  * All rights reserved.
9  * Portions of this software were developed by David Chisnall
10  * under sponsorship from the FreeBSD Foundation.
11  *
12  * Redistribution and use in source and binary forms, with or without
13  * modification, are permitted provided that the following conditions
14  * are met:
15  * 1. Redistributions of source code must retain the above copyright
16  *    notice, this list of conditions and the following disclaimer.
17  * 2. Redistributions in binary form must reproduce the above copyright
18  *    notice, this list of conditions and the following disclaimer in the
19  *    documentation and/or other materials provided with the distribution.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND
22  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE
25  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31  * SUCH DAMAGE.
32  */
33 
34 #include <stdlib.h>
35 #include <string.h>
36 #include <errno.h>
37 #include <wchar.h>
38 #include "collate.h"
39 
40 
41 /*
42  * In order to properly handle multibyte locales, its easiet to just
43  * convert to wide characters and then use wcscoll.  However if an
44  * error occurs, we gracefully fall back to simple strcmp.  Caller
45  * should check errno.
46  */
47 int
48 strcoll_l(const char *s, const char *s2, locale_t locale)
49 {
50 	int ret;
51 	wchar_t *t1 = NULL, *t2 = NULL;
52 	wchar_t *w1 = NULL, *w2 = NULL;
53 	mbstate_t mbs1 = { 0 };
54 	mbstate_t mbs2 = { 0 };
55 	size_t sz1, sz2;
56 	FIX_LOCALE(locale);
57 	struct xlocale_collate *table =
58 		(struct xlocale_collate*)locale->components[XLC_COLLATE];
59 
60 	if (table->__collate_load_error)
61 		goto error;
62 
63 	sz1 = strlen(s) + 1;
64 	sz2 = strlen(s2) + 1;
65 
66 	/*
67 	 * Simple assumption: conversion to wide format is strictly
68 	 * reducing, i.e. a single byte (or multibyte character)
69 	 * cannot result in multiple wide characters.
70 	 */
71 	if ((t1 = malloc(sz1 * sizeof (wchar_t))) == NULL)
72 		goto error;
73 	w1 = t1;
74 	if ((t2 = malloc(sz2 * sizeof (wchar_t))) == NULL)
75 		goto error;
76 	w2 = t2;
77 
78 	if ((mbsrtowcs_l(w1, &s, sz1, &mbs1, locale)) == (size_t)-1)
79 		goto error;
80 
81 	if ((mbsrtowcs_l(w2, &s2, sz2, &mbs2, locale)) == (size_t)-1)
82 		goto error;
83 
84 	ret = wcscoll_l(w1, w2, locale);
85 	if (t1)
86 		free(t1);
87 	if (t2)
88 		free(t2);
89 
90 	return (ret);
91 
92 error:
93 	if (t1)
94 		free(t1);
95 	if (t2)
96 		free(t2);
97 	return (strcmp(s, s2));
98 }
99 
100 int
101 strcoll(const char *s, const char *s2)
102 {
103 	return strcoll_l(s, s2, __get_locale());
104 }
105 
106