/*-
 * SPDX-License-Identifier: BSD-2-Clause
 *
 * Copyright 2017 Nexenta Systems, Inc.
 * Copyright (c) 2002 Tim J. Robbins
 * All rights reserved.
 *
 * Copyright (c) 2011 The FreeBSD Foundation
 *
 * Portions of this software were developed by David Chisnall
 * under sponsorship from the FreeBSD Foundation.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <errno.h>
#include <stdlib.h>
#include <string.h>
#include <wchar.h>
#include "collate.h"

41fd4f1dd9STim J. Robbins int
wcscoll_l(const wchar_t * ws1,const wchar_t * ws2,locale_t locale)423c87aa1dSDavid Chisnall wcscoll_l(const wchar_t *ws1, const wchar_t *ws2, locale_t locale)
43fd4f1dd9STim J. Robbins {
44c48dc2a1SBaptiste Daroussin int len1, len2, pri1, pri2;
45a1df81e7SBaptiste Daroussin wchar_t *tr1 = NULL, *tr2 = NULL;
46a1df81e7SBaptiste Daroussin int direc, pass;
47c48dc2a1SBaptiste Daroussin int ret = wcscmp(ws1, ws2);
48a1df81e7SBaptiste Daroussin
493c87aa1dSDavid Chisnall FIX_LOCALE(locale);
503c87aa1dSDavid Chisnall struct xlocale_collate *table =
513c87aa1dSDavid Chisnall (struct xlocale_collate*)locale->components[XLC_COLLATE];
52fd4f1dd9STim J. Robbins
53c48dc2a1SBaptiste Daroussin if (table->__collate_load_error || ret == 0)
54c48dc2a1SBaptiste Daroussin return (ret);
55fd4f1dd9STim J. Robbins
56c48dc2a1SBaptiste Daroussin if (*ws1 == 0 && *ws2 != 0)
57c48dc2a1SBaptiste Daroussin return (-1);
58c48dc2a1SBaptiste Daroussin if (*ws1 != 0 && *ws2 == 0)
59c48dc2a1SBaptiste Daroussin return (1);
60a1df81e7SBaptiste Daroussin
61fd4f1dd9STim J. Robbins /*
62a1df81e7SBaptiste Daroussin * Once upon a time we had code to try to optimize this, but
63a1df81e7SBaptiste Daroussin * it turns out that you really can't make many assumptions
64a1df81e7SBaptiste Daroussin * safely. You absolutely have to run this pass by pass,
65a1df81e7SBaptiste Daroussin * because some passes will be ignored for a given character,
66a1df81e7SBaptiste Daroussin * while others will not. Simpler locales will benefit from
6732223c1bSPedro F. Giffuni * having fewer passes, and most comparisons should resolve
68a1df81e7SBaptiste Daroussin * during the primary pass anyway.
69a1df81e7SBaptiste Daroussin *
70a1df81e7SBaptiste Daroussin * Note that we do one final extra pass at the end to pick
71a1df81e7SBaptiste Daroussin * up UNDEFINED elements. There is special handling for them.
72fd4f1dd9STim J. Robbins */
73a1df81e7SBaptiste Daroussin for (pass = 0; pass <= table->info->directive_count; pass++) {
74a1df81e7SBaptiste Daroussin
75a1df81e7SBaptiste Daroussin const int32_t *st1 = NULL;
76a1df81e7SBaptiste Daroussin const int32_t *st2 = NULL;
77a1df81e7SBaptiste Daroussin const wchar_t *w1 = ws1;
78a1df81e7SBaptiste Daroussin const wchar_t *w2 = ws2;
79a1df81e7SBaptiste Daroussin
80a1df81e7SBaptiste Daroussin /* special pass for UNDEFINED */
81a1df81e7SBaptiste Daroussin if (pass == table->info->directive_count) {
82c48dc2a1SBaptiste Daroussin direc = DIRECTIVE_FORWARD;
83a1df81e7SBaptiste Daroussin } else {
84a1df81e7SBaptiste Daroussin direc = table->info->directive[pass];
85fd4f1dd9STim J. Robbins }
86fd4f1dd9STim J. Robbins
87a1df81e7SBaptiste Daroussin if (direc & DIRECTIVE_BACKWARD) {
88a1df81e7SBaptiste Daroussin wchar_t *bp, *fp, c;
89c48dc2a1SBaptiste Daroussin free(tr1);
90a1df81e7SBaptiste Daroussin if ((tr1 = wcsdup(w1)) == NULL)
91c48dc2a1SBaptiste Daroussin goto end;
92a1df81e7SBaptiste Daroussin bp = tr1;
93a1df81e7SBaptiste Daroussin fp = tr1 + wcslen(tr1) - 1;
94a1df81e7SBaptiste Daroussin while (bp < fp) {
95a1df81e7SBaptiste Daroussin c = *bp;
96a1df81e7SBaptiste Daroussin *bp++ = *fp;
97a1df81e7SBaptiste Daroussin *fp-- = c;
98a1df81e7SBaptiste Daroussin }
99c48dc2a1SBaptiste Daroussin free(tr2);
100a1df81e7SBaptiste Daroussin if ((tr2 = wcsdup(w2)) == NULL)
101c48dc2a1SBaptiste Daroussin goto end;
102a1df81e7SBaptiste Daroussin bp = tr2;
103a1df81e7SBaptiste Daroussin fp = tr2 + wcslen(tr2) - 1;
104a1df81e7SBaptiste Daroussin while (bp < fp) {
105a1df81e7SBaptiste Daroussin c = *bp;
106a1df81e7SBaptiste Daroussin *bp++ = *fp;
107a1df81e7SBaptiste Daroussin *fp-- = c;
108a1df81e7SBaptiste Daroussin }
109a1df81e7SBaptiste Daroussin w1 = tr1;
110a1df81e7SBaptiste Daroussin w2 = tr2;
111a1df81e7SBaptiste Daroussin }
112fd4f1dd9STim J. Robbins
113a1df81e7SBaptiste Daroussin if (direc & DIRECTIVE_POSITION) {
114c48dc2a1SBaptiste Daroussin int check1, check2;
11576e6db68SBaptiste Daroussin while (*w1 && *w2) {
116a1df81e7SBaptiste Daroussin pri1 = pri2 = 0;
11776e6db68SBaptiste Daroussin check1 = check2 = 1;
11876e6db68SBaptiste Daroussin while ((pri1 == pri2) && (check1 || check2)) {
11976e6db68SBaptiste Daroussin if (check1) {
12076e6db68SBaptiste Daroussin _collate_lookup(table, w1, &len1,
12176e6db68SBaptiste Daroussin &pri1, pass, &st1);
122a1df81e7SBaptiste Daroussin if (pri1 < 0) {
123a1df81e7SBaptiste Daroussin errno = EINVAL;
124c48dc2a1SBaptiste Daroussin goto end;
125a1df81e7SBaptiste Daroussin }
12676e6db68SBaptiste Daroussin if (!pri1) {
127a1df81e7SBaptiste Daroussin pri1 = COLLATE_MAX_PRIORITY;
12876e6db68SBaptiste Daroussin st1 = NULL;
129a1df81e7SBaptiste Daroussin }
13076e6db68SBaptiste Daroussin check1 = (st1 != NULL);
13176e6db68SBaptiste Daroussin }
13276e6db68SBaptiste Daroussin if (check2) {
13376e6db68SBaptiste Daroussin _collate_lookup(table, w2, &len2,
13476e6db68SBaptiste Daroussin &pri2, pass, &st2);
135a1df81e7SBaptiste Daroussin if (pri2 < 0) {
136a1df81e7SBaptiste Daroussin errno = EINVAL;
137c48dc2a1SBaptiste Daroussin goto end;
138a1df81e7SBaptiste Daroussin }
13976e6db68SBaptiste Daroussin if (!pri2) {
140a1df81e7SBaptiste Daroussin pri2 = COLLATE_MAX_PRIORITY;
14176e6db68SBaptiste Daroussin st2 = NULL;
14276e6db68SBaptiste Daroussin }
14376e6db68SBaptiste Daroussin check2 = (st2 != NULL);
14476e6db68SBaptiste Daroussin }
145a1df81e7SBaptiste Daroussin }
146a1df81e7SBaptiste Daroussin if (pri1 != pri2) {
147a1df81e7SBaptiste Daroussin ret = pri1 - pri2;
148a1df81e7SBaptiste Daroussin goto end;
149a1df81e7SBaptiste Daroussin }
150a1df81e7SBaptiste Daroussin w1 += len1;
151a1df81e7SBaptiste Daroussin w2 += len2;
152a1df81e7SBaptiste Daroussin }
153a1df81e7SBaptiste Daroussin if (!*w1) {
154a1df81e7SBaptiste Daroussin if (*w2) {
155a1df81e7SBaptiste Daroussin ret = -(int)*w2;
156a1df81e7SBaptiste Daroussin goto end;
157a1df81e7SBaptiste Daroussin }
158a1df81e7SBaptiste Daroussin } else {
159a1df81e7SBaptiste Daroussin ret = *w1;
160a1df81e7SBaptiste Daroussin goto end;
161a1df81e7SBaptiste Daroussin }
162c48dc2a1SBaptiste Daroussin } else {
163c48dc2a1SBaptiste Daroussin int vpri1 = 0, vpri2 = 0;
164c48dc2a1SBaptiste Daroussin while (*w1 || *w2 || st1 || st2) {
165c48dc2a1SBaptiste Daroussin pri1 = 1;
166c48dc2a1SBaptiste Daroussin while (*w1 || st1) {
167c48dc2a1SBaptiste Daroussin _collate_lookup(table, w1, &len1, &pri1,
168c48dc2a1SBaptiste Daroussin pass, &st1);
169c48dc2a1SBaptiste Daroussin w1 += len1;
170c48dc2a1SBaptiste Daroussin if (pri1 > 0) {
171c48dc2a1SBaptiste Daroussin vpri1++;
172c48dc2a1SBaptiste Daroussin break;
173c48dc2a1SBaptiste Daroussin }
174c48dc2a1SBaptiste Daroussin
175c48dc2a1SBaptiste Daroussin if (pri1 < 0) {
176c48dc2a1SBaptiste Daroussin errno = EINVAL;
177c48dc2a1SBaptiste Daroussin goto end;
178c48dc2a1SBaptiste Daroussin }
179c48dc2a1SBaptiste Daroussin st1 = NULL;
180c48dc2a1SBaptiste Daroussin }
181c48dc2a1SBaptiste Daroussin pri2 = 1;
182c48dc2a1SBaptiste Daroussin while (*w2 || st2) {
183c48dc2a1SBaptiste Daroussin _collate_lookup(table, w2, &len2, &pri2,
184c48dc2a1SBaptiste Daroussin pass, &st2);
185c48dc2a1SBaptiste Daroussin w2 += len2;
186c48dc2a1SBaptiste Daroussin if (pri2 > 0) {
187c48dc2a1SBaptiste Daroussin vpri2++;
188c48dc2a1SBaptiste Daroussin break;
189c48dc2a1SBaptiste Daroussin }
190c48dc2a1SBaptiste Daroussin if (pri2 < 0) {
191c48dc2a1SBaptiste Daroussin errno = EINVAL;
192c48dc2a1SBaptiste Daroussin goto end;
193c48dc2a1SBaptiste Daroussin }
194c48dc2a1SBaptiste Daroussin st2 = NULL;
195c48dc2a1SBaptiste Daroussin }
196c48dc2a1SBaptiste Daroussin if ((!pri1 || !pri2) && (vpri1 == vpri2))
197c48dc2a1SBaptiste Daroussin break;
198c48dc2a1SBaptiste Daroussin if (pri1 != pri2) {
199c48dc2a1SBaptiste Daroussin ret = pri1 - pri2;
200c48dc2a1SBaptiste Daroussin goto end;
201c48dc2a1SBaptiste Daroussin }
202c48dc2a1SBaptiste Daroussin }
203c48dc2a1SBaptiste Daroussin if (vpri1 && !vpri2) {
204c48dc2a1SBaptiste Daroussin ret = 1;
205c48dc2a1SBaptiste Daroussin goto end;
206c48dc2a1SBaptiste Daroussin }
207c48dc2a1SBaptiste Daroussin if (!vpri1 && vpri2) {
208c48dc2a1SBaptiste Daroussin ret = -1;
209c48dc2a1SBaptiste Daroussin goto end;
210c48dc2a1SBaptiste Daroussin }
211c48dc2a1SBaptiste Daroussin }
212a1df81e7SBaptiste Daroussin }
213a1df81e7SBaptiste Daroussin ret = 0;
214a1df81e7SBaptiste Daroussin
215a1df81e7SBaptiste Daroussin end:
216a1df81e7SBaptiste Daroussin free(tr1);
217a1df81e7SBaptiste Daroussin free(tr2);
218a1df81e7SBaptiste Daroussin
219a1df81e7SBaptiste Daroussin return (ret);
220fd4f1dd9STim J. Robbins }
221fd4f1dd9STim J. Robbins
/*
 * Compare the wide strings `ws1` and `ws2` by forwarding to wcscoll_l()
 * with the locale returned by __get_locale().  The return value is
 * whatever wcscoll_l() returns.
 */
int
wcscoll(const wchar_t *ws1, const wchar_t *ws2)
{
	return (wcscoll_l(ws1, ws2, __get_locale()));
}