1 /*- 2 * SPDX-License-Identifier: BSD-2-Clause 3 * 4 * Copyright 2010 Nexenta Systems, Inc. All rights reserved. 5 * Copyright (c) 1995 Alex Tatmanjants <alex@elvisti.kiev.ua> 6 * at Electronni Visti IA, Kiev, Ukraine. 7 * All rights reserved. 8 * 9 * Copyright (c) 2011 The FreeBSD Foundation 10 * 11 * Portions of this software were developed by David Chisnall 12 * under sponsorship from the FreeBSD Foundation. 13 * 14 * Redistribution and use in source and binary forms, with or without 15 * modification, are permitted provided that the following conditions 16 * are met: 17 * 1. Redistributions of source code must retain the above copyright 18 * notice, this list of conditions and the following disclaimer. 19 * 2. Redistributions in binary form must reproduce the above copyright 20 * notice, this list of conditions and the following disclaimer in the 21 * documentation and/or other materials provided with the distribution. 22 * 23 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND 24 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 25 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 26 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE 27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 28 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 29 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 30 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 31 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 32 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 33 * SUCH DAMAGE. 34 */ 35 36 #include <sys/cdefs.h> 37 #include <stdlib.h> 38 #include <string.h> 39 #include <errno.h> 40 #include <wchar.h> 41 #include "collate.h" 42 43 44 /* 45 * In order to properly handle multibyte locales, its easiest to just 46 * convert to wide characters and then use wcscoll. However if an 47 * error occurs, we gracefully fall back to simple strcmp. Caller 48 * should check errno. 49 */ 50 int 51 strcoll_l(const char *s, const char *s2, locale_t locale) 52 { 53 int ret; 54 wchar_t *t1 = NULL, *t2 = NULL; 55 wchar_t *w1 = NULL, *w2 = NULL; 56 const char *cs1, *cs2; 57 mbstate_t mbs1; 58 mbstate_t mbs2; 59 size_t sz1, sz2; 60 61 memset(&mbs1, 0, sizeof (mbstate_t)); 62 memset(&mbs2, 0, sizeof (mbstate_t)); 63 64 /* 65 * The mbsrtowcs_l function can set the src pointer to null upon 66 * failure, so it should act on a copy to avoid: 67 * - sending null pointer to strcmp 68 * - having strcoll/strcoll_l change *s or *s2 to null 69 */ 70 cs1 = s; 71 cs2 = s2; 72 73 FIX_LOCALE(locale); 74 struct xlocale_collate *table = 75 (struct xlocale_collate*)locale->components[XLC_COLLATE]; 76 77 if (table->__collate_load_error) 78 goto error; 79 80 sz1 = strlen(s) + 1; 81 sz2 = strlen(s2) + 1; 82 83 /* 84 * Simple assumption: conversion to wide format is strictly 85 * reducing, i.e. a single byte (or multibyte character) 86 * cannot result in multiple wide characters. 87 */ 88 if ((t1 = malloc(sz1 * sizeof (wchar_t))) == NULL) 89 goto error; 90 w1 = t1; 91 if ((t2 = malloc(sz2 * sizeof (wchar_t))) == NULL) 92 goto error; 93 w2 = t2; 94 95 if ((mbsrtowcs_l(w1, &cs1, sz1, &mbs1, locale)) == (size_t)-1) 96 goto error; 97 98 if ((mbsrtowcs_l(w2, &cs2, sz2, &mbs2, locale)) == (size_t)-1) 99 goto error; 100 101 ret = wcscoll_l(w1, w2, locale); 102 free(t1); 103 free(t2); 104 105 return (ret); 106 107 error: 108 free(t1); 109 free(t2); 110 return (strcmp(s, s2)); 111 } 112 113 int 114 strcoll(const char *s, const char *s2) 115 { 116 return strcoll_l(s, s2, __get_locale()); 117 } 118 119