xref: /freebsd/lib/libc/string/wcsxfrm.c (revision b78ee15e9f04ae15c3e1200df974473167524d17)
1 /*-
2  * Copyright (c) 1995 Alex Tatmanjants <alex@elvisti.kiev.ua>
3  *		at Electronni Visti IA, Kiev, Ukraine.
4  *			All rights reserved.
5  *
6  * Copyright (c) 2011 The FreeBSD Foundation
7  * All rights reserved.
8  * Portions of this software were developed by David Chisnall
9  * under sponsorship from the FreeBSD Foundation.
10  *
11  * Redistribution and use in source and binary forms, with or without
12  * modification, are permitted provided that the following conditions
13  * are met:
14  * 1. Redistributions of source code must retain the above copyright
15  *    notice, this list of conditions and the following disclaimer.
16  * 2. Redistributions in binary form must reproduce the above copyright
17  *    notice, this list of conditions and the following disclaimer in the
18  *    documentation and/or other materials provided with the distribution.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  */
32 
33 #include <sys/cdefs.h>
34 #if 0
35 __FBSDID("FreeBSD: src/lib/libc/string/strxfrm.c,v 1.15 2002/09/06 11:24:06 tjr Exp ");
36 #endif
37 __FBSDID("$FreeBSD$");
38 
39 #include <stdlib.h>
40 #include <string.h>
41 #include <wchar.h>
42 #include "collate.h"
43 
44 static char *__mbsdup(const wchar_t *);
45 
46 /*
47  * Placeholder wcsxfrm() implementation. See wcscoll.c for a description of
48  * the logic used.
49  */
50 size_t
51 wcsxfrm_l(wchar_t * __restrict dest, const wchar_t * __restrict src, size_t len, locale_t locale)
52 {
53 	int prim, sec, l;
54 	size_t slen;
55 	char *mbsrc, *s, *ss;
56 	FIX_LOCALE(locale);
57 	struct xlocale_collate *table =
58 		(struct xlocale_collate*)locale->components[XLC_COLLATE];
59 
60 	if (*src == L'\0') {
61 		if (len != 0)
62 			*dest = L'\0';
63 		return (0);
64 	}
65 
66 	if (table->__collate_load_error || MB_CUR_MAX > 1) {
67 		slen = wcslen(src);
68 		if (len > 0) {
69 			if (slen < len)
70 				wcscpy(dest, src);
71 			else {
72 				wcsncpy(dest, src, len - 1);
73 				dest[len - 1] = L'\0';
74 			}
75 		}
76 		return (slen);
77 	}
78 
79 	mbsrc = __mbsdup(src);
80 	slen = 0;
81 	prim = sec = 0;
82 	ss = s = __collate_substitute(table, mbsrc);
83 	while (*s != '\0') {
84 		while (*s != '\0' && prim == 0) {
85 			__collate_lookup(table, s, &l, &prim, &sec);
86 			s += l;
87 		}
88 		if (prim != 0) {
89 			if (len > 1) {
90 				*dest++ = (wchar_t)prim;
91 				len--;
92 			}
93 			slen++;
94 			prim = 0;
95 		}
96 	}
97 	free(ss);
98 	free(mbsrc);
99 	if (len != 0)
100 		*dest = L'\0';
101 
102 	return (slen);
103 }
104 size_t
105 wcsxfrm(wchar_t * __restrict dest, const wchar_t * __restrict src, size_t len)
106 {
107 	return wcsxfrm_l(dest, src, len, __get_locale());
108 }
109 
/*
 * Return a malloc()ed multibyte copy of the wide string ws, produced with
 * wcsrtombs() starting from the initial conversion state.  Returns NULL if
 * the string cannot be converted or the allocation fails.  The caller owns
 * the result and releases it with free().
 */
static char *
__mbsdup(const wchar_t *ws)
{
	static const mbstate_t zero_state;
	const wchar_t *probe = ws;
	mbstate_t state = zero_state;
	size_t nbytes;
	char *out;

	/* First pass: measure only, nothing is stored. */
	nbytes = wcsrtombs(NULL, &probe, 0, &state);
	if (nbytes == (size_t)-1)
		return (NULL);

	out = malloc(nbytes + 1);
	if (out != NULL) {
		/* Second pass: convert for real, from a fresh state. */
		state = zero_state;
		wcsrtombs(out, &ws, nbytes + 1, &state);
	}

	return (out);
}
130