xref: /linux/fs/nls/nls_ucs2_utils.c (revision 566ab427f827b0256d3e8ce0235d088e6a9c28bd)
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  *   Some of the source code in this file came from fs/cifs/uniupr.h
4  *   Copyright (c) International Business Machines  Corp., 2000,2002
5  *
6  *   Some of the source code in this file came from fs/cifs/cifs_unicode.c
7  *
8  *   Copyright (c) International Business Machines  Corp., 2000,2009
9  *   Modified by Steve French (sfrench@us.ibm.com)
10  *   Modified by Namjae Jeon (linkinjeon@kernel.org)
11  *
12  */
13 #include <linux/fs.h>
14 #include <linux/module.h>
15 #include <linux/slab.h>
16 #include <linux/unaligned.h>
17 #include "nls_ucs2_utils.h"
18 
19 MODULE_DESCRIPTION("NLS UCS-2");
20 MODULE_LICENSE("GPL");
21 
22 /*
23  * Latin upper case
24  */
25 signed char NlsUniUpperTable[512] = {
26 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 000-00f */
27 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 010-01f */
28 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 020-02f */
29 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 030-03f */
30 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 040-04f */
31 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 050-05f */
32 	0, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32,
33 				-32, -32, -32, -32, -32,	/* 060-06f */
34 	-32, -32, -32, -32, -32, -32, -32, -32, -32, -32,
35 				-32, 0, 0, 0, 0, 0,	/* 070-07f */
36 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 080-08f */
37 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 090-09f */
38 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 0a0-0af */
39 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 0b0-0bf */
40 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 0c0-0cf */
41 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 0d0-0df */
42 	-32, -32, -32, -32, -32, -32, -32, -32, -32, -32,
43 			 -32, -32, -32, -32, -32, -32,	/* 0e0-0ef */
44 	-32, -32, -32, -32, -32, -32, -32, 0, -32, -32,
45 			 -32, -32, -32, -32, -32, 121,	/* 0f0-0ff */
46 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 100-10f */
47 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 110-11f */
48 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 120-12f */
49 	0, 0, 0, -1, 0, -1, 0, -1, 0, 0, -1, 0, -1, 0, -1, 0,	/* 130-13f */
50 	-1, 0, -1, 0, -1, 0, -1, 0, -1, 0, 0, -1, 0, -1, 0, -1,	/* 140-14f */
51 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 150-15f */
52 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 160-16f */
53 	0, -1, 0, -1, 0, -1, 0, -1, 0, 0, -1, 0, -1, 0, -1, 0,	/* 170-17f */
54 	0, 0, 0, -1, 0, -1, 0, 0, -1, 0, 0, 0, -1, 0, 0, 0,	/* 180-18f */
55 	0, 0, -1, 0, 0, 0, 0, 0, 0, -1, 0, 0, 0, 0, 0, 0,	/* 190-19f */
56 	0, -1, 0, -1, 0, -1, 0, 0, -1, 0, 0, 0, 0, -1, 0, 0,	/* 1a0-1af */
57 	-1, 0, 0, 0, -1, 0, -1, 0, 0, -1, 0, 0, 0, -1, 0, 0,	/* 1b0-1bf */
58 	0, 0, 0, 0, 0, -1, -2, 0, -1, -2, 0, -1, -2, 0, -1, 0,	/* 1c0-1cf */
59 	-1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, -79, 0, -1, /* 1d0-1df */
60 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e0-1ef */
61 	0, 0, -1, -2, 0, -1, 0, 0, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1f0-1ff */
62 };
63 EXPORT_SYMBOL_GPL(NlsUniUpperTable);
64 
65 /* Upper case range - Greek */
66 static signed char UniCaseRangeU03a0[47] = {
67 	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, -38, -37, -37, -37,	/* 3a0-3af */
68 	0, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32,
69 					 -32, -32, -32, -32,	/* 3b0-3bf */
70 	-32, -32, -31, -32, -32, -32, -32, -32, -32, -32, -32, -32, -64,
71 	-63, -63,
72 };
73 
74 /* Upper case range - Cyrillic */
75 static signed char UniCaseRangeU0430[48] = {
76 	-32, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32,
77 					 -32, -32, -32, -32,	/* 430-43f */
78 	-32, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32,
79 					 -32, -32, -32, -32,	/* 440-44f */
80 	0, -80, -80, -80, -80, -80, -80, -80, -80, -80, -80,
81 					 -80, -80, 0, -80, -80,	/* 450-45f */
82 };
83 
84 /* Upper case range - Extended cyrillic */
85 static signed char UniCaseRangeU0490[61] = {
86 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 490-49f */
87 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 4a0-4af */
88 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 4b0-4bf */
89 	0, 0, -1, 0, -1, 0, 0, 0, -1, 0, 0, 0, -1,
90 };
91 
92 /* Upper case range - Extended latin and greek */
93 static signed char UniCaseRangeU1e00[509] = {
94 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e00-1e0f */
95 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e10-1e1f */
96 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e20-1e2f */
97 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e30-1e3f */
98 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e40-1e4f */
99 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e50-1e5f */
100 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e60-1e6f */
101 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e70-1e7f */
102 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1e80-1e8f */
103 	0, -1, 0, -1, 0, -1, 0, 0, 0, 0, 0, -59, 0, -1, 0, -1,	/* 1e90-1e9f */
104 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1ea0-1eaf */
105 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1eb0-1ebf */
106 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1ec0-1ecf */
107 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1ed0-1edf */
108 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, -1,	/* 1ee0-1eef */
109 	0, -1, 0, -1, 0, -1, 0, -1, 0, -1, 0, 0, 0, 0, 0, 0,	/* 1ef0-1eff */
110 	8, 8, 8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f00-1f0f */
111 	8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f10-1f1f */
112 	8, 8, 8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f20-1f2f */
113 	8, 8, 8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f30-1f3f */
114 	8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f40-1f4f */
115 	0, 8, 0, 8, 0, 8, 0, 8, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f50-1f5f */
116 	8, 8, 8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f60-1f6f */
117 	74, 74, 86, 86, 86, 86, 100, 100, 0, 0, 112, 112,
118 				 126, 126, 0, 0,	/* 1f70-1f7f */
119 	8, 8, 8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f80-1f8f */
120 	8, 8, 8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1f90-1f9f */
121 	8, 8, 8, 8, 8, 8, 8, 8, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1fa0-1faf */
122 	8, 8, 0, 9, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1fb0-1fbf */
123 	0, 0, 0, 9, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1fc0-1fcf */
124 	8, 8, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1fd0-1fdf */
125 	8, 8, 0, 0, 0, 7, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,	/* 1fe0-1fef */
126 	0, 0, 0, 9, 0, 0, 0, 0, 0, 0, 0, 0, 0,
127 };
128 
129 /* Upper case range - Wide latin */
130 static signed char UniCaseRangeUff40[27] = {
131 	0, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32,
132 			 -32, -32, -32, -32, -32,	/* ff40-ff4f */
133 	-32, -32, -32, -32, -32, -32, -32, -32, -32, -32, -32,
134 };
135 
136 /*
137  * Upper Case Range
138  */
139 const struct UniCaseRange NlsUniUpperRange[] = {
140 	{0x03a0, 0x03ce, UniCaseRangeU03a0},
141 	{0x0430, 0x045f, UniCaseRangeU0430},
142 	{0x0490, 0x04cc, UniCaseRangeU0490},
143 	{0x1e00, 0x1ffc, UniCaseRangeU1e00},
144 	{0xff40, 0xff5a, UniCaseRangeUff40},
145 	{0}
146 };
147 EXPORT_SYMBOL_GPL(NlsUniUpperRange);
148