xref: /linux/fs/ntfs/upcase.c (revision cdd4dc3aebeab43a72ce0bc2b5bab6f0a80b97a5)
// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Generate the full NTFS Unicode upcase table in little endian.
 *
 * Copyright (c) 2001 Richard Russon <ntfs@flatcap.org>
 * Copyright (c) 2001-2006 Anton Altaparmakov
 */
81e9ea7e0SNamjae Jeon 
91e9ea7e0SNamjae Jeon #include "ntfs.h"
101e9ea7e0SNamjae Jeon 
11*5218cd10SNamjae Jeon __le16 *generate_default_upcase(void)
121e9ea7e0SNamjae Jeon {
131e9ea7e0SNamjae Jeon 	static const int uc_run_table[][3] = { /* Start, End, Add */
141e9ea7e0SNamjae Jeon 	{0x0061, 0x007B,  -32}, {0x0451, 0x045D, -80}, {0x1F70, 0x1F72,  74},
151e9ea7e0SNamjae Jeon 	{0x00E0, 0x00F7,  -32}, {0x045E, 0x0460, -80}, {0x1F72, 0x1F76,  86},
161e9ea7e0SNamjae Jeon 	{0x00F8, 0x00FF,  -32}, {0x0561, 0x0587, -48}, {0x1F76, 0x1F78, 100},
171e9ea7e0SNamjae Jeon 	{0x0256, 0x0258, -205}, {0x1F00, 0x1F08,   8}, {0x1F78, 0x1F7A, 128},
181e9ea7e0SNamjae Jeon 	{0x028A, 0x028C, -217}, {0x1F10, 0x1F16,   8}, {0x1F7A, 0x1F7C, 112},
191e9ea7e0SNamjae Jeon 	{0x03AC, 0x03AD,  -38}, {0x1F20, 0x1F28,   8}, {0x1F7C, 0x1F7E, 126},
201e9ea7e0SNamjae Jeon 	{0x03AD, 0x03B0,  -37}, {0x1F30, 0x1F38,   8}, {0x1FB0, 0x1FB2,   8},
211e9ea7e0SNamjae Jeon 	{0x03B1, 0x03C2,  -32}, {0x1F40, 0x1F46,   8}, {0x1FD0, 0x1FD2,   8},
221e9ea7e0SNamjae Jeon 	{0x03C2, 0x03C3,  -31}, {0x1F51, 0x1F52,   8}, {0x1FE0, 0x1FE2,   8},
231e9ea7e0SNamjae Jeon 	{0x03C3, 0x03CC,  -32}, {0x1F53, 0x1F54,   8}, {0x1FE5, 0x1FE6,   7},
241e9ea7e0SNamjae Jeon 	{0x03CC, 0x03CD,  -64}, {0x1F55, 0x1F56,   8}, {0x2170, 0x2180, -16},
251e9ea7e0SNamjae Jeon 	{0x03CD, 0x03CF,  -63}, {0x1F57, 0x1F58,   8}, {0x24D0, 0x24EA, -26},
261e9ea7e0SNamjae Jeon 	{0x0430, 0x0450,  -32}, {0x1F60, 0x1F68,   8}, {0xFF41, 0xFF5B, -32},
271e9ea7e0SNamjae Jeon 	{0}
281e9ea7e0SNamjae Jeon 	};
291e9ea7e0SNamjae Jeon 
301e9ea7e0SNamjae Jeon 	static const int uc_dup_table[][2] = { /* Start, End */
311e9ea7e0SNamjae Jeon 	{0x0100, 0x012F}, {0x01A0, 0x01A6}, {0x03E2, 0x03EF}, {0x04CB, 0x04CC},
321e9ea7e0SNamjae Jeon 	{0x0132, 0x0137}, {0x01B3, 0x01B7}, {0x0460, 0x0481}, {0x04D0, 0x04EB},
331e9ea7e0SNamjae Jeon 	{0x0139, 0x0149}, {0x01CD, 0x01DD}, {0x0490, 0x04BF}, {0x04EE, 0x04F5},
341e9ea7e0SNamjae Jeon 	{0x014A, 0x0178}, {0x01DE, 0x01EF}, {0x04BF, 0x04BF}, {0x04F8, 0x04F9},
351e9ea7e0SNamjae Jeon 	{0x0179, 0x017E}, {0x01F4, 0x01F5}, {0x04C1, 0x04C4}, {0x1E00, 0x1E95},
361e9ea7e0SNamjae Jeon 	{0x018B, 0x018B}, {0x01FA, 0x0218}, {0x04C7, 0x04C8}, {0x1EA0, 0x1EF9},
371e9ea7e0SNamjae Jeon 	{0}
381e9ea7e0SNamjae Jeon 	};
391e9ea7e0SNamjae Jeon 
401e9ea7e0SNamjae Jeon 	static const int uc_word_table[][2] = { /* Offset, Value */
411e9ea7e0SNamjae Jeon 	{0x00FF, 0x0178}, {0x01AD, 0x01AC}, {0x01F3, 0x01F1}, {0x0269, 0x0196},
421e9ea7e0SNamjae Jeon 	{0x0183, 0x0182}, {0x01B0, 0x01AF}, {0x0253, 0x0181}, {0x026F, 0x019C},
431e9ea7e0SNamjae Jeon 	{0x0185, 0x0184}, {0x01B9, 0x01B8}, {0x0254, 0x0186}, {0x0272, 0x019D},
441e9ea7e0SNamjae Jeon 	{0x0188, 0x0187}, {0x01BD, 0x01BC}, {0x0259, 0x018F}, {0x0275, 0x019F},
451e9ea7e0SNamjae Jeon 	{0x018C, 0x018B}, {0x01C6, 0x01C4}, {0x025B, 0x0190}, {0x0283, 0x01A9},
461e9ea7e0SNamjae Jeon 	{0x0192, 0x0191}, {0x01C9, 0x01C7}, {0x0260, 0x0193}, {0x0288, 0x01AE},
471e9ea7e0SNamjae Jeon 	{0x0199, 0x0198}, {0x01CC, 0x01CA}, {0x0263, 0x0194}, {0x0292, 0x01B7},
481e9ea7e0SNamjae Jeon 	{0x01A8, 0x01A7}, {0x01DD, 0x018E}, {0x0268, 0x0197},
491e9ea7e0SNamjae Jeon 	{0}
501e9ea7e0SNamjae Jeon 	};
511e9ea7e0SNamjae Jeon 
521e9ea7e0SNamjae Jeon 	int i, r;
53*5218cd10SNamjae Jeon 	__le16 *uc;
541e9ea7e0SNamjae Jeon 
55*5218cd10SNamjae Jeon 	uc = kvcalloc(default_upcase_len, sizeof(__le16), GFP_NOFS);
561e9ea7e0SNamjae Jeon 	if (!uc)
571e9ea7e0SNamjae Jeon 		return uc;
581e9ea7e0SNamjae Jeon 	/* Generate the little endian Unicode upcase table used by ntfs. */
591e9ea7e0SNamjae Jeon 	for (i = 0; i < default_upcase_len; i++)
601e9ea7e0SNamjae Jeon 		uc[i] = cpu_to_le16(i);
611e9ea7e0SNamjae Jeon 	for (r = 0; uc_run_table[r][0]; r++)
621e9ea7e0SNamjae Jeon 		for (i = uc_run_table[r][0]; i < uc_run_table[r][1]; i++)
631e9ea7e0SNamjae Jeon 			le16_add_cpu(&uc[i], uc_run_table[r][2]);
641e9ea7e0SNamjae Jeon 	for (r = 0; uc_dup_table[r][0]; r++)
651e9ea7e0SNamjae Jeon 		for (i = uc_dup_table[r][0]; i < uc_dup_table[r][1]; i += 2)
661e9ea7e0SNamjae Jeon 			le16_add_cpu(&uc[i + 1], -1);
671e9ea7e0SNamjae Jeon 	for (r = 0; uc_word_table[r][0]; r++)
681e9ea7e0SNamjae Jeon 		uc[uc_word_table[r][0]] = cpu_to_le16(uc_word_table[r][1]);
691e9ea7e0SNamjae Jeon 	return uc;
701e9ea7e0SNamjae Jeon }
71