1*c2d2c5c0SNicolas Pitre/* SPDX-License-Identifier: GPL-2.0 */ 2*c2d2c5c0SNicolas Pitre/* 3*c2d2c5c0SNicolas Pitre * ucs_recompose_table.h - Unicode character recomposition 4*c2d2c5c0SNicolas Pitre * 5*c2d2c5c0SNicolas Pitre * Auto-generated by gen_ucs_recompose_table.py 6*c2d2c5c0SNicolas Pitre * 7*c2d2c5c0SNicolas Pitre * Unicode Version: 16.0.0 8*c2d2c5c0SNicolas Pitre * 9*c2d2c5c0SNicolas Pitre * This file contains a table with most commonly used Latin, Greek, and 10*c2d2c5c0SNicolas Pitre * Cyrillic recomposition pairs only (71 entries). To generate a table with 11*c2d2c5c0SNicolas Pitre * all possible recomposition pairs from the Unicode BMP (1000 entries) 12*c2d2c5c0SNicolas Pitre * instead, run: 13*c2d2c5c0SNicolas Pitre * 14*c2d2c5c0SNicolas Pitre * python gen_ucs_recompose_table.py --full 15*c2d2c5c0SNicolas Pitre */ 16*c2d2c5c0SNicolas Pitre 17*c2d2c5c0SNicolas Pitre/* 18*c2d2c5c0SNicolas Pitre * Table of most commonly used Latin, Greek, and Cyrillic recomposition pairs only 19*c2d2c5c0SNicolas Pitre * Sorted by base character and then combining mark for binary search 20*c2d2c5c0SNicolas Pitre */ 21*c2d2c5c0SNicolas Pitrestatic const struct ucs_recomposition ucs_recomposition_table[] = { 22*c2d2c5c0SNicolas Pitre { 0x0041, 0x0300, 0x00C0 }, /* LATIN CAPITAL LETTER A + COMBINING GRAVE ACCENT = LATIN CAPITAL LETTER A WITH GRAVE */ 23*c2d2c5c0SNicolas Pitre { 0x0041, 0x0301, 0x00C1 }, /* LATIN CAPITAL LETTER A + COMBINING ACUTE ACCENT = LATIN CAPITAL LETTER A WITH ACUTE */ 24*c2d2c5c0SNicolas Pitre { 0x0041, 0x0302, 0x00C2 }, /* LATIN CAPITAL LETTER A + COMBINING CIRCUMFLEX ACCENT = LATIN CAPITAL LETTER A WITH CIRCUMFLEX */ 25*c2d2c5c0SNicolas Pitre { 0x0041, 0x0303, 0x00C3 }, /* LATIN CAPITAL LETTER A + COMBINING TILDE = LATIN CAPITAL LETTER A WITH TILDE */ 26*c2d2c5c0SNicolas Pitre { 0x0041, 0x0308, 0x00C4 }, /* LATIN CAPITAL LETTER A + COMBINING DIAERESIS = LATIN CAPITAL LETTER A WITH DIAERESIS */ 27*c2d2c5c0SNicolas Pitre { 0x0041, 0x030A, 0x00C5 }, /* LATIN CAPITAL LETTER A + COMBINING RING ABOVE = LATIN CAPITAL LETTER A WITH RING ABOVE */ 28*c2d2c5c0SNicolas Pitre { 0x0043, 0x0327, 0x00C7 }, /* LATIN CAPITAL LETTER C + COMBINING CEDILLA = LATIN CAPITAL LETTER C WITH CEDILLA */ 29*c2d2c5c0SNicolas Pitre { 0x0045, 0x0300, 0x00C8 }, /* LATIN CAPITAL LETTER E + COMBINING GRAVE ACCENT = LATIN CAPITAL LETTER E WITH GRAVE */ 30*c2d2c5c0SNicolas Pitre { 0x0045, 0x0301, 0x00C9 }, /* LATIN CAPITAL LETTER E + COMBINING ACUTE ACCENT = LATIN CAPITAL LETTER E WITH ACUTE */ 31*c2d2c5c0SNicolas Pitre { 0x0045, 0x0302, 0x00CA }, /* LATIN CAPITAL LETTER E + COMBINING CIRCUMFLEX ACCENT = LATIN CAPITAL LETTER E WITH CIRCUMFLEX */ 32*c2d2c5c0SNicolas Pitre { 0x0045, 0x0308, 0x00CB }, /* LATIN CAPITAL LETTER E + COMBINING DIAERESIS = LATIN CAPITAL LETTER E WITH DIAERESIS */ 33*c2d2c5c0SNicolas Pitre { 0x0049, 0x0300, 0x00CC }, /* LATIN CAPITAL LETTER I + COMBINING GRAVE ACCENT = LATIN CAPITAL LETTER I WITH GRAVE */ 34*c2d2c5c0SNicolas Pitre { 0x0049, 0x0301, 0x00CD }, /* LATIN CAPITAL LETTER I + COMBINING ACUTE ACCENT = LATIN CAPITAL LETTER I WITH ACUTE */ 35*c2d2c5c0SNicolas Pitre { 0x0049, 0x0302, 0x00CE }, /* LATIN CAPITAL LETTER I + COMBINING CIRCUMFLEX ACCENT = LATIN CAPITAL LETTER I WITH CIRCUMFLEX */ 36*c2d2c5c0SNicolas Pitre { 0x0049, 0x0308, 0x00CF }, /* LATIN CAPITAL LETTER I + COMBINING DIAERESIS = LATIN CAPITAL LETTER I WITH DIAERESIS */ 37*c2d2c5c0SNicolas Pitre { 0x004E, 0x0303, 0x00D1 }, /* LATIN CAPITAL LETTER N + COMBINING TILDE = LATIN CAPITAL LETTER N WITH TILDE */ 38*c2d2c5c0SNicolas Pitre { 0x004F, 0x0300, 0x00D2 }, /* LATIN CAPITAL LETTER O + COMBINING GRAVE ACCENT = LATIN CAPITAL LETTER O WITH GRAVE */ 39*c2d2c5c0SNicolas Pitre { 0x004F, 0x0301, 0x00D3 }, /* LATIN CAPITAL LETTER O + COMBINING ACUTE ACCENT = LATIN CAPITAL LETTER O WITH ACUTE */ 40*c2d2c5c0SNicolas Pitre { 0x004F, 0x0302, 0x00D4 }, /* LATIN CAPITAL LETTER O + COMBINING CIRCUMFLEX ACCENT = LATIN CAPITAL LETTER O WITH CIRCUMFLEX */ 41*c2d2c5c0SNicolas Pitre { 0x004F, 0x0303, 0x00D5 }, /* LATIN CAPITAL LETTER O + COMBINING TILDE = LATIN CAPITAL LETTER O WITH TILDE */ 42*c2d2c5c0SNicolas Pitre { 0x004F, 0x0308, 0x00D6 }, /* LATIN CAPITAL LETTER O + COMBINING DIAERESIS = LATIN CAPITAL LETTER O WITH DIAERESIS */ 43*c2d2c5c0SNicolas Pitre { 0x0055, 0x0300, 0x00D9 }, /* LATIN CAPITAL LETTER U + COMBINING GRAVE ACCENT = LATIN CAPITAL LETTER U WITH GRAVE */ 44*c2d2c5c0SNicolas Pitre { 0x0055, 0x0301, 0x00DA }, /* LATIN CAPITAL LETTER U + COMBINING ACUTE ACCENT = LATIN CAPITAL LETTER U WITH ACUTE */ 45*c2d2c5c0SNicolas Pitre { 0x0055, 0x0302, 0x00DB }, /* LATIN CAPITAL LETTER U + COMBINING CIRCUMFLEX ACCENT = LATIN CAPITAL LETTER U WITH CIRCUMFLEX */ 46*c2d2c5c0SNicolas Pitre { 0x0055, 0x0308, 0x00DC }, /* LATIN CAPITAL LETTER U + COMBINING DIAERESIS = LATIN CAPITAL LETTER U WITH DIAERESIS */ 47*c2d2c5c0SNicolas Pitre { 0x0059, 0x0301, 0x00DD }, /* LATIN CAPITAL LETTER Y + COMBINING ACUTE ACCENT = LATIN CAPITAL LETTER Y WITH ACUTE */ 48*c2d2c5c0SNicolas Pitre { 0x0061, 0x0300, 0x00E0 }, /* LATIN SMALL LETTER A + COMBINING GRAVE ACCENT = LATIN SMALL LETTER A WITH GRAVE */ 49*c2d2c5c0SNicolas Pitre { 0x0061, 0x0301, 0x00E1 }, /* LATIN SMALL LETTER A + COMBINING ACUTE ACCENT = LATIN SMALL LETTER A WITH ACUTE */ 50*c2d2c5c0SNicolas Pitre { 0x0061, 0x0302, 0x00E2 }, /* LATIN SMALL LETTER A + COMBINING CIRCUMFLEX ACCENT = LATIN SMALL LETTER A WITH CIRCUMFLEX */ 51*c2d2c5c0SNicolas Pitre { 0x0061, 0x0303, 0x00E3 }, /* LATIN SMALL LETTER A + COMBINING TILDE = LATIN SMALL LETTER A WITH TILDE */ 52*c2d2c5c0SNicolas Pitre { 0x0061, 0x0308, 0x00E4 }, /* LATIN SMALL LETTER A + COMBINING DIAERESIS = LATIN SMALL LETTER A WITH DIAERESIS */ 53*c2d2c5c0SNicolas Pitre { 0x0061, 0x030A, 0x00E5 }, /* LATIN SMALL LETTER A + COMBINING RING ABOVE = LATIN SMALL LETTER A WITH RING ABOVE */ 54*c2d2c5c0SNicolas Pitre { 0x0063, 0x0327, 0x00E7 }, /* LATIN SMALL LETTER C + COMBINING CEDILLA = LATIN SMALL LETTER C WITH CEDILLA */ 55*c2d2c5c0SNicolas Pitre { 0x0065, 0x0300, 0x00E8 }, /* LATIN SMALL LETTER E + COMBINING GRAVE ACCENT = LATIN SMALL LETTER E WITH GRAVE */ 56*c2d2c5c0SNicolas Pitre { 0x0065, 0x0301, 0x00E9 }, /* LATIN SMALL LETTER E + COMBINING ACUTE ACCENT = LATIN SMALL LETTER E WITH ACUTE */ 57*c2d2c5c0SNicolas Pitre { 0x0065, 0x0302, 0x00EA }, /* LATIN SMALL LETTER E + COMBINING CIRCUMFLEX ACCENT = LATIN SMALL LETTER E WITH CIRCUMFLEX */ 58*c2d2c5c0SNicolas Pitre { 0x0065, 0x0308, 0x00EB }, /* LATIN SMALL LETTER E + COMBINING DIAERESIS = LATIN SMALL LETTER E WITH DIAERESIS */ 59*c2d2c5c0SNicolas Pitre { 0x0069, 0x0300, 0x00EC }, /* LATIN SMALL LETTER I + COMBINING GRAVE ACCENT = LATIN SMALL LETTER I WITH GRAVE */ 60*c2d2c5c0SNicolas Pitre { 0x0069, 0x0301, 0x00ED }, /* LATIN SMALL LETTER I + COMBINING ACUTE ACCENT = LATIN SMALL LETTER I WITH ACUTE */ 61*c2d2c5c0SNicolas Pitre { 0x0069, 0x0302, 0x00EE }, /* LATIN SMALL LETTER I + COMBINING CIRCUMFLEX ACCENT = LATIN SMALL LETTER I WITH CIRCUMFLEX */ 62*c2d2c5c0SNicolas Pitre { 0x0069, 0x0308, 0x00EF }, /* LATIN SMALL LETTER I + COMBINING DIAERESIS = LATIN SMALL LETTER I WITH DIAERESIS */ 63*c2d2c5c0SNicolas Pitre { 0x006E, 0x0303, 0x00F1 }, /* LATIN SMALL LETTER N + COMBINING TILDE = LATIN SMALL LETTER N WITH TILDE */ 64*c2d2c5c0SNicolas Pitre { 0x006F, 0x0300, 0x00F2 }, /* LATIN SMALL LETTER O + COMBINING GRAVE ACCENT = LATIN SMALL LETTER O WITH GRAVE */ 65*c2d2c5c0SNicolas Pitre { 0x006F, 0x0301, 0x00F3 }, /* LATIN SMALL LETTER O + COMBINING ACUTE ACCENT = LATIN SMALL LETTER O WITH ACUTE */ 66*c2d2c5c0SNicolas Pitre { 0x006F, 0x0302, 0x00F4 }, /* LATIN SMALL LETTER O + COMBINING CIRCUMFLEX ACCENT = LATIN SMALL LETTER O WITH CIRCUMFLEX */ 67*c2d2c5c0SNicolas Pitre { 0x006F, 0x0303, 0x00F5 }, /* LATIN SMALL LETTER O + COMBINING TILDE = LATIN SMALL LETTER O WITH TILDE */ 68*c2d2c5c0SNicolas Pitre { 0x006F, 0x0308, 0x00F6 }, /* LATIN SMALL LETTER O + COMBINING DIAERESIS = LATIN SMALL LETTER O WITH DIAERESIS */ 69*c2d2c5c0SNicolas Pitre { 0x0075, 0x0300, 0x00F9 }, /* LATIN SMALL LETTER U + COMBINING GRAVE ACCENT = LATIN SMALL LETTER U WITH GRAVE */ 70*c2d2c5c0SNicolas Pitre { 0x0075, 0x0301, 0x00FA }, /* LATIN SMALL LETTER U + COMBINING ACUTE ACCENT = LATIN SMALL LETTER U WITH ACUTE */ 71*c2d2c5c0SNicolas Pitre { 0x0075, 0x0302, 0x00FB }, /* LATIN SMALL LETTER U + COMBINING CIRCUMFLEX ACCENT = LATIN SMALL LETTER U WITH CIRCUMFLEX */ 72*c2d2c5c0SNicolas Pitre { 0x0075, 0x0308, 0x00FC }, /* LATIN SMALL LETTER U + COMBINING DIAERESIS = LATIN SMALL LETTER U WITH DIAERESIS */ 73*c2d2c5c0SNicolas Pitre { 0x0079, 0x0301, 0x00FD }, /* LATIN SMALL LETTER Y + COMBINING ACUTE ACCENT = LATIN SMALL LETTER Y WITH ACUTE */ 74*c2d2c5c0SNicolas Pitre { 0x0079, 0x0308, 0x00FF }, /* LATIN SMALL LETTER Y + COMBINING DIAERESIS = LATIN SMALL LETTER Y WITH DIAERESIS */ 75*c2d2c5c0SNicolas Pitre { 0x0391, 0x0301, 0x0386 }, /* GREEK CAPITAL LETTER ALPHA + COMBINING ACUTE ACCENT = GREEK CAPITAL LETTER ALPHA WITH TONOS */ 76*c2d2c5c0SNicolas Pitre { 0x0395, 0x0301, 0x0388 }, /* GREEK CAPITAL LETTER EPSILON + COMBINING ACUTE ACCENT = GREEK CAPITAL LETTER EPSILON WITH TONOS */ 77*c2d2c5c0SNicolas Pitre { 0x0397, 0x0301, 0x0389 }, /* GREEK CAPITAL LETTER ETA + COMBINING ACUTE ACCENT = GREEK CAPITAL LETTER ETA WITH TONOS */ 78*c2d2c5c0SNicolas Pitre { 0x0399, 0x0301, 0x038A }, /* GREEK CAPITAL LETTER IOTA + COMBINING ACUTE ACCENT = GREEK CAPITAL LETTER IOTA WITH TONOS */ 79*c2d2c5c0SNicolas Pitre { 0x039F, 0x0301, 0x038C }, /* GREEK CAPITAL LETTER OMICRON + COMBINING ACUTE ACCENT = GREEK CAPITAL LETTER OMICRON WITH TONOS */ 80*c2d2c5c0SNicolas Pitre { 0x03A5, 0x0301, 0x038E }, /* GREEK CAPITAL LETTER UPSILON + COMBINING ACUTE ACCENT = GREEK CAPITAL LETTER UPSILON WITH TONOS */ 81*c2d2c5c0SNicolas Pitre { 0x03A9, 0x0301, 0x038F }, /* GREEK CAPITAL LETTER OMEGA + COMBINING ACUTE ACCENT = GREEK CAPITAL LETTER OMEGA WITH TONOS */ 82*c2d2c5c0SNicolas Pitre { 0x03B1, 0x0301, 0x03AC }, /* GREEK SMALL LETTER ALPHA + COMBINING ACUTE ACCENT = GREEK SMALL LETTER ALPHA WITH TONOS */ 83*c2d2c5c0SNicolas Pitre { 0x03B5, 0x0301, 0x03AD }, /* GREEK SMALL LETTER EPSILON + COMBINING ACUTE ACCENT = GREEK SMALL LETTER EPSILON WITH TONOS */ 84*c2d2c5c0SNicolas Pitre { 0x03B7, 0x0301, 0x03AE }, /* GREEK SMALL LETTER ETA + COMBINING ACUTE ACCENT = GREEK SMALL LETTER ETA WITH TONOS */ 85*c2d2c5c0SNicolas Pitre { 0x03B9, 0x0301, 0x03AF }, /* GREEK SMALL LETTER IOTA + COMBINING ACUTE ACCENT = GREEK SMALL LETTER IOTA WITH TONOS */ 86*c2d2c5c0SNicolas Pitre { 0x03BF, 0x0301, 0x03CC }, /* GREEK SMALL LETTER OMICRON + COMBINING ACUTE ACCENT = GREEK SMALL LETTER OMICRON WITH TONOS */ 87*c2d2c5c0SNicolas Pitre { 0x03C5, 0x0301, 0x03CD }, /* GREEK SMALL LETTER UPSILON + COMBINING ACUTE ACCENT = GREEK SMALL LETTER UPSILON WITH TONOS */ 88*c2d2c5c0SNicolas Pitre { 0x03C9, 0x0301, 0x03CE }, /* GREEK SMALL LETTER OMEGA + COMBINING ACUTE ACCENT = GREEK SMALL LETTER OMEGA WITH TONOS */ 89*c2d2c5c0SNicolas Pitre { 0x0418, 0x0306, 0x0419 }, /* CYRILLIC CAPITAL LETTER I + COMBINING BREVE = CYRILLIC CAPITAL LETTER SHORT I */ 90*c2d2c5c0SNicolas Pitre { 0x0423, 0x0306, 0x040E }, /* CYRILLIC CAPITAL LETTER U + COMBINING BREVE = CYRILLIC CAPITAL LETTER SHORT U */ 91*c2d2c5c0SNicolas Pitre { 0x0438, 0x0306, 0x0439 }, /* CYRILLIC SMALL LETTER I + COMBINING BREVE = CYRILLIC SMALL LETTER SHORT I */ 92*c2d2c5c0SNicolas Pitre { 0x0443, 0x0306, 0x045E }, /* CYRILLIC SMALL LETTER U + COMBINING BREVE = CYRILLIC SMALL LETTER SHORT U */ 93*c2d2c5c0SNicolas Pitre}; 94*c2d2c5c0SNicolas Pitre 95*c2d2c5c0SNicolas Pitre/* 96*c2d2c5c0SNicolas Pitre * Boundary values for quick rejection 97*c2d2c5c0SNicolas Pitre * These are calculated by analyzing the table during generation 98*c2d2c5c0SNicolas Pitre */ 99*c2d2c5c0SNicolas Pitre#define UCS_RECOMPOSE_MIN_BASE 0x0041 100*c2d2c5c0SNicolas Pitre#define UCS_RECOMPOSE_MAX_BASE 0x0443 101*c2d2c5c0SNicolas Pitre#define UCS_RECOMPOSE_MIN_MARK 0x0300 102*c2d2c5c0SNicolas Pitre#define UCS_RECOMPOSE_MAX_MARK 0x0327 103