Lines Matching +full:- +full:t
1 /*-
16 #define T 1 /* character appears in plain ASCII text */ macro
17 #define I 2 /* character appears in ISO-8859 text */
18 #define X 3 /* character appears in non-ISO extended ASCII (Mac, IBM PC) */
22 F, F, F, F, F, F, F, T, T, T, T, F, T, T, F, F, /* 0x0X */
24 F, F, F, F, F, F, F, F, F, F, F, T, F, F, F, F, /* 0x1X */
25 T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, /* 0x2X */
26 T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, /* 0x3X */
27 T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, /* 0x4X */
28 T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, /* 0x5X */
29 T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, /* 0x6X */
30 T, T, T, T, T, T, T, T, T, T, T, T, T, T, T, F, /* 0x7X */
32 X, X, X, X, X, T, X, X, X, X, X, X, X, X, X, X, /* 0x8X */
43 * looks_utf8 --
44 * Decide whether some text looks like UTF-8. Returns:
46 * -1: invalid UTF-8
47 * 0: uses odd control characters, so doesn't look like text
48 * 1: 7-bit text
49 * 2: definitely UTF-8 text (valid high-bit set bytes)
51 * Based on RFC 3629. UTF-8 with BOM is not accepted.
66 * Even if the whole file is valid UTF-8 sequences, in looks_utf8()
70 if (text_chars[buf[i]] != T) in looks_utf8()
73 return -1; in looks_utf8()
74 } else { /* 11xxxxxx begins UTF-8 */ in looks_utf8()
80 else return -1; in looks_utf8()
86 else return -1; /* F5, F6, F7 */ in looks_utf8()
88 return -1; /* F8~FF */ in looks_utf8()
96 return -1; in looks_utf8()
107 * looks_utf16 --
108 * Decide whether some text looks like UTF-16. Returns:
110 * 0: invalid UTF-16
111 * 1: Little-endian UTF-16
112 * 2: Big-endian UTF-16
145 if (c < 128 && text_chars[c] != T) in looks_utf16()
163 #undef T
168 * decode_utf8 --
169 * Decode a UTF-8 character from byte string to Unicode.
170 * Returns -1 if the first byte is not a UTF-8 leader.
180 int u = -1; in decode_utf8()
200 * decode_utf16 --
201 * Decode a UTF-16 character from byte string to Unicode.
202 * Returns -1 if the first unsigned integer is invalid.
212 int u = -1; in decode_utf16()