xref: /freebsd/contrib/file/magic/Magdir/unicode (revision 48c779cdecb5f803e5fe5d761987e976ca9609db)
1b6cee71dSXin LI
2b6cee71dSXin LI#------------------------------------------------------------------------------
3*48c779cdSXin LI# $File: unicode,v 1.7 2019/02/19 20:34:42 christos Exp $
4b6cee71dSXin LI# Unicode:  BOM prefixed text files - Adrian Havill <havill@turbolinux.co.jp>
5*48c779cdSXin LI# These types are recognised in file_ascmagic so these encodings can be
6*48c779cdSXin LI# treated by text patterns.  Missing types are already dealt with internally.
7b6cee71dSXin LI#
# Each rule below compares a literal byte string against the data at
# offset 0; on a match the text in the last column is reported.
# Per the header above, these strings are the byte-order-mark prefixes
# of the named encodings.
#
# UTF-7: four rules whose strings differ only in the fourth character
# (8, 9, + or /).
8b6cee71dSXin LI0	string	+/v8			Unicode text, UTF-7
9b6cee71dSXin LI0	string	+/v9			Unicode text, UTF-7
10b6cee71dSXin LI0	string	+/v+			Unicode text, UTF-7
11b6cee71dSXin LI0	string	+/v/			Unicode text, UTF-7
# Octal escapes \335\163\146\163 are the bytes DD 73 66 73.
12b6cee71dSXin LI0	string	\335\163\146\163	Unicode text, UTF-8-EBCDIC
# \000\000\376\377 is 00 00 FE FF; the little-endian rule is the same
# four bytes in reverse order (FF FE 00 00).
13b6cee71dSXin LI0	string	\000\000\376\377	Unicode text, UTF-32, big-endian
14b6cee71dSXin LI0	string	\377\376\000\000	Unicode text, UTF-32, little-endian
# \016\376\377 is the three bytes 0E FE FF.
15b6cee71dSXin LI0	string	\016\376\377		Unicode text, SCSU (Standard Compression Scheme for Unicode)
16