xref: /freebsd/crypto/heimdal/lib/wind/UnicodeData.py (revision 6a068746777241722b2b32c5d0bc443a2a64d80b)
1*ae771770SStanislav Sedov#!/usr/local/bin/python
2*ae771770SStanislav Sedov# -*- coding: iso-8859-1 -*-
3*ae771770SStanislav Sedov
4*ae771770SStanislav Sedov# $Id$
5*ae771770SStanislav Sedov
6*ae771770SStanislav Sedov# Copyright (c) 2004 Kungliga Tekniska Högskolan
7*ae771770SStanislav Sedov# (Royal Institute of Technology, Stockholm, Sweden).
8*ae771770SStanislav Sedov# All rights reserved.
9*ae771770SStanislav Sedov#
10*ae771770SStanislav Sedov# Redistribution and use in source and binary forms, with or without
11*ae771770SStanislav Sedov# modification, are permitted provided that the following conditions
12*ae771770SStanislav Sedov# are met:
13*ae771770SStanislav Sedov#
14*ae771770SStanislav Sedov# 1. Redistributions of source code must retain the above copyright
15*ae771770SStanislav Sedov#    notice, this list of conditions and the following disclaimer.
16*ae771770SStanislav Sedov#
17*ae771770SStanislav Sedov# 2. Redistributions in binary form must reproduce the above copyright
18*ae771770SStanislav Sedov#    notice, this list of conditions and the following disclaimer in the
19*ae771770SStanislav Sedov#    documentation and/or other materials provided with the distribution.
20*ae771770SStanislav Sedov#
21*ae771770SStanislav Sedov# 3. Neither the name of the Institute nor the names of its contributors
22*ae771770SStanislav Sedov#    may be used to endorse or promote products derived from this software
23*ae771770SStanislav Sedov#    without specific prior written permission.
24*ae771770SStanislav Sedov#
25*ae771770SStanislav Sedov# THIS SOFTWARE IS PROVIDED BY THE INSTITUTE AND CONTRIBUTORS ``AS IS'' AND
26*ae771770SStanislav Sedov# ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27*ae771770SStanislav Sedov# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
28*ae771770SStanislav Sedov# ARE DISCLAIMED.  IN NO EVENT SHALL THE INSTITUTE OR CONTRIBUTORS BE LIABLE
29*ae771770SStanislav Sedov# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
30*ae771770SStanislav Sedov# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
31*ae771770SStanislav Sedov# OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
32*ae771770SStanislav Sedov# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
33*ae771770SStanislav Sedov# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
34*ae771770SStanislav Sedov# OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
35*ae771770SStanislav Sedov# SUCH DAMAGE.
36*ae771770SStanislav Sedov
37*ae771770SStanislav Sedovimport re
38*ae771770SStanislav Sedovimport string
39*ae771770SStanislav Sedov
def read(filename):
    """Parse a UnicodeData-style file into a dict keyed by code point.

    Each line has any '#' comment removed and is then split on ';'.
    The first field is parsed as a hexadecimal integer and used as the
    key; the remaining fields are stored, unmodified, as a list of
    strings.  The final field of each entry keeps the line's trailing
    newline, exactly as it was read from the file.

    Lines that are empty or contain only whitespace once the comment
    has been removed are skipped.

    filename -- path of the file to read.

    Returns a dict mapping int code points to lists of field strings.

    Raises Exception if the same code point appears more than once, and
    ValueError if the first field of a line is not a hexadecimal number.
    """
    comment = re.compile(r'#.*$')
    ret = {}
    # The with-statement closes the file even when parsing raises.
    with open(filename, 'r') as ud:
        for line in ud:
            line = comment.sub('', line)
            # Skip anything with no data left: blank lines, whitespace-only
            # lines and comment-only lines (including a final comment line
            # that lacks a trailing newline).
            if not line.strip():
                continue
            fields = line.split(';')
            key = int(fields[0], 0x10)
            if key in ret:
                raise Exception('Duplicate key in UnicodeData')
            ret[key] = fields[1:]
    return ret
58