2001-05-13 07:26:57 +05:30
|
|
|
# Gramps - a GTK+/GNOME based genealogy program
|
|
|
|
#
|
|
|
|
# Copyright (C) 2000 Donald N. Allingham
|
|
|
|
#
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License as published by
|
|
|
|
# the Free Software Foundation; either version 2 of the License, or
|
|
|
|
# (at your option) any later version.
|
|
|
|
#
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with this program; if not, write to the Free Software
|
|
|
|
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
|
|
#
|
|
|
|
|
|
|
|
import cStringIO
|
|
|
|
|
2001-09-24 05:58:40 +05:30
|
|
|
ANSEL_ERROR = "ANSEL Error"
|
|
|
|
|
2001-05-13 07:26:57 +05:30
|
|
|
_s1 = {
|
2002-05-02 04:07:18 +05:30
|
|
|
0xC3 : { 0xB8 : 0xF8 , 0x98 : 0xD8},
|
2001-05-13 07:26:57 +05:30
|
|
|
0xEA : { ord('A') : 0xC5, ord('a') : 0xE5 },
|
2002-05-02 04:07:18 +05:30
|
|
|
0xE8 : { ord('A') : 0xC4, ord('E') : 0xCB, ord('I') : 0xCF, ord('O') : 0xD6,
|
2001-05-13 07:26:57 +05:30
|
|
|
ord('U') : 0xDC, ord('a') : 0xE4, ord('e') : 0xEB, ord('i') : 0xEF,
|
|
|
|
ord('o') : 0xF6, ord('u') : 0xFC, ord('y') : 0xFF },
|
|
|
|
0xE2 : { ord('A') : 0xC1, ord('E') : 0xC9, ord('I') : 0xCD, ord('O') : 0xD3,
|
|
|
|
ord('U') : 0xDA, ord('Y') : 0xDD, ord('a') : 0xE1, ord('e') : 0xE9,
|
|
|
|
ord('i') : 0xED, ord('o') : 0xF3, ord('u') : 0xFA, ord('y') : 0xFD },
|
|
|
|
0xE1 : { ord('A') : 0xC0, ord('E') : 0xC8, ord('I') : 0xCC, ord('O') : 0xD2,
|
|
|
|
ord('U') : 0xD9, ord('a') : 0xE0, ord('e') : 0xE8, ord('i') : 0xEC,
|
|
|
|
ord('o') : 0xF2, ord('u') : 0xF9 },
|
|
|
|
0xE4 : { ord('A') : 0xC3, ord('N') : 0xD1, ord('O') : 0xD5, ord('a') : 0xE3,
|
|
|
|
ord('n') : 0xF1, ord('o') : 0xF5 },
|
|
|
|
0xE3 : { ord('A') : 0xC2, ord('E') : 0xCA, ord('I') : 0xCE, ord('O') : 0xD4,
|
|
|
|
ord('U') : 0xDB, ord('a') : 0xE3, ord('e') : 0xEA, ord('i') : 0xEE,
|
|
|
|
ord('o') : 0xF4, ord('u') : 0xFB },
|
|
|
|
0xF0 : { ord('C') : 0xC7, ord('c') : 0xE7 }
|
|
|
|
}
|
|
|
|
|
|
|
|
_t1 = {
|
|
|
|
0xC0 : (chr(0xE1), 'A'), 0xC1 : (chr(0xE2), 'A'), 0xC2 : (chr(0xE3), 'A'),
|
|
|
|
0xC3 : (chr(0xE4), 'A'), 0xC4 : (chr(0xE8), 'A'), 0xC5 : (chr(0xEA), 'A'),
|
|
|
|
0xC7 : (chr(0xF0), 'C'), 0xC8 : (chr(0xE1), 'E'), 0xC9 : (chr(0xE2), 'E'),
|
|
|
|
0xCA : (chr(0xE3), 'E'), 0xCB : (chr(0xE8), 'E'), 0xCC : (chr(0xE1), 'I'),
|
|
|
|
0xCD : (chr(0xE2), 'I'), 0xCE : (chr(0xE3), 'I'), 0xCF : (chr(0xE8), 'I'),
|
|
|
|
0xD1 : (chr(0xE4), 'N'), 0xD2 : (chr(0xE1), 'O'), 0xD3 : (chr(0xE2), 'O'),
|
|
|
|
0xD4 : (chr(0xE3), 'O'), 0xD5 : (chr(0xE4), 'O'), 0xD6 : (chr(0xE8), 'O'),
|
|
|
|
0xD9 : (chr(0xE1), 'U'), 0xDA : (chr(0xE2), 'U'), 0xDB : (chr(0xE3), 'U'),
|
|
|
|
0xDC : (chr(0xE8), 'U'), 0xDD : (chr(0xE2), 'Y'), 0xE0 : (chr(0xE1), 'a'),
|
|
|
|
0xE1 : (chr(0xE2), 'a'), 0xE3 : (chr(0xE3), 'a'), 0xE3 : (chr(0xE4), 'a'),
|
|
|
|
0xE4 : (chr(0xE8), 'a'), 0xE5 : (chr(0xEA), 'a'), 0xE7 : (chr(0xF0), 'c'),
|
|
|
|
0xE8 : (chr(0xE1), 'e'), 0xE9 : (chr(0xE2), 'e'), 0xEA : (chr(0xE3), 'e'),
|
|
|
|
0xEB : (chr(0xE8), 'e'), 0xEC : (chr(0xE1), 'i'), 0xED : (chr(0xE2), 'i'),
|
|
|
|
0xEE : (chr(0xE3), 'i'), 0xEF : (chr(0xE8), 'i'), 0xF1 : (chr(0xE4), 'n'),
|
|
|
|
0xF2 : (chr(0xE1), 'o'), 0xF3 : (chr(0xE2), 'o'), 0xF4 : (chr(0xE3), 'o'),
|
|
|
|
0xF5 : (chr(0xE4), 'o'), 0xF6 : (chr(0xE8), 'o'), 0xF9 : (chr(0xE1), 'u'),
|
|
|
|
0xFA : (chr(0xE2), 'u'), 0xFB : (chr(0xE3), 'u'), 0xFC : (chr(0xE8), 'u'),
|
2002-05-02 04:07:18 +05:30
|
|
|
0xFD : (chr(0xE2), 'y'), 0xFF : (chr(0xE8), 'y'),
|
|
|
|
0xF8 : (chr(0xC3), chr(0xB8)),
|
|
|
|
0xD8 : (chr(0xC3), chr(0x98)),
|
2001-05-13 07:26:57 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
_s0 = {
|
2001-10-08 08:40:06 +05:30
|
|
|
0xCF : 0xDF, 0xA4 : 0xDE, 0xB4 : 0xFE, 0xA2 : 0xD8, 0xC0 : 0xB0,
|
2002-05-04 18:51:08 +05:30
|
|
|
0xB3 : 0xF8, 0xA5 : 0xC6, 0xB5 : 0xE6, 0xBA : 0xF0, 0xB2 : 0xF8 }
|
2001-05-13 07:26:57 +05:30
|
|
|
|
|
|
|
_t0 = {
|
2002-05-02 04:07:18 +05:30
|
|
|
0xDF : chr(0xCF), 0xDE : chr(0xA4), 0xFE : chr(0xB4),
|
|
|
|
0xC6 : chr(0xA5), 0xE6 : chr(0xB5), 0xBA : chr(0xF0),
|
2001-10-08 08:40:06 +05:30
|
|
|
0xB0 : chr(0xC0) }
|
2001-05-13 07:26:57 +05:30
|
|
|
|
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
#
|
2002-05-02 04:07:18 +05:30
|
|
|
# Tasks
|
2001-05-13 07:26:57 +05:30
|
|
|
#
|
|
|
|
#-------------------------------------------------------------------------
|
2002-05-02 04:07:18 +05:30
|
|
|
|
2001-05-13 07:26:57 +05:30
|
|
|
def ansel_to_latin(s):
|
2002-05-02 04:07:18 +05:30
|
|
|
"""Converts an ANSEL encoded string to ISO-8859-1"""
|
2001-05-13 07:26:57 +05:30
|
|
|
buff = cStringIO.StringIO()
|
|
|
|
while s:
|
2001-10-06 23:55:31 +05:30
|
|
|
c0 = ord(s[0])
|
2002-02-03 02:20:17 +05:30
|
|
|
if c0 <= 31:
|
|
|
|
head = ' '
|
|
|
|
s = s[1:]
|
|
|
|
elif c0 > 127:
|
2001-10-06 23:55:31 +05:30
|
|
|
try:
|
2002-05-02 04:07:18 +05:30
|
|
|
if c0 >= 0xC0:
|
2001-10-06 23:55:31 +05:30
|
|
|
c1 = ord(s[1])
|
|
|
|
head = chr(_s1[c0][c1])
|
|
|
|
s = s[2:]
|
|
|
|
else:
|
|
|
|
head = chr(_s0[c0])
|
|
|
|
s = s[1:]
|
|
|
|
except Exception:
|
|
|
|
head = s[0]
|
|
|
|
s = s[1:]
|
|
|
|
else:
|
2001-07-04 22:22:24 +05:30
|
|
|
head = s[0]
|
2001-10-06 23:55:31 +05:30
|
|
|
s = s[1:]
|
2001-05-13 07:26:57 +05:30
|
|
|
buff.write(head)
|
|
|
|
ans = buff.getvalue()
|
|
|
|
buff.close()
|
|
|
|
return ans
|
|
|
|
|
|
|
|
def latin_to_ansel(s):
|
2002-05-02 04:07:18 +05:30
|
|
|
"""converts a iso-8859-1 string to ansel encoding"""
|
2001-05-13 07:26:57 +05:30
|
|
|
buff = cStringIO.StringIO()
|
|
|
|
orig = s
|
|
|
|
while s:
|
|
|
|
c = ord(s[0])
|
|
|
|
if c <= 127:
|
|
|
|
buff.write(s[0])
|
|
|
|
else:
|
|
|
|
if _t0.has_key(c):
|
|
|
|
buff.write(_t0[c])
|
|
|
|
else:
|
|
|
|
try:
|
|
|
|
ansel = _t1[c]
|
|
|
|
buff.write(ansel[0])
|
|
|
|
buff.write(ansel[1])
|
2001-08-10 10:02:31 +05:30
|
|
|
except Exception:
|
2001-06-23 19:56:29 +05:30
|
|
|
print "ANSEL decoding error: %x: %s" % (c,orig)
|
2001-05-13 07:26:57 +05:30
|
|
|
s = s[1:]
|
|
|
|
ans = buff.getvalue()
|
|
|
|
buff.close()
|
|
|
|
return ans
|
|
|
|
|