Move _GedcomTokens.py and _GedcomUtils.py into _GedcomParse.py.

svn: r13937
2009-12-29 06:01:43 +00:00 · 2009-12-29 06:01:43 +00:00 · 2c6cf26d60
commit 2c6cf26d60
parent c7b595210f
5 changed files with 576 additions and 654 deletions
--- a/po/POTFILES.in
+++ b/po/POTFILES.in
@ -343,7 +343,6 @@ src/docgen/TextBufDoc.py
 # GrampsDbUtils package
 src/GrampsDbUtils/_GedcomParse.py
 src/GrampsDbUtils/_GedcomTokens.py
 src/GrampsDbUtils/__init__.py
 # GrampsLocale package
--- a/src/GrampsDbUtils/Makefile.am
+++ b/src/GrampsDbUtils/Makefile.am
@ -7,8 +7,6 @@ pkgdatadir = $(datadir)/@PACKAGE@/GrampsDbUtils
 pkgdata_PYTHON = \
 	_GedcomParse.py\
 	_GedcomTokens.py\
 	_GedcomUtils.py\
 	__init__.py
 pkgpyexecdir = @pkgpyexecdir@/GrampsDbUtils
--- a/src/GrampsDbUtils/_GedcomParse.py
+++ b/src/GrampsDbUtils/_GedcomParse.py
--- a/src/GrampsDbUtils/_GedcomTokens.py
+++ b/src/GrampsDbUtils/_GedcomTokens.py
@ -1,242 +0,0 @@
 #
 # Gramps - a GTK+/GNOME based genealogy program
 #
 # Copyright (C) 2000-2005  Donald N. Allingham
 #
 # This program is free software; you can redistribute it and/or modify
 # it under the terms of the GNU General Public License as published by
 # the Free Software Foundation; either version 2 of the License, or
 # (at your option) any later version.
 #
 # This program is distributed in the hope that it will be useful,
 # but WITHOUT ANY WARRANTY; without even the implied warranty of
 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 # GNU General Public License for more details.
 #
 # You should have received a copy of the GNU General Public License
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 #
 # $Id$
 TOKEN_UNKNOWN = 0
 TOKEN_ABBR = 1
 TOKEN_ADDR = 2
 TOKEN_ADOP = 3
 TOKEN_ADR1 = 4
 TOKEN_ADR2 = 5
 TOKEN_AFN = 6
 TOKEN_IGNORE = 7
 TOKEN_REFN = 8
 TOKEN__AKA = 9
 TOKEN_ALIA = 11
 TOKEN_ANCI = 12
 TOKEN_ASSO = 13
 TOKEN_AUTH = 14
 TOKEN_BAPL = 15
 TOKEN_BIRT = 16
 TOKEN__CAT = 17
 TOKEN_CAUS = 18
 TOKEN_CHAN = 19
 TOKEN_CHAR = 20
 TOKEN_CHIL = 21
 TOKEN_CITY = 22
 TOKEN__COMM = 23
 TOKEN_CONC = 24
 TOKEN_CONT = 25
 TOKEN_COPR = 26
 TOKEN_CORP = 27
 TOKEN_CTRY = 28
 TOKEN_DATA = 29
 TOKEN_DATE = 30
 TOKEN_DEAT = 32
 TOKEN_DESI = 33
 TOKEN_DEST = 34
 TOKEN_ENDL = 35
 TOKEN_EVEN = 36
 TOKEN_FAM = 38
 TOKEN_FAMC = 39
 TOKEN_FAMS = 40
 TOKEN_FILE = 41
 TOKEN_FORM = 42
 TOKEN__FREL = 43
 TOKEN_GEDC = 44
 TOKEN_GIVN = 45
 TOKEN__GODP = 46
 TOKEN_HUSB = 47
 TOKEN_INDI = 48
 TOKEN_LABL = 49
 TOKEN_LANG = 50
 TOKEN__LOC = 51
 TOKEN__MARNM = 52
 TOKEN__MREL = 53
 TOKEN__NAME = 54
 TOKEN_NAME = 55
 TOKEN_NCHI = 56
 TOKEN_NICK = 57
 TOKEN_NOTE = 58
 TOKEN_NPFX = 59
 TOKEN_NSFX = 60
 TOKEN_OBJE = 61
 TOKEN_OFFI = 62
 TOKEN_PAGE = 63
 TOKEN_PEDI = 64
 TOKEN_PERI = 65
 TOKEN_PHON = 66
 TOKEN_PLAC = 67
 TOKEN_POST = 68
 TOKEN__PRIMARY = 69
 TOKEN__PRIV = 70
 TOKEN_PUBL = 71
 TOKEN_QUAY = 72
 TOKEN_RELI = 74
 TOKEN_REPO = 75
 TOKEN_RESI = 76
 TOKEN_RFN = 77
 TOKEN_RIN = 78
 TOKEN__SCHEMA = 79
 TOKEN_SEX = 80
 TOKEN_SLGC = 81
 TOKEN_SLGS = 82
 TOKEN_SOUR = 83
 TOKEN_SPFX = 84
 TOKEN_STAE = 85
 TOKEN__STAT = 86
 TOKEN_STAT = 87
 TOKEN_SUBM = 88
 TOKEN_SUBN = 89
 TOKEN_SURN = 90
 TOKEN_TAXT = 91
 TOKEN_TEMP = 92
 TOKEN_TEXT = 93
 TOKEN_TIME = 94
 TOKEN_TITL = 95
 TOKEN__TODO = 96
 TOKEN_TRLR = 97
 TOKEN_TYPE = 98
 TOKEN__UID = 99
 TOKEN_VERS = 100
 TOKEN_WIFE = 101
 TOKEN__WITN = 102
 TOKEN__WTN = 103
 TOKEN_AGNC = 104
 TOKEN_HEAD = 105
 TOKEN_CALN = 106
 TOKEN_MEDI = 107
 TOKEN_RELA = 108
 TOKEN__LKD = 109
 TOKEN_BLOB = 110
 TOKEN_CONL = 111
 TOKEN_AGE  = 112
 TOKEN_RESN = 114
 TOKEN_ID = 115
 TOKEN_GEVENT = 116
 TOKEN_RNOTE = 117
 TOKEN_GATTR = 118
 TOKEN_ATTR = 119
 TOKEN_MAP = 120
 TOKEN_LATI = 121
 TOKEN_LONG = 122
 TOKEN_FACT = 123
 TOKENS = {
    "HEAD"         : TOKEN_HEAD,    "MEDI"         : TOKEN_MEDI,
    "HEADER"       : TOKEN_HEAD,    "TRAILER"      : TOKEN_TRLR,
    "CALL_NUMBER"  : TOKEN_CALN,    "MEDIA"        : TOKEN_MEDI,
    "CALN"         : TOKEN_CALN,    "ABBR"         : TOKEN_ABBR,
    "ABBREVIATION" : TOKEN_ABBR,    "ADDR"         : TOKEN_ADDR,
    "ADDRESS"      : TOKEN_ADDR,    "ADOP"         : TOKEN_ADOP,
    "ADOPT"        : TOKEN_ADOP,    "ADR1"         : TOKEN_ADR1,
    "ADDRESS1"     : TOKEN_ADR1,    "ADR2"         : TOKEN_ADR2,
    "ADDRESS2"     : TOKEN_ADR2,    "AFN"          : TOKEN_AFN,
    "AGE"          : TOKEN_AGE,     "AGNC"         : TOKEN_AGNC,
    "AGENCY"       : TOKEN_IGNORE,  "_AKA"         : TOKEN__AKA,
    "_ALIA"        : TOKEN_ALIA,    "ALIA"         : TOKEN_ALIA,
    "ALIAS"        : TOKEN_ALIA,    "ANCI"         : TOKEN_ANCI,
    "ASSO"         : TOKEN_ASSO,    "ASSOCIATES"   : TOKEN_ASSO,
    "AUTH"         : TOKEN_AUTH,    "AUTHOR"       : TOKEN_AUTH,
    "BAPL"         : TOKEN_BAPL,    "BAPTISM-LDS"  : TOKEN_BAPL,
    "BIRT"         : TOKEN_BIRT,    "BIRTH"        : TOKEN_BIRT,
    "_CAT"         : TOKEN_IGNORE,  "CAUS"         : TOKEN_CAUS,
    "CAUSE"        : TOKEN_CAUS,    "CHAN"         : TOKEN_CHAN,
    "CHANGE"       : TOKEN_CHAN,    "CHAR"         : TOKEN_CHAR,
    "CHARACTER"    : TOKEN_CHAR,    "CHIL"         : TOKEN_CHIL,
    "CHILD"        : TOKEN_CHIL,    "CITY"         : TOKEN_CITY,
    "_COMM"        : TOKEN__COMM,   "CONC"         : TOKEN_CONC,
    "CONCATENTATE" : TOKEN_CONC,    "CONT"         : TOKEN_CONT,
    "CONTINUED"    : TOKEN_CONT,    "CONCATENATION": TOKEN_CONC,
    "CONTINUATION" : TOKEN_CONT,    "COPR"         : TOKEN_COPR,
    "COPYRIGHT"    : TOKEN_COPR,    "CORP"         : TOKEN_CORP,
    "CORPORATION"  : TOKEN_CORP,    "CTRY"         : TOKEN_CTRY,
    "COUNTRY"      : TOKEN_CTRY,    "DATA"         : TOKEN_DATA,
    "DATE"         : TOKEN_DATE,    "_DATE2"       : TOKEN_IGNORE,
    "DEAT"         : TOKEN_DEAT,    "DEATH"        : TOKEN_DEAT,
    "DESI"         : TOKEN_DESI,    "DEST"         : TOKEN_DEST,
    "DESTINATION"  : TOKEN_DEST,    "ENDL"         : TOKEN_ENDL,
    "ENDOWMENT"    : TOKEN_ENDL,    "EVEN"         : TOKEN_EVEN,
    "EVENT"        : TOKEN_EVEN,    "_ANCES_ORDRE" : TOKEN_IGNORE,
    "FAM"          : TOKEN_FAM,     "FAMILY"       : TOKEN_FAM,
    "FAMC"         : TOKEN_FAMC,    "FAMILY_CHILD" : TOKEN_FAMC,
    "FAMS"         : TOKEN_FAMS,    "FAMILY_SPOUSE" : TOKEN_FAMS,
    "FILE"          : TOKEN_FILE,   "FORM"          : TOKEN_FORM,
    "_FREL"         : TOKEN__FREL,  "GEDC"          : TOKEN_GEDC,
    "GEDCOM"        : TOKEN_GEDC,   "GIVN"          : TOKEN_GIVN,
    "GIVEN_NAME"    : TOKEN_GIVN,   "_GODP"         : TOKEN__GODP,
    "HUSB"          : TOKEN_HUSB,   "HUSBAND"       : TOKEN_HUSB,
    "INDI"          : TOKEN_INDI,   "INDIVIDUAL"    : TOKEN_INDI,
    "LABL"          : TOKEN_LABL,   "LABEL"         : TOKEN_LABL,
    "LANG"          : TOKEN_LANG,   "_LOC"          : TOKEN__LOC,
    "_MARNM"        : TOKEN__MARNM, "_MREL"         : TOKEN__MREL,
    "_NAME"         : TOKEN__NAME,  "NAME"          : TOKEN_NAME,
    "NCHI"          : TOKEN_NCHI,   "CHILDREN_COUNT": TOKEN_NCHI,
    "NICK"          : TOKEN_NICK,   "NICKNAME"      : TOKEN_NICK,
    "NOTE"          : TOKEN_NOTE,   "NPFX"          : TOKEN_NPFX,
    "NAME_PREFIX"   : TOKEN_NPFX,   "NSFX"          : TOKEN_NSFX,
    "NAME_SUFFIX"   : TOKEN_NSFX,   "OBJE"          : TOKEN_OBJE,
    "OBJECT"        : TOKEN_OBJE,   "OFFI"          : TOKEN_OFFI,
    "PAGE"          : TOKEN_PAGE,   "PEDIGREE"      : TOKEN_PEDI,
    "PEDI"          : TOKEN_PEDI,   "PERI"          : TOKEN_PERI,
    "PHON"          : TOKEN_PHON,   "PHONE"         : TOKEN_PHON,
    "PHONE_NUMBER"  : TOKEN_PHON,   "PLAC"          : TOKEN_PLAC,
    "PLACE"         : TOKEN_PLAC,   "POST"          : TOKEN_POST,
    "POSTAL_CODE"   : TOKEN_POST,   "_PRIMARY"      : TOKEN__PRIMARY,
    "_PRIV"         : TOKEN__PRIV,  "PUBL"          : TOKEN_PUBL,
    "PUBLICATION"   : TOKEN_PUBL,   "QUAY"          : TOKEN_QUAY,
    "QUALITY_OF_DATA": TOKEN_QUAY,  "REFN"          : TOKEN_REFN,
    "REFERENCE"      : TOKEN_REFN,  "RELI"          : TOKEN_RELI,
    "RELIGION"       : TOKEN_RELI,  "REPO"          : TOKEN_REPO,
    "REPOSITORY"     : TOKEN_REPO,  "RFN"           : TOKEN_RFN,
    "RIN"            : TOKEN_RIN,   "_SCHEMA"       : TOKEN__SCHEMA,
    "SEX"            : TOKEN_SEX,   "SCHEMA"        : TOKEN__SCHEMA,
    "SLGC"           : TOKEN_SLGC,  "SLGS"          : TOKEN_SLGS,
    "SOUR"           : TOKEN_SOUR,  "SOURCE"        : TOKEN_SOUR,
    "SPFX"           : TOKEN_SPFX,  "SURN_PREFIX"   : TOKEN_SPFX,
    "STAE"           : TOKEN_STAE,  "STATE"         : TOKEN_STAE,
    "_STAT"          : TOKEN__STAT, "STAT"          : TOKEN_STAT,
    "STATUS"         : TOKEN_STAT,  "SUBM"          : TOKEN_SUBM,
    "SUBMITTER"      : TOKEN_SUBM,  "SUBN"          : TOKEN_SUBN,
    "SUBMISSION"     : TOKEN_SUBN,  "SURN"          : TOKEN_SURN,
    "SURNAME"        : TOKEN_SURN,  "TAXT"          : TOKEN_TAXT,
    "TEMP"           : TOKEN_TEMP,  "TEMPLE"        : TOKEN_TEMP,
    "TEXT"           : TOKEN_TEXT,  "TIME"          : TOKEN_TIME,
    "TITL"           : TOKEN_TITL,  "TITLE"         : TOKEN_TITL,
    "_TODO"          : TOKEN__TODO, "TRLR"          : TOKEN_TRLR,
    "TRAILER"        : TOKEN_TRLR,  "TYPE"          : TOKEN_TYPE,
    "_UID"           : TOKEN__UID,  "VERS"          : TOKEN_VERS,
    "VERSION"        : TOKEN_VERS,  "WIFE"          : TOKEN_WIFE,
    "_WITN"          : TOKEN__WITN, "_WTN"          : TOKEN__WTN,
    "_CHUR"          : TOKEN_IGNORE,"RELA"          : TOKEN_RELA,
    "_DETAIL"        : TOKEN_IGNORE,"_PREF"         : TOKEN__PRIMARY,
    "_LKD"           : TOKEN__LKD,  "_DATE"         : TOKEN_IGNORE,
    "_SCBK"          : TOKEN_IGNORE,"_TYPE"         : TOKEN_TYPE,
    "_PRIM"          : TOKEN_IGNORE,"_SSHOW"        : TOKEN_IGNORE,
    "_PAREN"         : TOKEN_IGNORE,"BLOB"          : TOKEN_BLOB,
    "CONL"           : TOKEN_CONL,  "RESN"          : TOKEN_RESN,
    "_MEDI"          : TOKEN_MEDI,  "_MASTER"       : TOKEN_IGNORE,
    "_LEVEL"         : TOKEN_IGNORE,"_PUBLISHER"    : TOKEN_IGNORE,
    "MAP"            : TOKEN_MAP,   "LATI"          : TOKEN_LATI,
    "LONG"           : TOKEN_LONG,  "_ITALIC"       : TOKEN_IGNORE,
    "_PAREN"         : TOKEN_IGNORE,"_PLACE"        : TOKEN_IGNORE,
    "FACT"           : TOKEN_FACT,
 }
--- a/src/GrampsDbUtils/_GedcomUtils.py
+++ b/src/GrampsDbUtils/_GedcomUtils.py
@ -1,231 +0,0 @@
 #
 # Gramps - a GTK+/GNOME based genealogy program
 #
 # Copyright (C) 2000-2006  Donald N. Allingham
 #
 # This program is free software; you can redistribute it and/or modify
 # it under the terms of the GNU General Public License as published by
 # the Free Software Foundation; either version 2 of the License, or
 # (at your option) any later version.
 #
 # This program is distributed in the hope that it will be useful,
 # but WITHOUT ANY WARRANTY; without even the implied warranty of
 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 # GNU General Public License for more details.
 #
 # You should have received a copy of the GNU General Public License
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 #
 """
 Support classes to simplify GEDCOM importing
 """
 import re
 import gen.lib
 NAME_RE    = re.compile(r"/?([^/]*)(/([^/]*)(/([^/]*))?)?")
 SURNAME_RE = re.compile(r"/([^/]*)/([^/]*)")
 #-------------------------------------------------------------------------
 #
 # CurrentState
 #
 #-------------------------------------------------------------------------
 class CurrentState(object):
    """
    Keep track of the current state variables.
    """
    def __init__(self, person=None, level=0, event=None, event_ref=None):
        """
        Initialize the object.
        """
        self.name_cnt = 0
        self.person = person
        self.level = level
        self.event = event
        self.event_ref = event_ref
        self.source_ref = None
    def __getattr__(self, name):
        """
        Return the value associated with the specified attribute.
        """
        return self.__dict__.get(name)
    def __setattr__(self, name, value):
        """
        Set the value associated with the specified attribute.
        """
        self.__dict__[name] = value
 #-------------------------------------------------------------------------
 #
 # PlaceParser
 #
 #-------------------------------------------------------------------------
 class PlaceParser(object):
    """
    Provide the ability to parse GEDCOM FORM statements for places, and
    the parse the line of text, mapping the text components to Location
    values based of the FORM statement.
    """
    __field_map = {
 	'addr'          : gen.lib.Location.set_street,
 	'subdivision'   : gen.lib.Location.set_street,
 	'addr1'         : gen.lib.Location.set_street,
 	'adr1'          : gen.lib.Location.set_street,
 	'city'          : gen.lib.Location.set_city,
 	'town'          : gen.lib.Location.set_city,
 	'village'       : gen.lib.Location.set_city,
 	'county'        : gen.lib.Location.set_county,
 	'country'       : gen.lib.Location.set_country,
 	'state'         : gen.lib.Location.set_state,
 	'state/province': gen.lib.Location.set_state,
 	'region'        : gen.lib.Location.set_state,
 	'province'      : gen.lib.Location.set_state,
 	'area code'     : gen.lib.Location.set_postal_code,
 	}
    def __init__(self, line=None):
        self.parse_function = []
        if line:
            self.parse_form(line)
    def parse_form(self, line):
        """
        Parses the GEDCOM PLAC.FORM into a list of function
        pointers (if possible). It does this my mapping the text strings
        (separated by commas) to the corresponding gen.lib.Location
        method via the __field_map variable
        """
        for item in line.data.split(','):
            item = item.lower().strip()
            fcn = self.__field_map.get(item, lambda x, y: None)
            self.parse_function.append(fcn)
    def load_place(self, place, text):
        """
        Takes the text string representing a place, splits it into
        its subcomponents (comma separated), and calls the approriate
        function based of its position, depending on the parsed value
        from the FORM statement.
        """
        items = [item.strip() for item in text.split(',')]
        if len(items) != len(self.parse_function):
            return
        loc = place.get_main_location()
        index = 0
        for item in items:
            self.parse_function[index](loc, item)
            index += 1
 #-------------------------------------------------------------------------
 #
 # IdFinder
 #
 #-------------------------------------------------------------------------
 class IdFinder(object):
    """
    Provide method of finding the next available ID.
    """
    def __init__(self, keys, prefix):
        """
        Initialize the object.
        """
        self.ids = set(keys)
        self.index = 0
        self.prefix = prefix
    def find_next(self):
        """
        Return the next available GRAMPS' ID for a Event object based
        off the person ID prefix.
        @return: Returns the next available index
        @rtype: str
        """
        index = self.prefix % self.index
        while str(index) in self.ids:
            self.index += 1
            index = self.prefix % self.index
        self.ids.add(index)
        self.index += 1
        return index
 #-------------------------------------------------------------------------
 #
 # IdMapper
 #
 #-------------------------------------------------------------------------
 class IdMapper(object):
    def __init__(self, trans, find_next, translate):
        self.translate = translate
        self.trans = trans
        self.find_next = find_next
        self.swap = {}
    def __getitem__(self, gid):
        if self.translate:
            return self.get_translate(gid)
        else:
            return self.no_translate(gid)
    def clean(self, gid):
        temp = gid.strip()
        if len(temp) > 1 and temp[0] == '@' and temp[-1] == '@':
            temp = temp[1:-1]
        return temp
    def no_translate(self, gid):
        return self.clean(gid)
    def get_translate(self, gid):
        gid = self.clean(gid)
        if gid in self.swap:
            return self.swap[gid]
        else:
            if self.trans.get(str(gid)):
                new_val = self.find_next()
            else:
                new_val = gid
        self.swap[gid] = new_val
        return new_val
 #------------------------------------------------------------------------
 #
 # Support functions
 #
 #------------------------------------------------------------------------
 def parse_name_personal(text):
    """
    Parses a GEDCOM NAME value into an Name structure
    """
    name = gen.lib.Name()
    match = SURNAME_RE.match(text)
    if match:
        names = match.groups()
        name.set_first_name(names[1].strip())
        name.set_surname(names[0].strip())
    else:
        try:
            names = NAME_RE.match(text).groups()
            name.set_first_name(names[0].strip())
            name.set_surname(names[2].strip())
            name.set_suffix(names[4].strip())
        except:
            name.set_first_name(text.strip())
    return name
 def extract_id(value):
    """
    Extracts a value to use for the GRAMPS ID value from the GEDCOM
    reference token. The value should be in the form of @XYZ@, and the
    returned value will be XYZ
    """
    return value.strip()[1:-1]