gramps/src/plugins/import/ImportGeneWeb.py

931 lines
36 KiB
Python
Raw Normal View History

#
# Gramps - a GTK+/GNOME based genealogy program
#
# Copyright (C) 2000-2006 Martin Hawlisch, Donald N. Allingham
# Copyright (C) 2008 Brian G. Matherly
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
#
# $Id$
"Import from GeneWeb"
#-------------------------------------------------------------------------
#
# standard python modules
#
#-------------------------------------------------------------------------
import re
import time
from gettext import gettext as _
2009-01-31 16:59:44 +05:30
from gettext import ngettext
2006-03-05 10:01:24 +05:30
#------------------------------------------------------------------------
#
# Set up logging
#
#------------------------------------------------------------------------
import logging
log = logging.getLogger(".ImportGeneWeb")
#-------------------------------------------------------------------------
#
# GRAMPS modules
#
#-------------------------------------------------------------------------
import Errors
import gen.lib
from QuestionDialog import ErrorDialog
from gen.plug import PluginManager, ImportPlugin
2005-05-24 18:38:06 +05:30
from htmlentitydefs import name2codepoint
# A GeneWeb date field: an optional prefix (precision or death-reason
# letters), the date itself (year, month/year or day/month/year), an optional
# calendar letter, and an optional ".." followed by a second date with its
# own calendar letter.  The calendar class is [JHF]; the former [J|H|F] also
# accepted a literal "|" as a "calendar".
_date_parse = re.compile(
    r'([kmes~?<>]+)?([0-9/]+)([JHF])?(\.\.)?([0-9/]+)?([JHF])?')

# A free-text date, written in the file as 0(some text).
_text_parse = re.compile(r'0\((.*)\)')

# Date prefix character -> Gramps date modifier.
_mod_map = {
    '>' : gen.lib.Date.MOD_AFTER,
    '<' : gen.lib.Date.MOD_BEFORE,
    '~' : gen.lib.Date.MOD_ABOUT,
    }

# Calendar letter following a date -> Gramps calendar constant.
_cal_map = {
    'J' : gen.lib.Date.CAL_JULIAN,
    'H' : gen.lib.Date.CAL_HEBREW,
    'F' : gen.lib.Date.CAL_FRENCH,
    }

# When True, GeneWebParser.debug() prints its trace messages.
enable_debug = False
#-------------------------------------------------------------------------
#
#
#
#-------------------------------------------------------------------------
def importData(database, filename, cb=None):
    """Import the GeneWeb file `filename` into `database`.

    An IOError raised while opening or reading the file is reported to the
    user through an ErrorDialog instead of being propagated.  The file
    opened by the parser is always closed before returning.

    database -- database object handed to GeneWebParser
    filename -- path of the GeneWeb file to read
    cb       -- accepted for interface compatibility; not used here

    Always returns None.
    """
    # sys.exc_info() is used instead of "except IOError, msg" so the block
    # parses on both old and new Python versions.
    import sys

    try:
        g = GeneWebParser(database, filename)
    except IOError:
        msg = sys.exc_info()[1]
        ErrorDialog(_("%s could not be opened\n") % filename, str(msg))
        return

    try:
        try:
            g.parse_geneweb_file()
        except IOError:
            msg = sys.exc_info()[1]
            errmsg = _("%s could not be opened\n") % filename
            ErrorDialog(errmsg, str(msg))
            return
    finally:
        # The parser opens the file in its constructor and never closes it.
        g.f.close()
#-------------------------------------------------------------------------
# For a description of the file format see
# http://cristal.inria.fr/~ddr/GeneWeb/en/gwformat.htm
#-------------------------------------------------------------------------
class GeneWebParser:
    """Line-oriented parser that loads a GeneWeb file into a database."""

    def __init__(self, dbase, file):
        """Open `file` for reading and remember the target database.

        dbase -- database object that receives the imported data
        file  -- path of the GeneWeb file; opened immediately, so an
                 IOError from open() propagates to the caller
        """
        self.db = dbase
        self.f = open(file,"rU")
        self.filename = file
        # Fallback encoding used when a line is not plain ASCII; an
        # "encoding:" line in the file may replace it later.
        self.encoding = 'iso-8859-1'
        # get_next_line() increments this counter, so it must exist even
        # before parse_geneweb_file() resets it.
        self.lineno = 0
        # Read by read_relation_lines(); set by read_relationship_person().
        self.current_relationship_person_handle = None
def get_next_line(self):
    """Return the next line of the file, stripped and as unicode.

    The line counter is advanced on every call.  At end of file None is
    returned.  A line that cannot be converted with the default codec is
    decoded with self.encoding instead.
    """
    self.lineno += 1
    raw = self.f.readline()
    if not raw:
        # readline() yields an empty string only at end of file.
        return None
    stripped = raw.strip()
    try:
        return unicode(stripped)
    except UnicodeDecodeError:
        return unicode(stripped, self.encoding)
def parse_geneweb_file(self):
    """Read the whole file and store its contents in the database.

    All work happens inside one batch transaction with database signals
    disabled.  Each non-empty line is dispatched on its first
    space-separated token.  Unknown tokens are reported on stdout and
    skipped.  A summary is printed at the end.

    Always returns None.
    """
    import sys

    self.trans = self.db.transaction_begin("",batch=True)
    self.db.disable_signals()
    t = time.time()
    self.lineno = 0
    self.index = 0
    self.fam_count = 0
    self.indi_count = 0

    self.fkeys = []
    self.ikeys = {}
    self.pkeys = {}
    self.skeys = {}

    self.current_mode = None
    self.current_family = None
    self.current_husband_handle = None
    self.current_child_birthplace_handle = None
    self.current_child_source_handle = None
    self.current_relationship_person_handle = None

    # Tokens whose handler takes (line, fields) and needs no mode change.
    line_handlers = {
        "src": self.read_source_line,
        "wit": self.read_witness_line,
        "wit:": self.read_witness_line,
        "cbp": self.read_children_birthplace_line,
        "csrc": self.read_children_source_line,
        "comm": self.read_family_comment,
        "notes": self.read_person_notes_lines,
        "notes-db": self.read_database_notes_lines,
        }

    try:
        while True:
            line = self.get_next_line()
            if line is None:
                break
            if line == "":
                continue

            fields = line.split(" ")
            token = fields[0]

            self.debug("LINE: %s" %line)
            if token == "fam":
                self.current_mode = "fam"
                self.read_family_line(line,fields)
            elif token == "rel":
                self.current_mode = "rel"
                self.read_relationship_person(line,fields)
            elif token == "beg" and self.current_mode == "fam":
                self.read_children_lines()
            elif token == "beg" and self.current_mode == "rel":
                self.read_relation_lines()
            elif token in line_handlers:
                line_handlers[token](line,fields)
            elif token == "end":
                self.current_mode = None
            elif token == "encoding:":
                # An "encoding:" line without a value used to raise
                # IndexError; keep the current encoding instead.
                if len(fields) > 1 and fields[1]:
                    self.encoding = fields[1]
                else:
                    print("parse_geneweb_file(): Missing encoding name in line %d" % self.lineno)
            else:
                print("parse_geneweb_file(): Token >%s< unknown. line %d skipped: %s" % (token,self.lineno,line))
    except Errors.GedcomError:
        # The class defines no errmsg() method, so the former
        # self.errmsg(...) call would itself fail; use the module logger.
        log.warning(str(sys.exc_info()[1]))

    t = time.time() - t
    msg = ngettext('Import Complete: 1 second','Import Complete: %d seconds', t )
    # The singular form has no placeholder; applying "%" to it would raise
    # TypeError ("not all arguments converted").
    if '%' in msg:
        msg = msg % t

    self.db.transaction_commit(self.trans,_("GeneWeb import"))
    self.db.enable_signals()
    self.db.request_rebuild()

    print(msg)
    print("Families: %d" % len(self.fkeys))
    print("Individuals: %d" % len(self.ikeys))
    return None
def read_family_line(self,line,fields):
    """Handle a "fam" line: create a family with husband, marriage, wife.

    The per-family state (husband handle, default child birth place and
    default child source) is reset, a new Family is added to the database
    and becomes self.current_family, and the remaining fields are parsed
    in order as husband, marriage data and wife.

    Always returns None.
    """
    self.current_husband_handle = None
    self.current_child_birthplace_handle = None
    self.current_child_source_handle = None

    family = gen.lib.Family()
    self.current_family = family
    self.db.add_family(family,self.trans)
    #self.db.commit_family(self.current_family,self.trans)
    self.fkeys.append(family.get_handle())

    self.debug("\nHusband:")
    (pos, father) = self.parse_person(fields,1,gen.lib.Person.MALE,None)
    if father:
        father_handle = father.get_handle()
        self.current_husband_handle = father_handle
        family.set_father_handle(father_handle)
        self.db.commit_family(family,self.trans)
        father.add_family_handle(family.get_handle())
        self.db.commit_person(father,self.trans)

    self.debug("Marriage:")
    pos = self.parse_marriage(fields,pos)

    self.debug("Wife:")
    (pos, mother) = self.parse_person(fields,pos,gen.lib.Person.FEMALE,None)
    if mother:
        family.set_mother_handle(mother.get_handle())
        self.db.commit_family(family,self.trans)
        mother.add_family_handle(family.get_handle())
        self.db.commit_person(mother,self.trans)
    return None
def read_relationship_person(self,line,fields):
    """Handle a "rel" line: remember the person the relations belong to.

    The person is parsed from fields[1:] with unknown gender, and the
    handle is stored in self.current_relationship_person_handle for
    read_relation_lines().  If no person comes back the handle is cleared,
    so an earlier "rel" block cannot leak into this one.
    """
    # "\R" is not an escape sequence; a newline was intended, as in the
    # "\nHusband:" trace of read_family_line().
    self.debug("\nRelationships:")
    (idx,person) = self.parse_person(fields,1,gen.lib.Person.UNKNOWN,None)
    if person:
        self.current_relationship_person_handle = person.get_handle()
    else:
        self.current_relationship_person_handle = None
def read_relation_lines(self):
    """Read the "- <relation>: <person>" lines that follow "beg" in rel mode.

    Each line adds a PersonRef with the given relation text to the person
    remembered by read_relationship_person().  Reading stops at "end", at
    end of file, or at the first line that does not have the expected
    shape.  self.current_mode is then reset.

    Always returns None.
    """
    # getattr: the attribute does not exist until a "rel" line was read.
    rel_handle = getattr(self, 'current_relationship_person_handle', None)
    if not rel_handle:
        print("Unknown person for relationship in line %d!" % self.lineno)
        return None
    rel_person = self.db.get_person_from_handle(rel_handle)

    # relationship type, then the related person; compiled once, not per line
    line_re = re.compile("^- ([^:]+): (.*)$")

    while True:
        line = self.get_next_line()
        if line is None or line == "end":
            break
        if line == "":
            continue

        matches = line_re.match(line)
        if not matches:
            print("Invalid relationship in line %d" % self.lineno)
            break

        (relation, person_text) = matches.groups()
        # split related person into fields
        fields = person_text.split(" ")
        # str.split() never returns an empty list, so test for content.
        if not any(fields):
            print("Invalid name of person in line %d" % self.lineno)
            continue

        (idx,asso_p) = self.parse_person(fields,0,gen.lib.Person.UNKNOWN,None)
        pref = gen.lib.PersonRef()
        # TODO: Handle association types properly
        pref.set_relation(relation)
        pref.set_reference_handle(asso_p.get_handle())
        rel_person.add_person_ref(pref)
        self.db.commit_person(rel_person,self.trans)

    self.current_mode = None
    return None
def read_source_line(self,line,fields):
    """Handle a "src" line: attach the named source to the current family.

    fields[1] is decoded and used as the source title.  If there is no
    current family a message is printed and nothing else happens.

    Always returns None.
    """
    family = self.current_family
    if not family:
        print("Unknown family of child in line %d!" % self.lineno)
        return None
    title = self.decode(fields[1])
    source_ref = self.get_or_create_source(title)
    family.add_source_reference(source_ref)
    self.db.commit_family(family,self.trans)
    return None
def read_witness_line(self,line,fields):
    """Handle a "wit" line: link a witness to the family's marriage event.

    The witness may be preceded by "m:" or "f:" to give the gender.  The
    marriage event of the current family is looked up (the last one found
    wins) or created when missing, and an event reference with the
    WITNESS role is added to the witness.

    Always returns None.
    """
    self.debug("Witness:")
    family = self.current_family
    if not family:
        # Without this guard the event lookup below fails on None.
        print("Unknown family of witness in line %d!" % self.lineno)
        return None
    if len(fields) < 2:
        print("Missing witness name in line %d!" % self.lineno)
        return None

    if fields[1] == "m:":
        (idx,wit_p) = self.parse_person(fields,2,gen.lib.Person.MALE,None)
    elif fields[1] == "f:":
        (idx,wit_p) = self.parse_person(fields,2,gen.lib.Person.FEMALE,None)
    else:
        (idx,wit_p) = self.parse_person(fields,1,None,None)

    if wit_p:
        mev = None
        # search marriage event
        for evr in family.get_event_ref_list():
            ev = self.db.get_event_from_handle(evr.get_reference_handle())
            if ev.get_type() == gen.lib.EventType.MARRIAGE:
                mev = ev # found.
        if not mev: # No marriage event found create a new one
            mev = self.create_event(gen.lib.EventType.MARRIAGE, None, None, None, None)
            mar_ref = gen.lib.EventRef()
            mar_ref.set_reference_handle(mev.get_handle())
            family.add_event_ref(mar_ref)
            # The new event reference used to be added without a commit.
            self.db.commit_family(family,self.trans)
        wit_ref = gen.lib.EventRef()
        wit_ref.set_role(gen.lib.EventRoleType(gen.lib.EventRoleType.WITNESS))
        wit_ref.set_reference_handle(mev.get_handle())
        wit_p.add_event_ref(wit_ref)
        self.db.commit_person(wit_p,self.trans)
    return None
def read_children_lines(self):
    """Read the "- ..." child lines that follow "beg" in fam mode.

    Every child is parsed with the father's surname as default, added to
    the current family, and given the family's default birth place and
    default source when those were set.  The first non-empty line that
    does not start with "-" ends the list, after which self.current_mode
    is reset.

    Always returns None.
    """
    if not self.current_husband_handle:
        print("Unknown father for child in line %d!" % self.lineno)
        return None
    father = self.db.get_person_from_handle(self.current_husband_handle)
    default_surname = father.get_primary_name().get_surname()
    if not self.current_family:
        print("Unknown family of child in line %d!" % self.lineno)
        return None

    # Second field of a child line -> gender; anything else means the
    # gender marker is absent and the name starts right there.
    gender_markers = {
        "h": gen.lib.Person.MALE,
        "f": gen.lib.Person.FEMALE,
        }

    while True:
        line = self.get_next_line()
        if line is None:
            break
        if line == "":
            continue

        fields = line.split(" ")
        if fields[0] != "-":
            break

        self.debug("Child:")
        marker = fields[1]
        if marker in gender_markers:
            (idx,child) = self.parse_person(fields,2,gender_markers[marker],default_surname)
        else:
            (idx,child) = self.parse_person(fields,1,gen.lib.Person.UNKNOWN,default_surname)

        if not child:
            continue

        family = self.current_family
        childref = gen.lib.ChildRef()
        childref.set_reference_handle(child.get_handle())
        family.add_child_ref(childref)
        self.db.commit_family(family,self.trans)

        child.add_parent_family_handle(family.get_handle())

        place_handle = self.current_child_birthplace_handle
        if place_handle:
            # Reuse the child's birth event when there is one, otherwise
            # create it, then set the family's default birth place on it.
            birth = None
            birth_ref = child.get_birth_ref()
            if birth_ref:
                birth = self.db.get_event_from_handle(birth_ref.ref)
            if not birth:
                birth = self.create_event(gen.lib.EventType.BIRTH)
                birth_ref = gen.lib.EventRef()
                birth_ref.set_reference_handle(birth.get_handle())
                child.set_birth_ref(birth_ref)
            birth.set_place_handle(place_handle)
            self.db.commit_event(birth,self.trans)
        if self.current_child_source_handle:
            child.add_source_reference(self.current_child_source_handle)
        self.db.commit_person(child,self.trans)

    self.current_mode = None
    return None
def read_children_birthplace_line(self,line,fields):
    """Handle a "cbp" line: remember the default birth place for children.

    fields[1] is decoded and looked up (or created) as a place; its handle
    is applied to children read afterwards by read_children_lines().

    Always returns None.
    """
    place_name = self.decode(fields[1])
    default_place = self.get_or_create_place(place_name)
    if default_place:
        self.current_child_birthplace_handle = default_place.get_handle()
    return None
def read_children_source_line(self,line,fields):
    """Handle a "csrc" line: remember the default source for children.

    Despite the attribute name, what is stored is the value returned by
    get_or_create_source(), not a bare handle.

    Always returns None.
    """
    source_title = self.decode(fields[1])
    self.current_child_source_handle = self.get_or_create_source(source_title)
    return None
def read_family_comment(self,line,fields):
    """Handle a "comm" line: store the whole line as a note on the family.

    If there is no current family a message is printed and nothing else
    happens.

    Always returns None.
    """
    family = self.current_family
    if not family:
        print("Unknown family of child in line %d!" % self.lineno)
        return None
    comment = gen.lib.Note()
    comment.set(line)
    self.db.add_note(comment,self.trans)
    family.add_note(comment.handle)
    self.db.commit_family(family,self.trans)
    return None
def _read_notes_lines(self, note_tag):
note_txt = ""
while True:
line = self.get_next_line()
if line is None:
break
fields = line.split(" ")
if fields[0] == "end" and fields[1] == note_tag:
break
elif fields[0] == "beg":
continue
else:
if note_txt:
2005-12-06 12:08:09 +05:30
note_txt = note_txt + "\n" + line
else:
2005-12-06 12:08:09 +05:30
note_txt = note_txt + line
if note_txt:
n = gen.lib.Note()
n.set(note_txt)
self.db.add_note(n,self.trans)
return n.handle
return None
def read_person_notes_lines(self,line,fields):
    """Handle a "notes" line: attach the following notes block to a person.

    The person is parsed from fields[1:]; the block is then read with
    _read_notes_lines() and, if it produced a note, linked to the person.
    """
    (idx,owner) = self.parse_person(fields,1,None,None)
    handle = self._read_notes_lines(fields[0])
    if not handle:
        return
    owner.add_note(handle)
    self.db.commit_person(owner,self.trans)
def read_database_notes_lines(self,line,fields):
    """Handle a "notes-db" line: read the database-wide notes block.

    The note is stored by _read_notes_lines(); the returned handle is not
    linked to any object.
    """
    tag = fields[0]
    self._read_notes_lines(tag)
def parse_marriage(self,fields,idx):
    """Parse the marriage part of a "fam" line, starting at fields[idx].

    Fields before the first one starting with "+" are reported and
    skipped.  Then marriage date ("+date"), divorce date ("-date"), place
    ("#mp"), source ("#ms"), separation ("#sep"), "#nm", "#noment" and
    "#eng" are consumed, and the matching events are created on
    self.current_family.

    Returns the index of the first field that is not marriage data.
    """
    # "-" is escaped: the former "[+#-0-9]" was read as the range "#".."0",
    # which swallowed fields starting with ' ( ) * , . / and rejected
    # fields starting with 1..8.
    mariageDataRe = re.compile(r"^[+#\-0-9].*$")
    # what an optional date after "#sep" must start with
    sepDateRe = re.compile(r"^[0-9~?<>]")

    mar_date = None
    mar_place = None
    mar_source = None

    sep_date = None
    div_date = None

    married = True
    engaged = False

    # skip to marriage date in case person contained unmatched tokens
    while idx < len(fields) and not (fields[idx] and fields[idx][0] == "+"):
        if fields[idx]:
            print("parse_marriage(): Unknown field: '%s' in line %d!" %(fields[idx],self.lineno))
        idx = idx + 1

    while idx < len(fields) and mariageDataRe.match(fields[idx]):
        token = fields[idx]
        idx = idx + 1   # from here on fields[idx] is the tag's value, if any

        if token[0] == "+":
            # Strip the "+" marker: the date pattern cannot match it, so
            # the marriage date was always lost.
            mar_date = self.parse_date(self.decode(token[1:]))
            self.debug(" Married at: %s" % token)
        elif token[0] == "-":
            # Same for the "-" divorce marker.
            div_date = self.parse_date(self.decode(token[1:]))
            self.debug(" Div at: %s" % token)
        elif token in ("#mp", "#ms"):
            if not idx < len(fields):
                print("parse_marriage(): Missing value for '%s' in line %d!" % (token,self.lineno))
                break
            value = fields[idx]
            idx = idx + 1
            if token == "#mp":
                mar_place = self.get_or_create_place(self.decode(value))
                self.debug(" Marriage place: %s" % value)
            else:
                mar_source = self.get_or_create_source(self.decode(value))
                self.debug(" Marriage source: %s" % value)
        elif token == "#sep":
            # NOTE(review): the GeneWeb format description appears to list
            # "#sep" as a bare flag - confirm.  The next field is consumed
            # only when it looks like a date, so the wife's surname is no
            # longer swallowed.
            if idx < len(fields) and sepDateRe.match(fields[idx]):
                sep_date = self.parse_date(self.decode(fields[idx]))
                self.debug(" Seperated since: %s" % fields[idx])
                idx = idx + 1
        elif token == "#nm":
            self.debug(" Are not married.")
            married = False
        elif token == "#noment":
            self.debug(" Not mentioned.")
        elif token == "#eng":
            self.debug(" Are engaged.")
            engaged = True
        else:
            print("parse_marriage(): Unknown field '%s'for mariage in line %d!" % (token,self.lineno))

    if mar_date or mar_place or mar_source:
        mar = self.create_event(gen.lib.EventType.MARRIAGE, None, mar_date, mar_place, mar_source)
        mar_ref = gen.lib.EventRef()
        mar_ref.set_reference_handle(mar.get_handle())
        self.current_family.add_event_ref(mar_ref)

    if div_date:
        div = self.create_event(gen.lib.EventType.DIVORCE, None, div_date, None, None)
        div_ref = gen.lib.EventRef()
        div_ref.set_reference_handle(div.get_handle())
        self.current_family.add_event_ref(div_ref)

    if sep_date or engaged:
        # NOTE(review): a separation date is stored on an ENGAGEMENT
        # event, as before - confirm this is intended.
        sep = self.create_event(gen.lib.EventType.ENGAGEMENT, None, sep_date, None, None)
        sep_ref = gen.lib.EventRef()
        sep_ref.set_reference_handle(sep.get_handle())
        self.current_family.add_event_ref(sep_ref)

    if not married:
        self.current_family.set_relationship(gen.lib.FamilyRelType(gen.lib.FamilyRelType.UNMARRIED))

    self.db.commit_family(self.current_family,self.trans)
    return idx
def parse_person(self,fields,idx,gender,father_surname):
    """Parse one person description starting at fields[idx].

    The description is a surname (omitted when `father_surname` is given),
    a first name, and any number of data fields: public name "(..)",
    first-name alias "{..}", title "[..]", baptism date "!date", "#tag"
    fields, and bare dates (the first is the birth date, later ones are
    death dates).  The person is looked up or created with
    get_or_create_person(), updated, and committed.

    fields         -- the space-separated fields of the current line
    idx            -- index of the first field that belongs to the person
    gender         -- gender to set when the person's gender is still
                      unknown, or None to leave it alone
    father_surname -- default surname for children, or None

    Returns (idx, person), idx being the first field that was not consumed.
    """
    # -- name -------------------------------------------------------------
    if not father_surname:
        if not idx < len(fields):
            print("Missing surname of person in line %d!" % self.lineno)
            surname = ""
        else:
            surname = self.decode(fields[idx])
        idx += 1
    else:
        surname = father_surname

    if not idx < len(fields):
        print("Missing firstname of person in line %d!" % self.lineno)
        firstname = ""
    else:
        firstname = self.decode(fields[idx])
    idx += 1
    if idx < len(fields) and father_surname:
        # A child may carry its own surname after the first name, unless
        # the next field already looks like person data.
        noSurnameRe = re.compile(r"^[({\[~><?0-9#].*$")
        if not noSurnameRe.match(fields[idx]):
            surname = self.decode(fields[idx])
            idx += 1

    self.debug("Person: %s %s" % (firstname, surname))
    person = self.get_or_create_person(firstname,surname)
    name = gen.lib.Name()
    name.set_type( gen.lib.NameType(gen.lib.NameType.BIRTH))
    name.set_first_name(firstname)
    name.set_surname(surname)
    person.set_primary_name(name)
    if person.get_gender() == gen.lib.Person.UNKNOWN and gender is not None:
        person.set_gender(gender)
    self.db.commit_person(person,self.trans)

    # -- data fields ------------------------------------------------------
    personDataRe = re.compile(r"^[kmes0-9<>~#\[({!].*$")
    dateRe = re.compile(r"^[kmes0-9~<>?]+.*$")
    # What the optional date after #buri / #crem must start with.
    plainDateRe = re.compile(r"^[0-9~?<>]")

    birth_parsed = False
    birth_date = None
    bapt_date = None
    death_date = None
    death_cause = None
    buried = False
    bur_date = None
    cremated = False
    crem_date = None
    public_name = None
    firstname_aliases = []
    nick_names = []
    name_aliases = []
    surname_aliases = []
    places = {}     # 'birth' / 'bapt' / 'death' / 'bur' -> place
    sources = {}    # 'person' / 'birth' / 'bapt' / 'death' / 'bur' -> source ref

    # tag -> (debug label, target); every tag here takes one value field
    alias_tags = {
        '#nick': ("Nick Name", nick_names),
        '#alias': ("Name Alias", name_aliases),
        '#salias': ("Surname Alias", surname_aliases),
        }
    place_tags = {
        '#bp': ("Birth Place", 'birth'),
        '#pp': ("Baptize Place", 'bapt'),
        '#dp': ("Death Place", 'death'),
        '#rp': ("Burial Place", 'bur'),
        }
    source_tags = {
        '#src': ("Source", 'person'),
        '#bs': ("Birth Source", 'birth'),
        '#ps': ("Baptize Source", 'bapt'),
        '#ds': ("Death Source", 'death'),
        '#rs': ("Burial Source", 'bur'),
        }
    # NOTE(review): "s" replaces the former "d" test, which could never
    # fire because personDataRe rejects fields starting with "d" - confirm
    # against the GeneWeb format description.
    death_causes = {
        "k": "Killed",
        "m": "Murdered",
        "e": "Executed",
        "s": "Disappeared",
        }

    while idx < len(fields) and personDataRe.match(fields[idx]):
        token = fields[idx]
        idx += 1    # from here on fields[idx] is the tag's value, if any

        if token[0] == '(':
            self.debug("Public Name: %s" % token)
            public_name = self.decode(token[1:-1])
        elif token[0] == '{':
            self.debug("Firstsname Alias: %s" % token)
            firstname_aliases.append(self.decode(token[1:-1]))
        elif token[0] == '[':
            self.debug("Title: %s" % token)
            titleparts = self.decode(token[1:-1]).split(":")
            tname = ttitle = tplace = tstart = tend = tnth = None
            try:
                tname = titleparts[0]
                ttitle = titleparts[1]
                if titleparts[2]:
                    tplace = self.get_or_create_place(titleparts[2])
                tstart = self.parse_date(titleparts[3])
                tend = self.parse_date(titleparts[4])
                tnth = titleparts[5]
            except IndexError:  # not all parts are written all the time
                pass
            if tnth:    # Append title number to title
                ttitle = "%s, %s" % (ttitle, tnth)
            title = self.create_event(gen.lib.EventType.NOB_TITLE,ttitle,tstart,tplace)
            # TODO: Geneweb has a start date and an end date, and therefore
            # supports stuff like: FROM about 1955 TO between 1998 and 1999
            # gramps only supports one single date or range.
            if tname and tname != "*":
                n = gen.lib.Note()
                n.set(tname)
                self.db.add_note(n,self.trans)
                title.add_note( n.handle)
            title_ref = gen.lib.EventRef()
            title_ref.set_reference_handle(title.get_handle())
            person.add_event_ref(title_ref)
        elif token[0] == '!':
            self.debug("Baptize at: %s" % token)
            bapt_date = self.parse_date(self.decode(token[1:]))
        elif token in ('#buri', '#crem'):
            # The date is optional: consume the next field only when it
            # looks like a date, so a following "#rp"/"#rs" is not lost.
            date = None
            if idx < len(fields) and plainDateRe.match(fields[idx]):
                if token == '#buri':
                    self.debug("Burial Date: %s" % fields[idx])
                else:
                    self.debug("Cremention Date: %s" % fields[idx])
                date = self.parse_date(self.decode(fields[idx]))
                idx += 1
            if token == '#buri':
                buried = True
                bur_date = date
            else:
                cremated = True
                crem_date = date
        elif (token in alias_tags or token in place_tags
              or token in source_tags or token in ('#occu', '#image')):
            if not idx < len(fields):
                # A value tag at the end of the line used to raise
                # IndexError.
                print("parse_person(): Missing value for '%s' in line %d!" % (token,self.lineno))
                break
            value = fields[idx]
            idx += 1
            if token in alias_tags:
                (label, target) = alias_tags[token]
                self.debug("%s: %s" % (label, value))
                target.append(self.decode(value))
            elif token in place_tags:
                (label, key) = place_tags[token]
                self.debug("%s: %s" % (label, value))
                places[key] = self.get_or_create_place(self.decode(value))
            elif token in source_tags:
                (label, key) = source_tags[token]
                self.debug("%s: %s" % (label, value))
                sources[key] = self.get_or_create_source(self.decode(value))
            elif token == '#occu':
                self.debug("Occupation: %s" % value)
                occu = self.create_event(gen.lib.EventType.OCCUPATION,self.decode(value))
                occu_ref = gen.lib.EventRef()
                occu_ref.set_reference_handle(occu.get_handle())
                person.add_event_ref(occu_ref)
            else:
                # '#image': the value is only traced, not imported.
                self.debug("Image: %s" % value)
        elif token == '#apubl':
            self.debug("This is a public record")
        elif token == '#apriv':
            self.debug("This is a private record")
            person.set_privacy(True)
        elif token == '#h':
            self.debug("This is a restricted record")
            #TODO: Gramps does currently not feature this level
            person.set_privacy(True)
        elif dateRe.match(token):
            if not birth_parsed:
                self.debug("Birth Date: %s" % token)
                birth_date = self.parse_date(self.decode(token))
                birth_parsed = True
            else:
                self.debug("Death Date: %s" % token)
                death_date = self.parse_date(self.decode(token))
                if token == "mj":
                    death_cause = "Died joung"
                else:
                    death_cause = death_causes.get(token[0], death_cause)
                #TODO: Set special death types more properly
        else:
            print("parse_person(): Unknown field '%s' for person in line %d!" % (token,self.lineno))

    # -- names ------------------------------------------------------------
    if public_name:
        # The birth name becomes an alternate name; the public name is
        # made the primary one.
        name = person.get_primary_name()
        name.set_type(gen.lib.NameType(gen.lib.NameType.BIRTH))
        person.add_alternate_name(name)
        name = gen.lib.Name()
        name.set_type(gen.lib.NameType(gen.lib.NameType.AKA))
        name.set_first_name(public_name)
        name.set_surname(surname)
        person.set_primary_name(name)

    for aka in nick_names:
        attr = gen.lib.Attribute()
        attr.set_type(gen.lib.AttributeType(gen.lib.AttributeType.NICKNAME))
        attr.set_value(aka)
        person.add_attribute(attr)

    # First-name aliases and name aliases are stored the same way.
    for aka in firstname_aliases + name_aliases:
        name = gen.lib.Name()
        name.set_type(gen.lib.NameType(gen.lib.NameType.AKA))
        name.set_first_name(aka)
        name.set_surname(surname)
        person.add_alternate_name(name)

    for aka in surname_aliases:
        name = gen.lib.Name()
        name.set_type(gen.lib.NameType(gen.lib.NameType.AKA))
        if public_name:
            name.set_first_name(public_name)
        else:
            name.set_first_name(firstname)
        name.set_surname(aka)
        person.add_alternate_name(name)

    # -- sources and events -----------------------------------------------
    source = sources.get('person')
    if source:
        person.add_source_reference(source)

    birth_place = places.get('birth')
    birth_source = sources.get('birth')
    if birth_date or birth_place or birth_source:
        birth = self.create_event(gen.lib.EventType.BIRTH, None, birth_date, birth_place, birth_source)
        birth_ref = gen.lib.EventRef()
        birth_ref.set_reference_handle( birth.get_handle())
        person.set_birth_ref( birth_ref)

    bapt_place = places.get('bapt')
    bapt_source = sources.get('bapt')
    if bapt_date or bapt_place or bapt_source:
        babt = self.create_event(gen.lib.EventType.BAPTISM, None, bapt_date, bapt_place, bapt_source)
        babt_ref = gen.lib.EventRef()
        babt_ref.set_reference_handle( babt.get_handle())
        person.add_event_ref( babt_ref)

    death_place = places.get('death')
    death_source = sources.get('death')
    if death_date or death_place or death_source or death_cause:
        death = self.create_event(gen.lib.EventType.DEATH, None, death_date, death_place, death_source)
        if death_cause:
            death.set_description(death_cause)
            self.db.commit_event(death,self.trans)
        death_ref = gen.lib.EventRef()
        death_ref.set_reference_handle( death.get_handle())
        person.set_death_ref( death_ref)

    bur_place = places.get('bur')
    bur_source = sources.get('bur')
    # The events are created whenever the tag was present, even when the
    # optional date was missing or unparsable.
    if buried:
        bur = self.create_event(gen.lib.EventType.BURIAL, None, bur_date, bur_place, bur_source)
        bur_ref = gen.lib.EventRef()
        bur_ref.set_reference_handle( bur.get_handle())
        person.add_event_ref( bur_ref)

    if cremated:
        crem = self.create_event(gen.lib.EventType.CREMATION, None, crem_date, bur_place, bur_source)
        crem_ref = gen.lib.EventRef()
        crem_ref.set_reference_handle( crem.get_handle())
        person.add_event_ref(crem_ref)

    self.db.commit_person(person,self.trans)

    return (idx,person)
def parse_date(self,field):
    """Convert a GeneWeb date field into a gen.lib.Date.

    "0" means "no date" and gives None.  A field of the form 0(text)
    gives a text-only date.  Otherwise the field is matched against the
    date pattern: a known prefix selects the modifier, "date1..date2"
    gives a span, and a calendar letter after the first date selects the
    calendar.  A field that matches the pattern but contains unusable
    numbers (for example "1/") is kept as a text-only date.

    Returns a gen.lib.Date, or None when the field is not a date.
    """
    if field == "0":
        return None
    date = gen.lib.Date()
    matches = _text_parse.match(field)
    if matches:
        date.set_as_text(matches.group(1))
        date.set_modifier(gen.lib.Date.MOD_TEXTONLY)
        return date

    matches = _date_parse.match(field)
    if not matches:
        return None

    (prefix, first, first_cal, span, second, second_cal) = matches.groups()
    mod = _mod_map.get(prefix,gen.lib.Date.MOD_NONE)
    try:
        # "second" is None for an open span such as "1900..", which used
        # to crash in sub_date(); treat it as a single date.
        if span == ".." and second:
            mod = gen.lib.Date.MOD_SPAN
            sub2 = self.sub_date(second)
        else:
            sub2 = (0,0,0)
        sub1 = self.sub_date(first)
    except ValueError:
        # e.g. an empty component between slashes; keep the raw text
        # rather than aborting the import.
        date.set_as_text(field)
        date.set_modifier(gen.lib.Date.MOD_TEXTONLY)
        return date

    cal1 = _cal_map.get(first_cal,gen.lib.Date.CAL_GREGORIAN)
    date.set(gen.lib.Date.QUAL_NONE,mod, cal1,
             (sub1[0],sub1[1],sub1[2],None,sub2[0],sub2[1],sub2[2],None))
    return date
def sub_date(self,data):
    """Split a "/"-separated date into a 3-tuple of integers.

    One component is returned as (0, 0, n), two as (0, a, b), and three or
    more as the first three components.  Missing leading positions are
    filled with 0.  A non-numeric component among those used raises
    ValueError.
    """
    pieces = data.split('/')[:3]
    numbers = tuple([int(piece) for piece in pieces])
    padding = (0,) * (3 - len(numbers))
    return padding + numbers
def create_event(self,type,desc=None,date=None,place=None,source=None):
    """Create an Event, add it to the database and return it.

    Only arguments with a true value are applied to the event.

    type   -- event type value, wrapped in gen.lib.EventType
    desc   -- description text
    date   -- date object
    place  -- place object; its handle is stored on the event
    source -- source reference to attach
    """
    new_event = gen.lib.Event()
    if type:
        new_event.set_type(gen.lib.EventType(type))
    # Plain "set this value when given" attributes, in the original order.
    for (value, setter) in ((desc, new_event.set_description),
                            (date, new_event.set_date_object)):
        if value:
            setter(value)
    if place:
        new_event.set_place_handle(place.get_handle())
    if source:
        new_event.add_source_reference(source)
    self.db.add_event(new_event,self.trans)
    self.db.commit_event(new_event,self.trans)
    return new_event
def get_or_create_person(self,firstname,lastname):
    """Return the person with this name, creating it when necessary.

    Persons already seen during this import are found through self.ikeys.
    A name containing "?" as first name or last name is never reused: a
    new person is created each time.

    The cache key is the (firstname, lastname) pair.  The former
    concatenated key made different pairs such as ("Ann", "aLee") and
    ("Anna", "Lee") refer to the same person.
    """
    mykey = (firstname, lastname)
    if mykey in self.ikeys and firstname != "?" and lastname != "?":
        return self.db.get_person_from_handle(self.ikeys[mykey])

    person = gen.lib.Person()
    self.db.add_person(person,self.trans)
    self.db.commit_person(person,self.trans)
    self.ikeys[mykey] = person.get_handle()
    return person
def get_or_create_place(self,place_name):
    """Return the place titled `place_name`, creating it when necessary.

    Places created during this import are remembered in self.pkeys, so the
    same title always gives the same place.
    """
    if place_name in self.pkeys:
        return self.db.get_place_from_handle(self.pkeys[place_name])

    new_place = gen.lib.Place()
    new_place.set_title(place_name)
    self.db.add_place(new_place,self.trans)
    self.db.commit_place(new_place,self.trans)
    self.pkeys[place_name] = new_place.get_handle()
    return new_place
def get_or_create_source(self,source_name):
    """Return a new SourceRef pointing at the source titled `source_name`.

    The source itself is created on first use and remembered in
    self.skeys; a fresh SourceRef is built on every call.
    """
    if source_name not in self.skeys:
        found = gen.lib.Source()
        found.set_title(source_name)
        self.db.add_source(found,self.trans)
        self.db.commit_source(found,self.trans)
        self.skeys[source_name] = found.get_handle()
    else:
        found = self.db.get_source_from_handle(self.skeys[source_name])

    reference = gen.lib.SourceRef()
    reference.set_reference_handle(found.get_handle())
    return reference
def decode(self,s):
    """Turn a raw GeneWeb field into display text.

    Underscores become spaces, numeric character references (&#123; and
    &#x7b;) and named entities (&eacute;) are replaced by the characters
    they stand for.  References that cannot be converted are left in the
    text unchanged.
    """
    s = s.replace('_',' ')

    # numeric character references, decimal or hexadecimal
    charref_re = re.compile('(&#)(x?)([0-9a-zA-Z]+)(;)')
    for match in charref_re.finditer(s):
        try:
            if match.group(2):  # HEX
                code = int(match.group(3),16)
            else:   # Decimal
                code = int(match.group(3))
            s = s.replace(match.group(0), unichr(code))
        except (ValueError, OverflowError):
            # The pattern accepts letters, so "&#zz;" reaches int() and
            # raises ValueError; out-of-range code points do the same in
            # unichr().  ValueError also covers UnicodeDecodeError.
            pass

    # replace named entities
    entref_re = re.compile('(&)([a-zA-Z]+)(;)')
    for match in entref_re.finditer(s):
        try:
            if match.group(2) in name2codepoint:
                nchar = unichr(name2codepoint[match.group(2)])
                s = s.replace(match.group(0), nchar)
        except ValueError:
            pass

    return( s)
def debug( self, txt):
    """Print `txt` when the module-level enable_debug flag is set."""
    if not enable_debug:
        return
    print(txt)
#-------------------------------------------------------------------------
#
# Register with the plugin system
#
#-------------------------------------------------------------------------
# Make importData() available as the importer for files with the "gw"
# extension.
pmgr = PluginManager.get_instance()
plugin = ImportPlugin(
    name = _('GeneWeb'),
    description = _("Import data from GeneWeb files"),
    import_function = importData,
    extension = "gw",
    )
pmgr.register_plugin(plugin)