2004-09-25 04:12:21 +05:30
|
|
|
#
|
|
|
|
# Gramps - a GTK+/GNOME based genealogy program
|
|
|
|
#
|
2006-01-19 10:00:40 +05:30
|
|
|
# Copyright (C) 2000-2006 Martin Hawlisch, Donald N. Allingham
|
2004-09-25 04:12:21 +05:30
|
|
|
#
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License as published by
|
|
|
|
# the Free Software Foundation; either version 2 of the License, or
|
|
|
|
# (at your option) any later version.
|
|
|
|
#
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with this program; if not, write to the Free Software
|
|
|
|
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
|
|
#
|
|
|
|
|
|
|
|
# $Id$
|
|
|
|
|
|
|
|
"Import from GeneWeb"
|
|
|
|
|
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
#
|
|
|
|
# standard python modules
|
|
|
|
#
|
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
import re
|
|
|
|
import time
|
2006-03-17 01:54:27 +05:30
|
|
|
from TransUtils import sgettext as _
|
2004-09-25 04:12:21 +05:30
|
|
|
|
2006-03-05 10:01:24 +05:30
|
|
|
#------------------------------------------------------------------------
|
|
|
|
#
|
|
|
|
# Set up logging
|
|
|
|
#
|
|
|
|
#------------------------------------------------------------------------
|
|
|
|
import logging
|
|
|
|
log = logging.getLogger(".ImportGeneWeb")
|
|
|
|
|
2004-09-25 04:12:21 +05:30
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
#
|
|
|
|
# GTK/GNOME Modules
|
|
|
|
#
|
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
import gtk
|
|
|
|
import gtk.glade
|
|
|
|
|
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
#
|
|
|
|
# GRAMPS modules
|
|
|
|
#
|
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
import Errors
|
|
|
|
import RelLib
|
2005-02-20 00:35:48 +05:30
|
|
|
import const
|
2004-09-25 04:12:21 +05:30
|
|
|
from QuestionDialog import ErrorDialog
|
2005-02-20 00:35:48 +05:30
|
|
|
from DateHandler import parser as _dp
|
2006-03-11 06:42:06 +05:30
|
|
|
from PluginUtils import register_import
|
2005-05-24 18:38:06 +05:30
|
|
|
from htmlentitydefs import name2codepoint
|
2004-09-25 04:12:21 +05:30
|
|
|
|
2005-12-06 12:08:09 +05:30
|
|
|
_date_parse = re.compile('([~?<>]+)?([0-9/]+)([J|H|F])?(\.\.)?([0-9/]+)?([J|H|F])?')
|
|
|
|
_text_parse = re.compile('0\((.*)\)')
|
|
|
|
|
|
|
|
# Date prefix character -> RelLib date modifier.  Prefixes that are not
# listed here (for example "?") are looked up with a default by the caller.
_mod_map = {
    '~': RelLib.Date.MOD_ABOUT,
    '<': RelLib.Date.MOD_BEFORE,
    '>': RelLib.Date.MOD_AFTER,
}

# Calendar suffix letter -> RelLib calendar constant.
_cal_map = {
    'F': RelLib.Date.CAL_FRENCH,
    'H': RelLib.Date.CAL_HEBREW,
    'J': RelLib.Date.CAL_JULIAN,
}
|
|
|
|
|
2004-09-25 04:12:21 +05:30
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
#
|
|
|
|
#
|
|
|
|
#
|
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
def importData(database, filename, cb=None):
|
|
|
|
|
|
|
|
global callback
|
|
|
|
|
|
|
|
try:
|
|
|
|
g = GeneWebParser(database,filename)
|
|
|
|
except IOError,msg:
|
|
|
|
ErrorDialog(_("%s could not be opened\n") % filename,str(msg))
|
|
|
|
return
|
|
|
|
|
|
|
|
try:
|
|
|
|
status = g.parse_geneweb_file()
|
|
|
|
except IOError,msg:
|
|
|
|
errmsg = _("%s could not be opened\n") % filename
|
|
|
|
ErrorDialog(errmsg,str(msg))
|
|
|
|
return
|
|
|
|
|
|
|
|
#-------------------------------------------------------------------------
|
2005-05-11 19:34:47 +05:30
|
|
|
# For a description of the file format see
|
|
|
|
# http://cristal.inria.fr/~ddr/GeneWeb/en/gwformat.htm
|
2004-09-25 04:12:21 +05:30
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
class GeneWebParser:
    """Read a GeneWeb (.gw) text file line by line and store it in a database.

    The parser keeps the family currently being described (set by a "fam"
    line) so that following "src", "comm", "cbp", "csrc" and "beg" ... "end"
    lines can be attached to it.  Diagnostics about malformed input are
    printed and the offending token is skipped.

    The syntax used here is deliberately valid for both Python 2.4 and
    Python 3 (parenthesised single-argument print, no "except X as e").
    """

    # Tokens that belong to the marriage part of a "fam" line.  The "-" is
    # escaped: unescaped, "#-0" is a character range that also accepts
    # tokens starting with ', (, ), *, etc., so a wife surname such as
    # "'t_Hooft" was swallowed as marriage data.
    _marriage_data_re = re.compile(r"^[+#\-0-9].*$")
    # A token after a child's first name that is NOT an explicit surname.
    _no_surname_re = re.compile(r"^[({\[~><?0-9#].*$")
    # Tokens that belong to the data part of a person description.
    _person_data_re = re.compile(r"^[0-9<>~#\[({!].*$")
    # Tokens that look like a (birth or death) date.
    _date_token_re = re.compile(r"^[0-9~<>?]+.*$")
    # Numeric character references (&#65; / &#x41;) and named entities.
    _charref_re = re.compile(r'(&#)(x?)([0-9a-zA-Z]+)(;)')
    _entref_re = re.compile(r'(&)([a-zA-Z]+)(;)')

    # Person tags followed by a place / a source, mapped to the event they
    # describe.
    _place_tags = {'#bp': 'birth', '#pp': 'bapt', '#dp': 'death', '#rp': 'bur'}
    _source_tags = {'#bs': 'birth', '#ps': 'bapt', '#ds': 'death', '#rs': 'bur'}
    # Remaining person tags that are followed by exactly one value token.
    _plain_value_tags = ('#nick', '#occu', '#alias', '#salias', '#image',
                         '#src')

    def __init__(self, dbase, file):
        """Remember the database and open `file` for reading.

        Raises IOError if the file cannot be opened.
        """
        self.db = dbase
        self.f = open(file, "rU")
        self.filename = file
        # Initialised here so get_next_line() is usable before a parse run.
        self.lineno = 0

    def get_next_line(self):
        """Return the next line, stripped, as unicode; None at end of file.

        The line counter is advanced on every call.  Lines are decoded as
        UTF-8 (which includes plain ASCII); lines that are not valid UTF-8
        are decoded as ISO-8859-1.
        """
        self.lineno += 1
        raw = self.f.readline()
        if not raw:
            return None
        raw = raw.strip()
        try:
            return unicode(raw, 'utf-8')
        except UnicodeDecodeError:
            return unicode(raw, 'iso-8859-1')

    def parse_geneweb_file(self):
        """Parse the whole file inside one batch transaction.

        Resets the parser state, dispatches every non-empty line on its
        first token, closes the input file, commits the transaction,
        re-enables the database signals and prints a short summary.
        Returns None.
        """
        # Local import: only needed to fetch the active exception in a way
        # that parses on both Python 2.4 and Python 3.
        import sys

        self.trans = self.db.transaction_begin("", batch=True)
        self.db.disable_signals()
        started = time.time()
        self.lineno = 0
        self.index = 0
        self.fam_count = 0
        self.indi_count = 0

        self.fkeys = []     # handles of the families created
        self.ikeys = {}     # (firstname, surname) -> person handle
        self.pkeys = {}     # place title -> place handle
        self.skeys = {}     # source title -> source handle

        self.current_mode = None
        self.current_family = None
        self.current_husband_handle = None
        self.current_child_birthplace_handle = None
        self.current_child_source_handle = None

        # First token -> handler taking (line, fields).
        line_handlers = {
            "fam": self.read_family_line,
            "src": self.read_source_line,
            "wit": self.read_witness_line,
            "cbp": self.read_children_birthplace_line,
            "csrc": self.read_children_source_line,
            "comm": self.read_family_comment,
            "notes": self.read_notes_lines,
        }

        try:
            try:
                while True:
                    line = self.get_next_line()
                    if line is None:
                        break
                    if line == "":
                        continue

                    fields = line.split(" ")
                    token = fields[0]
                    if token in line_handlers:
                        line_handlers[token](line, fields)
                    elif token == "beg":
                        self.read_children_lines()
                    elif token == "end":
                        self.current_mode = None
                    else:
                        print("Token >%s< unknown. line %d skipped: %s" % (token, self.lineno, line))
            except Errors.GedcomError:
                # The original called an undefined self.errmsg() here, which
                # turned the error into an AttributeError.
                print("Import aborted in line %d: %s" % (self.lineno, str(sys.exc_info()[1])))
        finally:
            # Never leave the input file open, whatever happened above.
            self.f.close()

        elapsed = time.time() - started
        msg = _('Import Complete: %d seconds') % elapsed

        self.db.transaction_commit(self.trans, _("GeneWeb import"))
        self.db.enable_signals()
        self.db.request_rebuild()

        print(msg)
        print("Families: %d" % len(self.fkeys))
        print("Individuals: %d" % len(self.ikeys))
        return None

    def _has_value(self, fields, idx, tag):
        """Return True if fields[idx] exists; otherwise print a warning."""
        if idx < len(fields):
            return True
        print("Missing value for '%s' in line %d!" % (tag, self.lineno))
        return False

    def _optional_date(self, fields, idx):
        """Parse fields[idx] as a date if it is one.

        Returns (new_idx, date).  The token is consumed only when it parses
        as a date or is the unknown-date marker "0"; otherwise idx is
        returned unchanged and date is None, so a following tag or name is
        not swallowed.
        """
        if idx < len(fields):
            token = self.decode(fields[idx])
            date = self.parse_date(token)
            if date is not None or token == "0":
                return (idx + 1, date)
        return (idx, None)

    def read_family_line(self, line, fields):
        """Handle a "fam" line: husband, marriage data, wife.

        Creates a new family, makes it the current family and links the two
        parsed persons to it.  Returns None.
        """
        self.current_husband_handle = None
        self.current_child_birthplace_handle = None
        self.current_child_source_handle = None
        self.current_family = RelLib.Family()
        self.db.add_family(self.current_family, self.trans)
        self.db.commit_family(self.current_family, self.trans)
        self.fkeys.append(self.current_family.get_handle())
        idx = 1

        (idx, husband) = self.parse_person(fields, idx, RelLib.Person.MALE, None)
        if husband:
            self.current_husband_handle = husband.get_handle()
            self.current_family.set_father_handle(husband.get_handle())
            self.db.commit_family(self.current_family, self.trans)
            husband.add_family_handle(self.current_family.get_handle())
            self.db.commit_person(husband, self.trans)

        idx = self.parse_marriage(fields, idx)

        (idx, wife) = self.parse_person(fields, idx, RelLib.Person.FEMALE, None)
        if wife:
            self.current_family.set_mother_handle(wife.get_handle())
            self.db.commit_family(self.current_family, self.trans)
            wife.add_family_handle(self.current_family.get_handle())
            self.db.commit_person(wife, self.trans)
        return None

    def read_source_line(self, line, fields):
        """Handle a "src" line: attach a source to the current family."""
        if not self.current_family:
            print("Unknown family of child in line %d!" % self.lineno)
            return None
        if not self._has_value(fields, 1, fields[0]):
            return None
        source = self.get_or_create_source(self.decode(fields[1]))
        self.current_family.add_source_reference(source)
        self.db.commit_family(self.current_family, self.trans)
        return None

    def read_witness_line(self, line, fields):
        """Handle a "wit" line: parse (and thereby create) the witness.

        An optional "m:" or "f:" marker gives the witness' gender.  The
        parsed person is not linked to the family here.
        """
        if not self._has_value(fields, 1, fields[0]):
            return None
        if fields[1] == "m:":
            self.parse_person(fields, 2, RelLib.Person.MALE, None)
        elif fields[1] == "f:":
            self.parse_person(fields, 2, RelLib.Person.FEMALE, None)
        else:
            self.parse_person(fields, 1, None, None)
        return None

    def read_children_lines(self):
        """Handle the lines following "beg": one child per "-" line.

        Reads lines until end of file or the first non-empty line that does
        not start with "-" (that line is consumed).  Each child gets the
        father's surname unless the line names another one, and is linked to
        the current family.  Returns None.
        """
        if not self.current_husband_handle:
            print("Unknown father for child in line %d!" % self.lineno)
            return None
        husb = self.db.get_person_from_handle(self.current_husband_handle)
        father_surname = husb.get_primary_name().get_surname()
        if not self.current_family:
            print("Unknown family of child in line %d!" % self.lineno)
            return None

        while True:
            line = self.get_next_line()
            if line is None:
                break
            if line == "":
                continue

            fields = line.split(" ")
            if fields[0] != "-":
                break
            if len(fields) < 2:
                # A lone "-" used to raise IndexError.
                print("Missing child data in line %d!" % self.lineno)
                continue

            if fields[1] == "h":
                (idx, child) = self.parse_person(fields, 2, RelLib.Person.MALE, father_surname)
            elif fields[1] == "f":
                (idx, child) = self.parse_person(fields, 2, RelLib.Person.FEMALE, father_surname)
            else:
                (idx, child) = self.parse_person(fields, 1, RelLib.Person.UNKNOWN, father_surname)
            if not child:
                continue

            self.current_family.add_child_handle(child.get_handle())
            self.db.commit_family(self.current_family, self.trans)
            child.add_parent_family_handle(self.current_family.get_handle(),
                                           RelLib.Person.CHILD_REL_BIRTH,
                                           RelLib.Person.CHILD_REL_BIRTH)
            if self.current_child_birthplace_handle:
                # NOTE(review): this replaces a birth place given on the
                # child's own line as well -- confirm that is intended.
                birth_handle = child.get_birth_handle()
                birth = self.db.get_event_from_handle(birth_handle)
                if not birth:
                    birth = self.create_event("Birth")
                    child.set_birth_handle(birth.get_handle())
                birth.set_place_handle(self.current_child_birthplace_handle)
                self.db.commit_event(birth, self.trans)
            if self.current_child_source_handle:
                child.add_source_reference(self.current_child_source_handle)
            self.db.commit_person(child, self.trans)
        return None

    def read_children_birthplace_line(self, line, fields):
        """Handle a "cbp" line: remember the birth place for the children."""
        if not self._has_value(fields, 1, fields[0]):
            return None
        cbp = self.get_or_create_place(self.decode(fields[1]))
        if cbp:
            self.current_child_birthplace_handle = cbp.get_handle()
        return None

    def read_children_source_line(self, line, fields):
        """Handle a "csrc" line: remember the source for the children.

        Despite the attribute name, what is stored is the source reference
        returned by get_or_create_source(), not a handle.
        """
        if not self._has_value(fields, 1, fields[0]):
            return None
        csrc = self.get_or_create_source(self.decode(fields[1]))
        self.current_child_source_handle = csrc
        return None

    def read_family_comment(self, line, fields):
        """Handle a "comm" line: store the whole line as the family note."""
        if not self.current_family:
            print("Unknown family of child in line %d!" % self.lineno)
            return None
        self.current_family.set_note(line)
        self.db.commit_family(self.current_family, self.trans)
        return None

    def read_notes_lines(self, line, fields):
        """Handle a "notes" block: collect its lines as the person's note.

        The person is taken from the "notes" line itself.  Lines are read up
        to "end notes" (or end of file); lines starting with "beg" and empty
        lines before the first text are skipped.  Returns None.
        """
        (idx, person) = self.parse_person(fields, 1, None, None)
        note_lines = []
        while True:
            line = self.get_next_line()
            if line is None:
                break

            fields = line.split(" ")
            # Slice comparison: a bare "end" used to raise IndexError.
            if fields[:2] == ["end", "notes"]:
                break
            if fields[0] == "beg":
                continue
            if note_lines or line:
                note_lines.append(line)

        if note_lines:
            person.set_note("\n".join(note_lines))
            self.db.commit_person(person, self.trans)
        return None

    def parse_marriage(self, fields, idx):
        """Parse the marriage part of a "fam" line starting at fields[idx].

        Tokens before the first one starting with "+" are reported and
        skipped.  Marriage, divorce and engagement events are created on the
        current family as the data requires, "#nm" marks the family as
        unmarried, and the family is committed.  Returns the index of the
        first token after the marriage data.
        """
        mar_date = None
        mar_place = None
        mar_source = None
        sep_date = None
        div_date = None
        married = True
        engaged = False

        # Skip to the marriage marker in case the husband's description
        # left tokens that were not understood.
        while idx < len(fields) and not fields[idx].startswith("+"):
            if fields[idx]:
                print("Unknown field: '%s' in line %d!" %(fields[idx],self.lineno))
            idx += 1

        while idx < len(fields) and self._marriage_data_re.match(fields[idx]):
            field = fields[idx]
            idx += 1
            if field[0] == "+":
                # Strip the marker: the date pattern does not accept it, so
                # the marriage date was never recognised before.
                mar_date = self.parse_date(self.decode(field[1:]))
            elif field[0] == "-":
                div_date = self.parse_date(self.decode(field[1:]))
            elif field == "#mp":
                if not self._has_value(fields, idx, field):
                    break
                mar_place = self.get_or_create_place(self.decode(fields[idx]))
                idx += 1
            elif field == "#ms":
                if not self._has_value(fields, idx, field):
                    break
                mar_source = self.get_or_create_source(self.decode(fields[idx]))
                idx += 1
            elif field == "#sep":
                # Only take the next token when it really is a date, so the
                # wife's surname is never swallowed.
                (idx, sep_date) = self._optional_date(fields, idx)
            elif field == "#nm":
                married = False
            elif field == "#eng":
                engaged = True
            else:
                print("Unknown field '%s'for mariage in line %d!" % (field,self.lineno))

        if mar_date or mar_place or mar_source:
            mar = self.create_event("Marriage", None, mar_date, mar_place, mar_source)
            self.current_family.add_event_handle(mar.get_handle())

        if div_date:
            div = self.create_event("Divorce", None, div_date, None, None)
            self.current_family.add_event_handle(div.get_handle())

        if sep_date or engaged:
            # NOTE(review): a separation date is recorded as an
            # "Engagement" event, as in the original -- confirm.
            sep = self.create_event("Engagement", None, sep_date, None, None)
            self.current_family.add_event_handle(sep.get_handle())

        if not married:
            self.current_family.set_relationship(RelLib.Family.UNMARRIED)

        self.db.commit_family(self.current_family, self.trans)
        return idx

    def _add_alternate_name(self, person, first_name, surname):
        """Add an "Also Known As" alternate name to person."""
        name = RelLib.Name()
        name.set_type("Also Known As")
        name.set_first_name(first_name)
        name.set_surname(surname)
        person.add_alternate_name(name)

    def parse_person(self, fields, idx, gender, father_surname):
        """Parse one person description starting at fields[idx].

        fields         -- the tokens of the current line
        idx            -- index of the first token of the description
        gender         -- RelLib.Person gender constant, or None to leave the
                          gender untouched
        father_surname -- surname to use when the description does not give
                          one (children); a false value means the surname is
                          the first token

        The person is looked up by name or created, then names, events and
        sources found in the following data tokens are stored on it.
        Returns (idx, person) with idx pointing past the consumed tokens.
        """
        if father_surname:
            surname = father_surname
        elif idx < len(fields):
            surname = self.decode(fields[idx])
            idx += 1
        else:
            print("Missing surname of person in line %d!" % self.lineno)
            surname = ""

        if idx < len(fields):
            firstname = self.decode(fields[idx])
            idx += 1
        else:
            print("Missing firstname of person in line %d!" % self.lineno)
            firstname = ""

        # A child may carry an explicit surname right after the first name.
        if idx < len(fields) and father_surname:
            if not self._no_surname_re.match(fields[idx]):
                surname = self.decode(fields[idx])
                idx += 1

        person = self.get_or_create_person(firstname, surname)
        name = RelLib.Name()
        name.set_type("Birth Name")
        name.set_first_name(firstname)
        name.set_surname(surname)
        person.set_primary_name(name)
        if person.get_gender() == RelLib.Person.UNKNOWN and gender is not None:
            person.set_gender(gender)
        self.db.commit_person(person, self.trans)

        source = None
        places = {}             # event kind -> place
        sources = {}            # event kind -> source reference
        birth_date = None
        birth_seen = False      # first date token is the birth date
        bapt_date = None
        death_date = None
        crem_date = None
        bur_date = None

        public_name = None
        firstname_aliases = []
        nick_names = []
        name_aliases = []
        surname_aliases = []

        while idx < len(fields) and self._person_data_re.match(fields[idx]):
            field = fields[idx]
            idx += 1
            if field[0] == '(':
                public_name = self.decode(field[1:-1])
            elif field[0] == '{':
                firstname_aliases.append(self.decode(field[1:-1]))
            elif field[0] == '[':
                print("TODO: Titles: %s" % field)
            elif field in ('#apubl', '#apriv'):
                # Access flags are recognised but not stored.
                pass
            elif field in ('#buri', '#crem'):
                # The date is optional; do not swallow a following tag.
                (idx, date) = self._optional_date(fields, idx)
                if date is not None:
                    if field == '#buri':
                        bur_date = date
                    else:
                        crem_date = date
            elif (field in self._plain_value_tags
                  or field in self._place_tags
                  or field in self._source_tags):
                # A tag at the very end of the line used to raise IndexError.
                if not self._has_value(fields, idx, field):
                    break
                value = self.decode(fields[idx])
                idx += 1
                if field == '#nick':
                    nick_names.append(value)
                elif field == '#occu':
                    occu = self.create_event("Occupation", value)
                    person.add_event_handle(occu.get_handle())
                elif field == '#alias':
                    name_aliases.append(value)
                elif field == '#salias':
                    surname_aliases.append(value)
                elif field == '#image':
                    pass    # images are not imported
                elif field == '#src':
                    source = self.get_or_create_source(value)
                elif field in self._place_tags:
                    places[self._place_tags[field]] = self.get_or_create_place(value)
                else:
                    sources[self._source_tags[field]] = self.get_or_create_source(value)
            elif field[0] == '!':
                # Strip the baptism marker before parsing the date.
                bapt_date = self.parse_date(self.decode(field[1:]))
            elif self._date_token_re.match(field):
                date = self.parse_date(self.decode(field))
                if not birth_seen:
                    # Decided by position, so an unknown birth date ("0")
                    # no longer turns the death date into the birth date.
                    birth_date = date
                    birth_seen = True
                else:
                    death_date = date
            else:
                print("Unknown field '%s' for person in line %d!" % (field,self.lineno))

        if public_name:
            # The parsed name becomes an alternate name and the public name
            # takes its place as primary name.
            name = person.get_primary_name()
            name.set_type("Birth Name")
            person.add_alternate_name(name)
            name = RelLib.Name()
            name.set_type("Also Known As")
            name.set_first_name(public_name)
            name.set_surname(surname)
            person.set_primary_name(name)

        # The first nickname is stored as such, further ones as names.
        if nick_names:
            person.set_nick_name(nick_names[0])
        for aka in nick_names[1:] + firstname_aliases + name_aliases:
            self._add_alternate_name(person, aka, surname)

        for aka in surname_aliases:
            if public_name:
                self._add_alternate_name(person, public_name, aka)
            else:
                self._add_alternate_name(person, firstname, aka)

        if source:
            person.add_source_reference(source)

        birth_place = places.get('birth')
        birth_source = sources.get('birth')
        if birth_date or birth_place or birth_source:
            birth = self.create_event("Birth", None, birth_date, birth_place, birth_source)
            person.set_birth_handle(birth.get_handle())

        bapt_place = places.get('bapt')
        bapt_source = sources.get('bapt')
        if bapt_date or bapt_place or bapt_source:
            bapt = self.create_event("Baptism", None, bapt_date, bapt_place, bapt_source)
            person.add_event_handle(bapt.get_handle())

        death_place = places.get('death')
        death_source = sources.get('death')
        if death_date or death_place or death_source:
            death = self.create_event("Death", None, death_date, death_place, death_source)
            person.set_death_handle(death.get_handle())

        # Burial and cremation share the "#rp" place and "#rs" source.
        bur_place = places.get('bur')
        bur_source = sources.get('bur')
        if bur_date:
            burial = self.create_event("Burial", None, bur_date, bur_place, bur_source)
            person.add_event_handle(burial.get_handle())

        if crem_date:
            crem = self.create_event("Cremation", None, crem_date, bur_place, bur_source)
            person.add_event_handle(crem.get_handle())

        self.db.commit_person(person, self.trans)
        return (idx, person)

    def parse_date(self, field):
        """Convert a date token into a RelLib.Date.

        Returns None for "0" and for text that is neither a free-text date
        (0(text)) nor matched by the date pattern.  The caller must strip
        any leading "+", "-" or "!" marker first.
        """
        if field == "0":
            return None
        date = RelLib.Date()
        matches = _text_parse.match(field)
        if matches:
            date.set_as_text(matches.group(1))
            date.set_modifier(RelLib.Date.MOD_TEXTONLY)
            return date

        matches = _date_parse.match(field)
        if not matches:
            return None

        groups = matches.groups()
        mod = _mod_map.get(groups[0], RelLib.Date.MOD_NONE)
        if groups[3] == "..":
            mod = RelLib.Date.MOD_SPAN
            sub2 = self.sub_date(groups[4])
        else:
            sub2 = (0, 0, 0)
        cal1 = _cal_map.get(groups[2], RelLib.Date.CAL_GREGORIAN)
        sub1 = self.sub_date(groups[1])
        date.set(RelLib.Date.QUAL_NONE, mod, cal1,
                 (sub1[0], sub1[1], sub1[2], None, sub2[0], sub2[1], sub2[2], None))
        return date

    def sub_date(self, data):
        """Split "a/b/c", "b/c" or "c" into a 3-tuple of ints.

        Missing leading parts are 0: "1900" -> (0, 0, 1900) and
        "3/1900" -> (0, 3, 1900).  None, an empty string and empty
        components count as 0 instead of raising.
        """
        if not data:
            return (0, 0, 0)
        vals = [int(val or 0) for val in data.split('/')]
        if len(vals) == 1:
            return (0, 0, vals[0])
        if len(vals) == 2:
            return (0, vals[0], vals[1])
        return (vals[0], vals[1], vals[2])

    def create_event(self, type, desc=None, date=None, place=None, source=None):
        """Create an event, add it to the database, commit it and return it.

        Only the arguments that are true are stored on the event; `place` is
        a place object (its handle is stored) and `source` a source
        reference.
        """
        event = RelLib.Event()
        if type:
            event.set_name(type)
        if desc:
            event.set_description(desc)
        if date:
            event.set_date_object(date)
        if place:
            event.set_place_handle(place.get_handle())
        if source:
            event.add_source_reference(source)
        self.db.add_event(event, self.trans)
        self.db.commit_event(event, self.trans)
        return event

    def get_or_create_person(self, firstname, lastname):
        """Return the person with this name, creating it if necessary.

        A person whose first name or surname is "?" is never reused: a new
        person is created every time.
        """
        # A tuple key cannot collide the way firstname+lastname could
        # ("Ann"+"Alee" versus "Anna"+"Lee").
        mykey = (firstname, lastname)
        if mykey in self.ikeys and firstname != "?" and lastname != "?":
            return self.db.get_person_from_handle(self.ikeys[mykey])

        person = RelLib.Person()
        self.db.add_person(person, self.trans)
        self.db.commit_person(person, self.trans)
        self.ikeys[mykey] = person.get_handle()
        return person

    def get_or_create_place(self, place_name):
        """Return the place with this title, creating it if necessary."""
        if place_name in self.pkeys:
            return self.db.get_place_from_handle(self.pkeys[place_name])

        place = RelLib.Place()
        place.set_title(place_name)
        self.db.add_place(place, self.trans)
        self.db.commit_place(place, self.trans)
        self.pkeys[place_name] = place.get_handle()
        return place

    def get_or_create_source(self, source_name):
        """Return a new source reference to the source with this title.

        The source itself is created on first use and reused afterwards.
        """
        if source_name in self.skeys:
            source = self.db.get_source_from_handle(self.skeys[source_name])
        else:
            source = RelLib.Source()
            source.set_title(source_name)
            self.db.add_source(source, self.trans)
            self.db.commit_source(source, self.trans)
            self.skeys[source_name] = source.get_handle()
        sref = RelLib.SourceRef()
        sref.set_base_handle(source.get_handle())
        return sref

    def decode(self, s):
        """Turn a raw token into display text.

        Underscores become spaces, then numeric character references and
        known named entities are replaced by the character they stand for.
        References that cannot be converted (bad digits, code point out of
        range, unknown entity name) are left as they are.  `s` is expected
        to be a unicode string, as returned by get_next_line().
        """
        s = s.replace('_', ' ')

        def numeric_reference(match):
            try:
                if match.group(2):      # "x" present: hexadecimal
                    return unichr(int(match.group(3), 16))
                return unichr(int(match.group(3)))
            except (ValueError, OverflowError):
                return match.group(0)

        def named_entity(match):
            codepoint = name2codepoint.get(match.group(2))
            if codepoint is None:
                return match.group(0)
            return unichr(codepoint)

        s = self._charref_re.sub(numeric_reference, s)
        s = self._entref_re.sub(named_entity, s)
        return s
|
2004-09-25 04:12:21 +05:30
|
|
|
|
|
|
|
#-------------------------------------------------------------------------
|
|
|
|
#
|
|
|
|
#
|
|
|
|
#
|
|
|
|
#-------------------------------------------------------------------------
|
2005-02-20 00:35:48 +05:30
|
|
|
# Register this importer: GeneWeb files are recognised by their MIME type
# and offered in the file chooser through a dedicated filter.
_mime_type = const.app_geneweb
_format_name = _('GeneWeb')

_filter = gtk.FileFilter()
_filter.set_name(_('GeneWeb files'))
_filter.add_mime_type(_mime_type)

register_import(importData, _filter, _mime_type, 0, _format_name)
|