# # Gramps - a GTK+/GNOME based genealogy program # # Copyright (C) 2000-2004 Donald N. Allingham # # This program is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation; either version 2 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with this program; if not, write to the Free Software # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA # # $Id$ "Import from GEDCOM" #------------------------------------------------------------------------- # # standard python modules # #------------------------------------------------------------------------- import os import re import string import const import time #------------------------------------------------------------------------- # # GTK/GNOME Modules # #------------------------------------------------------------------------- import gtk import gtk.glade #------------------------------------------------------------------------- # # GRAMPS modules # #------------------------------------------------------------------------- import Errors import RelLib import Julian import FrenchRepublic import Hebrew import Date from ansel_utf8 import ansel_to_utf8 import latin_utf8 import Utils from GedcomInfo import * from QuestionDialog import ErrorDialog from gettext import gettext as _ #------------------------------------------------------------------------- # # constants # #------------------------------------------------------------------------- ANSEL = 1 UNICODE = 2 UPDATE = 25 db = None callback = None _title_string = _("GEDCOM") def nocnv(s): return unicode(s) photo_types = [ "jpeg", "bmp", "pict", "pntg", "tpic", "png", "gif", "jpg", "tiff", "pcx" ] file_systems = { 'VFAT' : _('Windows 9x file system'), 'FAT' : _('Windows 9x file system'), "NTFS" : _('Windows NT file system'), "ISO9660" : _('CD ROM'), "SMBFS" : _('Networked Windows file system') } #------------------------------------------------------------------------- # # GEDCOM events to GRAMPS events conversion # #------------------------------------------------------------------------- ged2gramps = {} for _val in const.personalConstantEvents.keys(): _key = const.personalConstantEvents[_val] if _key != "": ged2gramps[_key] = _val ged2fam = {} for _val in const.familyConstantEvents.keys(): _key = const.familyConstantEvents[_val] if _key != "": ged2fam[_key] = _val #------------------------------------------------------------------------- # # regular expressions # #------------------------------------------------------------------------- intRE = re.compile(r"\s*(\d+)\s*$") lineRE = re.compile(r"\s*(\d+)\s+(\S+)\s*(.*)$") headRE = re.compile(r"\s*(\d+)\s+HEAD") nameRegexp= re.compile(r"/?([^/]*)(/([^/]*)(/([^/]*))?)?") snameRegexp= re.compile(r"/([^/]*)/([^/]*)") calRegexp = re.compile(r"\s*(ABT|BEF|AFT)?\s*@#D([^@]+)@\s*(.*)$") fromtoRegexp = re.compile(r"\s*(FROM|BET)\s+@#D([^@]+)@\s*(.*)\s+(AND|TO)\s+@#D([^@]+)@\s*(.*)$") #------------------------------------------------------------------------- # # # #------------------------------------------------------------------------- def importData(database, filename, cb=None): global callback # add some checking here glade_file = "%s/gedcomimport.glade" % os.path.dirname(__file__) statusTop = gtk.glade.XML(glade_file,"status","gramps") statusWindow = statusTop.get_widget("status") Utils.set_titles(statusWindow,statusTop.get_widget('title'), _('GEDCOM import status')) statusTop.get_widget("close").set_sensitive(0) statusTop.signal_autoconnect({ "destroy_passed_object" : Utils.destroy_passed_object }) try: g = GedcomParser(database,filename,statusTop) except IOError,msg: Utils.destroy_passed_object(statusWindow) ErrorDialog(_("%s could not be opened\n") % filename,str(msg)) return except: Utils.destroy_passed_object(statusWindow) ErrorDialog(_("%s could not be opened\n") % filename) return try: close = g.parse_gedcom_file() g.resolve_refns() except IOError,msg: Utils.destroy_passed_object(statusWindow) errmsg = _("%s could not be opened\n") % filename ErrorDialog(errmsg,str(msg)) return except Errors.GedcomError, val: (m1,m2) = val.messages() Utils.destroy_passed_object(statusWindow) ErrorDialog(m1,m2) return except: import DisplayTrace Utils.destroy_passed_object(statusWindow) DisplayTrace.DisplayTrace() return statusTop.get_widget("close").set_sensitive(1) if close: statusWindow.destroy() if cb: statusWindow.destroy() cb(1) elif callback: callback() #------------------------------------------------------------------------- # # # #------------------------------------------------------------------------- class DateStruct: def __init__(self): self.date = "" self.time = "" #------------------------------------------------------------------------- # # # #------------------------------------------------------------------------- class GedcomParser: SyntaxError = "Syntax Error" BadFile = "Not a GEDCOM file" def __init__(self, dbase, file, window): self.db = dbase self.person = None self.pmap = {} self.fmap = {} self.smap = {} self.nmap = {} self.share_note = [] self.refn = {} self.added = {} self.gedmap = GedcomInfoDB() self.gedsource = None self.dir_path = os.path.dirname(file) self.localref = 0 self.placemap = {} self.broken_conc_list = [ 'FamilyOrigins', 'FTW' ] self.broken_conc = 0 self.is_ftw = 0 self.f = open(file,"r") self.filename = file self.index = 0 self.backoff = 0 self.cnv = nocnv self.geddir = os.path.dirname(os.path.normpath(os.path.abspath(file))) self.trans = string.maketrans('','') self.delc = self.trans[0:31] self.trans2 = self.trans[0:128] + ('?' * 128) self.window = window if window: self.file_obj = window.get_widget("file") self.encoding_obj = window.get_widget("encoding") self.created_obj = window.get_widget("created") self.version_obj = window.get_widget("version") self.families_obj = window.get_widget("families") self.people_obj = window.get_widget("people") self.errors_obj = window.get_widget("errors") self.close_done = window.get_widget('close_done') self.error_text_obj = window.get_widget("error_text") self.info_text_obj = window.get_widget("info_text") self.error_count = 0 map = const.personalConstantAttributes self.attrs = map.values() self.gedattr = {} for val in map.keys(): self.gedattr[map[val]] = val if self.window: self.update(self.file_obj,os.path.basename(file)) self.search_paths = [] try: mypaths = [] f = open("/proc/mounts","r") for line in f.xreadlines(): paths = string.split(line) ftype = paths[2].upper() if ftype in file_systems.keys(): mypaths.append((paths[1],file_systems[ftype])) self.search_paths.append(paths[1]) f.close() if len(mypaths): self.infomsg(_("Windows style path names for images will use the following mount " "points to try to find the images. These paths are based on Windows " "compatible file systems available on this system:\n\n")) for p in mypaths: self.infomsg("\t%s : %s\n" % p) self.infomsg('\n') self.infomsg(_("Images that cannot be found in the specfied path in the GEDCOM file " "will be searched for in the same directory in which the GEDCOM file " "exists (%s).\n") % self.geddir) except: pass def errmsg(self,msg): if self.window: try: self.error_text_obj.get_buffer().insert_at_cursor(msg) except TypeError: self.error_text_obj.get_buffer().insert_at_cursor(msg,len(msg)) else: print msg def infomsg(self,msg): if self.window: try: self.info_text_obj.get_buffer().insert_at_cursor(msg) except TypeError: self.info_text_obj.get_buffer().insert_at_cursor(msg,len(msg)) else: print msg def find_file(self,fullname,altpath): tries = [] fullname = string.replace(fullname,'\\','/') tries.append(fullname) if os.path.isfile(fullname): return (1,fullname) other = os.path.join(altpath,os.path.basename(fullname)) tries.append(other) if os.path.isfile(other): return (1,other) if len(fullname) > 3: if fullname[1] == ':': fullname = fullname[2:] for path in self.search_paths: other = os.path.normpath("%s/%s" % (path,fullname)) tries.append(other) if os.path.isfile(other): return (1,other) return (0,tries) else: return (0,tries) def update(self,field,text): field.set_text(text) while gtk.events_pending(): gtk.main_iteration() def get_next(self): if self.backoff == 0: next_line = self.f.readline() self.text = string.translate(next_line.strip(),self.trans,self.delc) try: self.text = self.cnv(self.text) except: self.text = string.translate(self.text,self.trans2) self.index += 1 l = string.split(self.text, None, 2) ln = len(l) try: if ln == 2: self.groups = (int(l[0]),l[1],"") else: self.groups = (int(l[0]),l[1],l[2]) except: if self.text == "": msg = _("Warning: line %d was blank, so it was ignored.\n") % self.index else: msg = _("Warning: line %d was not understood, so it was ignored.") % self.index msg = "%s\n\t%s\n" % (msg,self.text) self.errmsg(msg) self.error_count = self.error_count + 1 self.groups = (999, "XXX", "XXX") self.backoff = 0 return self.groups def barf(self,level): import traceback msg = _("Warning: line %d was not understood, so it was ignored.") % self.index self.errmsg(msg) msg = "\n\t%s\n" % self.text self.errmsg(msg) self.error_count = self.error_count + 1 # self.errmsg(string.join(traceback.format_stack())) self.ignore_sub_junk(level) def warn(self,msg): self.errmsg(msg) self.error_count = self.error_count + 1 def backup(self): self.backoff = 1 def parse_gedcom_file(self): t = time.time() self.index = 0 self.fam_count = 0 self.indi_count = 0 try: self.parse_header() self.parse_submitter() self.parse_record() self.parse_trailer() except Errors.GedcomError, err: self.errmsg(str(err)) if self.window: self.update(self.families_obj,str(self.fam_count)) self.update(self.people_obj,str(self.indi_count)) self.break_note_links() t = time.time() - t msg = _('Import Complete: %d seconds') % t if self.window: self.infomsg("\n%s" % msg) else: print msg print "Families: %d" % self.fam_count print "Individuals: %d" % self.indi_count return None def break_note_links(self): for o in self.share_note: o.unique_note() def parse_trailer(self): matches = self.get_next() if matches[1] != "TRLR": self.barf(0) self.f.close() def parse_header(self): self.parse_header_head() self.parse_header_source() def parse_submitter(self): matches = self.get_next() if matches[2] != "SUBM": self.backup() return else: self.ignore_sub_junk(1) def parse_source(self,name,level): self.source = self.db.find_source(name,self.smap) note = "" while 1: matches = self.get_next() if int(matches[0]) < level: if note: self.source.set_note(note) if not self.source.get_title(): self.source.set_title("No title - ID %s" % self.source.get_id()) self.db.commit_source(self.source) self.backup() return elif matches[1] == "TITL": title = matches[2] + self.parse_continue_data(level+1) title = string.replace(title,'\n',' ') self.source.set_title(title) elif matches[1] == "TAXT" or matches[1] == "PERI": # EasyTree Sierra On-Line if self.source.get_title() == "": title = matches[2] + self.parse_continue_data(level+1) title = string.replace(title,'\n',' ') self.source.set_title(title) elif matches[1] == "AUTH": self.source.set_author(matches[2] + self.parse_continue_data(level+1)) elif matches[1] == "PUBL": self.source.set_publication_info(matches[2] + self.parse_continue_data(level+1)) elif matches[1] == "OBJE": self.ignore_sub_junk(2) elif matches[1] == "NOTE": note = self.parse_note(matches,self.source,level+1,note) elif matches[1] == "TEXT": note = self.source.get_note() d = self.parse_continue_data(level+1) if note: note = "%s\n%s %s%s" % (note,matches[1],matches[2],d) else: note = "%s %s%s" % (matches[1],matches[2],d) elif matches[1] == "ABBR": self.source.set_abbreviation(matches[2] + self.parse_continue_data(level+1)) else: note = self.source.get_note() if note: note = "%s\n%s %s" % (note,matches[1],matches[2]) else: note = "%s %s" % (matches[1],matches[2]) def parse_record(self): while 1: matches = self.get_next() if matches[2] == "FAM": if self.fam_count % UPDATE == 0 and self.window: self.update(self.families_obj,str(self.fam_count)) self.fam_count = self.fam_count + 1 self.family = self.db.find_family_with_map(matches[1],self.fmap) self.parse_family() if self.addr != None: father = self.family.get_father_id() if father: father.add_address(self.addr) self.db.commit_person(father) mother = self.family.get_mother_id() if mother: mother.add_address(self.addr) self.db.commit_person(mother) for child in self.family.get_child_id_list(): child.add_address(self.addr) self.db.commit_person(child) self.db.commit_family(self.family) del self.family elif matches[2] == "INDI": if self.indi_count % UPDATE == 0 and self.window: self.update(self.people_obj,str(self.indi_count)) self.indi_count = self.indi_count + 1 id = matches[1] id = id[1:-1] self.person = self.find_or_create_person(id) self.added[self.person.get_id()] = 1 self.parse_individual() self.db.commit_person(self.person) del self.person elif matches[2] in ["SUBM","SUBN","REPO"]: self.ignore_sub_junk(1) elif matches[1] in ["SUBM","SUBN","OBJE","_EVENT_DEFN"]: self.ignore_sub_junk(1) elif matches[2] == "SOUR": self.parse_source(matches[1],1) elif matches[2][0:4] == "NOTE": if self.nmap.has_key(matches[1]): noteobj = self.nmap[matches[1]] else: noteobj = RelLib.Note() self.nmap[matches[1]] = noteobj text = matches[2][4:] # noteobj.append(text + self.parse_continue_data(1)) noteobj.append(text + self.parse_note_continue(1)) self.parse_note_data(1) elif matches[1] == "TRLR": self.backup() return else: self.barf(1) def find_or_create_person(self,id): if self.pmap.has_key(id): person = self.db.find_person_from_id(self.pmap[id]) elif self.db.has_person_id(id): person = RelLib.Person() self.pmap[id] = self.db.add_person(person) else: person = RelLib.Person(id) self.db.add_person_as(person) self.pmap[id] = id return person def parse_cause(self,event,level): while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return elif matches[1] == "SOUR": event.add_source_reference(self.handle_source(matches,level+1)) else: self.barf(1) def parse_note_data(self,level): while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return elif matches[1] in ["SOUR","CHAN","REFN"]: self.ignore_sub_junk(level+1) elif matches[1] == "RIN": pass else: self.barf(level+1) def parse_ftw_relations(self,level): mrel = "Birth" frel = "Birth" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return (mrel,frel) # FTW elif matches[1] == "_FREL": if string.lower(matches[2]) != "natural": frel = string.capitalize(matches[2]) # FTW elif matches[1] == "_MREL": if string.lower(matches[2]) != "natural": mrel = matches[2] elif matches[1] == "ADOP": mrel = "Adopted" frel = "Adopted" # Legacy elif matches[1] == "_STAT": mrel = matches[2] frel = matches[2] # Legacy _PREF elif matches[1][0] == "_": pass else: self.barf(level+1) def parse_family(self): self.addr = None note = "" while 1: matches = self.get_next() if int(matches[0]) == 0: self.backup() return elif matches[1] == "HUSB": id = matches[2] person = self.find_or_create_person(id[1:-1]) self.family.set_father_id(person.get_id()) self.ignore_sub_junk(2) elif matches[1] == "WIFE": id = matches[2] person = self.find_or_create_person(id[1:-1]) self.family.set_mother_id(person.get_id()) self.ignore_sub_junk(2) elif matches[1] == "SLGS": ord = RelLib.LdsOrd() self.family.set_lds_sealing(ord) self.parse_ord(ord,2) elif matches[1] == "ADDR": self.addr = RelLib.Address() self.addr.set_street(matches[2] + self.parse_continue_data(1)) self.parse_address(self.addr,2) elif matches[1] == "CHIL": mrel,frel = self.parse_ftw_relations(2) id = matches[2] child = self.find_or_create_person(id[1:-1]) self.family.add_child_id(child.get_id()) for f in child.get_parent_family_id_list(): if f[0] == self.family.get_id(): break else: if (mrel=="Birth" or mrel=="") and (frel=="Birth" or frel==""): child.set_main_parent_family_id(self.family.get_id()) else: if child.get_main_parents_family_id() == self.family: child.set_main_parent_family_id(None) child.add_parent_family_id(self.family.get_id(),mrel,frel) self.db.commit_person(child) elif matches[1] == "NCHI": a = RelLib.Attribute() a.set_type("Number of Children") a.set_value(matches[2]) self.family.add_attribute(a) elif matches[1] in ["RIN", "SUBM", "REFN","CHAN","SOUR"]: self.ignore_sub_junk(2) elif matches[1] == "OBJE": if matches[2] and matches[2][0] == '@': self.barf(2) else: self.parse_family_object(2) elif matches[1] == "_COMM": note = string.strip(matches[2]) + self.parse_continue_data(1) self.family.set_note(note) self.ignore_sub_junk(2) elif matches[1] == "NOTE": note = self.parse_note(matches,self.family,1,note) else: event = RelLib.Event() try: event.set_name(ged2fam[matches[1]]) except: event.set_name(matches[1]) if event.get_name() == "Marriage": self.family.set_relationship("Married") self.db.add_event(event) self.family.add_event_id(event.get_id()) self.parse_family_event(event,2) self.db.commit_event(event) del event def parse_note_base(self,matches,obj,level,old_note,task): note = old_note if matches[2] and matches[2][0] == "@": if self.nmap.has_key(matches[2]): self.share_note.append(obj) obj.set_note_object(self.nmap[matches[2]]) else: noteobj = RelLib.Note() self.nmap[matches[2]] = noteobj self.share_note.append(obj) obj.set_note_object(noteobj) else: if old_note: note = "%s\n%s%s" % (old_note,matches[2],self.parse_continue_data(level)) else: note = matches[2] + self.parse_continue_data(level) task(note) self.ignore_sub_junk(level+1) return note def parse_note(self,matches,obj,level,old_note): return self.parse_note_base(matches,obj,level,old_note,obj.set_note) def parse_comment(self,matches,obj,level,old_note): return self.parse_note_base(matches,obj,level,old_note,obj.set_comments) def parse_individual(self): name_cnt = 0 note = "" while 1: matches = self.get_next() if int(matches[0]) == 0: self.backup() return elif matches[1] == "NAME": name = RelLib.Name() m = snameRegexp.match(matches[2]) if m: n = m.groups()[0] n2 = m.groups()[1] names = (n2,'',n,'','') else: try: names = nameRegexp.match(matches[2]).groups() except: names = (matches[2],"","","","") if names[0]: name.set_first_name(names[0].strip()) if names[2]: name.set_surname(names[2].strip()) if names[4]: name.set_suffix(names[4].strip()) if name_cnt == 0: self.person.set_primary_name(name) else: self.person.add_alternate_name(name) name_cnt = name_cnt + 1 self.parse_name(name,2) elif matches[1] in ["ALIA","_ALIA"]: aka = RelLib.Name() try: names = nameRegexp.match(matches[2]).groups() except: names = (matches[2],"","","","") if names[0]: aka.set_first_name(names[0]) if names[2]: aka.set_surname(names[2]) if names[4]: aka.set_suffix(names[4]) self.person.add_alternate_name(aka) elif matches[1] == "OBJE": if matches[2] and matches[2][0] == '@': self.barf(2) else: self.parse_person_object(2) elif matches[1] in ["NOTE","_COMM"]: note = self.parse_note(matches,self.person,1,note) elif matches[1] == "SEX": if matches[2] == '': self.person.set_gender(RelLib.Person.unknown) elif matches[2][0] == "M": self.person.set_gender(RelLib.Person.male) else: self.person.set_gender(RelLib.Person.female) elif matches[1] in [ "BAPL", "ENDL", "SLGC" ]: ord = RelLib.LdsOrd() if matches[1] == "BAPL": self.person.set_lds_baptism(ord) elif matches[1] == "ENDL": self.person.set_lds_endowment(ord) else: self.person.set_lds_sealing(ord) self.parse_ord(ord,2) elif matches[1] == "FAMS": family = self.db.find_family_with_map(matches[2],self.fmap) self.person.add_family_id(family.get_id()) if note == "": note = self.parse_optional_note(2) else: note = "%s\n\n%s" % (note,self.parse_optional_note(2)) self.db.commit_family(family) elif matches[1] == "FAMC": type,note = self.parse_famc_type(2) family = self.db.find_family_with_map(matches[2],self.fmap) for f in self.person.get_parent_family_id_list(): if f[0] == family.get_id(): break else: if type == "" or type == "Birth": if self.person.get_main_parents_family_id() == None: self.person.set_main_parent_family_id(family.get_id()) else: self.person.add_parent_family_id(family.get_id(),"Unknown","Unknown") else: if self.person.get_main_parents_family_id() == family.get_id(): self.person.set_main_parent_family_id(None) self.person.add_parent_family_id(family.get_id(),type,type) self.db.commit_family(family) elif matches[1] == "RESI": addr = RelLib.Address() self.person.add_address(addr) self.parse_residence(addr,2) elif matches[1] == "ADDR": addr = RelLib.Address() addr.set_street(matches[2] + self.parse_continue_data(1)) self.parse_address(addr,2) self.person.add_address(addr) elif matches[1] == "PHON": addr = RelLib.Address() addr.set_street("Unknown") addr.set_phone(matches[2]) self.person.add_address(addr) elif matches[1] == "BIRT": event = RelLib.Event() self.db.add_event(event) if self.person.get_birth_id(): event.set_name("Alternate Birth") self.person.add_event_id(event.get_id()) else: event.set_name("Birth") self.person.set_birth_id(event.get_id()) self.parse_person_event(event,2) self.db.commit_event(event) elif matches[1] == "ADOP": event = RelLib.Event() event.set_name("Adopted") self.person.add_event_id(event.get_id()) self.parse_adopt_event(event,2) self.db.add_event(event) elif matches[1] == "DEAT": event = RelLib.Event() self.db.add_event(event) if self.person.get_death_id(): event.set_name("Alternate Death") self.person.add_event_id(event.get_id()) else: event.set_name("Death") self.person.set_death_id(event.get_id()) self.parse_person_event(event,2) self.db.commit_event(event) elif matches[1] == "EVEN": event = RelLib.Event() if matches[2]: event.set_description(matches[2]) self.parse_person_event(event,2) n = string.strip(event.get_name()) if n in self.attrs: attr = RelLib.Attribute() attr.set_type(self.gedattr[n]) attr.set_value(event.get_description()) self.person.add_attribute(attr) else: self.db.add_event(event) self.person.add_event_id(event.get_id()) elif matches[1] == "SOUR": source_ref = self.handle_source(matches,2) self.person.get_primary_name().add_source_reference(source_ref) elif matches[1] == "REFN": if intRE.match(matches[2]): try: self.refn[self.person.get_id()] = int(matches[2]) except: pass elif matches[1] in ["AFN","CHAN","REFN","ASSO"]: self.ignore_sub_junk(2) elif matches[1] in ["ANCI","DESI","RIN","RFN","_UID"]: pass else: event = RelLib.Event() n = string.strip(matches[1]) if ged2gramps.has_key(n): event.set_name(ged2gramps[n]) elif self.gedattr.has_key(n): attr = RelLib.Attribute() attr.set_type(self.gedattr[n]) attr.set_value(event.get_description()) self.person.add_attribute(attr) self.parse_person_attr(attr,2) continue else: val = self.gedsource.tag2gramps(n) if val: event.set_name(val) else: event.set_name(n) self.parse_person_event(event,2) if matches[2]: event.set_description(matches[2]) self.db.add_event(event) self.person.add_event_id(event.get_id()) def parse_optional_note(self,level): note = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return note elif matches[1] == "NOTE": if not string.strip(matches[2]) or matches[2] and matches[2][0] != "@": note = matches[2] + self.parse_continue_data(level+1) self.parse_note_data(level+1) else: self.ignore_sub_junk(level+1) else: self.barf(level+1) def parse_famc_type(self,level): type = "" note = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return (string.capitalize(type),note) elif matches[1] == "PEDI": type = matches[2] elif matches[1] == "SOUR": source_ref = self.handle_source(matches,level+1) self.person.get_primary_name().add_source_reference(source_ref) elif matches[1] == "_PRIMARY": pass #type = matches[1] elif matches[1] == "NOTE": if not string.strip(matches[2]) or matches[2] and matches[2][0] != "@": note = matches[2] + self.parse_continue_data(level+1) self.parse_note_data(level+1) else: self.ignore_sub_junk(level+1) else: self.barf(level+1) def parse_person_object(self,level): form = "" file = "" title = "" note = "" while 1: matches = self.get_next() if matches[1] == "FORM": form = string.lower(matches[2]) elif matches[1] == "TITL": title = matches[2] elif matches[1] == "FILE": file = matches[2] elif matches[1] == "NOTE": note = matches[2] + self.parse_continue_data(level+1) elif matches[1][0] == "_": self.ignore_sub_junk(level+1) elif int(matches[0]) < level: self.backup() break else: self.barf(level+1) if form == "url": url = RelLib.Url() url.set_path(file) url.set_description(title) self.person.add_url(url) else: (ok,path) = self.find_file(file,self.dir_path) if not ok: self.warn(_("Warning: could not import %s") % file + "\n") self.warn(_("\tThe following paths were tried:\n\t\t")) self.warn(string.join(path,"\n\t\t")) self.warn('\n') else: photo = RelLib.MediaObject() photo.set_path(path) photo.set_description(title) photo.set_mime_type(Utils.get_mime_type(path)) self.db.add_object(photo) oref = RelLib.MediaRef() oref.set_reference_id(photo.get_id()) self.person.add_media_reference(oref) self.db.commit_person(self.person) def parse_family_object(self,level): form = "" file = "" title = "" note = "" while 1: matches = self.get_next() if matches[1] == "FORM": form = string.lower(matches[2]) elif matches[1] == "TITL": title = matches[2] elif matches[1] == "FILE": file = matches[2] elif matches[1] == "NOTE": note = matches[2] + self.parse_continue_data(level+1) elif int(matches[0]) < level: self.backup() break else: self.barf(level+1) if form: (ok,path) = self.find_file(file,self.dir_path) if not ok: self.warn(_("Warning: could not import %s") % file + "\n") self.warn(_("\tThe following paths were tried:\n\t\t")) self.warn(string.join(path,"\n\t\t")) self.warn('\n') else: photo = RelLib.MediaObject() photo.set_path(path) photo.set_description(title) photo.set_mime_type(Utils.get_mime_type(path)) self.db.add_object(photo) oref = RelLib.MediaRef() oref.set_reference_id(photo.get_id()) self.family.add_media_reference(photo) self.db.commit_family(self.family) def parse_residence(self,address,level): note = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return elif matches[1] == "DATE": address.set_date_object(self.extract_date(matches[2])) elif matches[1] == "ADDR": address.set_street(matches[2] + self.parse_continue_data(level+1)) self.parse_address(address,level+1) elif matches[1] in ["AGE","AGNC","CAUS","STAT","TEMP","OBJE","TYPE","_DATE2"]: self.ignore_sub_junk(level+1) elif matches[1] == "SOUR": address.add_source_reference(self.handle_source(matches,level+1)) elif matches[1] == "PLAC": address.set_street(matches[2]) self.parse_address(address,level+1) elif matches[1] == "PHON": address.set_street("Unknown") address.set_phone(matches[2]) elif matches[1] == "NOTE": note = self.parse_note(matches,address,level+1,note) else: self.barf(level+1) def parse_address(self,address,level): first = 0 note = "" while 1: matches = self.get_next() if int(matches[0]) < level: if matches[1] == "PHON": address.set_phone(matches[2]) else: self.backup() return elif matches[1] in [ "ADDR", "ADR1", "ADR2" ]: val = address.get_street() data = self.parse_continue_data(level+1) if first == 0: val = "%s %s" % (matches[2],data) first = 1 else: val = "%s,%s %s" % (val,matches[2],data) address.set_street(val) elif matches[1] == "CITY": address.set_city(matches[2]) elif matches[1] == "STAE": address.set_state(matches[2]) elif matches[1] == "POST": address.set_postal_code(matches[2]) elif matches[1] == "CTRY": address.setCountry(matches[2]) else: self.barf(level+1) def parse_ord(self,ord,level): note = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() break elif matches[1] == "TEMP": ord.set_temple(matches[2]) elif matches[1] == "DATE": ord.set_date_object(self.extract_date(matches[2])) elif matches[1] == "FAMC": ord.set_family_id(self.db.find_family_with_map(matches[2],self.fmap)) elif matches[1] == "PLAC": try: val = matches[2] if self.placemap.has_key(val): place_id = self.placemap[val] else: place = RelLib.Place() place.set_title(matches[2]) self.db.add_place(place) place_id = place.get_id() self.placemap[val] = place_id ord.set_place_id(place_id) self.ignore_sub_junk(level+1) except NameError: pass elif matches[1] == "SOUR": ord.add_source_reference(self.handle_source(matches,level+1)) elif matches[1] == "NOTE": note = self.parse_note(matches,ord,level+1,note) elif matches[1] == "STAT": if const.lds_status.has_key(matches[2]): ord.set_status(const.lds_status[matches[2]]) else: self.barf(level+1) def parse_person_event(self,event,level): note = "" while 1: matches = self.get_next() if int(matches[0]) < level: if note: event.set_note(note) self.backup() break elif matches[1] == "TYPE": if event.get_name() == "": if ged2gramps.has_key(matches[2]): name = ged2gramps[matches[2]] else: val = self.gedsource.tag2gramps(matches[2]) if val: name = val else: name = matches[2] event.set_name(name) elif matches[1] == "DATE": event.set_date_object(self.extract_date(matches[2])) elif matches[1] == "SOUR": event.add_source_reference(self.handle_source(matches,level+1)) elif matches[1] == "PLAC": val = matches[2] n = string.strip(event.get_name()) if self.is_ftw and n in ["Occupation","Degree","SSN"]: event.set_description(val) self.ignore_sub_junk(level+1) else: if self.placemap.has_key(val): place_id = self.placemap[val] else: place = RelLib.Place() place.set_title(matches[2]) self.db.add_place(place) place_id = place.get_id() self.placemap[val] = place_id event.set_place_id(place_id) self.ignore_sub_junk(level+1) elif matches[1] == "CAUS": info = matches[2] + self.parse_continue_data(level+1) event.set_cause(info) self.parse_cause(event,level+1) elif matches[1] == "NOTE" or matches[1] == 'OFFI': info = matches[2] + self.parse_continue_data(level+1) if note == "": note = info else: note = "\n%s" % info elif matches[1] == "CONC": d = event.get_description() if self.broken_conc: event.set_description("%s %s" % (d, matches[2])) else: event.set_description("%s%s" % (d, matches[2])) elif matches[1] == "CONT": event.set_description("%s\n%s" % (event.get_description(),matches[2])) elif matches[1] in ["RELI", "TIME","ADDR","AGE","AGNC","STAT","TEMP","OBJE","_DATE2"]: self.ignore_sub_junk(level+1) else: self.barf(level+1) def parse_adopt_event(self,event,level): note = "" while 1: matches = self.get_next() if int(matches[0]) < level: if note != "": event.set_note(note) self.backup() break elif matches[1] == "DATE": event.set_date_object(self.extract_date(matches[2])) elif matches[1] in ["TIME","ADDR","AGE","AGNC","STAT","TEMP","OBJE"]: self.ignore_sub_junk(level+1) elif matches[1] == "SOUR": event.add_source_reference(self.handle_source(matches,level+1)) elif matches[1] == "FAMC": family = self.db.find_family_with_map(matches[2],self.fmap) mrel,frel = self.parse_adopt_famc(level+1); if self.person.get_main_parents_family_id() == family.get_id(): self.person.set_main_parent_family_id(None) self.person.add_parent_family_id(family.get_id(),mrel,frel) elif matches[1] == "PLAC": val = matches[2] if self.placemap.has_key(val): place_id = self.placemap[val] else: place = RelLib.Place() place.set_title(matches[2]) self.db.add_place(place) place_id = place.get_id() self.placemap[val] = place_id event.set_place_id(place_id) self.ignore_sub_junk(level+1) elif matches[1] == "TYPE": # eventually do something intelligent here pass elif matches[1] == "CAUS": info = matches[2] + self.parse_continue_data(level+1) event.set_cause(info) self.parse_cause(event,level+1) elif matches[1] == "NOTE": info = matches[2] + self.parse_continue_data(level+1) if note == "": note = info else: note = "\n%s" % info elif matches[1] == "CONC": d = event.get_description() if self.broken_conc: event.set_description("%s %s" % (d,matches[2])) else: event.set_description("%s%s" % (d,matches[2])) elif matches[1] == "CONT": d = event.get_description() event.set_description("%s\n%s" % (d,matches[2])) else: self.barf(level+1) def parse_adopt_famc(self,level): mrel = "Adopted" frel = "Adopted" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return (mrel,frel) elif matches[1] == "ADOP": if matches[2] == "HUSB": mrel = "Birth" elif matches[2] == "WIFE": frel = "Birth" else: self.barf(level+1) def parse_person_attr(self,attr,level): note = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() break elif matches[1] == "TYPE": if attr.get_type() == "": if ged2gramps.has_key(matches[2]): name = ged2gramps[matches[2]] else: val = self.gedsource.tag2gramps(matches[2]) if val: name = val else: name = matches[2] attr.set_name(name) elif matches[1] in ["CAUS", "DATE","TIME","ADDR","AGE","AGNC","STAT","TEMP","OBJE"]: self.ignore_sub_junk(level+1) elif matches[1] == "SOUR": attr.add_source_reference(self.handle_source(matches,level+1)) elif matches[1] == "PLAC": val = matches[2] if attr.get_value() == "": attr.set_value(val) self.ignore_sub_junk(level+1) elif matches[1] == "DATE": note = "%s\n\n" % ("Date : %s" % matches[2]) elif matches[1] == "NOTE": info = matches[2] + self.parse_continue_data(level+1) if note == "": note = info else: note = "%s\n\n%s" % (note,info) elif matches[1] == "CONC": if self.broken_conc: attr.set_value("%s %s" % (attr.get_value(), matches[2])) else: attr.set_value("%s %s" % (attr.get_value(), matches[2])) elif matches[1] == "CONT": attr.set_value("%s\n%s" % (attr.get_value(),matches[2])) else: self.barf(level+1) if note != "": attr.set_note(note) def parse_family_event(self,event,level): note = "" while 1: matches = self.get_next() if int(matches[0]) < level: if note: event.set_note(note) self.backup() break elif matches[1] == "TYPE": if event.get_name() == "" or event.get_name() == 'EVEN': try: event.set_name(ged2fam[matches[2]]) except: event.set_name(matches[2]) else: note = 'Status = %s\n' % matches[2] elif matches[1] == "DATE": event.set_date_object(self.extract_date(matches[2])) elif matches[1] == "CAUS": info = matches[2] + self.parse_continue_data(level+1) event.set_cause(info) self.parse_cause(event,level+1) elif matches[1] in ["TIME","AGE","AGNC","ADDR","STAT", "TEMP","HUSB","WIFE","OBJE","_CHUR"]: self.ignore_sub_junk(level+1) elif matches[1] == "SOUR": event.add_source_reference(self.handle_source(matches,level+1)) elif matches[1] == "PLAC": val = matches[2] if self.placemap.has_key(val): place_id = self.placemap[val] else: place = RelLib.Place() place.set_title(matches[2]) self.db.add_place(place) place_id = place.get_id() self.placemap[val] = place_id event.set_place_id(place_id) self.ignore_sub_junk(level+1) elif matches[1] == 'OFFI': if note == "": note = matches[2] else: note = note + "\n" + matches[2] elif matches[1] == "NOTE": note = self.parse_note(matches,event,level+1,note) else: self.barf(level+1) def parse_source_reference(self,source,level): """Reads the data associated with a SOUR reference""" note = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return elif matches[1] == "PAGE": source.set_page(matches[2] + self.parse_continue_data(level+1)) elif matches[1] == "DATA": date,text = self.parse_source_data(level+1) d = Date.Date() d.set(date) source.set_date(d) source.set_text(text) elif matches[1] in ["OBJE","REFN","TEXT"]: self.ignore_sub_junk(level+1) elif matches[1] == "QUAY": val = int(matches[2]) if val > 1: source.set_confidence_level(val+1) else: source.set_confidence_level(val) elif matches[1] == "NOTE": note = self.parse_comment(matches,source,level+1,note) else: self.barf(level+1) def parse_source_data(self,level): """Parses the source data""" date = "" note = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return (date,note) elif matches[1] == "DATE": date = matches[2] elif matches[1] == "TEXT": note = matches[2] + self.parse_continue_data(level+1) else: self.barf(level+1) def parse_name(self,name,level): """Parses the person's name information""" note = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return elif matches[1] in ["ALIA","_ALIA"]: aka = RelLib.Name() try: names = nameRegexp.match(matches[2]).groups() except: names = (matches[2],"","","","") if names[0]: aka.set_first_name(names[0]) if names[2]: aka.set_surname(names[2]) if names[4]: aka.set_suffix(names[4]) self.person.add_alternate_name(aka) elif matches[1] == "NPFX": name.set_title(matches[2]) elif matches[1] == "GIVN": name.set_first_name(matches[2]) elif matches[1] == "SPFX": name.set_surname_prefix(matches[2]) elif matches[1] == "SURN": name.set_surname(matches[2]) elif matches[1] == "_MARNM": self.parse_marnm(self.person,matches[2].strip()) elif matches[1] == "TITL": name.set_suffix(matches[2]) elif matches[1] == "NSFX": if name.get_suffix() == "": name.set_suffix(matches[2]) elif matches[1] == "NICK": self.person.set_nick_name(matches[2]) elif matches[1] == "_AKA": lname = string.split(matches[2]) l = len(lname) if l == 1: self.person.set_nick_name(matches[2]) else: name = RelLib.Name() name.set_surname(lname[-1]) name.set_first_name(string.join(lname[0:l-1])) self.person.add_alternate_name(name) elif matches[1] == "SOUR": name.add_source_reference(self.handle_source(matches,level+1)) elif matches[1][0:4] == "NOTE": note = self.parse_note(matches,name,level+1,note) else: self.barf(level+1) def parse_marnm(self,person,text): data = text.split() if len(data) == 1: name = RelLib.Name(person.get_primary_name()) name.set_surname(data[0]) name.set_type('Married Name') person.add_alternate_name(name) elif len(data) > 1: name = RelLib.Name() name.set_surname(data[-1]) name.set_first_name(string.join(data[0:-1],' ')) name.set_type('Married Name') person.add_alternate_name(name) def parse_header_head(self): """validiates that this is a valid GEDCOM file""" line = string.replace(self.f.readline(),'\r','') match = headRE.search(line) if not match: raise Errors.GedcomError("%s is not a GEDCOM file" % self.filename) self.index = self.index + 1 def parse_header_source(self): genby = "" while 1: matches = self.get_next() if int(matches[0]) == 0: self.backup() return elif matches[1] == "SOUR": if self.window and self.created_obj.get_text(): self.update(self.created_obj,matches[2]) self.gedsource = self.gedmap.get_from_source_tag(matches[2]) self.broken_conc = self.gedsource.get_conc() if matches[2] == "FTW": self.is_ftw = 1 genby = matches[2] elif matches[1] == "NAME" and self.window: self.update(self.created_obj,matches[2]) elif matches[1] == "VERS" and self.window: self.update(self.version_obj,matches[2]) pass elif matches[1] in ["CORP","DATA","SUBM","SUBN","COPR","FILE","LANG"]: self.ignore_sub_junk(2) elif matches[1] == "DEST": if genby == "GRAMPS": self.gedsource = self.gedmap.get_from_source_tag(matches[2]) self.broken_conc = self.gedsource.get_conc() elif matches[1] == "CHAR": if matches[2] == "UNICODE" or matches[2] == "UTF-8" or matches[2] == "UTF8": self.cnv = nocnv elif matches[2] == "ANSEL": self.cnv = ansel_to_utf8 else: self.cnv = latin_utf8.latin_to_utf8 self.ignore_sub_junk(2) if self.window: self.update(self.encoding_obj,matches[2]) elif matches[1] == "GEDC": self.ignore_sub_junk(2) elif matches[1] == "_SCHEMA": self.parse_ftw_schema(2) elif matches[1] == "PLAC": self.parse_place_form(2) elif matches[1] == "DATE": date = self.parse_date(2) date.date = matches[2] elif matches[1] == "NOTE": note = matches[2] + self.parse_continue_data(2) elif matches[1][0] == "_": self.ignore_sub_junk(2) else: self.barf(2) def parse_ftw_schema(self,level): while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return elif matches[1] == "INDI": self.parse_ftw_indi_schema(level+1) elif matches[1] == "FAM": self.parse_ftw_fam_schema(level+1) else: self.barf(2) def parse_ftw_indi_schema(self,level): while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return else: label = self.parse_label(level+1) ged2gramps[matches[1]] = label def parse_label(self,level): while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return elif matches[1] == "LABL": return matches[2] else: self.barf(2) def parse_ftw_fam_schema(self,level): while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return else: label = self.parse_label(level+1) ged2fam[matches[1]] = label def ignore_sub_junk(self,level): while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return def ignore_change_data(self,level): matches = self.get_next() if matches[1] == "CHAN": self.ignore_sub_junk(level+1) else: self.backup() def parse_place_form(self,level): while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return elif matches[1] != "FORM": self.barf(level+1) def parse_continue_data(self,level): data = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return data elif matches[1] == "CONC": if self.broken_conc: data = "%s %s" % (data,matches[2]) else: data = "%s%s" % (data,matches[2]) elif matches[1] == "CONT": data = "%s\n%s" % (data,matches[2]) else: self.backup() return data def parse_note_continue(self,level): data = "" while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return data elif matches[1] == "NOTE": data = "%s\n%s%s" % (data,matches[2],self.parse_continue_data(level+1)) elif matches[1] == "CONC": if self.broken_conc: data = "%s %s" % (data,matches[2]) else: data = "%s%s" % (data,matches[2]) elif matches[1] == "CONT": data = "%s\n%s" % (data,matches[2]) else: self.backup() return data def parse_date(self,level): date = DateStruct() while 1: matches = self.get_next() if int(matches[0]) < level: self.backup() return date elif matches[1] == "TIME": date.time = matches[2] else: self.barf(level+1) def extract_date(self,text): dateobj = Date.Date() try: match = fromtoRegexp.match(text) if match: (cal1,data1,cal2,data2) = match.groups() if cal1 != cal2: pass if cal1 == "FRENCH R": dateobj.set_calendar(FrenchRepublic.FrenchRepublic) elif cal1 == "JULIAN": dateobj.set_calendar(Julian.Julian) elif cal1 == "HEBREW": dateobj.set_calendar(Hebrew.Hebrew) dateobj.get_start_date().set(data1) dateobj.get_stop_date().set(data2) dateobj.set_range(1) return dateobj match = calRegexp.match(text) if match: (abt,cal,data) = match.groups() if cal == "FRENCH R": dateobj.set_calendar(FrenchRepublic.FrenchRepublic) elif cal == "JULIAN": dateobj.set_calendar(Julian.Julian) elif cal == "HEBREW": dateobj.set_calendar(Hebrew.Hebrew) dateobj.set(data) if abt: dateobj.get_start_date().setMode(abt) else: dateobj.set(text) except: dateobj.set_text(text) return dateobj def handle_source(self,matches,level): source_ref = RelLib.SourceRef() if matches[2] and matches[2][0] != "@": self.localref = self.localref + 1 ref = "gsr%d" % self.localref s = self.db.find_source(ref,self.smap) source_ref.set_base_id(s.get_id()) s.set_title('Imported Source #%d' % self.localref) s.set_note(matches[2] + self.parse_continue_data(level)) self.ignore_sub_junk(level+1) else: source_ref.set_base_id(self.db.find_source(matches[2],self.smap).get_id()) self.parse_source_reference(source_ref,level) return source_ref def resolve_refns(self): prefix = self.db.iprefix index = 0 new_pmax = self.db.pmap_index for pid in self.added.keys(): index = index + 1 if self.refn.has_key(pid): val = self.refn[pid] new_key = prefix % val new_pmax = max(new_pmax,val) person = self.db.find_person_from_id(pid) # new ID is not used if not self.db.has_person_id(new_key): self.db.remove_person_id(pid) person.set_id(new_key) self.db.add_person(person) else: tp = self.db.find_person_from_id(new_key) # same person, just change it if person == tp: self.db.remove_person_id(pid) person.set_id(new_key) self.db.add_person_as(person) # give up trying to use the refn as a key else: pass self.db.pmap_index = new_pmax #------------------------------------------------------------------------- # # # #------------------------------------------------------------------------- def readData(database,active_person,cb): global db global callback global file_top db = database callback = cb choose = gtk.FileChooserDialog("%s - GRAMPS" % _title_string, None, gtk.FILE_CHOOSER_ACTION_OPEN, (gtk.STOCK_CANCEL, gtk.RESPONSE_CANCEL, gtk.STOCK_OPEN, gtk.RESPONSE_OK)) filter = gtk.FileFilter() filter.set_name(_('GEDCOM files')) filter.add_pattern('*.ged') filter.add_pattern('*.GED') choose.add_filter(filter) filter = gtk.FileFilter() filter.set_name(_('All files')) filter.add_pattern('*') choose.add_filter(filter) response = choose.run() if response == gtk.RESPONSE_OK: filename = choose.get_filename() choose.destroy() try: importData(db,filename) except: import DisplayTrace DisplayTrace.DisplayTrace() else: choose.destroy() #------------------------------------------------------------------------- # # # #------------------------------------------------------------------------- from Plugins import register_import register_import(readData,_title_string)