#! /usr/bin/env python3 # # update_po - a gramps tool to update translations # # Copyright (C) 2006-2006 Kees Bakker # Copyright (C) 2006 Brian Matherly # Copyright (C) 2008 Stephen George # Copyright (C) 2012 # Copyright (C) 2020 Nick Hall # # This program is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation; either version 2 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with this program; if not, write to the Free Software # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. # """ update_po.py for Gramps translations. Examples: python update_po.py -t Tests if 'gettext' and 'python' are well configured. python update_po.py -h Calls help and command line interface. python update_po.py -p Generates a new template/catalog (gramps.pot). python update_po.py -m de.po Merges 'de.po' file with 'gramps.pot'. python update_po.py -k de.po Checks 'de.po' file, tests to compile and generates a textual resume. """ from __future__ import print_function import os import sys import shutil from argparse import ArgumentParser from tokenize import tokenize, STRING, COMMENT, NL, TokenError # Windows OS if sys.platform in ['linux', 'linux2', 'darwin', 'cygwin'] or shutil.which('msgmerge'): msgmergeCmd = 'msgmerge' msgfmtCmd = 'msgfmt' msgattribCmd = 'msgattrib' xgettextCmd = 'xgettext' pythonCmd = os.path.join(sys.prefix, 'bin', 'python3') elif sys.platform == 'win32': # GetText Win 32 obtained from http://gnuwin32.sourceforge.net/packages/gettext.htm # ....\gettext\bin\msgmerge.exe needs to be on the path msgmergeCmd = os.path.join('C:', 'Program Files(x86)', 'gettext', 'bin', 'msgmerge.exe') msgfmtCmd = os.path.join('C:', 'Program Files(x86)', 'gettext', 'bin', 'msgfmt.exe') msgattribCmd = os.path.join('C:', 'Program Files(x86)', 'gettext', 'bin', 'msgattrib.exe') xgettextCmd = os.path.join('C:', 'Program Files(x86)', 'gettext', 'bin', 'xgettext.exe') pythonCmd = os.path.join(sys.prefix, 'bin', 'python.exe') # Others OS elif sys.platform in ['linux', 'linux2', 'darwin', 'cygwin']: msgmergeCmd = 'msgmerge' msgfmtCmd = 'msgfmt' msgattribCmd = 'msgattrib' xgettextCmd = 'xgettext' pythonCmd = os.path.join(sys.prefix, 'bin', 'python3') else: print("Found platform %s, OS %s" % (sys.platform, os.name)) print ("Update PO ERROR: unknown system, don't know msgmerge, ... commands") sys.exit(0) # List of available languages, useful for grouped actions # need files with po extension LANG = [file for file in os.listdir('.') if file.endswith('.po')] # add a special 'all' argument (for 'check' and 'merge' arguments) LANG.append("all") # visual polish on the languages list LANG.sort() def tests(): """ Testing installed programs. We made tests (-t flag) by displaying versions of tools if properly installed. Cannot run all commands without 'gettext' and 'python'. """ try: print ("\n====='msgmerge'=(merge our translation)================\n") os.system('''%(program)s -V''' % {'program': msgmergeCmd}) except: print ('Please, install %(program)s for updating your translation' % {'program': msgmergeCmd}) try: print ("\n==='msgfmt'=(format our translation for installation)==\n") os.system('''%(program)s -V''' % {'program': msgfmtCmd}) except: print ('Please, install %(program)s for checking your translation' % {'program': msgfmtCmd}) try: print ("\n===='msgattrib'==(list groups of messages)=============\n") os.system('''%(program)s -V''' % {'program': msgattribCmd}) except: print ('Please, install %(program)s for listing groups of messages' % {'program': msgattribCmd}) try: print("\n===='xgettext' =(generate a new template)==============\n") os.system('''%(program)s -V''' % {'program': xgettextCmd}) except: print ('Please, install %(program)s for generating a new template' % {'program': xgettextCmd}) try: print("\n=================='python'=============================\n") os.system('''%(program)s -V''' % {'program': pythonCmd}) except: print ('Please, install python') def main(): """ The utility for handling translation stuff. What is need by Gramps, nothing more. """ parser = ArgumentParser( description='This program generates a new template and ' 'also provides some common features.', ) parser.add_argument("-t", "--test", action="store_true", dest="test", default=True, help="test if 'python' and 'gettext' are properly installed") parser.add_argument("-x", "--xml", action="store_true", dest="xml", default=False, help="extract messages from xml based file formats") parser.add_argument("-g", "--glade", action="store_true", dest="glade", default=False, help="extract messages from glade file format only") parser.add_argument("-c", "--clean", action="store_true", dest="clean", default=False, help="remove created files") parser.add_argument("-p", "--pot", action="store_true", dest="catalog", default=False, help="create a new catalog") update = parser.add_argument_group('Update', 'Maintenance around translations') # need at least one argument (sv.po, de.po, etc ...) # lang.po files maintenance update.add_argument("-m", dest="merge", choices=LANG, help="merge lang.po files with last catalog") update.add_argument("-k", dest="check", choices=LANG, help="check lang.po files") # testing stage trans = parser.add_argument_group('Translation', 'Display content of translations file') # need one argument (eg, de.po) trans.add_argument("-u", dest="untranslated", choices=[file for file in os.listdir('.') if file.endswith('.po')], help="list untranslated messages") trans.add_argument("-f", dest="fuzzy", choices=[file for file in os.listdir('.') if file.endswith('.po')], help="list fuzzy messages") args = parser.parse_args() namespace, extra = parser.parse_known_args() if args.test: tests() if args.xml: extract_xml() if args.glade: create_filesfile() extract_glade() if os.path.isfile('tmpfiles'): os.unlink('tmpfiles') if args.catalog: retrieve() if args.clean: clean() if args.merge: #retrieve() windows os? if sys.argv[2:] == ['all']: sys.argv[2:] = LANG merge(sys.argv[2:]) if args.check: #retrieve() windows os? if sys.argv[2:] == ['all']: sys.argv[2:] = LANG check(sys.argv[2:]) if args.untranslated: untranslated(sys.argv[2:]) if args.fuzzy: fuzzy(sys.argv[2:]) def create_filesfile(): """ Create a file with all files that we should translate. These are all python files not in POTFILES.skip added with those in POTFILES.in """ dir = os.getcwd() topdir = os.path.normpath(os.path.join(dir, '..', 'gramps')) lentopdir = len(topdir) with open('POTFILES.in') as f: infiles = dict(['../' + file.strip(), None] for file in f if file.strip() and not file[0]=='#') with open('POTFILES.skip') as f: notinfiles = dict(['../' + file.strip(), None] for file in f if file and not file[0]=='#') for (dirpath, dirnames, filenames) in os.walk(topdir): root, subdir = os.path.split(dirpath) if subdir.startswith("."): #don't continue in this dir dirnames[:] = [] continue for dirname in dirnames: # Skip hidden and system directories: if dirname.startswith(".") or dirname in ["po", "locale"]: dirnames.remove(dirname) #add the files which are python or glade files # if the directory does not exist or is a link, do nothing if not os.path.isdir(dirpath) or os.path.islink(dirpath): continue for filename in os.listdir(dirpath): name = os.path.split(filename)[1] if name.endswith('.py') or name.endswith('.glade'): full_filename = os.path.join(dirpath, filename) #Skip the file if in POTFILES.skip if full_filename[lentopdir:] in notinfiles: infiles['../gramps' + full_filename[lentopdir:]] = None #now we write out all the files in form ../gramps/filename with open('tmpfiles', 'w') as f: for file in sorted(infiles.keys()): f.write(file) f.write('\n') def listing(name, extensionlist): """ List files according to extensions. Parsing from a textual file (gramps) is faster and easy for maintenance. Like POTFILES.in and POTFILES.skip """ with open('tmpfiles') as f: files = [file.strip() for file in f if file and not file[0]=='#'] with open(name, 'w') as temp: for entry in files: for ext in extensionlist: if entry.endswith(ext): temp.write(entry) temp.write('\n') break def headers(): """ Look at existing C file format headers. Generated by 'intltool-extract' but want to get rid of this dependency (perl, just a set of tools). """ headers = [] # in.h; extract_xml if os.path.isfile('''fragments.pot'''): headers.append('''fragments.pot''') return headers def extract_xml(): """ Extract translation strings from XML based, mime and desktop files. Uses custom ITS rules found in the po/its directory. """ if not os.path.isfile('gramps.pot'): create_template() for input_file in ['../data/holidays.xml', '../data/tips.xml', '../data/gramps.xml.in', '../data/gramps.appdata.xml.in', '../data/gramps.desktop.in']: os.system(('GETTEXTDATADIR=. %(xgettext)s -F -j ' '-o gramps.pot --from-code=UTF-8 %(inputfile)s') % {'xgettext': xgettextCmd, 'inputfile': input_file} ) print (input_file) def create_template(): """ Create a new file for template, if it does not exist. """ with open('gramps.pot', 'w') as template: pass def extract_glade(): """ Extract messages from a temp file with all .glade """ if not os.path.isfile('gramps.pot'): create_template() listing('glade.txt', ['.glade']) os.system('''%(xgettext)s -F --add-comments -j -L Glade ''' '''--from-code=UTF-8 -o gramps.pot --files-from=glade.txt''' % {'xgettext': xgettextCmd} ) def xml_fragments(): """ search through the file for xml fragments that contain the 'translate="yes">string<' pattern. These need to be added to the message catalog """ with open('tmpfiles') as __f: files = [file.strip() for file in __f if file and not (file[0] == '#') and file.endswith('.py\n')] print("Checking for XML fragments in Python files") modop = int(len(files) / 20) wfp = open("fragments.pot", 'w', encoding='utf-8') for indx, filename in enumerate(files): if not indx % modop: print(int(indx / len(files) * 100), end='\r') fp = open(filename, 'rb') try: tokens = tokenize(fp.readline) in_string = False for _token, _text, _start, _end, _line in tokens: if _text.startswith('"""') or _text.startswith("'''"): _text = _text[3:] elif _text.startswith('"') or _text.startswith("'"): _text = _text[1:] if _text.endswith('"""') or _text.endswith("'''"): _text = _text[:-3] elif _text.endswith('"') or _text.endswith("'"): _text = _text[:-1] if _token == STRING and not in_string: in_string = True line_no = _start[0] text = _text continue elif _token == STRING and in_string: text += _text continue elif _token == COMMENT or _token == NL and in_string: # need to ignore comments and concatinate strings _ml = True continue elif in_string: in_string = False end = 0 # _find_message_in_xml(text) while True: fnd = text.find('translatable="yes">', end) if fnd == -1: break end = text.find('<', fnd) if end == -1: print("\nBad xml fragment '%s' at %s line %d" % (text[fnd:], filename, _start[0])) break msg = text[fnd + 19 : end] if "%s" in msg or (msg.startswith('{') and msg.endswith('}')): print('\n#: %s:%d Are you sure you want to ' 'translate the "%%s"???' % (filename, line_no)) break wfp.write('#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % (filename, line_no, msg)) except TokenError as e: print('\n%s: %s, line %d, column %d' % ( e.args[0], filename, e.args[1][0], e.args[1][1]), file=sys.stderr) finally: fp.close() wfp.close() def retrieve(): """ Extract messages from all files used by Gramps (python, glade, xml) """ create_template() create_filesfile() xml_fragments() listing('python.txt', ['.py', '.py.in']) # additional keywords must always be kept in sync with those in genpot.sh os.system('''%(xgettext)s -F -c -j --directory=./ -d gramps ''' '''-L Python -o gramps.pot --files-from=python.txt ''' '''--debug --keyword=_ --keyword=ngettext ''' '''--keyword=_T_ --keyword=trans_text:1,2c ''' '''--keyword=_:1,2c --keyword=_T_:1,2c ''' '''--keyword=sgettext --from-code=UTF-8''' % {'xgettext': xgettextCmd} ) extract_glade() extract_xml() # C format header (.h extension) for h in headers(): print ('xgettext for %s' % h) os.system('''%(xgettext)s -F --add-comments -j -o gramps.pot ''' '''--keyword=N_ --from-code=UTF-8 %(head)s''' % {'xgettext': xgettextCmd, 'head': h} ) clean() def clean(): """ Remove created files (C format headers, temp listings) """ for h in headers(): if os.path.isfile(h): os.unlink(h) print ('Remove %(head)s' % {'head': h}) if os.path.isfile('python.txt'): os.unlink('python.txt') print ("Remove 'python.txt'") if os.path.isfile('glade.txt'): os.unlink('glade.txt') print ("Remove 'glade.txt'") if os.path.isfile('tmpfiles'): os.unlink('tmpfiles') print ("Remove 'tmpfiles'") def merge(args): """ Merge messages with 'gramps.pot' """ for arg in args: if arg == 'all': continue print ('Merge %(lang)s with current template' % {'lang': arg}) os.system('''%(msgmerge)s -U %(lang)s gramps.pot''' \ % {'msgmerge': msgmergeCmd, 'lang': arg}) print ("Updated file: '%(lang)s'." % {'lang': arg}) def check(args): """ Check the translation file """ for arg in args: if arg == 'all': continue print ("Checked file: '%(lang.po)s'. See '%(txt)s.txt'." \ % {'lang.po': arg, 'txt': arg[:-3]}) os.system('''%(python)s ./check_po -s %(lang.po)s > %(lang)s.txt''' \ % {'python': pythonCmd, 'lang.po': arg, 'lang': arg[:-3]}) os.system('''%(msgfmt)s -c -v %(lang.po)s''' % {'msgfmt': msgfmtCmd, 'lang.po': arg}) def untranslated(arg): """ List untranslated messages """ os.system('''%(msgattrib)s --untranslated %(lang.po)s''' % {'msgattrib': msgattribCmd, 'lang.po': arg[0]}) def fuzzy(arg): """ List fuzzy messages """ os.system('''%(msgattrib)s --only-fuzzy --no-obsolete %(lang.po)s''' % {'msgattrib': msgattribCmd, 'lang.po': arg[0]}) if __name__ == "__main__": main()