gramps/po/update_po.py

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

605 lines
18 KiB
Python
Raw Normal View History

#! /usr/bin/env python3
#
# update_po - a gramps tool to update translations
#
# Copyright (C) 2006-2006 Kees Bakker
2012-03-14 14:10:21 +00:00
# Copyright (C) 2006 Brian Matherly
# Copyright (C) 2008 Stephen George
# Copyright (C) 2012
# Copyright (C) 2020 Nick Hall
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
#
"""
update_po.py for Gramps translations.

Examples:
   python update_po.py -t

      Tests if 'gettext' and 'python' are well configured.

   python update_po.py -h

      Calls help and command line interface.

   python update_po.py -p

      Generates a new template/catalog (gramps.pot).

   python update_po.py -m de.po

      Merges 'de.po' file with 'gramps.pot'.

   python update_po.py -k de.po

      Checks 'de.po' file, tests to compile and generates a textual summary.
"""
from __future__ import print_function
import os
import sys
2019-01-01 11:33:52 -06:00
import shutil
from argparse import ArgumentParser
from tokenize import tokenize, STRING, COMMENT, NL, TokenError
2023-07-31 14:40:59 +01:00
# Select the gettext tools and the Python interpreter used by the commands
# below.  POSIX-like platforms, and any platform where 'msgmerge' can already
# be found on the PATH, use the bare program names.
if sys.platform in ["linux", "linux2", "darwin", "cygwin"] or shutil.which("msgmerge"):
    msgmergeCmd = "msgmerge"
    msgfmtCmd = "msgfmt"
    msgattribCmd = "msgattrib"
    xgettextCmd = "xgettext"
    pythonCmd = os.path.join(sys.prefix, "bin", "python3")
elif sys.platform == "win32":
    # Windows OS without gettext on the PATH: fall back to a fixed location.
    # GetText Win 32 obtained from http://gnuwin32.sourceforge.net/packages/gettext.htm
    # ....\gettext\bin\msgmerge.exe needs to be on the path
    # NOTE(review): on Windows os.path.join("C:", "x") gives the drive-relative
    # path "C:x", and the directory name has no space before "(x86)" -- confirm
    # this fallback location is what is intended.
    _gettext_bin = os.path.join("C:", "Program Files(x86)", "gettext", "bin")
    msgmergeCmd = os.path.join(_gettext_bin, "msgmerge.exe")
    msgfmtCmd = os.path.join(_gettext_bin, "msgfmt.exe")
    msgattribCmd = os.path.join(_gettext_bin, "msgattrib.exe")
    xgettextCmd = os.path.join(_gettext_bin, "xgettext.exe")
    pythonCmd = os.path.join(sys.prefix, "bin", "python.exe")
else:
    # Unknown platform: the tool names cannot be guessed, so stop here and
    # report the failure through a non-zero exit status.
    print("Found platform %s, OS %s" % (sys.platform, os.name))
    print("Update PO ERROR: unknown system, don't know msgmerge, ... commands")
    sys.exit(1)
# Languages usable for grouped actions: every file with the 'po' extension
# found in the current directory, plus the special 'all' value accepted by
# the 'check' and 'merge' arguments.  Kept sorted so the list reads nicely.
LANG = sorted([name for name in os.listdir(".") if name.endswith(".po")] + ["all"])
2023-07-31 14:40:59 +01:00
def tests():
    """
    Testing installed programs.

    For the -t flag: run every required tool with ``-V`` so that it displays
    its version when properly installed.  ``os.system`` does not raise when a
    program cannot be started; it reports the problem through its return
    status, so a non-zero status is what triggers the install hint.
    """
    # (banner printed before the call, program to run, hint printed on failure)
    checks = [
        (
            "\n====='msgmerge'=(merge our translation)================\n",
            msgmergeCmd,
            "Please, install %(program)s for updating your translation",
        ),
        (
            "\n==='msgfmt'=(format our translation for installation)==\n",
            msgfmtCmd,
            "Please, install %(program)s for checking your translation",
        ),
        (
            "\n===='msgattrib'==(list groups of messages)=============\n",
            msgattribCmd,
            "Please, install %(program)s for listing groups of messages",
        ),
        (
            "\n===='xgettext' =(generate a new template)==============\n",
            xgettextCmd,
            "Please, install %(program)s for generating a new template",
        ),
        (
            "\n=================='python'=============================\n",
            pythonCmd,
            "Please, install python",
        ),
    ]

    for banner, program, hint in checks:
        print(banner)
        status = os.system("""%(program)s -V""" % {"program": program})
        if status != 0:
            print(hint % {"program": program})
2023-07-31 14:40:59 +01:00
def main():
    """
    The utility for handling translation stuff.

    Builds the command line interface, parses the arguments and runs every
    requested action in a fixed order: test, xml, glade, catalog, clean,
    merge, check, untranslated, fuzzy.

    The file names handed to the merge/check/untranslated/fuzzy actions come
    from the parsed option values, so they stay correct when several options
    are combined on one command line.
    """
    # Translation files present in the current directory; '-u' and '-f'
    # accept exactly one of them.
    po_files = [name for name in os.listdir(".") if name.endswith(".po")]

    parser = ArgumentParser(
        description="This program generates a new template and "
        "also provides some common features.",
    )
    # NOTE(review): with action="store_true" and default=True the tool tests
    # run on every invocation, whether or not '-t' is given -- confirm that
    # this is intended.
    parser.add_argument(
        "-t",
        "--test",
        action="store_true",
        dest="test",
        default=True,
        help="test if 'python' and 'gettext' are properly installed",
    )
    parser.add_argument(
        "-x",
        "--xml",
        action="store_true",
        dest="xml",
        default=False,
        help="extract messages from xml based file formats",
    )
    parser.add_argument(
        "-g",
        "--glade",
        action="store_true",
        dest="glade",
        default=False,
        help="extract messages from glade file format only",
    )
    parser.add_argument(
        "-c",
        "--clean",
        action="store_true",
        dest="clean",
        default=False,
        help="remove created files",
    )
    parser.add_argument(
        "-p",
        "--pot",
        action="store_true",
        dest="catalog",
        default=False,
        help="create a new catalog",
    )

    # lang.po files maintenance; need one argument (sv.po, de.po, all ...)
    update = parser.add_argument_group("Update", "Maintenance around translations")
    update.add_argument(
        "-m", dest="merge", choices=LANG, help="merge lang.po files with last catalog"
    )
    update.add_argument("-k", dest="check", choices=LANG, help="check lang.po files")

    # testing stage; need one argument (eg, de.po)
    trans = parser.add_argument_group(
        "Translation", "Display content of translations file"
    )
    trans.add_argument(
        "-u",
        dest="untranslated",
        choices=po_files,
        help="list untranslated messages",
    )
    trans.add_argument(
        "-f",
        dest="fuzzy",
        choices=po_files,
        help="list fuzzy messages",
    )

    args = parser.parse_args()

    if args.test:
        tests()

    if args.xml:
        extract_xml()

    if args.glade:
        create_filesfile()
        extract_glade()
        # 'tmpfiles' is only an intermediate listing; do not leave it behind
        if os.path.isfile("tmpfiles"):
            os.unlink("tmpfiles")

    if args.catalog:
        retrieve()

    if args.clean:
        clean()

    if args.merge:
        # 'all' stands for every known language file; merge() itself skips
        # the literal 'all' entry contained in LANG.
        merge(LANG if args.merge == "all" else [args.merge])

    if args.check:
        check(LANG if args.check == "all" else [args.check])

    if args.untranslated:
        untranslated([args.untranslated])

    if args.fuzzy:
        fuzzy([args.fuzzy])
2023-07-31 14:40:59 +01:00
def _read_potfiles(path):
    """Return the entries of *path* as a set, each prefixed with '../';
    blank lines and lines starting with '#' are ignored."""
    with open(path) as handle:
        return {
            "../" + line.strip()
            for line in handle
            if line.strip() and not line.startswith("#")
        }


def create_filesfile():
    """
    Create a file with all files that we should translate.

    These are all python and glade files found below ../gramps that are not
    listed in POTFILES.skip, added with those listed in POTFILES.in.  The
    result is written to 'tmpfiles' in the current directory, one entry per
    line, sorted, in the form ../gramps/filename.
    """
    topdir = os.path.normpath(os.path.join(os.getcwd(), "..", "gramps"))
    lentopdir = len(topdir)

    infiles = _read_potfiles("POTFILES.in")
    notinfiles = _read_potfiles("POTFILES.skip")

    for dirpath, dirnames, filenames in os.walk(topdir):
        if os.path.basename(dirpath).startswith("."):
            # don't continue in this dir
            dirnames[:] = []
            continue
        # Skip hidden and system directories.  Assigning to the slice prunes
        # the walk in place without removing items from the list while it is
        # being iterated (which would skip the neighbour of a removed entry).
        dirnames[:] = [
            dirname
            for dirname in dirnames
            if not dirname.startswith(".") and dirname not in ("po", "locale")
        ]
        # if the directory does not exist or is a link, do nothing
        if not os.path.isdir(dirpath) or os.path.islink(dirpath):
            continue

        # add the files which are python or glade files
        for filename in filenames:
            if not filename.endswith((".py", ".glade")):
                continue
            relative = os.path.join(dirpath, filename)[lentopdir:]
            # Same '../gramps/...' form (forward slashes) as the entries read
            # from POTFILES.in and POTFILES.skip, so the lookup can match.
            candidate = "../gramps" + relative.replace(os.sep, "/")
            # Skip the file if in POTFILES.skip
            if candidate not in notinfiles:
                infiles.add(candidate)

    # now we write out all the files in form ../gramps/filename
    with open("tmpfiles", "w") as out:
        for entry in sorted(infiles):
            out.write(entry)
            out.write("\n")
2023-07-31 14:40:59 +01:00
def listing(name, extensionlist):
    """
    Write to the file *name* the entries of 'tmpfiles' that end with one of
    the extensions in *extensionlist*.

    Lines of 'tmpfiles' starting with '#' are ignored.  Each kept entry is
    written once, on its own line, in the order it was read.
    """
    with open("tmpfiles") as source:
        entries = [raw.strip() for raw in source if not raw.startswith("#")]

    with open(name, "w") as target:
        for entry in entries:
            if any(entry.endswith(ext) for ext in extensionlist):
                target.write(entry + "\n")
2023-07-31 14:40:59 +01:00
def headers():
    """
    Return the list of generated header-style files that currently exist.

    Only 'fragments.pot' is looked for, in the current directory; the result
    is an empty list when it is not there.
    """
    candidates = ("""fragments.pot""",)
    return [name for name in candidates if os.path.isfile(name)]
2023-07-31 14:40:59 +01:00
def extract_xml():
    """
    Extract translation strings from XML based, mime and desktop files.

    Each input file is passed to xgettext, which joins its messages into
    'gramps.pot' (created empty first when missing).  GETTEXTDATADIR is set
    to the current directory for the call; the original notes say the custom
    ITS rules live in the po/its directory.
    """
    if not os.path.isfile("gramps.pot"):
        create_template()

    sources = (
        "../data/holidays.xml",
        "../data/tips.xml",
        "../data/org.gramps_project.Gramps.xml.in",
        "../data/org.gramps_project.Gramps.appdata.xml.in",
        "../data/org.gramps_project.Gramps.desktop.in",
    )
    command = (
        "GETTEXTDATADIR=. %(xgettext)s -F -j "
        "-o gramps.pot --from-code=UTF-8 %(inputfile)s"
    )
    for source in sources:
        os.system(command % {"xgettext": xgettextCmd, "inputfile": source})
        print(source)
2023-07-31 14:40:59 +01:00
def create_template():
    """
    Create an empty 'gramps.pot' template in the current directory.

    The file is opened for writing, so an existing template is emptied.
    """
    open("gramps.pot", "w").close()
2023-07-31 14:40:59 +01:00
def extract_glade():
    """
    Extract messages from all .glade files.

    The glade entries of 'tmpfiles' are first listed in 'glade.txt'; xgettext
    then reads that list and joins the messages into 'gramps.pot' (created
    empty first when missing).
    """
    if not os.path.isfile("gramps.pot"):
        create_template()

    listing("glade.txt", [".glade"])

    command = (
        """%(xgettext)s -F --add-comments -j -L Glade """
        """--from-code=UTF-8 -o gramps.pot --files-from=glade.txt"""
    )
    os.system(command % {"xgettext": xgettextCmd})
2023-07-31 14:40:59 +01:00
def _strip_quotes(text):
    """Remove one opening and one closing quote (single or triple) from *text*."""
    if text.startswith(('"""', "'''")):
        text = text[3:]
    elif text.startswith(('"', "'")):
        text = text[1:]
    if text.endswith(('"""', "'''")):
        text = text[:-3]
    elif text.endswith(('"', "'")):
        text = text[:-1]
    return text


def _write_fragments(text, filename, line_no, end_line, wfp):
    """Write to *wfp* one catalog entry per 'translatable="yes">...<' span
    found in *text*; *line_no* is where the string starts, *end_line* is the
    line reported for a fragment that has no closing '<'."""
    marker = 'translatable="yes">'
    end = 0
    while True:
        fnd = text.find(marker, end)
        if fnd == -1:
            break
        end = text.find("<", fnd)
        if end == -1:
            print(
                "\nBad xml fragment '%s' at %s line %d"
                % (text[fnd:], filename, end_line)
            )
            break
        msg = text[fnd + len(marker) : end]
        if "%s" in msg or (msg.startswith("{") and msg.endswith("}")):
            # Looks like a placeholder rather than text: warn and stop
            # scanning this string.
            print(
                (
                    "\n#: %s:%d Are you sure you want to "
                    'translate the "%%s"???'
                )
                % (filename, line_no)
            )
            break
        wfp.write('#: %s:%d\nmsgid "%s"\nmsgstr ""\n' % (filename, line_no, msg))


def xml_fragments():
    """
    Search the Python files listed in 'tmpfiles' for xml fragments that
    contain the 'translatable="yes">string<' pattern and write each such
    string as a message entry to 'fragments.pot', so that it can be added to
    the message catalog.

    Adjacent string literals (optionally separated by comments or line
    breaks) are concatenated before being searched.  A rough progress
    percentage is printed while the files are processed; tokenizer errors are
    reported on stderr and the next file is processed.
    """
    with open("tmpfiles") as listfile:
        files = [
            line.strip()
            for line in listfile
            if line and not (line[0] == "#") and line.endswith(".py\n")
        ]

    print("Checking for XML fragments in Python files")
    # Report progress about every 5%; never 0, so that the modulo below is
    # also valid when fewer than 20 files are listed.
    modop = max(1, len(files) // 20)

    with open("fragments.pot", "w", encoding="utf-8") as wfp:
        wfp.write('msgid ""\n')
        wfp.write('msgstr ""\n')
        wfp.write('"Content-Type: text/plain; charset=UTF-8\\n"\n\n')

        for indx, filename in enumerate(files):
            if not indx % modop:
                print(int(indx / len(files) * 100), end="\r")
            with open(filename, "rb") as fp:
                try:
                    in_string = False
                    for _token, _text, _start, _end, _line in tokenize(fp.readline):
                        if _token == STRING:
                            piece = _strip_quotes(_text)
                            if in_string:
                                text += piece
                            else:
                                in_string = True
                                line_no = _start[0]
                                text = piece
                            continue
                        if not in_string:
                            continue
                        if _token == COMMENT or _token == NL:
                            # need to ignore comments and concatenate strings
                            continue
                        # Any other token ends the run of string literals.
                        in_string = False
                        _write_fragments(text, filename, line_no, _start[0], wfp)
                except TokenError as e:
                    print(
                        "\n%s: %s, line %d, column %d"
                        % (e.args[0], filename, e.args[1][0], e.args[1][1]),
                        file=sys.stderr,
                    )
def retrieve():
    """
    Extract messages from all files used by Gramps (python, glade, xml)

    Starts from an empty 'gramps.pot', collects the list of source files,
    runs xgettext over the python files, the glade files, the xml files and
    the generated header files, then removes the intermediate files.
    """
    create_template()
    create_filesfile()
    xml_fragments()
    listing("python.txt", [".py", ".py.in"])

    # additional keywords must always be kept in sync with those in genpot.sh
    python_command = " ".join(
        [
            "%(xgettext)s",
            "-F",
            "--add-comments=Translators",
            "-j",
            "--directory=./",
            "-d gramps",
            "-L Python",
            "-o gramps.pot",
            "--files-from=python.txt",
            "--debug",
            "--keyword=_",
            "--keyword=ngettext",
            "--keyword=_T_",
            "--keyword=trans_text:1,2c",
            "--keyword=_:1,2c",
            "--keyword=_T_:1,2c",
            "--keyword=sgettext",
            "--from-code=UTF-8",
        ]
    )
    os.system(python_command % {"xgettext": xgettextCmd})

    extract_glade()
    extract_xml()

    # C format header (.h extension)
    header_command = (
        """%(xgettext)s -F --add-comments=Translators -j """
        """-o gramps.pot --keyword=N_ --from-code=UTF-8 %(head)s"""
    )
    for header in headers():
        print("xgettext for %s" % header)
        os.system(header_command % {"xgettext": xgettextCmd, "head": header})

    clean()
2023-07-31 14:40:59 +01:00
def clean():
    """
    Remove created files (generated headers, temp listings)

    Every file that exists is deleted and its removal is reported on stdout.
    """
    for header in headers():
        if os.path.isfile(header):
            os.unlink(header)
            print("Remove %(head)s" % {"head": header})

    for leftover in ("python.txt", "glade.txt", "tmpfiles"):
        if os.path.isfile(leftover):
            os.unlink(leftover)
            print("Remove '%s'" % leftover)
def merge(args):
    """
    Merge messages with 'gramps.pot'

    *args* is a sequence of translation file names; the special entry 'all'
    is ignored.  msgmerge updates each file in place.
    """
    po_files = [entry for entry in args if entry != "all"]
    for po_file in po_files:
        names = {"msgmerge": msgmergeCmd, "lang": po_file}
        print("Merge %(lang)s with current template" % names)
        os.system("""%(msgmerge)s -U %(lang)s gramps.pot""" % names)
        print("Updated file: '%(lang)s'." % names)
2023-07-31 14:40:59 +01:00
def check(args):
    """
    Check the translation file

    *args* is a sequence of translation file names; the special entry 'all'
    is ignored.  For each file the output of './check_po -s' is redirected
    to a '.txt' file named after it (last three characters of the name
    dropped), and 'msgfmt -c -v' is then run on the file.
    """
    for po_file in args:
        if po_file == "all":
            continue
        stem = po_file[:-3]
        print(
            "Checked file: '%(lang.po)s'. See '%(txt)s.txt'."
            % {"lang.po": po_file, "txt": stem}
        )
        report_command = """%(python)s ./check_po -s %(lang.po)s > %(lang)s.txt""" % {
            "python": pythonCmd,
            "lang.po": po_file,
            "lang": stem,
        }
        os.system(report_command)
        compile_command = """%(msgfmt)s -c -v %(lang.po)s""" % {
            "msgfmt": msgfmtCmd,
            "lang.po": po_file,
        }
        os.system(compile_command)
2023-07-31 14:40:59 +01:00
def untranslated(arg):
    """
    List untranslated messages

    *arg* is a sequence whose first item is the translation file passed to
    'msgattrib --untranslated'.
    """
    po_file = arg[0]
    command = """%(msgattrib)s --untranslated %(lang.po)s""" % {
        "msgattrib": msgattribCmd,
        "lang.po": po_file,
    }
    os.system(command)
2023-07-31 14:40:59 +01:00
def fuzzy(arg):
    """
    List fuzzy messages

    *arg* is a sequence whose first item is the translation file passed to
    'msgattrib --only-fuzzy --no-obsolete'.
    """
    po_file = arg[0]
    command = """%(msgattrib)s --only-fuzzy --no-obsolete %(lang.po)s""" % {
        "msgattrib": msgattribCmd,
        "lang.po": po_file,
    }
    os.system(command)
2023-07-31 14:40:59 +01:00
# Run the command line interface only when this file is executed as a script.
if __name__ == "__main__":
    main()