django/scripts/manage_translations.py

220 lines
7.4 KiB
Python

#!/usr/bin/env python
#
# This Python file contains utility scripts to manage Django translations.
# It has to be run inside the django git root directory.
#
# The following commands are available:
#
# * update_catalogs: check for new strings in core and contrib catalogs, and
# output how much strings are new/changed.
#
# * lang_stats: output statistics for each catalog/language combination
#
# * fetch: fetch translations from transifex.com
#
# Each command support the --languages and --resources options to limit their
# operation to the specified language or resource. For example, to get stats
# for Spanish in contrib.admin, run:
#
# $ python scripts/manage_translations.py lang_stats --language=es --resources=admin
import os
from argparse import ArgumentParser
from subprocess import run
import django
from django.conf import settings
from django.core.management import call_command
HAVE_JS = ["admin"]
def _get_locale_dirs(resources, include_core=True):
"""
Return a tuple (contrib name, absolute path) for all locale directories,
optionally including the django core catalog.
If resources list is not None, filter directories matching resources content.
"""
contrib_dir = os.path.join(os.getcwd(), "django", "contrib")
dirs = []
# Collect all locale directories
for contrib_name in os.listdir(contrib_dir):
path = os.path.join(contrib_dir, contrib_name, "locale")
if os.path.isdir(path):
dirs.append((contrib_name, path))
if contrib_name in HAVE_JS:
dirs.append(("%s-js" % contrib_name, path))
if include_core:
dirs.insert(0, ("core", os.path.join(os.getcwd(), "django", "conf", "locale")))
# Filter by resources, if any
if resources is not None:
res_names = [d[0] for d in dirs]
dirs = [ld for ld in dirs if ld[0] in resources]
if len(resources) > len(dirs):
print(
"You have specified some unknown resources. "
"Available resource names are: %s" % (", ".join(res_names),)
)
exit(1)
return dirs
def _tx_resource_for_name(name):
"""Return the Transifex resource name"""
if name == "core":
return "django.core"
else:
return "django.contrib-%s" % name
def _check_diff(cat_name, base_path):
"""
Output the approximate number of changed/added strings in the en catalog.
"""
po_path = "%(path)s/en/LC_MESSAGES/django%(ext)s.po" % {
"path": base_path,
"ext": "js" if cat_name.endswith("-js") else "",
}
p = run(
"git diff -U0 %s | egrep '^[-+]msgid' | wc -l" % po_path,
capture_output=True,
shell=True,
)
num_changes = int(p.stdout.strip())
print("%d changed/added messages in '%s' catalog." % (num_changes, cat_name))
def update_catalogs(resources=None, languages=None):
"""
Update the en/LC_MESSAGES/django.po (main and contrib) files with
new/updated translatable strings.
"""
settings.configure()
django.setup()
if resources is not None:
print("`update_catalogs` will always process all resources.")
contrib_dirs = _get_locale_dirs(None, include_core=False)
os.chdir(os.path.join(os.getcwd(), "django"))
print("Updating en catalogs for Django and contrib apps...")
call_command("makemessages", locale=["en"])
print("Updating en JS catalogs for Django and contrib apps...")
call_command("makemessages", locale=["en"], domain="djangojs")
# Output changed stats
_check_diff("core", os.path.join(os.getcwd(), "conf", "locale"))
for name, dir_ in contrib_dirs:
_check_diff(name, dir_)
def lang_stats(resources=None, languages=None):
"""
Output language statistics of committed translation files for each
Django catalog.
If resources is provided, it should be a list of translation resource to
limit the output (e.g. ['core', 'gis']).
"""
locale_dirs = _get_locale_dirs(resources)
for name, dir_ in locale_dirs:
print("\nShowing translations stats for '%s':" % name)
langs = sorted(d for d in os.listdir(dir_) if not d.startswith("_"))
for lang in langs:
if languages and lang not in languages:
continue
# TODO: merge first with the latest en catalog
po_path = "{path}/{lang}/LC_MESSAGES/django{ext}.po".format(
path=dir_, lang=lang, ext="js" if name.endswith("-js") else ""
)
p = run(
["msgfmt", "-vc", "-o", "/dev/null", po_path],
capture_output=True,
env={"LANG": "C"},
encoding="utf-8",
)
if p.returncode == 0:
# msgfmt output stats on stderr
print("%s: %s" % (lang, p.stderr.strip()))
else:
print(
"Errors happened when checking %s translation for %s:\n%s"
% (lang, name, p.stderr)
)
def fetch(resources=None, languages=None):
"""
Fetch translations from Transifex, wrap long lines, generate mo files.
"""
locale_dirs = _get_locale_dirs(resources)
errors = []
for name, dir_ in locale_dirs:
# Transifex pull
if languages is None:
run(
[
"tx",
"pull",
"-r",
_tx_resource_for_name(name),
"-a",
"-f",
"--minimum-perc=5",
]
)
target_langs = sorted(
d for d in os.listdir(dir_) if not d.startswith("_") and d != "en"
)
else:
for lang in languages:
run(["tx", "pull", "-r", _tx_resource_for_name(name), "-f", "-l", lang])
target_langs = languages
# msgcat to wrap lines and msgfmt for compilation of .mo file
for lang in target_langs:
po_path = "%(path)s/%(lang)s/LC_MESSAGES/django%(ext)s.po" % {
"path": dir_,
"lang": lang,
"ext": "js" if name.endswith("-js") else "",
}
if not os.path.exists(po_path):
print(
"No %(lang)s translation for resource %(name)s"
% {"lang": lang, "name": name}
)
continue
run(["msgcat", "--no-location", "-o", po_path, po_path])
msgfmt = run(["msgfmt", "-c", "-o", "%s.mo" % po_path[:-3], po_path])
if msgfmt.returncode != 0:
errors.append((name, lang))
if errors:
print("\nWARNING: Errors have occurred in following cases:")
for resource, lang in errors:
print("\tResource %s for language %s" % (resource, lang))
exit(1)
if __name__ == "__main__":
RUNABLE_SCRIPTS = ("update_catalogs", "lang_stats", "fetch")
parser = ArgumentParser()
parser.add_argument("cmd", nargs=1, choices=RUNABLE_SCRIPTS)
parser.add_argument(
"-r",
"--resources",
action="append",
help="limit operation to the specified resources",
)
parser.add_argument(
"-l",
"--languages",
action="append",
help="limit operation to the specified languages",
)
options = parser.parse_args()
eval(options.cmd[0])(options.resources, options.languages)