mirror of
				https://github.com/django/django.git
				synced 2025-10-31 01:25:32 +00:00 
			
		
		
		
	Rewrapped long docstrings and block comments to 79 characters + newline using script from https://github.com/medmunds/autofix-w505.
		
			
				
	
	
		
			404 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			404 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #!/usr/bin/env python
 | |
| #
 | |
| # This Python file contains utility scripts to manage Django translations.
 | |
| # It has to be run inside the django git root directory.
 | |
| #
 | |
| # The following commands are available:
 | |
| #
 | |
| # * update_catalogs: check for new strings in core and contrib catalogs, and
 | |
| #                    output how much strings are new/changed.
 | |
| #
 | |
| # * lang_stats: output statistics for each catalog/language combination
 | |
| #
 | |
| # * fetch: fetch translations from transifex.com
 | |
| #
 | |
| # Each command support the --languages and --resources options to limit their
 | |
| # operation to the specified language or resource. For example, to get stats
 | |
| # for Spanish in contrib.admin, run:
 | |
| #
 | |
| #  $ python scripts/manage_translations.py lang_stats -l es -r admin
 | |
| #
 | |
| # Also each command supports a --verbosity option to get progress feedback.
 | |
| 
 | |
| import json
 | |
| import os
 | |
| import subprocess
 | |
| from argparse import ArgumentParser
 | |
| from collections import defaultdict
 | |
| from configparser import ConfigParser
 | |
| from datetime import datetime
 | |
| from itertools import product
 | |
| 
 | |
| import requests
 | |
| 
 | |
| import django
 | |
| from django.conf import settings
 | |
| from django.core.management import call_command
 | |
| 
 | |
| HAVE_JS = ["admin"]
 | |
| LANG_OVERRIDES = {
 | |
|     "zh_CN": "zh_Hans",
 | |
|     "zh_TW": "zh_Hant",
 | |
| }
 | |
| 
 | |
| 
 | |
| def run(*args, verbosity=0, **kwargs):
 | |
|     if verbosity > 1:
 | |
|         print(f"\n** subprocess.run ** command: {args=} {kwargs=}")
 | |
|     return subprocess.run(*args, **kwargs)
 | |
| 
 | |
| 
 | |
| def get_api_token():
 | |
|     # Read token from ENV, otherwise read from the ~/.transifexrc file.
 | |
|     api_token = os.getenv("TRANSIFEX_API_TOKEN")
 | |
|     if not api_token:
 | |
|         parser = ConfigParser()
 | |
|         parser.read(os.path.expanduser("~/.transifexrc"))
 | |
|         api_token = parser.get("https://www.transifex.com", "token")
 | |
| 
 | |
|     assert api_token, "Please define the TRANSIFEX_API_TOKEN env var."
 | |
|     return api_token
 | |
| 
 | |
| 
 | |
| def get_api_response(endpoint, api_token=None, params=None, verbosity=0):
 | |
|     if api_token is None:
 | |
|         api_token = get_api_token()
 | |
|     headers = {
 | |
|         "Authorization": f"Bearer {api_token}",
 | |
|         "Accept": "application/vnd.api+json",
 | |
|         "Content-Type": "application/json",
 | |
|     }
 | |
|     endpoint = endpoint.strip("/")
 | |
|     url = f"https://rest.api.transifex.com/{endpoint}"
 | |
|     if verbosity > 2:
 | |
|         print(f"\n>>> GET {url=} {params=}")
 | |
|     response = requests.get(url, headers=headers, params=params)
 | |
|     if verbosity > 2:
 | |
|         print(f">>>> GET {response=}\n")
 | |
|     response.raise_for_status()
 | |
|     return response.json()["data"]
 | |
| 
 | |
| 
 | |
| def list_resources_with_updates(
 | |
|     date_since, resources=None, languages=None, verbosity=0
 | |
| ):
 | |
|     api_token = get_api_token()
 | |
|     project = "o:django:p:django"
 | |
|     date_since_iso = date_since.isoformat().strip("Z") + "Z"
 | |
|     if verbosity:
 | |
|         print(f"\n== Starting list_resources_with_updates at {date_since_iso=}")
 | |
| 
 | |
|     if not languages:
 | |
|         languages = [  # List languages using Transifex projects API.
 | |
|             d["attributes"]["code"]
 | |
|             for d in get_api_response(
 | |
|                 f"projects/{project}/languages", api_token, verbosity=verbosity
 | |
|             )
 | |
|         ]
 | |
|     if verbosity > 1:
 | |
|         print(f"\n=== Languages to process: {languages=}")
 | |
| 
 | |
|     if not resources:
 | |
|         resources = [  # List resources using Transifex resources API.
 | |
|             d["attributes"]["slug"]
 | |
|             for d in get_api_response(
 | |
|                 "resources",
 | |
|                 api_token,
 | |
|                 params={"filter[project]": project},
 | |
|                 verbosity=verbosity,
 | |
|             )
 | |
|         ]
 | |
|     else:
 | |
|         resources = [_tx_resource_slug_for_name(r) for r in resources]
 | |
|     if verbosity > 1:
 | |
|         print(f"\n=== Resources to process: {resources=}")
 | |
| 
 | |
|     resource_lang_changed = defaultdict(list)
 | |
|     for lang, resource in product(languages, resources):
 | |
|         if verbosity:
 | |
|             print(f"\n=== Getting data for: {lang=} {resource=} {date_since_iso=}")
 | |
|         data = get_api_response(
 | |
|             "resource_translations",
 | |
|             api_token,
 | |
|             params={
 | |
|                 "filter[resource]": f"{project}:r:{resource}",
 | |
|                 "filter[language]": f"l:{lang}",
 | |
|                 "filter[date_translated][gt]": date_since_iso,
 | |
|             },
 | |
|             verbosity=verbosity,
 | |
|         )
 | |
|         local_resource = resource.replace("contrib-", "", 1)
 | |
|         local_lang = lang  # XXX: LANG_OVERRIDES.get(lang, lang)
 | |
|         if data:
 | |
|             resource_lang_changed[local_resource].append(local_lang)
 | |
|             if verbosity > 2:
 | |
|                 fname = f"{local_resource}-{local_lang}.json"
 | |
|                 with open(fname, "w") as f:
 | |
|                     f.write(json.dumps(data, sort_keys=True, indent=2))
 | |
|                 print(f"==== Stored full data JSON in: {fname}")
 | |
|         if verbosity > 1:
 | |
|             print(f"==== Result for {local_resource=} {local_lang=}: {len(data)=}")
 | |
| 
 | |
|     return resource_lang_changed
 | |
| 
 | |
| 
 | |
| def _get_locale_dirs(resources, include_core=True):
 | |
|     """
 | |
|     Return a tuple (contrib name, absolute path) for all locale directories,
 | |
|     optionally including the django core catalog.
 | |
|     If resources list is not None, filter directories matching resources
 | |
|     content.
 | |
|     """
 | |
|     contrib_dir = os.path.join(os.getcwd(), "django", "contrib")
 | |
|     dirs = []
 | |
| 
 | |
|     # Collect all locale directories
 | |
|     for contrib_name in os.listdir(contrib_dir):
 | |
|         path = os.path.join(contrib_dir, contrib_name, "locale")
 | |
|         if os.path.isdir(path):
 | |
|             dirs.append((contrib_name, path))
 | |
|             if contrib_name in HAVE_JS:
 | |
|                 dirs.append(("%s-js" % contrib_name, path))
 | |
|     if include_core:
 | |
|         dirs.insert(0, ("core", os.path.join(os.getcwd(), "django", "conf", "locale")))
 | |
| 
 | |
|     # Filter by resources, if any
 | |
|     if resources is not None:
 | |
|         res_names = [d[0] for d in dirs]
 | |
|         dirs = [ld for ld in dirs if ld[0] in resources]
 | |
|         if len(resources) > len(dirs):
 | |
|             print(
 | |
|                 "You have specified some unknown resources. "
 | |
|                 "Available resource names are: %s" % (", ".join(res_names),)
 | |
|             )
 | |
|             exit(1)
 | |
|     return dirs
 | |
| 
 | |
| 
 | |
| def _tx_resource_slug_for_name(name):
 | |
|     """Return the Transifex resource slug for the given name."""
 | |
|     if name != "core":
 | |
|         name = f"contrib-{name}"
 | |
|     return name
 | |
| 
 | |
| 
 | |
| def _tx_resource_for_name(name):
 | |
|     """Return the Transifex resource name."""
 | |
|     return "django." + _tx_resource_slug_for_name(name)
 | |
| 
 | |
| 
 | |
| def _check_diff(cat_name, base_path):
 | |
|     """
 | |
|     Output the approximate number of changed/added strings in the en catalog.
 | |
|     """
 | |
|     po_path = "%(path)s/en/LC_MESSAGES/django%(ext)s.po" % {
 | |
|         "path": base_path,
 | |
|         "ext": "js" if cat_name.endswith("-js") else "",
 | |
|     }
 | |
|     p = run(
 | |
|         "git diff -U0 %s | egrep '^[-+]msgid' | wc -l" % po_path,
 | |
|         capture_output=True,
 | |
|         shell=True,
 | |
|     )
 | |
|     num_changes = int(p.stdout.strip())
 | |
|     print("%d changed/added messages in '%s' catalog." % (num_changes, cat_name))
 | |
| 
 | |
| 
 | |
| def update_catalogs(resources=None, languages=None, verbosity=0):
 | |
|     """
 | |
|     Update the en/LC_MESSAGES/django.po (main and contrib) files with
 | |
|     new/updated translatable strings.
 | |
|     """
 | |
|     settings.configure()
 | |
|     django.setup()
 | |
|     if resources is not None:
 | |
|         print("`update_catalogs` will always process all resources.")
 | |
|     contrib_dirs = _get_locale_dirs(None, include_core=False)
 | |
| 
 | |
|     os.chdir(os.path.join(os.getcwd(), "django"))
 | |
|     print("Updating en catalogs for Django and contrib apps...")
 | |
|     call_command("makemessages", locale=["en"], verbosity=verbosity)
 | |
|     print("Updating en JS catalogs for Django and contrib apps...")
 | |
|     call_command("makemessages", locale=["en"], domain="djangojs", verbosity=verbosity)
 | |
| 
 | |
|     # Output changed stats
 | |
|     _check_diff("core", os.path.join(os.getcwd(), "conf", "locale"))
 | |
|     for name, dir_ in contrib_dirs:
 | |
|         _check_diff(name, dir_)
 | |
| 
 | |
| 
 | |
| def lang_stats(resources=None, languages=None, verbosity=0):
 | |
|     """
 | |
|     Output language statistics of committed translation files for each
 | |
|     Django catalog.
 | |
|     If resources is provided, it should be a list of translation resource to
 | |
|     limit the output (e.g. ['core', 'gis']).
 | |
|     """
 | |
|     locale_dirs = _get_locale_dirs(resources)
 | |
| 
 | |
|     for name, dir_ in locale_dirs:
 | |
|         print("\nShowing translations stats for '%s':" % name)
 | |
|         langs = sorted(d for d in os.listdir(dir_) if not d.startswith("_"))
 | |
|         for lang in langs:
 | |
|             if languages and lang not in languages:
 | |
|                 continue
 | |
|             # TODO: merge first with the latest en catalog
 | |
|             po_path = "{path}/{lang}/LC_MESSAGES/django{ext}.po".format(
 | |
|                 path=dir_, lang=lang, ext="js" if name.endswith("-js") else ""
 | |
|             )
 | |
|             p = run(
 | |
|                 ["msgfmt", "-vc", "-o", "/dev/null", po_path],
 | |
|                 capture_output=True,
 | |
|                 env={"LANG": "C"},
 | |
|                 encoding="utf-8",
 | |
|                 verbosity=verbosity,
 | |
|             )
 | |
|             if p.returncode == 0:
 | |
|                 # msgfmt output stats on stderr
 | |
|                 print("%s: %s" % (lang, p.stderr.strip()))
 | |
|             else:
 | |
|                 print(
 | |
|                     "Errors happened when checking %s translation for %s:\n%s"
 | |
|                     % (lang, name, p.stderr)
 | |
|                 )
 | |
| 
 | |
| 
 | |
| def fetch(resources=None, languages=None, date_since=None, verbosity=0):
 | |
|     """
 | |
|     Fetch translations from Transifex, wrap long lines, generate mo files.
 | |
|     """
 | |
|     if date_since is None:
 | |
|         resource_lang_mapping = {}
 | |
|     else:
 | |
|         # Filter resources and languages that were updates after `date_since`
 | |
|         resource_lang_mapping = list_resources_with_updates(
 | |
|             date_since=date_since,
 | |
|             resources=resources,
 | |
|             languages=languages,
 | |
|             verbosity=verbosity,
 | |
|         )
 | |
|         resources = resource_lang_mapping.keys()
 | |
| 
 | |
|     locale_dirs = _get_locale_dirs(resources)
 | |
|     errors = []
 | |
| 
 | |
|     for name, dir_ in locale_dirs:
 | |
|         cmd = [
 | |
|             "tx",
 | |
|             "pull",
 | |
|             "-r",
 | |
|             _tx_resource_for_name(name),
 | |
|             "-f",
 | |
|             "--minimum-perc=5",
 | |
|         ]
 | |
|         per_resource_langs = resource_lang_mapping.get(name, languages)
 | |
|         # Transifex pull
 | |
|         if per_resource_langs is None:
 | |
|             run([*cmd, "--all"], verbosity=verbosity)
 | |
|             target_langs = sorted(
 | |
|                 d for d in os.listdir(dir_) if not d.startswith("_") and d != "en"
 | |
|             )
 | |
|         else:
 | |
|             run([*cmd, "-l", ",".join(per_resource_langs)], verbosity=verbosity)
 | |
|             target_langs = per_resource_langs
 | |
| 
 | |
|         target_langs = [LANG_OVERRIDES.get(d, d) for d in target_langs]
 | |
| 
 | |
|         # msgcat to wrap lines and msgfmt for compilation of .mo file
 | |
|         for lang in target_langs:
 | |
|             po_path = "%(path)s/%(lang)s/LC_MESSAGES/django%(ext)s.po" % {
 | |
|                 "path": dir_,
 | |
|                 "lang": lang,
 | |
|                 "ext": "js" if name.endswith("-js") else "",
 | |
|             }
 | |
|             if not os.path.exists(po_path):
 | |
|                 print(
 | |
|                     "No %(lang)s translation for resource %(name)s"
 | |
|                     % {"lang": lang, "name": name}
 | |
|                 )
 | |
|                 continue
 | |
|             run(
 | |
|                 ["msgcat", "--no-location", "-o", po_path, po_path], verbosity=verbosity
 | |
|             )
 | |
|             msgfmt = run(
 | |
|                 ["msgfmt", "-c", "-o", "%s.mo" % po_path[:-3], po_path],
 | |
|                 verbosity=verbosity,
 | |
|             )
 | |
|             if msgfmt.returncode != 0:
 | |
|                 errors.append((name, lang))
 | |
|     if errors:
 | |
|         print("\nWARNING: Errors have occurred in following cases:")
 | |
|         for resource, lang in errors:
 | |
|             print("\tResource %s for language %s" % (resource, lang))
 | |
|         exit(1)
 | |
| 
 | |
|     if verbosity:
 | |
|         print("\nCOMPLETED.")
 | |
| 
 | |
| 
 | |
| def add_common_arguments(parser):
 | |
|     parser.add_argument(
 | |
|         "-r",
 | |
|         "--resources",
 | |
|         action="append",
 | |
|         help="limit operation to the specified resources",
 | |
|     )
 | |
|     parser.add_argument(
 | |
|         "-l",
 | |
|         "--languages",
 | |
|         action="append",
 | |
|         help="limit operation to the specified languages",
 | |
|     )
 | |
|     parser.add_argument(
 | |
|         "-v",
 | |
|         "--verbosity",
 | |
|         default=1,
 | |
|         type=int,
 | |
|         choices=[0, 1, 2, 3],
 | |
|         help=(
 | |
|             "Verbosity level; 0=minimal output, 1=normal output, 2=verbose output, "
 | |
|             "3=very verbose output"
 | |
|         ),
 | |
|     )
 | |
| 
 | |
| 
 | |
| if __name__ == "__main__":
 | |
|     parser = ArgumentParser()
 | |
| 
 | |
|     subparsers = parser.add_subparsers(
 | |
|         dest="cmd", help="choose the operation to perform"
 | |
|     )
 | |
| 
 | |
|     parser_update = subparsers.add_parser(
 | |
|         "update_catalogs",
 | |
|         help="update English django.po files with new/updated translatable strings",
 | |
|     )
 | |
|     add_common_arguments(parser_update)
 | |
| 
 | |
|     parser_stats = subparsers.add_parser(
 | |
|         "lang_stats",
 | |
|         help="print the approximate number of changed/added strings in the en catalog",
 | |
|     )
 | |
|     add_common_arguments(parser_stats)
 | |
| 
 | |
|     parser_fetch = subparsers.add_parser(
 | |
|         "fetch",
 | |
|         help="fetch translations from Transifex, wrap long lines, generate mo files",
 | |
|     )
 | |
|     add_common_arguments(parser_fetch)
 | |
|     parser_fetch.add_argument(
 | |
|         "-s",
 | |
|         "--since",
 | |
|         dest="date_since",
 | |
|         metavar="YYYY-MM-DD",
 | |
|         type=datetime.fromisoformat,
 | |
|         help=(
 | |
|             "fetch translations that were done after this date (ISO format YYYY-MM-DD)."
 | |
|         ),
 | |
|     )
 | |
| 
 | |
|     options = parser.parse_args()
 | |
|     kwargs = options.__dict__
 | |
|     cmd = kwargs.pop("cmd")
 | |
|     eval(cmd)(**kwargs)
 |