2016-06-23 11:32:45 +02:00
|
|
|
import os
|
|
|
|
import re
|
2023-10-27 00:31:44 +02:00
|
|
|
import unicodedata
|
2017-11-16 00:43:27 +01:00
|
|
|
from subprocess import CalledProcessError, check_output
|
2024-07-12 02:30:17 +02:00
|
|
|
from typing import Any
|
2016-06-23 11:32:45 +02:00
|
|
|
|
2020-08-07 01:09:47 +02:00
|
|
|
import orjson
|
2020-01-14 21:59:46 +01:00
|
|
|
import polib
|
2016-06-23 11:32:45 +02:00
|
|
|
from django.conf import settings
|
2017-10-20 07:48:47 +02:00
|
|
|
from django.conf.locale import LANG_INFO
|
2017-12-25 05:24:30 +01:00
|
|
|
from django.core.management.base import CommandParser
|
2017-11-16 00:43:27 +01:00
|
|
|
from django.core.management.commands import compilemessages
|
2021-04-16 00:57:30 +02:00
|
|
|
from django.utils.translation import gettext as _
|
2020-09-01 23:16:00 +02:00
|
|
|
from django.utils.translation import override as override_language
|
2021-08-14 16:51:57 +02:00
|
|
|
from django.utils.translation import to_language
|
2020-10-21 23:38:45 +02:00
|
|
|
from pyuca import Collator
|
2023-10-12 19:43:45 +02:00
|
|
|
from typing_extensions import override
|
2016-06-23 11:32:45 +02:00
|
|
|
|
2020-01-14 21:59:46 +01:00
|
|
|
|
2016-06-23 11:32:45 +02:00
|
|
|
class Command(compilemessages.Command):
    """Compile translations and regenerate the locale metadata JSON files.

    Extends Django's ``compilemessages`` command. After the inherited handling
    has run, two files are written under ``<settings.DEPLOY_ROOT>/locale``:

    * ``language_options.json`` -- one entry per locale with its name, local
      name, language code, locale and (except for English) the percentage of
      strings translated.
    * ``language_name_map.json`` -- the same entries with ``name`` replaced by
      the local name, ordered by Unicode collation of that name.
    """

    @override
    def add_arguments(self, parser: CommandParser) -> None:
        """Add the ``--strict``/``-s`` flag on top of the inherited arguments."""
        super().add_arguments(parser)
        parser.add_argument(
            "--strict", "-s", action="store_true", help="Stop execution in case of errors."
        )

    @override
    def handle(self, *args: Any, **options: Any) -> None:
        """Run the inherited command, then rebuild both JSON metadata files."""
        super().handle(*args, **options)
        # Read later by get_translation_percentage() to decide whether a
        # locale missing from mobile_info.json is an error.
        self.strict = options["strict"]
        # Order matters: create_language_name_map() reads the file that
        # extract_language_options() writes.
        self.extract_language_options()
        self.create_language_name_map()

    def create_language_name_map(self) -> None:
        """Write ``language_name_map.json`` derived from ``language_options.json``.

        Every entry of the ``"languages"`` list has its ``name_local`` value
        moved into ``name`` (the ``name_local`` key is dropped).  The entries
        are then sorted with a ``pyuca`` collation key of that name and stored
        under the ``"name_map"`` key.

        Raises:
            KeyError: if an entry has no ``name_local`` key or the input has
                no ``"languages"`` key.
        """
        join = os.path.join
        deploy_root = settings.DEPLOY_ROOT
        path = join(deploy_root, "locale", "language_options.json")
        output_path = join(deploy_root, "locale", "language_name_map.json")

        with open(path, "rb") as reader:
            languages = orjson.loads(reader.read())

        lang_list = []
        for lang_info in languages["languages"]:
            # From here on the local name is the only name kept for the entry.
            lang_info["name"] = lang_info.pop("name_local")
            lang_list.append(lang_info)

        collator = Collator()
        lang_list.sort(key=lambda lang: collator.sort_key(lang["name"]))

        with open(output_path, "wb") as output_file:
            output_file.write(
                orjson.dumps(
                    {"name_map": lang_list},
                    option=orjson.OPT_APPEND_NEWLINE | orjson.OPT_INDENT_2 | orjson.OPT_SORT_KEYS,
                )
            )

    def get_po_filename(self, locale_path: str, locale: str) -> str:
        """Return the path of the ``django.po`` catalogue for ``locale``."""
        return f"{locale_path}/{locale}/LC_MESSAGES/django.po"

    def get_json_filename(self, locale_path: str, locale: str) -> str:
        """Return the path of the ``translations.json`` file for ``locale``."""
        return f"{locale_path}/{locale}/translations.json"

    def get_name_from_po_file(self, po_filename: str, locale: str) -> str:
        """Return the language name recorded in a PO file's metadata.

        The name is the ``Language-Team`` metadata value up to (not including)
        its last ``" ("``.

        Raises:
            Exception: ``"Unknown language <locale>"`` when the metadata entry
                is missing or contains no ``" ("``; the underlying
                ``KeyError``/``ValueError`` is attached as the cause.
        """
        try:
            team = polib.pofile(po_filename).metadata["Language-Team"]
            return team[: team.rindex(" (")]
        except (KeyError, ValueError) as err:
            raise Exception(f"Unknown language {locale}") from err

    def get_locales(self) -> list[str]:
        """Return ``"en"`` plus every locale that has a git-tracked ``django.po``.

        Raises:
            CalledProcessError: if ``git ls-files locale`` exits with an error
                (the caller uses this to detect "not in a Git repo").
        """
        output = check_output(["git", "ls-files", "locale"], text=True)
        # The dot is escaped and the pattern is anchored at the end so that
        # only files named exactly "django.po" count; otherwise names such as
        # "django.pot" or "django.po.orig" would list a locale a second time.
        regex = re.compile(r"locale/(\w+)/LC_MESSAGES/django\.po$")
        locales = ["en"]
        for tracked_file in output.split():
            matched = regex.search(tracked_file)
            if matched:
                locales.append(matched.group(1))
        return locales

    def extract_language_options(self) -> None:
        """Write ``language_options.json`` describing every available locale.

        Locales come from :meth:`get_locales`; if the git call fails, the
        entries of the locale directory are used instead.  Entries without an
        ``LC_MESSAGES`` subdirectory are skipped.  English gets a fixed entry
        without ``percent_translated``; every other locale gets its names
        (NFC-normalized), language code, locale and translation percentage.
        """
        locale_path = f"{settings.DEPLOY_ROOT}/locale"
        output_path = f"{locale_path}/language_options.json"

        data: dict[str, list[dict[str, Any]]] = {"languages": []}

        try:
            locales = self.get_locales()
        except CalledProcessError:
            # In case we are not under a Git repo, fallback to getting the
            # locales using listdir().
            locales = os.listdir(locale_path)

        # Always include English and drop duplicates, whichever source was
        # used, so that no locale can be emitted twice.
        for locale in sorted({*locales, "en"}):
            if locale == "en":
                data["languages"].append(
                    {
                        "name": "English",
                        "name_local": "English",
                        "code": "en",
                        "locale": "en",
                    }
                )
                continue

            lc_messages_path = os.path.join(locale_path, locale, "LC_MESSAGES")
            if not os.path.exists(lc_messages_path):
                # Not a locale.
                continue

            code = to_language(locale)
            percentage = self.get_translation_percentage(locale_path, locale)
            try:
                name = LANG_INFO[code]["name"]
                name_local = LANG_INFO[code]["name_local"]
            except KeyError:
                # Fallback to getting the name from PO file.
                filename = self.get_po_filename(locale_path, locale)
                name = self.get_name_from_po_file(filename, locale)
                # Look the name up in the locale's own translations to get
                # the local spelling.
                with override_language(code):
                    name_local = _(name)

            info: dict[str, Any] = {
                "name": unicodedata.normalize("NFC", name),
                "name_local": unicodedata.normalize("NFC", name_local),
                "code": code,
                "locale": locale,
                "percent_translated": percentage,
            }
            data["languages"].append(info)

        with open(output_path, "wb") as writer:
            writer.write(
                orjson.dumps(
                    data,
                    option=orjson.OPT_APPEND_NEWLINE | orjson.OPT_INDENT_2 | orjson.OPT_SORT_KEYS,
                )
            )

    def get_translation_percentage(self, locale_path: str, locale: str) -> int:
        """Return the percentage (rounded down) of strings translated for ``locale``.

        Counts are summed over three sources: the locale's ``django.po``
        (backend), its ``translations.json`` where an empty-string value
        counts as untranslated (frontend), and the locale's entry in
        ``mobile_info.json`` (mobile).  Reads ``self.strict``, which
        :meth:`handle` sets.

        Returns:
            An integer from 0 to 100; 0 when there are no strings at all.

        Raises:
            KeyError: in strict mode, when ``locale`` has no entry in
                ``mobile_info.json``.
        """
        # backend stats
        po = polib.pofile(self.get_po_filename(locale_path, locale))
        not_translated = len(po.untranslated_entries())
        total = len(po.translated_entries()) + not_translated

        # frontend stats
        with open(self.get_json_filename(locale_path, locale), "rb") as reader:
            for value in orjson.loads(reader.read()).values():
                total += 1
                if value == "":
                    not_translated += 1

        # mobile stats
        with open(os.path.join(locale_path, "mobile_info.json"), "rb") as mob:
            mobile_info = orjson.loads(mob.read())
        try:
            info = mobile_info[locale]
        except KeyError:
            if self.strict:
                raise
            # Non-strict mode: a locale without mobile data contributes nothing.
            info = {"total": 0, "not_translated": 0}

        total += info["total"]
        not_translated += info["not_translated"]

        if total == 0:
            # Nothing to translate anywhere; avoid dividing by zero.
            return 0
        return (total - not_translated) * 100 // total
|