2023-04-23 08:37:35 +00:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
|
|
|
|
import json
|
|
|
|
import os
|
|
|
|
import sys
|
|
|
|
import urllib.request
|
|
|
|
import shutil
|
|
|
|
import zipfile
|
|
|
|
import re
|
|
|
|
import xml.etree.ElementTree as ET
|
|
|
|
|
|
|
|
def main():
|
|
|
|
use_cache = True
|
|
|
|
|
|
|
|
script_dir = os.path.dirname(os.path.realpath(__file__))
|
2023-04-26 03:09:44 +00:00
|
|
|
root_dir = os.path.dirname(os.path.dirname(script_dir))
|
2023-04-23 08:37:35 +00:00
|
|
|
|
2023-04-26 03:09:44 +00:00
|
|
|
locales_dir = os.path.join(root_dir, 'chrome', 'locale')
|
|
|
|
schema_dir = os.path.join(root_dir, 'resource', 'schema')
|
2023-04-23 08:37:35 +00:00
|
|
|
|
|
|
|
# AMO download links for Firefox language packs
|
|
|
|
language_packs = [
|
|
|
|
["en-US", "https://addons.mozilla.org/en-US/firefox/addon/english-us-language-pack/"],
|
|
|
|
["af", "https://addons.mozilla.org/en-US/firefox/addon/afrikaans-language-pack/", "af-ZA"],
|
|
|
|
["ar", "https://addons.mozilla.org/en-US/firefox/addon/%D8%A7%D9%84%D8%B9%D8%B1%D8%A8%D9%8A%D8%A9-language-pack/"],
|
|
|
|
["bg", "https://addons.mozilla.org/en-US/firefox/addon/%D0%B1%D1%8A%D0%BB%D0%B3%D0%B0%D1%80%D1%81%D0%BA%D0%B8-language-pack/", "bg-BG"],
|
2023-04-26 03:15:30 +00:00
|
|
|
["br", "https://addons.mozilla.org/af/firefox/addon/breton-language-pack-for-firef/", "br"],
|
2023-04-23 08:37:35 +00:00
|
|
|
["ca", "https://addons.mozilla.org/en-US/firefox/addon/ca-language-pack/", "ca-AD"],
|
|
|
|
["cs", "https://addons.mozilla.org/en-US/firefox/addon/czech-cz-language-pack/", "cs-CZ"],
|
|
|
|
["da", "https://addons.mozilla.org/en-US/firefox/addon/dansk-da-language-pack/", "da-DK"],
|
|
|
|
["de", "https://addons.mozilla.org/en-US/firefox/addon/deutsch-de-language-pack/"],
|
|
|
|
["el", "https://addons.mozilla.org/en-US/firefox/addon/greek-gr-language-pack/", "el-GR"],
|
|
|
|
["en-GB", "https://addons.mozilla.org/en-US/firefox/addon/english-gb-language-pack/"],
|
|
|
|
["es-ES", "https://addons.mozilla.org/en-US/firefox/addon/espa%C3%B1ol-espa%C3%B1a-language-pac/"],
|
|
|
|
["eu", "https://addons.mozilla.org/en-US/firefox/addon/basque-language-pack/", "eu-ES"],
|
|
|
|
["fr", "https://addons.mozilla.org/en-US/firefox/addon/fran%C3%A7ais-language-pack/", "fr-FR"],
|
|
|
|
["et", "https://addons.mozilla.org/en-US/firefox/addon/eesti-et-keele-pakk/", "et-EE"],
|
|
|
|
["eu", "https://addons.mozilla.org/en-US/firefox/addon/basque-language-pack/", "eu-ES"],
|
|
|
|
["fa", "https://addons.mozilla.org/en-US/firefox/addon/persian-ir-%D9%81%D8%A7%D8%B1%D8%B3%DB%8C-%D8%A7%DB%8C%D8%B1%D8%A7%D9%86-lang/"],
|
|
|
|
["fi", "https://addons.mozilla.org/en-US/firefox/addon/finnish-language-pack/", "fi-FI"],
|
|
|
|
["gl", "https://addons.mozilla.org/en-US/firefox/addon/galician-galiza-language-pack/", "gl-ES"],
|
|
|
|
["he", "https://addons.mozilla.org/en-US/firefox/addon/hebrew-il-language-pack/", "he-IL"],
|
|
|
|
["hr", "https://addons.mozilla.org/en-US/firefox/addon/hrvatski-hr-language-pack/", "hr-HR"],
|
|
|
|
["hu", "https://addons.mozilla.org/en-US/firefox/addon/magyar-nyelvi/", "hu-HU"],
|
|
|
|
["id", "https://addons.mozilla.org/en-US/firefox/addon/indonesian-langpack/", "id-ID"],
|
|
|
|
["is", "https://addons.mozilla.org/en-US/firefox/addon/icelandic-is-language-pack/", "is-IS"],
|
|
|
|
["it", "https://addons.mozilla.org/en-US/firefox/addon/italiano-it-language-pack/", "it-IT"],
|
|
|
|
["ja", "https://addons.mozilla.org/en-US/firefox/addon/japanese-language-pack-1/", "ja-JP"],
|
|
|
|
["km", "https://addons.mozilla.org/en-US/firefox/addon/%E1%9E%81%E1%9E%98%E1%9E%9A-language-pack/"],
|
|
|
|
["ko", "https://addons.mozilla.org/en-US/firefox/addon/korean-kr-language-pack/", "ko-KR"],
|
|
|
|
["lt", "https://addons.mozilla.org/en-US/firefox/addon/lietuvi%C5%B3-language-pack/", "lt-LT"],
|
|
|
|
["nb-NO", "https://addons.mozilla.org/en-US/firefox/addon/norsk-bokm%C3%A5l-no-language-pa/"],
|
|
|
|
["nn-NO", "https://addons.mozilla.org/en-US/firefox/addon/norsk-nynorsk-no-language-p/"],
|
|
|
|
["nl", "https://addons.mozilla.org/en-US/firefox/addon/nederlands-nl-language-pack/", "nl-NL"],
|
|
|
|
["pl", "https://addons.mozilla.org/en-US/firefox/addon/polski-language-pack/", "pl-PL"],
|
|
|
|
["pt-BR", "https://addons.mozilla.org/en-US/firefox/addon/firefox-br/"],
|
|
|
|
["pt-PT", "https://addons.mozilla.org/en-US/firefox/addon/portugu%C3%AAs-portugal-language/"],
|
|
|
|
["ro", "https://addons.mozilla.org/en-US/firefox/addon/romanian-language-pack/", "ro-RO"],
|
|
|
|
["ru", "https://addons.mozilla.org/en-US/firefox/addon/russian-ru-language-pack/", "ru-RU"],
|
|
|
|
["sk", "https://addons.mozilla.org/en-US/firefox/addon/slovak-sk-language-pack/", "sk-SK"],
|
|
|
|
["sl", "https://addons.mozilla.org/en-US/firefox/addon/slovenski-jezik-language-pa/", "sl-SI"],
|
|
|
|
["sr", "https://addons.mozilla.org/en-US/firefox/addon/%D1%81%D1%80%D0%BF%D1%81%D0%BA%D0%B8-sr-language-pack/", "sr-RS"],
|
|
|
|
["sv-SE", "https://addons.mozilla.org/en-US/firefox/addon/svenska-se-language-pack/", "sv-SE"],
|
2024-02-27 11:58:59 +00:00
|
|
|
#["ta", "https://addons.mozilla.org/en-US/firefox/addon/tamil-language-pack-1/", "ta"],
|
|
|
|
["ta", "https://web.archive.org/web/20210724103430/https://addons.mozilla.org/en-US/firefox/addon/tamil-language-pack-1/", "ta"],
|
2023-04-23 08:37:35 +00:00
|
|
|
["th", "https://addons.mozilla.org/en-US/firefox/addon/thai-language-pack/", "th-TH"],
|
|
|
|
["tr", "https://addons.mozilla.org/en-US/firefox/addon/t%C3%BCrk%C3%A7e-tr-language-pack/", "tr-TR"],
|
|
|
|
["uk", "https://addons.mozilla.org/en-US/firefox/addon/ukrainian-language-pack/", "uk-UA"],
|
|
|
|
["vi", "https://addons.mozilla.org/en-US/firefox/addon/vietnamese-language-pack/", "vi-VN"],
|
|
|
|
["zh-CN", "https://addons.mozilla.org/en-US/firefox/addon/chinese-simplified-zh-cn-la/"],
|
|
|
|
["zh-TW", "https://addons.mozilla.org/en-US/firefox/addon/traditional-chinese-zh-tw-l/"]
|
|
|
|
]
|
|
|
|
|
|
|
|
# Can be a string or a dict containing 'file' and 'patterns'
|
|
|
|
entries = [
|
|
|
|
#"chrome/{0}/locale/{0}/global/dateFormat.properties",
|
2023-05-10 10:23:45 +00:00
|
|
|
#"chrome/{0}/locale/{0}/mozapps/update/updates.properties",
|
2023-04-23 08:37:35 +00:00
|
|
|
"chrome/{0}/locale/{0}/global/editMenuOverlay.dtd",
|
|
|
|
{
|
|
|
|
"file": "chrome/{0}/locale/{0}/global/intl.properties",
|
|
|
|
"grep_patterns": [
|
|
|
|
"^pluralRule",
|
|
|
|
"^intl.accept_languages"
|
|
|
|
]
|
|
|
|
},
|
2023-04-23 06:55:36 +00:00
|
|
|
"browser/localization/{0}/browser/menubar.ftl",
|
|
|
|
"localization/{0}/toolkit/global/textActions.ftl",
|
|
|
|
"localization/{0}/toolkit/global/wizard.ftl"
|
2023-04-23 08:37:35 +00:00
|
|
|
]
|
|
|
|
|
|
|
|
extracted_files = {}
|
|
|
|
for entry in entries:
|
|
|
|
entry_filename = get_entry_filename(entry)
|
|
|
|
if entry_filename != 'dateFormat.properties':
|
|
|
|
extracted_files[entry_filename] = set()
|
|
|
|
|
|
|
|
date_formats = {}
|
|
|
|
|
|
|
|
first = True
|
|
|
|
for pack in language_packs:
|
|
|
|
lang, url, *rest = pack
|
|
|
|
|
|
|
|
if len(rest):
|
|
|
|
locale = rest[0]
|
|
|
|
else:
|
|
|
|
locale = lang
|
|
|
|
|
|
|
|
pack_dir = os.path.join(script_dir, 'packs', lang)
|
|
|
|
locale_dir = os.path.join(locales_dir, locale, 'zotero', 'mozilla')
|
|
|
|
|
|
|
|
if not os.path.exists(pack_dir):
|
|
|
|
os.makedirs(pack_dir)
|
|
|
|
if not os.path.exists(locale_dir):
|
|
|
|
os.mkdir(locale_dir)
|
|
|
|
|
|
|
|
if not first:
|
|
|
|
print()
|
|
|
|
first = False
|
|
|
|
|
|
|
|
print("Loading from " + url)
|
|
|
|
with urllib.request.urlopen(url) as response:
|
|
|
|
code = response.getcode()
|
|
|
|
if code != 200:
|
|
|
|
sys.sterr.write("Got {0} for {1}\n".format(code, url))
|
|
|
|
return 1
|
|
|
|
|
|
|
|
html = str(response.read(), 'utf-8')
|
|
|
|
xpi_url = json.loads(
|
|
|
|
'"' + re.match('.*(https:[^"]+\.xpi)', html, flags=re.DOTALL).group(1) + '"'
|
|
|
|
)
|
|
|
|
file_name = xpi_url.split("/")[-1]
|
|
|
|
pack_file = os.path.join(pack_dir, file_name)
|
|
|
|
|
|
|
|
if use_cache and os.path.isfile(pack_file):
|
|
|
|
print("Using cached file for " + pack_file)
|
|
|
|
else:
|
|
|
|
print("Downloading " + xpi_url)
|
|
|
|
with urllib.request.urlopen(xpi_url) as response, open(pack_file, 'wb') as f:
|
|
|
|
shutil.copyfileobj(response, f)
|
|
|
|
|
2023-05-10 10:23:45 +00:00
|
|
|
# Code to extract 'updates' files from old langpacks
|
|
|
|
#pack_file = None
|
|
|
|
#for file in os.listdir(pack_dir):
|
|
|
|
# print(file)
|
|
|
|
# if file.startswith("addon-"):
|
|
|
|
# pack_file = os.path.join(pack_dir, file)
|
|
|
|
# break
|
|
|
|
#if not pack_file:
|
|
|
|
# continue
|
|
|
|
|
2023-04-23 08:37:35 +00:00
|
|
|
# Unzip selected files straight to target locale dirs
|
|
|
|
with zipfile.ZipFile(pack_file, "r") as zip_ref:
|
|
|
|
for entry in entries:
|
|
|
|
entry_path = get_entry_path(entry)
|
|
|
|
entry_filename = get_entry_filename(entry)
|
|
|
|
formatted_path = entry_path.format(lang)
|
|
|
|
|
|
|
|
try:
|
|
|
|
zip_ref.getinfo(formatted_path)
|
|
|
|
except KeyError:
|
|
|
|
print("'{0}' not found in {1}".format(formatted_path, pack_file))
|
|
|
|
continue
|
|
|
|
|
|
|
|
with zip_ref.open(formatted_path) as source:
|
|
|
|
# Add date formats to JSON object
|
|
|
|
if entry_filename == 'dateFormat.properties':
|
|
|
|
date_formats[locale] = {
|
|
|
|
"short": [],
|
|
|
|
"long": []
|
|
|
|
}
|
|
|
|
pattern = re.compile(r"^month\.\d+\.(Mmm|name)\s*=\s*(.+)$")
|
|
|
|
for line in source:
|
|
|
|
matches = pattern.match(str(line, 'utf-8'))
|
|
|
|
if matches:
|
|
|
|
if matches.group(1) == "Mmm":
|
|
|
|
date_formats[locale]["short"].append(
|
|
|
|
matches.group(2).strip()
|
|
|
|
)
|
|
|
|
else:
|
|
|
|
date_formats[locale]["long"].append(
|
|
|
|
matches.group(2).strip()
|
|
|
|
)
|
|
|
|
# Extract other files
|
|
|
|
else:
|
|
|
|
target_path = os.path.join(locale_dir, entry_filename)
|
|
|
|
print("Extracting " + target_path)
|
|
|
|
with open(target_path, "wb") as target:
|
|
|
|
copied = False
|
|
|
|
|
|
|
|
# Filter lines based on grep patterns
|
|
|
|
if isinstance(entry, dict) and entry['grep_patterns']:
|
|
|
|
lines_to_write = []
|
|
|
|
|
|
|
|
for line in source:
|
|
|
|
line_str = str(line, 'utf-8')
|
|
|
|
for p in entry['grep_patterns']:
|
|
|
|
if re.search(re.compile(p), line_str):
|
|
|
|
lines_to_write.append(line)
|
|
|
|
continue
|
|
|
|
|
|
|
|
if len(lines_to_write):
|
|
|
|
# BOM is required for Firefox to read .dtd files
|
|
|
|
use_bom = entry_filename.endswith('.dtd')
|
|
|
|
|
|
|
|
target.write(
|
|
|
|
('\ufeff'.encode('utf-8') if use_bom else b'')
|
|
|
|
+ b''.join(lines_to_write)
|
|
|
|
)
|
|
|
|
copied = True
|
|
|
|
|
|
|
|
# Copy file directly
|
|
|
|
else:
|
|
|
|
shutil.copyfileobj(source, target)
|
|
|
|
copied = True
|
|
|
|
|
|
|
|
if copied:
|
|
|
|
extracted_files[entry_filename].add(locale)
|
|
|
|
|
|
|
|
print()
|
|
|
|
|
|
|
|
# Copy en-US files to any locales that didn't have localized versions
|
|
|
|
en_locale_dir = os.path.join(locales_dir, 'en-US', 'zotero', 'mozilla')
|
|
|
|
locales = set(os.listdir(locales_dir))
|
|
|
|
locales -= set(['.DS_Store'])
|
|
|
|
for entry_filename, existing_locales in extracted_files.items():
|
|
|
|
missing = locales.difference(existing_locales)
|
|
|
|
|
|
|
|
for locale in missing:
|
2023-04-24 08:24:33 +00:00
|
|
|
if locale == 'en-US':
|
|
|
|
continue
|
2023-04-23 08:37:35 +00:00
|
|
|
dest_dir = os.path.join(locales_dir, locale, 'zotero', 'mozilla')
|
|
|
|
dest_file = os.path.join(dest_dir, entry_filename)
|
|
|
|
if not os.path.exists(dest_dir):
|
|
|
|
os.mkdir(dest_dir)
|
|
|
|
source_file = os.path.join(en_locale_dir, entry_filename)
|
|
|
|
print("Copying en-US {0} to {1}".format(entry_filename, dest_file))
|
|
|
|
shutil.copyfile(source_file, dest_file)
|
|
|
|
|
|
|
|
print()
|
|
|
|
|
|
|
|
# Date format overrides
|
|
|
|
# https://github.com/zotero/zotero/pull/1156
|
|
|
|
#date_formats['fr-FR']['short'][5] = 'juin'
|
|
|
|
#date_formats['fr-FR']['short'][6] = 'juil'
|
|
|
|
#date_formats['fr-FR']['short'][11] = 'déc'
|
|
|
|
|
|
|
|
# Write dateFormats.json from the extracted data
|
|
|
|
#date_formats_path = os.path.join(schema_dir, 'dateFormats.json')
|
|
|
|
#print("Writing " + date_formats_path);
|
|
|
|
#with open(date_formats_path, 'w') as f:
|
|
|
|
# f.write(json.dumps(date_formats, indent='\t', ensure_ascii=False))
|
|
|
|
print("WARNING: dateFormat.properties is no longer processed\n")
|
|
|
|
|
|
|
|
print("Check results before committing!")
|
|
|
|
|
|
|
|
|
|
|
|
def get_entry_path(entry):
|
|
|
|
if isinstance(entry, str):
|
|
|
|
path = entry
|
|
|
|
else:
|
|
|
|
path = entry['file']
|
|
|
|
return path
|
|
|
|
|
|
|
|
|
|
|
|
def get_entry_filename(entry):
|
|
|
|
path = get_entry_path(entry)
|
|
|
|
return path.split("/")[-1]
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
|
|
|
sys.exit(main())
|