mirror of
https://github.com/joe7575/lumberjack.git
synced 2024-11-22 15:03:45 +01:00
460 lines
17 KiB
Python
Executable File
460 lines
17 KiB
Python
Executable File
#!/usr/bin/env python3
|
|
# -*- coding: utf-8 -*-
|
|
#
|
|
# Script to generate the template file and update the translation files.
|
|
# Copy the script into the mod or modpack root folder and run it there.
|
|
#
|
|
# Copyright (C) 2019 Joachim Stolberg, 2020 FaceDeer, 2020 Louis Royer
|
|
# LGPLv2.1+
|
|
#
|
|
# See https://github.com/minetest-tools/update_translations for
|
|
# potential future updates to this script.
|
|
|
|
from __future__ import print_function
|
|
import os, fnmatch, re, shutil, errno
|
|
from sys import argv as _argv
|
|
from sys import stderr as _stderr
|
|
|
|
# Running params
|
|
params = {
    "recursive": False,         # run on all subfolders of the given paths
    "help": False,              # print the help message instead of running
    "mods": False,              # run on the locally installed mods
    "verbose": False,           # print additional progress information
    "folders": [],              # absolute paths collected by set_params_folders()
    "no-old-file": False,       # do not create *.old backup files
    "break-long-lines": False,  # surround long strings with blank lines
    "sort": False,              # sort output strings alphabetically
}
|
|
# Available CLI options
|
|
# Maps each boolean key of params to the command-line spellings that enable it
# (long form first, short form second).
options = {
    "recursive": ['--recursive', '-r'],
    "help": ['--help', '-h'],
    "mods": ['--installed-mods', '-m'],
    "verbose": ['--verbose', '-v'],
    "no-old-file": ['--no-old-file', '-O'],
    "break-long-lines": ['--break-long-lines', '-b'],
    "sort": ['--sort', '-s'],
}
|
|
|
|
# Strings longer than this many characters get an extra blank line before
# and after them in the translation files (only when the break-long-lines
# option is active), which makes their beginnings and endings easier to
# distinguish at a glance.
doublespace_threshold = 80
|
|
|
|
def set_params_folders(tab: list):
    '''Collect the folder arguments of the command line into params["folders"].

    tab is the raw argument vector. Its first entry (the tool name) is
    skipped; every remaining argument that is not one of the spellings
    listed in options is treated as a path and appended in absolute form.
    '''
    known_flags = [flag for spellings in options.values() for flag in spellings]
    for argument in tab[1:]:
        if argument not in known_flags:
            params["folders"].append(os.path.abspath(argument))
|
|
|
|
def set_params(tab: list):
    '''Switch on every boolean entry of params whose flag occurs in tab.

    An option counts as given when any of its spellings from options is
    present anywhere in the argument vector. Entries are only ever set to
    True here, never reset.
    '''
    for key, spellings in options.items():
        if any(spelling in tab for spelling in spellings):
            params[key] = True
|
|
|
|
def print_help(name):
    '''Print the usage text: a synopsis line followed by one entry per option.

    name is the program name shown in the synopsis line.
    '''
    def spellings(key):
        # All accepted spellings of one option, e.g. "--help, -h"
        return ', '.join(options[key])

    # NOTE(review): any leading whitespace inside this literal was lost when
    # the source was extracted; the lines are reproduced as found. Confirm the
    # intended indentation of the help text against the upstream script.
    usage = f'''SYNOPSIS
{name} [OPTIONS] [PATHS...]
DESCRIPTION
{spellings("help")}
prints this help message
{spellings("recursive")}
run on all subfolders of paths given
{spellings("mods")}
run on locally installed modules
{spellings("no-old-file")}
do not create *.old files
{spellings("sort")}
sort output strings alphabetically
{spellings("break-long-lines")}
add extra line breaks before and after long strings
{spellings("verbose")}
add output information
'''
    print(usage)
|
|
|
|
|
|
def main():
    '''Parse the command line and run the update on the selected folders.

    Order of precedence:
      * the help option prints the usage text and does nothing else;
      * combining the recursive and installed-mods options is rejected
        with a message;
      * the installed-mods option processes every subfolder of the user's
        ~/.minetest/mods directory;
      * otherwise the folders given on the command line are processed,
        falling back to the current directory when none was given.
    '''
    set_params(_argv)
    set_params_folders(_argv)

    if params["help"]:
        print_help(_argv[0])
        return
    if params["recursive"] and params["mods"]:
        print("Option --installed-mods is incompatible with --recursive")
        return

    # The status line is assembled from several print() calls without newline
    print("Running ", end='')
    if params["recursive"]:
        print("recursively ", end='')

    if params["mods"]:
        # "~" is only a shell convention: os.path.abspath() and os.scandir()
        # treat it as a literal directory name, so expand it explicitly.
        mods_dir = os.path.abspath(os.path.expanduser("~/.minetest/mods"))
        print(f"on all locally installed modules in {mods_dir}")
        run_all_subfolders(mods_dir)
        return

    folders = params["folders"]
    if len(folders) >= 2:
        print("on folder list:", folders)
    else:
        if not folders:
            # No path given: work on the current directory
            folders = [os.path.abspath("./")]
        print("on folder", folders[0])

    process = run_all_subfolders if params["recursive"] else update_folder
    for folder in folders:
        process(folder)
|
|
|
|
# Patterns locating translatable strings in Lua source.
#
# pattern_lua_s / pattern_lua_fs match S("...") / NS("...") and
# FS("...") / NFS("...") calls with a quoted argument. The call must be
# preceded by one of the characters in the leading character class and the
# closing quote must be followed by whitespace, a comma or ")".
# Group 2 will be the string, groups 1 and 3 will be the delimiters (" or ')
# See https://stackoverflow.com/questions/46967465/regex-match-text-in-either-single-or-double-quote
pattern_lua_s = re.compile(r'[\.=^\t,{\(\s]N?S\(\s*(["\'])((?:\\\1|(?:(?!\1)).)*)(\1)[\s,\)]', re.DOTALL)
pattern_lua_fs = re.compile(r'[\.=^\t,{\(\s]N?FS\(\s*(["\'])((?:\\\1|(?:(?!\1)).)*)(\1)[\s,\)]', re.DOTALL)
# Same calls with a Lua long-bracket argument [[...]]; group 1 is the string.
pattern_lua_bracketed_s = re.compile(r'[\.=^\t,{\(\s]N?S\(\s*\[\[(.*?)\]\][\s,\)]', re.DOTALL)
pattern_lua_bracketed_fs = re.compile(r'[\.=^\t,{\(\s]N?FS\(\s*\[\[(.*?)\]\][\s,\)]', re.DOTALL)

# Handles "concatenation" .. " of strings": matches a quote, optional
# whitespace, "..", optional whitespace and another quote.
pattern_concat = re.compile(r'["\'][\s]*\.\.[\s]*["\']', re.DOTALL)

# A "key=translation" line of a .tr file. Group 1 is the key, ending at the
# first "=" that is preceded by a character other than "@"; group 2 is the
# rest of the line.
pattern_tr = re.compile(r'(.*?[^@])=(.*)')
# A "name = value" line at the start of a mod.conf line; group 1 is the
# value up to the first space or newline.
pattern_name = re.compile(r'^name[ ]*=[ ]*([^ \n]*)')
# File names ending in ".tr"
pattern_tr_filename = re.compile(r'\.tr$')
# File names ending in ".po"; group 1 is everything before the extension
pattern_po_language_code = re.compile(r'(.*)\.po$')
|
|
|
|
#attempt to read the mod's name from the mod.conf file. Returns None on failure
|
|
def get_modname(folder):
    '''Read the mod's name from the mod.conf file inside folder.

    Returns the value of the first line matching pattern_name, or None when
    mod.conf does not exist or contains no such line.
    '''
    conf_path = os.path.join(folder, "mod.conf")
    try:
        with open(conf_path, "r", encoding='utf-8') as mod_conf:
            hits = (pattern_name.match(row) for row in mod_conf)
            # First matching line wins; None when no line matches
            return next((hit.group(1) for hit in hits if hit), None)
    except FileNotFoundError:
        return None
|
|
|
|
#If there are already .tr files in /locale, returns a list of their names
|
|
def get_existing_tr_files(folder):
    '''Return the names of the .tr files found below folder's locale/ directory.

    The whole locale/ tree is walked; the result holds bare file names
    (without directory part). A missing locale/ directory gives an empty list.
    '''
    locale_dir = os.path.join(folder, 'locale/')
    return [
        filename
        for _root, _dirs, filenames in os.walk(locale_dir)
        for filename in filenames
        if pattern_tr_filename.search(filename)
    ]
|
|
|
|
# A series of search and replaces that massage a .po file's contents into
|
|
# a .tr file's equivalent
|
|
def process_po_file(text):
    '''Convert the contents of a .po file into the equivalent .tr text.

    The conversion is a fixed sequence of regular-expression replacements
    applied one after another; later steps rely on the output of earlier
    ones, so the order of the table must not be changed.
    '''
    substitutions = (
        # obsolete ("#~") entries
        (r'#~ msgid "', ""),
        (r'"\n#~ msgstr ""\n"', "="),
        (r'"\n#~ msgstr "', "="),
        # comment lines
        (r'#.*\n', ""),
        # msgid/msgstr pairs become "key=translation"
        (r'msgid "', ""),
        (r'"\nmsgstr ""\n"', "="),
        (r'"\nmsgstr "', "="),
        # continuation lines, closing quotes and escape codes
        (r'"\n"', ""),
        (r'"\n', "\n"),
        (r'\\"', '"'),
        (r'\\n', '@n'),
        # header text
        (r'=Project-Id-Version:.*\n', ""),
        # double-spaced lines
        (r'\n\n', '\n'),
    )
    for pattern, replacement in substitutions:
        text = re.sub(pattern, replacement, text)
    return text
|
|
|
|
# Go through existing .po files and, if a .tr file for that language
|
|
# *doesn't* exist, convert it and create it.
|
|
# The .tr file that results will subsequently be reprocessed so
|
|
# any "no longer used" strings will be preserved.
|
|
# Note that "fuzzy" tags will be lost in this process.
|
|
def process_po_files(folder, modname):
    '''Create a .tr file for every .po file below folder's locale/ directory.

    For a file "<code>.po" the target is "<modname>.<code>.tr" in the same
    directory. Existing .tr files are never overwritten; the .po file is
    skipped in that case.
    '''
    locale_dir = os.path.join(folder, 'locale/')
    for root, _dirs, files in os.walk(locale_dir):
        for name in files:
            code_match = pattern_po_language_code.match(name)
            if code_match is None:
                # not a .po file
                continue

            tr_name = ".".join((modname, code_match.group(1), "tr"))
            tr_file = os.path.join(root, tr_name)
            if os.path.exists(tr_file):
                if params["verbose"]:
                    print(f"{tr_name} already exists, ignoring {name}")
                continue

            with open(os.path.join(root, name), "r", encoding='utf-8') as po_file:
                if params["verbose"]:
                    print(f"Importing translations from {name}")
                converted = process_po_file(po_file.read())
            with open(tr_file, "wt", encoding='utf-8') as tr_out:
                tr_out.write(converted)
|
|
|
|
# from https://stackoverflow.com/questions/600268/mkdir-p-functionality-in-python/600612#600612
|
|
# Creates a directory if it doesn't exist, silently does
|
|
# nothing if it already exists
|
|
def mkdir_p(path):
    '''Create the directory path, including missing parent directories.

    Does nothing when the directory already exists. An OSError is still
    raised when path exists but is not a directory, or when the directory
    cannot be created for any other reason.
    '''
    # exist_ok=True is the standard-library form of the former
    # "catch EEXIST and check isdir" idiom
    os.makedirs(path, exist_ok=True)
|
|
|
|
# Converts the template dictionary to a text to be written as a file
|
|
# dKeyStrings is a dictionary of localized string to source file sets
|
|
# dOld is a dictionary of existing translations and comments from
|
|
# the previous version of this text
|
|
def strings_to_text(dkeyStrings, dOld, mod_name, header_comments):
    '''Render the contents of a translation file as one string.

    dkeyStrings     maps each localized string to the collection of source
                    header lines it was found under
    dOld            maps strings of the previous file version to a dict
                    with optional "translation" and "comment" entries
    mod_name        name written into the "# textdomain:" line
    header_comments text placed directly after the textdomain line, or None

    Strings are grouped by their source headers. Entries of dOld that are
    no longer in dkeyStrings are kept in a trailing "not used anymore"
    section if they carry a non-empty translation or a comment.
    '''
    def needs_padding(entry):
        # Long entries are surrounded by blank lines when requested
        return params["break-long-lines"] and len(entry) > doublespace_threshold

    lines = [f"# textdomain: {mod_name}\n"]
    if header_comments is not None:
        lines.append(header_comments)

    # Group the strings by the (joined) headers of the files they occur in
    by_source = {}
    for entry, sources in dkeyStrings.items():
        source_names = list(sources)
        if params["sort"]:
            source_names.sort()
        by_source.setdefault("\n".join(source_names), []).append(entry)

    for source_header in sorted(by_source):
        entries = by_source[source_header]
        if params["sort"]:
            entries.sort()
        lines += ["", source_header, ""]
        for entry in entries:
            previous = dOld.get(entry, {})
            translation = previous.get("translation", "")
            comment = previous.get("comment")
            pad = needs_padding(entry)
            if pad and lines[-1] != "":
                lines.append("")
            if comment is not None:
                lines.append(comment)
            lines.append(f"{entry}={translation}")
            if pad:
                lines.append("")

    section_started = False
    for old_key, previous in dOld.items():
        if old_key in dkeyStrings:
            continue
        translation = previous.get("translation")
        comment = previous.get("comment")
        # only keep an unused translation if there was translated
        # text or a comment associated with it
        if translation is None or (translation == "" and not comment):
            continue
        if not section_started:
            section_started = True
            lines.append("\n\n##### not used anymore #####\n")
        pad = needs_padding(old_key)
        if pad and lines[-1] != "":
            lines.append("")
        if comment is not None:
            lines.append(comment)
        lines.append(f"{old_key}={translation}")
        if pad:
            lines.append("")

    return "\n".join(lines) + '\n'
|
|
|
|
# Writes a template.txt file
|
|
# dkeyStrings is the dictionary returned by generate_template
|
|
def write_template(templ_file, dkeyStrings, mod_name):
    '''Write the template file templ_file for the strings in dkeyStrings.

    dkeyStrings is the dictionary built by generate_template. An already
    existing template is read first so that its comments and header are
    carried over; the target directory is created when missing.
    '''
    old_entries, _old_text, old_header = import_tr_file(templ_file)
    rendered = strings_to_text(dkeyStrings, old_entries, mod_name, old_header)

    mkdir_p(os.path.dirname(templ_file))
    with open(templ_file, "wt", encoding='utf-8') as template_file:
        template_file.write(rendered)
|
|
|
|
|
|
# Gets all translatable strings from a lua file
|
|
def read_lua_file_strings(lua_file):
    '''Return all translatable strings of a Lua file in .tr key notation.

    Strings are collected in four passes over the file text (quoted S/NS
    calls, bracketed S/NS calls, quoted FS/NFS calls, bracketed FS/NFS
    calls) and returned in that order, duplicates included.
    '''
    with open(lua_file, encoding='utf-8') as text_file:
        source = text_file.read()
    #TODO remove comments here

    # Splice "concatenated" .. "literals" into one literal
    source = pattern_concat.sub("", source)

    # (pattern, number of the group holding the string)
    extractors = (
        (pattern_lua_s, 2),
        (pattern_lua_bracketed_s, 1),
        (pattern_lua_fs, 2),
        (pattern_lua_bracketed_fs, 1),
    )
    raw_strings = [
        found.group(group)
        for pattern, group in extractors
        for found in pattern.finditer(source)
    ]

    def to_tr_key(s):
        # The order of these steps matters
        s = re.sub(r'"\.\.\s+"', "", s)
        # NOTE(review): this match covers "@" plus the character after it,
        # so that character is replaced too ("a@b" becomes "a@@") - confirm
        # whether dropping it is intended.
        s = re.sub("@[^@=0-9]", "@@", s)
        s = s.replace('\\"', '"')
        s = s.replace("\\'", "'")
        s = s.replace("\n", "@n")
        s = s.replace("\\n", "@n")
        s = s.replace("=", "@=")
        return s

    return [to_tr_key(s) for s in raw_strings]
|
|
|
|
# Gets strings from an existing translation file
|
|
# returns both a dictionary of translations
|
|
# and the full original source text so that the new text
|
|
# can be compared to it for changes.
|
|
# Returns also header comments in the third return value.
|
|
def import_tr_file(tr_file):
|
|
dOut = {}
|
|
text = None
|
|
header_comment = None
|
|
if os.path.exists(tr_file):
|
|
with open(tr_file, "r", encoding='utf-8') as existing_file :
|
|
# save the full text to allow for comparison
|
|
# of the old version with the new output
|
|
text = existing_file.read()
|
|
existing_file.seek(0)
|
|
# a running record of the current comment block
|
|
# we're inside, to allow preceeding multi-line comments
|
|
# to be retained for a translation line
|
|
latest_comment_block = None
|
|
for line in existing_file.readlines():
|
|
line = line.rstrip('\n')
|
|
if line[:3] == "###":
|
|
if header_comment is None:
|
|
# Save header comments
|
|
header_comment = latest_comment_block
|
|
# Stip textdomain line
|
|
tmp_h_c = ""
|
|
for l in header_comment.split('\n'):
|
|
if not l.startswith("# textdomain:"):
|
|
tmp_h_c += l + '\n'
|
|
header_comment = tmp_h_c
|
|
|
|
# Reset comment block if we hit a header
|
|
latest_comment_block = None
|
|
continue
|
|
if line[:1] == "#":
|
|
# Save the comment we're inside
|
|
if not latest_comment_block:
|
|
latest_comment_block = line
|
|
else:
|
|
latest_comment_block = latest_comment_block + "\n" + line
|
|
continue
|
|
match = pattern_tr.match(line)
|
|
if match:
|
|
# this line is a translated line
|
|
outval = {}
|
|
outval["translation"] = match.group(2)
|
|
if latest_comment_block:
|
|
# if there was a comment, record that.
|
|
outval["comment"] = latest_comment_block
|
|
latest_comment_block = None
|
|
dOut[match.group(1)] = outval
|
|
return (dOut, text, header_comment)
|
|
|
|
# Walks all lua files in the mod folder, collects translatable strings,
|
|
# and writes it to a template.txt file
|
|
# Returns a dictionary of localized strings to source file sets
|
|
# that can be used with the strings_to_text function.
|
|
def generate_template(folder, mod_name):
    '''Collect the translatable strings of all Lua files below folder.

    When at least one string was found, locale/template.txt inside folder
    is written. Returns a dictionary mapping each string to the set of
    "### <file name> ###" headers of the files it occurs in (usable with
    strings_to_text), or None when no string was found.
    '''
    sources_by_string = {}
    for root, _dirs, files in os.walk(folder):
        for name in files:
            if not fnmatch.fnmatch(name, "*.lua"):
                continue
            lua_path = os.path.join(root, name)
            found = read_lua_file_strings(lua_path)
            if params["verbose"]:
                print(f"{lua_path}: {len(found)} translatable strings")

            source_header = f"### {os.path.basename(lua_path)} ###"
            for string in found:
                sources_by_string.setdefault(string, set()).add(source_header)

    if not sources_by_string:
        return None
    write_template(os.path.join(folder, "locale/template.txt"),
                   sources_by_string, mod_name)
    return sources_by_string
|
|
|
|
# Updates an existing .tr file, copying the old one to a ".old" file
|
|
# if any changes have happened
|
|
# dNew is the data used to generate the template, it has all the
|
|
# currently-existing localized strings
|
|
def update_tr_file(dNew, mod_name, tr_file):
    '''Regenerate the translation file tr_file from the current strings.

    dNew is the data used to generate the template; it holds all currently
    existing localized strings. When the file had contents and they differ
    from the new text, a message is printed and, unless the no-old-file
    option is set, the previous version is copied to "<tr_file>.old".
    '''
    if params["verbose"]:
        print(f"updating {tr_file}")

    dOld, textOld, header = import_tr_file(tr_file)
    textNew = strings_to_text(dNew, dOld, mod_name, header)

    changed = bool(textOld) and textOld != textNew
    if changed:
        print(f"{tr_file} has changed.")
        if not params["no-old-file"]:
            shutil.copyfile(tr_file, f"{tr_file}.old")

    # NOTE(review): the file is rewritten whether or not it changed; the
    # nesting of this statement could not be recovered from the extracted
    # source with certainty - confirm against the upstream script.
    with open(tr_file, "w", encoding='utf-8') as new_tr_file:
        new_tr_file.write(textNew)
|
|
|
|
# Updates translation files for the mod in the given folder
|
|
def update_mod(folder):
    '''Update the translation files of the mod located in folder.

    Existing .po files are converted first, then the template is
    regenerated and every existing .tr file is updated from it.

    Raises SystemExit(1) after printing an error to stderr when no mod name
    can be read from the folder's mod.conf.
    '''
    modname = get_modname(folder)
    if modname is None:
        print(f"\033[31mUnable to find modname in folder {folder}.\033[0m", file=_stderr)
        # Same effect as exit(1), without depending on the helper that the
        # site module only installs for interactive use
        raise SystemExit(1)

    process_po_files(folder, modname)
    print(f"Updating translations for {modname}")
    data = generate_template(folder, modname)
    if data is None:
        print(f"No translatable strings found in {modname}")
        return

    for tr_file in get_existing_tr_files(folder):
        update_tr_file(data, modname, os.path.join(folder, "locale/", tr_file))
|
|
|
|
# Determines if the folder being pointed to is a mod or a mod pack
|
|
# and then runs update_mod accordingly
|
|
def update_folder(folder):
    '''Run update_mod on folder, or on each of its subfolders for a mod pack.

    A folder counts as a mod pack when it contains a modpack.txt or a
    modpack.conf file. Prints "Done." when finished.
    '''
    pack_markers = ("modpack.txt", "modpack.conf")
    if any(os.path.exists(os.path.join(folder, marker)) for marker in pack_markers):
        # List the subfolders up front, before any of them is processed
        mod_dirs = [entry.path for entry in os.scandir(folder) if entry.is_dir()]
        for mod_dir in mod_dirs:
            update_mod(mod_dir + "/")
    else:
        update_mod(folder)
    print("Done.")
|
|
|
|
def run_all_subfolders(folder):
    '''Run update_folder on every direct subdirectory of folder.'''
    # List the subdirectories up front, before any of them is processed
    subdirectories = [entry.path for entry in os.scandir(folder) if entry.is_dir()]
    for subdirectory in subdirectories:
        update_folder(subdirectory + "/")
|
|
|
|
|
|
# Only act when executed as a script, so that importing this module neither
# alters sys.argv nor starts processing folders.
if __name__ == "__main__":
    # This copy of the script always sorts its output: the sort option is
    # appended to the arguments before they are parsed.
    _argv.append("--sort")
    main()
|