123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538 |
- #!/usr/bin/env python3
- # -*- coding: utf-8 -*-
- #
- # Script to generate Minetest translation template files and update
- # translation files.
- #
- # Copyright (C) 2019 Joachim Stolberg, 2020 FaceDeer, 2020 Louis Royer,
- # 2023 Wuzzy.
- # License: LGPLv2.1 or later (see LICENSE file for details)
- import os, fnmatch, re, shutil, errno
- from sys import argv as _argv
- from sys import stderr as _stderr
# Runtime settings. Every switch starts out disabled; "folders" collects
# the absolute paths given on the command line.
params = {
    "recursive": False,
    "help": False,
    "verbose": False,
    "folders": [],
    "old-file": False,
    "break-long-lines": False,
    "print-source": False,
    "truncate-unused": False,
}

# Command-line spellings (long form, short form) accepted for each switch
# in params.
options = {
    "recursive": ["--recursive", "-r"],
    "help": ["--help", "-h"],
    "verbose": ["--verbose", "-v"],
    "old-file": ["--old-file", "-o"],
    "break-long-lines": ["--break-long-lines", "-b"],
    "print-source": ["--print-source", "-p"],
    "truncate-unused": ["--truncate-unused", "-t"],
}

# Source strings longer than this many characters get an empty line before
# and after them in the translation files (when --break-long-lines is set),
# so their beginnings and endings are easier to tell apart at a glance.
doublespace_threshold = 80

# Delimiters of the comment lines that name a source file.
# Such a comment may look like "##[ init.lua ]##".
symbol_source_prefix = "##["
symbol_source_suffix = "]##"

# Comment line that opens the section of old/unused strings.
comment_unused = "##### not used anymore #####"
def set_params_folders(tab: list):
    '''Collect the folder arguments from the command line into params["folders"].

    tab is the full argument vector. Its first element (the tool name) is
    ignored. Every remaining argument that is not one of the known option
    spellings is treated as a path and stored in absolute form.
    '''
    known_flags = {flag for spellings in options.values() for flag in spellings}
    params["folders"].extend(
        os.path.abspath(argument)
        for argument in tab[1:]
        if argument not in known_flags
    )
def set_params(tab: list):
    '''Switch on every entry of params whose option appears in tab.

    tab is the argument vector. A switch is enabled as soon as any of its
    spellings from the options table is present; switches that are not
    mentioned keep their current value.
    '''
    for key, spellings in options.items():
        if any(spelling in tab for spelling in spellings):
            params[key] = True
def print_help(name):
    '''Print the usage text (synopsis and option list) to standard output.

    name is shown as the program name in the synopsis line.
    '''
    # The option spellings are taken from the options table, so the help
    # text always lists the same flags that the argument parsing accepts.
    print(f'''SYNOPSIS
{name} [OPTIONS] [PATHS...]
DESCRIPTION
{', '.join(options["help"])}
prints this help message
{', '.join(options["recursive"])}
run on all subfolders of paths given
{', '.join(options["old-file"])}
create *.old files
{', '.join(options["break-long-lines"])}
add extra line breaks before and after long strings
{', '.join(options["print-source"])}
add comments denoting the source file
{', '.join(options["verbose"])}
add output information
{', '.join(options["truncate-unused"])}
delete unused strings from files
''')
def main():
    '''Parse the command line, then either print the help or run the update.

    Without any folder argument the current working directory is processed.
    With --recursive every given folder is handed to run_all_subfolders,
    otherwise to update_folder.
    '''
    set_params(_argv)
    set_params_folders(_argv)

    if params["help"]:
        print_help(_argv[0])
        return

    recursive = params["recursive"]
    folders = params["folders"]

    # Announce what is about to be processed; the message is assembled
    # from several print calls on a single line.
    print("Running ", end='')
    if recursive:
        print("recursively ", end='')

    if len(folders) >= 2:
        print("on folder list:", folders)
        targets = folders
    elif len(folders) == 1:
        print("on folder", folders[0])
        targets = folders
    else:
        current_dir = os.path.abspath("./")
        print("on folder", current_dir)
        targets = [current_dir]

    process = run_all_subfolders if recursive else update_folder
    for target in targets:
        process(target)
def compile_func_call_pattern(argument_pattern):
    '''Compile a regex that matches a Lua translation function call.

    argument_pattern is the regex source for the argument part of the call;
    it is appended after the function name. The result is compiled with
    re.DOTALL, so "." in argument_pattern also matches newlines.
    '''
    # Beginning of the text, or any character that cannot be part of a
    # function identifier
    boundary = r'(?:^|[\.=,{\(\s])'
    # S, FS, NS or NFS, optionally followed by whitespace
    function_name = r'N?F?S\s*'
    return re.compile(boundary + function_name + argument_pattern, re.DOTALL)
def parenthesize_pattern(pattern):
    '''Wrap a regex source so that it matches as a parenthesized call argument.

    The returned regex source expects an opening parenthesis and optional
    whitespace, then pattern, then one character that ends the argument or
    the call: whitespace, a comma or a closing parenthesis.
    '''
    opening = r'\(\s*'
    closing = r'[\s,\)]'
    return "".join((opening, pattern, closing))
# Quoted string.
# Group 1 is the opening delimiter (" or '), group 2 is the string content
# and group 3 is the closing delimiter, which must equal group 1.
# Inside the string, a backslash followed by the delimiter does not end it.
# See https://stackoverflow.com/questions/46967465/regex-match-text-in-either-single-or-double-quote
pattern_lua_quoted_string = r'(["\'])((?:\\\1|(?:(?!\1)).)*)(\1)'
# Double square bracket string (multiline).
# Group 1 is the content; the match is non-greedy, so it stops at the
# first "]]".
pattern_lua_square_bracket_string = r'\[\[(.*?)\]\]'
# Handles the " ... " or ' ... ' string delimiters
pattern_lua_quoted = compile_func_call_pattern(parenthesize_pattern(pattern_lua_quoted_string))
# Handles the [[ ... ]] string delimiters
pattern_lua_bracketed = compile_func_call_pattern(parenthesize_pattern(pattern_lua_square_bracket_string))
# Like pattern_lua_quoted, but for a single-argument call written without
# parentheses.
# See https://www.lua.org/pil/5.html for information about single-argument calls
pattern_lua_quoted_single = compile_func_call_pattern(pattern_lua_quoted_string)
# Same as pattern_lua_quoted_single, but for [[ ... ]] string delimiters
pattern_lua_bracketed_single = compile_func_call_pattern(pattern_lua_square_bracket_string)
# Matches the junction of a string concatenation, i.e. the closing quote,
# the ".." operator and the opening quote in "concatenation" .. " of strings"
pattern_concat = re.compile(r'["\'][\s]*\.\.[\s]*["\']', re.DOTALL)
# Handles a translation line in a *.tr file.
# Group 1 is the source string left of the equals sign.
# Group 2 is the translated string, right of the equals sign.
# Group 1 is greedy, so when several equals signs qualify as separator,
# the last one is used.
pattern_tr = re.compile(
    r'(.*)' # Source string
    # the separating equals sign, if NOT preceded by @, unless
    # that @ is preceded by another @
    r'(?:(?<!(?<!@)@)=)'
    r'(.*)' # Translation string
    )
# Matches a "name = value" line; group 1 is the value up to the first
# space or newline
pattern_name = re.compile(r'^name[ ]*=[ ]*([^ \n]*)')
# Matches file names ending in ".tr"
pattern_tr_filename = re.compile(r'\.tr$')
# Matches bad use of @ signs in a Lua string
pattern_bad_luastring = re.compile(
    r'^@$|' # single @, OR
    r'[^@]@$|' # trailing unescaped @, OR
    r'(?<!@)@(?=[^@1-9n])' # an @ that is not escaped or part of a placeholder
)
def get_modname(folder):
    '''Determine the name of the mod located in folder.

    The name is read from the first "name = ..." line of the mod.conf file
    in folder. If that file does not exist, or does not declare a
    (non-empty) name, the name of the folder itself is used, because
    mod.conf is not required to state a name. Previously a mod.conf without
    a name line made this function return None, which then ended up as
    "# textdomain: None" in the generated files.

    Returns the mod name as a string. Errors other than a missing mod.conf
    (e.g. an unreadable file) are propagated to the caller.
    '''
    try:
        with open(os.path.join(folder, "mod.conf"), "r", encoding='utf-8') as mod_conf:
            for line in mod_conf:
                match = pattern_name.match(line)
                # An empty value ("name =") is treated like a missing line
                if match and match.group(1):
                    return match.group(1)
    except FileNotFoundError:
        # No mod.conf at all: fall through to the folder name
        pass
    folder_name = os.path.basename(folder)
    # Special case when run in Minetest's builtin directory
    return "__builtin" if folder_name == "builtin" else folder_name
def get_existing_tr_files(folder):
    '''List the names of the .tr files found below the locale/ directory of folder.

    Only the bare file names are returned, not their paths. The result is
    an empty list if there is no locale/ directory or it has no .tr files.
    '''
    locale_dir = os.path.join(folder, 'locale/')
    return [
        name
        for _root, _dirs, files in os.walk(locale_dir)
        for name in files
        if pattern_tr_filename.search(name)
    ]
def mkdir_p(path):
    '''Create the directory path, including any missing parent directories.

    Does nothing if the directory already exists (like "mkdir -p").

    Raises OSError (FileExistsError) if path exists but is not a directory,
    and any other OSError reported while creating the directories.
    '''
    # exist_ok=True replaces the hand-written check for errno.EEXIST
    os.makedirs(path, exist_ok=True)
def strings_to_text(dkeyStrings, dOld, mod_name, header_comments, textdomain, templ = None):
    '''Convert the template dictionary to the text of a translation file.

    dkeyStrings: dictionary mapping each localized (source) string to the
        collection of source file comment lines it was found in.
    dOld: dictionary of existing entries from the previous version of this
        text. Each value is a dictionary that may hold a "translation" and
        a "comment".
    mod_name: used to build the "# textdomain:" line if textdomain is None.
    header_comments: comment text to place below the textdomain line, or
        None.
    textdomain: the full textdomain line to put at the top, or None.
    templ: optional tuple whose element 0 is a dictionary of entries (only
        their "comment" is used) and whose element 2 is header comment
        text. update_tr_file passes the tuple obtained by re-importing the
        template file here.

    Returns the file content as a single string ending with a newline.
    '''
    # if textdomain is specified, insert it at the top
    if textdomain != None:
        lOut = [textdomain] # argument is full textdomain line
    # otherwise, use mod name as textdomain automatically
    else:
        lOut = [f"# textdomain: {mod_name}"]
    if templ is not None and templ[2] and (header_comments is None or not header_comments.startswith(templ[2])):
        # header comments in the template file
        # (skipped if the file's own header already begins with them)
        lOut.append(templ[2])
    if header_comments is not None:
        lOut.append(header_comments)
    # Group the localized strings by their joined source comment lines, so
    # strings found in the same set of files end up next to each other
    dGroupedBySource = {}
    for key in dkeyStrings:
        sourceList = list(dkeyStrings[key])
        sourceString = "\n".join(sourceList)
        listForSource = dGroupedBySource.get(sourceString, [])
        listForSource.append(key)
        dGroupedBySource[sourceString] = listForSource
    # Emit the groups in sorted order of their source comment text
    lSourceKeys = list(dGroupedBySource.keys())
    lSourceKeys.sort()
    for source in lSourceKeys:
        localizedStrings = dGroupedBySource[source]
        if params["print-source"]:
            # source file comment, separated from the previous content by
            # exactly one empty line
            if lOut[-1] != "":
                lOut.append("")
            lOut.append(source)
        for localizedString in localizedStrings:
            val = dOld.get(localizedString, {})
            # strings without an existing entry get an empty translation
            translation = val.get("translation", "")
            comment = val.get("comment")
            templ_comment = None
            if templ:
                templ_val = templ[0].get(localizedString, {})
                templ_comment = templ_val.get("comment")
            # empty line before a long string, unless there already is one
            if params["break-long-lines"] and len(localizedString) > doublespace_threshold and not lOut[-1] == "":
                lOut.append("")
            # comment from the template, unless the entry's own comment
            # already begins with it
            if templ_comment != None and templ_comment != "" and (comment is None or comment == "" or not comment.startswith(templ_comment)):
                lOut.append(templ_comment)
            # the entry's own comment; a comment beginning with a
            # textdomain line is dropped
            if comment != None and comment != "" and not comment.startswith("# textdomain:"):
                lOut.append(comment)
            lOut.append(f"{localizedString}={translation}")
            # empty line after a long string
            if params["break-long-lines"] and len(localizedString) > doublespace_threshold:
                lOut.append("")
    # Entries of dOld that are no longer in dkeyStrings are kept in a
    # section at the end of the file, unless truncate-unused is set
    unusedExist = False
    if not params["truncate-unused"]:
        for key in dOld:
            if key not in dkeyStrings:
                val = dOld[key]
                translation = val.get("translation")
                comment = val.get("comment")
                # only keep an unused translation if there was translated
                # text or a comment associated with it
                if translation != None and (translation != "" or comment):
                    if not unusedExist:
                        # the section marker is written once, before the
                        # first unused entry
                        unusedExist = True
                        lOut.append("\n\n" + comment_unused + "\n")
                    if params["break-long-lines"] and len(key) > doublespace_threshold and not lOut[-1] == "":
                        lOut.append("")
                    if comment != None:
                        lOut.append(comment)
                    lOut.append(f"{key}={translation}")
                    if params["break-long-lines"] and len(key) > doublespace_threshold:
                        lOut.append("")
    return "\n".join(lOut) + '\n'
def write_template(templ_file, dkeyStrings, mod_name):
    '''Write the template file templ_file for the given strings.

    dkeyStrings is the dictionary of localized strings built by
    generate_template. An already existing template file is read first, so
    that its comments, header comments and textdomain line are carried over
    into the new text. The containing directory is created if needed.
    '''
    old_entries, _old_text, old_header, old_textdomain = import_tr_file(templ_file)
    new_text = strings_to_text(dkeyStrings, old_entries, mod_name, old_header, old_textdomain)
    mkdir_p(os.path.dirname(templ_file))
    with open(templ_file, "wt", encoding='utf-8') as out_file:
        out_file.write(new_text)
def read_lua_file_strings(lua_file):
    '''Collect all translatable strings from the Lua file lua_file.

    Returns a list of the strings in translation file notation: escaped
    quotes are unescaped, line breaks become "@n" and "=" becomes "@=".
    Strings with an invalid use of "@" are reported on standard output and
    left out. The list may contain duplicates.
    '''
    with open(lua_file, encoding='utf-8') as lua_source:
        text = lua_source.read()

    # First pass on the unmodified text: single-argument calls written
    # without parentheses
    candidates = [groups[1] for groups in pattern_lua_quoted_single.findall(text)]
    candidates.extend(pattern_lua_bracketed_single.findall(text))

    # Concatenated string literals are only merged after that first pass.
    # Second pass: calls with parentheses
    merged_text = pattern_concat.sub("", text)
    candidates.extend(groups[1] for groups in pattern_lua_quoted.findall(merged_text))
    candidates.extend(pattern_lua_bracketed.findall(merged_text))

    # Replacements applied in this order to every accepted string
    replacements = (
        ('\\"', '"'),
        ("\\'", "'"),
        ("\n", "@n"),
        ("\\n", "@n"),
        ("=", "@="),
    )
    converted = []
    for candidate in candidates:
        if pattern_bad_luastring.search(candidate):
            print("SYNTAX ERROR: Unescaped '@' in Lua string: " + candidate)
            continue
        for old, new in replacements:
            candidate = candidate.replace(old, new)
        converted.append(candidate)
    return converted
def import_tr_file(tr_file):
    '''Read the entries and comments of an existing translation file.

    Returns a tuple (dOut, text, header_comments, textdomain):
    dOut: dictionary mapping each source string to a dictionary with the
        key "translation" and, if comment lines preceded the entry, the
        key "comment" (those lines joined by newlines).
    text: the full original text of the file, so that the new text can be
        compared to it for changes; None if the file does not exist.
    header_comments: the normal comment lines at the top of the file,
        joined by newlines, or None if there are none.
    textdomain: the first "# textdomain:" line of the file, or None.
    '''
    dOut = {}
    text = None
    in_header = True
    header_comments = None
    textdomain = None
    if os.path.exists(tr_file):
        with open(tr_file, "r", encoding='utf-8') as existing_file :
            # save the full text to allow for comparison
            # of the old version with the new output
            text = existing_file.read()
            # rewind, the file is read a second time line by line
            existing_file.seek(0)
            # a running record of the current comment block
            # we're inside, to allow preceding multi-line comments
            # to be retained for a translation line
            latest_comment_block = None
            for line in existing_file.readlines():
                line = line.rstrip('\n')
                # "##### not used anymore #####" comment
                if line == comment_unused:
                    # Always delete the 'not used anymore' comment.
                    # It will be re-added to the file if necessary.
                    latest_comment_block = None
                    # The marker ends the header only if header comments
                    # were already collected
                    if header_comments != None:
                        in_header = False
                    continue
                # Comment lines
                elif line.startswith("#"):
                    # Source file comments: ##[ file.lua ]##
                    if line.startswith(symbol_source_prefix) and line.endswith(symbol_source_suffix):
                        # This line marks the end of header comments.
                        if params["print-source"]:
                            in_header = False
                        # Remove those comments; they may be added back automatically.
                        continue
                    # Store first occurrence of textdomain
                    # discard all subsequent textdomain lines
                    if line.startswith("# textdomain:"):
                        if textdomain == None:
                            textdomain = line
                        continue
                    elif in_header:
                        # Save header comments (normal comments at top of file)
                        if not header_comments:
                            header_comments = line
                        else:
                            header_comments = header_comments + "\n" + line
                    else:
                        # Save normal comments
                        # NOTE(review): textdomain lines were already handled
                        # (and skipped) above, so the first condition below
                        # looks unreachable.
                        if line.startswith("# textdomain:") and textdomain == None:
                            textdomain = line
                        elif not latest_comment_block:
                            latest_comment_block = line
                        else:
                            latest_comment_block = latest_comment_block + "\n" + line
                    continue
                # Lines that are neither comments nor translation lines
                # (e.g. empty lines) are skipped and do not reset the
                # current comment block
                match = pattern_tr.match(line)
                if match:
                    # this line is a translated line
                    outval = {}
                    outval["translation"] = match.group(2)
                    if latest_comment_block:
                        # if there was a comment, record that.
                        outval["comment"] = latest_comment_block
                    latest_comment_block = None
                    # the first translation line ends the header
                    in_header = False
                    dOut[match.group(1)] = outval
    return (dOut, text, header_comments, textdomain)
def sorted_os_walk(folder):
    '''Walk folder like os.walk, but return the files in a predictable order.

    Returns a list of (full path, file name) tuples, one per file found in
    folder and its subdirectories. Directories are visited in sorted order
    of their path; the files inside each directory are sorted by name,
    ignoring case. The list is empty if folder does not exist or contains
    no files.
    '''
    paths_and_files = []
    # Every directory path occurs only once in the walk, so sorting the
    # (root, dirs, files) tuples orders them by root
    for root, _dirs, files in sorted(os.walk(folder)):
        for filename in sorted(files, key=str.lower):
            paths_and_files.append((os.path.join(root, filename), filename))
    return paths_and_files
def generate_template(folder, mod_name):
    '''Collect the translatable strings of a mod and write its template file.

    All *.lua files below folder are scanned. The strings found are written
    to locale/template.txt inside folder.

    Returns None if no translatable string was found. Otherwise returns a
    tuple of
    - a dictionary mapping each localized string to the sorted list of
      source file comment lines (e.g. "##[ init.lua ]##") of the files it
      appears in, usable with strings_to_text, and
    - the result of re-importing the template file that was just written.
    '''
    sources_by_string = {}
    for lua_path, lua_name in sorted_os_walk(folder):
        if not fnmatch.fnmatch(lua_name, "*.lua"):
            continue
        found = read_lua_file_strings(lua_path)
        if params["verbose"]:
            print(f"{lua_path}: {str(len(found))} translatable strings")
        relative_path = os.path.relpath(lua_path, start=folder)
        for string in found:
            sources_by_string.setdefault(string, set()).add(relative_path)

    if not sources_by_string:
        return None

    # Replace each set of source files by a sorted list of comment lines.
    # A set has no defined order, which could lead to unpredictable output
    # if a source string appears in multiple files.
    for string in sources_by_string:
        source_comments = []
        for relative_path in sorted(sources_by_string[string], key=str.lower):
            portable_path = relative_path.replace("\\", "/")
            source_comments.append(f"{symbol_source_prefix} {portable_path} {symbol_source_suffix}")
        sources_by_string[string] = source_comments

    template_path = os.path.join(folder, "locale/template.txt")
    write_template(template_path, sources_by_string, mod_name)
    # re-import to get all new data
    reimported_template = import_tr_file(template_path)
    return (sources_by_string, reimported_template)
def update_tr_file(dNew, templ, mod_name, tr_file):
    '''Rewrite the translation file tr_file for the current set of strings.

    dNew is the data used to generate the template; it has all the
    currently existing localized strings. templ is the imported template
    file, whose comments are merged into the output. If the file had
    content and the new text differs from it, this is reported and, with
    the old-file option, the previous version is copied to a ".old" file
    first.
    '''
    if params["verbose"]:
        print(f"updating {tr_file}")

    old_entries, old_text, old_header, old_textdomain = import_tr_file(tr_file)
    new_text = strings_to_text(dNew, old_entries, mod_name, old_header, old_textdomain, templ)

    changed = bool(old_text) and old_text != new_text
    if changed:
        print(f"{tr_file} has changed.")
        if params["old-file"]:
            shutil.copyfile(tr_file, f"{tr_file}.old")

    # The file is written in every case, also if nothing has changed
    with open(tr_file, "w", encoding='utf-8') as out_file:
        out_file.write(new_text)
def update_mod(folder):
    '''Update the template and all translation files of the mod in folder.

    folder must be a single mod (not a modpack) and contain an init.lua.
    If init.lua is missing, a message is printed and the program is
    terminated with exit status 1 (SystemExit). If the mod has no
    translatable strings, this is reported and no translation file is
    touched.
    '''
    if not os.path.exists(os.path.join(folder, "init.lua")):
        print(f"Mod folder {folder} is missing init.lua, aborting.")
        # exit() is a helper of the site module meant for interactive use;
        # raising SystemExit has the same effect and is always available
        raise SystemExit(1)
    assert not is_modpack(folder)
    modname = get_modname(folder)
    print(f"Updating translations for {modname}")
    result = generate_template(folder, modname)
    # generate_template returns a bare None (not a tuple) if it found no
    # translatable strings, so the result must not be unpacked blindly
    (data, templ) = result if result is not None else (None, None)
    if data is None:
        print(f"No translatable strings found in {modname}")
        return
    for tr_file in get_existing_tr_files(folder):
        update_tr_file(data, templ, modname, os.path.join(folder, "locale/", tr_file))
def is_modpack(folder):
    '''Return True if folder contains a modpack.txt or a modpack.conf.'''
    marker_files = ("modpack.txt", "modpack.conf")
    return any(os.path.exists(os.path.join(folder, marker)) for marker in marker_files)
def is_game(folder):
    '''Return True if folder contains both a game.conf and a "mods" entry.'''
    required_entries = ("game.conf", "mods")
    return all(os.path.exists(os.path.join(folder, entry)) for entry in required_entries)
def update_folder(folder):
    '''Update folder according to whether it is a game, a modpack or a mod.

    For a game, all subfolders of its "mods" directory are processed; for a
    modpack, all of its subfolders; anything else is treated as a single
    mod. Prints "Done." afterwards.
    '''
    game = is_game(folder)
    if game or is_modpack(folder):
        container = os.path.join(folder, "mods") if game else folder
        run_all_subfolders(container)
    else:
        update_mod(folder)
    print("Done.")
def run_all_subfolders(folder):
    '''Run update_folder on every subdirectory of folder.

    Subdirectories whose name starts with a dot are skipped. The list of
    subdirectories is collected completely before the first one is
    processed.
    '''
    subfolders = []
    for entry in os.scandir(folder):
        if entry.is_dir() and not entry.name.startswith('.'):
            subfolders.append(entry.path)
    for subfolder in subfolders:
        update_folder(subfolder)
- main()
|