diff options
author | Brad Payne (Vir Linden) <vir@lindenlab.com> | 2020-08-12 18:27:00 +0100 |
---|---|---|
committer | Brad Payne (Vir Linden) <vir@lindenlab.com> | 2020-08-12 18:27:00 +0100 |
commit | 1f9852f04c4c430631d10794cce4a3e8186470b5 (patch) | |
tree | dc543c7a6842e0c058e018f65fb0c3dd678cda1f /scripts/code_tools | |
parent | 59de1d58d4aa891cc19372dd6104ec65e1cf4731 (diff) |
SL-13705 - modified_strings.py added, for translation support
Diffstat (limited to 'scripts/code_tools')
-rw-r--r-- | scripts/code_tools/modified_strings.py | 158 |
1 files changed, 158 insertions, 0 deletions
diff --git a/scripts/code_tools/modified_strings.py b/scripts/code_tools/modified_strings.py new file mode 100644 index 0000000000..bb42628f55 --- /dev/null +++ b/scripts/code_tools/modified_strings.py @@ -0,0 +1,158 @@ +"""\
+
+This module contains tools for scanning the SL codebase for translation-related strings.
+
+$LicenseInfo:firstyear=2020&license=viewerlgpl$
+Second Life Viewer Source Code
+Copyright (C) 2020, Linden Research, Inc.
+
+This library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Lesser General Public
+License as published by the Free Software Foundation;
+version 2.1 of the License only.
+
+This library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Lesser General Public License for more details.
+
+You should have received a copy of the GNU Lesser General Public
+License along with this library; if not, write to the Free Software
+Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+
+Linden Research, Inc., 945 Battery Street, San Francisco, CA 94111 USA
+$/LicenseInfo$
+"""
+
+from __future__ import print_function
+
+# packages required include: gitpython, pandas
+
+import xml.etree.ElementTree as ET
+import argparse
+import os
+import sys
+from git import Repo, Git # requires the gitpython package
+import pandas as pd
+
# XML attribute names whose values are user-visible text. For every named
# element in a XUI file, each of these attributes (when present) is compared
# against the base revision to decide whether it needs (re)translation.
translate_attribs = [
    "title",
    "short_title",
    "value",
    "label",
    "label_selected",
    "tool_tip",
    "ignoretext",
    "yestext",
    "notext",
    "canceltext",
    "description",
    "longdescription",
]
+
def codify(val):
    """Return *val* as a UTF-8 encoded byte string.

    Text values are encoded as UTF-8. Byte strings are decoded as UTF-8 and
    re-encoded, so well-formed input comes back unchanged.

    Raises:
        UnicodeDecodeError: if *val* is a byte string that is not valid UTF-8.
        TypeError: if *val* is neither text nor a bytes-like value.
    """
    # ``unicode`` only exists on Python 2; on Python 3 the text type is ``str``.
    try:
        text_type = unicode
    except NameError:
        text_type = str

    if isinstance(val, text_type):
        return val.encode("utf-8")
    return text_type(val, "utf-8").encode("utf-8")
+
def failure(*msg):
    """Print the given message parts and terminate with exit status 1.

    The parts are passed straight to ``print``, so they are written to
    standard output separated by single spaces. This function never returns;
    it raises ``SystemExit`` via ``sys.exit(1)``.
    """
    print(*msg)
    sys.exit(1)
+
def _index_by_name(xml_root):
    """Map every ``name`` attribute found under *xml_root* to its element.

    The whole tree is walked, root included. If several elements share the
    same name, the one visited last is kept.
    """
    return {
        elem.attrib["name"]: elem
        for elem in xml_root.iter()
        if "name" in elem.attrib
    }


def _modified_fields(filename, mod_xml, base_xml, attribs):
    """Return spreadsheet rows for strings that are new or changed.

    Args:
        filename: path recorded in the first column of every row.
        mod_xml: root element of the modified revision of the file.
        base_xml: root element of the base revision of the file.
        attribs: attribute names whose values count as translatable text.

    Returns:
        A list of ``[filename, element name, field, new value, ""]`` rows.
        ``field`` is ``"text"`` for the element's text or the attribute name;
        the trailing empty string is the placeholder for the translation.
    """
    mod_elems = _index_by_name(mod_xml)
    base_elems = _index_by_name(base_xml)

    rows = []
    for name, mod_elem in mod_elems.items():
        # Compare against None explicitly: an Element without children is
        # falsy, so a plain truthiness test would misreport it as missing.
        base_elem = base_elems.get(name)
        is_new = base_elem is None

        if is_new or mod_elem.text != base_elem.text:
            rows.append([filename, name, "text", mod_elem.text, ""])

        for attr in attribs:
            if attr not in mod_elem.attrib:
                continue
            # Look the attribute up in ``.attrib``. Applying ``in`` to the
            # Element itself tests its child elements, which made every
            # attribute look changed. ``.get`` yields None when the base
            # element lacks the attribute, which never equals a real value.
            if is_new or mod_elem.attrib[attr] != base_elem.attrib.get(attr):
                rows.append([filename, name, attr, mod_elem.attrib[attr], ""])
    return rows


if __name__ == "__main__":

    parser = argparse.ArgumentParser(description="analyze viewer xui files")
    # NOTE: --verbose is accepted but nothing below consults it.
    parser.add_argument("--verbose", action="store_true", help="verbose flag")
    parser.add_argument("--rev", help="revision with modified strings, default HEAD", default="HEAD")
    parser.add_argument("--rev_base", help="previous revision to compare against, default master", default="master")
    parser.add_argument("--base_lang", help="base language, default en (useful only for testing)", default="en")
    parser.add_argument("--lang", help="target language, default fr", default="fr")
    args = parser.parse_args()

    if args.rev == args.rev_base:
        failure("Revs are the same, nothing to compare")

    print("Finding changes in", args.rev, "not present in", args.rev_base)

    # Resolve the repository root from the current directory so the script
    # can be started from any subdirectory of the checkout.
    rootdir = Git(os.getcwd()).rev_parse("--show-toplevel")
    repo = Repo(rootdir)

    # ``except Exception`` rather than a bare ``except`` so that Ctrl-C and
    # SystemExit are not mistaken for an invalid revision.
    try:
        mod_commit = repo.commit(args.rev)
    except Exception:
        failure(args.rev, "is not a valid commit")
    try:
        base_commit = repo.commit(args.rev_base)
    except Exception:
        failure(args.rev_base, "is not a valid commit")

    base_tree = base_commit.tree

    # Tree lookups by path raise KeyError when the path does not exist.
    try:
        mod_xui_tree = mod_commit.tree["indra/newview/skins/default/xui/{}".format(args.base_lang)]
    except KeyError:
        print("xui tree not found for language", args.base_lang)
        sys.exit(1)

    data = []
    # For all files to be checked for translations
    for mod_blob in mod_xui_tree.traverse():
        print(mod_blob.path)
        filename = mod_blob.path
        if mod_blob.type == "tree":  # directory, skip
            continue

        mod_contents = mod_blob.data_stream.read()
        try:
            base_contents = base_tree[filename].data_stream.read()
        except KeyError:
            # File is new in this revision: compare against an empty
            # document so that every string in it is reported.
            print("No matching base file found for", filename)
            base_contents = '<?xml version="1.0" encoding="utf-8" standalone="yes" ?><strings></strings>'

        mod_xml = ET.fromstring(mod_contents)
        base_xml = ET.fromstring(base_contents)
        data.extend(_modified_fields(filename, mod_xml, base_xml, translate_attribs))

    cols = ["File", "Element", "Field", "EN", "Translation ({})".format(args.lang)]
    df = pd.DataFrame(data, columns=cols)
    df.to_excel("SL_Translations_{}.xlsx".format(args.lang.upper()), index=False)
+
+ #print "all_attrib", all_attrib
+
+
+
+
|