Merge branch 'txstats' into calamares

Improve automation in handling translation-lists updates.
This commit is contained in:
Adriaan de Groot 2020-07-31 12:48:57 +02:00
commit 7e60ee059c

View File

@ -10,24 +10,135 @@
import sys import sys
import argparse import argparse
def get_tx_credentials(): class TXError(Exception):
""" pass
Gets the API token out of the user's .transifexrc (this is supposed
to be secure).
"""
import configparser
import os
txconfig_name = os.path.expanduser("~/.transifexrc")
try:
with open(txconfig_name, "r") as f:
parser = configparser.ConfigParser()
parser.read_file(f)
return parser.get("https://www.transifex.com", "password")
except IOError as e:
return None
def output_langs(all_langs, label, filterfunc): class TransifexGetter(object):
"""
Get language data from Transifex.
The object does all the work in __init__, after that
the only relevant data is .languages, a dictionary
of language data.
"""
def __init__(self):
token = self.get_tx_credentials()
if token is None:
raise TXError("Could not get Transifex API token")
import requests
r = requests.get("https://api.transifex.com/organizations/calamares/projects/calamares/resources/calamares/", auth=("api", token))
if r.status_code != 200:
raise TXError("Could not get Transifex data from API")
j = r.json()
self.languages = j["stats"]
def get_tx_credentials(self):
"""
Gets the API token out of the user's .transifexrc (this is supposed
to be secure).
"""
import configparser
import os
txconfig_name = os.path.expanduser("~/.transifexrc")
try:
with open(txconfig_name, "r") as f:
parser = configparser.ConfigParser()
parser.read_file(f)
return parser.get("https://www.transifex.com", "password")
except IOError as e:
return None
class BogusGetter(object):
"""
Fake language data.
This object pretends to retrieve data, and returns fixed language lists and percentages,
for testing purposes without hitting Transifex servers all the time.
"""
def __init__(self):
self.languages = dict()
for lang, completion in ( ("sq", 100), ("ar", 44), ("as", 28), ("de", 15), ("da", 4), ("ts", 82) ):
self.languages[lang] = dict(translated=dict(stringcount=686, percentage=(completion/100.0)))
class PrintOutputter(object):
"""
Output via print-statements.
"""
def __init__(self):
pass
def print(self, s):
print(s)
def __enter__(self):
return self
def __exit__(self, e, v, tb):
pass
class EditingOutputter(object):
"""
Edit CMakeLists in-place.
"""
def __init__(self):
with open("CMakeLists.txt", "r") as f:
lines = f.readlines()
mark = None
for l in lines:
# Note that we didn't strip the lines, so need the \n here
if l.startswith("# Total ") and l.endswith(" languages\n"):
mark = lines.index(l)
break
if mark is None:
raise TXError("No CMakeLists.txt lines for TX stats found")
self.pre_lines = lines[:mark]
nextmark = mark + 1
for l in lines[mark+1:]:
if l.startswith("set( _tx_"):
nextmark += 1
continue
if l.startswith(" "):
nextmark += 1
continue
break
if nextmark > mark + 12 or nextmark > len(lines) - 4:
# Try to catch runaway nextmarks: we know there should
# be four set-lines, which are unlikely to be 3 lines each;
# similarly the CMakeLists.txt is supposed to end with
# some boilerplate.
raise TXError("Could not find end of TX settings in CMakeLists.txt")
self.post_lines = lines[nextmark:]
self.mid_lines = []
print("# Editing CMakeLists.txt in-place")
def print(self, s):
# Add the implicit \n from print()
self.mid_lines.append(s + "\n")
if s.startswith("#"):
print(s)
def __enter__(self):
return self
def __exit__(self, e, v, tb):
if e is None:
with open("CMakeLists.txt", "w") as f:
f.write("".join(self.pre_lines + self.mid_lines + self.post_lines))
print("# CMakeLists.txt updated")
def output_langs(all_langs, outputter, label, filterfunc):
""" """
Output (via print) all of the languages in @p all_langs Output (via print) all of the languages in @p all_langs
that satisfy the translation-percentage filter @p filterfunc. that satisfy the translation-percentage filter @p filterfunc.
@ -43,12 +154,13 @@ def output_langs(all_langs, label, filterfunc):
while len(out) > width - len(prefix): while len(out) > width - len(prefix):
chunk = out[:out[:width].rfind(" ")] chunk = out[:out[:width].rfind(" ")]
print("%s%s" % (prefix, chunk)) outputter.print("%s%s" % (prefix, chunk))
out = out[len(chunk)+1:] out = out[len(chunk)+1:]
prefix = " " prefix = " "
print("%s%s" % (prefix, out)) outputter.print("%s%s" % (prefix, out))
def get_tx_stats(token, verbose):
def get_tx_stats(languages, outputter, verbose):
""" """
Does an API request to Transifex with the given API @p token, getting Does an API request to Transifex with the given API @p token, getting
the translation statistics for the main body of texts. Then prints the translation statistics for the main body of texts. Then prints
@ -57,12 +169,6 @@ def get_tx_stats(token, verbose):
If @p verbose is True, prints out language stats as well. If @p verbose is True, prints out language stats as well.
""" """
import requests
r = requests.get("https://api.transifex.com/organizations/calamares/projects/calamares/resources/calamares/", auth=("api", token))
if r.status_code != 200:
return 1
suppressed_languages = ( "es_ES", ) # In Transifex, but not used suppressed_languages = ( "es_ES", ) # In Transifex, but not used
# Some languages go into the "incomplete" list by definition, # Some languages go into the "incomplete" list by definition,
# regardless of their completion status: this can have various reasons. # regardless of their completion status: this can have various reasons.
@ -75,10 +181,7 @@ def get_tx_stats(token, verbose):
) )
all_langs = [] all_langs = []
outputter.print("# Total %d languages" % len(languages))
j = r.json()
languages = j["stats"]
print("# Total %d languages" % len(languages))
for lang_name in languages: for lang_name in languages:
if lang_name in suppressed_languages: if lang_name in suppressed_languages:
continue continue
@ -92,11 +195,11 @@ def get_tx_stats(token, verbose):
if verbose: if verbose:
for s, l in sorted(all_langs, reverse=True): for s, l in sorted(all_langs, reverse=True):
print("# %16s\t%6.2f" % (l, s * 100.0)) outputter.print("# %16s\t%6.2f" % (l, s * 100.0))
output_langs(all_langs, "complete", lambda s : s == 1.0) output_langs(all_langs, outputter, "complete", lambda s : s == 1.0)
output_langs(all_langs, "good", lambda s : 1.0 > s >= 0.75) output_langs(all_langs, outputter, "good", lambda s : 1.0 > s >= 0.75)
output_langs(all_langs, "ok", lambda s : 0.75 > s >= 0.05) output_langs(all_langs, outputter, "ok", lambda s : 0.75 > s >= 0.05)
output_langs(all_langs, "incomplete", lambda s : 0.05 > s) output_langs(all_langs, outputter, "incomplete", lambda s : 0.05 > s)
return 0 return 0
@ -104,13 +207,23 @@ def get_tx_stats(token, verbose):
def main(): def main():
parser = argparse.ArgumentParser(description="Update Transifex Statistics") parser = argparse.ArgumentParser(description="Update Transifex Statistics")
parser.add_argument("--verbose", "-v", help="Show statistics", action="store_true") parser.add_argument("--verbose", "-v", help="Show statistics", action="store_true")
parser.add_argument("--bogus", "-n", help="Use bogus data (do not query Transifex)", action="store_true")
parser.add_argument("--edit", "-e", help="Edit CMakeLists.txt in-place", action="store_true")
args = parser.parse_args() args = parser.parse_args()
cred = get_tx_credentials() try:
if cred: if args.bogus:
return get_tx_stats(cred, args.verbose) getter = BogusGetter()
else: else:
print("! Could not find API token in ~/.transifexrc") getter = TransifexGetter()
return 1 if args.edit:
outputter = EditingOutputter()
else:
outputter = PrintOutputter()
with outputter:
return get_tx_stats(getter.languages, outputter, args.verbose)
except TXError as e:
print("! " + str(e))
return 1;
return 0 return 0
if __name__ == "__main__": if __name__ == "__main__":