Merge normalize and reconvert l10n scripts, keep author info, format the files properly, remove tabs from data

2024-11-19 14:38:18 +00:00 · 2019-01-06 13:42:37 +01:00 · 2019-01-06 13:42:37 +01:00 · 5090c73250
parent d215c73206
commit 5090c73250
2 changed files with 45 additions and 17 deletions
--- a/scripts/normalize_po.py
+++ b/scripts/normalize_po.py
@ -1,11 +0,0 @@
 import polib
 import sys
 if __name__ == '__main__':
 	for filename in sys.argv[1:]:
 		po = polib.pofile(open(filename).read())
 		entries = list(sorted(sorted(po, key=lambda x: x.msgctxt or ""), key=lambda x: x.msgid))
 		po.clear()
 		for entry in entries:
 			po.append(entry)
 		po.save(filename)
--- a/scripts/reconvert_l10n.py
+++ b/scripts/reconvert_l10n.py
@ -1,12 +1,16 @@
 import json
 import polib
 import json
 import sys
 JSON_KEY_TRANSL="translated strings"
 JSON_KEY_AUTHOR="authors"
 JSON_KEY_MODIFY="modified by"
 JSON_KEY_OR="or"
 JSON_KEY_TR="tr"
 JSON_KEY_CO="context"
-def reconvert(filename):
+def reconvert(filename, json_filename):
 	"""Converts a l10n file.po into a file.json, keeping author info from a previous file.json if possible"""
 	po = polib.pofile(open(filename, encoding='utf-8').read())
 	translations = []
@ -19,18 +23,53 @@ def reconvert(filename):
 				t_entry[JSON_KEY_CO] = entry.msgctxt
 			translations.append(t_entry)
-	result = {JSON_KEY_TRANSL: translations}
+	try:
 		previous_l10n = json.load(open(json_filename, encoding='utf-8'), strict=False)
 		# remove tabs from data
 		authors = previous_l10n[JSON_KEY_AUTHOR]
 		for i, value in enumerate(authors[JSON_KEY_MODIFY]):
 			authors[JSON_KEY_MODIFY][i] = value.replace("\t", "    ")
 		result = {JSON_KEY_AUTHOR: authors, JSON_KEY_TRANSL: translations}
 		print(" extracted author info from " + json_filename)
 	except IOError:
 		result = {JSON_KEY_AUTHOR: "", JSON_KEY_TRANSL: translations}
 		print(" failed to open " + json_filename + ", skipping author info")
 	json.dump(
 		result,
-		open(filename + '.json', 'w', encoding='utf-8'),
+		open(json_filename, 'w', encoding='utf-8'),
 		ensure_ascii=False,
 		indent="\t",
 		separators=(',', ': '),
 		sort_keys=True,
 	)
 def normalize(filename):
 	"""Normalizes a l10n file.po in place for better version controlling.
 	The entries are reordered by msgid, with ties broken by msgctxt (a missing
 	context counts as an empty string), and the result is saved back to
 	`filename`.
 	"""
 	# Read through a context manager so the handle is closed right away, and
 	# decode as UTF-8 explicitly (same as reconvert) instead of relying on the
 	# platform's default encoding.
 	with open(filename, encoding='utf-8') as po_file:
 		po = polib.pofile(po_file.read())
 	# A single stable sort on (msgid, msgctxt) yields the same order as sorting
 	# by msgctxt first and then by msgid.
 	entries = sorted(po, key=lambda entry: (entry.msgid, entry.msgctxt or ""))
 	# Empty the catalogue and re-add the entries in their sorted order.
 	po.clear()
 	for entry in entries:
 		po.append(entry)
 	po.save(filename)
 def decrement_indent(filename):
 	"""Strip one tab directly following each newline in the given file.
 	The file is read as UTF-8, every newline-plus-tab pair is reduced to a
 	bare newline, and the text is written back over the same file. A tab at
 	the very start of the file (not preceded by a newline) is left alone.
 	"""
 	with open(filename, encoding='utf-8') as source:
 		original_text = source.read()
 	# Splitting on "\n\t" and re-joining with "\n" drops exactly one tab per line break.
 	dedented_text = '\n'.join(original_text.split('\n\t'))
 	with open(filename, 'w', encoding='utf-8') as target:
 		target.write(dedented_text)
 if __name__ == '__main__':
-	import sys
+	"""Normalizes then converts a l10n file.po into a file.json, keeping author info from a previous file.json if possible"""
 	for filename in sys.argv[1:]:
-		reconvert(filename)
+		assert(len(filename)>len(".po"))
 		json_filename = filename[:-3]+".json"
 		normalize(filename)
 		print(filename + " -> " + filename + " (normalized)")
 		reconvert(filename, json_filename)
 		decrement_indent(json_filename)
 		print(filename + " -> " + json_filename)