forked from xhluca/dl-translate
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgenerate_langs.py
38 lines (26 loc) · 979 Bytes
/
generate_langs.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
import json
import os
def name_to_var(lang_name):
    """Turn a language name into an upper-case, underscore-separated name.

    The input is upper-cased; spaces and hyphens become underscores, while
    parentheses and apostrophes are dropped.
    """
    # A single translation table performs all five one-character substitutions.
    substitutions = str.maketrans(
        {" ": "_", "-": "_", "(": None, ")": None, "'": None}
    )
    uppercased = lang_name.upper()
    return uppercased.translate(substitutions)
def load_json(name):
    """Load ``langs_coverage/<name>.json`` located next to this script.

    Args:
        name: Base name of the JSON file, without the ``.json`` extension.

    Returns:
        The decoded JSON document.

    Raises:
        OSError: If the file cannot be opened (e.g. it does not exist).
        json.JSONDecodeError: If the file content is not valid JSON.
    """
    filepath = os.path.join(os.path.dirname(__file__), "langs_coverage", f"{name}.json")
    # Use a context manager so the handle is closed deterministically, and
    # decode as UTF-8 explicitly so non-ASCII content does not depend on the
    # platform's locale encoding.
    with open(filepath, encoding="utf-8") as f:
        return json.load(f)
# Header line written at the top of every generated file.
auto_gen_comment = f"# Auto-generated. Do not modify, use {__file__} instead.\n"

# Maps each source name to the mapping loaded from its JSON file.
name2json = {}

# For each source, write a module with one constant per key of its mapping.
for name in ["m2m100", "mbart50", "nllb200"]:
    name2json[name] = lang2code = load_json(name)

    # Python source files are UTF-8 by default, so write them as UTF-8
    # explicitly instead of relying on the platform's locale encoding.
    # NOTE: output paths are relative to the current working directory.
    with open(f"./dl_translate/lang/{name}.py", "w", encoding="utf-8") as f:
        f.write(auto_gen_comment)
        # Only the keys are needed here; the mapped values are not used.
        for lang in lang2code:
            f.write(f'{name_to_var(lang)} = "{lang}"\n')

# Write every mapping as a tuple of (key, value) pairs into a single module.
with open("./dl_translate/_pairs.py", "w", encoding="utf-8") as f:
    f.write(auto_gen_comment)
    for name, lang2code in name2json.items():
        f.write(f"_PAIRS_{name.upper()} = {tuple(lang2code.items())}\n")