-
Notifications
You must be signed in to change notification settings - Fork 0
/
utils.py
73 lines (55 loc) · 1.79 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
import os
import json
from deep_translator import GoogleTranslator
from functools import lru_cache
from pinyin_tone_converter.pinyin_tone_converter import PinyinToneConverter
from dictionaries import *
# Cache of GoogleTranslator instances keyed by "<source>,<target>";
# populated lazily by translate().
translator = {}
# Dictionary objects queried by get_dictionary_for(); built once at import
# time. PTDict / CEDict presumably come from the star import of
# `dictionaries` -- confirm.
pt_dict = PTDict("dictionary.json")
cedict = CEDict("cedict_ts.u8")
@lru_cache()
def translate(text, source, target):
    """Translate *text* from language *source* to language *target*.

    One GoogleTranslator is created per (source, target) pair and kept in the
    module-level ``translator`` dict for reuse. Results are additionally
    memoized by ``lru_cache``, so all three arguments must be hashable.

    Args:
        text: The text to translate.
        source: Source language code (a string).
        target: Target language code (a string).

    Returns:
        Whatever ``GoogleTranslator.translate`` returns for *text*.
    """
    pair = ",".join((source, target))
    if pair not in translator:
        # First request for this language pair: build and remember the engine.
        translator[pair] = GoogleTranslator(source=source, target=target)
    engine = translator[pair]
    return engine.translate(text=text)
def normalize_dict_entry(entry):
    """Fill in the missing fields of a dictionary entry, in place.

    After the call the entry has "simplified", "english", "portuguese" and
    "pinyin" keys. "traditional" is only filled in when "simplified" was
    missing.

    Args:
        entry: Mutable mapping describing one dictionary entry. It must
            contain "pinyin", and must contain "chinese" whenever
            "simplified" is absent.

    Returns:
        None. The entry is modified in place.

    Raises:
        KeyError: If "pinyin" is missing, or if both "simplified" and
            "chinese" are missing.
    """
    if "simplified" not in entry:
        # Such entries carry a single "chinese" form; use it for both scripts.
        entry["simplified"] = entry["chinese"]
        entry["traditional"] = entry["chinese"]

    if "english" not in entry:
        entry["english"] = ""

    if "portuguese" not in entry:
        english = entry["english"]
        # An empty gloss has nothing to translate: skip the remote call
        # instead of sending an empty payload to the translation service.
        entry["portuguese"] = translate(english, "en", "pt") if english else ""

    pinyin = entry["pinyin"]
    # Tone digits mean the pinyin is still in numbered form and needs
    # converting to tone marks.
    # NOTE(review): only digits 1-4 trigger the conversion; pinyin whose only
    # tone digit is "5" is left untouched -- confirm that is intended.
    if any(digit in pinyin for digit in "1234"):
        entry["pinyin"] = PinyinToneConverter().convert_text(pinyin)
@lru_cache()
def get_dictionary_for(query, truncate=6):
    """Look up *query* in both dictionaries and return normalized entries.

    Both ``pt_dict`` and ``cedict`` are searched. Each search result is
    indexed with ``[0]`` and ``[1]``; the combined order is pt[0], en[0],
    pt[1], en[1]. (Presumably group 0 holds the better matches -- confirm
    against the dictionary classes.)

    The result is memoized by ``lru_cache``, so repeated calls with the same
    arguments return the very same list object; callers should not mutate it.

    Args:
        query: Search term; must be hashable because of ``lru_cache``.
        truncate: Size threshold above which the result list is cut.

    Returns:
        A list of entries, each passed through ``normalize_dict_entry``.
    """
    pt_entries = pt_dict.search(query)
    en_entries = cedict.search(query)

    # Build a fresh list instead of extending pt_entries[0] in place, so the
    # list handed back by pt_dict.search() is never modified.
    entries = [
        *pt_entries[0],
        *en_entries[0],
        *pt_entries[1],
        *en_entries[1],
    ]

    if len(entries) > truncate:
        # NOTE(review): this keeps truncate + 1 entries, not truncate. Kept
        # as in the original because callers may rely on the extra entry
        # (e.g. as a "more results" marker) -- confirm or drop the "+ 1".
        entries = entries[:truncate + 1]

    for entry in entries:
        normalize_dict_entry(entry)
    return entries
def verbose(f):
    """Decorator that prints every call to *f* together with its result.

    After each call a line ``<result> <function name> <args> <kwargs>`` is
    printed. If *f* raises an ``Exception``, the line is printed with ``None``
    as the result and the exception is re-raised unchanged.

    Args:
        f: The callable to wrap.

    Returns:
        A wrapper with the same call signature and metadata as *f*.
    """
    # Local import: the module only imports lru_cache from functools.
    from functools import wraps

    @wraps(f)  # keep f's __name__/__doc__ on the wrapper
    def inner(*args, **kwargs):
        try:
            ret = f(*args, **kwargs)
        except Exception:
            # Log the failed call, then let the original exception propagate
            # with its traceback intact. A bare raise also avoids testing the
            # exception's truthiness, which could swallow a falsy exception.
            print(None, f.__name__, args, kwargs)
            raise
        print(ret, f.__name__, args, kwargs)
        return ret

    return inner