-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathtranslate.py
64 lines (56 loc) · 1.89 KB
/
translate.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
import json
import os
import requests
import spaces_interface
class Translator():
def __init__(self):
self.endpoint = 'https://babelfish.firewallcafe.com/translate'
self.target = 'zh-CN'
with open('config.json') as f:
self.secret = json.loads(f.read())['babelfish_key_id']
def translate(self, text, langFrom, langTo):
return ''
r = requests.post(self.endpoint,
data={'secret':self.secret, 'query':text, 'langFrom':langFrom, 'langTo':langTo}
)
# print(r.status_code, r.text)
try:
j = r.json()
except:
return ''
if j['ok'] > 0:
return j['translated']
else:
return ''
def to_chinese(self, text):
result = self.translate(text, 'en', 'zh-CN')
if len(result) == 0:
print(f"empty translation: {text} => {result}")
return result
def to_english(self, text):
result = self.translate(text, 'zh-CN', 'en')
if len(result) == 0:
print(f"empty translation: {text} => {result}")
return result
def machine_translate(df):
print("running machine translation on list")
translator = Translator()
count = 0
for i,row in df.iterrows():
english_term = row.english
chinese_term = row.chinese
# print(english_term, chinese_term)
if not chinese_term and not english_term:
continue
if not chinese_term:
chinese_term = translator.to_chinese(english_term)
df.at[i, 'chinese'] = chinese_term
if len(chinese_term) > 0:
count += 1
if not english_term:
english_term = translator.to_english(chinese_term)
df.at[i, 'english'] = english_term
if len(english_term) > 0:
count += 1
print("translated", count, "words")
return df