# Baidu Translate's API now charges a fee, so we use an open-source model to translate English instead.
from transformers import pipeline, AutoModelWithLMHead, AutoTokenizer
from tqdm import tqdm
import paramiko
from concurrent.futures import ThreadPoolExecutor
def get_en_to_zh_model():
    """Build the English-to-Chinese translation pipeline.

    Loads the ``Helsinki-NLP/opus-mt-en-zh`` checkpoint together with its
    tokenizer and wraps both in a ``translation_en_to_zh`` pipeline.

    Returns:
        The pipeline object created by ``transformers.pipeline``. It is
        called with a text and returns a list of dicts carrying a
        ``'translation_text'`` entry.
    """
    # Function-scope import: the file's top-level import list does not
    # include this class. ``AutoModelWithLMHead`` is deprecated; for
    # encoder-decoder checkpoints such as this Marian model the documented
    # replacement is ``AutoModelForSeq2SeqLM``.
    from transformers import AutoModelForSeq2SeqLM

    # Single source of truth so model and tokenizer cannot drift apart.
    checkpoint = "Helsinki-NLP/opus-mt-en-zh"
    model = AutoModelForSeq2SeqLM.from_pretrained(checkpoint)
    tokenizer = AutoTokenizer.from_pretrained(checkpoint)
    return pipeline("translation_en_to_zh", model=model, tokenizer=tokenizer)
def en_to_ch(text):
    """Translate English ``text`` into Chinese.

    Calls the module-level ``translation`` callable (presumably the pipeline
    returned by ``get_en_to_zh_model`` -- confirm where it is assigned) with
    ``max_length=1024`` and returns the ``'translation_text'`` field of the
    first result.

    Example input: ``"Student accommodation centres, resorts"``.
    """
    results = translation(text, max_length=1024)
    first_result = results[0]
    return first_result['translation_text']
def ch_to_en():
# 中文翻译成英文
model = AutoModelWithLMHead.from_pretrained("Helsinki-NLP/opus-mt-zh-en")
tokenizer = AutoTokenizer.from_pretrained("Helsinki-NLP/opus-mt-zh-en")
translation = pi