You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
136 lines
4.1 KiB
136 lines
4.1 KiB
"""
|
|
Yandex translator API
|
|
"""
|
|
import requests
|
|
from .constants import BASE_URLS
|
|
from .exceptions import (RequestError, ServerException, TranslationNotFound, TooManyRequests)
|
|
|
|
|
|
class YandexTranslator(object):
|
|
"""
|
|
class that wraps functions, which use the yandex translator under the hood to translate word(s)
|
|
"""
|
|
|
|
def __init__(self, api_key=None, source="en", target="de", **kwargs):
|
|
"""
|
|
@param api_key: your yandex api key
|
|
"""
|
|
if not api_key:
|
|
raise ServerException(401)
|
|
self.__base_url = BASE_URLS.get("YANDEX")
|
|
self.source = source
|
|
self.target = target
|
|
|
|
self.api_key = api_key
|
|
self.api_version = "v1.5"
|
|
self.api_endpoints = {
|
|
"langs": "getLangs",
|
|
"detect": "detect",
|
|
"translate": "translate",
|
|
}
|
|
|
|
@staticmethod
|
|
def get_supported_languages(as_dict=False, **kwargs):
|
|
""" this method is just for consistency."""
|
|
return """ this method is just for consistency. You need to create an instance of yandex and access
|
|
supported languages using the languages property or call _get_supported_languages
|
|
"""
|
|
|
|
def _get_supported_languages(self):
|
|
return set(x.split("-")[0] for x in self.dirs)
|
|
|
|
@property
|
|
def languages(self):
|
|
return self.get_supported_languages()
|
|
|
|
@property
|
|
def dirs(self, proxies=None):
|
|
|
|
try:
|
|
url = self.__base_url.format(version=self.api_version, endpoint="getLangs")
|
|
print("url: ", url)
|
|
response = requests.get(url, params={"key": self.api_key}, proxies=proxies)
|
|
except requests.exceptions.ConnectionError:
|
|
raise ServerException(503)
|
|
else:
|
|
data = response.json()
|
|
|
|
if response.status_code != 200:
|
|
raise ServerException(response.status_code)
|
|
return data.get("dirs")
|
|
|
|
def detect(self, text, proxies=None):
|
|
response = None
|
|
params = {
|
|
"text": text,
|
|
"format": "plain",
|
|
"key": self.api_key,
|
|
}
|
|
try:
|
|
url = self.__base_url.format(version=self.api_version, endpoint="detect")
|
|
response = requests.post(url, data=params, proxies=proxies)
|
|
|
|
except RequestError:
|
|
raise
|
|
except ConnectionError:
|
|
raise ServerException(503)
|
|
except ValueError:
|
|
raise ServerException(response.status_code)
|
|
else:
|
|
response = response.json()
|
|
language = response['lang']
|
|
status_code = response['code']
|
|
if status_code != 200:
|
|
raise RequestError()
|
|
elif not language:
|
|
raise ServerException(501)
|
|
return language
|
|
|
|
def translate(self, text, proxies=None, **kwargs):
|
|
params = {
|
|
"text": text,
|
|
"format": "plain",
|
|
"lang": self.target if self.source == "auto" else "{}-{}".format(self.source, self.target),
|
|
"key": self.api_key
|
|
}
|
|
try:
|
|
url = self.__base_url.format(version=self.api_version, endpoint="translate")
|
|
response = requests.post(url, data=params, proxies=proxies)
|
|
except ConnectionError:
|
|
raise ServerException(503)
|
|
else:
|
|
response = response.json()
|
|
|
|
if response['code'] == 429:
|
|
raise TooManyRequests()
|
|
|
|
if response['code'] != 200:
|
|
raise ServerException(response['code'])
|
|
|
|
if not response['text']:
|
|
raise TranslationNotFound()
|
|
|
|
return response['text']
|
|
|
|
def translate_file(self, path, **kwargs):
|
|
"""
|
|
translate from a file
|
|
@param path: path to file
|
|
@return: translated text
|
|
"""
|
|
try:
|
|
with open(path, 'r', encoding='utf-8') as f:
|
|
text = f.read()
|
|
|
|
return self.translate(text)
|
|
except Exception as e:
|
|
raise e
|
|
|
|
def translate_batch(self, batch, **kwargs):
|
|
"""
|
|
translate a batch of texts
|
|
@param batch: list of texts to translate
|
|
@return: list of translations
|
|
"""
|
|
return [self.translate(text, **kwargs) for text in batch]
|