File size: 3,657 Bytes
f36740b fa90b1d 7a05cd7 58568a7 7a05cd7 2bbc526 7a05cd7 78d0ff1 7a05cd7 78d0ff1 7a05cd7 78d0ff1 3aa1058 58568a7 542d2c5 7ade3be cb15d3a 7ade3be 58568a7 53e803f 78d0ff1 58568a7 7ade3be f36740b 76aa3b2 70f6ed6 78d0ff1 a1d12d2 53e803f f36740b f5c8ab8 3aa1058 f36740b 78d0ff1 906c957 73894d1 f36740b 9a69a65 82f3d24 58568a7 82f3d24 9a69a65 906c957 78d0ff1 906c957 82f3d24 cb15d3a 82f3d24 58568a7 8850921 9a69a65 7ade3be f36740b 9a69a65 55109ff 9a69a65 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 |
"""
pons translator API
"""
__copyright__ = "Copyright (C) 2020 Nidhal Baccouri"
from typing import List, Optional, Union
import requests
from bs4 import BeautifulSoup
from requests.utils import requote_uri
from deep_translator.base import BaseTranslator
from deep_translator.constants import BASE_URLS, PONS_CODES_TO_LANGUAGES
from deep_translator.exceptions import (
ElementNotFoundInGetRequest,
NotValidPayload,
RequestError,
TooManyRequests,
TranslationNotFound,
)
from deep_translator.validate import is_empty, is_input_valid, request_failed
class PonsTranslator(BaseTranslator):
"""
class that uses PONS translator to translate words
"""
def __init__(
self,
source: str,
target: str = "en",
proxies: Optional[dict] = None,
**kwargs,
):
"""
@param source: source language to translate from
@param target: target language to translate to
"""
self.proxies = proxies
super().__init__(
base_url=BASE_URLS.get("PONS"),
languages=PONS_CODES_TO_LANGUAGES,
source=source,
target=target,
payload_key=None,
element_tag="div",
element_query={"class": "target"},
**kwargs,
)
def translate(
self, word: str, return_all: bool = False, **kwargs
) -> Union[str, List[str]]:
"""
function that uses PONS to translate a word
@param word: word to translate
@type word: str
@param return_all: set to True to return all synonym of the translated word
@type return_all: bool
@return: str: translated word
"""
if is_input_valid(word, max_chars=50):
if self._same_source_target() or is_empty(word):
return word
url = f"{self._base_url}{self._source}-{self._target}/{word}"
url = requote_uri(url)
response = requests.get(url, proxies=self.proxies)
if response.status_code == 429:
raise TooManyRequests()
if request_failed(status_code=response.status_code):
raise RequestError()
soup = BeautifulSoup(response.text, "html.parser")
elements = soup.find("div", {"class": "result_list"}).findAll(
self._element_tag, self._element_query
)
response.close()
if not elements:
raise ElementNotFoundInGetRequest(word)
filtered_elements = []
for el in elements:
temp = []
for e in el.findAll("a"):
temp.append(e.get_text())
filtered_elements.append(" ".join(temp))
if not filtered_elements:
raise ElementNotFoundInGetRequest(word)
word_list = [
word for word in filtered_elements if word and len(word) > 1
]
if not word_list:
raise TranslationNotFound(word)
return word_list if return_all else word_list[0]
def translate_words(self, words: List[str], **kwargs) -> List[str]:
"""
translate a batch of words together by providing them in a list
@param words: list of words you want to translate
@param kwargs: additional args
@return: list of translated words
"""
if not words:
raise NotValidPayload(words)
translated_words = []
for word in words:
translated_words.append(self.translate(word=word, **kwargs))
return translated_words
|