Add Speech support

proguy914629bot · proguy914629bot · commit 535c391f1cda · 2021-11-11T15:31:35.000+07:00
diff --git a/openrobot/api_wrapper/__init__.py b/openrobot/api_wrapper/__init__.py
@@ -3,7 +3,8 @@
 from .error import *
 from .results import *
 from .translate import *
+from .speech import *
 
-from . import _async, _sync, translate, results, error
+from . import _async, _sync, translate, results, error, speech
 
 __version__ = '0.2.1.1'
diff --git a/openrobot/api_wrapper/_async.py b/openrobot/api_wrapper/_async.py
@@ -7,6 +7,7 @@
 from .error import *
 from .results import *
 from .translate import Translate
+from .speech import Speech
 
 try:
     from urllib.parse import quote_plus as quote
@@ -249,11 +250,16 @@ async def ocr(self, source: typing.Union[str, io.BytesIO]) -> OCRResult:
 
             js = await self._request('POST', '/api/ocr', data=data)
         else:
-            raise OpenRobotAPIError('source is not a string nor a io.BytesIO.')
+            raise OpenRobotAPIError('source must be a URL or BytesIO.')
 
         return OCRResult(js)
 
     @property
     def translate(self) -> Translate:
         """:class:`Translate`: The Translate client."""
-        return Translate(self, True)
+        return Translate(self, True)
+
+    @property
+    def speech(self) -> Speech:
+        """:class:`Speech`: The Speech client bound to this client (constructed with ``is_async=True``)."""
+        return Speech(self, True)
diff --git a/openrobot/api_wrapper/_sync.py b/openrobot/api_wrapper/_sync.py
@@ -6,6 +6,7 @@
 from .error import *
 from .results import *
 from .translate import Translate
+from .speech import Speech
 
 try:
     from urllib.parse import quote_plus as quote
@@ -178,7 +179,7 @@ def celebrity(self, url: str) -> typing.List[CelebrityResult]:
         js = self._request('GET', '/api/celebrity', params={'url': url})
         return [CelebrityResult(data) for data in js]
 
-    def ocr(self, *, url: str = None, fp: io.BytesIO = None) -> OCRResult:
+    def ocr(self, source: typing.Union[str, io.BytesIO]) -> OCRResult:
         """
         Reads text from a image.
 
@@ -202,19 +203,21 @@ def ocr(self, *, url: str = None, fp: io.BytesIO = None) -> OCRResult:
             The OCR/Text found.
         """
 
-        if not url and not fp:
-            raise OpenRobotAPIError('url and fp kwargs cannot be empty.')
-        elif url and fp:
-            raise OpenRobotAPIError('url and fp cannot be both not enpty.')
-
-        if url:
-            js = self._request('POST', '/api/ocr', params={'url': url})
+        if isinstance(source, str):
+            js = self._request('POST', '/api/ocr', params={'url': source})
+        elif isinstance(source, io.BytesIO):
+            js = self._request('POST', '/api/ocr', files={'upload_file': getattr(source, 'getvalue', lambda: source)()})
         else:
-            js = self._request('POST', '/api/ocr', files={'upload_file': getattr(fp, 'getvalue', lambda: fp)()})
+            raise OpenRobotAPIError('source must be a URL or BytesIO.')
 
         return OCRResult(js)
 
     @property
     def translate(self):
         """:class:`Translate`: The Translate client."""
-        return Translate(self, False)
+        return Translate(self, False)
+
+    @property
+    def speech(self) -> Speech:
+        """:class:`Speech`: The Speech client bound to this client (constructed with ``is_async=False``)."""
+        return Speech(self, False)
diff --git a/openrobot/api_wrapper/results.py b/openrobot/api_wrapper/results.py
@@ -275,6 +275,96 @@ def __init__(self, js):
         self.gender: typing.Optional[str] = js['Gender'] # TODO: Maybe make this an enum e.g Gender.female or Gender.male
         self.face: CelebrityFaceProperty = CelebrityFaceProperty(js['Face'])
 
+class SpeechToTextResult(OpenRobotAPIBaseResult):
+    """
+    Parsed response of the /api/speech/speech-to-text endpoint.
+
+    Attributes
+    ----------
+    text: :class:`str`
+        The transcript recognized from the speech (payload key ``text``).
+    duration: Union[:class:`int`, :class:`float`]
+        The time, in seconds, taken to recognize the speech (payload key ``duration``).
+    """
+
+    def __init__(self, js):
+        super().__init__(js)
+
+        transcript, elapsed = js['text'], js['duration']
+        self.text: str = transcript
+        self.duration: typing.Union[int, float] = elapsed
+
+class TextToSpeechResult(OpenRobotAPIBaseResult):
+    """
+    Parsed response of the /api/speech/text-to-speech endpoint.
+
+    Attributes
+    ----------
+    url: :class:`str`
+        The URL of the generated speech (payload key ``url``).
+    """
+
+    def __init__(self, js):
+        super().__init__(js)
+        speech_url = js['url']
+        self.url: str = speech_url
+
+class TextToSpeechSupportLanguage:
+    """
+    A language supported by Text To Speech.
+
+    Attributes
+    ----------
+    code: Optional[:class:`str`]
+        The language code, or ``None`` when the payload has no ``code`` key.
+    name: Optional[:class:`str`]
+        The human-readable language name, or ``None`` when the payload has no ``name`` key.
+    """
+
+    def __init__(self, js):
+        self.code: typing.Optional[str] = js.get('code')
+        self.name: typing.Optional[str] = js.get('name')
+
+class TextToSpeechSupportVoice:
+    """
+    A voice supported by Text To Speech.
+
+    Attributes
+    ----------
+    gender: Optional[:class:`str`]
+        The voice's gender (payload key ``Gender``); ``None`` when absent.
+    id: Optional[:class:`str`]
+        The Voice ID (payload key ``Id``); ``None`` when absent.
+    language: :class:`TextToSpeechSupportLanguage`
+        The language of the voice, built from the ``LanguageCode`` and ``LanguageName`` keys.
+    name: Optional[:class:`str`]
+        The Voice's name (payload key ``Name``); ``None`` when absent.
+    """
+
+    def __init__(self, js):
+        self.gender: typing.Optional[str] = js.get('Gender')
+        self.id: typing.Optional[str] = js.get('Id')
+        self.language: TextToSpeechSupportLanguage = TextToSpeechSupportLanguage({'code': js.get('LanguageCode'), 'name': js.get('LanguageName')})
+        self.name: typing.Optional[str] = js.get('Name')
+
+class TextToSpeechSupportResult(OpenRobotAPIBaseResult):
+    """
+    Parsed response of the /api/speech/text-to-speech/supports endpoint.
+
+    Attributes
+    ----------
+    languages: List[:class:`TextToSpeechSupportLanguage`]
+        One entry per item of the payload's ``languages`` list.
+    voices: List[:class:`TextToSpeechSupportVoice`]
+        One entry per item of the payload's ``voices`` list.
+    """
+
+    def __init__(self, js):
+        super().__init__(js)
+
+        self.languages: typing.List[TextToSpeechSupportLanguage] = list(map(TextToSpeechSupportLanguage, js['languages']))
+        self.voices: typing.List[TextToSpeechSupportVoice] = list(map(TextToSpeechSupportVoice, js['voices']))
+
 class OCRResult(OpenRobotAPIBaseResult):
     """
     The result of /api/ocr endpoint.
diff --git a/openrobot/api_wrapper/speech.py b/openrobot/api_wrapper/speech.py
@@ -0,0 +1,194 @@
+import typing
+import io
+import aiohttp
+from .results import SpeechToTextResult, TextToSpeechResult, TextToSpeechSupportResult
+from .error import OpenRobotAPIError
+
+class Speech:
+    """
+    The speech client. Wraps the speech-to-text and text-to-speech endpoints via the owning client's ``_request``.
+    """
+
+    def __init__(self, client, is_async: bool):
+        self._client = client
+        # True: methods return coroutines to be awaited; False: they run synchronously.
+        self._is_async = is_async
+
+    def speech_to_text(self, source: typing.Union[str, io.BytesIO], language_code: str) -> typing.Union[typing.Coroutine[None, None, SpeechToTextResult], SpeechToTextResult]:
+        """|maybecoro|
+
+        Speech to text.
+
+        This function is a coroutine if the client is an
+        :class:`AsyncClient` object, else it would be a synchronous method.
+
+        Parameters
+        ----------
+        source: Union[:class:`str`, :class:`io.BytesIO`]
+            The source of the speech. This can be either a URL or a
+            :class:`io.BytesIO` object.
+        language_code: :class:`str`
+            The language code of the speech. It is sent to the API as
+            the ``language_code`` query parameter.
+
+        Raises
+        ------
+        :exc:`OpenRobotAPIError`
+            ``source`` is neither a URL string nor a BytesIO (raised on await for async clients).
+        :exc:`Forbidden`
+            API Returned a 403 HTTP Status Code.
+        :exc:`BadRequest`
+            API Returned a 400 HTTP Status Code.
+        :exc:`InternalServerError`
+            API Returned a 500 HTTP Status Code.
+
+        Returns
+        -------
+        Union[Coroutine[None, None, :class:`SpeechToTextResult`], :class:`SpeechToTextResult`]
+            The result of the speech to text.
+        """
+
+        endpoint = '/api/speech/speech-to-text'
+        # Previously accepted but never sent; key mirrors text_to_speech (TODO confirm against the API docs).
+        params = {'language_code': language_code}
+
+        if self._is_async:
+            async def _speech_to_text() -> SpeechToTextResult:
+                if isinstance(source, str):
+                    js = await self._client._request('POST', endpoint, params={'url': source, **params})
+                elif isinstance(source, io.BytesIO):
+                    data = aiohttp.FormData()
+                    data.add_field('file', source)
+
+                    js = await self._client._request('POST', endpoint, params=params, data=data)
+                else:
+                    raise OpenRobotAPIError('source must be a URL or BytesIO.')
+
+                return SpeechToTextResult(js)
+
+            return _speech_to_text()
+        else:
+            if isinstance(source, str):
+                js = self._client._request('POST', endpoint, params={'url': source, **params})
+            elif isinstance(source, io.BytesIO):
+                js = self._client._request('POST', endpoint, params=params, files={'upload_file': source.getvalue()})
+            else:
+                raise OpenRobotAPIError('source must be a URL or BytesIO.')
+
+            return SpeechToTextResult(js)
+
+    def speech_to_text_support(self) -> typing.Union[typing.Coroutine[None, None, typing.Dict[str, typing.Any]], typing.Dict[str, typing.Any]]:
+        """|maybecoro|
+
+        Returns the supported details for Speech To Text.
+
+        This function is a coroutine if the client is an
+        :class:`AsyncClient` object, else it would be a synchronous method.
+
+        Raises
+        ------
+        :exc:`Forbidden`
+            API Returned a 403 HTTP Status Code.
+        :exc:`BadRequest`
+            API Returned a 400 HTTP Status Code.
+        :exc:`InternalServerError`
+            API Returned a 500 HTTP Status Code.
+
+        Returns
+        -------
+        Union[Coroutine[None, None, typing.Dict[:class:`str`, :class:`typing.Any`]], typing.Dict[:class:`str`, :class:`typing.Any`]]
+            The supported details for Speech To Text, as the raw decoded response.
+        """
+
+        if self._is_async:
+            async def _speech_to_text_support() -> typing.Dict[str, typing.Any]:
+                js = await self._client._request('GET', '/api/speech/speech-to-text/supports')
+
+                return js
+
+            return _speech_to_text_support()
+        else:
+            js = self._client._request('GET', '/api/speech/speech-to-text/supports')
+
+            return js
+
+    def text_to_speech(self, text: str, language_code: str, voice_id: str, *, engine: str = 'standard') -> typing.Union[typing.Coroutine[None, None, TextToSpeechResult], TextToSpeechResult]:
+        """|maybecoro|
+
+        Text to speech.
+
+        This function is a coroutine if the client is an
+        :class:`AsyncClient` object, else it would be a synchronous method.
+
+        Parameters
+        ----------
+        text: :class:`str`
+            The text to be spoken.
+        language_code: :class:`str`
+            The language code of the speech.
+        voice_id: :class:`str`
+            The voice id of the speech.
+        engine: :class:`str`
+            The engine of the speech. Keyword-only; defaults to ``'standard'``.
+
+        Raises
+        ------
+        :exc:`Forbidden`
+            API Returned a 403 HTTP Status Code.
+        :exc:`BadRequest`
+            API Returned a 400 HTTP Status Code.
+        :exc:`InternalServerError`
+            API Returned a 500 HTTP Status Code.
+
+        Returns
+        -------
+        Union[Coroutine[None, None, :class:`TextToSpeechResult`], :class:`TextToSpeechResult`]
+            The result of the text to speech.
+        """
+
+        params = {'text': text, 'language_code': language_code, 'voice_id': voice_id, 'engine': engine}
+        if self._is_async:
+            async def _text_to_speech() -> TextToSpeechResult:
+                js = await self._client._request('GET', '/api/speech/text-to-speech', params=params)
+                return TextToSpeechResult(js)
+
+            return _text_to_speech()
+        else:
+            js = self._client._request('GET', '/api/speech/text-to-speech', params=params)
+
+            return TextToSpeechResult(js)
+
+    def text_to_speech_support(self) -> typing.Union[typing.Coroutine[None, None, TextToSpeechSupportResult], TextToSpeechSupportResult]:
+        """|maybecoro|
+
+        Returns the supported details for Text To Speech.
+
+        This function is a coroutine if the client is an
+        :class:`AsyncClient` object, else it would be a synchronous method.
+
+        Raises
+        ------
+        :exc:`Forbidden`
+            API Returned a 403 HTTP Status Code.
+        :exc:`BadRequest`
+            API Returned a 400 HTTP Status Code.
+        :exc:`InternalServerError`
+            API Returned a 500 HTTP Status Code.
+
+        Returns
+        -------
+        Union[Coroutine[None, None, :class:`TextToSpeechSupportResult`], :class:`TextToSpeechSupportResult`]
+            The supported details for Text To Speech.
+        """
+
+        if self._is_async:
+            async def _text_to_speech_support() -> TextToSpeechSupportResult:
+                js = await self._client._request('GET', '/api/speech/text-to-speech/supports')
+
+                return TextToSpeechSupportResult(js)
+
+            return _text_to_speech_support()
+        else:
+            js = self._client._request('GET', '/api/speech/text-to-speech/supports')
+
+            return TextToSpeechSupportResult(js)
diff --git a/openrobot/api_wrapper/translate.py b/openrobot/api_wrapper/translate.py
diff --git a/pyproject.toml b/pyproject.toml