deepgram.clients.speak.client

View Source

 1# Copyright 2024 Deepgram SDK contributors. All Rights Reserved.
 2# Use of this source code is governed by a MIT license that can be found in the LICENSE file.
 3# SPDX-License-Identifier: MIT
 4
 5# rest
 6from .v1 import (
 7    #### top level
 8    SpeakOptions as SpeakOptionsLatest,
 9    SpeakRESTOptions as SpeakRESTOptionsLatest,
10    # common
11    TextSource as TextSourceLatest,
12    BufferSource as BufferSourceLatest,
13    StreamSource as StreamSourceLatest,
14    FileSource as FileSourceLatest,
15    # unique
16    SpeakSource as SpeakSourceLatest,
17    SpeakRestSource as SpeakRestSourceLatest,
18    SpeakRESTSource as SpeakRESTSourceLatest,
19)
20
21from .v1 import (
22    SpeakRESTClient as SpeakRESTClientLatest,
23    AsyncSpeakRESTClient as AsyncSpeakRESTClientLatest,
24)
25
26from .v1 import (
27    SpeakRESTResponse as SpeakRESTResponseLatest,
28)
29
30# websocket
31from .v1 import (
32    SpeakWebSocketClient as SpeakWebSocketClientLatest,
33    AsyncSpeakWebSocketClient as AsyncSpeakWebSocketClientLatest,
34    SpeakWSClient as SpeakWSClientLatest,
35    AsyncSpeakWSClient as AsyncSpeakWSClientLatest,
36)
37
38from .v1 import (
39    SpeakWSOptions as SpeakWSOptionsLatest,
40)
41from .v1 import (
42    OpenResponse as OpenResponseLatest,
43    SpeakWSMetadataResponse as SpeakWSMetadataResponseLatest,
44    FlushedResponse as FlushedResponseLatest,
45    ClearedResponse as ClearedResponseLatest,
46    CloseResponse as CloseResponseLatest,
47    UnhandledResponse as UnhandledResponseLatest,
48    WarningResponse as WarningResponseLatest,
49    ErrorResponse as ErrorResponseLatest,
50)
51
52# This client.py re-exports the current supported version (v1) under version-free names.
53# Older versions are supported in the SDK for backwards compatibility.
54
55# rest
56# input: request options and source types
57SpeakOptions = SpeakOptionsLatest  # same class as SpeakRESTOptions
58SpeakRESTOptions = SpeakRESTOptionsLatest
59TextSource = TextSourceLatest
60BufferSource = BufferSourceLatest
61StreamSource = StreamSourceLatest
62FileSource = FileSourceLatest
63SpeakSource = SpeakSourceLatest
64SpeakRestSource = SpeakRestSourceLatest
65SpeakRESTSource = SpeakRESTSourceLatest  # pylint: disable=invalid-name
66
67# output: response type returned by the REST client
68SpeakRESTResponse = SpeakRESTResponseLatest
69
70# websocket
71# input: connection options
72SpeakWSOptions = SpeakWSOptionsLatest
73
74# output: message types received over the websocket
75OpenResponse = OpenResponseLatest
76SpeakWSMetadataResponse = SpeakWSMetadataResponseLatest
77FlushedResponse = FlushedResponseLatest
78ClearedResponse = ClearedResponseLatest
79CloseResponse = CloseResponseLatest
80UnhandledResponse = UnhandledResponseLatest
81WarningResponse = WarningResponseLatest
82ErrorResponse = ErrorResponseLatest
83
84
85# backward compatibility: legacy names aliasing the REST response and REST client
86SpeakResponse = SpeakRESTResponseLatest
87SpeakClient = SpeakRESTClientLatest
88
89# clients: sync/async REST and WebSocket (both the WS and WebSocket spellings are exported)
90SpeakRESTClient = SpeakRESTClientLatest
91AsyncSpeakRESTClient = AsyncSpeakRESTClientLatest
92SpeakWSClient = SpeakWSClientLatest
93AsyncSpeakWSClient = AsyncSpeakWSClientLatest
94SpeakWebSocketClient = SpeakWebSocketClientLatest
95AsyncSpeakWebSocketClient = AsyncSpeakWebSocketClientLatest

SpeakOptions = <class 'SpeakRESTOptions'>

@dataclass

class SpeakRESTOptions(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

@dataclass
class SpeakRESTOptions(BaseResponse):
    """
    Options for a Speak (text-to-speech) REST request.

    Every field carries an ``exclude`` metadata predicate that fires when the
    field's value is None, so only explicitly set options (plus the default
    ``model``) are candidates for serialization.

    Reference:
    https://developers.deepgram.com/reference/text-to-speech-api
    """

    # Voice model; the only option with a non-None default.
    model: Optional[str] = field(
        default="aura-asteria-en",
        metadata=dataclass_config(exclude=lambda f: f is None),
    )
    encoding: Optional[str] = field(
        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
    )
    container: Optional[str] = field(
        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
    )
    sample_rate: Optional[int] = field(
        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
    )
    bit_rate: Optional[int] = field(
        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
    )

    def check(self):
        """
        Check the options for any missing or invalid values.

        No validation rules are defined at the moment, so the check always
        succeeds.

        Returns:
            bool: Always True.
        """
        # Nothing is validated and nothing is reported, so no logger is
        # created here; add one together with the first real rule.
        return True

Contains all the options for a Speak (text-to-speech) REST request.

Reference: https://developers.deepgram.com/reference/text-to-speech-api

SpeakRESTOptions( model: Optional[str] = 'aura-asteria-en', encoding: Optional[str] = None, container: Optional[str] = None, sample_rate: Optional[int] = None, bit_rate: Optional[int] = None)

model: Optional[str] = 'aura-asteria-en'

encoding: Optional[str] = None

container: Optional[str] = None

sample_rate: Optional[int] = None

bit_rate: Optional[int] = None

def check(self): View Source

43    def check(self):
44        """
45        Check the SpeakOptions for any missing or invalid values.
46        """
47        logger = verboselogs.VerboseLogger(__name__)
48        logger.addHandler(logging.StreamHandler())
49        prev = logger.level
50        logger.setLevel(verboselogs.ERROR)
51
52        # no op at the moment
53
54        logger.setLevel(prev)
55
56        return True

Check the SpeakOptions for any missing or invalid values.

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

class TextSource(typing_extensions.TypedDict): View Source

53class TextSource(TypedDict):
54    """
55    Represents a data source for reading text data from a text-like source.
56
57    This class is used to specify a source of text data that can be read from.
58
59    Attributes:
60        text (str): The text to read.
61    """
62
63    text: str

Represents a data source for reading text data from a text-like source.

This class is used to specify a source of text data that can be read from.

Attributes: text (str): A string for reading text data.

text: str

class BufferSource(typing_extensions.TypedDict): View Source

39class BufferSource(TypedDict):
40    """
41    Represents a data source for handling raw binary data.
42
43    This class is used to specify raw binary data, such as audio data in its
44    binary form, which can be captured from a microphone or generated synthetically.
45
46    Attributes:
47        buffer (bytes): The raw binary data, supplied as a bytes object.
48    """
49
50    buffer: bytes

Represents a data source for handling raw binary data.

This class is used to specify raw binary data, such as audio data in its binary form, which can be captured from a microphone or generated synthetically.

Attributes: buffer (bytes): The binary data.

buffer: bytes

class StreamSource(typing_extensions.TypedDict): View Source

11class StreamSource(TypedDict):
12    """
13    Represents a data source for reading binary data from a stream-like source.
14
15    This class is used to specify a source of binary data that can be read from
16    a stream, such as an audio file in .wav format opened for binary reading.
17
18    Attributes:
19        stream (BufferedReader): A BufferedReader object for reading binary data.
20    """
21
22    stream: BufferedReader

Represents a data source for reading binary data from a stream-like source.

This class is used to specify a source of binary data that can be read from a stream, such as an audio file in .wav format.

Attributes: stream (BufferedReader): A BufferedReader object for reading binary data.

stream: _io.BufferedReader

FileSource = typing.Union[TextSource, BufferSource, StreamSource]

SpeakSource = typing.Union[TextSource, BufferSource, StreamSource, _io.BufferedReader]

SpeakRestSource = typing.Union[TextSource, BufferSource, StreamSource, _io.BufferedReader]

SpeakRESTSource = typing.Union[TextSource, BufferSource, StreamSource, _io.BufferedReader]

@dataclass

class SpeakRESTResponse(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

20@dataclass
21class SpeakRESTResponse(BaseResponse):  # pylint: disable=too-many-instance-attributes
22    """
23    Represents a response from the speak endpoint: response metadata plus the in-memory body stream.
24    """
25
26    content_type: str = ""
27    request_id: str = ""
28    model_uuid: str = ""
29    model_name: str = ""
30    characters: int = 0
31    transfer_encoding: str = ""
32    date: str = ""
33    filename: Optional[str] = field(  # None by default; SpeakRESTClient.save() sets it to the path written
34        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
35    )
36    # pylint: disable=W0511
37    # TODO: stream will be deprecated in a future release. Please use stream_memory instead.
38    stream: Optional[io.BytesIO] = field(
39        default=None,
40        metadata=dataclass_config(exclude=lambda f: True),  # predicate is always True: presumably never serialized
41    )
42    # pylint: enable=W0511
43    stream_memory: Optional[io.BytesIO] = field(
44        default=None,
45        metadata=dataclass_config(exclude=lambda f: True),  # predicate is always True: presumably never serialized
46    )

A class for representing a response from the speak endpoint.

SpeakRESTResponse( content_type: str = '', request_id: str = '', model_uuid: str = '', model_name: str = '', characters: int = 0, transfer_encoding: str = '', date: str = '', filename: Optional[str] = None, stream: Optional[_io.BytesIO] = None, stream_memory: Optional[_io.BytesIO] = None)

content_type: str = ''

request_id: str = ''

model_uuid: str = ''

model_name: str = ''

characters: int = 0

transfer_encoding: str = ''

date: str = ''

filename: Optional[str] = None

stream: Optional[_io.BytesIO] = None

stream_memory: Optional[_io.BytesIO] = None

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

@dataclass

class SpeakWSOptions(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

@dataclass
class SpeakWSOptions(BaseResponse):
    """
    Options for a Speak (text-to-speech) WebSocket connection.

    Every field carries an ``exclude`` metadata predicate that fires when the
    field's value is None, so only explicitly set options (plus the default
    ``model``) are candidates for serialization.

    Reference:
    https://developers.deepgram.com/reference/transform-text-to-speech-websocket
    """

    # Voice model; the only option with a non-None default.
    model: Optional[str] = field(
        default="aura-asteria-en",
        metadata=dataclass_config(exclude=lambda f: f is None),
    )
    encoding: Optional[str] = field(
        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
    )
    # NOTE(review): `container` is intentionally left disabled here, unlike in
    # the REST options - presumably unsupported over WebSocket; confirm before
    # re-enabling.
    # container: Optional[str] = field(
    #     default=None, metadata=dataclass_config(exclude=lambda f: f is None)
    # )
    sample_rate: Optional[int] = field(
        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
    )
    bit_rate: Optional[int] = field(
        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
    )

    def __getitem__(self, key):
        """Return the value stored under ``key`` in the ``to_dict()`` form of the options."""
        _dict = self.to_dict()
        return _dict[key]

    def __setitem__(self, key, val):
        """Set attribute ``key`` to ``val`` by writing directly into the instance ``__dict__``."""
        self.__dict__[key] = val

    def __str__(self) -> str:
        """Return the options as JSON indented by four spaces."""
        return self.to_json(indent=4)

    def check(self):
        """
        Check the options for any missing or invalid values.

        No validation rules are defined at the moment, so the check always
        succeeds.

        Returns:
            bool: Always True.
        """
        # Nothing is validated and nothing is reported, so no logger is
        # created here; add one together with the first real rule.
        return True

Contains all the options for a Speak (text-to-speech) WebSocket connection.

Reference: https://developers.deepgram.com/reference/transform-text-to-speech-websocket

SpeakWSOptions( model: Optional[str] = 'aura-asteria-en', encoding: Optional[str] = None, sample_rate: Optional[int] = None, bit_rate: Optional[int] = None)

model: Optional[str] = 'aura-asteria-en'

encoding: Optional[str] = None

sample_rate: Optional[int] = None

bit_rate: Optional[int] = None

def check(self): View Source

53    def check(self):
54        """
55        Check the SpeakOptions for any missing or invalid values.
56        """
57        logger = verboselogs.VerboseLogger(__name__)
58        logger.addHandler(logging.StreamHandler())
59        prev = logger.level
60        logger.setLevel(verboselogs.ERROR)
61
62        # no op at the moment
63
64        logger.setLevel(prev)
65
66        return True

Check the SpeakOptions for any missing or invalid values.

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

@dataclass

class OpenResponse(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

17@dataclass
18class OpenResponse(BaseResponse):
19    """
20    Open Message from the Deepgram Platform.
21    """
22
23    type: str = ""  # presumably the message type reported by the platform; empty by default

Open Message from the Deepgram Platform

OpenResponse(type: str = '')

type: str = ''

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

SpeakWSMetadataResponse = <class 'deepgram.clients.speak.v1.websocket.response.MetadataResponse'>

@dataclass

class FlushedResponse(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

31@dataclass
32class FlushedResponse(BaseResponse):
33    """
34    Flushed Message from the Deepgram Platform.
35    """
36
37    type: str = ""  # presumably the message type reported by the platform; empty by default
38    sequence_id: int = 0  # defaults to 0; numbering semantics are not visible here - verify

Flushed Message from the Deepgram Platform

FlushedResponse(type: str = '', sequence_id: int = 0)

type: str = ''

sequence_id: int = 0

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

@dataclass

class ClearedResponse(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

41@dataclass
42class ClearedResponse(BaseResponse):
43    """
44    Cleared Message from the Deepgram Platform.
45    """
46
47    type: str = ""  # presumably the message type reported by the platform; empty by default
48    sequence_id: int = 0  # defaults to 0; numbering semantics are not visible here - verify

Cleared Message from the Deepgram Platform

ClearedResponse(type: str = '', sequence_id: int = 0)

type: str = ''

sequence_id: int = 0

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

@dataclass

class CloseResponse(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

29@dataclass
30class CloseResponse(BaseResponse):
31    """
32    Close Message from the Deepgram Platform.
33    """
34
35    type: str = ""  # presumably the message type reported by the platform; empty by default

Close Message from the Deepgram Platform

CloseResponse(type: str = '')

type: str = ''

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

@dataclass

class UnhandledResponse(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

58@dataclass
59class UnhandledResponse(BaseResponse):
60    """
61    Unhandled Message from the Deepgram Platform.
62    """
63
64    type: str = ""  # presumably the message type reported by the platform; empty by default
65    raw: str = ""  # presumably the unparsed message text - verify against the websocket client

Unhandled Message from the Deepgram Platform

UnhandledResponse(type: str = '', raw: str = '')

type: str = ''

raw: str = ''

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

@dataclass

class WarningResponse(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

51@dataclass
52class WarningResponse(BaseResponse):
53    """
54    Warning Message from the Deepgram Platform.
55    """
56
57    warn_code: str = ""  # warning code; empty by default
58    warn_msg: str = ""  # warning text; empty by default
59    type: str = ""  # presumably the message type reported by the platform; empty by default

Warning Message from the Deepgram Platform

WarningResponse(warn_code: str = '', warn_msg: str = '', type: str = '')

warn_code: str = ''

warn_msg: str = ''

type: str = ''

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

@dataclass

class ErrorResponse(deepgram.clients.common.v1.shared_response.BaseResponse): View Source

41@dataclass
42class ErrorResponse(BaseResponse):
43    """
44    Error Message from the Deepgram Platform.
45    """
46
47    description: str = ""
48    message: str = ""
49    type: str = ""  # presumably the message type reported by the platform; empty by default
50    variant: Optional[str] = field(  # optional; its exclude predicate fires when the value is None
51        default=None, metadata=dataclass_config(exclude=lambda f: f is None)
52    )

Error Message from the Deepgram Platform

ErrorResponse( description: str = '', message: str = '', type: str = '', variant: Optional[str] = None)

description: str = ''

message: str = ''

type: str = ''

variant: Optional[str] = None

Inherited Members

deepgram.clients.common.v1.shared_response.BaseResponse: eval

SpeakResponse = <class 'SpeakRESTResponse'>

SpeakClient = <class 'SpeakRESTClient'>

class SpeakRESTClient(deepgram.clients.common.v1.abstract_sync_rest.AbstractSyncRestClient): View Source

 25class SpeakRESTClient(AbstractSyncRestClient):
 26    """
 27    A client class for doing Text-to-Speech.
 28    Provides methods for speaking from text.
 29    """
 30
 31    _logger: verboselogs.VerboseLogger
 32    _config: DeepgramClientOptions
 33
 34    def __init__(self, config: DeepgramClientOptions):
 35        self._logger = verboselogs.VerboseLogger(__name__)
 36        self._logger.addHandler(logging.StreamHandler())
 37        self._logger.setLevel(config.verbose)
 38        self._config = config
 39        super().__init__(config)
 40
 41    # pylint: disable=too-many-positional-arguments
 42
 43    def stream_raw(
 44        self,
 45        source: FileSource,
 46        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
 47        addons: Optional[Dict] = None,
 48        headers: Optional[Dict] = None,
 49        timeout: Optional[httpx.Timeout] = None,
 50        endpoint: str = "v1/speak",
 51        **kwargs,
 52    ) -> httpx.Response:
 53        """
 54        Speak from a text source and store as a Iterator[byte].
 55
 56        Args:
 57            source (TextSource): The text source to speak.
 58            options (SpeakRESTOptions): Additional options for the ingest (default is None).
 59            addons (Dict): Additional options for the request (default is None).
 60            headers (Dict): Additional headers for the request (default is None).
 61            timeout (httpx.Timeout): The timeout for the request (default is None).
 62            endpoint (str): The endpoint to use for the request (default is "v1/speak").
 63
 64        Returns:
 65            httpx.Response: The direct httpx.Response object from the speak request.
 66            For more information, see https://www.python-httpx.org/api/#response
 67
 68            IMPORTANT: The response object's `close()` method should be called when done
 69            in order to prevent connection leaks.
 70
 71        Raises:
 72            DeepgramTypeError: Raised for known API errors.
 73        """
 74        self._logger.debug("SpeakClient.stream ENTER")
 75
 76        url = f"{self._config.url}/{endpoint}"
 77        if is_text_source(source):
 78            body = source
 79        else:
 80            self._logger.error("Unknown speak source type")
 81            self._logger.debug("SpeakClient.stream LEAVE")
 82            raise DeepgramTypeError("Unknown speak source type")
 83
 84        if isinstance(options, SpeakRESTOptions) and not options.check():
 85            self._logger.error("options.check failed")
 86            self._logger.debug("SpeakClient.stream LEAVE")
 87            raise DeepgramError("Fatal speak options error")
 88
 89        self._logger.info("url: %s", url)
 90        self._logger.info("source: %s", source)
 91        if isinstance(options, SpeakRESTOptions):
 92            self._logger.info("SpeakRESTOptions switching class -> dict")
 93            options = options.to_dict()
 94        self._logger.info("options: %s", options)
 95        self._logger.info("addons: %s", addons)
 96        self._logger.info("headers: %s", headers)
 97
 98        result = self.post_raw(
 99            url,
100            options=options,
101            addons=addons,
102            headers=headers,
103            json=body,
104            timeout=timeout,
105            **kwargs,
106        )
107
108        self._logger.info("result: %s", str(result))
109        self._logger.notice("speak succeeded")
110        self._logger.debug("SpeakClient.stream LEAVE")
111        return result
112
113    def stream_memory(
114        self,
115        source: FileSource,
116        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
117        addons: Optional[Dict] = None,
118        headers: Optional[Dict] = None,
119        timeout: Optional[httpx.Timeout] = None,
120        endpoint: str = "v1/speak",
121        **kwargs,
122    ) -> SpeakRESTResponse:
123        """
124        Speak from a text source and store in memory.
125
126        Args:
127            source (TextSource): The text source to speak.
128            options (SpeakRESTOptions): Additional options for the ingest (default is None).
129            addons (Dict): Additional options for the request (default is None).
130            headers (Dict): Additional headers for the request (default is None).
131            timeout (httpx.Timeout): The timeout for the request (default is None).
132            endpoint (str): The endpoint to use for the request (default is "v1/speak").
133
134        Returns:
135            SpeakRESTResponse: The response from the speak request.
136
137        Raises:
138            DeepgramTypeError: Raised for known API errors.
139        """
140        self._logger.debug("SpeakClient.stream ENTER")
141
142        url = f"{self._config.url}/{endpoint}"
143        if is_text_source(source):
144            body = source
145        else:
146            self._logger.error("Unknown speak source type")
147            self._logger.debug("SpeakClient.stream LEAVE")
148            raise DeepgramTypeError("Unknown speak source type")
149
150        if isinstance(options, SpeakRESTOptions) and not options.check():
151            self._logger.error("options.check failed")
152            self._logger.debug("SpeakClient.stream LEAVE")
153            raise DeepgramError("Fatal speak options error")
154
155        self._logger.info("url: %s", url)
156        self._logger.info("source: %s", source)
157        if isinstance(options, SpeakRESTOptions):
158            self._logger.info("SpeakRESTOptions switching class -> dict")
159            options = options.to_dict()
160        self._logger.info("options: %s", options)
161        self._logger.info("addons: %s", addons)
162        self._logger.info("headers: %s", headers)
163
164        return_vals = [
165            "content-type",
166            "request-id",
167            "model-uuid",
168            "model-name",
169            "char-count",
170            "transfer-encoding",
171            "date",
172        ]
173        result = self.post_memory(
174            url,
175            options=options,
176            addons=addons,
177            headers=headers,
178            json=body,
179            timeout=timeout,
180            file_result=return_vals,
181            **kwargs,
182        )
183
184        self._logger.info("result: %s", result)
185        resp = SpeakRESTResponse(
186            content_type=str(result["content-type"]),
187            request_id=str(result["request-id"]),
188            model_uuid=str(result["model-uuid"]),
189            model_name=str(result["model-name"]),
190            characters=int(str(result["char-count"])),
191            transfer_encoding=str(result["transfer-encoding"]),
192            date=str(result["date"]),
193            stream=cast(io.BytesIO, result["stream"]),
194            stream_memory=cast(io.BytesIO, result["stream"]),
195        )
196        self._logger.verbose("resp Object: %s", resp)
197        self._logger.notice("speak succeeded")
198        self._logger.debug("SpeakClient.stream LEAVE")
199        return resp
200
201    @deprecation.deprecated(
202        deprecated_in="3.4.0",
203        removed_in="4.0.0",
204        current_version=__version__,
205        details="SpeakRESTClient.stream is deprecated. Use SpeakRESTClient.stream_memory instead.",
206    )
207    def stream(
208        self,
209        source: FileSource,
210        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
211        addons: Optional[Dict] = None,
212        headers: Optional[Dict] = None,
213        timeout: Optional[httpx.Timeout] = None,
214        endpoint: str = "v1/speak",
215        **kwargs,
216    ) -> SpeakRESTResponse:
217        """
218        DEPRECATED: stream() is deprecated. Use stream_memory() instead.
219        """
220        return self.stream_memory(
221            source,
222            options=options,
223            addons=addons,
224            headers=headers,
225            timeout=timeout,
226            endpoint=endpoint,
227            **kwargs,
228        )
229
230    async def file(
231        self,
232        filename: str,
233        source: FileSource,
234        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
235        addons: Optional[Dict] = None,
236        timeout: Optional[httpx.Timeout] = None,
237        endpoint: str = "v1/speak",
238        **kwargs,
239    ) -> SpeakRESTResponse:
240        """
241        Speak from a text source and save to a file.
242        """
243        return self.save(
244            filename,
245            source,
246            options=options,
247            addons=addons,
248            timeout=timeout,
249            endpoint=endpoint,
250            **kwargs,
251        )
252
253    def save(
254        self,
255        filename: str,
256        source: FileSource,
257        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
258        addons: Optional[Dict] = None,
259        headers: Optional[Dict] = None,
260        timeout: Optional[httpx.Timeout] = None,
261        endpoint: str = "v1/speak",
262        **kwargs,
263    ) -> SpeakRESTResponse:
264        """
265        Speak from a text source and save to a file.
266
267        Args:
268            source (TextSource): The text source to speak.
269            options (SpeakRESTOptions): Additional options for the ingest (default is None).
270            addons (Dict): Additional options for the request (default is None).
271            headers (Dict): Additional headers for the request (default is None).
272            timeout (httpx.Timeout): The timeout for the request (default is None).
273            endpoint (str): The endpoint to use for the request (default is "v1/speak").
274
275        Returns:
276            SpeakRESTResponse: The response from the speak request.
277
278        Raises:
279            DeepgramTypeError: Raised for known API errors.
280        """
281        self._logger.debug("SpeakClient.save ENTER")
282
283        res = self.stream_memory(
284            source,
285            options=options,
286            addons=addons,
287            headers=headers,
288            timeout=timeout,
289            endpoint=endpoint,
290            **kwargs,
291        )
292
293        if res.stream is None:
294            self._logger.error("stream is None")
295            self._logger.debug("SpeakClient.save LEAVE")
296            raise DeepgramError("BytesIO stream is None")
297
298        # save to file
299        with open(filename, "wb+") as file:
300            file.write(res.stream.getbuffer())
301            file.flush()
302
303        # add filename to response
304        res.stream = None
305        res.filename = filename
306
307        self._logger.debug("SpeakClient.save LEAVE")
308        return res
309
310    # pylint: enable=too-many-positional-arguments

A client class for doing Text-to-Speech. Provides methods for speaking from text.

SpeakRESTClient(config: deepgram.options.DeepgramClientOptions) View Source

34    def __init__(self, config: DeepgramClientOptions):
35        self._logger = verboselogs.VerboseLogger(__name__)
36        self._logger.addHandler(logging.StreamHandler())
37        self._logger.setLevel(config.verbose)
38        self._config = config
39        super().__init__(config)

def stream_raw( self, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, headers: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> httpx.Response: View Source

 43    def stream_raw(
 44        self,
 45        source: FileSource,
 46        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
 47        addons: Optional[Dict] = None,
 48        headers: Optional[Dict] = None,
 49        timeout: Optional[httpx.Timeout] = None,
 50        endpoint: str = "v1/speak",
 51        **kwargs,
 52    ) -> httpx.Response:
 53        """
 54        Speak from a text source and store as a Iterator[byte].
 55
 56        Args:
 57            source (TextSource): The text source to speak.
 58            options (SpeakRESTOptions): Additional options for the ingest (default is None).
 59            addons (Dict): Additional options for the request (default is None).
 60            headers (Dict): Additional headers for the request (default is None).
 61            timeout (httpx.Timeout): The timeout for the request (default is None).
 62            endpoint (str): The endpoint to use for the request (default is "v1/speak").
 63
 64        Returns:
 65            httpx.Response: The direct httpx.Response object from the speak request.
 66            For more information, see https://www.python-httpx.org/api/#response
 67
 68            IMPORTANT: The response object's `close()` method should be called when done
 69            in order to prevent connection leaks.
 70
 71        Raises:
 72            DeepgramTypeError: Raised for known API errors.
 73        """
 74        self._logger.debug("SpeakClient.stream ENTER")
 75
 76        url = f"{self._config.url}/{endpoint}"
 77        if is_text_source(source):
 78            body = source
 79        else:
 80            self._logger.error("Unknown speak source type")
 81            self._logger.debug("SpeakClient.stream LEAVE")
 82            raise DeepgramTypeError("Unknown speak source type")
 83
 84        if isinstance(options, SpeakRESTOptions) and not options.check():
 85            self._logger.error("options.check failed")
 86            self._logger.debug("SpeakClient.stream LEAVE")
 87            raise DeepgramError("Fatal speak options error")
 88
 89        self._logger.info("url: %s", url)
 90        self._logger.info("source: %s", source)
 91        if isinstance(options, SpeakRESTOptions):
 92            self._logger.info("SpeakRESTOptions switching class -> dict")
 93            options = options.to_dict()
 94        self._logger.info("options: %s", options)
 95        self._logger.info("addons: %s", addons)
 96        self._logger.info("headers: %s", headers)
 97
 98        result = self.post_raw(
 99            url,
100            options=options,
101            addons=addons,
102            headers=headers,
103            json=body,
104            timeout=timeout,
105            **kwargs,
106        )
107
108        self._logger.info("result: %s", str(result))
109        self._logger.notice("speak succeeded")
110        self._logger.debug("SpeakClient.stream LEAVE")
111        return result

Speak from a text source and return the raw HTTP response, whose body can be read as an Iterator[bytes].

Args: source (TextSource): The text source to speak. options (SpeakRESTOptions): Additional options for the ingest (default is None). addons (Dict): Additional options for the request (default is None). headers (Dict): Additional headers for the request (default is None). timeout (httpx.Timeout): The timeout for the request (default is None). endpoint (str): The endpoint to use for the request (default is "v1/speak").

Returns: httpx.Response: The direct httpx.Response object from the speak request. For more information, see https://www.python-httpx.org/api/#response

IMPORTANT: The response object's `close()` method should be called when done
in order to prevent connection leaks.

Raises: DeepgramTypeError: Raised for known API errors.

def stream_memory( self, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, headers: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> SpeakRESTResponse: View Source

113    def stream_memory(
114        self,
115        source: FileSource,
116        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
117        addons: Optional[Dict] = None,
118        headers: Optional[Dict] = None,
119        timeout: Optional[httpx.Timeout] = None,
120        endpoint: str = "v1/speak",
121        **kwargs,
122    ) -> SpeakRESTResponse:
123        """
124        Speak from a text source and store in memory.
125
126        Args:
127            source (TextSource): The text source to speak.
128            options (SpeakRESTOptions): Additional options for the ingest (default is None).
129            addons (Dict): Additional options for the request (default is None).
130            headers (Dict): Additional headers for the request (default is None).
131            timeout (httpx.Timeout): The timeout for the request (default is None).
132            endpoint (str): The endpoint to use for the request (default is "v1/speak").
133
134        Returns:
135            SpeakRESTResponse: The response from the speak request.
136
137        Raises:
138            DeepgramTypeError: Raised for known API errors.
139        """
140        self._logger.debug("SpeakClient.stream ENTER")
141
142        url = f"{self._config.url}/{endpoint}"
143        if is_text_source(source):
144            body = source
145        else:
146            self._logger.error("Unknown speak source type")
147            self._logger.debug("SpeakClient.stream LEAVE")
148            raise DeepgramTypeError("Unknown speak source type")
149
150        if isinstance(options, SpeakRESTOptions) and not options.check():
151            self._logger.error("options.check failed")
152            self._logger.debug("SpeakClient.stream LEAVE")
153            raise DeepgramError("Fatal speak options error")
154
155        self._logger.info("url: %s", url)
156        self._logger.info("source: %s", source)
157        if isinstance(options, SpeakRESTOptions):
158            self._logger.info("SpeakRESTOptions switching class -> dict")
159            options = options.to_dict()
160        self._logger.info("options: %s", options)
161        self._logger.info("addons: %s", addons)
162        self._logger.info("headers: %s", headers)
163
164        return_vals = [
165            "content-type",
166            "request-id",
167            "model-uuid",
168            "model-name",
169            "char-count",
170            "transfer-encoding",
171            "date",
172        ]
173        result = self.post_memory(
174            url,
175            options=options,
176            addons=addons,
177            headers=headers,
178            json=body,
179            timeout=timeout,
180            file_result=return_vals,
181            **kwargs,
182        )
183
184        self._logger.info("result: %s", result)
185        resp = SpeakRESTResponse(
186            content_type=str(result["content-type"]),
187            request_id=str(result["request-id"]),
188            model_uuid=str(result["model-uuid"]),
189            model_name=str(result["model-name"]),
190            characters=int(str(result["char-count"])),
191            transfer_encoding=str(result["transfer-encoding"]),
192            date=str(result["date"]),
193            stream=cast(io.BytesIO, result["stream"]),
194            stream_memory=cast(io.BytesIO, result["stream"]),
195        )
196        self._logger.verbose("resp Object: %s", resp)
197        self._logger.notice("speak succeeded")
198        self._logger.debug("SpeakClient.stream LEAVE")
199        return resp

Speak from a text source and store in memory.

Returns: SpeakRESTResponse: The response from the speak request.

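Raises: DeepgramTypeError: Raised when the source is not a recognized text source. DeepgramError: Raised when the supplied SpeakRESTOptions fail their `check()` validation.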

@deprecation.deprecated(deprecated_in='3.4.0', removed_in='4.0.0', current_version=__version__, details='SpeakRESTClient.stream is deprecated. Use SpeakRESTClient.stream_memory instead.')

def stream( self, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, headers: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> SpeakRESTResponse: View Source

201    @deprecation.deprecated(
202        deprecated_in="3.4.0",
203        removed_in="4.0.0",
204        current_version=__version__,
205        details="SpeakRESTClient.stream is deprecated. Use SpeakRESTClient.stream_memory instead.",
206    )
207    def stream(
208        self,
209        source: FileSource,
210        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
211        addons: Optional[Dict] = None,
212        headers: Optional[Dict] = None,
213        timeout: Optional[httpx.Timeout] = None,
214        endpoint: str = "v1/speak",
215        **kwargs,
216    ) -> SpeakRESTResponse:
217        """
218        DEPRECATED: stream() is deprecated. Use stream_memory() instead.
219        """
220        return self.stream_memory(
221            source,
222            options=options,
223            addons=addons,
224            headers=headers,
225            timeout=timeout,
226            endpoint=endpoint,
227            **kwargs,
228        )

DEPRECATED: stream() is deprecated. Use stream_memory() instead.

async def file( self, filename: str, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> SpeakRESTResponse: View Source

230    async def file(
231        self,
232        filename: str,
233        source: FileSource,
234        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
235        addons: Optional[Dict] = None,
236        timeout: Optional[httpx.Timeout] = None,
237        endpoint: str = "v1/speak",
238        **kwargs,
239    ) -> SpeakRESTResponse:
240        """
241        Speak from a text source and save to a file.
242        """
243        return self.save(
244            filename,
245            source,
246            options=options,
247            addons=addons,
248            timeout=timeout,
249            endpoint=endpoint,
250            **kwargs,
251        )

Speak from a text source and save to a file.

def save( self, filename: str, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, headers: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> SpeakRESTResponse: View Source

253    def save(
254        self,
255        filename: str,
256        source: FileSource,
257        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
258        addons: Optional[Dict] = None,
259        headers: Optional[Dict] = None,
260        timeout: Optional[httpx.Timeout] = None,
261        endpoint: str = "v1/speak",
262        **kwargs,
263    ) -> SpeakRESTResponse:
264        """
265        Speak from a text source and save to a file.
266
267        Args:
268            source (TextSource): The text source to speak.
269            options (SpeakRESTOptions): Additional options for the ingest (default is None).
270            addons (Dict): Additional options for the request (default is None).
271            headers (Dict): Additional headers for the request (default is None).
272            timeout (httpx.Timeout): The timeout for the request (default is None).
273            endpoint (str): The endpoint to use for the request (default is "v1/speak").
274
275        Returns:
276            SpeakRESTResponse: The response from the speak request.
277
278        Raises:
279            DeepgramTypeError: Raised for known API errors.
280        """
281        self._logger.debug("SpeakClient.save ENTER")
282
283        res = self.stream_memory(
284            source,
285            options=options,
286            addons=addons,
287            headers=headers,
288            timeout=timeout,
289            endpoint=endpoint,
290            **kwargs,
291        )
292
293        if res.stream is None:
294            self._logger.error("stream is None")
295            self._logger.debug("SpeakClient.save LEAVE")
296            raise DeepgramError("BytesIO stream is None")
297
298        # save to file
299        with open(filename, "wb+") as file:
300            file.write(res.stream.getbuffer())
301            file.flush()
302
303        # add filename to response
304        res.stream = None
305        res.filename = filename
306
307        self._logger.debug("SpeakClient.save LEAVE")
308        return res

Speak from a text source and save to a file.

Returns: SpeakRESTResponse: The response from the speak request.

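Raises: DeepgramTypeError: Raised when the source is not a recognized text source. DeepgramError: Raised when the supplied SpeakRESTOptions fail their `check()` validation, or when the response contains no audio stream to save.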

Inherited Members

deepgram.clients.common.v1.abstract_sync_rest.AbstractSyncRestClient: get; post_raw; post_memory; post; put; patch; delete

class AsyncSpeakRESTClient(deepgram.clients.common.v1.abstract_async_rest.AbstractAsyncRestClient): View Source

 26class AsyncSpeakRESTClient(AbstractAsyncRestClient):
 27    """
 28    A client class for doing Text-to-Speech.
 29    Provides methods for speaking from text.
 30    """
 31
 32    _logger: verboselogs.VerboseLogger
 33    _config: DeepgramClientOptions
 34
 35    def __init__(self, config: DeepgramClientOptions):
 36        self._logger = verboselogs.VerboseLogger(__name__)
 37        self._logger.addHandler(logging.StreamHandler())
 38        self._logger.setLevel(config.verbose)
 39        self._config = config
 40        super().__init__(config)
 41
 42    # pylint: disable=too-many-positional-arguments
 43
 44    async def stream_raw(
 45        self,
 46        source: FileSource,
 47        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
 48        addons: Optional[Dict] = None,
 49        headers: Optional[Dict] = None,
 50        timeout: Optional[httpx.Timeout] = None,
 51        endpoint: str = "v1/speak",
 52        **kwargs,
 53    ) -> httpx.Response:
 54        """
 55        Speak from a text source and store as a Iterator[byte].
 56
 57        Args:
 58            source (TextSource): The text source to speak.
 59            options (SpeakRESTOptions): Additional options for the ingest (default is None).
 60            addons (Dict): Additional options for the request (default is None).
 61            headers (Dict): Additional headers for the request (default is None).
 62            timeout (httpx.Timeout): The timeout for the request (default is None).
 63            endpoint (str): The endpoint to use for the request (default is "v1/speak").
 64
 65        Returns:
 66            httpx.Response: The direct httpx.Response object from the speak request.
 67            For more information, see https://www.python-httpx.org/api/#response
 68
 69            IMPORTANT: The response object's `close()` method should be called when done
 70            in order to prevent connection leaks.
 71
 72        Raises:
 73            DeepgramTypeError: Raised for known API errors.
 74        """
 75        self._logger.debug("AsyncSpeakClient.stream ENTER")
 76
 77        url = f"{self._config.url}/{endpoint}"
 78        if is_text_source(source):
 79            body = source
 80        else:
 81            self._logger.error("Unknown speak source type")
 82            self._logger.debug("AsyncSpeakClient.stream LEAVE")
 83            raise DeepgramTypeError("Unknown speak source type")
 84
 85        if isinstance(options, SpeakRESTOptions) and not options.check():
 86            self._logger.error("options.check failed")
 87            self._logger.debug("AsyncSpeakClient.stream LEAVE")
 88            raise DeepgramError("Fatal speak options error")
 89
 90        self._logger.info("url: %s", url)
 91        self._logger.info("source: %s", source)
 92        if isinstance(options, SpeakRESTOptions):
 93            self._logger.info("SpeakRESTOptions switching class -> dict")
 94            options = options.to_dict()
 95        self._logger.info("options: %s", options)
 96        self._logger.info("addons: %s", addons)
 97        self._logger.info("headers: %s", headers)
 98
 99        result = await self.post_raw(
100            url,
101            options=options,
102            addons=addons,
103            headers=headers,
104            json=body,
105            timeout=timeout,
106            **kwargs,
107        )
108
109        self._logger.info("result: %s", str(result))
110        self._logger.notice("speak succeeded")
111        self._logger.debug("AsyncSpeakClient.stream LEAVE")
112        return result
113
114    async def stream_memory(
115        self,
116        source: FileSource,
117        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
118        addons: Optional[Dict] = None,
119        headers: Optional[Dict] = None,
120        timeout: Optional[httpx.Timeout] = None,
121        endpoint: str = "v1/speak",
122        **kwargs,
123    ) -> SpeakRESTResponse:
124        """
125        Speak from a text source and store in memory.
126
127        Args:
128            source (TextSource): The text source to speak.
129            options (SpeakRESTOptions): Additional options for the ingest (default is None).
130            addons (Dict): Additional options for the request (default is None).
131            headers (Dict): Additional headers for the request (default is None).
132            timeout (httpx.Timeout): The timeout for the request (default is None).
133            endpoint (str): The endpoint to use for the request (default is "v1/speak").
134
135        Returns:
136            SpeakRESTResponse: The response from the speak request.
137
138        Raises:
139            DeepgramTypeError: Raised for known API errors.
140        """
141        self._logger.debug("AsyncSpeakClient.stream ENTER")
142
143        url = f"{self._config.url}/{endpoint}"
144        if is_text_source(source):
145            body = source
146        else:
147            self._logger.error("Unknown speak source type")
148            self._logger.debug("AsyncSpeakClient.stream LEAVE")
149            raise DeepgramTypeError("Unknown speak source type")
150
151        if isinstance(options, SpeakRESTOptions) and not options.check():
152            self._logger.error("options.check failed")
153            self._logger.debug("AsyncSpeakClient.stream LEAVE")
154            raise DeepgramError("Fatal speak options error")
155
156        self._logger.info("url: %s", url)
157        self._logger.info("source: %s", source)
158        if isinstance(options, SpeakRESTOptions):
159            self._logger.info("SpeakRESTOptions switching class -> dict")
160            options = options.to_dict()
161        self._logger.info("options: %s", options)
162        self._logger.info("addons: %s", addons)
163        self._logger.info("headers: %s", headers)
164
165        return_vals = [
166            "content-type",
167            "request-id",
168            "model-uuid",
169            "model-name",
170            "char-count",
171            "transfer-encoding",
172            "date",
173        ]
174        result = await self.post_memory(
175            url,
176            options=options,
177            addons=addons,
178            headers=headers,
179            json=body,
180            timeout=timeout,
181            file_result=return_vals,
182            **kwargs,
183        )
184        self._logger.info("result: %s", result)
185        resp = SpeakRESTResponse(
186            content_type=str(result["content-type"]),
187            request_id=str(result["request-id"]),
188            model_uuid=str(result["model-uuid"]),
189            model_name=str(result["model-name"]),
190            characters=int(str(result["char-count"])),
191            transfer_encoding=str(result["transfer-encoding"]),
192            date=str(result["date"]),
193            stream=cast(io.BytesIO, result["stream"]),
194            stream_memory=cast(io.BytesIO, result["stream"]),
195        )
196        self._logger.verbose("resp Object: %s", str(resp))
197        self._logger.notice("speak succeeded")
198        self._logger.debug("AsyncSpeakClient.stream LEAVE")
199        return resp
200
201    @deprecation.deprecated(
202        deprecated_in="3.4.0",
203        removed_in="4.0.0",
204        current_version=__version__,
205        details="SpeakRESTClient.stream is deprecated. Use SpeakRESTClient.stream_memory instead.",
206    )
207    async def stream(
208        self,
209        source: FileSource,
210        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
211        addons: Optional[Dict] = None,
212        headers: Optional[Dict] = None,
213        timeout: Optional[httpx.Timeout] = None,
214        endpoint: str = "v1/speak",
215        **kwargs,
216    ) -> SpeakRESTResponse:
217        """
218        DEPRECATED: stream() is deprecated. Use stream_memory() instead.
219        """
220        return await self.stream_memory(
221            source,
222            options=options,
223            addons=addons,
224            headers=headers,
225            timeout=timeout,
226            endpoint=endpoint,
227            **kwargs,
228        )
229
230    async def file(
231        self,
232        filename: str,
233        source: FileSource,
234        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
235        addons: Optional[Dict] = None,
236        timeout: Optional[httpx.Timeout] = None,
237        endpoint: str = "v1/speak",
238        **kwargs,
239    ) -> SpeakRESTResponse:
240        """
241        Speak from a text source and save to a file.
242        """
243        return await self.save(
244            filename,
245            source,
246            options=options,
247            addons=addons,
248            timeout=timeout,
249            endpoint=endpoint,
250            **kwargs,
251        )
252
253    async def save(
254        self,
255        filename: str,
256        source: FileSource,
257        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
258        addons: Optional[Dict] = None,
259        headers: Optional[Dict] = None,
260        timeout: Optional[httpx.Timeout] = None,
261        endpoint: str = "v1/speak",
262        **kwargs,
263    ) -> SpeakRESTResponse:
264        """
265        Speak from a text source and save to a file.
266
267        Args:
268            source (TextSource): The text source to speak.
269            options (SpeakRESTOptions): Additional options for the ingest (default is None).
270            addons (Dict): Additional options for the request (default is None).
271            headers (Dict): Additional headers for the request (default is None).
272            timeout (httpx.Timeout): The timeout for the request (default is None).
273            endpoint (str): The endpoint to use for the request (default is "v1/speak").
274
275        Returns:
276            SpeakRESTResponse: The response from the speak request.
277
278        Raises:
279            DeepgramTypeError: Raised for known API errors.
280        """
281        self._logger.debug("AsyncSpeakClient.save ENTER")
282
283        res = await self.stream_memory(
284            source,
285            options=options,
286            addons=addons,
287            headers=headers,
288            timeout=timeout,
289            endpoint=endpoint,
290            **kwargs,
291        )
292
293        if res.stream is None:
294            self._logger.error("stream is None")
295            self._logger.debug("AsyncSpeakClient.save LEAVE")
296            raise DeepgramError("BytesIO stream is None")
297
298        # save to file
299        async with aiofiles.open(filename, "wb") as out:
300            await out.write(res.stream.getbuffer())
301            await out.flush()
302
303        # add filename to response
304        res.stream = None
305        res.filename = filename
306
307        self._logger.debug("AsyncSpeakClient.save LEAVE")
308        return res
309
310    # pylint: enable=too-many-positional-arguments

A client class for doing Text-to-Speech. Provides methods for speaking from text.

AsyncSpeakRESTClient(config: deepgram.options.DeepgramClientOptions) View Source

35    def __init__(self, config: DeepgramClientOptions):
36        self._logger = verboselogs.VerboseLogger(__name__)
37        self._logger.addHandler(logging.StreamHandler())
38        self._logger.setLevel(config.verbose)
39        self._config = config
40        super().__init__(config)

async def stream_raw( self, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, headers: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> httpx.Response: View Source

 44    async def stream_raw(
 45        self,
 46        source: FileSource,
 47        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
 48        addons: Optional[Dict] = None,
 49        headers: Optional[Dict] = None,
 50        timeout: Optional[httpx.Timeout] = None,
 51        endpoint: str = "v1/speak",
 52        **kwargs,
 53    ) -> httpx.Response:
 54        """
 55        Speak from a text source and store as a Iterator[byte].
 56
 57        Args:
 58            source (TextSource): The text source to speak.
 59            options (SpeakRESTOptions): Additional options for the ingest (default is None).
 60            addons (Dict): Additional options for the request (default is None).
 61            headers (Dict): Additional headers for the request (default is None).
 62            timeout (httpx.Timeout): The timeout for the request (default is None).
 63            endpoint (str): The endpoint to use for the request (default is "v1/speak").
 64
 65        Returns:
 66            httpx.Response: The direct httpx.Response object from the speak request.
 67            For more information, see https://www.python-httpx.org/api/#response
 68
 69            IMPORTANT: The response object's `close()` method should be called when done
 70            in order to prevent connection leaks.
 71
 72        Raises:
 73            DeepgramTypeError: Raised for known API errors.
 74        """
 75        self._logger.debug("AsyncSpeakClient.stream ENTER")
 76
 77        url = f"{self._config.url}/{endpoint}"
 78        if is_text_source(source):
 79            body = source
 80        else:
 81            self._logger.error("Unknown speak source type")
 82            self._logger.debug("AsyncSpeakClient.stream LEAVE")
 83            raise DeepgramTypeError("Unknown speak source type")
 84
 85        if isinstance(options, SpeakRESTOptions) and not options.check():
 86            self._logger.error("options.check failed")
 87            self._logger.debug("AsyncSpeakClient.stream LEAVE")
 88            raise DeepgramError("Fatal speak options error")
 89
 90        self._logger.info("url: %s", url)
 91        self._logger.info("source: %s", source)
 92        if isinstance(options, SpeakRESTOptions):
 93            self._logger.info("SpeakRESTOptions switching class -> dict")
 94            options = options.to_dict()
 95        self._logger.info("options: %s", options)
 96        self._logger.info("addons: %s", addons)
 97        self._logger.info("headers: %s", headers)
 98
 99        result = await self.post_raw(
100            url,
101            options=options,
102            addons=addons,
103            headers=headers,
104            json=body,
105            timeout=timeout,
106            **kwargs,
107        )
108
109        self._logger.info("result: %s", str(result))
110        self._logger.notice("speak succeeded")
111        self._logger.debug("AsyncSpeakClient.stream LEAVE")
112        return result

Speak from a text source and return the raw HTTP response, whose body can be consumed as an iterator of bytes.

Returns: httpx.Response: The direct httpx.Response object from the speak request. For more information, see https://www.python-httpx.org/api/#response

IMPORTANT: The response object's `close()` method should be called when done
in order to prevent connection leaks.

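Raises: DeepgramTypeError: Raised when the source is not a recognized text source. DeepgramError: Raised when the supplied SpeakRESTOptions fail their `check()` validation.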

async def stream_memory( self, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, headers: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> SpeakRESTResponse: View Source

114    async def stream_memory(
115        self,
116        source: FileSource,
117        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
118        addons: Optional[Dict] = None,
119        headers: Optional[Dict] = None,
120        timeout: Optional[httpx.Timeout] = None,
121        endpoint: str = "v1/speak",
122        **kwargs,
123    ) -> SpeakRESTResponse:
124        """
125        Speak from a text source and store in memory.
126
127        Args:
128            source (TextSource): The text source to speak.
129            options (SpeakRESTOptions): Additional options for the ingest (default is None).
130            addons (Dict): Additional options for the request (default is None).
131            headers (Dict): Additional headers for the request (default is None).
132            timeout (httpx.Timeout): The timeout for the request (default is None).
133            endpoint (str): The endpoint to use for the request (default is "v1/speak").
134
135        Returns:
136            SpeakRESTResponse: The response from the speak request.
137
138        Raises:
139            DeepgramTypeError: Raised for known API errors.
140        """
141        self._logger.debug("AsyncSpeakClient.stream ENTER")
142
143        url = f"{self._config.url}/{endpoint}"
144        if is_text_source(source):
145            body = source
146        else:
147            self._logger.error("Unknown speak source type")
148            self._logger.debug("AsyncSpeakClient.stream LEAVE")
149            raise DeepgramTypeError("Unknown speak source type")
150
151        if isinstance(options, SpeakRESTOptions) and not options.check():
152            self._logger.error("options.check failed")
153            self._logger.debug("AsyncSpeakClient.stream LEAVE")
154            raise DeepgramError("Fatal speak options error")
155
156        self._logger.info("url: %s", url)
157        self._logger.info("source: %s", source)
158        if isinstance(options, SpeakRESTOptions):
159            self._logger.info("SpeakRESTOptions switching class -> dict")
160            options = options.to_dict()
161        self._logger.info("options: %s", options)
162        self._logger.info("addons: %s", addons)
163        self._logger.info("headers: %s", headers)
164
165        return_vals = [
166            "content-type",
167            "request-id",
168            "model-uuid",
169            "model-name",
170            "char-count",
171            "transfer-encoding",
172            "date",
173        ]
174        result = await self.post_memory(
175            url,
176            options=options,
177            addons=addons,
178            headers=headers,
179            json=body,
180            timeout=timeout,
181            file_result=return_vals,
182            **kwargs,
183        )
184        self._logger.info("result: %s", result)
185        resp = SpeakRESTResponse(
186            content_type=str(result["content-type"]),
187            request_id=str(result["request-id"]),
188            model_uuid=str(result["model-uuid"]),
189            model_name=str(result["model-name"]),
190            characters=int(str(result["char-count"])),
191            transfer_encoding=str(result["transfer-encoding"]),
192            date=str(result["date"]),
193            stream=cast(io.BytesIO, result["stream"]),
194            stream_memory=cast(io.BytesIO, result["stream"]),
195        )
196        self._logger.verbose("resp Object: %s", str(resp))
197        self._logger.notice("speak succeeded")
198        self._logger.debug("AsyncSpeakClient.stream LEAVE")
199        return resp

Speak from a text source and store in memory.

Returns: SpeakRESTResponse: The response from the speak request.

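Raises: DeepgramTypeError: Raised when the source is not a recognized text source. DeepgramError: Raised when the supplied SpeakRESTOptions fail their `check()` validation.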

@deprecation.deprecated(deprecated_in='3.4.0', removed_in='4.0.0', current_version=__version__, details='SpeakRESTClient.stream is deprecated. Use SpeakRESTClient.stream_memory instead.')

async def stream( self, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, headers: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> SpeakRESTResponse: View Source

201    @deprecation.deprecated(
202        deprecated_in="3.4.0",
203        removed_in="4.0.0",
204        current_version=__version__,
205        details="SpeakRESTClient.stream is deprecated. Use SpeakRESTClient.stream_memory instead.",
206    )
207    async def stream(
208        self,
209        source: FileSource,
210        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
211        addons: Optional[Dict] = None,
212        headers: Optional[Dict] = None,
213        timeout: Optional[httpx.Timeout] = None,
214        endpoint: str = "v1/speak",
215        **kwargs,
216    ) -> SpeakRESTResponse:
217        """
218        DEPRECATED: stream() is deprecated. Use stream_memory() instead.
219        """
220        return await self.stream_memory(
221            source,
222            options=options,
223            addons=addons,
224            headers=headers,
225            timeout=timeout,
226            endpoint=endpoint,
227            **kwargs,
228        )

DEPRECATED: stream() is deprecated. Use stream_memory() instead.

230    async def file(
231        self,
232        filename: str,
233        source: FileSource,
234        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
235        addons: Optional[Dict] = None,
236        timeout: Optional[httpx.Timeout] = None,
237        endpoint: str = "v1/speak",
238        **kwargs,
239    ) -> SpeakRESTResponse:
240        """
241        Speak from a text source and save to a file.
242        """
243        return await self.save(
244            filename,
245            source,
246            options=options,
247            addons=addons,
248            timeout=timeout,
249            endpoint=endpoint,
250            **kwargs,
251        )

Speak from a text source and save to a file.

async def save( self, filename: str, source: Union[TextSource, BufferSource, StreamSource], options: Union[Dict, SpeakRESTOptions, NoneType] = None, addons: Optional[Dict] = None, headers: Optional[Dict] = None, timeout: Optional[httpx.Timeout] = None, endpoint: str = 'v1/speak', **kwargs) -> SpeakRESTResponse: View Source

253    async def save(
254        self,
255        filename: str,
256        source: FileSource,
257        options: Optional[Union[Dict, SpeakRESTOptions]] = None,
258        addons: Optional[Dict] = None,
259        headers: Optional[Dict] = None,
260        timeout: Optional[httpx.Timeout] = None,
261        endpoint: str = "v1/speak",
262        **kwargs,
263    ) -> SpeakRESTResponse:
264        """
265        Speak from a text source and save to a file.
266
267        Args:
268            source (TextSource): The text source to speak.
269            options (SpeakRESTOptions): Additional options for the ingest (default is None).
270            addons (Dict): Additional options for the request (default is None).
271            headers (Dict): Additional headers for the request (default is None).
272            timeout (httpx.Timeout): The timeout for the request (default is None).
273            endpoint (str): The endpoint to use for the request (default is "v1/speak").
274
275        Returns:
276            SpeakRESTResponse: The response from the speak request.
277
278        Raises:
279            DeepgramTypeError: Raised for known API errors.
280        """
281        self._logger.debug("AsyncSpeakClient.save ENTER")
282
283        res = await self.stream_memory(
284            source,
285            options=options,
286            addons=addons,
287            headers=headers,
288            timeout=timeout,
289            endpoint=endpoint,
290            **kwargs,
291        )
292
293        if res.stream is None:
294            self._logger.error("stream is None")
295            self._logger.debug("AsyncSpeakClient.save LEAVE")
296            raise DeepgramError("BytesIO stream is None")
297
298        # save to file
299        async with aiofiles.open(filename, "wb") as out:
300            await out.write(res.stream.getbuffer())
301            await out.flush()
302
303        # add filename to response
304        res.stream = None
305        res.filename = filename
306
307        self._logger.debug("AsyncSpeakClient.save LEAVE")
308        return res

Speak from a text source and save to a file.

Returns: SpeakRESTResponse: The response from the speak request.

Raises: DeepgramTypeError: Raised for known API errors. DeepgramError: Raised when the response contains no audio stream to write to the file.

Inherited Members

deepgram.clients.common.v1.abstract_async_rest.AbstractAsyncRestClient: get; post_raw; post_memory; post; put; patch; delete

SpeakWebSocketClient = <class 'SpeakWSClient'>

AsyncSpeakWebSocketClient = <class 'AsyncSpeakWSClient'>