SDK regeneration

fern-api[bot] · louisjoecodes · commit b5063c5dd093 · 2024-12-12T14:50:45.000Z
diff --git a/poetry.lock b/poetry.lock
diff --git a/pyproject.toml b/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "elevenlabs"
-version = "1.13.4"
+version = "1.13.5"
 description = ""
 readme = "README.md"
 authors = []
diff --git a/reference.md b/reference.md
@@ -1176,10 +1176,12 @@ from elevenlabs import ElevenLabs
 client = ElevenLabs(
     api_key="YOUR_API_KEY",
 )
-client.text_to_speech.stream_with_timestamps(
+response = client.text_to_speech.stream_with_timestamps(
     voice_id="21m00Tcm4TlvDq8ikWAM",
     text="text",
 )
+for chunk in response:
+    yield chunk
 
 ```
 </dd>
diff --git a/src/elevenlabs/__init__.py b/src/elevenlabs/__init__.py
@@ -240,6 +240,9 @@
     BodyTextToSpeechStreamingWithTimestampsV1TextToSpeechVoiceIdStreamWithTimestampsPostApplyTextNormalization,
     BodyTextToSpeechV1TextToSpeechVoiceIdPostApplyTextNormalization,
     BodyTextToSpeechWithTimestampsV1TextToSpeechVoiceIdWithTimestampsPostApplyTextNormalization,
+    TextToSpeechStreamWithTimestampsResponse,
+    TextToSpeechStreamWithTimestampsResponseAlignment,
+    TextToSpeechStreamWithTimestampsResponseNormalizedAlignment,
 )
 from .text_to_voice import TextToVoiceCreatePreviewsRequestOutputFormat
 from .version import __version__
@@ -428,6 +431,9 @@
     "SubscriptionResponseModelCurrency",
     "SubscriptionStatus",
     "TextToSpeechAsStreamRequest",
+    "TextToSpeechStreamWithTimestampsResponse",
+    "TextToSpeechStreamWithTimestampsResponseAlignment",
+    "TextToSpeechStreamWithTimestampsResponseNormalizedAlignment",
     "TextToVoiceCreatePreviewsRequestOutputFormat",
     "TtsConversationalConfig",
     "TtsConversationalConfigOverride",
diff --git a/src/elevenlabs/core/client_wrapper.py b/src/elevenlabs/core/client_wrapper.py
@@ -16,7 +16,7 @@ def get_headers(self) -> typing.Dict[str, str]:
         headers: typing.Dict[str, str] = {
             "X-Fern-Language": "Python",
             "X-Fern-SDK-Name": "elevenlabs",
-            "X-Fern-SDK-Version": "1.13.4",
+            "X-Fern-SDK-Version": "1.13.5",
         }
         if self._api_key is not None:
             headers["xi-api-key"] = self._api_key
diff --git a/src/elevenlabs/text_to_speech/__init__.py b/src/elevenlabs/text_to_speech/__init__.py
@@ -5,11 +5,17 @@
     BodyTextToSpeechStreamingWithTimestampsV1TextToSpeechVoiceIdStreamWithTimestampsPostApplyTextNormalization,
     BodyTextToSpeechV1TextToSpeechVoiceIdPostApplyTextNormalization,
     BodyTextToSpeechWithTimestampsV1TextToSpeechVoiceIdWithTimestampsPostApplyTextNormalization,
+    TextToSpeechStreamWithTimestampsResponse,
+    TextToSpeechStreamWithTimestampsResponseAlignment,
+    TextToSpeechStreamWithTimestampsResponseNormalizedAlignment,
 )
 
 __all__ = [
     "BodyTextToSpeechStreamingV1TextToSpeechVoiceIdStreamPostApplyTextNormalization",
     "BodyTextToSpeechStreamingWithTimestampsV1TextToSpeechVoiceIdStreamWithTimestampsPostApplyTextNormalization",
     "BodyTextToSpeechV1TextToSpeechVoiceIdPostApplyTextNormalization",
     "BodyTextToSpeechWithTimestampsV1TextToSpeechVoiceIdWithTimestampsPostApplyTextNormalization",
+    "TextToSpeechStreamWithTimestampsResponse",
+    "TextToSpeechStreamWithTimestampsResponseAlignment",
+    "TextToSpeechStreamWithTimestampsResponseNormalizedAlignment",
 ]
diff --git a/src/elevenlabs/text_to_speech/client.py b/src/elevenlabs/text_to_speech/client.py
@@ -26,6 +26,8 @@
 from .types.body_text_to_speech_streaming_with_timestamps_v_1_text_to_speech_voice_id_stream_with_timestamps_post_apply_text_normalization import (
     BodyTextToSpeechStreamingWithTimestampsV1TextToSpeechVoiceIdStreamWithTimestampsPostApplyTextNormalization,
 )
+from .types.text_to_speech_stream_with_timestamps_response import TextToSpeechStreamWithTimestampsResponse
+import json
 from ..core.client_wrapper import AsyncClientWrapper
 
 # this is used as the default value for optional parameters
@@ -538,7 +540,7 @@ def stream_with_timestamps(
             BodyTextToSpeechStreamingWithTimestampsV1TextToSpeechVoiceIdStreamWithTimestampsPostApplyTextNormalization
         ] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
-    ) -> None:
+    ) -> typing.Iterator[TextToSpeechStreamWithTimestampsResponse]:
         """
         Converts text into speech using a voice of your choice and returns a stream of JSON objects, each containing an audio chunk as a base64-encoded string together with timing information indicating when each character was spoken.
 
@@ -595,9 +597,10 @@ def stream_with_timestamps(
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration.
 
-        Returns
-        -------
-        None
+        Yields
+        ------
+        typing.Iterator[TextToSpeechStreamWithTimestampsResponse]
+            Stream of JSON objects containing audio chunks and character timing information
 
         Examples
         --------
@@ -606,12 +609,14 @@ def stream_with_timestamps(
         client = ElevenLabs(
             api_key="YOUR_API_KEY",
         )
-        client.text_to_speech.stream_with_timestamps(
+        response = client.text_to_speech.stream_with_timestamps(
             voice_id="21m00Tcm4TlvDq8ikWAM",
             text="text",
         )
+        for chunk in response:
+            yield chunk
         """
-        _response = self._client_wrapper.httpx_client.request(
+        with self._client_wrapper.httpx_client.stream(
             f"v1/text-to-speech/{jsonable_encoder(voice_id)}/stream/with-timestamps",
             method="POST",
             params={
@@ -644,24 +649,38 @@ def stream_with_timestamps(
             },
             request_options=request_options,
             omit=OMIT,
-        )
-        try:
-            if 200 <= _response.status_code < 300:
-                return
-            if _response.status_code == 422:
-                raise UnprocessableEntityError(
-                    typing.cast(
-                        HttpValidationError,
-                        construct_type(
-                            type_=HttpValidationError,  # type: ignore
-                            object_=_response.json(),
-                        ),
+        ) as _response:
+            try:
+                if 200 <= _response.status_code < 300:
+                    for _text in _response.iter_lines():
+                        try:
+                            if len(_text) == 0:
+                                continue
+                            yield typing.cast(
+                                TextToSpeechStreamWithTimestampsResponse,
+                                construct_type(
+                                    type_=TextToSpeechStreamWithTimestampsResponse,  # type: ignore
+                                    object_=json.loads(_text),
+                                ),
+                            )
+                        except:
+                            pass
+                    return
+                _response.read()
+                if _response.status_code == 422:
+                    raise UnprocessableEntityError(
+                        typing.cast(
+                            HttpValidationError,
+                            construct_type(
+                                type_=HttpValidationError,  # type: ignore
+                                object_=_response.json(),
+                            ),
+                        )
                     )
-                )
-            _response_json = _response.json()
-        except JSONDecodeError:
-            raise ApiError(status_code=_response.status_code, body=_response.text)
-        raise ApiError(status_code=_response.status_code, body=_response_json)
+                _response_json = _response.json()
+            except JSONDecodeError:
+                raise ApiError(status_code=_response.status_code, body=_response.text)
+            raise ApiError(status_code=_response.status_code, body=_response_json)
 
 
 class AsyncTextToSpeechClient:
@@ -1194,7 +1213,7 @@ async def stream_with_timestamps(
             BodyTextToSpeechStreamingWithTimestampsV1TextToSpeechVoiceIdStreamWithTimestampsPostApplyTextNormalization
         ] = OMIT,
         request_options: typing.Optional[RequestOptions] = None,
-    ) -> None:
+    ) -> typing.AsyncIterator[TextToSpeechStreamWithTimestampsResponse]:
         """
         Converts text into speech using a voice of your choice and returns a stream of JSON objects, each containing an audio chunk as a base64-encoded string together with timing information indicating when each character was spoken.
 
@@ -1251,9 +1270,10 @@ async def stream_with_timestamps(
         request_options : typing.Optional[RequestOptions]
             Request-specific configuration.
 
-        Returns
-        -------
-        None
+        Yields
+        ------
+        typing.AsyncIterator[TextToSpeechStreamWithTimestampsResponse]
+            Stream of JSON objects containing audio chunks and character timing information
 
         Examples
         --------
@@ -1267,15 +1287,17 @@ async def stream_with_timestamps(
 
 
         async def main() -> None:
-            await client.text_to_speech.stream_with_timestamps(
+            response = client.text_to_speech.stream_with_timestamps(
                 voice_id="21m00Tcm4TlvDq8ikWAM",
                 text="text",
             )
+            async for chunk in response:
+                print(chunk)
 
 
         asyncio.run(main())
         """
-        _response = await self._client_wrapper.httpx_client.request(
+        async with self._client_wrapper.httpx_client.stream(
             f"v1/text-to-speech/{jsonable_encoder(voice_id)}/stream/with-timestamps",
             method="POST",
             params={
@@ -1308,21 +1330,35 @@ async def main() -> None:
             },
             request_options=request_options,
             omit=OMIT,
-        )
-        try:
-            if 200 <= _response.status_code < 300:
-                return
-            if _response.status_code == 422:
-                raise UnprocessableEntityError(
-                    typing.cast(
-                        HttpValidationError,
-                        construct_type(
-                            type_=HttpValidationError,  # type: ignore
-                            object_=_response.json(),
-                        ),
+        ) as _response:
+            try:
+                if 200 <= _response.status_code < 300:
+                    async for _text in _response.aiter_lines():
+                        try:
+                            if len(_text) == 0:
+                                continue
+                            yield typing.cast(
+                                TextToSpeechStreamWithTimestampsResponse,
+                                construct_type(
+                                    type_=TextToSpeechStreamWithTimestampsResponse,  # type: ignore
+                                    object_=json.loads(_text),
+                                ),
+                            )
+                        except:
+                            pass
+                    return
+                await _response.aread()
+                if _response.status_code == 422:
+                    raise UnprocessableEntityError(
+                        typing.cast(
+                            HttpValidationError,
+                            construct_type(
+                                type_=HttpValidationError,  # type: ignore
+                                object_=_response.json(),
+                            ),
+                        )
                     )
-                )
-            _response_json = _response.json()
-        except JSONDecodeError:
-            raise ApiError(status_code=_response.status_code, body=_response.text)
-        raise ApiError(status_code=_response.status_code, body=_response_json)
+                _response_json = _response.json()
+            except JSONDecodeError:
+                raise ApiError(status_code=_response.status_code, body=_response.text)
+            raise ApiError(status_code=_response.status_code, body=_response_json)
diff --git a/src/elevenlabs/text_to_speech/types/__init__.py b/src/elevenlabs/text_to_speech/types/__init__.py
@@ -12,10 +12,18 @@
 from .body_text_to_speech_with_timestamps_v_1_text_to_speech_voice_id_with_timestamps_post_apply_text_normalization import (
     BodyTextToSpeechWithTimestampsV1TextToSpeechVoiceIdWithTimestampsPostApplyTextNormalization,
 )
+from .text_to_speech_stream_with_timestamps_response import TextToSpeechStreamWithTimestampsResponse
+from .text_to_speech_stream_with_timestamps_response_alignment import TextToSpeechStreamWithTimestampsResponseAlignment
+from .text_to_speech_stream_with_timestamps_response_normalized_alignment import (
+    TextToSpeechStreamWithTimestampsResponseNormalizedAlignment,
+)
 
 __all__ = [
     "BodyTextToSpeechStreamingV1TextToSpeechVoiceIdStreamPostApplyTextNormalization",
     "BodyTextToSpeechStreamingWithTimestampsV1TextToSpeechVoiceIdStreamWithTimestampsPostApplyTextNormalization",
     "BodyTextToSpeechV1TextToSpeechVoiceIdPostApplyTextNormalization",
     "BodyTextToSpeechWithTimestampsV1TextToSpeechVoiceIdWithTimestampsPostApplyTextNormalization",
+    "TextToSpeechStreamWithTimestampsResponse",
+    "TextToSpeechStreamWithTimestampsResponseAlignment",
+    "TextToSpeechStreamWithTimestampsResponseNormalizedAlignment",
 ]
diff --git a/src/elevenlabs/text_to_speech/types/text_to_speech_stream_with_timestamps_response.py b/src/elevenlabs/text_to_speech/types/text_to_speech_stream_with_timestamps_response.py
@@ -0,0 +1,33 @@
+# This file was auto-generated by Fern from our API Definition.
+
+from ...core.unchecked_base_model import UncheckedBaseModel
+import typing_extensions
+import typing
+from ...core.serialization import FieldMetadata
+import pydantic
+from .text_to_speech_stream_with_timestamps_response_alignment import TextToSpeechStreamWithTimestampsResponseAlignment
+from .text_to_speech_stream_with_timestamps_response_normalized_alignment import (
+    TextToSpeechStreamWithTimestampsResponseNormalizedAlignment,
+)
+from ...core.pydantic_utilities import IS_PYDANTIC_V2
+
+
+class TextToSpeechStreamWithTimestampsResponse(UncheckedBaseModel):
+    audio_base_64: typing_extensions.Annotated[typing.Optional[str], FieldMetadata(alias="audio_base64")] = (
+        pydantic.Field(default=None)
+    )
+    """
+    Base64 encoded audio chunk
+    """
+
+    alignment: typing.Optional[TextToSpeechStreamWithTimestampsResponseAlignment] = None
+    normalized_alignment: typing.Optional[TextToSpeechStreamWithTimestampsResponseNormalizedAlignment] = None
+
+    if IS_PYDANTIC_V2:
+        model_config: typing.ClassVar[pydantic.ConfigDict] = pydantic.ConfigDict(extra="allow", frozen=True)  # type: ignore # Pydantic v2
+    else:
+
+        class Config:
+            frozen = True
+            smart_union = True
+            extra = pydantic.Extra.allow
diff --git a/src/elevenlabs/text_to_speech/types/text_to_speech_stream_with_timestamps_response_alignment.py b/src/elevenlabs/text_to_speech/types/text_to_speech_stream_with_timestamps_response_alignment.py
diff --git a/src/elevenlabs/text_to_speech/types/text_to_speech_stream_with_timestamps_response_normalized_alignment.py b/src/elevenlabs/text_to_speech/types/text_to_speech_stream_with_timestamps_response_normalized_alignment.py

Original file line number	Diff line number	Diff line change
`@@ -1176,10 +1176,12 @@ from elevenlabs import ElevenLabs`
`1176`	`1176`	`client = ElevenLabs(`
`1177`	`1177`	`api_key="YOUR_API_KEY",`
`1178`	`1178`	`)`
`1179`		`-client.text_to_speech.stream_with_timestamps(`
	`1179`	`+response = client.text_to_speech.stream_with_timestamps(`
`1180`	`1180`	`voice_id="21m00Tcm4TlvDq8ikWAM",`
`1181`	`1181`	`text="text",`
`1182`	`1182`	`)`
	`1183`	`+for chunk in response:`
	`1184`	`+ yield chunk`
`1183`	`1185`
`1184`	`1186`	```
`1185`	`1187`	`</dd>`
Original file line number	Diff line number	Diff line change
`@@ -16,7 +16,7 @@ def get_headers(self) -> typing.Dict[str, str]:`
`16`	`16`	`headers: typing.Dict[str, str] = {`
`17`	`17`	`"X-Fern-Language": "Python",`
`18`	`18`	`"X-Fern-SDK-Name": "elevenlabs",`
`19`		`- "X-Fern-SDK-Version": "1.13.4",`
	`19`	`+ "X-Fern-SDK-Version": "1.13.5",`
`20`	`20`	`}`
`21`	`21`	`if self._api_key is not None:`
`22`	`22`	`headers["xi-api-key"] = self._api_key`