feat(api): Add speech endpoint (#219)

stainless-app[bot] · stainless-app[bot] · commit f15080196853 · 2025-03-18T23:33:46.000Z
diff --git a/.stats.yml b/.stats.yml
@@ -1,2 +1,2 @@
-configured_endpoints: 15
+configured_endpoints: 16
 openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/groqcloud%2Fgroqcloud-055e57d5b3cad069182bb870f76dd7936e69fc88c9a1e51ad198400e38c1d076.yml
diff --git a/api.md b/api.md
@@ -60,6 +60,12 @@ Methods:
 
 # Audio
 
+## Speech
+
+Methods:
+
+- <code title="post /openai/v1/audio/speech">client.audio.speech.<a href="./src/groq/resources/audio/speech.py">create</a>(\*\*<a href="src/groq/types/audio/speech_create_params.py">params</a>) -> BinaryAPIResponse</code>
+
 ## Transcriptions
 
 Types:
diff --git a/src/groq/resources/audio/__init__.py b/src/groq/resources/audio/__init__.py
@@ -8,6 +8,14 @@
     AudioWithStreamingResponse,
     AsyncAudioWithStreamingResponse,
 )
+from .speech import (
+    Speech,
+    AsyncSpeech,
+    SpeechWithRawResponse,
+    AsyncSpeechWithRawResponse,
+    SpeechWithStreamingResponse,
+    AsyncSpeechWithStreamingResponse,
+)
 from .translations import (
     Translations,
     AsyncTranslations,
@@ -26,6 +34,12 @@
 )
 
 __all__ = [
+    "Speech",
+    "AsyncSpeech",
+    "SpeechWithRawResponse",
+    "AsyncSpeechWithRawResponse",
+    "SpeechWithStreamingResponse",
+    "AsyncSpeechWithStreamingResponse",
     "Transcriptions",
     "AsyncTranscriptions",
     "TranscriptionsWithRawResponse",
diff --git a/src/groq/resources/audio/audio.py b/src/groq/resources/audio/audio.py
@@ -2,6 +2,14 @@
 
 from __future__ import annotations
 
+from .speech import (
+    Speech,
+    AsyncSpeech,
+    SpeechWithRawResponse,
+    AsyncSpeechWithRawResponse,
+    SpeechWithStreamingResponse,
+    AsyncSpeechWithStreamingResponse,
+)
 from ..._compat import cached_property
 from ..._resource import SyncAPIResource, AsyncAPIResource
 from .translations import (
@@ -25,6 +33,10 @@
 
 
 class Audio(SyncAPIResource):
+    @cached_property
+    def speech(self) -> Speech:
+        return Speech(self._client)
+
     @cached_property
     def transcriptions(self) -> Transcriptions:
         return Transcriptions(self._client)
@@ -54,6 +66,10 @@ def with_streaming_response(self) -> AudioWithStreamingResponse:
 
 
 class AsyncAudio(AsyncAPIResource):
+    @cached_property
+    def speech(self) -> AsyncSpeech:
+        return AsyncSpeech(self._client)
+
     @cached_property
     def transcriptions(self) -> AsyncTranscriptions:
         return AsyncTranscriptions(self._client)
@@ -86,6 +102,10 @@ class AudioWithRawResponse:
     def __init__(self, audio: Audio) -> None:
         self._audio = audio
 
+    @cached_property
+    def speech(self) -> SpeechWithRawResponse:
+        return SpeechWithRawResponse(self._audio.speech)
+
     @cached_property
     def transcriptions(self) -> TranscriptionsWithRawResponse:
         return TranscriptionsWithRawResponse(self._audio.transcriptions)
@@ -99,6 +119,10 @@ class AsyncAudioWithRawResponse:
     def __init__(self, audio: AsyncAudio) -> None:
         self._audio = audio
 
+    @cached_property
+    def speech(self) -> AsyncSpeechWithRawResponse:
+        return AsyncSpeechWithRawResponse(self._audio.speech)
+
     @cached_property
     def transcriptions(self) -> AsyncTranscriptionsWithRawResponse:
         return AsyncTranscriptionsWithRawResponse(self._audio.transcriptions)
@@ -112,6 +136,10 @@ class AudioWithStreamingResponse:
     def __init__(self, audio: Audio) -> None:
         self._audio = audio
 
+    @cached_property
+    def speech(self) -> SpeechWithStreamingResponse:
+        return SpeechWithStreamingResponse(self._audio.speech)
+
     @cached_property
     def transcriptions(self) -> TranscriptionsWithStreamingResponse:
         return TranscriptionsWithStreamingResponse(self._audio.transcriptions)
@@ -125,6 +153,10 @@ class AsyncAudioWithStreamingResponse:
     def __init__(self, audio: AsyncAudio) -> None:
         self._audio = audio
 
+    @cached_property
+    def speech(self) -> AsyncSpeechWithStreamingResponse:
+        return AsyncSpeechWithStreamingResponse(self._audio.speech)
+
     @cached_property
     def transcriptions(self) -> AsyncTranscriptionsWithStreamingResponse:
         return AsyncTranscriptionsWithStreamingResponse(self._audio.transcriptions)
diff --git a/src/groq/resources/audio/speech.py b/src/groq/resources/audio/speech.py
@@ -0,0 +1,227 @@
+# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+
+from __future__ import annotations
+
+from typing_extensions import Literal
+
+import httpx
+
+from ..._types import NOT_GIVEN, Body, Query, Headers, NotGiven
+from ..._utils import (
+    maybe_transform,
+    async_maybe_transform,
+)
+from ..._compat import cached_property
+from ..._resource import SyncAPIResource, AsyncAPIResource
+from ..._response import (
+    BinaryAPIResponse,
+    AsyncBinaryAPIResponse,
+    StreamedBinaryAPIResponse,
+    AsyncStreamedBinaryAPIResponse,
+    to_custom_raw_response_wrapper,
+    to_custom_streamed_response_wrapper,
+    async_to_custom_raw_response_wrapper,
+    async_to_custom_streamed_response_wrapper,
+)
+from ...types.audio import speech_create_params
+from ..._base_client import make_request_options
+
+__all__ = ["Speech", "AsyncSpeech"]
+
+
+class Speech(SyncAPIResource):
+    @cached_property
+    def with_raw_response(self) -> SpeechWithRawResponse:
+        """
+        This property can be used as a prefix for any HTTP method call to return
+        the raw response object instead of the parsed content.
+
+        For more information, see https://www.github.com/groq/groq-python#accessing-raw-response-data-eg-headers
+        """
+        return SpeechWithRawResponse(self)
+
+    @cached_property
+    def with_streaming_response(self) -> SpeechWithStreamingResponse:
+        """
+        An alternative to `.with_raw_response` that doesn't eagerly read the response body.
+
+        For more information, see https://www.github.com/groq/groq-python#with_streaming_response
+        """
+        return SpeechWithStreamingResponse(self)
+
+    def create(
+        self,
+        *,
+        input: str,
+        model: str,
+        voice: str,
+        response_format: Literal["mp3", "opus", "aac", "flac", "wav", "pcm"] | NotGiven = NOT_GIVEN,
+        speed: float | NotGiven = NOT_GIVEN,
+        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
+        # The extra values given here take precedence over values defined on the client or passed to this method.
+        extra_headers: Headers | None = None,
+        extra_query: Query | None = None,
+        extra_body: Body | None = None,
+        timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
+    ) -> BinaryAPIResponse:
+        """
+        Generates audio from the input text.
+
+        Args:
+          input: The text to generate audio for.
+
+          model: One of the available TTS models
+
+          voice: The voice to use when generating the audio.
+
+          response_format: The format to generate the audio in. Supported formats are `mp3`, `opus`, `aac`, `flac`,
+              `wav`, and `pcm`.
+
+          speed: The speed of the generated audio. Select a value from `0.25` to `4.0`. `1.0` is
+              the default.
+
+          extra_headers: Send extra headers
+
+          extra_query: Add additional query parameters to the request
+
+          extra_body: Add additional JSON properties to the request
+
+          timeout: Override the client-level default timeout for this request, in seconds
+        """
+        extra_headers = {"Accept": "application/octet-stream", **(extra_headers or {})}
+        return self._post(
+            "/openai/v1/audio/speech",
+            body=maybe_transform(
+                {
+                    "input": input,
+                    "model": model,
+                    "voice": voice,
+                    "response_format": response_format,
+                    "speed": speed,
+                },
+                speech_create_params.SpeechCreateParams,
+            ),
+            options=make_request_options(
+                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
+            ),
+            cast_to=BinaryAPIResponse,
+        )
+
+
+class AsyncSpeech(AsyncAPIResource):
+    @cached_property
+    def with_raw_response(self) -> AsyncSpeechWithRawResponse:
+        """
+        This property can be used as a prefix for any HTTP method call to return
+        the raw response object instead of the parsed content.
+
+        For more information, see https://www.github.com/groq/groq-python#accessing-raw-response-data-eg-headers
+        """
+        return AsyncSpeechWithRawResponse(self)
+
+    @cached_property
+    def with_streaming_response(self) -> AsyncSpeechWithStreamingResponse:
+        """
+        An alternative to `.with_raw_response` that doesn't eagerly read the response body.
+
+        For more information, see https://www.github.com/groq/groq-python#with_streaming_response
+        """
+        return AsyncSpeechWithStreamingResponse(self)
+
+    async def create(
+        self,
+        *,
+        input: str,
+        model: str,
+        voice: str,
+        response_format: Literal["mp3", "opus", "aac", "flac", "wav", "pcm"] | NotGiven = NOT_GIVEN,
+        speed: float | NotGiven = NOT_GIVEN,
+        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
+        # The extra values given here take precedence over values defined on the client or passed to this method.
+        extra_headers: Headers | None = None,
+        extra_query: Query | None = None,
+        extra_body: Body | None = None,
+        timeout: float | httpx.Timeout | None | NotGiven = NOT_GIVEN,
+    ) -> AsyncBinaryAPIResponse:
+        """
+        Generates audio from the input text.
+
+        Args:
+          input: The text to generate audio for.
+
+          model: One of the available TTS models
+
+          voice: The voice to use when generating the audio.
+
+          response_format: The format to generate the audio in. Supported formats are `mp3`, `opus`, `aac`, `flac`,
+              `wav`, and `pcm`.
+
+          speed: The speed of the generated audio. Select a value from `0.25` to `4.0`. `1.0` is
+              the default.
+
+          extra_headers: Send extra headers
+
+          extra_query: Add additional query parameters to the request
+
+          extra_body: Add additional JSON properties to the request
+
+          timeout: Override the client-level default timeout for this request, in seconds
+        """
+        extra_headers = {"Accept": "application/octet-stream", **(extra_headers or {})}
+        return await self._post(
+            "/openai/v1/audio/speech",
+            body=await async_maybe_transform(
+                {
+                    "input": input,
+                    "model": model,
+                    "voice": voice,
+                    "response_format": response_format,
+                    "speed": speed,
+                },
+                speech_create_params.SpeechCreateParams,
+            ),
+            options=make_request_options(
+                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
+            ),
+            cast_to=AsyncBinaryAPIResponse,
+        )
+
+
+class SpeechWithRawResponse:
+    def __init__(self, speech: Speech) -> None:
+        self._speech = speech
+
+        self.create = to_custom_raw_response_wrapper(
+            speech.create,
+            BinaryAPIResponse,
+        )
+
+
+class AsyncSpeechWithRawResponse:
+    def __init__(self, speech: AsyncSpeech) -> None:
+        self._speech = speech
+
+        self.create = async_to_custom_raw_response_wrapper(
+            speech.create,
+            AsyncBinaryAPIResponse,
+        )
+
+
+class SpeechWithStreamingResponse:
+    def __init__(self, speech: Speech) -> None:
+        self._speech = speech
+
+        self.create = to_custom_streamed_response_wrapper(
+            speech.create,
+            StreamedBinaryAPIResponse,
+        )
+
+
+class AsyncSpeechWithStreamingResponse:
+    def __init__(self, speech: AsyncSpeech) -> None:
+        self._speech = speech
+
+        self.create = async_to_custom_streamed_response_wrapper(
+            speech.create,
+            AsyncStreamedBinaryAPIResponse,
+        )
diff --git a/src/groq/types/audio/__init__.py b/src/groq/types/audio/__init__.py
@@ -4,5 +4,6 @@
 
 from .translation import Translation as Translation
 from .transcription import Transcription as Transcription
+from .speech_create_params import SpeechCreateParams as SpeechCreateParams
 from .translation_create_params import TranslationCreateParams as TranslationCreateParams
 from .transcription_create_params import TranscriptionCreateParams as TranscriptionCreateParams
diff --git a/src/groq/types/audio/speech_create_params.py b/src/groq/types/audio/speech_create_params.py
@@ -0,0 +1,30 @@
+# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+
+from __future__ import annotations
+
+from typing_extensions import Literal, Required, TypedDict
+
+__all__ = ["SpeechCreateParams"]
+
+
+class SpeechCreateParams(TypedDict, total=False):
+    input: Required[str]
+    """The text to generate audio for."""
+
+    model: Required[str]
+    """One of the available TTS models"""
+
+    voice: Required[str]
+    """The voice to use when generating the audio."""
+
+    response_format: Literal["mp3", "opus", "aac", "flac", "wav", "pcm"]
+    """The format to generate the audio in.
+
+    Supported formats are `mp3`, `opus`, `aac`, `flac`, `wav`, and `pcm`.
+    """
+
+    speed: float
+    """The speed of the generated audio.
+
+    Select a value from `0.25` to `4.0`. `1.0` is the default.
+    """
diff --git a/tests/api_resources/audio/test_speech.py b/tests/api_resources/audio/test_speech.py

Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`		`-configured_endpoints: 15`
	`1`	`+configured_endpoints: 16`
`2`	`2`	`openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/groqcloud%2Fgroqcloud-055e57d5b3cad069182bb870f76dd7936e69fc88c9a1e51ad198400e38c1d076.yml`
-Original file line number
+Diff line change
 +# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
++
 +from __future__ import annotations
++
 +import os
 +from typing import Any, cast
++
 +import httpx
 +import pytest
 +from respx import MockRouter
++
 +from groq import Groq, AsyncGroq
 +from groq._response import (
 +    BinaryAPIResponse,
 +    AsyncBinaryAPIResponse,
 +    StreamedBinaryAPIResponse,
 +    AsyncStreamedBinaryAPIResponse,
 +)
++
 +base_url = os.environ.get("TEST_API_BASE_URL", "http://127.0.0.1:4010")
++
++
 +class TestSpeech:
 +    parametrize = pytest.mark.parametrize("client", [False, True], indirect=True, ids=["loose", "strict"])
++
 +    @parametrize
 +    @pytest.mark.respx(base_url=base_url)
 +    def test_method_create(self, client: Groq, respx_mock: MockRouter) -> None:
 +        respx_mock.post("/openai/v1/audio/speech").mock(return_value=httpx.Response(200, json={"foo": "bar"}))
 +        speech = client.audio.speech.create(
 +            input="input",
 +            model="model",
 +            voice="voice",
 +        )
 +        assert speech.is_closed
 +        assert speech.json() == {"foo": "bar"}
 +        assert cast(Any, speech.is_closed) is True
 +        assert isinstance(speech, BinaryAPIResponse)
++
 +    @parametrize
 +    @pytest.mark.respx(base_url=base_url)
 +    def test_method_create_with_all_params(self, client: Groq, respx_mock: MockRouter) -> None:
 +        respx_mock.post("/openai/v1/audio/speech").mock(return_value=httpx.Response(200, json={"foo": "bar"}))
 +        speech = client.audio.speech.create(
 +            input="input",
 +            model="model",
 +            voice="voice",
 +            response_format="mp3",
 +            speed=0.25,
 +        )
 +        assert speech.is_closed
 +        assert speech.json() == {"foo": "bar"}
 +        assert cast(Any, speech.is_closed) is True
 +        assert isinstance(speech, BinaryAPIResponse)
++
 +    @parametrize
 +    @pytest.mark.respx(base_url=base_url)
 +    def test_raw_response_create(self, client: Groq, respx_mock: MockRouter) -> None:
 +        respx_mock.post("/openai/v1/audio/speech").mock(return_value=httpx.Response(200, json={"foo": "bar"}))
++
 +        speech = client.audio.speech.with_raw_response.create(
 +            input="input",
 +            model="model",
 +            voice="voice",
 +        )
++
 +        assert speech.is_closed is True
 +        assert speech.http_request.headers.get("X-Stainless-Lang") == "python"
 +        assert speech.json() == {"foo": "bar"}
 +        assert isinstance(speech, BinaryAPIResponse)
++
 +    @parametrize
 +    @pytest.mark.respx(base_url=base_url)
 +    def test_streaming_response_create(self, client: Groq, respx_mock: MockRouter) -> None:
 +        respx_mock.post("/openai/v1/audio/speech").mock(return_value=httpx.Response(200, json={"foo": "bar"}))
 +        with client.audio.speech.with_streaming_response.create(
 +            input="input",
 +            model="model",
 +            voice="voice",
 +        ) as speech:
 +            assert not speech.is_closed
 +            assert speech.http_request.headers.get("X-Stainless-Lang") == "python"
++
 +            assert speech.json() == {"foo": "bar"}
 +            assert cast(Any, speech.is_closed) is True
 +            assert isinstance(speech, StreamedBinaryAPIResponse)
++
 +        assert cast(Any, speech.is_closed) is True
++
++
 +class TestAsyncSpeech:
 +    parametrize = pytest.mark.parametrize("async_client", [False, True], indirect=True, ids=["loose", "strict"])
++
 +    @parametrize
 +    @pytest.mark.respx(base_url=base_url)
 +    async def test_method_create(self, async_client: AsyncGroq, respx_mock: MockRouter) -> None:
 +        respx_mock.post("/openai/v1/audio/speech").mock(return_value=httpx.Response(200, json={"foo": "bar"}))
 +        speech = await async_client.audio.speech.create(
 +            input="input",
 +            model="model",
 +            voice="voice",
 +        )
 +        assert speech.is_closed
 +        assert await speech.json() == {"foo": "bar"}
 +        assert cast(Any, speech.is_closed) is True
 +        assert isinstance(speech, AsyncBinaryAPIResponse)
++
 +    @parametrize
 +    @pytest.mark.respx(base_url=base_url)
 +    async def test_method_create_with_all_params(self, async_client: AsyncGroq, respx_mock: MockRouter) -> None:
 +        respx_mock.post("/openai/v1/audio/speech").mock(return_value=httpx.Response(200, json={"foo": "bar"}))
 +        speech = await async_client.audio.speech.create(
 +            input="input",
 +            model="model",
 +            voice="voice",
 +            response_format="mp3",
 +            speed=0.25,
 +        )
 +        assert speech.is_closed
 +        assert await speech.json() == {"foo": "bar"}
 +        assert cast(Any, speech.is_closed) is True
 +        assert isinstance(speech, AsyncBinaryAPIResponse)
++
 +    @parametrize
 +    @pytest.mark.respx(base_url=base_url)
 +    async def test_raw_response_create(self, async_client: AsyncGroq, respx_mock: MockRouter) -> None:
 +        respx_mock.post("/openai/v1/audio/speech").mock(return_value=httpx.Response(200, json={"foo": "bar"}))
++
 +        speech = await async_client.audio.speech.with_raw_response.create(
 +            input="input",
 +            model="model",
 +            voice="voice",
 +        )
++
 +        assert speech.is_closed is True
 +        assert speech.http_request.headers.get("X-Stainless-Lang") == "python"
 +        assert await speech.json() == {"foo": "bar"}
 +        assert isinstance(speech, AsyncBinaryAPIResponse)
++
 +    @parametrize
 +    @pytest.mark.respx(base_url=base_url)
 +    async def test_streaming_response_create(self, async_client: AsyncGroq, respx_mock: MockRouter) -> None:
 +        respx_mock.post("/openai/v1/audio/speech").mock(return_value=httpx.Response(200, json={"foo": "bar"}))
 +        async with async_client.audio.speech.with_streaming_response.create(
 +            input="input",
 +            model="model",
 +            voice="voice",
 +        ) as speech:
 +            assert not speech.is_closed
 +            assert speech.http_request.headers.get("X-Stainless-Lang") == "python"
++
 +            assert await speech.json() == {"foo": "bar"}
 +            assert cast(Any, speech.is_closed) is True
 +            assert isinstance(speech, AsyncStreamedBinaryAPIResponse)
++
 +        assert cast(Any, speech.is_closed) is True