Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 3 additions & 3 deletions .fern/metadata.json
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
{
"cliVersion": "4.62.5",
"cliVersion": "4.65.2",
"generatorName": "fernapi/fern-python-sdk",
"generatorVersion": "4.61.0",
"generatorConfig": {
Expand Down Expand Up @@ -64,6 +64,6 @@
}
]
},
"originGitCommit": "a07a0deaa640e8b286f9c8e4e47426b37a083a67",
"sdkVersion": "0.13.11"
"originGitCommit": "274a9e627c776728cbf8da2fc71627448d122f99",
"sdkVersion": "0.13.12"
}
365 changes: 182 additions & 183 deletions poetry.lock

Large diffs are not rendered by default.

2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@ dynamic = ["version"]

[tool.poetry]
name = "hume"
version = "0.13.11"
version = "0.13.12"
description = "A Python SDK for Hume AI"
readme = "README.md"
authors = []
Expand Down
4 changes: 2 additions & 2 deletions src/hume/core/client_wrapper.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,12 +28,12 @@ def get_headers(self) -> typing.Dict[str, str]:
import platform

headers: typing.Dict[str, str] = {
"User-Agent": "hume/0.13.11",
"User-Agent": "hume/0.13.12",
"X-Fern-Language": "Python",
"X-Fern-Runtime": f"python/{platform.python_version()}",
"X-Fern-Platform": f"{platform.system().lower()}/{platform.release()}",
"X-Fern-SDK-Name": "hume",
"X-Fern-SDK-Version": "0.13.11",
"X-Fern-SDK-Version": "0.13.12",
**(self.get_custom_headers() or {}),
}
if self.api_key is not None:
Expand Down
4 changes: 2 additions & 2 deletions src/hume/empathic_voice/tools/client.py
Original file line number Diff line number Diff line change
Expand Up @@ -447,7 +447,7 @@ def delete_tool_version(
api_key="YOUR_API_KEY",
)
client.empathic_voice.tools.delete_tool_version(
id="",
id="your-tool-id",
version=1,
)
"""
Expand Down Expand Up @@ -1008,7 +1008,7 @@ async def delete_tool_version(

async def main() -> None:
await client.empathic_voice.tools.delete_tool_version(
id="",
id="your-tool-id",
version=1,
)

Expand Down
128 changes: 128 additions & 0 deletions src/hume/tts/raw_client.py

Large diffs are not rendered by default.

24 changes: 24 additions & 0 deletions src/hume/tts/stream_input/client.py
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,7 @@ def connect(
instant_mode: typing.Optional[bool] = None,
no_binary: typing.Optional[bool] = None,
strip_headers: typing.Optional[bool] = None,
temperature: typing.Optional[float] = None,
version: typing.Optional[OctaveVersion] = None,
api_key: typing.Optional[str] = None,
request_options: typing.Optional[RequestOptions] = None,
Expand Down Expand Up @@ -84,6 +85,16 @@ def connect(
strip_headers : typing.Optional[bool]
If enabled, the audio for all the chunks of a generation, once concatenated together, will constitute a single audio file. Otherwise, if disabled, each chunk's audio will be its own audio file, each with its own headers (if applicable).

temperature : typing.Optional[float]
Sampling temperature for the speech generation model. Higher values increase variation; lower values increase consistency.

**This is an experimental parameter.** For most use cases, leave it unset so that the default value listed below applies.

Defaults when omitted:
- Octave 1 voice creation (no voice specified): `0.9`
- Octave 1 text-to-speech: `0.8`
- Octave 2 text-to-speech: `0.75`

version : typing.Optional[OctaveVersion]
The version of the Octave Model to use. 1 for the legacy model, 2 for the new model.

Expand Down Expand Up @@ -111,6 +122,7 @@ def connect(
"instant_mode": instant_mode,
"no_binary": no_binary,
"strip_headers": strip_headers,
"temperature": temperature,
"version": version,
"api_key": api_key,
**(
Expand Down Expand Up @@ -171,6 +183,7 @@ async def connect(
instant_mode: typing.Optional[bool] = None,
no_binary: typing.Optional[bool] = None,
strip_headers: typing.Optional[bool] = None,
temperature: typing.Optional[float] = None,
version: typing.Optional[OctaveVersion] = None,
api_key: typing.Optional[str] = None,
request_options: typing.Optional[RequestOptions] = None,
Expand Down Expand Up @@ -205,6 +218,16 @@ async def connect(
strip_headers : typing.Optional[bool]
If enabled, the audio for all the chunks of a generation, once concatenated together, will constitute a single audio file. Otherwise, if disabled, each chunk's audio will be its own audio file, each with its own headers (if applicable).

temperature : typing.Optional[float]
Sampling temperature for the speech generation model. Higher values increase variation; lower values increase consistency.

**This is an experimental parameter.** For most use cases, leave it unset so that the default value listed below applies.

Defaults when omitted:
- Octave 1 voice creation (no voice specified): `0.9`
- Octave 1 text-to-speech: `0.8`
- Octave 2 text-to-speech: `0.75`

version : typing.Optional[OctaveVersion]
The version of the Octave Model to use. 1 for the legacy model, 2 for the new model.

Expand Down Expand Up @@ -232,6 +255,7 @@ async def connect(
"instant_mode": instant_mode,
"no_binary": no_binary,
"strip_headers": strip_headers,
"temperature": temperature,
"version": version,
"api_key": api_key,
**(
Expand Down
24 changes: 24 additions & 0 deletions src/hume/tts/stream_input/raw_client.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,7 @@ def connect(
instant_mode: typing.Optional[bool] = None,
no_binary: typing.Optional[bool] = None,
strip_headers: typing.Optional[bool] = None,
temperature: typing.Optional[float] = None,
version: typing.Optional[OctaveVersion] = None,
api_key: typing.Optional[str] = None,
request_options: typing.Optional[RequestOptions] = None,
Expand Down Expand Up @@ -72,6 +73,16 @@ def connect(
strip_headers : typing.Optional[bool]
If enabled, the audio for all the chunks of a generation, once concatenated together, will constitute a single audio file. Otherwise, if disabled, each chunk's audio will be its own audio file, each with its own headers (if applicable).

temperature : typing.Optional[float]
Sampling temperature for the speech generation model. Higher values increase variation; lower values increase consistency.

**This is an experimental parameter.** For most use cases, leave it unset so that the default value listed below applies.

Defaults when omitted:
- Octave 1 voice creation (no voice specified): `0.9`
- Octave 1 text-to-speech: `0.8`
- Octave 2 text-to-speech: `0.75`

version : typing.Optional[OctaveVersion]
The version of the Octave Model to use. 1 for the legacy model, 2 for the new model.

Expand Down Expand Up @@ -99,6 +110,7 @@ def connect(
"instant_mode": instant_mode,
"no_binary": no_binary,
"strip_headers": strip_headers,
"temperature": temperature,
"version": version,
"api_key": api_key,
**(
Expand Down Expand Up @@ -148,6 +160,7 @@ async def connect(
instant_mode: typing.Optional[bool] = None,
no_binary: typing.Optional[bool] = None,
strip_headers: typing.Optional[bool] = None,
temperature: typing.Optional[float] = None,
version: typing.Optional[OctaveVersion] = None,
api_key: typing.Optional[str] = None,
request_options: typing.Optional[RequestOptions] = None,
Expand Down Expand Up @@ -182,6 +195,16 @@ async def connect(
strip_headers : typing.Optional[bool]
If enabled, the audio for all the chunks of a generation, once concatenated together, will constitute a single audio file. Otherwise, if disabled, each chunk's audio will be its own audio file, each with its own headers (if applicable).

temperature : typing.Optional[float]
Sampling temperature for the speech generation model. Higher values increase variation; lower values increase consistency.

**This is an experimental parameter.** For most use cases, leave it unset so that the default value listed below applies.

Defaults when omitted:
- Octave 1 voice creation (no voice specified): `0.9`
- Octave 1 text-to-speech: `0.8`
- Octave 2 text-to-speech: `0.75`

version : typing.Optional[OctaveVersion]
The version of the Octave Model to use. 1 for the legacy model, 2 for the new model.

Expand Down Expand Up @@ -209,6 +232,7 @@ async def connect(
"instant_mode": instant_mode,
"no_binary": no_binary,
"strip_headers": strip_headers,
"temperature": temperature,
"version": version,
"api_key": api_key,
**(
Expand Down
20 changes: 19 additions & 1 deletion src/hume/tts/types/posted_tts.py
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,18 @@ class PostedTts(UniversalBaseModel):
If enabled, the audio for all the chunks of a generation, once concatenated together, will constitute a single audio file. Otherwise, if disabled, each chunk's audio will be its own audio file, each with its own headers (if applicable).
"""

temperature: typing.Optional[float] = pydantic.Field(default=None)
"""
Sampling temperature for the speech generation model. Higher values increase variation; lower values increase consistency.

**This is an experimental parameter.** For most use cases, leave it unset so that the default value listed below applies.

Defaults when omitted:
- Octave 1 voice creation (no voice specified): `0.9`
- Octave 1 text-to-speech: `0.8`
- Octave 2 text-to-speech: `0.75`
"""

utterances: typing.List[PostedUtterance] = pydantic.Field()
"""
A list of **Utterances** to be converted to speech output.
Expand All @@ -66,7 +78,13 @@ class PostedTts(UniversalBaseModel):
For a comparison of Octave versions, see the [Octave versions](/docs/text-to-speech-tts/overview#octave-versions) section in the TTS overview.
"""

instant_mode: typing.Optional[bool] = None
instant_mode: typing.Optional[bool] = pydantic.Field(default=None)
"""
Enables ultra-low latency streaming, significantly reducing the time until the first audio chunk is received. Recommended for real-time applications requiring immediate audio playback. For further details, see our documentation on [instant mode](/docs/text-to-speech-tts/overview#ultra-low-latency-streaming-instant-mode).
- A [voice](/reference/text-to-speech-tts/synthesize-json-streaming#request.body.utterances.voice) must be specified when instant mode is enabled. Dynamic voice generation is not supported with this mode.
- Instant mode is only supported for streaming endpoints (e.g., [/v0/tts/stream/json](/reference/text-to-speech-tts/synthesize-json-streaming), [/v0/tts/stream/file](/reference/text-to-speech-tts/synthesize-file-streaming)).
- Ensure only a single generation is requested ([num_generations](/reference/text-to-speech-tts/synthesize-json-streaming#request.body.num_generations) must be `1` or omitted).
"""

if IS_PYDANTIC_V2:
model_config: typing.ClassVar[pydantic.ConfigDict] = pydantic.ConfigDict(extra="allow", frozen=True) # type: ignore # Pydantic v2
Expand Down
2 changes: 1 addition & 1 deletion wiremock/wiremock-mappings.json

Large diffs are not rendered by default.

Loading