No more 30-second time limit on Kokoro; generation can now run for several minutes.
Browse files
app.py
CHANGED
@@ -583,18 +583,18 @@ def Generate_Speech( # <-- MCP tool #4 (Generate Speech)
|
|
583 |
Japanese, Portuguese, and Chinese speakers.
|
584 |
|
585 |
Enhanced for longer audio generation:
|
|
|
586 |
- Can generate audio of any length based on input text
|
587 |
- Concatenates multiple segments for seamless longer audio
|
588 |
|
589 |
Default behavior:
|
590 |
-
- Speed defaults to 1.25 (slightly brisk cadence).
|
591 |
-
- Voice defaults to "af_heart"
|
592 |
|
593 |
Args:
|
594 |
text: The text to synthesize. Works best with English but supports multiple languages.
|
595 |
speed: Speech speed multiplier in 0.5–2.0; 1.0 = normal speed. Default: 1.25 (slightly brisk).
|
596 |
-
voice: Voice identifier from 54 available options. Use List_Kokoro_Voices() to see all choices.
|
597 |
-
Examples: 'af_heart' (US female), 'am_adam' (US male), 'bf_bella' (British female),
|
598 |
|
599 |
Returns:
|
600 |
A tuple of (sample_rate_hz, audio_waveform) where:
|
@@ -605,6 +605,7 @@ def Generate_Speech( # <-- MCP tool #4 (Generate Speech)
|
|
605 |
- Requires the 'kokoro' package (>=0.9.4). If unavailable, an error is raised.
|
606 |
- Runs on CUDA if available; otherwise CPU.
|
607 |
- Supports 54 voices across 9 language/accent categories.
|
|
|
608 |
- Use List_Kokoro_Voices() MCP tool to discover all available voice options.
|
609 |
"""
|
610 |
if not text or not text.strip():
|
|
|
583 |
Japanese, Portuguese, and Chinese speakers.
|
584 |
|
585 |
Enhanced for longer audio generation:
|
586 |
+
- Processes ALL text segments (not just the first one)
|
587 |
- Can generate audio of any length based on input text
|
588 |
- Concatenates multiple segments for seamless longer audio
|
589 |
|
590 |
Default behavior:
|
591 |
+
- Speed defaults to 1.25 (slightly brisk cadence) for clearer, snappier delivery.
|
592 |
+
- Voice defaults to "af_heart" (American Female, Heart voice)
|
593 |
|
594 |
Args:
|
595 |
text: The text to synthesize. Works best with English but supports multiple languages.
|
596 |
speed: Speech speed multiplier in 0.5–2.0; 1.0 = normal speed. Default: 1.25 (slightly brisk).
|
597 |
+
voice: Voice identifier from 54 available options. Use List_Kokoro_Voices() to see all choices. Default: 'af_heart'.
|
|
|
598 |
|
599 |
Returns:
|
600 |
A tuple of (sample_rate_hz, audio_waveform) where:
|
|
|
605 |
- Requires the 'kokoro' package (>=0.9.4). If unavailable, an error is raised.
|
606 |
- Runs on CUDA if available; otherwise CPU.
|
607 |
- Supports 54 voices across 9 language/accent categories.
|
608 |
+
- Can generate audio of any length; there is no 30-second limit.
|
609 |
- Use List_Kokoro_Voices() MCP tool to discover all available voice options.
|
610 |
"""
|
611 |
if not text or not text.strip():
|