Skip to content

Commit 07ae912

Browse files
authored
feat(blocks): Add text to speech block and Unreal Speech API key (Significant-Gravitas#8264)
1 parent 7501089 commit 07ae912

File tree

2 files changed

+81
-1
lines changed

2 files changed

+81
-1
lines changed
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,79 @@
1+
from typing import Any
2+
3+
import requests
4+
5+
from backend.data.block import Block, BlockCategory, BlockOutput, BlockSchema
6+
from backend.data.model import BlockSecret, SchemaField, SecretField
7+
8+
9+
class UnrealTextToSpeechBlock(Block):
10+
class Input(BlockSchema):
11+
text: str = SchemaField(
12+
description="The text to be converted to speech",
13+
placeholder="Enter the text you want to convert to speech",
14+
)
15+
voice_id: str = SchemaField(
16+
description="The voice ID to use for text-to-speech conversion",
17+
placeholder="Scarlett",
18+
default="Scarlett",
19+
)
20+
api_key: BlockSecret = SecretField(
21+
key="unreal_speech_api_key", description="Your Unreal Speech API key"
22+
)
23+
24+
class Output(BlockSchema):
25+
mp3_url: str = SchemaField(description="The URL of the generated MP3 file")
26+
error: str = SchemaField(description="Error message if the API call failed")
27+
28+
def __init__(self):
29+
super().__init__(
30+
id="4ff1ff6d-cc40-4caa-ae69-011daa20c378",
31+
description="Converts text to speech using the Unreal Speech API",
32+
categories={BlockCategory.AI, BlockCategory.TEXT},
33+
input_schema=UnrealTextToSpeechBlock.Input,
34+
output_schema=UnrealTextToSpeechBlock.Output,
35+
test_input={
36+
"text": "This is a test of the text to speech API.",
37+
"voice_id": "Scarlett",
38+
"api_key": "test_api_key",
39+
},
40+
test_output=[("mp3_url", "https://example.com/test.mp3")],
41+
test_mock={
42+
"call_unreal_speech_api": lambda *args, **kwargs: {
43+
"OutputUri": "https://example.com/test.mp3"
44+
}
45+
},
46+
)
47+
48+
@staticmethod
49+
def call_unreal_speech_api(
50+
api_key: str, text: str, voice_id: str
51+
) -> dict[str, Any]:
52+
url = "https://api.v7.unrealspeech.com/speech"
53+
headers = {
54+
"Authorization": f"Bearer {api_key}",
55+
"Content-Type": "application/json",
56+
}
57+
data = {
58+
"Text": text,
59+
"VoiceId": voice_id,
60+
"Bitrate": "192k",
61+
"Speed": "0",
62+
"Pitch": "1",
63+
"TimestampType": "sentence",
64+
}
65+
66+
response = requests.post(url, headers=headers, json=data)
67+
response.raise_for_status()
68+
return response.json()
69+
70+
def run(self, input_data: Input, **kwargs) -> BlockOutput:
71+
try:
72+
api_response = self.call_unreal_speech_api(
73+
input_data.api_key.get_secret_value(),
74+
input_data.text,
75+
input_data.voice_id,
76+
)
77+
yield "mp3_url", api_response["OutputUri"]
78+
except Exception as e:
79+
yield "error", str(e)

autogpt_platform/backend/backend/util/settings.py

+2-1
Original file line numberDiff line numberDiff line change
@@ -219,8 +219,9 @@ class Secrets(UpdateTrackingModel["Secrets"], BaseSettings):
219219
google_maps_api_key: str = Field(default="", description="Google Maps API Key")
220220

221221
replicate_api_key: str = Field(default="", description="Replicate API Key")
222-
222+
unreal_speech_api_key: str = Field(default="", description="Unreal Speech API Key")
223223
ideogram_api_key: str = Field(default="", description="Ideogram API Key")
224+
224225
# Add more secret fields as needed
225226

226227
model_config = SettingsConfigDict(

0 commit comments

Comments
 (0)