Spaces: Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -183,11 +183,14 @@ def generate_speech(text, voice1, voice2, temperature, top_p, repetition_penalty
|
|
183 |
# Concatenate all audio samples
|
184 |
final_audio = np.concatenate(audio_samples)
|
185 |
|
|
|
|
|
|
|
186 |
# Convert numpy array to AudioSegment
|
187 |
speech_audio = AudioSegment(
|
188 |
-
final_audio.tobytes(),
|
189 |
frame_rate=24000,
|
190 |
-
sample_width=
|
191 |
channels=1
|
192 |
)
|
193 |
|
@@ -208,7 +211,6 @@ def generate_speech(text, voice1, voice2, temperature, top_p, repetition_penalty
|
|
208 |
print(f"Error generating speech: {e}")
|
209 |
return None
|
210 |
|
211 |
-
|
212 |
with gr.Blocks(title="Orpheus Text-to-Speech") as demo:
|
213 |
with gr.Row():
|
214 |
with gr.Column(scale=1):
|
@@ -217,13 +219,13 @@ with gr.Blocks(title="Orpheus Text-to-Speech") as demo:
|
|
217 |
uploaded_file = gr.File(label="Upload File")
|
218 |
|
219 |
with gr.Column(scale=2):
|
|
|
|
|
220 |
script_output = gr.Textbox(label="Generated Script", lines=10)
|
221 |
audio_output = gr.Audio(label="Generated Audio", type="numpy")
|
222 |
generate_script_btn = gr.Button("Generate Podcast Script")
|
223 |
|
224 |
with gr.Column(scale=2):
|
225 |
-
duration = gr.Slider(minimum=1, maximum=60, value=5, step=1, label="Duration (minutes)")
|
226 |
-
num_hosts = gr.Radio(["1", "2"], label="Number of Hosts", value="1")
|
227 |
voice1 = gr.Dropdown(
|
228 |
choices=VOICES,
|
229 |
value="tara",
|
|
|
183 |
# Concatenate all audio samples
|
184 |
final_audio = np.concatenate(audio_samples)
|
185 |
|
186 |
+
# Normalize the audio
|
187 |
+
final_audio = final_audio / np.max(np.abs(final_audio))
|
188 |
+
|
189 |
# Convert numpy array to AudioSegment
|
190 |
speech_audio = AudioSegment(
|
191 |
+
(final_audio * 32767).astype(np.int16).tobytes(),
|
192 |
frame_rate=24000,
|
193 |
+
sample_width=2,
|
194 |
channels=1
|
195 |
)
|
196 |
|
|
|
211 |
print(f"Error generating speech: {e}")
|
212 |
return None
|
213 |
|
|
|
214 |
with gr.Blocks(title="Orpheus Text-to-Speech") as demo:
|
215 |
with gr.Row():
|
216 |
with gr.Column(scale=1):
|
|
|
219 |
uploaded_file = gr.File(label="Upload File")
|
220 |
|
221 |
with gr.Column(scale=2):
|
222 |
+
duration = gr.Slider(minimum=1, maximum=60, value=5, step=1, label="Duration (minutes)")
|
223 |
+
num_hosts = gr.Radio(["1", "2"], label="Number of Hosts", value="1")
|
224 |
script_output = gr.Textbox(label="Generated Script", lines=10)
|
225 |
audio_output = gr.Audio(label="Generated Audio", type="numpy")
|
226 |
generate_script_btn = gr.Button("Generate Podcast Script")
|
227 |
|
228 |
with gr.Column(scale=2):
|
|
|
|
|
229 |
voice1 = gr.Dropdown(
|
230 |
choices=VOICES,
|
231 |
value="tara",
|