bluenevus committed on
Commit
13cd58d
·
verified ·
1 Parent(s): 483671e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -5
app.py CHANGED
@@ -183,11 +183,14 @@ def generate_speech(text, voice1, voice2, temperature, top_p, repetition_penalty
183
  # Concatenate all audio samples
184
  final_audio = np.concatenate(audio_samples)
185
 
 
 
 
186
  # Convert numpy array to AudioSegment
187
  speech_audio = AudioSegment(
188
- final_audio.tobytes(),
189
  frame_rate=24000,
190
- sample_width=final_audio.dtype.itemsize,
191
  channels=1
192
  )
193
 
@@ -208,7 +211,6 @@ def generate_speech(text, voice1, voice2, temperature, top_p, repetition_penalty
208
  print(f"Error generating speech: {e}")
209
  return None
210
 
211
-
212
  with gr.Blocks(title="Orpheus Text-to-Speech") as demo:
213
  with gr.Row():
214
  with gr.Column(scale=1):
@@ -217,13 +219,13 @@ with gr.Blocks(title="Orpheus Text-to-Speech") as demo:
217
  uploaded_file = gr.File(label="Upload File")
218
 
219
  with gr.Column(scale=2):
 
 
220
  script_output = gr.Textbox(label="Generated Script", lines=10)
221
  audio_output = gr.Audio(label="Generated Audio", type="numpy")
222
  generate_script_btn = gr.Button("Generate Podcast Script")
223
 
224
  with gr.Column(scale=2):
225
- duration = gr.Slider(minimum=1, maximum=60, value=5, step=1, label="Duration (minutes)")
226
- num_hosts = gr.Radio(["1", "2"], label="Number of Hosts", value="1")
227
  voice1 = gr.Dropdown(
228
  choices=VOICES,
229
  value="tara",
 
183
  # Concatenate all audio samples
184
  final_audio = np.concatenate(audio_samples)
185
 
186
+ # Normalize the audio
187
+ final_audio = final_audio / np.max(np.abs(final_audio))
188
+
189
  # Convert numpy array to AudioSegment
190
  speech_audio = AudioSegment(
191
+ (final_audio * 32767).astype(np.int16).tobytes(),
192
  frame_rate=24000,
193
+ sample_width=2,
194
  channels=1
195
  )
196
 
 
211
  print(f"Error generating speech: {e}")
212
  return None
213
 
 
214
  with gr.Blocks(title="Orpheus Text-to-Speech") as demo:
215
  with gr.Row():
216
  with gr.Column(scale=1):
 
219
  uploaded_file = gr.File(label="Upload File")
220
 
221
  with gr.Column(scale=2):
222
+ duration = gr.Slider(minimum=1, maximum=60, value=5, step=1, label="Duration (minutes)")
223
+ num_hosts = gr.Radio(["1", "2"], label="Number of Hosts", value="1")
224
  script_output = gr.Textbox(label="Generated Script", lines=10)
225
  audio_output = gr.Audio(label="Generated Audio", type="numpy")
226
  generate_script_btn = gr.Button("Generate Podcast Script")
227
 
228
  with gr.Column(scale=2):
 
 
229
  voice1 = gr.Dropdown(
230
  choices=VOICES,
231
  value="tara",