bluenevus committed on
Commit
29aab57
·
verified ·
1 Parent(s): 180ce7d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -18
app.py CHANGED
@@ -141,9 +141,6 @@ def generate_speech(text, voice1, voice2, temperature, top_p, repetition_penalty
141
  return None
142
 
143
  try:
144
- music = AudioSegment.from_mp3("Maiko-intro-outro.mp3")
145
- music = music.set_frame_rate(24000)
146
-
147
  progress(0.1, "Processing text...")
148
  lines = text.split('\n')
149
  audio_samples = []
@@ -179,24 +176,15 @@ def generate_speech(text, voice1, voice2, temperature, top_p, repetition_penalty
179
 
180
  final_audio = np.concatenate(audio_samples)
181
 
182
- speech_audio = AudioSegment(
183
- final_audio.tobytes(),
184
- frame_rate=24000,
185
- sample_width=final_audio.dtype.itemsize,
186
- channels=1
187
- )
188
-
189
- combined_audio = music + speech_audio + music
190
-
191
- combined_numpy = np.array(combined_audio.get_array_of_samples(), dtype=np.float32)
192
-
193
- combined_numpy = np.int16(combined_numpy / np.max(np.abs(combined_numpy)) * 32767)
194
 
 
195
  max_samples = 24000 * 15
196
- if len(combined_numpy) > max_samples:
197
- combined_numpy = combined_numpy[:max_samples]
198
 
199
- return (24000, combined_numpy)
200
  except Exception as e:
201
  print(f"Error generating speech: {e}")
202
  return None
 
141
  return None
142
 
143
  try:
 
 
 
144
  progress(0.1, "Processing text...")
145
  lines = text.split('\n')
146
  audio_samples = []
 
176
 
177
  final_audio = np.concatenate(audio_samples)
178
 
179
+ # Normalize the audio
180
+ final_audio = np.int16(final_audio / np.max(np.abs(final_audio)) * 32767)
 
 
 
 
 
 
 
 
 
 
181
 
182
+ # Trim to 15 seconds if longer
183
  max_samples = 24000 * 15
184
+ if len(final_audio) > max_samples:
185
+ final_audio = final_audio[:max_samples]
186
 
187
+ return (24000, final_audio)
188
  except Exception as e:
189
  print(f"Error generating speech: {e}")
190
  return None