kemuriririn committed on
Commit
dab4429
·
1 Parent(s): 19ae156

(wip)debug

Browse files
Files changed (1) hide show
  1. tts.py +9 -1
tts.py CHANGED
@@ -7,6 +7,8 @@ import fal_client
7
  import requests
8
  import time
9
  import io
 
 
10
  from pyht import Client as PyhtClient
11
  from pyht.client import TTSOptions
12
  import base64
@@ -204,8 +206,10 @@ def predict_index_tts(text, reference_audio_path=None):
204
  result = client.predict(
205
  prompt=prompt,
206
  text=text,
 
207
  api_name="/gen_single"
208
  )
 
209
  return result
210
 
211
 
@@ -220,8 +224,10 @@ def predict_spark_tts(text, reference_audio_path=None):
220
  prompt_text=text,
221
  prompt_wav_upload=prompt_wav,
222
  prompt_wav_record=prompt_wav,
 
223
  api_name="/voice_clone"
224
  )
 
225
  return result
226
 
227
 
@@ -230,7 +236,7 @@ def predict_cosyvoice_tts(text, reference_audio_path=None):
230
  client = Client("https://iic-cosyvoice2-0-5b.ms.show/")
231
  if not reference_audio_path:
232
  raise ValueError("cosyvoice-2.0 需要 reference_audio_path")
233
- prompt_wav = file(reference_audio_path)
234
  result = client.predict(
235
  tts_text=text,
236
  mode_checkbox_group="3s极速复刻",
@@ -242,6 +248,8 @@ def predict_cosyvoice_tts(text, reference_audio_path=None):
242
  stream="false",
243
  api_name="/generate_audio"
244
  )
 
 
245
  return result
246
 
247
 
 
7
  import requests
8
  import time
9
  import io
10
+
11
+ from gradio_client import handle_file
12
  from pyht import Client as PyhtClient
13
  from pyht.client import TTSOptions
14
  import base64
 
206
  result = client.predict(
207
  prompt=prompt,
208
  text=text,
209
+ stream="false",
210
  api_name="/gen_single"
211
  )
212
+ print("index-tts result:", result)
213
  return result
214
 
215
 
 
224
  prompt_text=text,
225
  prompt_wav_upload=prompt_wav,
226
  prompt_wav_record=prompt_wav,
227
+ stream="false",
228
  api_name="/voice_clone"
229
  )
230
+ print("spark-tts result:", result)
231
  return result
232
 
233
 
 
236
  client = Client("https://iic-cosyvoice2-0-5b.ms.show/")
237
  if not reference_audio_path:
238
  raise ValueError("cosyvoice-2.0 需要 reference_audio_path")
239
+ prompt_wav = handle_file(reference_audio_path)
240
  result = client.predict(
241
  tts_text=text,
242
  mode_checkbox_group="3s极速复刻",
 
248
  stream="false",
249
  api_name="/generate_audio"
250
  )
251
+ print("cosyvoice-2.0 result:", result)
252
+
253
  return result
254
 
255