kemuriririn committed on
Commit
64aec9c
·
1 Parent(s): 58071a6

(wip)debug

Browse files
Files changed (2) hide show
  1. models.py +2 -94
  2. tts.py +2 -2
models.py CHANGED
@@ -404,35 +404,6 @@ def insert_initial_models():
404
  is_open=True,
405
  model_url="https://github.com/Index-Research/index-tts",
406
  ),
407
- # Model(
408
- # id="eleven-multilingual-v2",
409
- # name="Eleven Multilingual v2",
410
- # model_type=ModelType.TTS,
411
- # is_open=False,
412
- # model_url="https://elevenlabs.io/",
413
- # ),
414
- # Model(
415
- # id="eleven-turbo-v2.5",
416
- # name="Eleven Turbo v2.5",
417
- # model_type=ModelType.TTS,
418
- # is_open=False,
419
- # model_url="https://elevenlabs.io/",
420
- # ),
421
- # Model(
422
- # id="eleven-flash-v2.5",
423
- # name="Eleven Flash v2.5",
424
- # model_type=ModelType.TTS,
425
- # is_open=False,
426
- # model_url="https://elevenlabs.io/",
427
- # ),
428
- # Model(
429
- # id="cartesia-sonic-2",
430
- # name="Cartesia Sonic 2",
431
- # model_type=ModelType.TTS,
432
- # is_open=False,
433
- # is_active=False, # ran out of credits
434
- # model_url="https://cartesia.ai/",
435
- # ),
436
  Model(
437
  id="spark-tts",
438
  name="Spark TTS",
@@ -446,30 +417,9 @@ def insert_initial_models():
446
  name="maskgct",
447
  model_type=ModelType.TTS,
448
  is_open=False,
449
- is_active=True,
450
  model_url="https://github.com/open-mmlab/Amphion/tree/main/models/tts/maskgct",
451
  ),
452
- # Model(
453
- # id="playht-2.0",
454
- # name="PlayHT 2.0",
455
- # model_type=ModelType.TTS,
456
- # is_open=False,
457
- # model_url="https://play.ht/",
458
- # ),
459
- # Model(
460
- # id="styletts2",
461
- # name="StyleTTS 2",
462
- # model_type=ModelType.TTS,
463
- # is_open=True,
464
- # model_url="https://github.com/yl4579/StyleTTS2",
465
- # ),
466
- # Model(
467
- # id="kokoro-v1",
468
- # name="Kokoro v1.0",
469
- # model_type=ModelType.TTS,
470
- # is_open=True,
471
- # model_url="https://huggingface.co/hexgrad/Kokoro-82M",
472
- # ),
473
  Model(
474
  id="cosyvoice-2.0",
475
  name="CosyVoice 2.0",
@@ -483,49 +433,7 @@ def insert_initial_models():
483
  model_type=ModelType.TTS,
484
  is_open=True,
485
  model_url="https://huggingface.co/spaces/lj1995/GPT-SoVITS-v2",
486
- ),
487
- # Model(
488
- # id="papla-p1",
489
- # name="Papla P1",
490
- # model_type=ModelType.TTS,
491
- # is_open=False,
492
- # model_url="https://papla.media/",
493
- # ),
494
- # Model(
495
- # id="hume-octave",
496
- # name="Hume Octave",
497
- # model_type=ModelType.TTS,
498
- # is_open=False,
499
- # model_url="https://hume.ai/",
500
- # ),
501
- # Model(
502
- # id="megatts3",
503
- # name="MegaTTS 3",
504
- # model_type=ModelType.TTS,
505
- # is_active=False,
506
- # is_open=True,
507
- # model_url="https://github.com/bytedance/MegaTTS3",
508
- # ),
509
- # Model(
510
- # id="minimax-02-hd",
511
- # name="MiniMax Speech-02-HD",
512
- # model_type=ModelType.TTS,
513
- # is_open=False,
514
- # model_url="http://minimax.io/",
515
- # ),
516
- # Model(
517
- # id="minimax-02-turbo",
518
- # name="MiniMax Speech-02-Turbo",
519
- # model_type=ModelType.TTS,
520
- # is_open=False,
521
- # model_url="http://minimax.io/",
522
- # ),
523
- # Model(
524
- # id="lanternfish-1",
525
- # name="Lanternfish",
526
- # model_type=ModelType.TTS,
527
- # is_open=False,
528
- # ),
529
  ]
530
  conversational_models = [
531
  Model(
 
404
  is_open=True,
405
  model_url="https://github.com/Index-Research/index-tts",
406
  ),
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
407
  Model(
408
  id="spark-tts",
409
  name="Spark TTS",
 
417
  name="maskgct",
418
  model_type=ModelType.TTS,
419
  is_open=False,
420
+ is_active=False,
421
  model_url="https://github.com/open-mmlab/Amphion/tree/main/models/tts/maskgct",
422
  ),
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
423
  Model(
424
  id="cosyvoice-2.0",
425
  name="CosyVoice 2.0",
 
433
  model_type=ModelType.TTS,
434
  is_open=True,
435
  model_url="https://huggingface.co/spaces/lj1995/GPT-SoVITS-v2",
436
+ )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
437
  ]
438
  conversational_models = [
439
  Model(
tts.py CHANGED
@@ -47,7 +47,7 @@ data = {"text": "string", "provider": "string", "model": "string"}
47
 
48
  def predict_index_tts(text, reference_audio_path=None):
49
  from gradio_client import Client, handle_file
50
- client = Client("kemuriririn/IndexTTS", hf_token=os.getenv("HF_TOKEN"))
51
  if reference_audio_path:
52
  prompt = handle_file(reference_audio_path)
53
  else:
@@ -65,7 +65,7 @@ def predict_index_tts(text, reference_audio_path=None):
65
 
66
  def predict_spark_tts(text, reference_audio_path=None):
67
  from gradio_client import Client, handle_file
68
- client = Client("kemuriririn/SparkTTS", hf_token=os.getenv("HF_TOKEN"))
69
  prompt_wav = None
70
  if reference_audio_path:
71
  prompt_wav = handle_file(reference_audio_path)
 
47
 
48
  def predict_index_tts(text, reference_audio_path=None):
49
  from gradio_client import Client, handle_file
50
+ client = Client("kemuriririn/IndexTTS", hf_token=get_zerogpu_token())
51
  if reference_audio_path:
52
  prompt = handle_file(reference_audio_path)
53
  else:
 
65
 
66
  def predict_spark_tts(text, reference_audio_path=None):
67
  from gradio_client import Client, handle_file
68
+ client = Client("kemuriririn/SparkTTS", hf_token=get_zerogpu_token())
69
  prompt_wav = None
70
  if reference_audio_path:
71
  prompt_wav = handle_file(reference_audio_path)