Spaces:
Running
Running
Commit
·
64aec9c
1
Parent(s):
58071a6
(wip)debug
Browse files
models.py
CHANGED
@@ -404,35 +404,6 @@ def insert_initial_models():
|
|
404 |
is_open=True,
|
405 |
model_url="https://github.com/Index-Research/index-tts",
|
406 |
),
|
407 |
-
# Model(
|
408 |
-
# id="eleven-multilingual-v2",
|
409 |
-
# name="Eleven Multilingual v2",
|
410 |
-
# model_type=ModelType.TTS,
|
411 |
-
# is_open=False,
|
412 |
-
# model_url="https://elevenlabs.io/",
|
413 |
-
# ),
|
414 |
-
# Model(
|
415 |
-
# id="eleven-turbo-v2.5",
|
416 |
-
# name="Eleven Turbo v2.5",
|
417 |
-
# model_type=ModelType.TTS,
|
418 |
-
# is_open=False,
|
419 |
-
# model_url="https://elevenlabs.io/",
|
420 |
-
# ),
|
421 |
-
# Model(
|
422 |
-
# id="eleven-flash-v2.5",
|
423 |
-
# name="Eleven Flash v2.5",
|
424 |
-
# model_type=ModelType.TTS,
|
425 |
-
# is_open=False,
|
426 |
-
# model_url="https://elevenlabs.io/",
|
427 |
-
# ),
|
428 |
-
# Model(
|
429 |
-
# id="cartesia-sonic-2",
|
430 |
-
# name="Cartesia Sonic 2",
|
431 |
-
# model_type=ModelType.TTS,
|
432 |
-
# is_open=False,
|
433 |
-
# is_active=False, # ran out of credits
|
434 |
-
# model_url="https://cartesia.ai/",
|
435 |
-
# ),
|
436 |
Model(
|
437 |
id="spark-tts",
|
438 |
name="Spark TTS",
|
@@ -446,30 +417,9 @@ def insert_initial_models():
|
|
446 |
name="maskgct",
|
447 |
model_type=ModelType.TTS,
|
448 |
is_open=False,
|
449 |
-
is_active=
|
450 |
model_url="https://github.com/open-mmlab/Amphion/tree/main/models/tts/maskgct",
|
451 |
),
|
452 |
-
# Model(
|
453 |
-
# id="playht-2.0",
|
454 |
-
# name="PlayHT 2.0",
|
455 |
-
# model_type=ModelType.TTS,
|
456 |
-
# is_open=False,
|
457 |
-
# model_url="https://play.ht/",
|
458 |
-
# ),
|
459 |
-
# Model(
|
460 |
-
# id="styletts2",
|
461 |
-
# name="StyleTTS 2",
|
462 |
-
# model_type=ModelType.TTS,
|
463 |
-
# is_open=True,
|
464 |
-
# model_url="https://github.com/yl4579/StyleTTS2",
|
465 |
-
# ),
|
466 |
-
# Model(
|
467 |
-
# id="kokoro-v1",
|
468 |
-
# name="Kokoro v1.0",
|
469 |
-
# model_type=ModelType.TTS,
|
470 |
-
# is_open=True,
|
471 |
-
# model_url="https://huggingface.co/hexgrad/Kokoro-82M",
|
472 |
-
# ),
|
473 |
Model(
|
474 |
id="cosyvoice-2.0",
|
475 |
name="CosyVoice 2.0",
|
@@ -483,49 +433,7 @@ def insert_initial_models():
|
|
483 |
model_type=ModelType.TTS,
|
484 |
is_open=True,
|
485 |
model_url="https://huggingface.co/spaces/lj1995/GPT-SoVITS-v2",
|
486 |
-
)
|
487 |
-
# Model(
|
488 |
-
# id="papla-p1",
|
489 |
-
# name="Papla P1",
|
490 |
-
# model_type=ModelType.TTS,
|
491 |
-
# is_open=False,
|
492 |
-
# model_url="https://papla.media/",
|
493 |
-
# ),
|
494 |
-
# Model(
|
495 |
-
# id="hume-octave",
|
496 |
-
# name="Hume Octave",
|
497 |
-
# model_type=ModelType.TTS,
|
498 |
-
# is_open=False,
|
499 |
-
# model_url="https://hume.ai/",
|
500 |
-
# ),
|
501 |
-
# Model(
|
502 |
-
# id="megatts3",
|
503 |
-
# name="MegaTTS 3",
|
504 |
-
# model_type=ModelType.TTS,
|
505 |
-
# is_active=False,
|
506 |
-
# is_open=True,
|
507 |
-
# model_url="https://github.com/bytedance/MegaTTS3",
|
508 |
-
# ),
|
509 |
-
# Model(
|
510 |
-
# id="minimax-02-hd",
|
511 |
-
# name="MiniMax Speech-02-HD",
|
512 |
-
# model_type=ModelType.TTS,
|
513 |
-
# is_open=False,
|
514 |
-
# model_url="http://minimax.io/",
|
515 |
-
# ),
|
516 |
-
# Model(
|
517 |
-
# id="minimax-02-turbo",
|
518 |
-
# name="MiniMax Speech-02-Turbo",
|
519 |
-
# model_type=ModelType.TTS,
|
520 |
-
# is_open=False,
|
521 |
-
# model_url="http://minimax.io/",
|
522 |
-
# ),
|
523 |
-
# Model(
|
524 |
-
# id="lanternfish-1",
|
525 |
-
# name="Lanternfish",
|
526 |
-
# model_type=ModelType.TTS,
|
527 |
-
# is_open=False,
|
528 |
-
# ),
|
529 |
]
|
530 |
conversational_models = [
|
531 |
Model(
|
|
|
404 |
is_open=True,
|
405 |
model_url="https://github.com/Index-Research/index-tts",
|
406 |
),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
407 |
Model(
|
408 |
id="spark-tts",
|
409 |
name="Spark TTS",
|
|
|
417 |
name="maskgct",
|
418 |
model_type=ModelType.TTS,
|
419 |
is_open=False,
|
420 |
+
is_active=False,
|
421 |
model_url="https://github.com/open-mmlab/Amphion/tree/main/models/tts/maskgct",
|
422 |
),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
423 |
Model(
|
424 |
id="cosyvoice-2.0",
|
425 |
name="CosyVoice 2.0",
|
|
|
433 |
model_type=ModelType.TTS,
|
434 |
is_open=True,
|
435 |
model_url="https://huggingface.co/spaces/lj1995/GPT-SoVITS-v2",
|
436 |
+
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
437 |
]
|
438 |
conversational_models = [
|
439 |
Model(
|
tts.py
CHANGED
@@ -47,7 +47,7 @@ data = {"text": "string", "provider": "string", "model": "string"}
|
|
47 |
|
48 |
def predict_index_tts(text, reference_audio_path=None):
|
49 |
from gradio_client import Client, handle_file
|
50 |
-
client = Client("kemuriririn/IndexTTS", hf_token=
|
51 |
if reference_audio_path:
|
52 |
prompt = handle_file(reference_audio_path)
|
53 |
else:
|
@@ -65,7 +65,7 @@ def predict_index_tts(text, reference_audio_path=None):
|
|
65 |
|
66 |
def predict_spark_tts(text, reference_audio_path=None):
|
67 |
from gradio_client import Client, handle_file
|
68 |
-
client = Client("kemuriririn/SparkTTS", hf_token=
|
69 |
prompt_wav = None
|
70 |
if reference_audio_path:
|
71 |
prompt_wav = handle_file(reference_audio_path)
|
|
|
47 |
|
48 |
def predict_index_tts(text, reference_audio_path=None):
|
49 |
from gradio_client import Client, handle_file
|
50 |
+
client = Client("kemuriririn/IndexTTS", hf_token=get_zerogpu_token())
|
51 |
if reference_audio_path:
|
52 |
prompt = handle_file(reference_audio_path)
|
53 |
else:
|
|
|
65 |
|
66 |
def predict_spark_tts(text, reference_audio_path=None):
|
67 |
from gradio_client import Client, handle_file
|
68 |
+
client = Client("kemuriririn/SparkTTS", hf_token=get_zerogpu_token())
|
69 |
prompt_wav = None
|
70 |
if reference_audio_path:
|
71 |
prompt_wav = handle_file(reference_audio_path)
|