Spaces:
Running
Running
Commit
·
64aec9c
1
Parent(s):
58071a6
(wip)debug
Browse files
models.py
CHANGED
|
@@ -404,35 +404,6 @@ def insert_initial_models():
|
|
| 404 |
is_open=True,
|
| 405 |
model_url="https://github.com/Index-Research/index-tts",
|
| 406 |
),
|
| 407 |
-
# Model(
|
| 408 |
-
# id="eleven-multilingual-v2",
|
| 409 |
-
# name="Eleven Multilingual v2",
|
| 410 |
-
# model_type=ModelType.TTS,
|
| 411 |
-
# is_open=False,
|
| 412 |
-
# model_url="https://elevenlabs.io/",
|
| 413 |
-
# ),
|
| 414 |
-
# Model(
|
| 415 |
-
# id="eleven-turbo-v2.5",
|
| 416 |
-
# name="Eleven Turbo v2.5",
|
| 417 |
-
# model_type=ModelType.TTS,
|
| 418 |
-
# is_open=False,
|
| 419 |
-
# model_url="https://elevenlabs.io/",
|
| 420 |
-
# ),
|
| 421 |
-
# Model(
|
| 422 |
-
# id="eleven-flash-v2.5",
|
| 423 |
-
# name="Eleven Flash v2.5",
|
| 424 |
-
# model_type=ModelType.TTS,
|
| 425 |
-
# is_open=False,
|
| 426 |
-
# model_url="https://elevenlabs.io/",
|
| 427 |
-
# ),
|
| 428 |
-
# Model(
|
| 429 |
-
# id="cartesia-sonic-2",
|
| 430 |
-
# name="Cartesia Sonic 2",
|
| 431 |
-
# model_type=ModelType.TTS,
|
| 432 |
-
# is_open=False,
|
| 433 |
-
# is_active=False, # ran out of credits
|
| 434 |
-
# model_url="https://cartesia.ai/",
|
| 435 |
-
# ),
|
| 436 |
Model(
|
| 437 |
id="spark-tts",
|
| 438 |
name="Spark TTS",
|
|
@@ -446,30 +417,9 @@ def insert_initial_models():
|
|
| 446 |
name="maskgct",
|
| 447 |
model_type=ModelType.TTS,
|
| 448 |
is_open=False,
|
| 449 |
-
is_active=
|
| 450 |
model_url="https://github.com/open-mmlab/Amphion/tree/main/models/tts/maskgct",
|
| 451 |
),
|
| 452 |
-
# Model(
|
| 453 |
-
# id="playht-2.0",
|
| 454 |
-
# name="PlayHT 2.0",
|
| 455 |
-
# model_type=ModelType.TTS,
|
| 456 |
-
# is_open=False,
|
| 457 |
-
# model_url="https://play.ht/",
|
| 458 |
-
# ),
|
| 459 |
-
# Model(
|
| 460 |
-
# id="styletts2",
|
| 461 |
-
# name="StyleTTS 2",
|
| 462 |
-
# model_type=ModelType.TTS,
|
| 463 |
-
# is_open=True,
|
| 464 |
-
# model_url="https://github.com/yl4579/StyleTTS2",
|
| 465 |
-
# ),
|
| 466 |
-
# Model(
|
| 467 |
-
# id="kokoro-v1",
|
| 468 |
-
# name="Kokoro v1.0",
|
| 469 |
-
# model_type=ModelType.TTS,
|
| 470 |
-
# is_open=True,
|
| 471 |
-
# model_url="https://huggingface.co/hexgrad/Kokoro-82M",
|
| 472 |
-
# ),
|
| 473 |
Model(
|
| 474 |
id="cosyvoice-2.0",
|
| 475 |
name="CosyVoice 2.0",
|
|
@@ -483,49 +433,7 @@ def insert_initial_models():
|
|
| 483 |
model_type=ModelType.TTS,
|
| 484 |
is_open=True,
|
| 485 |
model_url="https://huggingface.co/spaces/lj1995/GPT-SoVITS-v2",
|
| 486 |
-
)
|
| 487 |
-
# Model(
|
| 488 |
-
# id="papla-p1",
|
| 489 |
-
# name="Papla P1",
|
| 490 |
-
# model_type=ModelType.TTS,
|
| 491 |
-
# is_open=False,
|
| 492 |
-
# model_url="https://papla.media/",
|
| 493 |
-
# ),
|
| 494 |
-
# Model(
|
| 495 |
-
# id="hume-octave",
|
| 496 |
-
# name="Hume Octave",
|
| 497 |
-
# model_type=ModelType.TTS,
|
| 498 |
-
# is_open=False,
|
| 499 |
-
# model_url="https://hume.ai/",
|
| 500 |
-
# ),
|
| 501 |
-
# Model(
|
| 502 |
-
# id="megatts3",
|
| 503 |
-
# name="MegaTTS 3",
|
| 504 |
-
# model_type=ModelType.TTS,
|
| 505 |
-
# is_active=False,
|
| 506 |
-
# is_open=True,
|
| 507 |
-
# model_url="https://github.com/bytedance/MegaTTS3",
|
| 508 |
-
# ),
|
| 509 |
-
# Model(
|
| 510 |
-
# id="minimax-02-hd",
|
| 511 |
-
# name="MiniMax Speech-02-HD",
|
| 512 |
-
# model_type=ModelType.TTS,
|
| 513 |
-
# is_open=False,
|
| 514 |
-
# model_url="http://minimax.io/",
|
| 515 |
-
# ),
|
| 516 |
-
# Model(
|
| 517 |
-
# id="minimax-02-turbo",
|
| 518 |
-
# name="MiniMax Speech-02-Turbo",
|
| 519 |
-
# model_type=ModelType.TTS,
|
| 520 |
-
# is_open=False,
|
| 521 |
-
# model_url="http://minimax.io/",
|
| 522 |
-
# ),
|
| 523 |
-
# Model(
|
| 524 |
-
# id="lanternfish-1",
|
| 525 |
-
# name="Lanternfish",
|
| 526 |
-
# model_type=ModelType.TTS,
|
| 527 |
-
# is_open=False,
|
| 528 |
-
# ),
|
| 529 |
]
|
| 530 |
conversational_models = [
|
| 531 |
Model(
|
|
|
|
| 404 |
is_open=True,
|
| 405 |
model_url="https://github.com/Index-Research/index-tts",
|
| 406 |
),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 407 |
Model(
|
| 408 |
id="spark-tts",
|
| 409 |
name="Spark TTS",
|
|
|
|
| 417 |
name="maskgct",
|
| 418 |
model_type=ModelType.TTS,
|
| 419 |
is_open=False,
|
| 420 |
+
is_active=False,
|
| 421 |
model_url="https://github.com/open-mmlab/Amphion/tree/main/models/tts/maskgct",
|
| 422 |
),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 423 |
Model(
|
| 424 |
id="cosyvoice-2.0",
|
| 425 |
name="CosyVoice 2.0",
|
|
|
|
| 433 |
model_type=ModelType.TTS,
|
| 434 |
is_open=True,
|
| 435 |
model_url="https://huggingface.co/spaces/lj1995/GPT-SoVITS-v2",
|
| 436 |
+
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 437 |
]
|
| 438 |
conversational_models = [
|
| 439 |
Model(
|
tts.py
CHANGED
|
@@ -47,7 +47,7 @@ data = {"text": "string", "provider": "string", "model": "string"}
|
|
| 47 |
|
| 48 |
def predict_index_tts(text, reference_audio_path=None):
|
| 49 |
from gradio_client import Client, handle_file
|
| 50 |
-
client = Client("kemuriririn/IndexTTS", hf_token=
|
| 51 |
if reference_audio_path:
|
| 52 |
prompt = handle_file(reference_audio_path)
|
| 53 |
else:
|
|
@@ -65,7 +65,7 @@ def predict_index_tts(text, reference_audio_path=None):
|
|
| 65 |
|
| 66 |
def predict_spark_tts(text, reference_audio_path=None):
|
| 67 |
from gradio_client import Client, handle_file
|
| 68 |
-
client = Client("kemuriririn/SparkTTS", hf_token=
|
| 69 |
prompt_wav = None
|
| 70 |
if reference_audio_path:
|
| 71 |
prompt_wav = handle_file(reference_audio_path)
|
|
|
|
| 47 |
|
| 48 |
def predict_index_tts(text, reference_audio_path=None):
|
| 49 |
from gradio_client import Client, handle_file
|
| 50 |
+
client = Client("kemuriririn/IndexTTS", hf_token=get_zerogpu_token())
|
| 51 |
if reference_audio_path:
|
| 52 |
prompt = handle_file(reference_audio_path)
|
| 53 |
else:
|
|
|
|
| 65 |
|
| 66 |
def predict_spark_tts(text, reference_audio_path=None):
|
| 67 |
from gradio_client import Client, handle_file
|
| 68 |
+
client = Client("kemuriririn/SparkTTS", hf_token=get_zerogpu_token())
|
| 69 |
prompt_wav = None
|
| 70 |
if reference_audio_path:
|
| 71 |
prompt_wav = handle_file(reference_audio_path)
|