mirror of
https://github.com/resemble-ai/chatterbox.git
synced 2025-12-22 05:37:10 +00:00
* Add multilingual support * Update model card and README * Update examples and README * Remove EOS suppression * Keep EOS suppression for longer text * Update README.md * Update README.md * modify tokenizers, set alignment analyzer default to none * minor fixes, strict forcing EOS * Update model repo
32 lines
1.1 KiB
Python
32 lines
1.1 KiB
Python
from pathlib import Path

import torch
import torchaudio as ta

from chatterbox.mtl_tts import ChatterboxMultilingualTTS
from chatterbox.tts import ChatterboxTTS

# Automatically detect the best available device: prefer CUDA, then MPS,
# and fall back to the CPU when neither backend reports itself as available.
if torch.cuda.is_available():
    device = "cuda"
elif torch.backends.mps.is_available():
    device = "mps"
else:
    device = "cpu"

# Echo the choice so it is visible which device the models are loaded on.
print(f"Using device: {device}")

# Load the ChatterboxTTS model onto the device selected above.
model = ChatterboxTTS.from_pretrained(device=device)

# Example 1: synthesize one sentence without an audio prompt and write the
# result to disk, passing `model.sr` to `ta.save` as the sample rate.
text = "Ezreal and Jinx teamed up with Ahri, Yasuo, and Teemo to take down the enemy's Nexus in an epic late-game pentakill."
wav = model.generate(text)
ta.save("test-1.wav", wav, model.sr)

# Example 2: multilingual synthesis, selecting French via `language_id="fr"`.
multilingual_model = ChatterboxMultilingualTTS.from_pretrained(device=device)

# The French sentence gets its own name so that `text` is not overwritten:
# the voice-prompt example further down passes `text` to `model`, and
# rebinding it here would hand that call this French sentence instead.
french_text = "Bonjour, comment ça va? Ceci est le modèle de synthèse vocale multilingue Chatterbox, il prend en charge 23 langues."
wav = multilingual_model.generate(french_text, language_id="fr")
ta.save("test-2.wav", wav, multilingual_model.sr)


# If you want to synthesize with a different voice, specify the audio prompt.
# "YOUR_FILE.wav" is a placeholder; replace it with the path to a real file.
AUDIO_PROMPT_PATH = "YOUR_FILE.wav"

if Path(AUDIO_PROMPT_PATH).is_file():
    # NOTE(review): `text` is whichever string was assigned to that name last
    # above; confirm it is in a language `model` is meant to synthesize.
    wav = model.generate(text, audio_prompt_path=AUDIO_PROMPT_PATH)
    ta.save("test-3.wav", wav, model.sr)
else:
    # Skip rather than fail, so running the example with the placeholder
    # path still untouched completes after the earlier outputs are written.
    print(f"Audio prompt {AUDIO_PROMPT_PATH!r} not found; skipping test-3.wav")