mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-09 00:29:06 +00:00
22 lines
No EOL
801 B
Python
22 lines
No EOL
801 B
Python
import outetts
|
|
print("Speaker JSON creation for Voice Cloning for OuteTTS...")
|
|
|
|
model_config = outetts.HFModelConfig_v1(
|
|
model_path="OuteAI/OuteTTS-0.2-500M",
|
|
language="en", # Supported languages in v0.2: en, zh, ja, ko
|
|
)
|
|
|
|
interface = outetts.InterfaceHF(model_version="0.2", cfg=model_config)
|
|
|
|
speaker = interface.create_speaker(
|
|
audio_path="input_audio.wav",
|
|
|
|
# If transcript is not provided, it will be automatically transcribed using Whisper
|
|
transcript=None, # Set to None to use Whisper for transcription
|
|
|
|
whisper_model="turbo", # Optional: specify Whisper model (default: "turbo")
|
|
whisper_device=None, # Optional: specify device for Whisper (default: None)
|
|
)
|
|
|
|
interface.save_speaker(speaker, "speaker_output.json")
|
|
print("Speaker JSON saved!") |