From e8570de0e605c59a19a03efde922eea3bf76b1ac Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Fri, 17 Jan 2025 18:45:16 +0800 Subject: [PATCH] improved tts default voices quality and sample rate --- expose.h | 1 + kcpp_docs.embd | 2 +- klite.embd | 7 +++---- koboldcpp.py | 27 ++++++++++++++++++++------- otherarch/tts_adapter.cpp | 28 ++++++++++++---------------- 5 files changed, 37 insertions(+), 28 deletions(-) diff --git a/expose.h b/expose.h index 91eeca404..30390d4c9 100644 --- a/expose.h +++ b/expose.h @@ -205,6 +205,7 @@ struct whisper_generation_outputs struct tts_load_model_inputs { + const int threads = 4; const char * ttc_model_filename = nullptr; const char * cts_model_filename = nullptr; const char * executable_path = nullptr; diff --git a/kcpp_docs.embd b/kcpp_docs.embd index dae8920f1..a425eb285 100644 --- a/kcpp_docs.embd +++ b/kcpp_docs.embd @@ -1463,7 +1463,7 @@ }, "voice": { "type": "string", - "description": "The voice to use when generating the audio. You can enter anything you like, a unique speaker will be generated. There are a few preset voices you can use: kobo,cheery,sleepy,tutor,shouty,bored,record" + "description": "The voice to use when generating the audio. You can enter anything you like, a unique speaker will be generated. There are a few preset voices you can use: kobo,cheery,sleepy,shouty,chatty" } }, "type": "object" diff --git a/klite.embd b/klite.embd index fac252a4a..caa0bb721 100644 --- a/klite.embd +++ b/klite.embd @@ -12,7 +12,7 @@ Current version indicated by LITEVER below. -->