various fixes

This commit is contained in:
Concedo 2025-01-18 23:52:39 +08:00
parent e90866fd46
commit fa7e661133
14 changed files with 51 additions and 32 deletions

View file

@@ -527,7 +527,7 @@ bool ttstype_load_model(const tts_load_model_inputs inputs)
tts_ctx_params.n_ubatch = 512;
tts_ctx_params.n_threads = nthreads;
tts_ctx_params.n_threads_batch = nthreads;
-tts_ctx_params.flash_attn = false;
+tts_ctx_params.flash_attn = inputs.flash_attention;
llama_model * ttcmodel = llama_model_load_from_file(modelfile_ttc.c_str(), tts_model_params);
ttc_ctx = llama_new_context_with_model(ttcmodel, tts_ctx_params);