mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-11 09:34:37 +00:00
Probable typo (#1287)
This commit is contained in:
parent
263d49d0d5
commit
3e6ef8e0ef
1 changed files with 2 additions and 2 deletions
|
@ -629,14 +629,14 @@ struct kcpp_embd_batch { //duplcated from llava_embd_batch
|
||||||
};
|
};
|
||||||
|
|
||||||
//loads a model for speculative decoding.
|
//loads a model for speculative decoding.
|
||||||
static void speculative_decoding_setup(std::string spec_model_filename, const llama_model_params & base_model_params, const llama_context_params & base_ctx_params, int base_n_vocab, const float * draft_gpusplit, int draftgpulayers)
|
static void speculative_decoding_setup(std::string spec_model_filename, const llama_model_params & base_model_params, const llama_context_params & base_ctx_params, int base_n_vocab, const float * draft_gpusplit, int draft_gpulayers)
|
||||||
{
|
{
|
||||||
llama_model_params draft_model_params = llama_model_default_params();
|
llama_model_params draft_model_params = llama_model_default_params();
|
||||||
llama_context_params draft_ctx_params = llama_context_default_params();
|
llama_context_params draft_ctx_params = llama_context_default_params();
|
||||||
|
|
||||||
draft_model_params.use_mmap = base_model_params.use_mmap;
|
draft_model_params.use_mmap = base_model_params.use_mmap;
|
||||||
draft_model_params.use_mlock = base_model_params.use_mlock;
|
draft_model_params.use_mlock = base_model_params.use_mlock;
|
||||||
draft_model_params.n_gpu_layers = draftgpulayers; //layers offload the speculative model.
|
draft_model_params.n_gpu_layers = draft_gpulayers; //layers offload the speculative model.
|
||||||
draft_ctx_params.n_ctx = base_ctx_params.n_ctx;
|
draft_ctx_params.n_ctx = base_ctx_params.n_ctx;
|
||||||
draft_ctx_params.logits_all = false;
|
draft_ctx_params.logits_all = false;
|
||||||
draft_ctx_params.offload_kqv = base_ctx_params.offload_kqv;
|
draft_ctx_params.offload_kqv = base_ctx_params.offload_kqv;
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue