mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-10 17:14:36 +00:00
wstring convert for mpt
This commit is contained in:
parent
6d718525c4
commit
0485fa65a2
5 changed files with 30 additions and 7 deletions
|
@ -313,6 +313,7 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
|
|||
= gpt2_ctx_v1.hparams.n_ctx = gpt2_ctx_v2.hparams.n_ctx = gpt2_ctx_v3.hparams.n_ctx
|
||||
= mpt_ctx_v3.hparams.n_ctx = params.n_ctx;
|
||||
|
||||
//this is used for the mem_per_token eval, openblas needs more RAM
|
||||
bool use_scratch = ggml_cpu_has_gpublas();
|
||||
|
||||
printf("System Info: %s\n", llama_print_system_info());
|
||||
|
@ -904,7 +905,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs, generation_o
|
|||
concat_output = "";
|
||||
|
||||
bool startedsampling = false;
|
||||
bool use_scratch = true;
|
||||
bool use_scratch = true; //for normal inference always use scratch
|
||||
|
||||
timer_start();
|
||||
double time1 = 0, time2 = 0;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue