mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-11 01:24:36 +00:00
Allow use of OpenCL GPU-based BLAS via CLBlast, instead of OpenBLAS, for context processing
This commit is contained in:
parent
69b85f5b61
commit
c3db99ea32
3 changed files with 134 additions and 9 deletions
|
@ -251,10 +251,12 @@ generation_outputs llama_generate(const generation_inputs inputs, generation_out
|
|||
last_n_tokens.push_back(embd_inp[input_consumed]);
|
||||
current_context_tokens.push_back(embd_inp[input_consumed]);
|
||||
++input_consumed;
|
||||
#ifndef GGML_USE_CLBLAST
|
||||
if ((int)embd.size() >= params.n_batch)
|
||||
{
|
||||
break;
|
||||
}
|
||||
#endif
|
||||
}
|
||||
}
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue