mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-10 17:14:36 +00:00
Reverted sequence mode for RWKV due to multiple speed-loss issues with larger quantized models
This commit is contained in:
parent
f83b66606b
commit
3ed3e7b7e2
4 changed files with 5 additions and 5 deletions
|
@@ -479,7 +479,7 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
|
|||
}
|
||||
else
|
||||
{
|
||||
n_batch = 8; //use sequence mode to speedup
|
||||
n_batch = 1; //do not use sequence mode to speedup until it is fixed
|
||||
|
||||
//setup buffers for rwkv state
|
||||
auto padding = 512u;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue