mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-11 09:34:37 +00:00
Fix for Jamba models: they have recurrent layers like RWKV, so context shifting and forwarding won't work on them.
This commit is contained in:
parent
e9473305d0
commit
5a3b2e3921
3 changed files with 12 additions and 7 deletions
|
@@ -324,6 +324,10 @@ void print_tok_vec(std::vector<float> &embd)
|
|||
{
|
||||
fileformatmeta->model_architecture = GGUFArch::ARCH_MAMBA;
|
||||
}
|
||||
else if(modelarch=="jamba")
|
||||
{
|
||||
fileformatmeta->model_architecture = GGUFArch::ARCH_JAMBA;
|
||||
}
|
||||
else if(modelarch=="llama" && freq_base_train==10000.0f && (n_tensors==435 || n_tensors==611))
|
||||
{
|
||||
fileformatmeta->model_architecture = GGUFArch::ARCH_SOLAR;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue