mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-09 16:44:35 +00:00
wip
This commit is contained in:
parent
e01e373e63
commit
b692e4d2a4
8 changed files with 99 additions and 25 deletions
|
@ -108,9 +108,15 @@ void print_tok_vec(std::vector<float> &embd)
|
|||
fin.read((char *)&temp, sizeof(temp)); //n_layer
|
||||
fin.read((char *)&temp, sizeof(temp)); //n_rot
|
||||
fin.read((char *)&temp, sizeof(temp)); //f16
|
||||
if(temp!=0 && temp!=1)
|
||||
const int32_t qntvr = temp / 1000;
|
||||
temp %= 1000;
|
||||
if (qntvr != 0)
|
||||
{
|
||||
fileformat = FileFormat::GPTJ_3; //quantized format cannot be legacy type
|
||||
fileformat = FileFormat::GPTJ_4;
|
||||
}
|
||||
else if (temp != 0 && temp != 1)
|
||||
{
|
||||
fileformat = FileFormat::GPTJ_3; //quantized format cannot be legacy type
|
||||
}
|
||||
}
|
||||
else if(vocabsiz==50257)
|
||||
|
@ -122,15 +128,34 @@ void print_tok_vec(std::vector<float> &embd)
|
|||
fin.read((char *)&temp, sizeof(temp)); //n_head
|
||||
fin.read((char *)&temp, sizeof(temp)); //n_layer
|
||||
fin.read((char *)&temp, sizeof(temp)); //f16
|
||||
if(temp!=0 && temp!=1)
|
||||
const int32_t qntvr = temp / 1000;
|
||||
temp %= 1000;
|
||||
if (qntvr != 0)
|
||||
{
|
||||
fileformat = FileFormat::GPT2_2; //quantized format cannot be legacy type
|
||||
}
|
||||
fileformat = FileFormat::GPT2_3;
|
||||
}
|
||||
else if (temp != 0 && temp != 1)
|
||||
{
|
||||
fileformat = FileFormat::GPT2_2; //quantized format cannot be legacy type
|
||||
}
|
||||
}
|
||||
else if(vocabsiz < 31998 || vocabsiz > 33000)
|
||||
{
|
||||
//anything outside the llama v1 range is assumed to be NeoX
|
||||
fileformat = FileFormat::NEOX_2;
|
||||
fileformat = FileFormat::NEOX_4;
|
||||
uint32_t temp;
|
||||
fin.read((char *)&temp, sizeof(temp)); //ctx
|
||||
fin.read((char *)&temp, sizeof(temp)); //n_embd
|
||||
fin.read((char *)&temp, sizeof(temp)); //n_head
|
||||
fin.read((char *)&temp, sizeof(temp)); //n_layer
|
||||
fin.read((char *)&temp, sizeof(temp)); //n_rot
|
||||
fin.read((char *)&temp, sizeof(temp)); //f16
|
||||
const int32_t qntvr = temp / 1000;
|
||||
temp %= 1000;
|
||||
if(qntvr==0)
|
||||
{
|
||||
fileformat = FileFormat::NEOX_2;
|
||||
}
|
||||
}
|
||||
}
|
||||
else if(magic == 0x67676d66) //v2 format ggmf
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue