Updated Lite, added autorope config based on trained context length (ctxlen), hotfix for broken Falcon GPU support

This commit is contained in:
Concedo 2023-08-30 16:50:55 +08:00
parent 89495c0716
commit d4c22a8b02
4 changed files with 654 additions and 74 deletions

View file

@@ -271,6 +271,11 @@ void print_tok_vec(std::vector<float> &embd)
{
fileformat = FileFormat::GGUF_LLAMA;
}
else if(modelarch=="falcon")
{
fileformat = FileFormat::GGUF_FALCON; //uses the same loader
printf("\nDetected GGUF FALCON format.\n");
}
else
{
printf("\nERROR: Detected unimplemented GGUF Arch: %s\n",modelarch.c_str());