Removed main.exe to reduce clutter; added support for repetition penalty (rep pen) in GPT-J

This commit is contained in:
Concedo 2023-04-04 20:43:13 +08:00
parent 9c0dbbb08b
commit 52de932842
11 changed files with 46 additions and 22 deletions

View file

@@ -294,7 +294,7 @@ ModelLoadResult legacy_gptj_model_load(const std::string & fname, gptj_model_v1
//test for transposition and retry older loader
if(tensor->ne[0]==ne[1] && tensor->ne[1]==ne[0] && should_transpose_layer(name))
{
printf("\nFound a transposed tensor. This could be an older model. Retrying load...");
printf("\nFound a transposed tensor. This could be an older or newer model. Retrying load...");
ggml_v1_free(ctx);
return ModelLoadResult::RETRY_LOAD;
}