Fixed LoRA; it now works with quantized models too

This commit is contained in:
Concedo 2025-04-14 23:44:42 +08:00
parent ad2522b319
commit fe12b1cbd4
3 changed files with 12 additions and 26 deletions

View file

@@ -3,7 +3,7 @@
#include "ggml_extend.hpp"
-#define LORA_GRAPH_SIZE 10240
+#define LORA_GRAPH_SIZE 20480
struct LoraModel : public GGMLRunner {
enum lora_t {