mirror of
https://github.com/Lizonghang/prima.cpp.git
synced 2025-09-04 09:19:02 +00:00
fix q6k and q80
This commit is contained in:
parent
b59d6d9cdf
commit
5a5f103833
1 changed files with 1 additions and 1 deletions
|
@ -370,7 +370,7 @@ float device_inp_embd_delay(struct llama_model * model, enum ggml_type src0t, in
|
|||
case GGML_TYPE_Q6_K:
|
||||
case GGML_TYPE_Q8_K:
|
||||
case GGML_TYPE_Q8_0:
|
||||
QK_K = 256;
|
||||
QK_K = ggml_blck_size(src0t);
|
||||
matrix_B = malloc((embd_size / QK_K) * ggml_type_size(src0t));
|
||||
break;
|
||||
default:
|
||||
|
|
Loading…
Add table
Reference in a new issue