mirror of
https://github.com/Lizonghang/prima.cpp.git
synced 2025-09-07 07:59:29 +00:00
fix q6k and q80
This commit is contained in:
parent
b59d6d9cdf
commit
5a5f103833
1 changed files with 1 additions and 1 deletions
|
@ -370,7 +370,7 @@ float device_inp_embd_delay(struct llama_model * model, enum ggml_type src0t, in
|
||||||
case GGML_TYPE_Q6_K:
|
case GGML_TYPE_Q6_K:
|
||||||
case GGML_TYPE_Q8_K:
|
case GGML_TYPE_Q8_K:
|
||||||
case GGML_TYPE_Q8_0:
|
case GGML_TYPE_Q8_0:
|
||||||
QK_K = 256;
|
QK_K = ggml_blck_size(src0t);
|
||||||
matrix_B = malloc((embd_size / QK_K) * ggml_type_size(src0t));
|
matrix_B = malloc((embd_size / QK_K) * ggml_type_size(src0t));
|
||||||
break;
|
break;
|
||||||
default:
|
default:
|
||||||
|
|
Loading…
Add table
Reference in a new issue