mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-11 01:24:36 +00:00
Bump the maximum length of some payload arrays (stop_token_max, logit_bias_max, dry_seq_break_max) from 16 to 24
This commit is contained in:
parent
e47477fd4d
commit
f289fb494a
2 changed files with 6 additions and 6 deletions
6
expose.h
6
expose.h
|
@ -1,11 +1,11 @@
|
||||||
#pragma once
|
#pragma once
|
||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
|
|
||||||
const int stop_token_max = 16;
|
const int stop_token_max = 24;
|
||||||
const int ban_token_max = 16;
|
const int ban_token_max = 16;
|
||||||
const int tensor_split_max = 16;
|
const int tensor_split_max = 16;
|
||||||
const int logit_bias_max = 16;
|
const int logit_bias_max = 24;
|
||||||
const int dry_seq_break_max = 16;
|
const int dry_seq_break_max = 24;
|
||||||
const int images_max = 4;
|
const int images_max = 4;
|
||||||
|
|
||||||
// match kobold's sampler list and order
|
// match kobold's sampler list and order
|
||||||
|
|
|
@ -18,11 +18,11 @@ from concurrent.futures import ThreadPoolExecutor
|
||||||
|
|
||||||
# constants
|
# constants
|
||||||
sampler_order_max = 7
|
sampler_order_max = 7
|
||||||
stop_token_max = 16
|
stop_token_max = 24
|
||||||
ban_token_max = 16
|
ban_token_max = 16
|
||||||
tensor_split_max = 16
|
tensor_split_max = 16
|
||||||
logit_bias_max = 16
|
logit_bias_max = 24
|
||||||
dry_seq_break_max = 16
|
dry_seq_break_max = 24
|
||||||
images_max = 4
|
images_max = 4
|
||||||
bias_min_value = -100.0
|
bias_min_value = -100.0
|
||||||
bias_max_value = 100.0
|
bias_max_value = 100.0
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue