mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-10 00:54:41 +00:00
experimental swa flag
This commit is contained in:
parent
499283c63a
commit
c4df151298
3 changed files with 11 additions and 1 deletions
1
expose.h
1
expose.h
|
@ -70,6 +70,7 @@ struct load_model_inputs
|
||||||
const int quant_k = 0;
|
const int quant_k = 0;
|
||||||
const int quant_v = 0;
|
const int quant_v = 0;
|
||||||
const bool check_slowness = false;
|
const bool check_slowness = false;
|
||||||
|
const bool swa_support = false;
|
||||||
const bool quiet = false;
|
const bool quiet = false;
|
||||||
const int debugmode = 0;
|
const int debugmode = 0;
|
||||||
};
|
};
|
||||||
|
|
|
@ -1927,7 +1927,11 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
|
||||||
kcpp_data->use_smartcontext = inputs.use_smartcontext;
|
kcpp_data->use_smartcontext = inputs.use_smartcontext;
|
||||||
kcpp_data->use_contextshift = inputs.use_contextshift;
|
kcpp_data->use_contextshift = inputs.use_contextshift;
|
||||||
kcpp_data->use_fastforward = inputs.use_fastforward;
|
kcpp_data->use_fastforward = inputs.use_fastforward;
|
||||||
kcpp_data->swa_full = (inputs.use_fastforward || inputs.use_contextshift)?true:false;
|
kcpp_data->swa_full = !inputs.swa_support;//(inputs.use_fastforward || inputs.use_contextshift)?true:false;
|
||||||
|
if(!kcpp_data->swa_full)
|
||||||
|
{
|
||||||
|
printf("\n!!!!!!!!!!!!!!!!!!!\nExperimental FLAG - SWA SUPPORT IS ENABLED!\n!!!!!!!!!!!!!!!!!!!\n");
|
||||||
|
}
|
||||||
debugmode = inputs.debugmode;
|
debugmode = inputs.debugmode;
|
||||||
draft_ctx = nullptr;
|
draft_ctx = nullptr;
|
||||||
guidance_ctx = nullptr;
|
guidance_ctx = nullptr;
|
||||||
|
|
|
@ -192,6 +192,7 @@ class load_model_inputs(ctypes.Structure):
|
||||||
("quant_k", ctypes.c_int),
|
("quant_k", ctypes.c_int),
|
||||||
("quant_v", ctypes.c_int),
|
("quant_v", ctypes.c_int),
|
||||||
("check_slowness", ctypes.c_bool),
|
("check_slowness", ctypes.c_bool),
|
||||||
|
("swa_support", ctypes.c_bool),
|
||||||
("quiet", ctypes.c_bool),
|
("quiet", ctypes.c_bool),
|
||||||
("debugmode", ctypes.c_int)]
|
("debugmode", ctypes.c_int)]
|
||||||
|
|
||||||
|
@ -1248,6 +1249,7 @@ def load_model(model_filename):
|
||||||
inputs.override_kv = args.overridekv.encode("UTF-8") if args.overridekv else "".encode("UTF-8")
|
inputs.override_kv = args.overridekv.encode("UTF-8") if args.overridekv else "".encode("UTF-8")
|
||||||
inputs.override_tensors = args.overridetensors.encode("UTF-8") if args.overridetensors else "".encode("UTF-8")
|
inputs.override_tensors = args.overridetensors.encode("UTF-8") if args.overridetensors else "".encode("UTF-8")
|
||||||
inputs.check_slowness = (not args.highpriority and os.name == 'nt' and 'Intel' in platform.processor())
|
inputs.check_slowness = (not args.highpriority and os.name == 'nt' and 'Intel' in platform.processor())
|
||||||
|
inputs.swa_support = args.experiment_swa
|
||||||
inputs = set_backend_props(inputs)
|
inputs = set_backend_props(inputs)
|
||||||
ret = handle.load_model(inputs)
|
ret = handle.load_model(inputs)
|
||||||
return ret
|
return ret
|
||||||
|
@ -6907,6 +6909,9 @@ if __name__ == '__main__':
|
||||||
admingroup.add_argument("--adminpassword", metavar=('[password]'), help="Require a password to access admin functions. You are strongly advised to use one for publically accessible instances!", default=None)
|
admingroup.add_argument("--adminpassword", metavar=('[password]'), help="Require a password to access admin functions. You are strongly advised to use one for publically accessible instances!", default=None)
|
||||||
admingroup.add_argument("--admindir", metavar=('[directory]'), help="Specify a directory to look for .kcpps configs in, which can be used to swap models.", default="")
|
admingroup.add_argument("--admindir", metavar=('[directory]'), help="Specify a directory to look for .kcpps configs in, which can be used to swap models.", default="")
|
||||||
|
|
||||||
|
experimentgroup = parser.add_argument_group('Experimental Commands, can change or break any time!')
|
||||||
|
experimentgroup.add_argument("--experiment_swa", help="Enables SWA mode. There are no safety checks.", action='store_true')
|
||||||
|
|
||||||
deprecatedgroup = parser.add_argument_group('Deprecated Commands, DO NOT USE!')
|
deprecatedgroup = parser.add_argument_group('Deprecated Commands, DO NOT USE!')
|
||||||
deprecatedgroup.add_argument("--hordeconfig", help=argparse.SUPPRESS, nargs='+')
|
deprecatedgroup.add_argument("--hordeconfig", help=argparse.SUPPRESS, nargs='+')
|
||||||
deprecatedgroup.add_argument("--sdconfig", help=argparse.SUPPRESS, nargs='+')
|
deprecatedgroup.add_argument("--sdconfig", help=argparse.SUPPRESS, nargs='+')
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue