Merge branch 'master' into concedo_experimental

# Conflicts:
#	.flake8
#	.github/workflows/python-lint.yml
#	flake.lock
#	ggml-cuda.cu
#	ggml-quants.c
#	llama.cpp
#	pocs/vdot/q8dot.cpp
#	pocs/vdot/vdot.cpp
#	tests/test-quantize-fns.cpp
#	tests/test-quantize-perf.cpp
This commit is contained in:
Concedo 2024-02-13 00:14:22 +08:00
commit 3cec37c2e0
35 changed files with 2814 additions and 1749 deletions

View file

@@ -466,7 +466,7 @@ maxhordelen = 256
modelbusy = threading.Lock()
requestsinqueue = 0
defaultport = 5001
-KcppVersion = "1.57.1"
+KcppVersion = "1.58"
showdebug = True
showsamplerwarning = True
showmaxctxwarning = True