mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-09 22:05:30 +00:00
add balance-serve, support concurrence
This commit is contained in:
parent
8d0292aa44
commit
25cee5810e
196 changed files with 22077 additions and 565 deletions
|
@ -15,6 +15,7 @@ from ktransformers.server.backend.context_manager import ThreadContextManager
|
|||
from ktransformers.server.backend.interfaces.exllamav2 import ExllamaInterface
|
||||
from ktransformers.server.backend.interfaces.transformers import TransformersInterface
|
||||
from ktransformers.server.backend.interfaces.ktransformers import KTransformersInterface
|
||||
|
||||
def create_interface(config: Config, default_args: ConfigArgs):
|
||||
if config.backend_type=='transformers':
|
||||
from ktransformers.server.backend.interfaces.transformers import TransformersInterface as BackendInterface
|
||||
|
@ -22,6 +23,8 @@ def create_interface(config: Config, default_args: ConfigArgs):
|
|||
from ktransformers.server.backend.interfaces.exllamav2 import ExllamaInterface as BackendInterface
|
||||
elif config.backend_type == 'ktransformers':
|
||||
from ktransformers.server.backend.interfaces.ktransformers import KTransformersInterface as BackendInterface
|
||||
elif config.backend_type == 'balance_serve':
|
||||
from ktransformers.server.backend.interfaces.balance_serve import BalanceServeInterface as BackendInterface
|
||||
else:
|
||||
raise NotImplementedError(f'{config.backend_type} not implemented')
|
||||
GlobalInterface.interface = BackendInterface(default_args)
|
||||
|
@ -30,9 +33,9 @@ def create_interface(config: Config, default_args: ConfigArgs):
|
|||
class GlobalContextManager:
|
||||
context_manager: ThreadContextManager
|
||||
class GlobalInterface:
|
||||
interface: TransformersInterface | KTransformersInterface | ExllamaInterface
|
||||
interface: TransformersInterface | KTransformersInterface | ExllamaInterface
|
||||
|
||||
def get_thread_context_manager() -> ThreadContextManager:
|
||||
def get_thread_context_manager() -> GlobalContextManager:
|
||||
return GlobalContextManager.context_manager
|
||||
def get_interface() -> TransformersInterface | KTransformersInterface | ExllamaInterface:
|
||||
def get_interface() -> GlobalInterface:
|
||||
return GlobalInterface.interface
|
Loading…
Add table
Add a link
Reference in a new issue