mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-10 06:14:58 +00:00
fix: fix server for triton kernel
This commit is contained in:
parent
bb1cadfff3
commit
ee24eb8dc3
2 changed files with 8 additions and 4 deletions
|
@@ -106,9 +106,6 @@ def custom_openapi(app):
|
|||
def main():
|
||||
cfg = Config()
|
||||
|
||||
# Temporarily disable cuda graph by default because of a bug in the prefix cache.
|
||||
cfg.use_cuda_graph = False
|
||||
|
||||
arg_parser = ArgumentParser(cfg)
|
||||
|
||||
# 初始化消息
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue