fix: fix server for triton kernel

This commit is contained in:
ceerrep 2025-02-17 18:08:45 +08:00
parent bb1cadfff3
commit ee24eb8dc3
2 changed files with 8 additions and 4 deletions

View file

@@ -106,9 +106,6 @@ def custom_openapi(app):
def main():
cfg = Config()
# Temporarily disable cuda graph by default because of a bug in the prefix cache.
cfg.use_cuda_graph = False
arg_parser = ArgumentParser(cfg)
# 初始化消息