Added support for memory, plus Gemma and GLM prompt fixes, for batching mode

This commit is contained in:
Concedo 2026-05-10 23:39:03 +08:00
parent 33ca75d56f
commit bfaddd7a3b
2 changed files with 23 additions and 5 deletions

View file

@@ -2290,7 +2290,7 @@ def continuous_batching_python_eligible(genparams, api_format):
return False
if not getattr(args, "noshift", False) or getattr(args, "smartcontext", False) or getattr(args, "draftmodel", "") or getattr(args, "mmproj", "") or getattr(args, "enableguidance", False):
return False
if genparams.get("memory") or genparams.get("negative_prompt") or genparams.get("images") or genparams.get("audio"):
if genparams.get("negative_prompt") or genparams.get("images") or genparams.get("audio"):
return False
if genparams.get("ban_eos_token", False):
return False