Add per-model thinking toggles

This commit is contained in:
Alishahryar1 2026-04-25 20:51:07 -07:00
parent 180c942af7
commit f29e693dc5
21 changed files with 220 additions and 54 deletions

View file

@ -17,6 +17,7 @@ class ResolvedModel:
provider_id: str
provider_model: str
provider_model_ref: str
thinking_enabled: bool
@dataclass(frozen=True, slots=True)
@ -39,6 +40,7 @@ class ModelRouter:
def resolve(self, claude_model_name: str) -> ResolvedModel:
provider_model_ref = self._settings.resolve_model(claude_model_name)
thinking_enabled = self._settings.resolve_thinking(claude_model_name)
provider_id = Settings.parse_provider_type(provider_model_ref)
provider_model = Settings.parse_model_name(provider_model_ref)
if provider_model != claude_model_name:
@ -50,6 +52,7 @@ class ModelRouter:
provider_id=provider_id,
provider_model=provider_model,
provider_model_ref=provider_model_ref,
thinking_enabled=thinking_enabled,
)
def resolve_messages_request(

View file

@ -95,6 +95,7 @@ class ClaudeProxyService:
routed.request,
input_tokens=input_tokens,
request_id=request_id,
thinking_enabled=routed.resolved.thinking_enabled,
),
media_type="text/event-stream",
headers={