Improved optimizations to decrease LLM calls further and increase throughput

This commit is contained in:
Alishahryar1 2026-02-18 17:54:41 -08:00
parent 593fb55954
commit e7ac85264f
5 changed files with 53 additions and 4 deletions

View file

@@ -81,7 +81,12 @@ def test_error_fallbacks():
RateLimitError,
)
base_payload = {"model": "test", "messages": [], "max_tokens": 10, "stream": True}
base_payload = {
"model": "test",
"messages": [{"role": "user", "content": "Hi"}],
"max_tokens": 10,
"stream": True,
}
def _raise_auth(*args, **kwargs):
raise AuthenticationError("Invalid Key")