mirror of
https://github.com/diegosouzapw/OmniRoute.git
synced 2026-05-06 02:07:00 +00:00
287 lines
11 KiB
JavaScript
287 lines
11 KiB
JavaScript
import test from "node:test";
|
|
import assert from "node:assert/strict";
|
|
|
|
const {
|
|
applyThinkingBudget,
|
|
setThinkingBudgetConfig,
|
|
getThinkingBudgetConfig,
|
|
ThinkingMode,
|
|
EFFORT_BUDGETS,
|
|
DEFAULT_THINKING_CONFIG,
|
|
THINKING_LEVEL_MAP,
|
|
normalizeThinkingLevel,
|
|
ensureThinkingConfig,
|
|
hasThinkingCapableModel,
|
|
} = await import("../../open-sse/services/thinkingBudget.ts");
|
|
|
|
// ─── Config Management ──────────────────────────────────────────────────────
|
|
|
|
test("default config is passthrough", () => {
|
|
const config = getThinkingBudgetConfig();
|
|
assert.equal(config.mode, ThinkingMode.PASSTHROUGH);
|
|
});
|
|
|
|
test("setThinkingBudgetConfig updates config", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.AUTO });
|
|
assert.equal(getThinkingBudgetConfig().mode, ThinkingMode.AUTO);
|
|
// Reset
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
// ─── PASSTHROUGH Mode ───────────────────────────────────────────────────────
|
|
|
|
test("PASSTHROUGH: body unchanged", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.PASSTHROUGH });
|
|
const body = {
|
|
model: "claude-sonnet-4-20250514",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
thinking: { type: "enabled", budget_tokens: 8192 },
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.deepEqual(result, body);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
// ─── AUTO Mode ──────────────────────────────────────────────────────────────
|
|
|
|
test("AUTO: strips Claude thinking config", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.AUTO });
|
|
const body = {
|
|
model: "claude-sonnet-4-20250514",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
thinking: { type: "enabled", budget_tokens: 8192 },
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.equal(result.thinking, undefined);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
test("AUTO: strips OpenAI reasoning_effort", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.AUTO });
|
|
const body = {
|
|
model: "o3-mini",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
reasoning_effort: "high",
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.equal(result.reasoning_effort, undefined);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
test("AUTO: strips Gemini thinking_config", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.AUTO });
|
|
const body = {
|
|
model: "gemini-2.5-pro",
|
|
generationConfig: { thinking_config: { thinking_budget: 8192 } },
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.equal(result.generationConfig.thinking_config, undefined);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
// ─── CUSTOM Mode ────────────────────────────────────────────────────────────
|
|
|
|
test("CUSTOM: sets Claude budget", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.CUSTOM, customBudget: 4096 });
|
|
const body = {
|
|
model: "claude-sonnet-4-20250514",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
thinking: { type: "enabled", budget_tokens: 8192 },
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.equal(result.thinking.budget_tokens, 4096);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
test("CUSTOM: sets OpenAI reasoning_effort from budget", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.CUSTOM, customBudget: 131072 });
|
|
const body = {
|
|
model: "o3-mini",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
reasoning_effort: "low",
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
// T11 (sub2api gap): full budget (131072) now maps to "max" instead of "high"
|
|
assert.equal(result.reasoning_effort, "max");
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
test("CUSTOM: budget 0 disables Claude thinking", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.CUSTOM, customBudget: 0 });
|
|
const body = {
|
|
model: "claude-sonnet-4-20250514",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
thinking: { type: "enabled", budget_tokens: 8192 },
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.equal(result.thinking.type, "disabled");
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
// ─── ADAPTIVE Mode ──────────────────────────────────────────────────────────
|
|
|
|
test("ADAPTIVE: simple request gets base budget", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.ADAPTIVE, effortLevel: "medium" });
|
|
const body = {
|
|
model: "claude-sonnet-4-20250514",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
thinking: { type: "enabled", budget_tokens: 8192 },
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.equal(result.thinking.budget_tokens, EFFORT_BUDGETS.medium);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
test("ADAPTIVE: complex request (many messages + tools) gets higher budget", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.ADAPTIVE, effortLevel: "medium" });
|
|
const messages = Array.from({ length: 15 }, (_, i) => ({
|
|
role: i % 2 === 0 ? "user" : "assistant",
|
|
content: "x".repeat(3000),
|
|
}));
|
|
const tools = Array.from({ length: 5 }, (_, i) => ({ name: `tool${i}` }));
|
|
const body = {
|
|
model: "claude-sonnet-4-20250514",
|
|
messages,
|
|
tools,
|
|
thinking: { type: "enabled", budget_tokens: 1000 },
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
// multiplier = 1.0 + 0.5 (msgs>10) + 0.5 (tools>3) + 0.3 (lastMsg>2000) = 2.3
|
|
assert.ok(result.thinking.budget_tokens > EFFORT_BUDGETS.medium);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
// ─── Edge Cases ─────────────────────────────────────────────────────────────
|
|
|
|
test("null/undefined body returns as-is", () => {
|
|
assert.equal(applyThinkingBudget(null), null);
|
|
assert.equal(applyThinkingBudget(undefined), undefined);
|
|
});
|
|
|
|
test("EFFORT_BUDGETS has expected keys", () => {
|
|
assert.ok(EFFORT_BUDGETS.none === 0);
|
|
assert.ok(EFFORT_BUDGETS.low > 0);
|
|
assert.ok(EFFORT_BUDGETS.medium > EFFORT_BUDGETS.low);
|
|
assert.ok(EFFORT_BUDGETS.high > EFFORT_BUDGETS.medium);
|
|
});
|
|
|
|
// ─── thinkingLevel String Conversion (Feature 4) ────────────────────────────
|
|
|
|
test("THINKING_LEVEL_MAP has all expected levels", () => {
|
|
assert.equal(THINKING_LEVEL_MAP.none, 0);
|
|
assert.equal(THINKING_LEVEL_MAP.low, 4096);
|
|
assert.equal(THINKING_LEVEL_MAP.medium, 8192);
|
|
assert.equal(THINKING_LEVEL_MAP.high, 24576);
|
|
});
|
|
|
|
test("normalizeThinkingLevel: converts thinkingLevel 'high' to budget", () => {
|
|
const body = {
|
|
model: "claude-sonnet-4",
|
|
thinkingLevel: "high",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
};
|
|
const result = normalizeThinkingLevel(body);
|
|
assert.equal(result.thinking.type, "enabled");
|
|
assert.equal(result.thinking.budget_tokens, 24576);
|
|
assert.equal(result.thinkingLevel, undefined);
|
|
});
|
|
|
|
test("normalizeThinkingLevel: converts thinking_level 'low' to budget", () => {
|
|
const body = {
|
|
model: "claude-sonnet-4",
|
|
thinking_level: "low",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
};
|
|
const result = normalizeThinkingLevel(body);
|
|
assert.equal(result.thinking.type, "enabled");
|
|
assert.equal(result.thinking.budget_tokens, 4096);
|
|
assert.equal(result.thinking_level, undefined);
|
|
});
|
|
|
|
test("normalizeThinkingLevel: converts 'none' to disabled", () => {
|
|
const body = { model: "claude-sonnet-4", thinkingLevel: "none" };
|
|
const result = normalizeThinkingLevel(body);
|
|
assert.equal(result.thinking.type, "disabled");
|
|
assert.equal(result.thinking.budget_tokens, 0);
|
|
});
|
|
|
|
test("normalizeThinkingLevel: converts Gemini thinkingConfig.thinkingLevel", () => {
|
|
const body = {
|
|
model: "gemini-2.5-pro",
|
|
generationConfig: {
|
|
thinkingConfig: { thinkingLevel: "high" },
|
|
},
|
|
};
|
|
const result = normalizeThinkingLevel(body);
|
|
assert.equal(result.generationConfig.thinkingConfig.thinkingBudget, 24576);
|
|
assert.equal(result.generationConfig.thinking_config, undefined);
|
|
});
|
|
|
|
test("normalizeThinkingLevel: ignores unknown string values", () => {
|
|
const body = { model: "claude-sonnet-4", thinkingLevel: "ultra" };
|
|
const result = normalizeThinkingLevel(body);
|
|
assert.equal(result.thinking, undefined); // not converted
|
|
assert.equal(result.thinkingLevel, "ultra"); // preserved
|
|
});
|
|
|
|
// ─── -thinking Suffix Auto-Injection (Feature 5) ────────────────────────────
|
|
|
|
test("ensureThinkingConfig: auto-injects for -thinking suffix model", () => {
|
|
const body = {
|
|
model: "claude-opus-4-6-thinking",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
};
|
|
const result = ensureThinkingConfig(body);
|
|
assert.equal(result.thinking.type, "enabled");
|
|
assert.equal(result.thinking.budget_tokens, EFFORT_BUDGETS.medium);
|
|
});
|
|
|
|
test("ensureThinkingConfig: does NOT override existing thinking config", () => {
|
|
const body = {
|
|
model: "claude-opus-4-6-thinking",
|
|
thinking: { type: "enabled", budget_tokens: 50000 },
|
|
messages: [{ role: "user", content: "hello" }],
|
|
};
|
|
const result = ensureThinkingConfig(body);
|
|
assert.equal(result.thinking.budget_tokens, 50000); // preserved
|
|
});
|
|
|
|
test("ensureThinkingConfig: does nothing for non-thinking models", () => {
|
|
const body = {
|
|
model: "claude-sonnet-4",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
};
|
|
const result = ensureThinkingConfig(body);
|
|
assert.equal(result.thinking, undefined);
|
|
});
|
|
|
|
test("hasThinkingCapableModel: matches -thinking suffix", () => {
|
|
assert.ok(hasThinkingCapableModel({ model: "claude-opus-4-6-thinking" }));
|
|
assert.ok(hasThinkingCapableModel({ model: "kimi-k2-thinking" }));
|
|
assert.ok(hasThinkingCapableModel({ model: "custom-model-thinking" }));
|
|
});
|
|
|
|
test("applyThinkingBudget: thinkingLevel 'high' + PASSTHROUGH = converts and passes through", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.PASSTHROUGH });
|
|
const body = {
|
|
model: "claude-sonnet-4",
|
|
thinkingLevel: "high",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.equal(result.thinking.budget_tokens, 24576);
|
|
assert.equal(result.thinkingLevel, undefined);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|
|
|
|
test("applyThinkingBudget: -thinking model without config + PASSTHROUGH = auto-inject", () => {
|
|
setThinkingBudgetConfig({ mode: ThinkingMode.PASSTHROUGH });
|
|
const body = {
|
|
model: "claude-opus-4-6-thinking",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
};
|
|
const result = applyThinkingBudget(body);
|
|
assert.equal(result.thinking.type, "enabled");
|
|
assert.equal(result.thinking.budget_tokens, EFFORT_BUDGETS.medium);
|
|
setThinkingBudgetConfig(DEFAULT_THINKING_CONFIG);
|
|
});
|