mirror of
https://github.com/diegosouzapw/OmniRoute.git
synced 2026-05-23 04:28:06 +00:00
Some checks are pending
Build Fork Image (ghcr.io) / Build and Push to ghcr.io (push) Waiting to run
CI / Security Tests (push) Blocked by required conditions
CI / Lint (push) Waiting to run
CI / Build language matrix (push) Waiting to run
CI / i18n Validation (push) Blocked by required conditions
CI / PR Test Policy (push) Waiting to run
CI / Build (push) Waiting to run
CI / Package Artifact (push) Blocked by required conditions
CI / Electron Package Smoke (push) Blocked by required conditions
CI / Unit Tests (1/2) (push) Blocked by required conditions
CI / Unit Tests (2/2) (push) Blocked by required conditions
CI / Node 24 Compatibility (1/2) (push) Blocked by required conditions
CI / Node 24 Compatibility (2/2) (push) Blocked by required conditions
CI / Node 26 Compatibility (1/2) (push) Blocked by required conditions
CI / Node 26 Compatibility (2/2) (push) Blocked by required conditions
CI / Coverage (push) Blocked by required conditions
CI / SonarQube (push) Blocked by required conditions
CI / PR Coverage Comment (push) Blocked by required conditions
CI / E2E Tests (1/6) (push) Blocked by required conditions
CI / E2E Tests (2/6) (push) Blocked by required conditions
CI / E2E Tests (3/6) (push) Blocked by required conditions
CI / E2E Tests (4/6) (push) Blocked by required conditions
CI / E2E Tests (5/6) (push) Blocked by required conditions
CI / E2E Tests (6/6) (push) Blocked by required conditions
CI / Integration Tests (1/2) (push) Blocked by required conditions
CI / Integration Tests (2/2) (push) Blocked by required conditions
CI / CI Dashboard (push) Blocked by required conditions
Publish to Docker Hub / Build and Push Docker (multi-arch) (push) Waiting to run
Integrated into release/v3.8.0
476 lines
15 KiB
TypeScript
476 lines
15 KiB
TypeScript
import test from "node:test";
|
|
import assert from "node:assert/strict";
|
|
import fs from "node:fs";
|
|
import os from "node:os";
|
|
import path from "node:path";
|
|
|
|
const TEST_DATA_DIR = fs.mkdtempSync(path.join(os.tmpdir(), "omniroute-usage-analytics-"));
|
|
process.env.DATA_DIR = TEST_DATA_DIR;
|
|
|
|
const core = await import("../../src/lib/db/core.ts");
|
|
const localDb = await import("../../src/lib/localDb.ts");
|
|
const apiKeysDb = await import("../../src/lib/db/apiKeys.ts");
|
|
const providersDb = await import("../../src/lib/db/providers.ts");
|
|
const usageHistory = await import("../../src/lib/usage/usageHistory.ts");
|
|
const usageStats = await import("../../src/lib/usage/usageStats.ts");
|
|
const legacyUsageAnalytics = await import("../../src/lib/usageAnalytics.ts");
|
|
const callLogs = await import("../../src/lib/usage/callLogs.ts");
|
|
const { calculateCost } = await import("../../src/lib/usage/costCalculator.ts");
|
|
|
|
// Use the official clearPendingRequests export instead of manual cleanup
|
|
const clearPendingRequests = usageHistory.clearPendingRequests;
|
|
|
|
async function resetStorage() {
|
|
core.resetDbInstance();
|
|
apiKeysDb.resetApiKeyState();
|
|
fs.rmSync(TEST_DATA_DIR, { recursive: true, force: true });
|
|
fs.mkdirSync(TEST_DATA_DIR, { recursive: true });
|
|
clearPendingRequests();
|
|
}
|
|
|
|
test.beforeEach(async () => {
|
|
await resetStorage();
|
|
});
|
|
|
|
test.after(() => {
|
|
core.resetDbInstance();
|
|
apiKeysDb.resetApiKeyState();
|
|
fs.rmSync(TEST_DATA_DIR, { recursive: true, force: true });
|
|
});
|
|
|
|
test("usage history persists entries and supports filtering and usageDb compatibility", async () => {
|
|
const recentTimestamp = new Date().toISOString();
|
|
const olderTimestamp = new Date(Date.now() - 2 * 60 * 60 * 1000).toISOString();
|
|
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "provider-a",
|
|
model: "model-a",
|
|
connectionId: "conn-a",
|
|
apiKeyId: "key-a",
|
|
apiKeyName: "Key A",
|
|
tokens: {
|
|
input: 10,
|
|
output: 5,
|
|
cacheRead: 2,
|
|
cacheCreation: 1,
|
|
reasoning: 3,
|
|
},
|
|
status: "success",
|
|
success: true,
|
|
latencyMs: 120,
|
|
timeToFirstTokenMs: 30,
|
|
timestamp: recentTimestamp,
|
|
});
|
|
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "provider-b",
|
|
model: "model-b",
|
|
connectionId: "conn-b",
|
|
tokens: {
|
|
prompt_tokens: 20,
|
|
completion_tokens: 7,
|
|
cached_tokens: 4,
|
|
cache_creation_input_tokens: 2,
|
|
reasoning_tokens: 1,
|
|
},
|
|
status: "error",
|
|
success: false,
|
|
latencyMs: 400,
|
|
errorCode: "rate_limited",
|
|
timestamp: olderTimestamp,
|
|
});
|
|
|
|
const filtered = await usageHistory.getUsageHistory({
|
|
provider: "provider-a",
|
|
startDate: new Date(Date.now() - 5 * 60 * 1000).toISOString(),
|
|
});
|
|
const all = await usageHistory.getUsageDb();
|
|
|
|
assert.equal(filtered.length, 1);
|
|
assert.equal(filtered[0].provider, "provider-a");
|
|
assert.equal(filtered[0].tokens.input, 10);
|
|
assert.equal(filtered[0].tokens.output, 5);
|
|
assert.equal(filtered[0].tokens.cacheRead, 2);
|
|
assert.equal(filtered[0].tokens.cacheCreation, 1);
|
|
assert.equal(filtered[0].tokens.reasoning, 3);
|
|
assert.equal(filtered[0].timeToFirstTokenMs, 30);
|
|
|
|
assert.equal(all.data.history.length, 2);
|
|
assert.equal(all.data.history[0].provider, "provider-b");
|
|
assert.equal(all.data.history[1].provider, "provider-a");
|
|
assert.equal(all.data.history[0].success, false);
|
|
assert.equal(all.data.history[1].success, true);
|
|
});
|
|
|
|
test("getModelLatencyStats aggregates success rate and latency percentiles", async () => {
|
|
const now = Date.now();
|
|
const entries = [
|
|
{ latencyMs: 100, success: true },
|
|
{ latencyMs: 200, success: true },
|
|
{ latencyMs: 400, success: true },
|
|
{ latencyMs: 900, success: false },
|
|
];
|
|
|
|
for (const [index, entry] of entries.entries()) {
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "latency-provider",
|
|
model: "latency-model",
|
|
success: entry.success,
|
|
latencyMs: entry.latencyMs,
|
|
timestamp: new Date(now - index * 60 * 1000).toISOString(),
|
|
});
|
|
}
|
|
|
|
const stats = await usageHistory.getModelLatencyStats({
|
|
windowHours: 1,
|
|
minSamples: 2,
|
|
maxRows: 50,
|
|
});
|
|
|
|
const entry = stats["latency-provider/latency-model"];
|
|
assert.ok(entry);
|
|
assert.equal(entry.totalRequests, 4);
|
|
assert.equal(entry.successfulRequests, 3);
|
|
assert.equal(entry.successRate, 0.75);
|
|
assert.equal(entry.avgLatencyMs, 233);
|
|
assert.equal(entry.p50LatencyMs, 200);
|
|
assert.equal(entry.p95LatencyMs, 400);
|
|
assert.equal(entry.p99LatencyMs, 400);
|
|
assert.ok(entry.latencyStdDev > 0);
|
|
});
|
|
|
|
test("getModelLatencyStats falls back to all latencies when successful sample count is too small", async () => {
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "fallback-provider",
|
|
model: "fallback-model",
|
|
success: true,
|
|
latencyMs: 100,
|
|
timestamp: new Date().toISOString(),
|
|
});
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "fallback-provider",
|
|
model: "fallback-model",
|
|
success: false,
|
|
latencyMs: 500,
|
|
timestamp: new Date().toISOString(),
|
|
});
|
|
|
|
const stats = await usageHistory.getModelLatencyStats({
|
|
windowHours: 1,
|
|
minSamples: 2,
|
|
});
|
|
|
|
const entry = stats["fallback-provider/fallback-model"];
|
|
assert.ok(entry);
|
|
assert.equal(entry.successRate, 0.5);
|
|
assert.equal(entry.avgLatencyMs, 300);
|
|
assert.equal(entry.p50LatencyMs, 500);
|
|
});
|
|
|
|
test("getUsageStats aggregates totals, buckets, pending requests, and cost breakdowns", async () => {
|
|
await localDb.updatePricing({
|
|
"pricing-provider": {
|
|
"pricing-model": {
|
|
input: 1000,
|
|
cached: 100,
|
|
output: 2000,
|
|
reasoning: 3000,
|
|
cache_creation: 1500,
|
|
},
|
|
},
|
|
});
|
|
|
|
const connection = await providersDb.createProviderConnection({
|
|
provider: "pricing-provider",
|
|
authType: "apikey",
|
|
name: "Primary Account",
|
|
apiKey: "sk-test",
|
|
});
|
|
|
|
const recentTokens = {
|
|
input: 100,
|
|
output: 50,
|
|
cacheRead: 20,
|
|
cacheCreation: 10,
|
|
reasoning: 5,
|
|
};
|
|
const oldTokens = {
|
|
input: 40,
|
|
output: 10,
|
|
cacheRead: 0,
|
|
cacheCreation: 0,
|
|
reasoning: 0,
|
|
};
|
|
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "pricing-provider",
|
|
model: "pricing-model",
|
|
connectionId: connection.id,
|
|
apiKeyId: "api-key-1",
|
|
apiKeyName: "Service Key",
|
|
tokens: recentTokens,
|
|
success: true,
|
|
latencyMs: 150,
|
|
timestamp: new Date().toISOString(),
|
|
});
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "pricing-provider",
|
|
model: "pricing-model",
|
|
connectionId: connection.id,
|
|
apiKeyId: "api-key-1",
|
|
apiKeyName: "Service Key",
|
|
tokens: oldTokens,
|
|
success: true,
|
|
latencyMs: 80,
|
|
timestamp: new Date(Date.now() - 20 * 60 * 1000).toISOString(),
|
|
});
|
|
|
|
usageHistory.trackPendingRequest(
|
|
"pricing-model",
|
|
"pricing-provider",
|
|
(connection as any).id,
|
|
true
|
|
);
|
|
usageHistory.trackPendingRequest(
|
|
"pricing-model",
|
|
"pricing-provider" as any,
|
|
(connection as any).id,
|
|
true
|
|
);
|
|
usageHistory.trackPendingRequest(
|
|
"pricing-model",
|
|
"pricing-provider" as any,
|
|
(connection as any).id,
|
|
false
|
|
);
|
|
|
|
const stats = await usageStats.getUsageStats();
|
|
const expectedCost =
|
|
(await calculateCost("pricing-provider", "pricing-model", recentTokens)) +
|
|
(await calculateCost("pricing-provider", "pricing-model", oldTokens));
|
|
|
|
assert.equal(stats.totalRequests, 2);
|
|
assert.equal(stats.totalPromptTokens, 140);
|
|
assert.equal(stats.totalCompletionTokens, 60);
|
|
assert.ok(Math.abs(stats.totalCost - expectedCost) < 1e-9);
|
|
|
|
assert.equal(stats.byProvider["pricing-provider"].requests, 2);
|
|
assert.equal(stats.byProvider["pricing-provider"].promptTokens, 140);
|
|
assert.equal(stats.byModel["pricing-model (pricing-provider)"].requests, 2);
|
|
|
|
const accountKey = "pricing-model (pricing-provider - Primary Account)";
|
|
assert.equal(stats.byAccount[accountKey].requests, 2);
|
|
assert.equal(stats.byAccount[accountKey].accountName, "Primary Account");
|
|
|
|
assert.equal(stats.byApiKey["id:api-key-1"].requests, 2);
|
|
assert.equal(stats.pending.byModel["pricing-model (pricing-provider)"], 1);
|
|
assert.equal(stats.pending.byAccount[connection.id]["pricing-model (pricing-provider)"], 1);
|
|
assert.deepEqual(stats.activeRequests, [
|
|
{
|
|
model: "pricing-model",
|
|
provider: "pricing-provider",
|
|
account: "Primary Account",
|
|
count: 1,
|
|
},
|
|
]);
|
|
|
|
assert.equal(stats.last10Minutes.length, 10);
|
|
const recentBucketTotal = stats.last10Minutes.reduce((sum, bucket) => sum + bucket.requests, 0);
|
|
assert.equal(recentBucketTotal, 1);
|
|
});
|
|
|
|
test("getUsageStats groups renamed API key usage by stable ID", async () => {
|
|
const db = core.getDbInstance();
|
|
const now = new Date().toISOString();
|
|
db.prepare(
|
|
`INSERT INTO api_keys (id, name, key, machine_id, allowed_models, no_log, created_at, key_prefix)
|
|
VALUES (?, ?, ?, ?, ?, ?, ?, ?)`
|
|
).run(
|
|
"api-key-rename",
|
|
"Current Name",
|
|
"omni-test-key",
|
|
"machine1234567890",
|
|
"[]",
|
|
0,
|
|
now,
|
|
"omni-test-ke"
|
|
);
|
|
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "provider-a",
|
|
model: "model-a",
|
|
apiKeyId: "api-key-rename",
|
|
apiKeyName: "Original Name",
|
|
tokens: { input: 10, output: 5 },
|
|
success: true,
|
|
timestamp: new Date(Date.now() - 60_000).toISOString(),
|
|
});
|
|
await usageHistory.saveRequestUsage({
|
|
provider: "provider-a",
|
|
model: "model-a",
|
|
apiKeyId: "api-key-rename",
|
|
apiKeyName: "Renamed Alias",
|
|
tokens: { input: 20, output: 10 },
|
|
success: true,
|
|
timestamp: now,
|
|
});
|
|
|
|
const stats = await usageStats.getUsageStats();
|
|
const row = stats.byApiKey["id:api-key-rename"];
|
|
|
|
assert.ok(row);
|
|
assert.equal(Object.keys(stats.byApiKey).length, 1);
|
|
assert.equal(row.apiKeyId, "api-key-rename");
|
|
assert.equal(row.apiKeyName, "Current Name");
|
|
assert.deepEqual(row.historicalApiKeyNames?.sort(), ["Original Name", "Renamed Alias"]);
|
|
assert.equal(row.requests, 2);
|
|
assert.equal(row.promptTokens, 30);
|
|
assert.equal(row.completionTokens, 15);
|
|
});
|
|
|
|
test("computeAnalytics groups renamed API key usage by stable ID", async () => {
|
|
const analytics = await legacyUsageAnalytics.computeAnalytics(
|
|
[
|
|
{
|
|
timestamp: new Date(Date.now() - 60_000).toISOString(),
|
|
provider: "provider-a",
|
|
model: "model-a",
|
|
apiKeyId: "api-key-legacy",
|
|
apiKeyName: "Original Name",
|
|
tokens: { input: 10, output: 5 },
|
|
},
|
|
{
|
|
timestamp: new Date().toISOString(),
|
|
provider: "provider-a",
|
|
model: "model-a",
|
|
apiKeyId: "api-key-legacy",
|
|
apiKeyName: "Renamed Alias",
|
|
tokens: { input: 20, output: 10 },
|
|
},
|
|
],
|
|
"all"
|
|
);
|
|
|
|
assert.equal(analytics.summary.uniqueApiKeys, 1);
|
|
assert.equal(analytics.byApiKey.length, 1);
|
|
assert.equal(analytics.byApiKey[0].apiKeyId, "api-key-legacy");
|
|
assert.deepEqual(analytics.byApiKey[0].historicalApiKeyNames.sort(), [
|
|
"Original Name",
|
|
"Renamed Alias",
|
|
]);
|
|
assert.equal(analytics.byApiKey[0].requests, 2);
|
|
assert.equal(analytics.byApiKey[0].promptTokens, 30);
|
|
assert.equal(analytics.byApiKey[0].completionTokens, 15);
|
|
});
|
|
|
|
test("Codex Fast service tier applies documented GPT-5.5 and GPT-5.4 cost multipliers", async () => {
|
|
await localDb.updatePricing({
|
|
codex: {
|
|
"gpt-5.5": { input: 5, output: 30 },
|
|
"gpt-5.4": { input: 5, output: 30 },
|
|
},
|
|
});
|
|
|
|
const tokens = { input: 1000, output: 500 };
|
|
|
|
assert.equal(await calculateCost("codex", "gpt-5.5", tokens), 0.02);
|
|
assert.equal(await calculateCost("codex", "gpt-5.5", tokens, { serviceTier: "priority" }), 0.05);
|
|
assert.equal(await calculateCost("codex", "gpt-5.4-high", tokens, { serviceTier: "fast" }), 0.04);
|
|
assert.equal(await calculateCost("openai", "gpt-5.5", tokens, { serviceTier: "priority" }), 0.02);
|
|
});
|
|
|
|
test("recent request summaries are generated from SQLite call logs", async () => {
|
|
const connection = await providersDb.createProviderConnection({
|
|
provider: "log-provider",
|
|
authType: "apikey",
|
|
name: "Named Account",
|
|
apiKey: "sk-test",
|
|
});
|
|
|
|
for (let i = 0; i < 205; i++) {
|
|
await callLogs.saveCallLog({
|
|
id: `log-${i}`,
|
|
timestamp: new Date(Date.now() + i).toISOString(),
|
|
method: "POST",
|
|
path: "/v1/chat/completions",
|
|
status: 200,
|
|
model: `model-${i}`,
|
|
provider: "log-provider",
|
|
connectionId: connection.id,
|
|
tokens: { input: i + 1, output: i + 2 },
|
|
requestBody: { index: i },
|
|
responseBody: { ok: true, index: i },
|
|
});
|
|
}
|
|
|
|
const recent = await usageHistory.getRecentLogs(3);
|
|
|
|
assert.equal(recent.length, 3);
|
|
assert.match(recent[0], /model-204/);
|
|
assert.match(recent[0], /LOG-PROVIDER/);
|
|
assert.match(recent[0], /Named Account/);
|
|
assert.match(recent[0], /205 \| 206 \| 200$/);
|
|
});
|
|
|
|
test("pending request metadata stores sanitized payload previews and clears after completion", async () => {
|
|
usageHistory.trackPendingRequest("gpt-test", "openai", "conn-preview", true, {
|
|
clientEndpoint: "/v1/chat/completions",
|
|
clientRequest: {
|
|
token: "super-secret-token",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
},
|
|
});
|
|
|
|
usageHistory.updatePendingRequest("gpt-test", "openai", "conn-preview", {
|
|
providerUrl: "https://api.example.com/v1/chat/completions",
|
|
providerRequest: {
|
|
authorization: "Bearer super-secret-token",
|
|
messages: [{ role: "user", content: "hello" }],
|
|
},
|
|
});
|
|
|
|
const pending = usageHistory.getPendingRequests();
|
|
const detail = pending.details["conn-preview"]["gpt-test (openai)"];
|
|
const clientRequestPreview = detail.clientRequest as Record<string, unknown>;
|
|
const providerRequestPreview = detail.providerRequest as Record<string, unknown>;
|
|
|
|
assert.equal(detail.clientEndpoint, "/v1/chat/completions");
|
|
assert.equal(clientRequestPreview.token, "[REDACTED]");
|
|
assert.equal(providerRequestPreview.authorization, "[REDACTED]");
|
|
assert.equal(detail.providerUrl, "https://api.example.com/v1/chat/completions");
|
|
|
|
usageHistory.trackPendingRequest("gpt-test", "openai", "conn-preview", false);
|
|
assert.equal(pending.details["conn-preview"], undefined);
|
|
});
|
|
|
|
test("clearPendingRequests resets all pending counts and details", () => {
|
|
// Simulate leaked pending counts (increment without matching decrement)
|
|
usageHistory.trackPendingRequest("model-a", "provider-x", "conn-1", true);
|
|
usageHistory.trackPendingRequest("model-a", "provider-x", "conn-1", true);
|
|
usageHistory.trackPendingRequest("model-b", "provider-y", "conn-2", true);
|
|
|
|
const before = usageHistory.getPendingRequests();
|
|
assert.equal(before.byModel["model-a (provider-x)"], 2);
|
|
assert.equal(before.byModel["model-b (provider-y)"], 1);
|
|
assert.ok(before.details["conn-1"]);
|
|
assert.ok(before.details["conn-2"]);
|
|
|
|
// Clear all pending
|
|
usageHistory.clearPendingRequests();
|
|
|
|
const after = usageHistory.getPendingRequests();
|
|
assert.equal(Object.keys(after.byModel).length, 0);
|
|
assert.equal(Object.keys(after.byAccount).length, 0);
|
|
assert.equal(Object.keys(after.details).length, 0);
|
|
});
|
|
|
|
test("clearPendingRequests allows fresh tracking after clearing", () => {
|
|
usageHistory.trackPendingRequest("model-c", "provider-z", "conn-3", true);
|
|
usageHistory.clearPendingRequests();
|
|
|
|
// Tracking should work normally after clearing
|
|
usageHistory.trackPendingRequest("model-d", "provider-w", "conn-4", true);
|
|
const pending = usageHistory.getPendingRequests();
|
|
assert.equal(pending.byModel["model-d (provider-w)"], 1);
|
|
assert.ok(pending.details["conn-4"]);
|
|
});
|