OmniRoute/tests/unit/usage-analytics.test.ts
Diego Rodrigues de Sa e Souza 3d75fb3fae
Some checks are pending
Build Fork Image (ghcr.io) / Build and Push to ghcr.io (push) Waiting to run
CI / Security Tests (push) Blocked by required conditions
CI / Lint (push) Waiting to run
CI / Build language matrix (push) Waiting to run
CI / i18n Validation (push) Blocked by required conditions
CI / PR Test Policy (push) Waiting to run
CI / Build (push) Waiting to run
CI / Package Artifact (push) Blocked by required conditions
CI / Electron Package Smoke (push) Blocked by required conditions
CI / Unit Tests (1/2) (push) Blocked by required conditions
CI / Unit Tests (2/2) (push) Blocked by required conditions
CI / Node 24 Compatibility (1/2) (push) Blocked by required conditions
CI / Node 24 Compatibility (2/2) (push) Blocked by required conditions
CI / Node 26 Compatibility (1/2) (push) Blocked by required conditions
CI / Node 26 Compatibility (2/2) (push) Blocked by required conditions
CI / Coverage (push) Blocked by required conditions
CI / SonarQube (push) Blocked by required conditions
CI / PR Coverage Comment (push) Blocked by required conditions
CI / E2E Tests (1/6) (push) Blocked by required conditions
CI / E2E Tests (2/6) (push) Blocked by required conditions
CI / E2E Tests (3/6) (push) Blocked by required conditions
CI / E2E Tests (4/6) (push) Blocked by required conditions
CI / E2E Tests (5/6) (push) Blocked by required conditions
CI / E2E Tests (6/6) (push) Blocked by required conditions
CI / Integration Tests (1/2) (push) Blocked by required conditions
CI / Integration Tests (2/2) (push) Blocked by required conditions
CI / CI Dashboard (push) Blocked by required conditions
Publish to Docker Hub / Build and Push Docker (multi-arch) (push) Waiting to run
Release v3.8.0 (#2073)
Integrated into release/v3.8.0
2026-05-10 00:55:06 -03:00

476 lines
15 KiB
TypeScript

import test from "node:test";
import assert from "node:assert/strict";
import fs from "node:fs";
import os from "node:os";
import path from "node:path";
const TEST_DATA_DIR = fs.mkdtempSync(path.join(os.tmpdir(), "omniroute-usage-analytics-"));
process.env.DATA_DIR = TEST_DATA_DIR;
const core = await import("../../src/lib/db/core.ts");
const localDb = await import("../../src/lib/localDb.ts");
const apiKeysDb = await import("../../src/lib/db/apiKeys.ts");
const providersDb = await import("../../src/lib/db/providers.ts");
const usageHistory = await import("../../src/lib/usage/usageHistory.ts");
const usageStats = await import("../../src/lib/usage/usageStats.ts");
const legacyUsageAnalytics = await import("../../src/lib/usageAnalytics.ts");
const callLogs = await import("../../src/lib/usage/callLogs.ts");
const { calculateCost } = await import("../../src/lib/usage/costCalculator.ts");
// Use the official clearPendingRequests export instead of manual cleanup
const clearPendingRequests = usageHistory.clearPendingRequests;
async function resetStorage() {
core.resetDbInstance();
apiKeysDb.resetApiKeyState();
fs.rmSync(TEST_DATA_DIR, { recursive: true, force: true });
fs.mkdirSync(TEST_DATA_DIR, { recursive: true });
clearPendingRequests();
}
test.beforeEach(async () => {
await resetStorage();
});
test.after(() => {
core.resetDbInstance();
apiKeysDb.resetApiKeyState();
fs.rmSync(TEST_DATA_DIR, { recursive: true, force: true });
});
test("usage history persists entries and supports filtering and usageDb compatibility", async () => {
const recentTimestamp = new Date().toISOString();
const olderTimestamp = new Date(Date.now() - 2 * 60 * 60 * 1000).toISOString();
await usageHistory.saveRequestUsage({
provider: "provider-a",
model: "model-a",
connectionId: "conn-a",
apiKeyId: "key-a",
apiKeyName: "Key A",
tokens: {
input: 10,
output: 5,
cacheRead: 2,
cacheCreation: 1,
reasoning: 3,
},
status: "success",
success: true,
latencyMs: 120,
timeToFirstTokenMs: 30,
timestamp: recentTimestamp,
});
await usageHistory.saveRequestUsage({
provider: "provider-b",
model: "model-b",
connectionId: "conn-b",
tokens: {
prompt_tokens: 20,
completion_tokens: 7,
cached_tokens: 4,
cache_creation_input_tokens: 2,
reasoning_tokens: 1,
},
status: "error",
success: false,
latencyMs: 400,
errorCode: "rate_limited",
timestamp: olderTimestamp,
});
const filtered = await usageHistory.getUsageHistory({
provider: "provider-a",
startDate: new Date(Date.now() - 5 * 60 * 1000).toISOString(),
});
const all = await usageHistory.getUsageDb();
assert.equal(filtered.length, 1);
assert.equal(filtered[0].provider, "provider-a");
assert.equal(filtered[0].tokens.input, 10);
assert.equal(filtered[0].tokens.output, 5);
assert.equal(filtered[0].tokens.cacheRead, 2);
assert.equal(filtered[0].tokens.cacheCreation, 1);
assert.equal(filtered[0].tokens.reasoning, 3);
assert.equal(filtered[0].timeToFirstTokenMs, 30);
assert.equal(all.data.history.length, 2);
assert.equal(all.data.history[0].provider, "provider-b");
assert.equal(all.data.history[1].provider, "provider-a");
assert.equal(all.data.history[0].success, false);
assert.equal(all.data.history[1].success, true);
});
test("getModelLatencyStats aggregates success rate and latency percentiles", async () => {
const now = Date.now();
const entries = [
{ latencyMs: 100, success: true },
{ latencyMs: 200, success: true },
{ latencyMs: 400, success: true },
{ latencyMs: 900, success: false },
];
for (const [index, entry] of entries.entries()) {
await usageHistory.saveRequestUsage({
provider: "latency-provider",
model: "latency-model",
success: entry.success,
latencyMs: entry.latencyMs,
timestamp: new Date(now - index * 60 * 1000).toISOString(),
});
}
const stats = await usageHistory.getModelLatencyStats({
windowHours: 1,
minSamples: 2,
maxRows: 50,
});
const entry = stats["latency-provider/latency-model"];
assert.ok(entry);
assert.equal(entry.totalRequests, 4);
assert.equal(entry.successfulRequests, 3);
assert.equal(entry.successRate, 0.75);
assert.equal(entry.avgLatencyMs, 233);
assert.equal(entry.p50LatencyMs, 200);
assert.equal(entry.p95LatencyMs, 400);
assert.equal(entry.p99LatencyMs, 400);
assert.ok(entry.latencyStdDev > 0);
});
test("getModelLatencyStats falls back to all latencies when successful sample count is too small", async () => {
await usageHistory.saveRequestUsage({
provider: "fallback-provider",
model: "fallback-model",
success: true,
latencyMs: 100,
timestamp: new Date().toISOString(),
});
await usageHistory.saveRequestUsage({
provider: "fallback-provider",
model: "fallback-model",
success: false,
latencyMs: 500,
timestamp: new Date().toISOString(),
});
const stats = await usageHistory.getModelLatencyStats({
windowHours: 1,
minSamples: 2,
});
const entry = stats["fallback-provider/fallback-model"];
assert.ok(entry);
assert.equal(entry.successRate, 0.5);
assert.equal(entry.avgLatencyMs, 300);
assert.equal(entry.p50LatencyMs, 500);
});
test("getUsageStats aggregates totals, buckets, pending requests, and cost breakdowns", async () => {
await localDb.updatePricing({
"pricing-provider": {
"pricing-model": {
input: 1000,
cached: 100,
output: 2000,
reasoning: 3000,
cache_creation: 1500,
},
},
});
const connection = await providersDb.createProviderConnection({
provider: "pricing-provider",
authType: "apikey",
name: "Primary Account",
apiKey: "sk-test",
});
const recentTokens = {
input: 100,
output: 50,
cacheRead: 20,
cacheCreation: 10,
reasoning: 5,
};
const oldTokens = {
input: 40,
output: 10,
cacheRead: 0,
cacheCreation: 0,
reasoning: 0,
};
await usageHistory.saveRequestUsage({
provider: "pricing-provider",
model: "pricing-model",
connectionId: connection.id,
apiKeyId: "api-key-1",
apiKeyName: "Service Key",
tokens: recentTokens,
success: true,
latencyMs: 150,
timestamp: new Date().toISOString(),
});
await usageHistory.saveRequestUsage({
provider: "pricing-provider",
model: "pricing-model",
connectionId: connection.id,
apiKeyId: "api-key-1",
apiKeyName: "Service Key",
tokens: oldTokens,
success: true,
latencyMs: 80,
timestamp: new Date(Date.now() - 20 * 60 * 1000).toISOString(),
});
usageHistory.trackPendingRequest(
"pricing-model",
"pricing-provider",
(connection as any).id,
true
);
usageHistory.trackPendingRequest(
"pricing-model",
"pricing-provider" as any,
(connection as any).id,
true
);
usageHistory.trackPendingRequest(
"pricing-model",
"pricing-provider" as any,
(connection as any).id,
false
);
const stats = await usageStats.getUsageStats();
const expectedCost =
(await calculateCost("pricing-provider", "pricing-model", recentTokens)) +
(await calculateCost("pricing-provider", "pricing-model", oldTokens));
assert.equal(stats.totalRequests, 2);
assert.equal(stats.totalPromptTokens, 140);
assert.equal(stats.totalCompletionTokens, 60);
assert.ok(Math.abs(stats.totalCost - expectedCost) < 1e-9);
assert.equal(stats.byProvider["pricing-provider"].requests, 2);
assert.equal(stats.byProvider["pricing-provider"].promptTokens, 140);
assert.equal(stats.byModel["pricing-model (pricing-provider)"].requests, 2);
const accountKey = "pricing-model (pricing-provider - Primary Account)";
assert.equal(stats.byAccount[accountKey].requests, 2);
assert.equal(stats.byAccount[accountKey].accountName, "Primary Account");
assert.equal(stats.byApiKey["id:api-key-1"].requests, 2);
assert.equal(stats.pending.byModel["pricing-model (pricing-provider)"], 1);
assert.equal(stats.pending.byAccount[connection.id]["pricing-model (pricing-provider)"], 1);
assert.deepEqual(stats.activeRequests, [
{
model: "pricing-model",
provider: "pricing-provider",
account: "Primary Account",
count: 1,
},
]);
assert.equal(stats.last10Minutes.length, 10);
const recentBucketTotal = stats.last10Minutes.reduce((sum, bucket) => sum + bucket.requests, 0);
assert.equal(recentBucketTotal, 1);
});
test("getUsageStats groups renamed API key usage by stable ID", async () => {
const db = core.getDbInstance();
const now = new Date().toISOString();
db.prepare(
`INSERT INTO api_keys (id, name, key, machine_id, allowed_models, no_log, created_at, key_prefix)
VALUES (?, ?, ?, ?, ?, ?, ?, ?)`
).run(
"api-key-rename",
"Current Name",
"omni-test-key",
"machine1234567890",
"[]",
0,
now,
"omni-test-ke"
);
await usageHistory.saveRequestUsage({
provider: "provider-a",
model: "model-a",
apiKeyId: "api-key-rename",
apiKeyName: "Original Name",
tokens: { input: 10, output: 5 },
success: true,
timestamp: new Date(Date.now() - 60_000).toISOString(),
});
await usageHistory.saveRequestUsage({
provider: "provider-a",
model: "model-a",
apiKeyId: "api-key-rename",
apiKeyName: "Renamed Alias",
tokens: { input: 20, output: 10 },
success: true,
timestamp: now,
});
const stats = await usageStats.getUsageStats();
const row = stats.byApiKey["id:api-key-rename"];
assert.ok(row);
assert.equal(Object.keys(stats.byApiKey).length, 1);
assert.equal(row.apiKeyId, "api-key-rename");
assert.equal(row.apiKeyName, "Current Name");
assert.deepEqual(row.historicalApiKeyNames?.sort(), ["Original Name", "Renamed Alias"]);
assert.equal(row.requests, 2);
assert.equal(row.promptTokens, 30);
assert.equal(row.completionTokens, 15);
});
test("computeAnalytics groups renamed API key usage by stable ID", async () => {
const analytics = await legacyUsageAnalytics.computeAnalytics(
[
{
timestamp: new Date(Date.now() - 60_000).toISOString(),
provider: "provider-a",
model: "model-a",
apiKeyId: "api-key-legacy",
apiKeyName: "Original Name",
tokens: { input: 10, output: 5 },
},
{
timestamp: new Date().toISOString(),
provider: "provider-a",
model: "model-a",
apiKeyId: "api-key-legacy",
apiKeyName: "Renamed Alias",
tokens: { input: 20, output: 10 },
},
],
"all"
);
assert.equal(analytics.summary.uniqueApiKeys, 1);
assert.equal(analytics.byApiKey.length, 1);
assert.equal(analytics.byApiKey[0].apiKeyId, "api-key-legacy");
assert.deepEqual(analytics.byApiKey[0].historicalApiKeyNames.sort(), [
"Original Name",
"Renamed Alias",
]);
assert.equal(analytics.byApiKey[0].requests, 2);
assert.equal(analytics.byApiKey[0].promptTokens, 30);
assert.equal(analytics.byApiKey[0].completionTokens, 15);
});
test("Codex Fast service tier applies documented GPT-5.5 and GPT-5.4 cost multipliers", async () => {
await localDb.updatePricing({
codex: {
"gpt-5.5": { input: 5, output: 30 },
"gpt-5.4": { input: 5, output: 30 },
},
});
const tokens = { input: 1000, output: 500 };
assert.equal(await calculateCost("codex", "gpt-5.5", tokens), 0.02);
assert.equal(await calculateCost("codex", "gpt-5.5", tokens, { serviceTier: "priority" }), 0.05);
assert.equal(await calculateCost("codex", "gpt-5.4-high", tokens, { serviceTier: "fast" }), 0.04);
assert.equal(await calculateCost("openai", "gpt-5.5", tokens, { serviceTier: "priority" }), 0.02);
});
test("recent request summaries are generated from SQLite call logs", async () => {
const connection = await providersDb.createProviderConnection({
provider: "log-provider",
authType: "apikey",
name: "Named Account",
apiKey: "sk-test",
});
for (let i = 0; i < 205; i++) {
await callLogs.saveCallLog({
id: `log-${i}`,
timestamp: new Date(Date.now() + i).toISOString(),
method: "POST",
path: "/v1/chat/completions",
status: 200,
model: `model-${i}`,
provider: "log-provider",
connectionId: connection.id,
tokens: { input: i + 1, output: i + 2 },
requestBody: { index: i },
responseBody: { ok: true, index: i },
});
}
const recent = await usageHistory.getRecentLogs(3);
assert.equal(recent.length, 3);
assert.match(recent[0], /model-204/);
assert.match(recent[0], /LOG-PROVIDER/);
assert.match(recent[0], /Named Account/);
assert.match(recent[0], /205 \| 206 \| 200$/);
});
test("pending request metadata stores sanitized payload previews and clears after completion", async () => {
usageHistory.trackPendingRequest("gpt-test", "openai", "conn-preview", true, {
clientEndpoint: "/v1/chat/completions",
clientRequest: {
token: "super-secret-token",
messages: [{ role: "user", content: "hello" }],
},
});
usageHistory.updatePendingRequest("gpt-test", "openai", "conn-preview", {
providerUrl: "https://api.example.com/v1/chat/completions",
providerRequest: {
authorization: "Bearer super-secret-token",
messages: [{ role: "user", content: "hello" }],
},
});
const pending = usageHistory.getPendingRequests();
const detail = pending.details["conn-preview"]["gpt-test (openai)"];
const clientRequestPreview = detail.clientRequest as Record<string, unknown>;
const providerRequestPreview = detail.providerRequest as Record<string, unknown>;
assert.equal(detail.clientEndpoint, "/v1/chat/completions");
assert.equal(clientRequestPreview.token, "[REDACTED]");
assert.equal(providerRequestPreview.authorization, "[REDACTED]");
assert.equal(detail.providerUrl, "https://api.example.com/v1/chat/completions");
usageHistory.trackPendingRequest("gpt-test", "openai", "conn-preview", false);
assert.equal(pending.details["conn-preview"], undefined);
});
test("clearPendingRequests resets all pending counts and details", () => {
// Simulate leaked pending counts (increment without matching decrement)
usageHistory.trackPendingRequest("model-a", "provider-x", "conn-1", true);
usageHistory.trackPendingRequest("model-a", "provider-x", "conn-1", true);
usageHistory.trackPendingRequest("model-b", "provider-y", "conn-2", true);
const before = usageHistory.getPendingRequests();
assert.equal(before.byModel["model-a (provider-x)"], 2);
assert.equal(before.byModel["model-b (provider-y)"], 1);
assert.ok(before.details["conn-1"]);
assert.ok(before.details["conn-2"]);
// Clear all pending
usageHistory.clearPendingRequests();
const after = usageHistory.getPendingRequests();
assert.equal(Object.keys(after.byModel).length, 0);
assert.equal(Object.keys(after.byAccount).length, 0);
assert.equal(Object.keys(after.details).length, 0);
});
test("clearPendingRequests allows fresh tracking after clearing", () => {
usageHistory.trackPendingRequest("model-c", "provider-z", "conn-3", true);
usageHistory.clearPendingRequests();
// Tracking should work normally after clearing
usageHistory.trackPendingRequest("model-d", "provider-w", "conn-4", true);
const pending = usageHistory.getPendingRequests();
assert.equal(pending.byModel["model-d (provider-w)"], 1);
assert.ok(pending.details["conn-4"]);
});