agent-ecosystem/test/main/utils/costCalculation.test.ts
iliya 9b7c9fec0c feat: enhance task assignment notifications and improve message clarity
- Updated the task assignment message in tasks.js to include additional instructions for task initiation based on current workload.
- Modified the notification tests to verify the inclusion of new task initiation guidance.
- Adjusted the formatting in the CollapsibleTeamSection component for better layout consistency.
- Refactored the ChangeExtractorService tests to improve clarity and accuracy in log file reference handling.
- Updated cost calculation tests to reflect changes in model names and pricing structures, ensuring accurate cost assessments.
- Enhanced mention detection tests to include trigger character information for improved functionality.
2026-03-14 23:05:42 +02:00

598 lines
17 KiB
TypeScript

/**
* Tests for cost calculation in jsonl.ts
*/
import { describe, it, expect, vi } from 'vitest';
import { calculateMetrics } from '@main/utils/jsonl';
import type { ParsedMessage } from '@main/types';
describe('Cost Calculation', () => {
describe('Basic Cost Calculation', () => {
it('should calculate cost for simple token usage', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// Expected: (1000 * 0.000003) + (500 * 0.000015) = 0.003 + 0.0075 = 0.0105
expect(metrics.costUsd).toBeCloseTo(0.0105, 6);
});
it('should calculate cost with cache tokens', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 1000,
output_tokens: 500,
cache_creation_input_tokens: 200,
cache_read_input_tokens: 300,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// Input: 1000 * 0.000003 = 0.003
// Output: 500 * 0.000015 = 0.0075
// Cache creation: 200 * 0.00000375 = 0.00075
// Cache read: 300 * 0.0000003 = 0.00009
// Total: 0.01134
expect(metrics.costUsd).toBeCloseTo(0.01134, 6);
});
it('should return 0 cost when no model is specified', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
expect(metrics.costUsd).toBe(0);
});
it('should return 0 cost when model pricing not found', () => {
const warnSpy = vi.spyOn(console, 'warn').mockImplementation(() => undefined);
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'unknown-model',
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
expect(metrics.costUsd).toBe(0);
warnSpy.mockRestore();
});
});
describe('Tiered Pricing', () => {
it('should use base rates for tokens below 200k threshold', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 100_000,
output_tokens: 50_000,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// Input: 100000 * 0.000003 = 0.3
// Output: 50000 * 0.000015 = 0.75
// Total: 1.05
expect(metrics.costUsd).toBeCloseTo(1.05, 6);
});
it('should use base rates for input tokens above 200k when model has no tiered pricing', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-3-opus-20240229',
usage: {
input_tokens: 250_000,
output_tokens: 1_000,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// claude-3-opus-20240229 has no tiered rates in pricing.json, so base rates apply
// Input: 250000 * 0.000015 = 3.75
// Output: 1000 * 0.000075 = 0.075
// Total: 3.825
expect(metrics.costUsd).toBeCloseTo(3.825, 6);
});
it('should use base rates for output tokens above 200k when model has no tiered pricing', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-3-opus-20240229',
usage: {
input_tokens: 1_000,
output_tokens: 250_000,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// No tiered rates, so base rates for all tokens
// Input: 1000 * 0.000015 = 0.015
// Output: 250000 * 0.000075 = 18.75
// Total: 18.765
expect(metrics.costUsd).toBeCloseTo(18.765, 6);
});
it('should use base rates for cache tokens above 200k when model has no tiered pricing', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-3-opus-20240229',
usage: {
input_tokens: 1_000,
output_tokens: 1_000,
cache_creation_input_tokens: 250_000,
cache_read_input_tokens: 250_000,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// No tiered rates for this model, so base rates apply
// Input: 1000 * 0.000015 = 0.015
// Output: 1000 * 0.000075 = 0.075
// Cache creation: 250000 * 0.00001875 = 4.6875
// Cache read: 250000 * 0.0000015 = 0.375
// Total: 5.1525
expect(metrics.costUsd).toBeCloseTo(5.1525, 6);
});
it('should handle model without tiered pricing', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-3-opus-20240229',
usage: {
input_tokens: 250_000,
output_tokens: 250_000,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// No tiered rates, so use base rates even above 200k
// Input: 250000 * 0.000015 = 3.75
// Output: 250000 * 0.000075 = 18.75
// Total: 22.5
expect(metrics.costUsd).toBeCloseTo(22.5, 6);
});
it('should use tiered rates for a model that has them (claude-4-sonnet)', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 250_000,
output_tokens: 1_000,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// claude-4-sonnet has tiered rates:
// input base=0.000003, above_200k=0.000006
// Input: (200000 * 0.000003) + (50000 * 0.000006) = 0.6 + 0.3 = 0.9
// Output: 1000 * 0.000015 = 0.015
// Total: 0.915
expect(metrics.costUsd).toBeCloseTo(0.915, 6);
});
});
describe('Multiple Messages', () => {
it('should aggregate costs across multiple messages', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
{
type: 'assistant',
uuid: 'msg-2',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 2000,
output_tokens: 1000,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// Message 1: (1000 * 0.000003) + (500 * 0.000015) = 0.0105
// Message 2: (2000 * 0.000003) + (1000 * 0.000015) = 0.021
// Total: 0.0315
expect(metrics.costUsd).toBeCloseTo(0.0315, 6);
});
it("should calculate cost per-message using each message's model", () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
{
type: 'assistant',
uuid: 'msg-2',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-3-opus-20240229', // Different model
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// Each message uses its own model's pricing
// Message 1 (sonnet): (1000 * 0.000003) + (500 * 0.000015) = 0.003 + 0.0075 = 0.0105
// Message 2 (opus): (1000 * 0.000015) + (500 * 0.000075) = 0.015 + 0.0375 = 0.0525
// Total cost: 0.0105 + 0.0525 = 0.063
expect(metrics.costUsd).toBeCloseTo(0.063, 6);
});
});
describe('Edge Cases', () => {
it('should handle zero tokens', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 0,
output_tokens: 0,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
expect(metrics.costUsd).toBe(0);
});
it('should handle messages without usage data', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
expect(metrics.costUsd).toBe(0);
});
it('should handle empty messages array', () => {
const messages: ParsedMessage[] = [];
const metrics = calculateMetrics(messages);
expect(metrics.costUsd).toBe(0);
});
});
describe('Model Name Lookup', () => {
it('should find model with exact match', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
expect(metrics.costUsd).toBeGreaterThan(0);
});
it('should find model with case-insensitive match', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'CLAUDE-4-SONNET-20250514',
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
expect(metrics.costUsd).toBeGreaterThan(0);
});
});
describe('Per-Message Tiering', () => {
it('should apply tiered pricing per-message, not to aggregated totals', () => {
// Scenario: Many messages each with cache_read tokens < 200k,
// but aggregated total > 200k
// Each message should use base rates, not tiered rates
const messages: ParsedMessage[] = [];
// Create 10 messages, each with 50k cache_read tokens (500k total)
for (let i = 0; i < 10; i++) {
messages.push({
type: 'assistant',
uuid: `msg-${i}`,
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 0,
output_tokens: 0,
cache_read_input_tokens: 50000,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
});
}
const metrics = calculateMetrics(messages);
// Per-message tiering: Each message uses base rate (< 200k threshold)
// Each message: 50,000 * 0.0000003 = $0.015
// Total: 10 * $0.015 = $0.15
const expectedCost = 10 * 50000 * 0.0000003;
expect(metrics.costUsd).toBeCloseTo(expectedCost, 6);
// Verify this is NOT using tiered rate on aggregated total
// If incorrectly aggregated: (200k * 0.0000003) + (300k * 0.0000006) = $0.24
const incorrectAggregatedCost = 0.24;
expect(metrics.costUsd).not.toBeCloseTo(incorrectAggregatedCost, 2);
});
it('should use base rates when individual messages exceed 200k and model has no tiered rates', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-3-opus-20240229',
usage: {
input_tokens: 0,
output_tokens: 0,
cache_read_input_tokens: 300000, // Exceeds 200k threshold
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// No tiered rates for this model, so all 300k at base rate
// 300,000 * 0.0000015 = $0.45
const expectedCost = 300000 * 0.0000015;
expect(metrics.costUsd).toBeCloseTo(expectedCost, 6);
});
});
describe('Integration with Other Metrics', () => {
it('should include cost alongside other session metrics', () => {
const messages: ParsedMessage[] = [
{
type: 'assistant',
uuid: 'msg-1',
parentUuid: null,
isMeta: false,
timestamp: new Date(),
content: [],
model: 'claude-4-sonnet-20250514',
usage: {
input_tokens: 1000,
output_tokens: 500,
},
toolCalls: [],
toolResults: [],
isSidechain: false,
},
];
const metrics = calculateMetrics(messages);
// Check that all expected metrics are present
expect(metrics).toHaveProperty('totalTokens');
expect(metrics).toHaveProperty('inputTokens');
expect(metrics).toHaveProperty('outputTokens');
expect(metrics).toHaveProperty('costUsd');
expect(metrics.totalTokens).toBe(1500);
expect(metrics.inputTokens).toBe(1000);
expect(metrics.outputTokens).toBe(500);
expect(metrics.costUsd).toBeCloseTo(0.0105, 6);
});
});
});