feat(cost): add budget tracking core and harden storage reliability (#292)

This commit is contained in:
Chummy 2026-02-16 23:40:47 +08:00 committed by GitHub
parent 8882746ced
commit e4944a5fc2
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
8 changed files with 890 additions and 2 deletions

193
src/cost/types.rs Normal file
View file

@ -0,0 +1,193 @@
use serde::{Deserialize, Serialize};
/// Token usage information from a single API call.
///
/// Records built through `TokenUsage::new` have `total_tokens`, `cost_usd` and
/// `timestamp` derived from the other inputs. Every field is public, so values
/// constructed or deserialized by other means are not guaranteed to keep those
/// relationships.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct TokenUsage {
/// Model identifier (e.g., "anthropic/claude-sonnet-4-20250514")
pub model: String,
/// Number of input/prompt tokens.
pub input_tokens: u64,
/// Number of output/completion tokens.
pub output_tokens: u64,
/// Total tokens; `TokenUsage::new` sets this to the saturating sum of
/// `input_tokens` and `output_tokens`.
pub total_tokens: u64,
/// Calculated cost in USD; `TokenUsage::new` derives it from the token
/// counts and the per-million-token prices it is given.
pub cost_usd: f64,
/// Timestamp of the request (UTC); `TokenUsage::new` records the moment the
/// value is constructed.
pub timestamp: chrono::DateTime<chrono::Utc>,
}
impl TokenUsage {
    /// Normalize a per-million-token price so it can be used in arithmetic.
    ///
    /// Anything that is not a finite, strictly positive number (NaN, either
    /// infinity, zero, negatives) is replaced by `0.0`.
    fn sanitize_price(value: f64) -> f64 {
        // NaN is caught by the `is_finite` test, so the `<=` comparison below
        // only ever sees ordinary numbers.
        if !value.is_finite() || value <= 0.0 {
            return 0.0;
        }
        value
    }

    /// Build a usage record for one API call and price it.
    ///
    /// * `model` - model identifier stored on the record.
    /// * `input_tokens` / `output_tokens` - token counts for the call.
    /// * `input_price_per_million` / `output_price_per_million` - USD price
    ///   per one million tokens; invalid prices are treated as `0.0`.
    ///
    /// `total_tokens` is the saturating sum of both counts, `cost_usd` is the
    /// sum of both priced parts, and `timestamp` is the current UTC time.
    pub fn new(
        model: impl Into<String>,
        input_tokens: u64,
        output_tokens: u64,
        input_price_per_million: f64,
        output_price_per_million: f64,
    ) -> Self {
        const TOKENS_PER_MILLION: f64 = 1_000_000.0;

        // cost = (tokens / 1M) * price_per_million, with the price cleaned first.
        let priced = |tokens: u64, raw_price: f64| -> f64 {
            (tokens as f64 / TOKENS_PER_MILLION) * Self::sanitize_price(raw_price)
        };
        let prompt_cost = priced(input_tokens, input_price_per_million);
        let completion_cost = priced(output_tokens, output_price_per_million);

        Self {
            model: model.into(),
            input_tokens,
            output_tokens,
            // Saturate rather than wrap if the two counts overflow `u64`.
            total_tokens: input_tokens.saturating_add(output_tokens),
            cost_usd: prompt_cost + completion_cost,
            timestamp: chrono::Utc::now(),
        }
    }

    /// Cost of this call in USD (the stored `cost_usd` value).
    pub fn cost(&self) -> f64 {
        self.cost_usd
    }
}
/// Time period for cost aggregation.
// NOTE(review): the exact boundaries of each period (calendar vs. rolling
// window, time zone) are decided by the aggregation code, which is not visible
// here — confirm there before relying on them.
#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
pub enum UsagePeriod {
/// Aggregate over a session.
Session,
/// Aggregate over a day.
Day,
/// Aggregate over a month.
Month,
}
/// A single cost record for persistent storage.
///
/// Pairs one `TokenUsage` with an identifier of its own and the session it
/// belongs to.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct CostRecord {
/// Unique identifier; `CostRecord::new` fills this with a freshly generated
/// v4 UUID rendered as a string.
pub id: String,
/// Token usage details
pub usage: TokenUsage,
/// Session identifier (for grouping)
pub session_id: String,
}
impl CostRecord {
    /// Wrap `usage` in a storable record tagged with `session_id`.
    ///
    /// Each call assigns a new v4 UUID (as a string) to `id`.
    pub fn new(session_id: impl Into<String>, usage: TokenUsage) -> Self {
        let id = uuid::Uuid::new_v4().to_string();
        let session_id: String = session_id.into();
        Self {
            id,
            usage,
            session_id,
        }
    }
}
/// Budget enforcement result.
///
/// `Warning` and `Exceeded` carry the same three fields: the current amount,
/// the limit, and the period they refer to.
// NOTE(review): the warning threshold and the code that fills in these values
// are not visible here — confirm their exact meaning against the budget checker.
#[derive(Debug, Clone)]
pub enum BudgetCheck {
/// Within budget, request can proceed
Allowed,
/// Warning threshold exceeded but request can proceed
Warning {
/// Current amount in USD for `period`.
current_usd: f64,
/// Limit in USD for `period`.
limit_usd: f64,
/// Period the amounts refer to.
period: UsagePeriod,
},
/// Budget exceeded, request blocked
Exceeded {
/// Current amount in USD for `period`.
current_usd: f64,
/// Limit in USD for `period`.
limit_usd: f64,
/// Period the amounts refer to.
period: UsagePeriod,
},
}
/// Cost summary for reporting.
///
/// `CostSummary::default()` yields an all-zero summary with an empty
/// per-model breakdown.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct CostSummary {
/// Total cost for the session, in USD
pub session_cost_usd: f64,
/// Total cost for the day, in USD
pub daily_cost_usd: f64,
/// Total cost for the month, in USD
pub monthly_cost_usd: f64,
/// Total tokens used
// NOTE(review): which period this count and `request_count` cover is set by
// the code that builds the summary, not shown here — confirm.
pub total_tokens: u64,
/// Number of requests
pub request_count: usize,
/// Breakdown by model
// NOTE(review): keys are presumably the same model identifier stored in
// `ModelStats::model` — verify against the code that populates the map.
pub by_model: std::collections::HashMap<String, ModelStats>,
}
/// Statistics for a specific model.
///
/// Used as the value type of `CostSummary::by_model`.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct ModelStats {
/// Model name
pub model: String,
/// Total cost for this model, in USD
pub cost_usd: f64,
/// Total tokens for this model
pub total_tokens: u64,
/// Number of requests for this model
pub request_count: usize,
}
impl Default for CostSummary {
    /// Returns an empty summary: every cost is `0.0`, both counters are `0`,
    /// and the per-model breakdown has no entries.
    fn default() -> Self {
        let no_models = std::collections::HashMap::new();
        Self {
            by_model: no_models,
            request_count: 0,
            total_tokens: 0,
            monthly_cost_usd: 0.0,
            daily_cost_usd: 0.0,
            session_cost_usd: 0.0,
        }
    }
}
#[cfg(test)]
mod tests {
    use super::*;

    /// Cost is each token count scaled by its per-million price, summed.
    #[test]
    fn token_usage_calculation() {
        let usage = TokenUsage::new("test/model", 1000, 500, 3.0, 15.0);
        // Expected: (1000/1M)*3 + (500/1M)*15 = 0.003 + 0.0075 = 0.0105
        assert!((usage.cost_usd - 0.0105).abs() < 0.0001);
        assert_eq!(usage.input_tokens, 1000);
        assert_eq!(usage.output_tokens, 500);
        assert_eq!(usage.total_tokens, 1500);
    }

    /// No tokens means no cost, whatever the prices are.
    #[test]
    fn token_usage_zero_tokens() {
        let usage = TokenUsage::new("test/model", 0, 0, 3.0, 15.0);
        assert!(usage.cost_usd.abs() < f64::EPSILON);
        assert_eq!(usage.total_tokens, 0);
    }

    /// Negative and NaN prices are treated as zero.
    #[test]
    fn token_usage_negative_or_non_finite_prices_are_clamped() {
        let usage = TokenUsage::new("test/model", 1000, 1000, -3.0, f64::NAN);
        assert!(usage.cost_usd.abs() < f64::EPSILON);
        assert_eq!(usage.total_tokens, 2000);
    }

    /// Both infinities are non-finite too and must not leak into the cost.
    #[test]
    fn token_usage_infinite_prices_are_clamped() {
        let usage = TokenUsage::new(
            "test/model",
            1000,
            1000,
            f64::INFINITY,
            f64::NEG_INFINITY,
        );
        assert!(usage.cost_usd.is_finite());
        assert!(usage.cost_usd.abs() < f64::EPSILON);
        assert_eq!(usage.total_tokens, 2000);
    }

    /// The token total saturates at `u64::MAX` instead of wrapping or panicking.
    #[test]
    fn token_usage_total_tokens_saturates() {
        let usage = TokenUsage::new("test/model", u64::MAX, 1, 0.0, 0.0);
        assert_eq!(usage.total_tokens, u64::MAX);
        assert!(usage.cost_usd.abs() < f64::EPSILON);
    }

    /// A record keeps its session id and usage and gets a non-empty id.
    #[test]
    fn cost_record_creation() {
        let usage = TokenUsage::new("test/model", 100, 50, 1.0, 2.0);
        let record = CostRecord::new("session-123", usage);
        assert_eq!(record.session_id, "session-123");
        assert!(!record.id.is_empty());
        assert_eq!(record.usage.model, "test/model");
    }
}