Modify the calculation rules and the database

2025-08-10 02:46:52 +08:00
parent dcd6b42a66
commit d8995bfe36
6 changed files with 733 additions and 102 deletions

@@ -0,0 +1,571 @@
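//! SQLite-backed cache for usage statistics: incrementally scans the JSONL
//! logs under ~/.claude/projects, deduplicates entries, and answers
//! aggregate queries (totals, per-model, per-day, per-project) from the cache.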
use chrono::{Local, Utc};
use rusqlite::{params, Connection};
use serde::{Deserialize, Serialize};
use std::collections::{HashMap, HashSet};
use std::fs;
use std::path::{Path, PathBuf};
use std::sync::{Arc, Mutex};
use tauri::{command, State};
use walkdir::WalkDir;
use super::usage::{
UsageStats, ModelUsage, DailyUsage, ProjectUsage, UsageEntry,
parse_jsonl_file
};
#[derive(Default)]
pub struct UsageCacheState {
pub conn: Arc<Mutex<Option<Connection>>>,
pub last_scan_time: Arc<Mutex<Option<i64>>>,
}
#[derive(Debug, Serialize, Deserialize)]
pub struct ScanResult {
pub files_scanned: u32,
pub entries_added: u32,
pub entries_skipped: u32,
pub scan_time_ms: u64,
}
fn db_path() -> PathBuf {
dirs::home_dir()
.unwrap_or_else(|| PathBuf::from("."))
.join(".claudia/cache/usage_stats.sqlite")
}
fn ensure_parent_dir(p: &Path) -> std::io::Result<()> {
if let Some(dir) = p.parent() {
std::fs::create_dir_all(dir)?;
}
Ok(())
}
pub fn init_cache_db() -> rusqlite::Result<Connection> {
let path = db_path();
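// rusqlite has no dedicated IO error variant, so the error is wrapped in an
// existing boxed-error variant to keep a uniform rusqlite::Result return type.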
ensure_parent_dir(&path).map_err(|e| rusqlite::Error::ToSqlConversionFailure(Box::new(e)))?;
let conn = Connection::open(path)?;
conn.pragma_update(None, "journal_mode", &"WAL")?;
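// WAL lets readers keep querying the cache while a scan transaction writes.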
// Create schema
conn.execute_batch(
r#"
CREATE TABLE IF NOT EXISTS schema_version (version INTEGER PRIMARY KEY);
INSERT OR IGNORE INTO schema_version(version) VALUES (1);
-- File scan records
CREATE TABLE IF NOT EXISTS scanned_files (
id INTEGER PRIMARY KEY AUTOINCREMENT,
file_path TEXT NOT NULL UNIQUE,
file_size INTEGER NOT NULL,
mtime_ms INTEGER NOT NULL,
last_scanned_ms INTEGER NOT NULL,
entry_count INTEGER DEFAULT 0
);
CREATE INDEX IF NOT EXISTS idx_files_path ON scanned_files(file_path);
-- API usage records
CREATE TABLE IF NOT EXISTS usage_entries (
id INTEGER PRIMARY KEY AUTOINCREMENT,
timestamp TEXT NOT NULL,
model TEXT NOT NULL,
input_tokens INTEGER DEFAULT 0,
output_tokens INTEGER DEFAULT 0,
cache_creation_tokens INTEGER DEFAULT 0,
cache_read_tokens INTEGER DEFAULT 0,
cost REAL NOT NULL,
session_id TEXT NOT NULL,
project_path TEXT NOT NULL,
file_path TEXT NOT NULL,
unique_hash TEXT NOT NULL UNIQUE
);
CREATE INDEX IF NOT EXISTS idx_entries_timestamp ON usage_entries(timestamp);
CREATE INDEX IF NOT EXISTS idx_entries_project ON usage_entries(project_path);
CREATE INDEX IF NOT EXISTS idx_entries_hash ON usage_entries(unique_hash);
CREATE INDEX IF NOT EXISTS idx_entries_model ON usage_entries(model);
"#,
)?;
Ok(conn)
}
fn get_file_mtime_ms(path: &Path) -> i64 {
fs::metadata(path)
.and_then(|m| m.modified())
.ok()
.and_then(|t| t.duration_since(std::time::UNIX_EPOCH).ok())
.map(|d| d.as_millis() as i64)
.unwrap_or(0)
}
fn get_file_size(path: &Path) -> i64 {
fs::metadata(path)
.map(|m| m.len() as i64)
.unwrap_or(0)
}
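/// Builds a stable deduplication key per entry; the shape of the key depends
/// on which token counters are populated, so I/O records and cache-only
/// records never collide with each other.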
fn generate_unique_hash(entry: &UsageEntry, has_io_tokens: bool, has_cache_tokens: bool) -> String {
if has_io_tokens {
// For I/O tokens: use session_id + timestamp + model
format!("io:{}:{}:{}", entry.session_id, entry.timestamp, entry.model)
} else if has_cache_tokens {
// For cache tokens: use timestamp + model + project
format!("cache:{}:{}:{}", entry.timestamp, entry.model, entry.project_path)
} else {
// Fallback
format!("other:{}:{}", entry.timestamp, entry.session_id)
}
}
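/// Incremental scan: compare each .jsonl file's size and mtime against the
/// cached values, reparse only files that are new or changed, and prune
/// entries whose source files have been deleted.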
#[command]
pub async fn usage_scan_update(state: State<'_, UsageCacheState>) -> Result<ScanResult, String> {
let start_time = Utc::now().timestamp_millis();
// Initialize or get connection
let mut conn_guard = state.conn.lock().map_err(|e| e.to_string())?;
if conn_guard.is_none() {
*conn_guard = Some(init_cache_db().map_err(|e| e.to_string())?);
}
let conn = conn_guard.as_mut().unwrap();
let claude_path = dirs::home_dir()
.ok_or("Failed to get home directory")?
.join(".claude");
let projects_dir = claude_path.join("projects");
// Get existing scanned files from DB
let mut existing_files: HashMap<String, (i64, i64)> = HashMap::new();
{
let mut stmt = conn
.prepare("SELECT file_path, file_size, mtime_ms FROM scanned_files")
.map_err(|e| e.to_string())?;
let rows = stmt.query_map(params![], |row| {
Ok((
row.get::<_, String>(0)?,
(row.get::<_, i64>(1)?, row.get::<_, i64>(2)?),
))
}).map_err(|e| e.to_string())?;
for row in rows {
if let Ok((path, data)) = row {
existing_files.insert(path, data);
}
}
}
// Find all .jsonl files
let mut files_to_process = Vec::new();
let mut all_current_files = HashSet::new();
if let Ok(projects) = fs::read_dir(&projects_dir) {
for project in projects.flatten() {
if project.file_type().map(|t| t.is_dir()).unwrap_or(false) {
let project_name = project.file_name().to_string_lossy().to_string();
let project_path = project.path();
WalkDir::new(&project_path)
.into_iter()
.filter_map(Result::ok)
.filter(|e| e.path().extension().and_then(|s| s.to_str()) == Some("jsonl"))
.for_each(|entry| {
let path = entry.path().to_path_buf();
let path_str = path.to_string_lossy().to_string();
all_current_files.insert(path_str.clone());
// Check if file needs processing
let current_size = get_file_size(&path);
let current_mtime = get_file_mtime_ms(&path);
let needs_processing = if let Some((stored_size, stored_mtime)) = existing_files.get(&path_str) {
current_size != *stored_size || current_mtime != *stored_mtime
} else {
true // New file
};
if needs_processing {
files_to_process.push((path, project_name.clone()));
}
});
}
}
}
let mut files_scanned = 0u32;
let mut entries_added = 0u32;
let mut entries_skipped = 0u32;
// Process files that need updating
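// A single transaction for the whole batch keeps the scan atomic and fast.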
let tx = conn.transaction().map_err(|e| e.to_string())?;
for (file_path, project_name) in files_to_process {
let path_str = file_path.to_string_lossy().to_string();
let file_size = get_file_size(&file_path);
let mtime_ms = get_file_mtime_ms(&file_path);
// Parse the JSONL file and get entries
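// processed_hashes only dedupes within this one file; cross-file and
// cross-scan dedup is enforced by the UNIQUE(unique_hash) constraint.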
let mut processed_hashes = HashSet::new();
let entries = parse_jsonl_file(&file_path, &project_name, &mut processed_hashes);
// Insert or update file record
tx.execute(
"INSERT INTO scanned_files (file_path, file_size, mtime_ms, last_scanned_ms, entry_count)
VALUES (?1, ?2, ?3, ?4, ?5)
ON CONFLICT(file_path) DO UPDATE SET
file_size = excluded.file_size,
mtime_ms = excluded.mtime_ms,
last_scanned_ms = excluded.last_scanned_ms,
entry_count = excluded.entry_count",
params![path_str, file_size, mtime_ms, start_time, entries.len() as i64],
).map_err(|e| e.to_string())?;
// Insert usage entries
for entry in entries {
let has_io_tokens = entry.input_tokens > 0 || entry.output_tokens > 0;
let has_cache_tokens = entry.cache_creation_tokens > 0 || entry.cache_read_tokens > 0;
let unique_hash = generate_unique_hash(&entry, has_io_tokens, has_cache_tokens);
let result = tx.execute(
"INSERT INTO usage_entries (
timestamp, model, input_tokens, output_tokens,
cache_creation_tokens, cache_read_tokens, cost,
session_id, project_path, file_path, unique_hash
) VALUES (?1, ?2, ?3, ?4, ?5, ?6, ?7, ?8, ?9, ?10, ?11)
ON CONFLICT(unique_hash) DO NOTHING",
params![
entry.timestamp,
entry.model,
entry.input_tokens as i64,
entry.output_tokens as i64,
entry.cache_creation_tokens as i64,
entry.cache_read_tokens as i64,
entry.cost,
entry.session_id,
entry.project_path,
path_str,
unique_hash,
],
);
match result {
Ok(n) if n > 0 => entries_added += 1,
_ => entries_skipped += 1,
}
}
files_scanned += 1;
}
// Remove entries for files that no longer exist
for (old_path, _) in existing_files {
if !all_current_files.contains(&old_path) {
tx.execute("DELETE FROM usage_entries WHERE file_path = ?1", params![old_path])
.map_err(|e| e.to_string())?;
tx.execute("DELETE FROM scanned_files WHERE file_path = ?1", params![old_path])
.map_err(|e| e.to_string())?;
}
}
tx.commit().map_err(|e| e.to_string())?;
// Update last scan time
let mut last_scan = state.last_scan_time.lock().map_err(|e| e.to_string())?;
*last_scan = Some(start_time);
let scan_time_ms = (Utc::now().timestamp_millis() - start_time) as u64;
Ok(ScanResult {
files_scanned,
entries_added,
entries_skipped,
scan_time_ms,
})
}
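/// Returns aggregated stats from the cache, refreshing it first via an
/// incremental scan. `days` limits results to the trailing N days.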
#[command]
pub async fn usage_get_stats_cached(
days: Option<u32>,
state: State<'_, UsageCacheState>,
) -> Result<UsageStats, String> {
// First ensure cache is up to date
usage_scan_update(state.clone()).await?;
let conn_guard = state.conn.lock().map_err(|e| e.to_string())?;
let conn = conn_guard.as_ref().ok_or("Database not initialized")?;
// Build date filter
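// ISO-8601 timestamps sort lexicographically, so a plain string comparison
// against a "YYYY-MM-DD" cutoff works as a date filter in SQL.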
let date_filter = if let Some(d) = days {
let cutoff = Local::now().naive_local().date() - chrono::Duration::days(d as i64);
Some(cutoff.format("%Y-%m-%d").to_string())
} else {
None
};
// Query total stats
let (total_cost, total_input, total_output, total_cache_creation, total_cache_read): (f64, i64, i64, i64, i64) =
if let Some(cutoff) = &date_filter {
conn.query_row(
"SELECT
COALESCE(SUM(cost), 0.0),
COALESCE(SUM(input_tokens), 0),
COALESCE(SUM(output_tokens), 0),
COALESCE(SUM(cache_creation_tokens), 0),
COALESCE(SUM(cache_read_tokens), 0)
FROM usage_entries
WHERE timestamp >= ?1",
params![cutoff],
|row| Ok((row.get(0)?, row.get(1)?, row.get(2)?, row.get(3)?, row.get(4)?)),
).map_err(|e| e.to_string())?
} else {
conn.query_row(
"SELECT
COALESCE(SUM(cost), 0.0),
COALESCE(SUM(input_tokens), 0),
COALESCE(SUM(output_tokens), 0),
COALESCE(SUM(cache_creation_tokens), 0),
COALESCE(SUM(cache_read_tokens), 0)
FROM usage_entries",
params![],
|row| Ok((row.get(0)?, row.get(1)?, row.get(2)?, row.get(3)?, row.get(4)?)),
).map_err(|e| e.to_string())?
};
let total_tokens = total_input + total_output + total_cache_creation + total_cache_read;
// Get session count
let total_sessions: i64 = if let Some(cutoff) = &date_filter {
conn.query_row(
"SELECT COUNT(DISTINCT session_id) FROM usage_entries WHERE timestamp >= ?1",
params![cutoff],
|row| row.get(0),
).map_err(|e| e.to_string())?
} else {
conn.query_row(
"SELECT COUNT(DISTINCT session_id) FROM usage_entries",
params![],
|row| row.get(0),
).map_err(|e| e.to_string())?
};
// Get stats by model
let mut by_model = Vec::new();
{
let query = if date_filter.is_some() {
"SELECT
model,
SUM(cost) as total_cost,
SUM(input_tokens) as input,
SUM(output_tokens) as output,
SUM(cache_creation_tokens) as cache_creation,
SUM(cache_read_tokens) as cache_read,
COUNT(DISTINCT session_id) as sessions
FROM usage_entries
WHERE timestamp >= ?1
GROUP BY model
ORDER BY total_cost DESC"
} else {
"SELECT
model,
SUM(cost) as total_cost,
SUM(input_tokens) as input,
SUM(output_tokens) as output,
SUM(cache_creation_tokens) as cache_creation,
SUM(cache_read_tokens) as cache_read,
COUNT(DISTINCT session_id) as sessions
FROM usage_entries
GROUP BY model
ORDER BY total_cost DESC"
};
let mut stmt = conn.prepare(query).map_err(|e| e.to_string())?;
// Create closure once to avoid type mismatch
let create_model_usage = |row: &rusqlite::Row| -> rusqlite::Result<ModelUsage> {
Ok(ModelUsage {
model: row.get(0)?,
total_cost: row.get(1)?,
input_tokens: row.get::<_, i64>(2)? as u64,
output_tokens: row.get::<_, i64>(3)? as u64,
cache_creation_tokens: row.get::<_, i64>(4)? as u64,
cache_read_tokens: row.get::<_, i64>(5)? as u64,
session_count: row.get::<_, i64>(6)? as u64,
total_tokens: 0, // Will calculate below
})
};
let rows = if let Some(cutoff) = &date_filter {
stmt.query_map(params![cutoff], create_model_usage).map_err(|e| e.to_string())?
} else {
stmt.query_map(params![], create_model_usage).map_err(|e| e.to_string())?
};
for row in rows {
if let Ok(mut usage) = row {
usage.total_tokens = usage.input_tokens + usage.output_tokens +
usage.cache_creation_tokens + usage.cache_read_tokens;
by_model.push(usage);
}
}
}
// Get daily stats
let mut by_date = Vec::new();
{
let query = if date_filter.is_some() {
"SELECT
DATE(timestamp) as date,
SUM(cost) as total_cost,
SUM(input_tokens) as input,
SUM(output_tokens) as output,
SUM(cache_creation_tokens) as cache_creation,
SUM(cache_read_tokens) as cache_read,
COUNT(DISTINCT session_id) as sessions,
COUNT(*) as requests,
GROUP_CONCAT(DISTINCT model) as models
FROM usage_entries
WHERE timestamp >= ?1
GROUP BY DATE(timestamp)
ORDER BY date DESC"
} else {
"SELECT
DATE(timestamp) as date,
SUM(cost) as total_cost,
SUM(input_tokens) as input,
SUM(output_tokens) as output,
SUM(cache_creation_tokens) as cache_creation,
SUM(cache_read_tokens) as cache_read,
COUNT(DISTINCT session_id) as sessions,
COUNT(*) as requests,
GROUP_CONCAT(DISTINCT model) as models
FROM usage_entries
GROUP BY DATE(timestamp)
ORDER BY date DESC"
};
let mut stmt = conn.prepare(query).map_err(|e| e.to_string())?;
// Create closure once to avoid type mismatch
let create_daily_usage = |row: &rusqlite::Row| -> rusqlite::Result<DailyUsage> {
let models_str: String = row.get(8)?;
let models_used: Vec<String> = models_str.split(',').map(|s| s.to_string()).collect();
Ok(DailyUsage {
date: row.get(0)?,
total_cost: row.get(1)?,
total_tokens: (row.get::<_, i64>(2)? + row.get::<_, i64>(3)? +
row.get::<_, i64>(4)? + row.get::<_, i64>(5)?) as u64,
input_tokens: row.get::<_, i64>(2)? as u64,
output_tokens: row.get::<_, i64>(3)? as u64,
cache_creation_tokens: row.get::<_, i64>(4)? as u64,
cache_read_tokens: row.get::<_, i64>(5)? as u64,
request_count: row.get::<_, i64>(7)? as u64,
models_used,
})
};
let rows = if let Some(cutoff) = &date_filter {
stmt.query_map(params![cutoff], create_daily_usage).map_err(|e| e.to_string())?
} else {
stmt.query_map(params![], create_daily_usage).map_err(|e| e.to_string())?
};
for row in rows {
if let Ok(daily) = row {
by_date.push(daily);
}
}
}
// Get project stats
let mut by_project = Vec::new();
{
let query = if date_filter.is_some() {
"SELECT
project_path,
SUM(cost) as total_cost,
SUM(input_tokens + output_tokens + cache_creation_tokens + cache_read_tokens) as total_tokens,
COUNT(DISTINCT session_id) as sessions,
MAX(timestamp) as last_used
FROM usage_entries
WHERE timestamp >= ?1
GROUP BY project_path
ORDER BY total_cost DESC"
} else {
"SELECT
project_path,
SUM(cost) as total_cost,
SUM(input_tokens + output_tokens + cache_creation_tokens + cache_read_tokens) as total_tokens,
COUNT(DISTINCT session_id) as sessions,
MAX(timestamp) as last_used
FROM usage_entries
GROUP BY project_path
ORDER BY total_cost DESC"
};
let mut stmt = conn.prepare(query).map_err(|e| e.to_string())?;
// Create closure once to avoid type mismatch
let create_project_usage = |row: &rusqlite::Row| -> rusqlite::Result<ProjectUsage> {
Ok(ProjectUsage {
project_path: row.get(0)?,
project_name: String::new(), // Will be extracted from path
total_cost: row.get(1)?,
total_tokens: row.get::<_, i64>(2)? as u64,
session_count: row.get::<_, i64>(3)? as u64,
last_used: row.get(4)?,
})
};
let rows = if let Some(cutoff) = &date_filter {
stmt.query_map(params![cutoff], create_project_usage).map_err(|e| e.to_string())?
} else {
stmt.query_map(params![], create_project_usage).map_err(|e| e.to_string())?
};
for row in rows {
if let Ok(mut project) = row {
// Extract project name from path
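// Assumes '/' separators; if none are present, the full path is kept as-is.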
project.project_name = project.project_path
.split('/')
.last()
.unwrap_or(&project.project_path)
.to_string();
by_project.push(project);
}
}
}
Ok(UsageStats {
total_cost,
total_tokens: total_tokens as u64,
total_input_tokens: total_input as u64,
total_output_tokens: total_output as u64,
total_cache_creation_tokens: total_cache_creation as u64,
total_cache_read_tokens: total_cache_read as u64,
total_sessions: total_sessions as u64,
by_model,
by_date,
by_project,
})
}
#[command]
pub async fn usage_clear_cache(state: State<'_, UsageCacheState>) -> Result<String, String> {
let mut conn_guard = state.conn.lock().map_err(|e| e.to_string())?;
if let Some(conn) = conn_guard.as_mut() {
conn.execute("DELETE FROM usage_entries", params![])
.map_err(|e| e.to_string())?;
conn.execute("DELETE FROM scanned_files", params![])
.map_err(|e| e.to_string())?;
// Reset the last scan time
let mut last_scan = state.last_scan_time.lock().map_err(|e| e.to_string())?;
*last_scan = None;
return Ok("Cache cleared successfully. All costs will be recalculated.".to_string());
}
Ok("No cache to clear.".to_string())
}
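
For reference, a minimal sketch of how these commands could be registered in the app's entry point. The module name `usage_cache` and the builder wiring are assumptions, not part of this commit; only the command names and `UsageCacheState` come from the file above.

// Hypothetical wiring sketch; module path `usage_cache` is assumed.
fn main() {
    tauri::Builder::default()
        // Shared state; the SQLite connection is opened lazily on first scan.
        .manage(usage_cache::UsageCacheState::default())
        .invoke_handler(tauri::generate_handler![
            usage_cache::usage_scan_update,
            usage_cache::usage_get_stats_cached,
            usage_cache::usage_clear_cache
        ])
        .run(tauri::generate_context!())
        .expect("error while running tauri application");
}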