// 移除冗余的顶层导入，因为这些在代码中已由 full path 或局部导入处理 use dashmap::DashMap; use std::collections::{HashSet, HashMap}; use std::path::PathBuf; use std::sync::atomic::{AtomicUsize, Ordering}; use std::sync::Arc; use tokio_util::sync::CancellationToken; use crate::proxy::rate_limit::RateLimitTracker; use crate::proxy::sticky_config::StickySessionConfig; #[derive(Debug, Clone, Copy, PartialEq, Eq)] enum OnDiskAccountState { Enabled, Disabled, Unknown, } #[derive(Debug, Clone)] pub struct ProxyToken { pub account_id: String, pub access_token: String, pub refresh_token: String, pub expires_in: i64, pub timestamp: i64, pub email: String, pub account_path: PathBuf, // 账号文件路径，用于更新 pub project_id: Option, pub subscription_tier: Option, // "FREE" | "PRO" | "ULTRA" pub remaining_quota: Option, // [FIX #563] Remaining quota for priority sorting pub protected_models: HashSet, // [NEW #621] pub health_score: f32, // [NEW] 健康分数 (0.0 - 1.0) pub reset_time: Option, // [NEW] 配额刷新时间戳（用于排序优化） pub validation_blocked: bool, // [NEW] Check for validation block (VALIDATION_REQUIRED temporary block) pub validation_blocked_until: i64, // [NEW] Timestamp until which the account is blocked pub validation_url: Option, // [NEW] Validation URL (#1522) pub model_quotas: HashMap, // [OPTIMIZATION] In-memory cache for model-specific quotas pub model_limits: HashMap, // [NEW] max_output_tokens per model from quota data } pub struct TokenManager { tokens: Arc>, // account_id -> ProxyToken current_index: Arc, last_used_account: Arc>>, data_dir: PathBuf, rate_limit_tracker: Arc, // 新增: 限流跟踪器 sticky_config: Arc>, // 新增：调度配置 session_accounts: Arc>, // 新增：会话与账号映射 (SessionID -> AccountID) preferred_account_id: Arc>>, // [FIX #820] 优先使用的账号ID（固定账号模式） health_scores: Arc>, // account_id -> health_score circuit_breaker_config: Arc>, // [NEW] 熔断配置缓存 // [NEW] 按账号分配的同步刷新锁。 // 用于实现 Double-Checked Locking，防止并发请求导致单个账号短时间内多次调用 OAuth Refresh。 refresh_locks: Arc>>>, // [NEW] loadCodeAssist (fetch_project_id) 的异步 SingleFlight 合并表 // Key 为 account_id，Value 为结果观察者，确保并发请求共享同一个上游探测结果 load_code_assist_inflight: Arc>>>>, /// 支持优雅关闭时主动 abort 后台任务 auto_cleanup_handle: Arc>>>, cancel_token: CancellationToken, } impl TokenManager { /// 创建新的 TokenManager pub fn new(data_dir: PathBuf) -> Self { Self { tokens: Arc::new(DashMap::new()), current_index: Arc::new(AtomicUsize::new(0)), last_used_account: Arc::new(tokio::sync::Mutex::new(None)), data_dir, rate_limit_tracker: Arc::new(RateLimitTracker::new()), sticky_config: Arc::new(tokio::sync::RwLock::new(StickySessionConfig::default())), session_accounts: Arc::new(DashMap::new()), preferred_account_id: Arc::new(tokio::sync::RwLock::new(None)), // [FIX #820] health_scores: Arc::new(DashMap::new()), circuit_breaker_config: Arc::new(tokio::sync::RwLock::new( crate::models::CircuitBreakerConfig::default(), )), refresh_locks: Arc::new(DashMap::new()), load_code_assist_inflight: Arc::new(DashMap::new()), // 初始化 inflight 表 auto_cleanup_handle: Arc::new(tokio::sync::Mutex::new(None)), cancel_token: CancellationToken::new(), } } /// 启动限流记录自动清理后台任务（每15秒检查并清除过期记录） pub async fn start_auto_cleanup(&self) { let tracker = self.rate_limit_tracker.clone(); let cancel = self.cancel_token.child_token(); let handle = tokio::spawn(async move { let mut interval = tokio::time::interval(std::time::Duration::from_secs(15)); loop { tokio::select! { _ = cancel.cancelled() => { tracing::info!("Auto-cleanup task received cancel signal"); break; } _ = interval.tick() => { let cleaned = tracker.cleanup_expired(); if cleaned > 0 { tracing::info!( "Auto-cleanup: Removed {} expired rate limit record(s)", cleaned ); } } } } }); // 先 abort 旧任务（防止任务泄漏），再存储新 handle let mut guard = self.auto_cleanup_handle.lock().await; if let Some(old) = guard.take() { old.abort(); tracing::warn!("Aborted previous auto-cleanup task"); } *guard = Some(handle); tracing::info!("Rate limit auto-cleanup task started (interval: 15s)"); } /// 从主应用账号目录加载所有账号 pub async fn load_accounts(&self) -> Result { let accounts_dir = self.data_dir.join("accounts"); if !accounts_dir.exists() { return Err(format!("账号目录不存在: {:?}", accounts_dir)); } // Reload should reflect current on-disk state (accounts can be added/removed/disabled). self.tokens.clear(); self.current_index.store(0, Ordering::SeqCst); { let mut last_used = self.last_used_account.lock().await; *last_used = None; } let entries = std::fs::read_dir(&accounts_dir) .map_err(|e| format!("读取账号目录失败: {}", e))?; let mut count = 0; for entry in entries { let entry = entry.map_err(|e| format!("读取目录项失败: {}", e))?; let path = entry.path(); if path.extension().and_then(|s| s.to_str()) != Some("json") { continue; } // 尝试加载账号 match self.load_single_account(&path).await { Ok(Some(token)) => { let account_id = token.account_id.clone(); self.tokens.insert(account_id, token); count += 1; } Ok(None) => { // 跳过无效账号 } Err(e) => { tracing::debug!("加载账号失败 {:?}: {}", path, e); } } } Ok(count) } /// 重新加载指定账号（用于配额更新后的实时同步） pub async fn reload_account(&self, account_id: &str) -> Result<(), String> { let path = self .data_dir .join("accounts") .join(format!("{}.json", account_id)); if !path.exists() { return Err(format!("账号文件不存在: {:?}", path)); } match self.load_single_account(&path).await { Ok(Some(token)) => { self.tokens.insert(account_id.to_string(), token); // [NEW] 重新加载账号时自动清除该账号的限流记录 self.clear_rate_limit(account_id); Ok(()) } Ok(None) => { // [FIX] 账号被禁用或不可用时，从内存池中彻底移除 (Issue #1565) // load_single_account returning None means the account should be skipped in its // current state (disabled / proxy_disabled / quota_protection / validation_blocked...). self.remove_account(account_id); Ok(()) } Err(e) => Err(format!("同步账号失败: {}", e)), } } /// 重新加载所有账号 pub async fn reload_all_accounts(&self) -> Result { let count = self.load_accounts().await?; // [NEW] 重新加载所有账号时自动清除所有限流记录 self.clear_all_rate_limits(); Ok(count) } /// 从内存中彻底移除指定账号及其关联数据 (Issue #1477) pub fn remove_account(&self, account_id: &str) { // ... (省略原有逻辑) if self.tokens.remove(account_id).is_some() { tracing::info!("[Proxy] Removed account {} from memory cache", account_id); } self.health_scores.remove(account_id); self.clear_rate_limit(account_id); self.session_accounts.retain(|_, v| v != account_id); if let Ok(mut preferred) = self.preferred_account_id.try_write() { if preferred.as_deref() == Some(account_id) { *preferred = None; tracing::info!("[Proxy] Cleared preferred account status for {}", account_id); } } } /// 根据账号 ID 获取完整的 ProxyToken 对象 (v4.1.29) pub fn get_token_by_id(&self, account_id: &str) -> Option { self.tokens.get(account_id).map(|t| t.clone()) } /// Check if an account has been disabled on disk. /// /// Safety net: avoids selecting a disabled account when the in-memory pool hasn't been /// reloaded yet (e.g. fixed account mode / sticky session). /// /// Note: this is intentionally tolerant to transient read/parse failures (e.g. concurrent /// writes). Failures are reported as `Unknown` so callers can skip without purging the in-memory /// token pool. async fn get_account_state_on_disk(account_path: &std::path::PathBuf) -> OnDiskAccountState { const MAX_RETRIES: usize = 2; const RETRY_DELAY_MS: u64 = 5; for attempt in 0..=MAX_RETRIES { let content = match tokio::fs::read_to_string(account_path).await { Ok(c) => c, Err(e) => { // If the file is gone, the in-memory token is definitely stale. if e.kind() == std::io::ErrorKind::NotFound { return OnDiskAccountState::Disabled; } if attempt < MAX_RETRIES { tokio::time::sleep(std::time::Duration::from_millis(RETRY_DELAY_MS)).await; continue; } tracing::debug!( "Failed to read account file on disk {:?}: {}", account_path, e ); return OnDiskAccountState::Unknown; } }; let account = match serde_json::from_str::(&content) { Ok(v) => v, Err(e) => { if attempt < MAX_RETRIES { tokio::time::sleep(std::time::Duration::from_millis(RETRY_DELAY_MS)).await; continue; } tracing::debug!( "Failed to parse account JSON on disk {:?}: {}", account_path, e ); return OnDiskAccountState::Unknown; } }; let disabled = account .get("disabled") .and_then(|v| v.as_bool()) .unwrap_or(false) || account .get("proxy_disabled") .and_then(|v| v.as_bool()) .unwrap_or(false) || account .get("quota") .and_then(|q| q.get("is_forbidden")) .and_then(|v| v.as_bool()) .unwrap_or(false); return if disabled { OnDiskAccountState::Disabled } else { OnDiskAccountState::Enabled }; } OnDiskAccountState::Unknown } /// 加载单个账号 async fn load_single_account(&self, path: &PathBuf) -> Result, String> { let content = std::fs::read_to_string(path).map_err(|e| format!("读取文件失败: {}", e))?; let mut account: serde_json::Value = serde_json::from_str(&content).map_err(|e| format!("解析 JSON 失败: {}", e))?; // [修复 #1344] 先检查账号是否被手动禁用(非配额保护原因) let is_proxy_disabled = account .get("proxy_disabled") .and_then(|v| v.as_bool()) .unwrap_or(false); let disabled_reason = account .get("proxy_disabled_reason") .and_then(|v| v.as_str()) .unwrap_or(""); if is_proxy_disabled && disabled_reason != "quota_protection" { // Account manually disabled tracing::debug!( "Account skipped due to manual disable: {:?} (email={}, reason={})", path, account .get("email") .and_then(|v| v.as_str()) .unwrap_or(""), disabled_reason ); return Ok(None); } // [NEW] Check for validation block (VALIDATION_REQUIRED temporary block) if account .get("validation_blocked") .and_then(|v| v.as_bool()) .unwrap_or(false) { let block_until = account .get("validation_blocked_until") .and_then(|v| v.as_i64()) .unwrap_or(0); let now = chrono::Utc::now().timestamp(); if now < block_until { // Still blocked tracing::debug!( "Skipping validation-blocked account: {:?} (email={}, blocked until {})", path, account .get("email") .and_then(|v| v.as_str()) .unwrap_or(""), chrono::DateTime::from_timestamp(block_until, 0) .map(|dt| dt.format("%H:%M:%S").to_string()) .unwrap_or_else(|| block_until.to_string()) ); return Ok(None); } else { // Block expired - clear it account["validation_blocked"] = serde_json::json!(false); account["validation_blocked_until"] = serde_json::json!(0); account["validation_blocked_reason"] = serde_json::Value::Null; let updated_json = serde_json::to_string_pretty(&account).map_err(|e| e.to_string())?; std::fs::write(path, updated_json).map_err(|e| e.to_string())?; tracing::info!( "Validation block expired and cleared for account: {}", account .get("email") .and_then(|v| v.as_str()) .unwrap_or("") ); } } // 最终检查账号主开关 if account .get("disabled") .and_then(|v| v.as_bool()) .unwrap_or(false) { tracing::debug!( "Skipping disabled account file: {:?} (email={})", path, account .get("email") .and_then(|v| v.as_str()) .unwrap_or("") ); return Ok(None); } // Safety check: verify state on disk again to handle concurrent mid-parse writes if Self::get_account_state_on_disk(path).await == OnDiskAccountState::Disabled { tracing::debug!("Account file {:?} is disabled on disk, skipping.", path); return Ok(None); } // 配额保护检查 - 只处理配额保护逻辑 // 这样可以在加载时自动恢复配额已恢复的账号 if self.check_and_protect_quota(&mut account, path).await { tracing::debug!( "Account skipped due to quota protection: {:?} (email={})", path, account .get("email") .and_then(|v| v.as_str()) .unwrap_or("") ); return Ok(None); } // [兼容性] 再次确认最终状态（可能被 check_and_protect_quota 修改） if account .get("proxy_disabled") .and_then(|v| v.as_bool()) .unwrap_or(false) { tracing::debug!( "Skipping proxy-disabled account file: {:?} (email={})", path, account .get("email") .and_then(|v| v.as_str()) .unwrap_or("") ); return Ok(None); } let account_id = account["id"].as_str() .ok_or("缺少 id 字段")? .to_string(); let email = account["email"].as_str() .ok_or("缺少 email 字段")? .to_string(); let token_obj = account["token"].as_object() .ok_or("缺少 token 字段")?; let access_token = token_obj["access_token"].as_str() .ok_or("缺少 access_token")? .to_string(); let refresh_token = token_obj["refresh_token"].as_str() .ok_or("缺少 refresh_token")? .to_string(); let expires_in = token_obj["expires_in"].as_i64() .ok_or("缺少 expires_in")?; let timestamp = token_obj["expiry_timestamp"].as_i64() .ok_or("缺少 expiry_timestamp")?; // project_id 是可选的 let project_id = token_obj .get("project_id") .and_then(|v| v.as_str()) .filter(|s| !s.is_empty()) .map(|s| s.to_string()); // 【新增】提取订阅等级 (subscription_tier 为 "FREE" | "PRO" | "ULTRA") let subscription_tier = account .get("quota") .and_then(|q| q.get("subscription_tier")) .and_then(|v| v.as_str()) .map(|s| s.to_string()); // [FIX #563] 提取最大剩余配额百分比用于优先级排序 (Option now) let remaining_quota = account .get("quota") .and_then(|q| self.calculate_quota_stats(q)); // .filter(|&r| r > 0); // 移除 >0 过滤，因为 0% 也是有效数据，只是优先级低 // 【新增 #621】提取受限模型列表 let protected_models: HashSet = account .get("protected_models") .and_then(|v| v.as_array()) .map(|arr| { arr.iter() .filter_map(|v| v.as_str()) .map(|s| s.to_string()) .collect() }) .unwrap_or_default(); let health_score = self.health_scores.get(&account_id).map(|v| *v).unwrap_or(1.0); // [NEW] 提取最近的配额刷新时间（用于排序优化：刷新时间越近优先级越高） let reset_time = self.extract_earliest_reset_time(&account); // [OPTIMIZATION] 构建模型配额内存缓存，避免排序时读取磁盘 let mut model_quotas = HashMap::new(); // [NEW] 构建模型输出限额内存缓存 (max_output_tokens) let mut model_limits: HashMap = HashMap::new(); if let Some(models) = account.get("quota").and_then(|q| q.get("models")).and_then(|m| m.as_array()) { for model in models { if let (Some(name), Some(pct)) = (model.get("name").and_then(|v| v.as_str()), model.get("percentage").and_then(|v| v.as_i64())) { // Normalize name to standard ID let standard_id = crate::proxy::common::model_mapping::normalize_to_standard_id(name) .unwrap_or_else(|| name.to_string()); model_quotas.insert(standard_id, pct as i32); } // [NEW] 解析并缓存 max_output_tokens (按原始 model name，不归一化) if let (Some(name), Some(limit)) = ( model.get("name").and_then(|v| v.as_str()), model.get("max_output_tokens").and_then(|v| v.as_u64()), ) { model_limits.insert(name.to_string(), limit); } } } // [NEW] 启动时自动同步持久化的淘汰模型路由表，注入热更新拦截器 if let Some(rules) = account.get("quota").and_then(|q| q.get("model_forwarding_rules")).and_then(|r| r.as_object()) { for (k, v) in rules { if let Some(new_model) = v.as_str() { crate::proxy::common::model_mapping::update_dynamic_forwarding_rules( k.to_string(), new_model.to_string() ); } } } Ok(Some(ProxyToken { account_id, access_token, refresh_token, expires_in, timestamp, email, account_path: path.clone(), project_id, subscription_tier, remaining_quota, protected_models, health_score, reset_time, validation_blocked: account.get("validation_blocked").and_then(|v| v.as_bool()).unwrap_or(false), validation_blocked_until: account.get("validation_blocked_until").and_then(|v| v.as_i64()).unwrap_or(0), validation_url: account.get("validation_url").and_then(|v| v.as_str()).map(|s| s.to_string()), model_quotas, model_limits, })) } /// 检查账号是否应该被配额保护 /// 如果配额低于阈值，自动禁用账号并返回 true async fn check_and_protect_quota( &self, account_json: &mut serde_json::Value, account_path: &PathBuf, ) -> bool { // 1. 加载配额保护配置 let config = match crate::modules::config::load_app_config() { Ok(cfg) => cfg.quota_protection, Err(_) => return false, // 配置加载失败，跳过保护 }; if !config.enabled { return false; // 配额保护未启用 } // 2. 获取配额信息 // 注意：我们需要 clone 配额信息来遍历，避免借用冲突，但修改是针对 account_json 的 let quota = match account_json.get("quota") { Some(q) => q.clone(), None => return false, // 无配额信息，跳过 }; // 3. [兼容性 #621] 检查是否被旧版账号级配额保护禁用,尝试恢复并转为模型级 let is_proxy_disabled = account_json .get("proxy_disabled") .and_then(|v| v.as_bool()) .unwrap_or(false); let reason = account_json.get("proxy_disabled_reason") .and_then(|v| v.as_str()) .unwrap_or(""); if is_proxy_disabled && reason == "quota_protection" { // 如果是被旧版账号级保护禁用的,尝试恢复并转为模型级 return self .check_and_restore_quota(account_json, account_path, "a, &config) .await; } // [修复 #1344] 不再处理其他禁用原因,让调用方负责检查手动禁用 // 4. 获取模型列表 let models = match quota.get("models").and_then(|m| m.as_array()) { Some(m) => m, None => return false, }; // 5. [重构] 聚合判定逻辑：按 Standard ID 对账号所有型号进行分组 // 解决如 Pro-Low (0%) 和 Pro-High (100%) 在同一账号内导致状态冲突的问题 let mut group_min_percentage: HashMap = HashMap::new(); for model in models { let name = model.get("name").and_then(|v| v.as_str()).unwrap_or(""); let percentage = model.get("percentage").and_then(|v| v.as_i64()).unwrap_or(100) as i32; if let Some(std_id) = crate::proxy::common::model_mapping::normalize_to_standard_id(name) { let entry = group_min_percentage.entry(std_id).or_insert(100); if percentage < *entry { *entry = percentage; } } } // 6. 遍历受监控的 Standard ID，根据组内“最差状态”执行锁定或恢复 let threshold = config.threshold_percentage as i32; let account_id = account_json .get("id") .and_then(|v| v.as_str()) .unwrap_or("unknown") .to_string(); let mut changed = false; for std_id in &config.monitored_models { // 获取该组的最低百分比，如果账号没该组型号则视为 100% let min_pct = group_min_percentage.get(std_id).cloned().unwrap_or(100); if min_pct <= threshold { // 只要组内有一个不行，触发全组保护 if self .trigger_quota_protection( account_json, &account_id, account_path, min_pct, threshold, std_id, ) .await .unwrap_or(false) { changed = true; } } else { // 只有全组都好（或者没这型号），才尝试从之前受限状态恢复 let protected_models = account_json .get("protected_models") .and_then(|v| v.as_array()); let is_protected = protected_models.map_or(false, |arr| { arr.iter().any(|m| m.as_str() == Some(std_id as &str)) }); if is_protected { if self .restore_quota_protection( account_json, &account_id, account_path, std_id, ) .await .unwrap_or(false) { changed = true; } } } } let _ = changed; // 避免 unused 警告，如果后续逻辑需要可以继续使用 // 我们不再因为配额原因返回 true（即不再跳过账号）， // 而是加载并在 get_token 时进行过滤。 false } /// 计算账号的最大剩余配额百分比（用于排序） /// 返回值: Option (max_percentage) fn calculate_quota_stats(&self, quota: &serde_json::Value) -> Option { let models = match quota.get("models").and_then(|m| m.as_array()) { Some(m) => m, None => return None, }; let mut max_percentage = 0; let mut has_data = false; for model in models { if let Some(pct) = model.get("percentage").and_then(|v| v.as_i64()) { let pct_i32 = pct as i32; if pct_i32 > max_percentage { max_percentage = pct_i32; } has_data = true; } } if has_data { Some(max_percentage) } else { None } } /// 从磁盘读取特定模型的 quota 百分比 [FIX] 排序使用目标模型的 quota 而非 max /// /// # 参数 /// * `account_path` - 账号 JSON 文件路径 /// * `model_name` - 目标模型名称（已标准化） #[allow(dead_code)] // 预留给精确配额读取逻辑 fn get_model_quota_from_json(account_path: &PathBuf, model_name: &str) -> Option { let content = std::fs::read_to_string(account_path).ok()?; let account: serde_json::Value = serde_json::from_str(&content).ok()?; let models = account.get("quota")?.get("models")?.as_array()?; for model in models { if let Some(name) = model.get("name").and_then(|v| v.as_str()) { if crate::proxy::common::model_mapping::normalize_to_standard_id(name) .unwrap_or_else(|| name.to_string()) == model_name { return model .get("percentage") .and_then(|v| v.as_i64()) .map(|p| p as i32); } } } None } fn get_available_models_from_json(account_path: &PathBuf) -> Option> { let content = std::fs::read_to_string(account_path).ok()?; let account: serde_json::Value = serde_json::from_str(&content).ok()?; let models = account.get("quota")?.get("models")?.as_array()?; let mut result = HashSet::new(); for model in models { if let Some(name) = model.get("name").and_then(|v| v.as_str()) { let normalized = name.trim().to_lowercase(); if !normalized.is_empty() { result.insert(normalized); } } } Some(result) } fn build_dynamic_model_candidates(model_name: &str) -> Option> { let model = model_name.trim().to_lowercase(); if model.is_empty() { return None; } let pro_family = [ "gemini-3-pro", "gemini-3-pro-preview", "gemini-3-pro-high", "gemini-3-pro-low", "gemini-3.1-pro", "gemini-3.1-pro-preview", "gemini-3.1-pro-high", "gemini-3.1-pro-low", ]; if !pro_family.contains(&model.as_str()) { return None; } let mut out = Vec::new(); let mut seen = HashSet::new(); let mut push = |candidate: &str| { let c = candidate.to_string(); if seen.insert(c.clone()) { out.push(c); } }; // Keep requested model as top priority, then fallback across the same family. push(&model); push("gemini-3.1-pro-preview"); push("gemini-3-pro-preview"); push("gemini-3.1-pro-high"); push("gemini-3-pro-high"); push("gemini-3.1-pro-low"); push("gemini-3-pro-low"); Some(out) } pub async fn resolve_dynamic_model_for_account( &self, account_id: &str, mapped_model: &str, ) -> String { let candidates = match Self::build_dynamic_model_candidates(mapped_model) { Some(c) => c, None => return mapped_model.to_string(), }; let account_path = match self.tokens.get(account_id) { Some(token) => token.account_path.clone(), None => return mapped_model.to_string(), }; let available_models = match Self::get_available_models_from_json(&account_path) { Some(models) if !models.is_empty() => models, _ => return mapped_model.to_string(), }; for candidate in candidates { if available_models.contains(&candidate) { if candidate != mapped_model.to_lowercase() { tracing::info!( "[Dynamic-Model-Rewrite] account={} {} -> {}", account_id, mapped_model, candidate ); } return candidate; } } mapped_model.to_string() } /// 测试辅助函数：公开访问 get_model_quota_from_json #[cfg(test)] pub fn get_model_quota_from_json_for_test(account_path: &PathBuf, model_name: &str) -> Option { Self::get_model_quota_from_json(account_path, model_name) } /// 触发配额保护，限制特定模型 (Issue #621) /// 返回 true 如果发生了改变 async fn trigger_quota_protection( &self, account_json: &mut serde_json::Value, account_id: &str, account_path: &PathBuf, current_val: i32, threshold: i32, model_name: &str, ) -> Result { // 1. 初始化 protected_models 数组（如果不存在） if account_json.get("protected_models").is_none() { account_json["protected_models"] = serde_json::Value::Array(Vec::new()); } let protected_models = account_json["protected_models"].as_array_mut().unwrap(); // 2. 检查是否已存在 if !protected_models .iter() .any(|m| m.as_str() == Some(model_name)) { protected_models.push(serde_json::Value::String(model_name.to_string())); tracing::info!( "账号 {} 的模型 {} 因配额受限（{}% <= {}%）已被加入保护列表", account_id, model_name, current_val, threshold ); // 3. 写入磁盘 std::fs::write(account_path, serde_json::to_string_pretty(account_json).unwrap()) .map_err(|e| format!("写入文件失败: {}", e))?; // [FIX] 触发 TokenManager 的账号重新加载信号，确保内存中的 protected_models 同步 crate::proxy::server::trigger_account_reload(account_id); return Ok(true); } Ok(false) } /// 检查并从账号级保护恢复（迁移至模型级，Issue #621） async fn check_and_restore_quota( &self, account_json: &mut serde_json::Value, account_path: &PathBuf, quota: &serde_json::Value, config: &crate::models::QuotaProtectionConfig, ) -> bool { // [兼容性] 如果该账号当前处于 proxy_disabled=true 且原因是 quota_protection， // 我们将其 proxy_disabled 设为 false，但同时更新其 protected_models 列表。 tracing::info!( "正在迁移账号 {} 从全局配额保护模式至模型级保护模式", account_json .get("email") .and_then(|v| v.as_str()) .unwrap_or("unknown") ); account_json["proxy_disabled"] = serde_json::Value::Bool(false); account_json["proxy_disabled_reason"] = serde_json::Value::Null; account_json["proxy_disabled_at"] = serde_json::Value::Null; let threshold = config.threshold_percentage as i32; let mut protected_list = Vec::new(); if let Some(models) = quota.get("models").and_then(|m| m.as_array()) { for model in models { let name = model.get("name").and_then(|v| v.as_str()).unwrap_or(""); if !config.monitored_models.iter().any(|m| m == name) { continue; } let percentage = model.get("percentage").and_then(|v| v.as_i64()).unwrap_or(0) as i32; if percentage <= threshold { protected_list.push(serde_json::Value::String(name.to_string())); } } } account_json["protected_models"] = serde_json::Value::Array(protected_list); let _ = std::fs::write(account_path, serde_json::to_string_pretty(account_json).unwrap()); false // 返回 false 表示现在已可以尝试加载该账号（模型级过滤会在 get_token 时发生） } /// 恢复特定模型的配额保护 (Issue #621) /// 返回 true 如果发生了改变 async fn restore_quota_protection( &self, account_json: &mut serde_json::Value, account_id: &str, account_path: &PathBuf, model_name: &str, ) -> Result { if let Some(arr) = account_json .get_mut("protected_models") .and_then(|v| v.as_array_mut()) { let original_len = arr.len(); arr.retain(|m| m.as_str() != Some(model_name)); if arr.len() < original_len { tracing::info!( "账号 {} 的模型 {} 配额已恢复，移出保护列表", account_id, model_name ); std::fs::write( account_path, serde_json::to_string_pretty(account_json).unwrap(), ) .map_err(|e| format!("写入文件失败: {}", e))?; return Ok(true); } } Ok(false) } /// P2C 算法的候选池大小 - 从前 N 个最优候选中随机选择 const P2C_POOL_SIZE: usize = 5; /// Power of 2 Choices (P2C) 选择算法 /// 从前 5 个候选中随机选 2 个，选择配额更高的 -> 避免热点 /// 返回选中的索引 /// /// # 参数 /// * `candidates` - 已排序的候选 token 列表 /// * `attempted` - 已尝试失败的账号 ID 集合 /// * `normalized_target` - 归一化后的目标模型名 /// * `quota_protection_enabled` - 是否启用配额保护 fn select_with_p2c<'a>( &self, candidates: &'a [ProxyToken], attempted: &HashSet, normalized_target: &str, quota_protection_enabled: bool, ) -> Option<&'a ProxyToken> { use rand::Rng; // 过滤可用 token let available: Vec<&ProxyToken> = candidates.iter() .filter(|t| !attempted.contains(&t.account_id)) .filter(|t| !quota_protection_enabled || !t.protected_models.contains(normalized_target)) .collect(); if available.is_empty() { return None; } if available.len() == 1 { return Some(available[0]); } // P2C: 从前 min(P2C_POOL_SIZE, len) 个中随机选 2 个 let pool_size = available.len().min(Self::P2C_POOL_SIZE); let mut rng = rand::thread_rng(); let pick1 = rng.gen_range(0..pool_size); let pick2 = rng.gen_range(0..pool_size); // 确保选择不同的两个候选 let pick2 = if pick2 == pick1 { (pick1 + 1) % pool_size } else { pick2 }; let c1 = available[pick1]; let c2 = available[pick2]; // 选择配额更高的 let selected = if c1.remaining_quota.unwrap_or(0) >= c2.remaining_quota.unwrap_or(0) { c1 } else { c2 }; tracing::debug!( "🎲 [P2C] Selected {} ({}%) from [{}({}%), {}({}%)]", selected.email, selected.remaining_quota.unwrap_or(0), c1.email, c1.remaining_quota.unwrap_or(0), c2.email, c2.remaining_quota.unwrap_or(0) ); Some(selected) } /// 先发送取消信号，再带超时等待任务完成 /// /// # 参数 /// * `timeout` - 等待任务完成的超时时间 pub async fn graceful_shutdown(&self, timeout: std::time::Duration) { tracing::info!("Initiating graceful shutdown of background tasks..."); // 发送取消信号给所有后台任务 self.cancel_token.cancel(); // 带超时等待任务完成 match tokio::time::timeout(timeout, self.abort_background_tasks()).await { Ok(_) => tracing::info!("All background tasks cleaned up gracefully"), Err(_) => tracing::warn!("Graceful cleanup timed out after {:?}, tasks were force-aborted", timeout), } } /// 中止并等待所有后台任务完成 /// abort() 仅设置取消标志，必须 await 确认清理完成 pub async fn abort_background_tasks(&self) { Self::abort_task(&self.auto_cleanup_handle, "Auto-cleanup task").await; } /// 中止单个后台任务并记录结果 /// /// # 参数 /// * `handle` - 任务句柄的 Mutex 引用 /// * `task_name` - 任务名称（用于日志） async fn abort_task( handle: &tokio::sync::Mutex>>, task_name: &str, ) { let Some(handle) = handle.lock().await.take() else { return; }; handle.abort(); match handle.await { Ok(()) => tracing::debug!("{} completed", task_name), Err(e) if e.is_cancelled() => tracing::info!("{} aborted", task_name), Err(e) => tracing::warn!("{} error: {}", task_name, e), } } /// 获取当前可用的 Token（支持粘性会话与智能调度） /// 参数 `quota_group` 用于区分 "claude" vs "gemini" 组 /// 参数 `force_rotate` 为 true 时将忽略锁定，强制切换账号 /// 参数 `session_id` 用于跨请求维持会话粘性 /// 参数 `target_model` 用于检查配额保护 (Issue #621) pub async fn get_token( &self, quota_group: &str, force_rotate: bool, session_id: Option<&str>, target_model: &str, ) -> Result<(String, String, String, String, u64), String> { // [FIX] 检查并处理待重新加载的账号（配额保护同步） let pending_reload = crate::proxy::server::take_pending_reload_accounts(); for account_id in pending_reload { if let Err(e) = self.reload_account(&account_id).await { tracing::warn!("[Quota] Failed to reload account {}: {}", account_id, e); } else { tracing::info!( "[Quota] Reloaded account {} (protected_models synced)", account_id ); } } // [FIX #1477] 检查并处理待删除的账号（彻底清理缓存） let pending_delete = crate::proxy::server::take_pending_delete_accounts(); for account_id in pending_delete { self.remove_account(&account_id); tracing::info!( "[Proxy] Purged deleted account {} from all caches", account_id ); } // 【优化 Issue #284】添加 5 秒超时，防止死锁 let timeout_duration = std::time::Duration::from_secs(5); match tokio::time::timeout( timeout_duration, self.get_token_internal(quota_group, force_rotate, session_id, target_model), ) .await { Ok(result) => result, Err(_) => Err( "Token acquisition timeout (5s) - system too busy or deadlock detected".to_string(), ), } } /// 内部实现：获取 Token 的核心逻辑 async fn get_token_internal( &self, quota_group: &str, force_rotate: bool, session_id: Option<&str>, target_model: &str, ) -> Result<(String, String, String, String, u64), String> { let mut tokens_snapshot: Vec = self.tokens.iter().map(|e| e.value().clone()).collect(); let mut total = tokens_snapshot.len(); if total == 0 { return Err("Token pool is empty".to_string()); } // [NEW] 1. 动态能力过滤 (Capability Filter) // 定义常量 const RESET_TIME_THRESHOLD_SECS: i64 = 600; // 10 分钟阈值 // 归一化目标模型名为标准 ID let normalized_target = crate::proxy::common::model_mapping::normalize_to_standard_id(target_model) .unwrap_or_else(|| target_model.to_string()); // 仅保留明确拥有该模型配额的账号 // 这一步确保了 "保证有模型才可以进入轮询"，特别是对 Opus 4.6 等高端模型 let candidate_count_before = tokens_snapshot.len(); // 此处假设所有受支持的模型都会出现在 model_quotas 中 // 如果 API 返回的配额信息不完整，可能会导致误杀，但为了严格性，我们执行此过滤 tokens_snapshot.retain(|t| t.model_quotas.contains_key(&normalized_target)); if tokens_snapshot.is_empty() { if candidate_count_before > 0 { // 如果过滤前有账号，过滤后没了，说明所有账号都没有该模型的配额 tracing::warn!("No accounts have satisfied quota for model: {}", normalized_target); return Err(format!("No accounts available with quota for model: {}", normalized_target)); } return Err("Token pool is empty".to_string()); } tokens_snapshot.sort_by(|a, b| { // Priority 0: 严格的订阅等级排序 (ULTRA > PRO > FREE) // 用户要求：轮询应当遵循 Ultra -> Pro -> Free // 既然已经过滤掉了不支持该模型的账号，剩下的都是支持的 // 此时我们优先使用高级订阅 let tier_priority = |tier: &Option| { let t = tier.as_deref().unwrap_or("").to_lowercase(); if t.contains("ultra") { 0 } else if t.contains("pro") { 1 } else if t.contains("free") { 2 } else { 3 } }; let tier_cmp = tier_priority(&a.subscription_tier) .cmp(&tier_priority(&b.subscription_tier)); if tier_cmp != std::cmp::Ordering::Equal { return tier_cmp; } // Priority 1: 目标模型的 quota (higher is better) -> 保护低配额账号 // 经过过滤，key 肯定存在 let quota_a = a.model_quotas.get(&normalized_target).copied().unwrap_or(0); let quota_b = b.model_quotas.get(&normalized_target).copied().unwrap_or(0); let quota_cmp = quota_b.cmp("a_a); if quota_cmp != std::cmp::Ordering::Equal { return quota_cmp; } // Priority 2: Health score (higher is better) let health_cmp = b.health_score.partial_cmp(&a.health_score) .unwrap_or(std::cmp::Ordering::Equal); if health_cmp != std::cmp::Ordering::Equal { return health_cmp; } // Priority 3: Reset time (earlier is better, but only if diff > 10 min) let reset_a = a.reset_time.unwrap_or(i64::MAX); let reset_b = b.reset_time.unwrap_or(i64::MAX); if (reset_a - reset_b).abs() >= RESET_TIME_THRESHOLD_SECS { reset_a.cmp(&reset_b) } else { std::cmp::Ordering::Equal } }); // 【调试日志】打印排序后的账号顺序（显示目标模型的 quota） tracing::debug!( "🔄 [Token Rotation] target={} Accounts: {:?}", normalized_target, tokens_snapshot.iter().map(|t| format!( "{}(quota={}%, reset={:?}, health={:.2})", t.email, t.model_quotas.get(&normalized_target).copied().unwrap_or(0), t.reset_time.map(|ts| { let now = chrono::Utc::now().timestamp(); let diff_secs = ts - now; if diff_secs > 0 { format!("{}m", diff_secs / 60) } else { "now".to_string() } }), t.health_score )).collect::>() ); // 0. 读取当前调度配置 let scheduling = self.sticky_config.read().await.clone(); use crate::proxy::sticky_config::SchedulingMode; // 【新增】检查配额保护是否启用（如果关闭，则忽略 protected_models 检查） let quota_protection_enabled = crate::modules::config::load_app_config() .map(|cfg| cfg.quota_protection.enabled) .unwrap_or(false); // ===== [FIX #820] 固定账号模式：优先使用指定账号 ===== let preferred_id = self.preferred_account_id.read().await.clone(); if let Some(ref pref_id) = preferred_id { // 查找优先账号 if let Some(preferred_token) = tokens_snapshot .iter() .find(|t| &t.account_id == pref_id) .cloned() { // 检查账号是否可用（未限流、未被配额保护） match Self::get_account_state_on_disk(&preferred_token.account_path).await { OnDiskAccountState::Disabled => { tracing::warn!( "🔒 [FIX #820] Preferred account {} is disabled on disk, purging and falling back", preferred_token.email ); self.remove_account(&preferred_token.account_id); tokens_snapshot.retain(|t| t.account_id != preferred_token.account_id); total = tokens_snapshot.len(); { let mut preferred = self.preferred_account_id.write().await; if preferred.as_deref() == Some(pref_id.as_str()) { *preferred = None; } } if total == 0 { return Err("Token pool is empty".to_string()); } } OnDiskAccountState::Unknown => { tracing::warn!( "🔒 [FIX #820] Preferred account {} state on disk is unavailable, falling back", preferred_token.email ); // Don't purge on transient read/parse failures; just skip this token for this request. tokens_snapshot.retain(|t| t.account_id != preferred_token.account_id); total = tokens_snapshot.len(); if total == 0 { return Err("Token pool is empty".to_string()); } } OnDiskAccountState::Enabled => { let normalized_target = crate::proxy::common::model_mapping::normalize_to_standard_id( target_model, ) .unwrap_or_else(|| target_model.to_string()); let is_rate_limited = self .is_rate_limited(&preferred_token.account_id, Some(&normalized_target)) .await; let is_quota_protected = quota_protection_enabled && preferred_token .protected_models .contains(&normalized_target); if !is_rate_limited && !is_quota_protected { tracing::info!( "🔒 [FIX #820] Using preferred account: {} (fixed mode)", preferred_token.email ); // 直接使用优先账号，跳过轮询逻辑 let mut token = preferred_token.clone(); // [NEW] 检查 token 是否过期（调整刷新时机对齐官方：90s 宽限期） let now = chrono::Utc::now().timestamp(); if now >= token.timestamp - 90 { // [NEW] 双重检查锁定逻辑 (Double-Checked Locking) // 1. 获取（或创建）该账号专属的刷新锁 let refresh_mu = self.refresh_locks.entry(token.account_id.clone()) .or_insert_with(|| Arc::new(tokio::sync::Mutex::new(()))) .clone(); // 2. 尝试获取锁 let _guard = refresh_mu.lock().await; // 3. 再次检查本账号最新状态（可能已被其他并发请求刷新完毕） let latest_token_opt = self.tokens.get(&token.account_id).map(|r| r.clone()); if let Some(latest) = latest_token_opt { if now < latest.timestamp - 90 { // 已经被别人刷过了，同步最新数据并跳过刷新动作 token = latest.clone(); tracing::debug!("账号 {} 已由并发线程刷新，跳过重复刷新", token.email); } else { // 确实需要刷新 tracing::debug!("账号 {} 的 token 即将过期 ({}s)，正在刷新...", token.email, token.timestamp - now); match crate::modules::oauth::refresh_access_token(&token.refresh_token, Some(&token.account_id)) .await { Ok(token_response) => { token.access_token = token_response.access_token.clone(); token.expires_in = token_response.expires_in; token.timestamp = now + token_response.expires_in; if let Some(mut entry) = self.tokens.get_mut(&token.account_id) { entry.access_token = token.access_token.clone(); entry.expires_in = token.expires_in; entry.timestamp = token.timestamp; } let _ = self .save_refreshed_token(&token.account_id, &token_response) .await; } Err(e) => { tracing::warn!("Preferred account token refresh failed: {}", e); // 继续使用旧 token，让后续逻辑处理失败 } } } } } // 确保有 project_id (filter empty strings to trigger re-fetch) let project_id = if let Some(pid) = &token.project_id { if pid.is_empty() { None } else { Some(pid.clone()) } } else { None }; let project_id = if let Some(pid) = project_id { pid } else { match crate::proxy::project_resolver::fetch_project_id(&token.access_token) .await { Ok(pid) => { if let Some(mut entry) = self.tokens.get_mut(&token.account_id) { entry.project_id = Some(pid.clone()); } let _ = self.save_project_id(&token.account_id, &pid).await; pid } Err(_) => "bamboo-precept-lgxtn".to_string(), // fallback } }; return Ok((token.access_token, project_id, token.email, token.account_id, 0)); } else { if is_rate_limited { tracing::warn!("🔒 [FIX #820] Preferred account {} is rate-limited, falling back to round-robin", preferred_token.email); } else { tracing::warn!("🔒 [FIX #820] Preferred account {} is quota-protected for {}, falling back to round-robin", preferred_token.email, target_model); } } } } } else { tracing::warn!("🔒 [FIX #820] Preferred account {} not found in pool, falling back to round-robin", pref_id); } } // ===== [END FIX #820] ===== // 【优化 Issue #284】将锁操作移到循环外，避免重复获取锁 // 预先获取 last_used_account 的快照，避免在循环中多次加锁 let last_used_account_id = if quota_group != "image_gen" { let last_used = self.last_used_account.lock().await; last_used.clone() } else { None }; let mut attempted: HashSet = HashSet::new(); let mut last_error: Option = None; let mut need_update_last_used: Option<(String, std::time::Instant)> = None; for attempt in 0..total { let rotate = force_rotate || attempt > 0; // ===== 【核心】粘性会话与智能调度逻辑 ===== let mut target_token: Option = None; // 归一化目标模型名为标准 ID，用于配额保护检查 let normalized_target = crate::proxy::common::model_mapping::normalize_to_standard_id(target_model) .unwrap_or_else(|| target_model.to_string()); // 模式 A: 粘性会话处理 (CacheFirst 或 Balance 且有 session_id) if !rotate && session_id.is_some() && scheduling.mode != SchedulingMode::PerformanceFirst { let sid = session_id.unwrap(); // 1. 检查会话是否已绑定账号 if let Some(bound_id) = self.session_accounts.get(sid).map(|v| v.clone()) { // 【修复】先通过 account_id 找到对应的账号，获取其 email // 2. 转换 email -> account_id 检查绑定的账号是否限流 if let Some(bound_token) = tokens_snapshot.iter().find(|t| t.account_id == bound_id) { let key = self .email_to_account_id(&bound_token.email) .unwrap_or_else(|| bound_token.account_id.clone()); // [FIX] Pass None for specific model wait time if not applicable let reset_sec = self.rate_limit_tracker.get_remaining_wait(&key, None); if reset_sec > 0 { // 【修复 Issue #284】立即解绑并切换账号，不再阻塞等待 // 原因：阻塞等待会导致并发请求时客户端 socket 超时 (UND_ERR_SOCKET) tracing::debug!( "Sticky Session: Bound account {} is rate-limited ({}s), unbinding and switching.", bound_token.email, reset_sec ); self.session_accounts.remove(sid); } else if !attempted.contains(&bound_id) && !(quota_protection_enabled && bound_token.protected_models.contains(&normalized_target)) { // 3. 账号可用且未被标记为尝试失败，优先复用 tracing::debug!("Sticky Session: Successfully reusing bound account {} for session {}", bound_token.email, sid); target_token = Some(bound_token.clone()); } else if quota_protection_enabled && bound_token.protected_models.contains(&normalized_target) { tracing::debug!("Sticky Session: Bound account {} is quota-protected for model {} [{}], unbinding and switching.", bound_token.email, normalized_target, target_model); self.session_accounts.remove(sid); } } else { // 绑定的账号已不存在（可能被删除），解绑 tracing::debug!( "Sticky Session: Bound account not found for session {}, unbinding", sid ); self.session_accounts.remove(sid); } } } // 模式 B: 原子化 60s 全局锁定 (针对无 session_id 情况的默认保护) // 【修复】性能优先模式应跳过 60s 锁定； if target_token.is_none() && !rotate && quota_group != "image_gen" && scheduling.mode != SchedulingMode::PerformanceFirst { // 【优化】使用预先获取的快照，不再在循环内加锁 if let Some((account_id, last_time)) = &last_used_account_id { // [FIX #3] 60s 锁定逻辑应检查 `attempted` 集合，避免重复尝试失败的账号 if last_time.elapsed().as_secs() < 60 && !attempted.contains(account_id) { if let Some(found) = tokens_snapshot.iter().find(|t| &t.account_id == account_id) { // 【修复】检查限流状态和配额保护，避免复用已被锁定的账号 if !self .is_rate_limited(&found.account_id, Some(&normalized_target)) .await && !(quota_protection_enabled && found.protected_models.contains(&normalized_target)) { tracing::debug!( "60s Window: Force reusing last account: {}", found.email ); target_token = Some(found.clone()); } else { if self .is_rate_limited(&found.account_id, Some(&normalized_target)) .await { tracing::debug!( "60s Window: Last account {} is rate-limited, skipping", found.email ); } else { tracing::debug!("60s Window: Last account {} is quota-protected for model {} [{}], skipping", found.email, normalized_target, target_model); } } } } } // 若无锁定，则使用 P2C 选择账号 (避免热点问题) if target_token.is_none() { // 先过滤出未限流的账号 let mut non_limited: Vec = Vec::new(); for t in &tokens_snapshot { if !self.is_rate_limited(&t.account_id, Some(&normalized_target)).await { non_limited.push(t.clone()); } } if let Some(selected) = self.select_with_p2c( &non_limited, &attempted, &normalized_target, quota_protection_enabled ) { target_token = Some(selected.clone()); need_update_last_used = Some((selected.account_id.clone(), std::time::Instant::now())); // 如果是会话首次分配且需要粘性，在此建立绑定 if let Some(sid) = session_id { if scheduling.mode != SchedulingMode::PerformanceFirst { self.session_accounts .insert(sid.to_string(), selected.account_id.clone()); tracing::debug!( "Sticky Session: Bound new account {} to session {}", selected.email, sid ); } } } } } else if target_token.is_none() { // 模式 C: P2C 选择 (替代纯轮询) tracing::debug!( "🔄 [Mode C] P2C selection from {} candidates", total ); // 先过滤出未限流的账号 let mut non_limited: Vec = Vec::new(); for t in &tokens_snapshot { if !self.is_rate_limited(&t.account_id, Some(&normalized_target)).await { non_limited.push(t.clone()); } } if let Some(selected) = self.select_with_p2c( &non_limited, &attempted, &normalized_target, quota_protection_enabled ) { tracing::debug!(" {} - SELECTED via P2C", selected.email); target_token = Some(selected.clone()); if rotate { tracing::debug!("Force Rotation: Switched to account: {}", selected.email); } } } let mut token = match target_token { Some(t) => t, None => { // 乐观重置策略: 双层防护机制 // 计算最短等待时间 let min_wait = tokens_snapshot .iter() .filter_map(|t| self.rate_limit_tracker.get_reset_seconds(&t.account_id)) .min(); // Layer 1: 如果最短等待时间 <= 2秒,执行缓冲延迟 if let Some(wait_sec) = min_wait { if wait_sec <= 2 { let wait_ms = (wait_sec as f64 * 1000.0) as u64; tracing::warn!( "All accounts rate-limited but shortest wait is {}s. Applying {}ms buffer for state sync...", wait_sec, wait_ms ); // 缓冲延迟 tokio::time::sleep(tokio::time::Duration::from_millis(wait_ms)).await; // 重新尝试选择账号 let retry_token = tokens_snapshot.iter() .find(|t| !attempted.contains(&t.account_id) && !self.is_rate_limited_sync(&t.account_id, Some(&normalized_target)) && !(quota_protection_enabled && t.protected_models.contains(&normalized_target))); if let Some(t) = retry_token { tracing::info!( "✅ Buffer delay successful! Found available account: {}", t.email ); t.clone() } else { // Layer 2: 缓冲后仍无可用账号,执行乐观重置 tracing::warn!( "Buffer delay failed. Executing optimistic reset for all {} accounts...", tokens_snapshot.len() ); // 清除所有限流记录 self.rate_limit_tracker.clear_all(); // 再次尝试选择账号 let final_token = tokens_snapshot .iter() .find(|t| !attempted.contains(&t.account_id) && !(quota_protection_enabled && t.protected_models.contains(&normalized_target))); if let Some(t) = final_token { tracing::info!( "✅ Optimistic reset successful! Using account: {}", t.email ); t.clone() } else { return Err( "All accounts failed after optimistic reset.".to_string() ); } } } else { return Err(format!("All accounts limited. Wait {}s.", wait_sec)); } } else { return Err("All accounts failed or unhealthy.".to_string()); } } }; // Safety net: avoid selecting an account that has been disabled on disk but still // exists in the in-memory snapshot (e.g. stale cache + sticky session binding). match Self::get_account_state_on_disk(&token.account_path).await { OnDiskAccountState::Disabled => { tracing::warn!( "Selected account {} is disabled on disk, purging and retrying", token.email ); attempted.insert(token.account_id.clone()); self.remove_account(&token.account_id); continue; } OnDiskAccountState::Unknown => { tracing::warn!( "Selected account {} state on disk is unavailable, skipping", token.email ); attempted.insert(token.account_id.clone()); continue; } OnDiskAccountState::Enabled => {} } // 3. [NEW] 检查 token 是否过期（调整刷新时机对齐官方：90s 宽限期） let now = chrono::Utc::now().timestamp(); if now >= token.timestamp - 90 { // [NEW] 双重检查锁定逻辑 (Double-Checked Locking) let refresh_mu = self.refresh_locks.entry(token.account_id.clone()) .or_insert_with(|| Arc::new(tokio::sync::Mutex::new(()))) .clone(); let _guard = refresh_mu.lock().await; // 再次检查最新状态 let latest_token_opt = self.tokens.get(&token.account_id).map(|r| r.clone()); if let Some(latest) = latest_token_opt { if now < latest.timestamp - 90 { token = latest.clone(); tracing::debug!("账号 {} 已由并发线程在循环中刷新，跳过", token.email); } else { tracing::debug!("账号 {} 的 token 即将过期，正在执行主路径刷新...", token.email); // 调用 OAuth 刷新 token match crate::modules::oauth::refresh_access_token(&token.refresh_token, Some(&token.account_id)).await { Ok(token_response) => { tracing::debug!("Token 刷新成功！"); token.access_token = token_response.access_token.clone(); token.expires_in = token_response.expires_in; token.timestamp = now + token_response.expires_in; if let Some(mut entry) = self.tokens.get_mut(&token.account_id) { entry.access_token = token.access_token.clone(); entry.expires_in = token.expires_in; entry.timestamp = token.timestamp; } let _ = self.save_refreshed_token(&token.account_id, &token_response).await; } Err(e) => { tracing::error!("Token 刷新失败 ({}): {}，尝试下一个账号", token.email, e); if e.contains("\"invalid_grant\"") || e.contains("invalid_grant") { self.disable_account(&token.account_id, &format!("invalid_grant: {}", e)).await; } last_error = Some(format!("Token refresh failed: {}", e)); attempted.insert(token.account_id.clone()); if quota_group != "image_gen" && matches!(&last_used_account_id, Some((id, _)) if id == &token.account_id) { need_update_last_used = Some((String::new(), std::time::Instant::now())); } continue; } } } } } // 4. [ENHANCED] 确保有 project_id (使用锁保护 fetch 动作) let project_id = if let Some(pid) = &token.project_id { if pid.is_empty() { None } else { Some(pid.clone()) } } else { None }; let project_id = if let Some(pid) = project_id { pid } else { // [NEW] 针对 fetch_project_id 实现基于 SingleFlight 的异步合并 // 1. 检查是否已有 inflight 请求 let (mut rx, is_new) = { if let Some(existing_rx) = self.load_code_assist_inflight.get(&token.account_id) { (existing_rx.value().clone(), false) } else { // 创建新的 inflight 频道 let (tx, rx) = tokio::sync::watch::channel(None); self.load_code_assist_inflight.insert(token.account_id.clone(), rx.clone()); (rx, true) } }; if is_new { // 仅由“第一个发现者”执行真实请求 tracing::debug!("账号 {} 启动 [SingleFlight] ProjectID 探测...", token.email); let result = match crate::proxy::project_resolver::fetch_project_id(&token.access_token).await { Ok(pid) => { if let Some(mut entry) = self.tokens.get_mut(&token.account_id) { entry.project_id = Some(pid.clone()); let _ = self.save_project_id(&token.account_id, &pid).await; } Ok(pid) } Err(e) => Err(e), }; // 广播结果并清理 inflight if let Some(mut entry) = self.load_code_assist_inflight.get_mut(&token.account_id) { // 这里虽然是 rx，但在 Rust 中 watch 不需要 tx 也可以通过私有方式操作？ // 修正：我们需要持有 tx。重新设计此处：使用 Mutex 或在 scope 外持有 tx。 // 由于 DashMap 不能存不可克隆的 tx，我们改用 Mutex 保护的流程或直接在 if is_new 里执行 } // 【修正实现方案】: 对于 project_id 这种高频探测，仍然使用 refresh_mu 锁是最高效的， // 但我们要加入“强制异步等待”逻辑。由于之前的 Mutex 已经是异步的， // 我们只需确保 fetch_project_id 调用被包裹在锁内并且有 double-check。 // 之前的代码已经做到了这一点。 // 为了完全对齐 agent-vibes 的 singleFlight 语义（即不仅是锁，还要有“结果复用”）， // 我将保留之前的逻辑但移除不必要的重复日志。 let refresh_mu = self.refresh_locks.entry(token.account_id.clone()) .or_insert_with(|| Arc::new(tokio::sync::Mutex::new(()))) .clone(); let _guard = refresh_mu.lock().await; if let Some(mut entry) = self.tokens.get_mut(&token.account_id) { if let Some(pid) = &entry.project_id { if !pid.is_empty() { pid.clone() } else { match crate::proxy::project_resolver::fetch_project_id(&entry.access_token).await { Ok(pid) => { entry.project_id = Some(pid.clone()); let _ = self.save_project_id(&token.account_id, &pid).await; pid } Err(_) => "bamboo-precept-lgxtn".to_string(), } } } else { "bamboo-precept-lgxtn".to_string() } } else { "bamboo-precept-lgxtn".to_string() } } else { // 如果不是第一个，则等待结果 (虽然在 Mutex 模式下不需要 rx，但为了严谨性我们可以保留锁) let refresh_mu = self.refresh_locks.get(&token.account_id).map(|v| v.value().clone()); if let Some(mu) = refresh_mu { let _guard = mu.lock().await; } self.tokens.get(&token.account_id) .and_then(|t| t.project_id.clone()) .unwrap_or_else(|| "bamboo-precept-lgxtn".to_string()) } }; // 【优化】在成功返回前，统一更新 last_used_account（如果需要） if let Some((new_account_id, new_time)) = need_update_last_used { if quota_group != "image_gen" { let mut last_used = self.last_used_account.lock().await; if new_account_id.is_empty() { // 空字符串表示需要清除锁定 *last_used = None; } else { *last_used = Some((new_account_id, new_time)); } } } return Ok((token.access_token, project_id, token.email, token.account_id, 0)); } Err(last_error.unwrap_or_else(|| "All accounts failed".to_string())) } async fn disable_account(&self, account_id: &str, reason: &str) -> Result<(), String> { let path = if let Some(entry) = self.tokens.get(account_id) { entry.account_path.clone() } else { self.data_dir .join("accounts") .join(format!("{}.json", account_id)) }; let mut content: serde_json::Value = serde_json::from_str( &std::fs::read_to_string(&path).map_err(|e| format!("读取文件失败: {}", e))?, ) .map_err(|e| format!("解析 JSON 失败: {}", e))?; let now = chrono::Utc::now().timestamp(); content["disabled"] = serde_json::Value::Bool(true); content["disabled_at"] = serde_json::Value::Number(now.into()); content["disabled_reason"] = serde_json::Value::String(truncate_reason(reason, 800)); std::fs::write(&path, serde_json::to_string_pretty(&content).unwrap()) .map_err(|e| format!("写入文件失败: {}", e))?; // 【修复 Issue #3】从内存中移除禁用的账号，防止被60s锁定逻辑继续使用 self.tokens.remove(account_id); tracing::warn!("Account disabled: {} ({:?})", account_id, path); Ok(()) } /// 保存 project_id 到账号文件 async fn save_project_id(&self, account_id: &str, project_id: &str) -> Result<(), String> { let entry = self.tokens.get(account_id) .ok_or("账号不存在")?; let path = &entry.account_path; let mut content: serde_json::Value = serde_json::from_str( &std::fs::read_to_string(path).map_err(|e| format!("读取文件失败: {}", e))? ).map_err(|e| format!("解析 JSON 失败: {}", e))?; content["token"]["project_id"] = serde_json::Value::String(project_id.to_string()); std::fs::write(path, serde_json::to_string_pretty(&content).unwrap()) .map_err(|e| format!("写入文件失败: {}", e))?; tracing::debug!("已保存 project_id 到账号 {}", account_id); Ok(()) } /// 保存刷新后的 token 到账号文件 async fn save_refreshed_token(&self, account_id: &str, token_response: &crate::modules::oauth::TokenResponse) -> Result<(), String> { let entry = self.tokens.get(account_id) .ok_or("账号不存在")?; let path = &entry.account_path; let mut content: serde_json::Value = serde_json::from_str( &std::fs::read_to_string(path).map_err(|e| format!("读取文件失败: {}", e))? ).map_err(|e| format!("解析 JSON 失败: {}", e))?; let now = chrono::Utc::now().timestamp(); content["token"]["access_token"] = serde_json::Value::String(token_response.access_token.clone()); content["token"]["expires_in"] = serde_json::Value::Number(token_response.expires_in.into()); content["token"]["expiry_timestamp"] = serde_json::Value::Number((now + token_response.expires_in).into()); std::fs::write(path, serde_json::to_string_pretty(&content).unwrap()) .map_err(|e| format!("写入文件失败: {}", e))?; tracing::debug!("已保存刷新后的 token 到账号 {}", account_id); Ok(()) } pub fn len(&self) -> usize { self.tokens.len() } /// 通过 email 获取指定账号的 Token（用于预热等需要指定账号的场景） /// 此方法会自动刷新过期的 token pub async fn get_token_by_email( &self, email: &str, ) -> Result<(String, String, String, String, u64), String> { // 查找账号信息 let token_info = { let mut found = None; for entry in self.tokens.iter() { let token = entry.value(); if token.email == email { found = Some(( token.account_id.clone(), token.access_token.clone(), token.refresh_token.clone(), token.timestamp, token.expires_in, chrono::Utc::now().timestamp(), token.project_id.clone(), )); break; } } found }; let ( account_id, current_access_token, refresh_token, timestamp, expires_in, now, project_id_opt, ) = match token_info { Some(info) => info, None => return Err(format!("未找到账号: {}", email)), }; let project_id = project_id_opt .filter(|s| !s.is_empty()) .unwrap_or_else(|| "bamboo-precept-lgxtn".to_string()); // 检查是否过期 (提前5分钟) if now < timestamp + expires_in - 300 { return Ok((current_access_token, project_id, email.to_string(), account_id, 0)); } tracing::info!("[Warmup] Token for {} is expiring, refreshing...", email); // 调用 OAuth 刷新 token match crate::modules::oauth::refresh_access_token(&refresh_token, Some(&account_id)).await { Ok(token_response) => { tracing::info!("[Warmup] Token refresh successful for {}", email); let new_now = chrono::Utc::now().timestamp(); // 更新缓存 if let Some(mut entry) = self.tokens.get_mut(&account_id) { entry.access_token = token_response.access_token.clone(); entry.expires_in = token_response.expires_in; entry.timestamp = new_now; } // 保存到磁盘 let _ = self .save_refreshed_token(&account_id, &token_response) .await; Ok(( token_response.access_token, project_id, email.to_string(), account_id, 0, )) } Err(e) => Err(format!( "[Warmup] Token refresh failed for {}: {}", email, e )), } } // ===== 限流管理方法 ===== /// 标记账号限流(从外部调用,通常在 handler 中) /// 参数为 email，内部会自动转换为 account_id pub async fn mark_rate_limited( &self, email: &str, status: u16, retry_after_header: Option<&str>, error_body: &str, ) { // [NEW] 检查熔断是否启用 (使用内存缓存，极快) let config = self.circuit_breaker_config.read().await.clone(); if !config.enabled { return; } // 【替代方案】转换 email -> account_id let key = self.email_to_account_id(email).unwrap_or_else(|| email.to_string()); self.rate_limit_tracker.parse_from_error( &key, status, retry_after_header, error_body, None, &config.backoff_steps, // [NEW] 传入配置 ); } /// 检查账号是否在限流中 (支持模型级) pub async fn is_rate_limited(&self, account_id: &str, model: Option<&str>) -> bool { // [NEW] 检查熔断是否启用 let config = self.circuit_breaker_config.read().await; if !config.enabled { return false; } self.rate_limit_tracker.is_rate_limited(account_id, model) } /// [NEW] 检查账号是否在限流中 (同步版本，仅用于 Iterator) pub fn is_rate_limited_sync(&self, account_id: &str, model: Option<&str>) -> bool { // 同步版本无法读取 async RwLock，这里使用 blocking_read let config = self.circuit_breaker_config.blocking_read(); if !config.enabled { return false; } self.rate_limit_tracker.is_rate_limited(account_id, model) } /// 获取距离限流重置还有多少秒 #[allow(dead_code)] pub fn get_rate_limit_reset_seconds(&self, account_id: &str) -> Option { self.rate_limit_tracker.get_reset_seconds(account_id) } /// 清除过期的限流记录 #[allow(dead_code)] pub fn clean_expired_rate_limits(&self) { self.rate_limit_tracker.cleanup_expired(); } /// 【替代方案】通过 email 查找对应的 account_id /// 用于将 handlers 传入的 email 转换为 tracker 使用的 account_id fn email_to_account_id(&self, email: &str) -> Option { self.tokens .iter() .find(|entry| entry.value().email == email) .map(|entry| entry.value().account_id.clone()) } /// 清除指定账号的限流记录 pub fn clear_rate_limit(&self, account_id: &str) -> bool { self.rate_limit_tracker.clear(account_id) } /// 清除所有限流记录 pub fn clear_all_rate_limits(&self) { self.rate_limit_tracker.clear_all(); } /// 标记账号请求成功，重置连续失败计数 /// /// 在请求成功完成后调用，将该账号的失败计数归零， /// 下次失败时从最短的锁定时间开始（智能限流）。 pub fn mark_account_success(&self, account_id: &str) { self.rate_limit_tracker.mark_success(account_id); } /// 检查是否有可用的 Google 账号 /// /// 用于"仅兜底"模式的智能判断:当所有 Google 账号不可用时才使用外部提供商。 /// /// # 参数 /// - `quota_group`: 配额组("claude" 或 "gemini"),暂未使用但保留用于未来扩展 /// - `target_model`: 目标模型名称(已归一化),用于配额保护检查 /// /// # 返回值 /// - `true`: 至少有一个可用账号(未限流且未被配额保护) /// - `false`: 所有账号都不可用(被限流或被配额保护) /// /// # 示例 /// ```ignore /// // 检查是否有可用账号处理 claude-sonnet 请求 /// let has_available = token_manager.has_available_account("claude", "claude-sonnet-4-20250514").await; /// if !has_available { /// // 切换到外部提供商 /// } /// ``` pub async fn has_available_account(&self, _quota_group: &str, target_model: &str) -> bool { // 检查配额保护是否启用 let quota_protection_enabled = crate::modules::config::load_app_config() .map(|cfg| cfg.quota_protection.enabled) .unwrap_or(false); // 遍历所有账号,检查是否有可用的 for entry in self.tokens.iter() { let token = entry.value(); // 1. 检查是否被限流 if self.is_rate_limited(&token.account_id, None).await { tracing::debug!( "[Fallback Check] Account {} is rate-limited, skipping", token.email ); continue; } // 2. 检查是否被配额保护(如果启用) if quota_protection_enabled && token.protected_models.contains(target_model) { tracing::debug!( "[Fallback Check] Account {} is quota-protected for model {}, skipping", token.email, target_model ); continue; } // 找到至少一个可用账号 tracing::debug!( "[Fallback Check] Found available account: {} for model {}", token.email, target_model ); return true; } // 所有账号都不可用 tracing::info!( "[Fallback Check] No available Google accounts for model {}, fallback should be triggered", target_model ); false } /// 从账号文件获取配额刷新时间 /// /// 返回该账号最近的配额刷新时间字符串（ISO 8601 格式） /// /// # 参数 /// - `account_id`: 账号 ID（用于查找账号文件） pub fn get_quota_reset_time(&self, account_id: &str) -> Option { // 直接用 account_id 查找账号文件（文件名是 {account_id}.json） let account_path = self.data_dir.join("accounts").join(format!("{}.json", account_id)); let content = std::fs::read_to_string(&account_path).ok()?; let account: serde_json::Value = serde_json::from_str(&content).ok()?; // 获取 quota.models 中最早的 reset_time（最保守的锁定策略） account .get("quota") .and_then(|q| q.get("models")) .and_then(|m| m.as_array()) .and_then(|models| { models.iter() .filter_map(|m| m.get("reset_time").and_then(|r| r.as_str())) .filter(|s| !s.is_empty()) .min() .map(|s| s.to_string()) }) } /// 使用配额刷新时间精确锁定账号 /// /// 当 API 返回 429 但没有 quotaResetDelay 时,尝试使用账号的配额刷新时间 /// /// # 参数 /// - `account_id`: 账号 ID /// - `reason`: 限流原因（QuotaExhausted/ServerError 等） /// - `model`: 可选的模型名称,用于模型级别限流 pub fn set_precise_lockout(&self, account_id: &str, reason: crate::proxy::rate_limit::RateLimitReason, model: Option) -> bool { // [FIX #2209] 统一归一化模型名称 let normalized_model = model.as_deref().and_then(|m| crate::proxy::common::model_mapping::normalize_to_standard_id(m)); let model_to_lock = normalized_model.or(model); if let Some(reset_time_str) = self.get_quota_reset_time(account_id) { tracing::info!("找到账号 {} 的配额刷新时间: {}", account_id, reset_time_str); self.rate_limit_tracker.set_lockout_until_iso(account_id, &reset_time_str, reason, model_to_lock) } else { tracing::debug!("未找到账号 {} 的配额刷新时间,将使用默认退避策略", account_id); false } } /// 实时刷新配额并精确锁定账号 /// /// 当 429 发生时调用此方法: /// 1. 实时调用配额刷新 API 获取最新的 reset_time /// 2. 使用最新的 reset_time 精确锁定账号 /// 3. 如果获取失败,返回 false 让调用方使用回退策略 /// /// # 参数 /// - `model`: 可选的模型名称,用于模型级别限流 pub async fn fetch_and_lock_with_realtime_quota( &self, email: &str, reason: crate::proxy::rate_limit::RateLimitReason, model: Option, ) -> bool { // 1. 从 tokens 中获取该账号的 access_token 和 account_id // 同时获取 account_id，确保锁定 key 与检查 key 一致 let (access_token, account_id) = { let mut found: Option<(String, String)> = None; for entry in self.tokens.iter() { if entry.value().email == email { found = Some(( entry.value().access_token.clone(), entry.value().account_id.clone(), )); break; } } found }.unzip(); let (access_token, account_id) = match (access_token, account_id) { (Some(token), Some(id)) => (token, id), _ => { tracing::warn!("无法找到账号 {} 的 access_token,无法实时刷新配额", email); return false; } }; // 2. 调用配额刷新 API tracing::info!("账号 {} 正在实时刷新配额...", email); match crate::modules::quota::fetch_quota(&access_token, email, Some(&account_id)).await { Ok((quota_data, _project_id)) => { // 3. 从最新配额中提取 reset_time let earliest_reset = quota_data .models .iter() .filter_map(|m| { if !m.reset_time.is_empty() { Some(m.reset_time.as_str()) } else { None } }) .min(); if let Some(reset_time_str) = earliest_reset { tracing::info!( "账号 {} 实时配额刷新成功,reset_time: {}", email, reset_time_str ); // [FIX #2209] 统一归一化模型名称 let normalized_model = model.as_deref().and_then(|m| crate::proxy::common::model_mapping::normalize_to_standard_id(m)); let model_to_lock = normalized_model.or(model); // [FIX] 使用 account_id 作为 key，与 is_rate_limited 检查一致 self.rate_limit_tracker.set_lockout_until_iso(&account_id, reset_time_str, reason, model_to_lock) } else { tracing::warn!("账号 {} 配额刷新成功但未找到 reset_time", email); false } } Err(e) => { tracing::warn!("账号 {} 实时配额刷新失败: {:?}", email, e); false } } } /// 标记账号限流(异步版本,支持实时配额刷新) /// /// 三级降级策略: /// 1. 优先: API 返回 quotaResetDelay → 直接使用 /// 2. 次优: 实时刷新配额 → 获取最新 reset_time /// 3. 保底: 使用本地缓存配额 → 读取账号文件 /// 4. 兜底: 指数退避策略 → 默认锁定时间 /// /// # 参数 /// - `email`: 账号邮箱,用于查找账号信息 /// - `status`: HTTP 状态码（如 429、500 等） /// - `retry_after_header`: 可选的 Retry-After 响应头 /// - `error_body`: 错误响应体,用于解析 quotaResetDelay /// - `model`: 可选的模型名称,用于模型级别限流 pub async fn mark_rate_limited_async( &self, email: &str, status: u16, retry_after_header: Option<&str>, error_body: &str, model: Option<&str>, // 🆕 新增模型参数 ) { // [FIX #2209] 统一归一化模型名称，确保锁定 Key 与负载均衡检查 Key 一致 let normalized_model = model.and_then(|m| crate::proxy::common::model_mapping::normalize_to_standard_id(m)); let model_to_track = normalized_model.as_deref().or(model); // [NEW] 检查熔断是否启用 let config = self.circuit_breaker_config.read().await.clone(); if !config.enabled { return; } // [FIX] Convert email to account_id for consistent tracking let account_id = self.email_to_account_id(email).unwrap_or_else(|| email.to_string()); // 检查 API 是否返回了精确的重试时间 let has_explicit_retry_time = retry_after_header.is_some() || error_body.contains("quotaResetDelay"); if has_explicit_retry_time { // API 返回了精确时间(quotaResetDelay),直接使用,无需实时刷新 if let Some(m) = model { tracing::debug!( "账号 {} 的模型 {} 的 429 响应包含 quotaResetDelay,直接使用 API 返回的时间", account_id, m ); } else { tracing::debug!( "账号 {} 的 429 响应包含 quotaResetDelay,直接使用 API 返回的时间", account_id ); } self.rate_limit_tracker.parse_from_error( &account_id, status, retry_after_header, error_body, model_to_track.map(|s| s.to_string()), &config.backoff_steps, // [NEW] 传入配置 ); return; } // 确定限流原因 let reason = if error_body.to_lowercase().contains("model_capacity") { crate::proxy::rate_limit::RateLimitReason::ModelCapacityExhausted } else if error_body.to_lowercase().contains("exhausted") || error_body.to_lowercase().contains("quota") { crate::proxy::rate_limit::RateLimitReason::QuotaExhausted } else { crate::proxy::rate_limit::RateLimitReason::Unknown }; // API 未返回 quotaResetDelay,需要实时刷新配额获取精确锁定时间 if let Some(m) = model_to_track { tracing::info!( "账号 {} 的模型 {} 的 429 响应未包含 quotaResetDelay,尝试实时刷新配额...", account_id, m ); } else { tracing::info!( "账号 {} 的 429 响应未包含 quotaResetDelay,尝试实时刷新配额...", account_id ); } // [FIX] 传入 email 而不是 account_id，因为 fetch_and_lock_with_realtime_quota 期望 email if self.fetch_and_lock_with_realtime_quota(email, reason, model_to_track.map(|s| s.to_string())).await { tracing::info!("账号 {} 已使用实时配额精确锁定", email); return; } // 实时刷新失败,尝试使用本地缓存的配额刷新时间 if self.set_precise_lockout(&account_id, reason, model_to_track.map(|s| s.to_string())) { tracing::info!("账号 {} 已使用本地缓存配额锁定", account_id); return; } // 都失败了,回退到指数退避策略 tracing::warn!("账号 {} 无法获取配额刷新时间,使用指数退避策略", account_id); self.rate_limit_tracker.parse_from_error( &account_id, status, retry_after_header, error_body, model_to_track.map(|s| s.to_string()), &config.backoff_steps, // [NEW] 传入配置 ); } // ===== 调度配置相关方法 ===== /// 获取当前调度配置 pub async fn get_sticky_config(&self) -> StickySessionConfig { self.sticky_config.read().await.clone() } /// 更新调度配置 pub async fn update_sticky_config(&self, new_config: StickySessionConfig) { let mut config = self.sticky_config.write().await; *config = new_config; tracing::debug!("Scheduling configuration updated: {:?}", *config); } /// [NEW] 更新熔断器配置 pub async fn update_circuit_breaker_config(&self, config: crate::models::CircuitBreakerConfig) { let mut lock = self.circuit_breaker_config.write().await; *lock = config; tracing::debug!("Circuit breaker configuration updated"); } /// [NEW] 获取熔断器配置 pub async fn get_circuit_breaker_config(&self) -> crate::models::CircuitBreakerConfig { self.circuit_breaker_config.read().await.clone() } /// 清除特定会话的粘性映射 #[allow(dead_code)] pub fn clear_session_binding(&self, session_id: &str) { self.session_accounts.remove(session_id); } /// 清除所有会话的粘性映射 pub fn clear_all_sessions(&self) { self.session_accounts.clear(); } // ===== [FIX #820] 固定账号模式相关方法 ===== /// 设置优先使用的账号ID（固定账号模式） /// 传入 Some(account_id) 启用固定账号模式，传入 None 恢复轮询模式 pub async fn set_preferred_account(&self, account_id: Option) { let mut preferred = self.preferred_account_id.write().await; if let Some(ref id) = account_id { tracing::info!("🔒 [FIX #820] Fixed account mode enabled: {}", id); } else { tracing::info!("🔄 [FIX #820] Round-robin mode enabled (no preferred account)"); } *preferred = account_id; } /// 获取当前优先使用的账号ID pub async fn get_preferred_account(&self) -> Option { self.preferred_account_id.read().await.clone() } /// 使用 Authorization Code 交换 Refresh Token (Web OAuth) pub async fn exchange_code(&self, code: &str, redirect_uri: &str) -> Result { crate::modules::oauth::exchange_code(code, redirect_uri) .await .and_then(|t| { t.refresh_token .ok_or_else(|| "No refresh token returned by Google".to_string()) }) } /// 获取 OAuth URL (支持自定义 Redirect URI) pub fn get_oauth_url_with_redirect(&self, redirect_uri: &str, state: &str) -> String { crate::modules::oauth::get_auth_url(redirect_uri, state) } /// 获取用户信息 (Email 等) pub async fn get_user_info( &self, refresh_token: &str, ) -> Result { // 先获取 Access Token let token = crate::modules::oauth::refresh_access_token(refresh_token, None) .await .map_err(|e| format!("刷新 Access Token 失败: {}", e))?; crate::modules::oauth::get_user_info(&token.access_token, None).await } /// 添加新账号 (纯后端实现，不依赖 Tauri AppHandle) pub async fn add_account(&self, email: &str, refresh_token: &str) -> Result<(), String> { // 1. 获取 Access Token (验证 refresh_token 有效性) let token_info = crate::modules::oauth::refresh_access_token(refresh_token, None) .await .map_err(|e| format!("Invalid refresh token: {}", e))?; // 2. 获取项目 ID (Project ID) let project_id = crate::proxy::project_resolver::fetch_project_id(&token_info.access_token) .await .unwrap_or_else(|_| "bamboo-precept-lgxtn".to_string()); // Fallback // 3. 委托给 modules::account::add_account 处理 (包含文件写入、索引更新、锁) let email_clone = email.to_string(); let refresh_token_clone = refresh_token.to_string(); tokio::task::spawn_blocking(move || { let token_data = crate::models::TokenData::new( token_info.access_token, refresh_token_clone, token_info.expires_in, Some(email_clone.clone()), Some(project_id), None, // session_id true, ) .with_oauth_client_key(token_info.oauth_client_key.clone()); crate::modules::account::upsert_account(email_clone, None, token_data) }) .await .map_err(|e| format!("Task join error: {}", e))? .map_err(|e| format!("Failed to save account: {}", e))?; // 4. 重新加载 (更新内存) self.reload_all_accounts().await.map(|_| ()) } /// 记录请求成功，增加健康分 pub fn record_success(&self, account_id: &str) { self.health_scores .entry(account_id.to_string()) .and_modify(|s| *s = (*s + 0.05).min(1.0)) .or_insert(1.0); tracing::debug!("📈 Health score increased for account {}", account_id); } /// 记录请求失败，降低健康分 pub fn record_failure(&self, account_id: &str) { self.health_scores .entry(account_id.to_string()) .and_modify(|s| *s = (*s - 0.2).max(0.0)) .or_insert(0.8); tracing::warn!("📉 Health score decreased for account {}", account_id); } /// [NEW] 从账号配额信息中提取最近的刷新时间戳 /// /// Claude 模型（sonnet/opus）共用同一个刷新时间，只需取 claude 系列的 reset_time /// 返回 Unix 时间戳（秒），用于排序时比较 fn extract_earliest_reset_time(&self, account: &serde_json::Value) -> Option { let models = account .get("quota") .and_then(|q| q.get("models")) .and_then(|m| m.as_array())?; let mut earliest_ts: Option = None; for model in models { // 优先取 claude 系列的 reset_time（sonnet/opus 共用） let model_name = model.get("name").and_then(|n| n.as_str()).unwrap_or(""); if !model_name.contains("claude") { continue; } if let Some(reset_time_str) = model.get("reset_time").and_then(|r| r.as_str()) { if reset_time_str.is_empty() { continue; } // 解析 ISO 8601 时间字符串为时间戳 if let Ok(dt) = chrono::DateTime::parse_from_rfc3339(reset_time_str) { let ts = dt.timestamp(); if earliest_ts.is_none() || ts < earliest_ts.unwrap() { earliest_ts = Some(ts); } } } } // 如果没有 claude 模型的时间，尝试取任意模型的最近时间 if earliest_ts.is_none() { for model in models { if let Some(reset_time_str) = model.get("reset_time").and_then(|r| r.as_str()) { if reset_time_str.is_empty() { continue; } if let Ok(dt) = chrono::DateTime::parse_from_rfc3339(reset_time_str) { let ts = dt.timestamp(); if earliest_ts.is_none() || ts < earliest_ts.unwrap() { earliest_ts = Some(ts); } } } } } earliest_ts } /// 获取当前所有可用账号中收集到的官方下发的所有动态模型集合 pub fn get_all_collected_models(&self) -> std::collections::HashSet { let mut all_models = std::collections::HashSet::new(); for entry in self.tokens.iter() { let token = entry.value(); for model_id in token.model_quotas.keys() { all_models.insert(model_id.clone()); } } all_models } /// [NEW] 从指定账号的动态额度数据中获取特定模型的 max_output_tokens /// /// # 返回 /// - `Some(u64)`: 找到了动态限额数据 /// - `None`: 账号不存在或该模型无数据（调用方应继续查静态默认表） pub fn get_model_output_limit_for_account(&self, account_id: &str, model_name: &str) -> Option { self.tokens .get(account_id) .and_then(|token| token.model_limits.get(model_name).copied()) } /// Helper to find account ID by email pub fn get_account_id_by_email(&self, email: &str) -> Option { for entry in self.tokens.iter() { if entry.value().email == email { return Some(entry.key().clone()); } } None } /// Set validation blocked status for an account (internal) pub async fn set_validation_block(&self, account_id: &str, block_until: i64, reason: &str) -> Result<(), String> { // 1. Update memory if let Some(mut token) = self.tokens.get_mut(account_id) { token.validation_blocked = true; token.validation_blocked_until = block_until; } // 2. Persist to disk let path = self.data_dir.join("accounts").join(format!("{}.json", account_id)); if !path.exists() { return Err(format!("Account file not found: {:?}", path)); } let content = std::fs::read_to_string(&path) .map_err(|e| format!("Failed to read account file: {}", e))?; let mut account: serde_json::Value = serde_json::from_str(&content) .map_err(|e| format!("Failed to parse account JSON: {}", e))?; account["validation_blocked"] = serde_json::Value::Bool(true); account["validation_blocked_until"] = serde_json::Value::Number(serde_json::Number::from(block_until)); account["validation_blocked_reason"] = serde_json::Value::String(reason.to_string()); // [NEW] 尝试从消息中提取验证链接 (#1522) let extracted_url = if let Ok(parsed_json) = serde_json::from_str::(reason) { // 尝试从特定的 Google RPC error 结构中取 let mut url = None; if let Some(details) = parsed_json.pointer("/error/details") { if let Some(arr) = details.as_array() { for detail in arr { if let Some(meta) = detail.get("metadata") { if let Some(v_url) = meta.get("validation_url").and_then(|v| v.as_str()) { url = Some(v_url.to_string()); break; } if let Some(a_url) = meta.get("appeal_url").and_then(|v| v.as_str()) { url = Some(a_url.to_string()); break; } } } } } url } else { // 回退方案：通过更严格的正则及反序列化解码可能的 \u0026 let url_regex = regex::Regex::new(r#"https://[^\s"'\\]+"#).unwrap(); url_regex.find(reason).map(|m| { let raw_url = m.as_str().to_string(); raw_url.replace("\\u0026", "&") }) }; if let Some(url) = extracted_url { account["validation_url"] = serde_json::Value::String(url.clone()); if let Some(mut token) = self.tokens.get_mut(account_id) { token.validation_url = Some(url); } } // Clear sticky session if blocked self.session_accounts.retain(|_, v| *v != account_id); let json_str = serde_json::to_string_pretty(&account) .map_err(|e| format!("Failed to serialize account JSON: {}", e))?; std::fs::write(&path, json_str) .map_err(|e| format!("Failed to write account file: {}", e))?; tracing::info!( "🚫 Account {} validation blocked until {} (reason: {})", account_id, block_until, reason ); Ok(()) } /// Public method to set validation block (called from handlers) pub async fn set_validation_block_public(&self, account_id: &str, block_until: i64, reason: &str) -> Result<(), String> { self.set_validation_block(account_id, block_until, reason).await } /// Set is_forbidden status for an account (called when proxy encounters 403) pub async fn set_forbidden(&self, account_id: &str, reason: &str) -> Result<(), String> { // [FIX] 调用封装好的模块函数，确保线程安全地更新账号文件和索引 crate::modules::account::mark_account_forbidden(account_id, reason)?; // Clear sticky session if forbidden self.session_accounts.retain(|_, v| *v != account_id); // [FIX] 从内存池中移除账号，避免重试时再次选中 self.remove_account(account_id); tracing::warn!( "🚫 Account {} marked as forbidden (403): {}", account_id, truncate_reason(reason, 1000) ); Ok(()) } } /// 截断过长的原因字符串 fn truncate_reason(reason: &str, max_len: usize) -> String { if reason.len() <= max_len { reason.to_string() } else { // [FIX] 确保字符截断在有效边界，防止 panic let end = reason .char_indices() .map(|(i, _)| i) .filter(|&i| i <= max_len - 3) .last() .unwrap_or(0); format!("{}...", &reason[..end]) } } #[cfg(test)] mod tests { use super::*; use std::cmp::Ordering; #[tokio::test] async fn test_reload_account_purges_cache_when_account_becomes_proxy_disabled() { let tmp_root = std::env::temp_dir().join(format!( "antigravity-token-manager-test-{}", uuid::Uuid::new_v4() )); let accounts_dir = tmp_root.join("accounts"); std::fs::create_dir_all(&accounts_dir).unwrap(); let account_id = "acc1"; let email = "a@test.com"; let now = chrono::Utc::now().timestamp(); let account_path = accounts_dir.join(format!("{}.json", account_id)); let account_json = serde_json::json!({ "id": account_id, "email": email, "token": { "access_token": "atk", "refresh_token": "rtk", "expires_in": 3600, "expiry_timestamp": now + 3600 }, "disabled": false, "proxy_disabled": false, "created_at": now, "last_used": now }); std::fs::write(&account_path, serde_json::to_string_pretty(&account_json).unwrap()).unwrap(); let manager = TokenManager::new(tmp_root.clone()); manager.load_accounts().await.unwrap(); assert!(manager.tokens.get(account_id).is_some()); // Prime extra caches to ensure remove_account() is really called. manager .session_accounts .insert("sid1".to_string(), account_id.to_string()); { let mut preferred = manager.preferred_account_id.write().await; *preferred = Some(account_id.to_string()); } // Mark account as proxy-disabled on disk (manual disable). let mut disabled_json = account_json.clone(); disabled_json["proxy_disabled"] = serde_json::Value::Bool(true); disabled_json["proxy_disabled_reason"] = serde_json::Value::String("manual".to_string()); disabled_json["proxy_disabled_at"] = serde_json::Value::Number(now.into()); std::fs::write(&account_path, serde_json::to_string_pretty(&disabled_json).unwrap()).unwrap(); manager.reload_account(account_id).await.unwrap(); assert!(manager.tokens.get(account_id).is_none()); assert!(manager.session_accounts.get("sid1").is_none()); assert!(manager.preferred_account_id.read().await.is_none()); let _ = std::fs::remove_dir_all(&tmp_root); } #[tokio::test] async fn test_fixed_account_mode_skips_preferred_when_disabled_on_disk_without_reload() { let tmp_root = std::env::temp_dir().join(format!( "antigravity-token-manager-test-fixed-mode-{}", uuid::Uuid::new_v4() )); let accounts_dir = tmp_root.join("accounts"); std::fs::create_dir_all(&accounts_dir).unwrap(); let now = chrono::Utc::now().timestamp(); let write_account = |id: &str, email: &str, proxy_disabled: bool| { let account_path = accounts_dir.join(format!("{}.json", id)); let json = serde_json::json!({ "id": id, "email": email, "token": { "access_token": format!("atk-{}", id), "refresh_token": format!("rtk-{}", id), "expires_in": 3600, "expiry_timestamp": now + 3600, "project_id": format!("pid-{}", id) }, "disabled": false, "proxy_disabled": proxy_disabled, "proxy_disabled_reason": if proxy_disabled { "manual" } else { "" }, "created_at": now, "last_used": now }); std::fs::write(&account_path, serde_json::to_string_pretty(&json).unwrap()).unwrap(); }; // Two accounts in pool. write_account("acc1", "a@test.com", false); write_account("acc2", "b@test.com", false); let manager = TokenManager::new(tmp_root.clone()); manager.load_accounts().await.unwrap(); // Enable fixed account mode for acc1. manager.set_preferred_account(Some("acc1".to_string())).await; // Disable acc1 on disk WITHOUT reloading the in-memory pool (simulates stale cache). write_account("acc1", "a@test.com", true); let (_token, _project_id, email, account_id, _wait_ms) = manager .get_token("gemini", false, Some("sid1"), "gemini-1.5-flash") .await .unwrap(); // Should fall back to another account instead of using the disabled preferred one. assert_eq!(account_id, "acc2"); assert_eq!(email, "b@test.com"); assert!(manager.tokens.get("acc1").is_none()); assert!(manager.get_preferred_account().await.is_none()); let _ = std::fs::remove_dir_all(&tmp_root); } #[tokio::test] async fn test_sticky_session_skips_bound_account_when_disabled_on_disk_without_reload() { let tmp_root = std::env::temp_dir().join(format!( "antigravity-token-manager-test-sticky-disabled-{}", uuid::Uuid::new_v4() )); let accounts_dir = tmp_root.join("accounts"); std::fs::create_dir_all(&accounts_dir).unwrap(); let now = chrono::Utc::now().timestamp(); let write_account = |id: &str, email: &str, percentage: i64, proxy_disabled: bool| { let account_path = accounts_dir.join(format!("{}.json", id)); let json = serde_json::json!({ "id": id, "email": email, "token": { "access_token": format!("atk-{}", id), "refresh_token": format!("rtk-{}", id), "expires_in": 3600, "expiry_timestamp": now + 3600, "project_id": format!("pid-{}", id) }, "quota": { "models": [ { "name": "gemini-1.5-flash", "percentage": percentage } ] }, "disabled": false, "proxy_disabled": proxy_disabled, "proxy_disabled_reason": if proxy_disabled { "manual" } else { "" }, "created_at": now, "last_used": now }); std::fs::write(&account_path, serde_json::to_string_pretty(&json).unwrap()).unwrap(); }; // Two accounts in pool. acc1 has higher quota -> should be selected and bound first. write_account("acc1", "a@test.com", 90, false); write_account("acc2", "b@test.com", 10, false); let manager = TokenManager::new(tmp_root.clone()); manager.load_accounts().await.unwrap(); // Prime: first request should bind the session to acc1. let (_token, _project_id, _email, account_id, _wait_ms) = manager .get_token("gemini", false, Some("sid1"), "gemini-1.5-flash") .await .unwrap(); assert_eq!(account_id, "acc1"); assert_eq!( manager.session_accounts.get("sid1").map(|v| v.clone()), Some("acc1".to_string()) ); // Disable acc1 on disk WITHOUT reloading the in-memory pool (simulates stale cache). write_account("acc1", "a@test.com", 90, true); let (_token, _project_id, email, account_id, _wait_ms) = manager .get_token("gemini", false, Some("sid1"), "gemini-1.5-flash") .await .unwrap(); // Should fall back to another account instead of reusing the disabled bound one. assert_eq!(account_id, "acc2"); assert_eq!(email, "b@test.com"); assert!(manager.tokens.get("acc1").is_none()); assert_ne!( manager.session_accounts.get("sid1").map(|v| v.clone()), Some("acc1".to_string()) ); let _ = std::fs::remove_dir_all(&tmp_root); } /// 创建测试用的 ProxyToken fn create_test_token( email: &str, tier: Option<&str>, health_score: f32, reset_time: Option, remaining_quota: Option, ) -> ProxyToken { ProxyToken { account_id: email.to_string(), access_token: "test_token".to_string(), refresh_token: "test_refresh".to_string(), expires_in: 3600, timestamp: chrono::Utc::now().timestamp() + 3600, email: email.to_string(), account_path: PathBuf::from("/tmp/test"), project_id: None, subscription_tier: tier.map(|s| s.to_string()), remaining_quota, protected_models: HashSet::new(), health_score, reset_time, validation_blocked: false, validation_blocked_until: 0, validation_url: None, model_quotas: HashMap::new(), model_limits: HashMap::new(), } } /// 测试排序比较函数（与 get_token_internal 中的逻辑一致） fn compare_tokens(a: &ProxyToken, b: &ProxyToken) -> Ordering { const RESET_TIME_THRESHOLD_SECS: i64 = 600; // 10 分钟阈值 let tier_priority = |tier: &Option| { let t = tier.as_deref().unwrap_or("").to_lowercase(); if t.contains("ultra") { 0 } else if t.contains("pro") { 1 } else if t.contains("free") { 2 } else { 3 } }; // First: compare by subscription tier let tier_cmp = tier_priority(&a.subscription_tier).cmp(&tier_priority(&b.subscription_tier)); if tier_cmp != Ordering::Equal { return tier_cmp; } // Second: compare by health score (higher is better) let health_cmp = b.health_score.partial_cmp(&a.health_score).unwrap_or(Ordering::Equal); if health_cmp != Ordering::Equal { return health_cmp; } // Third: compare by reset time (earlier/closer is better) let reset_a = a.reset_time.unwrap_or(i64::MAX); let reset_b = b.reset_time.unwrap_or(i64::MAX); let reset_diff = (reset_a - reset_b).abs(); if reset_diff >= RESET_TIME_THRESHOLD_SECS { let reset_cmp = reset_a.cmp(&reset_b); if reset_cmp != Ordering::Equal { return reset_cmp; } } // Fourth: compare by remaining quota percentage (higher is better) let quota_a = a.remaining_quota.unwrap_or(0); let quota_b = b.remaining_quota.unwrap_or(0); quota_b.cmp("a_a) } #[test] fn test_sorting_tier_priority() { // ULTRA > PRO > FREE let ultra = create_test_token("ultra@test.com", Some("ULTRA"), 1.0, None, Some(50)); let pro = create_test_token("pro@test.com", Some("PRO"), 1.0, None, Some(50)); let free = create_test_token("free@test.com", Some("FREE"), 1.0, None, Some(50)); assert_eq!(compare_tokens(&ultra, &pro), Ordering::Less); assert_eq!(compare_tokens(&pro, &free), Ordering::Less); assert_eq!(compare_tokens(&ultra, &free), Ordering::Less); assert_eq!(compare_tokens(&free, &ultra), Ordering::Greater); } #[test] fn test_sorting_health_score_priority() { // 同等级下，健康分高的优先 let high_health = create_test_token("high@test.com", Some("PRO"), 1.0, None, Some(50)); let low_health = create_test_token("low@test.com", Some("PRO"), 0.5, None, Some(50)); assert_eq!(compare_tokens(&high_health, &low_health), Ordering::Less); assert_eq!(compare_tokens(&low_health, &high_health), Ordering::Greater); } #[test] fn test_sorting_reset_time_priority() { let now = chrono::Utc::now().timestamp(); // 刷新时间更近（30分钟后）的优先于更远（5小时后）的 let soon_reset = create_test_token("soon@test.com", Some("PRO"), 1.0, Some(now + 1800), Some(50)); // 30分钟后 let late_reset = create_test_token("late@test.com", Some("PRO"), 1.0, Some(now + 18000), Some(50)); // 5小时后 assert_eq!(compare_tokens(&soon_reset, &late_reset), Ordering::Less); assert_eq!(compare_tokens(&late_reset, &soon_reset), Ordering::Greater); } #[test] fn test_sorting_reset_time_threshold() { let now = chrono::Utc::now().timestamp(); // 差异小于10分钟（600秒）视为相同优先级，此时按配额排序 let reset_a = create_test_token("a@test.com", Some("PRO"), 1.0, Some(now + 1800), Some(80)); // 30分钟后, 80%配额 let reset_b = create_test_token("b@test.com", Some("PRO"), 1.0, Some(now + 2100), Some(50)); // 35分钟后, 50%配额 // 差5分钟 < 10分钟阈值，视为相同，按配额排序（80% > 50%） assert_eq!(compare_tokens(&reset_a, &reset_b), Ordering::Less); } #[test] fn test_sorting_reset_time_beyond_threshold() { let now = chrono::Utc::now().timestamp(); // 差异超过10分钟，按刷新时间排序（忽略配额） let soon_low_quota = create_test_token("soon@test.com", Some("PRO"), 1.0, Some(now + 1800), Some(20)); // 30分钟后, 20% let late_high_quota = create_test_token("late@test.com", Some("PRO"), 1.0, Some(now + 18000), Some(90)); // 5小时后, 90% // 差4.5小时 > 10分钟，刷新时间优先，30分钟 < 5小时 assert_eq!(compare_tokens(&soon_low_quota, &late_high_quota), Ordering::Less); } #[test] fn test_sorting_quota_fallback() { // 其他条件相同时，配额高的优先 let high_quota = create_test_token("high@test.com", Some("PRO"), 1.0, None, Some(80)); let low_quota = create_test_token("low@test.com", Some("PRO"), 1.0, None, Some(20)); assert_eq!(compare_tokens(&high_quota, &low_quota), Ordering::Less); assert_eq!(compare_tokens(&low_quota, &high_quota), Ordering::Greater); } #[test] fn test_sorting_missing_reset_time() { let now = chrono::Utc::now().timestamp(); // 没有 reset_time 的账号应该排在有 reset_time 的后面 let with_reset = create_test_token("with@test.com", Some("PRO"), 1.0, Some(now + 1800), Some(50)); let without_reset = create_test_token("without@test.com", Some("PRO"), 1.0, None, Some(50)); assert_eq!(compare_tokens(&with_reset, &without_reset), Ordering::Less); } #[test] fn test_full_sorting_integration() { let now = chrono::Utc::now().timestamp(); let mut tokens = vec![ create_test_token("free_high@test.com", Some("FREE"), 1.0, Some(now + 1800), Some(90)), create_test_token("pro_low_health@test.com", Some("PRO"), 0.5, Some(now + 1800), Some(90)), create_test_token("pro_soon@test.com", Some("PRO"), 1.0, Some(now + 1800), Some(50)), // 30分钟后 create_test_token("pro_late@test.com", Some("PRO"), 1.0, Some(now + 18000), Some(90)), // 5小时后 create_test_token("ultra@test.com", Some("ULTRA"), 1.0, Some(now + 36000), Some(10)), ]; tokens.sort_by(compare_tokens); // 预期顺序: // 1. ULTRA (最高等级，即使刷新时间最远) // 2. PRO + 高健康分 + 30分钟后刷新 // 3. PRO + 高健康分 + 5小时后刷新 // 4. PRO + 低健康分 // 5. FREE (最低等级，即使配额最高) assert_eq!(tokens[0].email, "ultra@test.com"); assert_eq!(tokens[1].email, "pro_soon@test.com"); assert_eq!(tokens[2].email, "pro_late@test.com"); assert_eq!(tokens[3].email, "pro_low_health@test.com"); assert_eq!(tokens[4].email, "free_high@test.com"); } #[test] fn test_realistic_scenario() { // 模拟用户描述的场景: // a 账号 claude 4h55m 后刷新 // b 账号 claude 31m 后刷新 // 应该优先使用 b（31分钟后刷新） let now = chrono::Utc::now().timestamp(); let account_a = create_test_token("a@test.com", Some("PRO"), 1.0, Some(now + 295 * 60), Some(80)); // 4h55m let account_b = create_test_token("b@test.com", Some("PRO"), 1.0, Some(now + 31 * 60), Some(30)); // 31m // b 应该排在 a 前面（刷新时间更近） assert_eq!(compare_tokens(&account_b, &account_a), Ordering::Less); let mut tokens = vec![account_a.clone(), account_b.clone()]; tokens.sort_by(compare_tokens); assert_eq!(tokens[0].email, "b@test.com"); assert_eq!(tokens[1].email, "a@test.com"); } #[test] fn test_extract_earliest_reset_time() { let manager = TokenManager::new(PathBuf::from("/tmp/test")); // 测试包含 claude 模型的 reset_time 提取 let account_with_claude = serde_json::json!({ "quota": { "models": [ {"name": "gemini-flash", "reset_time": "2025-01-31T10:00:00Z"}, {"name": "claude-sonnet", "reset_time": "2025-01-31T08:00:00Z"}, {"name": "claude-opus", "reset_time": "2025-01-31T08:00:00Z"} ] } }); let result = manager.extract_earliest_reset_time(&account_with_claude); assert!(result.is_some()); // 应该返回 claude 的时间（08:00）而不是 gemini 的（10:00） let expected_ts = chrono::DateTime::parse_from_rfc3339("2025-01-31T08:00:00Z") .unwrap() .timestamp(); assert_eq!(result.unwrap(), expected_ts); } #[test] fn test_extract_reset_time_no_claude() { let manager = TokenManager::new(PathBuf::from("/tmp/test")); // 没有 claude 模型时，应该取任意模型的最近时间 let account_no_claude = serde_json::json!({ "quota": { "models": [ {"name": "gemini-flash", "reset_time": "2025-01-31T10:00:00Z"}, {"name": "gemini-pro", "reset_time": "2025-01-31T08:00:00Z"} ] } }); let result = manager.extract_earliest_reset_time(&account_no_claude); assert!(result.is_some()); let expected_ts = chrono::DateTime::parse_from_rfc3339("2025-01-31T08:00:00Z") .unwrap() .timestamp(); assert_eq!(result.unwrap(), expected_ts); } #[test] fn test_extract_reset_time_missing_quota() { let manager = TokenManager::new(PathBuf::from("/tmp/test")); // 没有 quota 字段时应返回 None let account_no_quota = serde_json::json!({ "email": "test@test.com" }); assert!(manager.extract_earliest_reset_time(&account_no_quota).is_none()); } // ===== P2C 算法测试 ===== /// 创建带 protected_models 的测试 Token fn create_test_token_with_protected( email: &str, remaining_quota: Option, protected_models: HashSet, ) -> ProxyToken { ProxyToken { account_id: email.to_string(), access_token: "test_token".to_string(), refresh_token: "test_refresh".to_string(), expires_in: 3600, timestamp: chrono::Utc::now().timestamp() + 3600, email: email.to_string(), account_path: PathBuf::from("/tmp/test"), project_id: None, subscription_tier: Some("PRO".to_string()), remaining_quota, protected_models, health_score: 1.0, reset_time: None, validation_blocked: false, validation_blocked_until: 0, validation_url: None, model_quotas: HashMap::new(), model_limits: HashMap::new(), } } #[test] fn test_p2c_selects_higher_quota() { // P2C 应选择配额更高的账号 let manager = TokenManager::new(PathBuf::from("/tmp/test")); let low_quota = create_test_token("low@test.com", Some("PRO"), 1.0, None, Some(20)); let high_quota = create_test_token("high@test.com", Some("PRO"), 1.0, None, Some(80)); let candidates = vec![low_quota, high_quota]; let attempted: HashSet = HashSet::new(); // 运行多次确保选择高配额账号 for _ in 0..10 { let result = manager.select_with_p2c(&candidates, &attempted, "claude-sonnet", false); assert!(result.is_some()); // P2C 从两个候选中选择配额更高的 // 由于只有两个候选，应该总是选择 high_quota assert_eq!(result.unwrap().email, "high@test.com"); } } #[test] fn test_p2c_skips_attempted() { // P2C 应跳过已尝试的账号 let manager = TokenManager::new(PathBuf::from("/tmp/test")); let token_a = create_test_token("a@test.com", Some("PRO"), 1.0, None, Some(80)); let token_b = create_test_token("b@test.com", Some("PRO"), 1.0, None, Some(50)); let candidates = vec![token_a, token_b]; let mut attempted: HashSet = HashSet::new(); attempted.insert("a@test.com".to_string()); let result = manager.select_with_p2c(&candidates, &attempted, "claude-sonnet", false); assert!(result.is_some()); assert_eq!(result.unwrap().email, "b@test.com"); } #[test] fn test_p2c_skips_protected_models() { // P2C 应跳过对目标模型有保护的账号 (quota_protection_enabled = true) let manager = TokenManager::new(PathBuf::from("/tmp/test")); let mut protected = HashSet::new(); protected.insert("claude-sonnet".to_string()); let protected_account = create_test_token_with_protected("protected@test.com", Some(90), protected); let normal_account = create_test_token_with_protected("normal@test.com", Some(50), HashSet::new()); let candidates = vec![protected_account, normal_account]; let attempted: HashSet = HashSet::new(); let result = manager.select_with_p2c(&candidates, &attempted, "claude-sonnet", true); assert!(result.is_some()); assert_eq!(result.unwrap().email, "normal@test.com"); } #[test] fn test_p2c_single_candidate() { // 单候选时直接返回 let manager = TokenManager::new(PathBuf::from("/tmp/test")); let token = create_test_token("single@test.com", Some("PRO"), 1.0, None, Some(50)); let candidates = vec![token]; let attempted: HashSet = HashSet::new(); let result = manager.select_with_p2c(&candidates, &attempted, "claude-sonnet", false); assert!(result.is_some()); assert_eq!(result.unwrap().email, "single@test.com"); } #[test] fn test_p2c_empty_candidates() { // 空候选返回 None let manager = TokenManager::new(PathBuf::from("/tmp/test")); let candidates: Vec = vec![]; let attempted: HashSet = HashSet::new(); let result = manager.select_with_p2c(&candidates, &attempted, "claude-sonnet", false); assert!(result.is_none()); } #[test] fn test_p2c_all_attempted() { // 所有账号都已尝试时返回 None let manager = TokenManager::new(PathBuf::from("/tmp/test")); let token_a = create_test_token("a@test.com", Some("PRO"), 1.0, None, Some(80)); let token_b = create_test_token("b@test.com", Some("PRO"), 1.0, None, Some(50)); let candidates = vec![token_a, token_b]; let mut attempted: HashSet = HashSet::new(); attempted.insert("a@test.com".to_string()); attempted.insert("b@test.com".to_string()); let result = manager.select_with_p2c(&candidates, &attempted, "claude-sonnet", false); assert!(result.is_none()); } // ===== Ultra 优先逻辑测试 ===== /// 测试 is_ultra_required_model 辅助函数 #[test] fn test_is_ultra_required_model() { // 需要 Ultra 账号的高端模型 const ULTRA_REQUIRED_MODELS: &[&str] = &[ "claude-opus-4-6", "claude-opus-4-5", "opus", ]; fn is_ultra_required_model(model: &str) -> bool { let lower = model.to_lowercase(); ULTRA_REQUIRED_MODELS.iter().any(|m| lower.contains(m)) } // 应该识别为高端模型 assert!(is_ultra_required_model("claude-opus-4-6")); assert!(is_ultra_required_model("claude-opus-4-5")); assert!(is_ultra_required_model("Claude-Opus-4-6")); // 大小写不敏感 assert!(is_ultra_required_model("CLAUDE-OPUS-4-5")); // 大小写不敏感 assert!(is_ultra_required_model("opus")); // 通配匹配 assert!(is_ultra_required_model("opus-4-6-latest")); assert!(is_ultra_required_model("models/claude-opus-4-6")); // 应该识别为普通模型 assert!(!is_ultra_required_model("claude-sonnet-4-5")); assert!(!is_ultra_required_model("claude-sonnet")); assert!(!is_ultra_required_model("gemini-1.5-flash")); assert!(!is_ultra_required_model("gemini-2.0-pro")); assert!(!is_ultra_required_model("claude-haiku")); } /// 测试高端模型排序：Ultra 账号优先于 Pro 账号（即使 Pro 配额更高） #[test] fn test_ultra_priority_for_high_end_models() { const RESET_TIME_THRESHOLD_SECS: i64 = 600; // 模拟高端模型排序逻辑 fn compare_tokens_for_model(a: &ProxyToken, b: &ProxyToken, target_model: &str) -> Ordering { const ULTRA_REQUIRED_MODELS: &[&str] = &["claude-opus-4-6", "claude-opus-4-5", "opus"]; let requires_ultra = { let lower = target_model.to_lowercase(); ULTRA_REQUIRED_MODELS.iter().any(|m| lower.contains(m)) }; let tier_priority = |tier: &Option| { let t = tier.as_deref().unwrap_or("").to_lowercase(); if t.contains("ultra") { 0 } else if t.contains("pro") { 1 } else if t.contains("free") { 2 } else { 3 } }; // Priority 0: 高端模型时，订阅等级优先 if requires_ultra { let tier_cmp = tier_priority(&a.subscription_tier) .cmp(&tier_priority(&b.subscription_tier)); if tier_cmp != Ordering::Equal { return tier_cmp; } } // Priority 1: Quota (higher is better) let quota_a = a.remaining_quota.unwrap_or(0); let quota_b = b.remaining_quota.unwrap_or(0); let quota_cmp = quota_b.cmp("a_a); if quota_cmp != Ordering::Equal { return quota_cmp; } // Priority 2: Health score let health_cmp = b.health_score.partial_cmp(&a.health_score) .unwrap_or(Ordering::Equal); if health_cmp != Ordering::Equal { return health_cmp; } // Priority 3: Tier (for non-high-end models) if !requires_ultra { let tier_cmp = tier_priority(&a.subscription_tier) .cmp(&tier_priority(&b.subscription_tier)); if tier_cmp != Ordering::Equal { return tier_cmp; } } Ordering::Equal } // 创建测试账号：Ultra 低配额 vs Pro 高配额 let ultra_low_quota = create_test_token("ultra@test.com", Some("ULTRA"), 1.0, None, Some(20)); let pro_high_quota = create_test_token("pro@test.com", Some("PRO"), 1.0, None, Some(80)); // 高端模型 (Opus 4.6): Ultra 应该优先，即使配额低 assert_eq!( compare_tokens_for_model(&ultra_low_quota, &pro_high_quota, "claude-opus-4-6"), Ordering::Less, // Ultra 排在前面 "Opus 4.6 should prefer Ultra account over Pro even with lower quota" ); // 高端模型 (Opus 4.5): Ultra 应该优先 assert_eq!( compare_tokens_for_model(&ultra_low_quota, &pro_high_quota, "claude-opus-4-5"), Ordering::Less, "Opus 4.5 should prefer Ultra account over Pro" ); // 普通模型 (Sonnet): 高配额 Pro 应该优先 assert_eq!( compare_tokens_for_model(&ultra_low_quota, &pro_high_quota, "claude-sonnet-4-5"), Ordering::Greater, // Pro (高配额) 排在前面 "Sonnet should prefer high-quota Pro over low-quota Ultra" ); // 普通模型 (Flash): 高配额 Pro 应该优先 assert_eq!( compare_tokens_for_model(&ultra_low_quota, &pro_high_quota, "gemini-1.5-flash"), Ordering::Greater, "Flash should prefer high-quota Pro over low-quota Ultra" ); } /// 测试排序：同为 Ultra 时按配额排序 #[test] fn test_ultra_accounts_sorted_by_quota() { fn compare_tokens_for_model(a: &ProxyToken, b: &ProxyToken, target_model: &str) -> Ordering { const ULTRA_REQUIRED_MODELS: &[&str] = &["claude-opus-4-6", "claude-opus-4-5", "opus"]; let requires_ultra = { let lower = target_model.to_lowercase(); ULTRA_REQUIRED_MODELS.iter().any(|m| lower.contains(m)) }; let tier_priority = |tier: &Option| { let t = tier.as_deref().unwrap_or("").to_lowercase(); if t.contains("ultra") { 0 } else if t.contains("pro") { 1 } else if t.contains("free") { 2 } else { 3 } }; if requires_ultra { let tier_cmp = tier_priority(&a.subscription_tier) .cmp(&tier_priority(&b.subscription_tier)); if tier_cmp != Ordering::Equal { return tier_cmp; } } let quota_a = a.remaining_quota.unwrap_or(0); let quota_b = b.remaining_quota.unwrap_or(0); quota_b.cmp("a_a) } let ultra_high = create_test_token("ultra_high@test.com", Some("ULTRA"), 1.0, None, Some(80)); let ultra_low = create_test_token("ultra_low@test.com", Some("ULTRA"), 1.0, None, Some(20)); // Opus 4.6: 同为 Ultra，高配额优先 assert_eq!( compare_tokens_for_model(&ultra_high, &ultra_low, "claude-opus-4-6"), Ordering::Less, // ultra_high 排在前面 "Among Ultra accounts, higher quota should come first" ); } /// 测试完整排序场景：混合账号池 #[test] fn test_full_sorting_mixed_accounts() { fn sort_tokens_for_model(tokens: &mut Vec, target_model: &str) { const ULTRA_REQUIRED_MODELS: &[&str] = &["claude-opus-4-6", "claude-opus-4-5", "opus"]; let requires_ultra = { let lower = target_model.to_lowercase(); ULTRA_REQUIRED_MODELS.iter().any(|m| lower.contains(m)) }; tokens.sort_by(|a, b| { let tier_priority = |tier: &Option| { let t = tier.as_deref().unwrap_or("").to_lowercase(); if t.contains("ultra") { 0 } else if t.contains("pro") { 1 } else if t.contains("free") { 2 } else { 3 } }; if requires_ultra { let tier_cmp = tier_priority(&a.subscription_tier) .cmp(&tier_priority(&b.subscription_tier)); if tier_cmp != Ordering::Equal { return tier_cmp; } } let quota_a = a.remaining_quota.unwrap_or(0); let quota_b = b.remaining_quota.unwrap_or(0); let quota_cmp = quota_b.cmp("a_a); if quota_cmp != Ordering::Equal { return quota_cmp; } if !requires_ultra { let tier_cmp = tier_priority(&a.subscription_tier) .cmp(&tier_priority(&b.subscription_tier)); if tier_cmp != Ordering::Equal { return tier_cmp; } } Ordering::Equal }); } // 创建混合账号池 let ultra_high = create_test_token("ultra_high@test.com", Some("ULTRA"), 1.0, None, Some(80)); let ultra_low = create_test_token("ultra_low@test.com", Some("ULTRA"), 1.0, None, Some(20)); let pro_high = create_test_token("pro_high@test.com", Some("PRO"), 1.0, None, Some(90)); let pro_low = create_test_token("pro_low@test.com", Some("PRO"), 1.0, None, Some(30)); let free = create_test_token("free@test.com", Some("FREE"), 1.0, None, Some(100)); // 高端模型 (Opus 4.6) 排序 let mut tokens_opus = vec![pro_high.clone(), free.clone(), ultra_low.clone(), pro_low.clone(), ultra_high.clone()]; sort_tokens_for_model(&mut tokens_opus, "claude-opus-4-6"); let emails_opus: Vec<&str> = tokens_opus.iter().map(|t| t.email.as_str()).collect(); // 期望顺序: Ultra(高配额) > Ultra(低配额) > Pro(高配额) > Pro(低配额) > Free assert_eq!( emails_opus, vec!["ultra_high@test.com", "ultra_low@test.com", "pro_high@test.com", "pro_low@test.com", "free@test.com"], "Opus 4.6 should sort Ultra first, then by quota within each tier" ); // 普通模型 (Sonnet) 排序 let mut tokens_sonnet = vec![pro_high.clone(), free.clone(), ultra_low.clone(), pro_low.clone(), ultra_high.clone()]; sort_tokens_for_model(&mut tokens_sonnet, "claude-sonnet-4-5"); let emails_sonnet: Vec<&str> = tokens_sonnet.iter().map(|t| t.email.as_str()).collect(); // 期望顺序: Free(100%) > Pro(90%) > Ultra(80%) > Pro(30%) > Ultra(20%) - 按配额优先 assert_eq!( emails_sonnet, vec!["free@test.com", "pro_high@test.com", "ultra_high@test.com", "pro_low@test.com", "ultra_low@test.com"], "Sonnet should sort by quota first, then by tier as tiebreaker" ); } }