File size: 7,699 Bytes
e054d0c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 |
"""
本地进度管理适配器
基于内存队列实现的进度管理适配器,适用于本地单实例场景。
"""
import asyncio
from collections import defaultdict
from datetime import datetime
from typing import Any, AsyncGenerator, Dict, List, Optional
from ..base import ProgressAdapter
class LocalProgressAdapter(ProgressAdapter):
"""
本地内存进度管理适配器
特点:
1. 使用内存字典存储最新进度
2. 使用 asyncio.Queue 实现订阅者模式
3. 支持多订阅者同时订阅同一任务
4. 与 AsyncTrainingManager 的进度推送机制兼容
注意:
- 进程重启后进度数据会丢失
- 仅适用于单实例部署
- 服务器模式应使用 RedisProgressAdapter
Example:
>>> adapter = LocalProgressAdapter()
>>> await adapter.update_progress("task-123", {
... "stage": "sovits_train",
... "progress": 0.5,
... "message": "Epoch 8/16"
... })
>>>
>>> # 订阅进度
>>> async for progress in adapter.subscribe("task-123"):
... print(f"{progress['stage']}: {progress['progress']*100:.1f}%")
"""
def __init__(self):
"""初始化本地进度适配器"""
# 存储每个任务的最新进度
self.progress_store: Dict[str, Dict[str, Any]] = {}
# 存储每个任务的订阅者队列列表
self.subscribers: Dict[str, List[asyncio.Queue]] = defaultdict(list)
# 锁,用于保护订阅者列表的并发访问
self._lock = asyncio.Lock()
async def update_progress(self, task_id: str, progress: Dict[str, Any]) -> None:
"""
更新进度
Args:
task_id: 任务ID
progress: 进度信息字典,可包含:
- type: 消息类型 ("progress", "log", "error", "heartbeat")
- stage: 当前阶段
- progress: 阶段进度 (0.0-1.0)
- overall_progress: 总体进度 (0.0-1.0)
- message: 进度消息
- status: 状态 ("running", "completed", "failed", "cancelled")
"""
# 添加时间戳
if "timestamp" not in progress:
progress["timestamp"] = datetime.utcnow().isoformat()
# 存储最新进度
self.progress_store[task_id] = progress
# 通知所有订阅者
async with self._lock:
if task_id in self.subscribers:
for queue in self.subscribers[task_id]:
try:
await queue.put(progress)
except asyncio.QueueFull:
# 队列满了,跳过(避免阻塞)
pass
async def get_progress(self, task_id: str) -> Optional[Dict[str, Any]]:
"""
获取当前进度
Args:
task_id: 任务ID
Returns:
最新进度信息,不存在则返回 None
"""
return self.progress_store.get(task_id)
async def subscribe(self, task_id: str) -> AsyncGenerator[Dict[str, Any], None]:
"""
订阅进度更新
创建一个异步生成器,持续接收指定任务的进度更新。
当任务进入终态(completed, failed, cancelled)时自动结束。
Args:
task_id: 任务ID
Yields:
进度信息字典
Example:
>>> async for progress in adapter.subscribe("task-123"):
... print(progress)
... if progress.get("status") == "completed":
... break
"""
# 创建订阅者队列
queue: asyncio.Queue = asyncio.Queue(maxsize=100)
async with self._lock:
self.subscribers[task_id].append(queue)
try:
# 首先发送当前进度(如果有)
current = self.progress_store.get(task_id)
if current:
yield current
# 如果已经是终态,直接返回
if current.get("status") in ("completed", "failed", "cancelled"):
return
# 持续接收更新
while True:
try:
# 30秒超时,发送心跳
progress = await asyncio.wait_for(queue.get(), timeout=30.0)
yield progress
# 检查是否为终态
if progress.get("status") in ("completed", "failed", "cancelled"):
break
except asyncio.TimeoutError:
# 发送心跳保持连接
yield {
"type": "heartbeat",
"timestamp": datetime.utcnow().isoformat(),
}
finally:
# 清理订阅者
async with self._lock:
if task_id in self.subscribers:
try:
self.subscribers[task_id].remove(queue)
except ValueError:
pass
# 如果没有订阅者了,清理列表
if not self.subscribers[task_id]:
del self.subscribers[task_id]
async def clear_progress(self, task_id: str) -> None:
"""
清除任务进度数据
Args:
task_id: 任务ID
"""
self.progress_store.pop(task_id, None)
async with self._lock:
self.subscribers.pop(task_id, None)
async def get_subscriber_count(self, task_id: str) -> int:
"""
获取任务的订阅者数量
Args:
task_id: 任务ID
Returns:
订阅者数量
"""
async with self._lock:
return len(self.subscribers.get(task_id, []))
async def broadcast_to_all(self, message: Dict[str, Any]) -> int:
"""
向所有任务的订阅者广播消息
用于系统级通知,如服务器关闭警告等。
Args:
message: 消息内容
Returns:
发送成功的订阅者数量
"""
if "timestamp" not in message:
message["timestamp"] = datetime.utcnow().isoformat()
count = 0
async with self._lock:
for task_id, queues in self.subscribers.items():
for queue in queues:
try:
await queue.put(message)
count += 1
except asyncio.QueueFull:
pass
return count
def get_active_tasks(self) -> List[str]:
"""
获取有活跃订阅者的任务列表
Returns:
任务ID列表
"""
return list(self.subscribers.keys())
def get_stats(self) -> Dict[str, Any]:
"""
获取适配器统计信息
Returns:
统计信息字典
"""
total_subscribers = sum(
len(queues) for queues in self.subscribers.values()
)
return {
"stored_progress_count": len(self.progress_store),
"active_tasks": len(self.subscribers),
"total_subscribers": total_subscribers,
}
|