AgentJet/ajet/tuner_lib/experimental/swarm_overwatch_utils.py at 4658ce027f7288e945f50a67906bcf99df50da77 · modelscope/AgentJet · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
from typing import List, Dict
from pydantic import BaseModel


class RewardHistoryEntry(BaseModel):
    """A single entry in the reward history."""
    global_step: int
    mean_reward: float
    std_reward: float
    timestamp: float  # Unix timestamp when this entry was recorded


class RewardHistoryResponse(BaseModel):
    """Response containing the reward history for visualization."""
    history: List[RewardHistoryEntry] = []


class CurrentBatchRolloutPoolInformation(BaseModel):
    sample_collection_method: str = ""
    completed_episodes: int = 0
    completed_episode_target: int = 0
    completed_tasks: int = 0
    completed_task_target: int = 0
    completed_non_dummy_tasks: int = 0
    completed_non_dummy_task_target: int = 0
    task_expected_num_repeat: int = 0
    completed_tasks_details: Dict[str, List[str]] = {}           # task_id -> list of episode_uuids
    completed_tasks_rewards: Dict[str, List[float]] = {}         # task_id -> list of rewards (one per episode)
    completed_tasks_client_uuids: Dict[str, List[str]] = {}      # task_id -> list of client UUIDs (one per episode)
    running_episode_details: Dict[str, Dict[str, str]] | None = None # episode_uuid -> { "episode_status": ..., "time_since_last_activity": ..., "discard_episode_timeout": ..., "llm_call_count": ..., "client_uuid": ... }
    engine_status: str | None = None
    global_step: int | None = None
    booting_start_time: float | None = None  # timestamp when ENGINE.BOOTING started