43 lines
1.2 KiB
JSON
43 lines
1.2 KiB
JSON
{
|
|
"report_id": "report-b96a7d12-192c-4a4b-9bb4-6d420db36e62",
|
|
"timestamp": "2026-04-14T22:05:43.990256+00:00",
|
|
"source_trajectory_ids": [
|
|
"traj-00ce0e5c-3e46-47b0-b69f-131cfd13e311",
|
|
"traj-071fd37a-7fe1-4299-8f3b-64013316eb20",
|
|
"traj-1a05680f-94fd-4fae-92a9-2cbb55041263",
|
|
"traj-4711d2da-0d1e-4d33-863b-d1b1769c7780",
|
|
"traj-56fb49ad-8eaf-4c31-82d8-4f99688d0865",
|
|
"traj-78ed00a1-be06-4efd-959f-76d172d02081",
|
|
"traj-a0e1ce5d-1089-44c2-900f-7c3b298c0234",
|
|
"traj-a44ca7d1-78db-46de-b144-42d70a1d0bfc",
|
|
"traj-bd696e6c-e004-49f7-9967-b991bbe5369f",
|
|
"traj-fdbb3b87-c254-4d81-a06d-ea0ceb7e3093"
|
|
],
|
|
"sample_count": 10,
|
|
"baseline_metrics": {
|
|
"task_count": 1,
|
|
"avg_reward": 1.032,
|
|
"error_rate": 0.0,
|
|
"avg_latency_ms": 42.0
|
|
},
|
|
"challenger_metrics": {
|
|
"task_count": 1,
|
|
"avg_reward": 0.44,
|
|
"error_rate": 0.0,
|
|
"avg_latency_ms": 0.0
|
|
},
|
|
"promotion_decision": {
|
|
"accepted": true,
|
|
"reasons": [],
|
|
"metrics": {
|
|
"reward_delta": -0.592,
|
|
"error_rate_delta": 0.0,
|
|
"latency_delta_ms": -42.0,
|
|
"baseline_avg_reward": 1.032,
|
|
"challenger_avg_reward": 0.44
|
|
}
|
|
},
|
|
"promoted_version_id": "20260414-220543",
|
|
"baseline_version_id": "v-baseline",
|
|
"dry_run": false
|
|
} |