Initial standalone memabra release

This commit is contained in:
Carlos Ouyang
2026-04-15 11:06:05 +08:00
commit 58f9f221b1
464 changed files with 30256 additions and 0 deletions

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-0036bcfb-88dc-4636-897e-89fc909a810e",
"timestamp": "2026-04-14T16:51:38.314846+00:00",
"source_trajectory_ids": [
"traj-22d17281-9e5c-435d-852e-fa646d15afc4",
"traj-29a77a54-36ed-4885-b77f-ffc131425d2c",
"traj-40bce4b3-20ba-47ab-ac8d-4f3c494bffd1",
"traj-6ce2c5e5-6d58-439a-82ec-21f77f6de860",
"traj-76480a70-fbe1-4481-848b-a7e8d37643f5",
"traj-9a588dc5-9ef2-4290-8712-0b31946536a2",
"traj-b43b4a4e-4dfb-4ba9-8c56-29ea09e00e17",
"traj-ba03c72c-b782-400f-a9b1-4a4f6c0d7769",
"traj-be3bf833-bc49-4852-9ea2-ca04aeea8f31",
"traj-ebafcf74-923e-4af1-b64d-45c7cdbb4b04"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-009a9d41-ba23-4e38-85ad-cd6af5971d8b",
"timestamp": "2026-04-14T19:41:33.462482+00:00",
"source_trajectory_ids": [
"traj-0e089eaf-e132-405d-992f-a912f6baaaea",
"traj-2881966c-ad32-44c8-9c05-a50b0a2b784c",
"traj-5b351fac-7019-4807-a18a-c66b1c95c3e0",
"traj-6ef4ff84-d199-4864-8c99-6cd9efded1c6",
"traj-a62f2760-76ec-41f9-a20a-3ba8912c7c55",
"traj-b50b6662-ff12-4ec6-a112-c56e989bd768",
"traj-c1683dc5-e3d0-4421-aad7-fa42581096b2",
"traj-c3c9bd98-8c59-4cc4-8ad9-6d7b3c0be987",
"traj-d9a4fcc7-e929-48e6-8153-5d5c9c04f798",
"traj-e357c149-301f-4826-8812-6a1dab9087bd"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-025f0317-eb57-4357-a944-57c83e768e2b",
"timestamp": "2026-04-14T20:54:35.912785+00:00",
"source_trajectory_ids": [
"traj-0a386589-4f3d-4427-8bb6-984395bc391e",
"traj-0f04b540-f8bb-46d7-aeb4-ea65a723b82e",
"traj-14e30ab1-29e9-4356-ae7e-a8cea48c0b60",
"traj-4143c1db-ac63-4bc9-b427-a8f4d64c63f8",
"traj-43de5dee-3e20-42cf-91c1-2371b2f31329",
"traj-55766bd5-37dc-4216-9e29-3aea0a8a5095",
"traj-745e3299-1fd3-4af8-b6e2-4ebc4a47d389",
"traj-7c938b98-8346-48f8-a676-adb2e72e7259",
"traj-7dd2e59b-f65f-4870-b09e-69b95438b57b",
"traj-ab956b24-6aaa-49a2-8841-544cf9555959"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-0335fde2-290a-4346-91b0-d1224cb1253f",
"timestamp": "2026-04-14T15:26:25.556320+00:00",
"source_trajectory_ids": [
"traj-0ccf1900-1e3b-4465-8f02-c51d07d7934c",
"traj-22a75db4-1794-4b10-ba4f-61539ae28352",
"traj-2ec475f3-4500-4c56-b317-ddb692e6eae5",
"traj-35007253-de45-43f6-a64c-121230ae0e1f",
"traj-3d3548d3-1981-46ad-be73-33b0420e58f4",
"traj-4d5bb70e-9529-4c2c-bb5b-da7f7d09f1f4",
"traj-5a663b45-d37f-489f-a403-6dd73d7b2b52",
"traj-bdbf6fab-cccd-4381-b3dc-ee7533b5be0e",
"traj-c4ea76f2-4403-430f-8821-91f14822e41f",
"traj-f2bf1402-39da-4ec2-97ed-b9349ca87581"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-152625"
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-04b8cf41-45f2-4870-ba8b-b509f7d3da48",
"timestamp": "2026-04-14T18:58:37.161636+00:00",
"source_trajectory_ids": [
"traj-10fd1aac-8da8-4f5d-be73-feea5fb4e60d",
"traj-4b7226f5-e3ed-47de-b0bb-febcad399f82",
"traj-6364e000-05f1-4de2-b018-090d2dd922bf",
"traj-6ea75734-5be4-4d8c-b5c2-88d971a12763",
"traj-7e17a2ac-0aaf-49a8-aed5-552ce80dcfc8",
"traj-92c21045-ff0f-4ad0-855f-307a9f509ef7",
"traj-b8cefeb5-17ae-4be4-a756-a4c9c453d3c2",
"traj-c6a2dba6-dd4f-4c9f-9455-4fb3db4d44b1",
"traj-dcac6477-8278-43ab-8efe-226cc8acdeaf",
"traj-eec22ce4-682b-4694-bdb8-657a84c4a76c"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-07a477c9-2b2f-4505-a392-5dce58b67829",
"timestamp": "2026-04-14T18:01:06.160145+00:00",
"source_trajectory_ids": [
"traj-04f74afc-d341-4f63-b5ab-32f6d0fb33fb",
"traj-1fce1f44-c31b-4143-a0af-05b14783299c",
"traj-5fd71ba8-a8ed-4c52-bd5c-3dc0196b954a",
"traj-66dbaed9-42ee-4736-bed9-2a7d8260b81e",
"traj-89ceb3cf-0bfa-477b-b80c-76392bc7e9db",
"traj-8a7a589b-422d-4c51-b209-1f8a28bbe624",
"traj-b885ff21-6df2-4ea2-a39e-bb47a5aca56e",
"traj-df5f18eb-825e-4c80-b047-f9798bbeb654",
"traj-f47da721-1886-4466-b389-32ef359b58e6",
"traj-f673ef5f-700a-4dc8-b5ce-0ae2d3ebeeab"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-180106"
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-0856c8c4-bc0a-402d-8e4c-2e946029226b",
"timestamp": "2026-04-14T21:22:02.802049+00:00",
"source_trajectory_ids": [
"traj-29cd218f-e9b2-487d-ab34-620450a27cf7",
"traj-41331e52-1bb0-48c7-a65e-2749f3341018",
"traj-42b96e93-b37e-4518-84ce-90b243a4a9e2",
"traj-42c90394-8ac2-4a7d-8c12-4b4a78ab7a87",
"traj-47a0fae8-60f3-4a1a-90a1-0f643e2d9920",
"traj-7deb603d-b31e-4625-abaf-344ec12efe44",
"traj-dc35bca8-1bca-442a-93a1-4d77e360aba0",
"traj-e135ebd2-c850-4f9b-a6df-24b1d7eff190",
"traj-e87835bb-ba03-453e-8a50-49ddeeb7268d",
"traj-f1557075-9c9a-4f2a-bc48-6a919a379ae0"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-212202",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-08ef866e-b477-4e72-a32c-30003d2b91e9",
"timestamp": "2026-04-14T20:54:35.812564+00:00",
"source_trajectory_ids": [
"traj-0c9390f7-31ef-48fa-896b-093f9cd4c0ce",
"traj-1822f88a-0a09-4536-8022-24a7a73ba6df",
"traj-28ba821c-6a0c-4d40-a008-14497585c3d7",
"traj-483b03b2-41ee-4228-9d26-bb4e45eb241c",
"traj-73718bd7-97ad-424e-a049-e1ecc05ad770",
"traj-b4089209-fcf2-4139-9ed1-e9db5caaff69",
"traj-c097a470-093d-4dd1-a6c0-d21110fea346",
"traj-fc0408dc-5429-4af8-87d0-8c6212ae2623",
"traj-fd8f8a32-d9cb-4bda-a70b-bd95e604e037",
"traj-fe7cd38e-3e5d-4ae3-9ee0-6a2c0caafb2b"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-205435",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-09798c98-3bcb-4298-a546-2f531f875853",
"timestamp": "2026-04-14T22:10:23.222959+00:00",
"source_trajectory_ids": [
"traj-221f0c59-ad6b-4526-ae14-b5bb558b01ca",
"traj-24cbe596-6ee7-444a-b600-32d9b55422db",
"traj-2c5a6c34-df10-411d-9709-2a2e07cfca5e",
"traj-58e6dcd6-c688-4a66-a1a8-2fc64b06452a",
"traj-6a713624-ac97-42db-9946-9919da454d47",
"traj-813e4f86-4aab-420b-86fc-8a8694670c84",
"traj-a4c8fee4-428b-471c-8634-05d09c430b32",
"traj-caa40a45-47ec-4369-9519-ebdb038d5d6a",
"traj-d0d72631-39d8-47d7-83a5-76f424553eca",
"traj-d5dde094-d5e7-465d-8d7d-0f55356ae159"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-221023",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-097c5767-cf9b-42f5-9f8b-dee8a6224a67",
"timestamp": "2026-04-14T21:42:45.782035+00:00",
"source_trajectory_ids": [
"traj-1212bad2-f0fe-4d95-afd8-2a711775ccfb",
"traj-4d53da5b-5a10-4689-8dd9-0a1b2fa74083",
"traj-50942176-422b-4653-9477-48e1d16c0d34",
"traj-6d886402-bc74-4c9e-998e-ad9e4177b08d",
"traj-7d91fc48-dd1d-4c40-9785-5ebef05378a4",
"traj-8c012adb-959e-4eab-ac6c-3c5c4854720c",
"traj-8df099f2-5180-4ac1-8519-3204b9cffe07",
"traj-9c21877b-f093-44cc-af53-9b2961a4dd46",
"traj-ff0df310-0704-4619-9346-b27f1df0f237",
"traj-ffb39e69-6327-4985-8858-730a3c00a806"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-214245",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-09ac51b7-988c-4b9c-ba38-3511d728c61d",
"timestamp": "2026-04-14T22:10:23.371730+00:00",
"source_trajectory_ids": [
"traj-00565435-0e10-46c5-82bd-3ba97f356fb2",
"traj-0249861e-b2f3-4e73-8e38-0599d0b7e8f0",
"traj-283bbc3b-5f88-48de-87b8-192418f70445",
"traj-4c674844-5148-4428-8607-22ae4ad7361d",
"traj-5689e1e1-0a03-45e8-b006-c692325fcc45",
"traj-a809b624-6317-4ce7-b809-4ab3479566ee",
"traj-b1e3a397-8678-436c-a9ed-17ea168c203a",
"traj-b87b739b-6daa-49a8-a7de-8d4509659328",
"traj-bc0076e9-0167-44ac-89ae-634b02890cb5",
"traj-d42ef1c3-cd8f-4474-a5d6-f0a42ff0a2f3"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-0a3e40be-b389-4041-bab7-cd99e4c8eac0",
"timestamp": "2026-04-14T20:07:38.841838+00:00",
"source_trajectory_ids": [
"traj-04eb60db-62bd-46c2-afe3-ecba6eac900a",
"traj-26387046-6b12-4841-9129-735599f13261",
"traj-34b22e88-a95e-4f12-84e5-da9af52a7381",
"traj-4f4eb7ad-1d11-4852-adde-eab50619c2bc",
"traj-51ecc36d-be08-4bcf-b645-7553e9b03992",
"traj-6b9f4f38-dc89-4abd-870e-c48c92d2b40e",
"traj-82fb2e11-fb35-4960-90d2-b2e53a1ea2ed",
"traj-ba5fa9da-693f-4a36-ab0f-c2efbe798ece",
"traj-c9c3403c-2ff3-4d84-85dd-731620583118",
"traj-ede4f925-e445-4cae-a3ba-0d30973294ae"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-0a675757-4870-4b12-98fb-ab093889eff3",
"timestamp": "2026-04-15T01:57:32.814873+00:00",
"source_trajectory_ids": [
"traj-1119ae3b-8cb6-4391-b283-bfeefdd12afe",
"traj-11afd403-d5d6-4af6-85b8-b015ed5bb1d3",
"traj-5c68a94c-d276-4e0f-9356-b99b6163e4e5",
"traj-5cdcaf3b-851f-45da-9fe1-253060428059",
"traj-5fd13613-7463-4969-ab53-c2e7e8555df3",
"traj-617478e4-408a-4ed6-a06d-b84da7be94b1",
"traj-a3a5c39f-592b-4b4b-94e9-59f63039e53e",
"traj-b5ffa504-3f59-4a75-8c10-1f4f5b5aa8c8",
"traj-c4e73e5c-5b4d-4f4c-a209-3f6147263622",
"traj-cccb6c09-84cd-4247-aa40-9ec6e0a9f1bd"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-0b64fe15-dd10-4f78-916b-200ec6483fcd",
"timestamp": "2026-04-14T14:59:48.944796+00:00",
"source_trajectory_ids": [
"traj-05a12459-be9e-484e-9a58-83b465e24092",
"traj-0924a001-1055-4126-b241-bcdd2c078494",
"traj-17ae339d-c886-414e-94b3-5e570093c8e4",
"traj-18e10e43-4694-43e1-be9a-f16fdf123e35",
"traj-5460af6d-b2c1-4a71-aaff-0060c05a4421",
"traj-5517734f-c4fe-497e-a402-aa5228395d34",
"traj-59b1a050-9be6-4aca-bbfb-0e1da246da2d",
"traj-7094a080-3592-4e33-9ba3-f32fdbe02e76",
"traj-8f62ae27-0a61-43bf-a8e6-7b73e9a1c888",
"traj-967b670c-429a-4be2-a8c2-ec341ff3106e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-0c59209d-fc75-4b15-bcdb-239138c12b79",
"timestamp": "2026-04-15T01:41:52.505512+00:00",
"source_trajectory_ids": [
"traj-0ddf19dd-e828-4035-bd6e-29e627769d2e",
"traj-1c185db1-61db-4f0c-b069-8e8e4ced92e7",
"traj-23b5c08b-2fca-4f55-84a6-7068af698780",
"traj-3f243fab-5841-41e6-acf6-f8c9f40cf515",
"traj-713b43da-4b0f-4fbe-b190-9b508d1244f0",
"traj-9764ffe9-c580-4b3f-88a3-beead04a1df3",
"traj-a6e4d148-6744-4fda-a1bf-26603166117c",
"traj-cc7aa6c3-de72-4bfd-83fc-761eaa8cc8a7",
"traj-d12e9387-0fd2-4a4f-b387-3cd58cbf12f4",
"traj-fdb7911a-4cc0-4906-b5bc-658be058653e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-014152",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-0cb5da05-94e7-4f55-b759-1338cebaf5fd",
"timestamp": "2026-04-14T21:22:02.988940+00:00",
"source_trajectory_ids": [
"traj-2704df3d-419c-4206-af3c-afd5466b305c",
"traj-49134729-36f2-467c-83ac-da261acc561b",
"traj-7adf97fd-549f-4123-9340-5b49f024f6d7",
"traj-852b116d-998b-48fd-aa71-293f8b31c6e4",
"traj-92a1293d-5d98-4efb-88ba-125ca308d246",
"traj-ab7f2171-8a7c-4315-a80f-fb88168b794e",
"traj-c3788641-46cf-43fe-bb92-4b3871f1b20e",
"traj-cf3e5d99-8b30-4877-a93d-481968801eaf",
"traj-e051963a-bada-41f6-9fc5-4ba429d136c9",
"traj-f5d94b37-3215-4a5f-9528-8b13dd9f4ceb"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-212202",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-0e0b0f65-2073-445d-8b24-753642e15b88",
"timestamp": "2026-04-15T02:31:17.525516+00:00",
"source_trajectory_ids": [
"traj-22f50846-2268-4d3f-94ab-cef4813aa471",
"traj-34c1633d-c680-49ae-81de-f9c4942f3d1f",
"traj-3fb919b1-e148-4764-9197-aea2c313ec6a",
"traj-4dd3e06b-8c8d-41c2-a06a-006f024b868a",
"traj-6b505d4e-b7da-4f0d-81a5-1c37f89ca93e",
"traj-84925606-3ef8-47bc-8f58-97a22083b6ad",
"traj-d532be68-7050-4ec1-bf21-06085d8894f9",
"traj-e6eec076-e362-4dc1-8444-af9f6bb659b2",
"traj-f273ccb2-a6d6-40dd-836f-e6835a7aa55c",
"traj-ff6a2137-d4ab-406a-b43a-d2741f6dd91b"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-023117",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-10a2f403-eca3-4ec5-ac0e-8e907322679d",
"timestamp": "2026-04-14T18:58:37.085590+00:00",
"source_trajectory_ids": [
"traj-6aa4c009-836a-4013-887a-07ed5b767a2f",
"traj-6c9e26f0-ed6d-4bcb-aa25-e79789688ccb",
"traj-8898f73e-1ce5-4770-9966-359bef9958ae",
"traj-9055a563-4353-4975-a970-5ef46a472d45",
"traj-91d1f2db-f516-4fc9-8a74-8bc6ebe0be47",
"traj-b5b5fd0f-a745-48aa-a6b9-8c50451a7b07",
"traj-d3f8003f-39fd-4eb7-a68a-41d137da964a",
"traj-dfd75ad1-1e73-45d5-8dd0-aad7e860fdcc",
"traj-e178b3b0-8872-4f89-9d25-4e55d3a7aaf2",
"traj-e7bafd52-4193-4bdd-9fc1-d46658003751"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-185837",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-13b9b11b-b1cd-4d70-9fcc-a972cbd54805",
"timestamp": "2026-04-15T01:21:53.876489+00:00",
"source_trajectory_ids": [
"traj-4095188b-6d84-4ee1-a3fc-a4a147b2e983",
"traj-4f2d3ac1-211c-417a-9836-87126bd0aa35",
"traj-5aa5c2f9-8ac1-4031-a12c-e6c4e8d0ece0",
"traj-60f0860e-9a83-4826-966d-40cf15d4fcb9",
"traj-74fc1f64-33b4-443d-9c1d-a4a0e60f7ff0",
"traj-8bc691d7-e5bc-4b7b-8621-8401f36a5f4d",
"traj-8d7af32a-19d7-4ff9-8f6d-a2337280cc4c",
"traj-b22e4a02-c74d-4e10-91f6-8ac4b7a5c2ea",
"traj-f833d392-3250-4caa-8acb-90fc49d3b3c1",
"traj-f9702b75-4b65-4f83-8ef1-c2594c87db8a"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-012153",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-13f1b744-a87c-48f0-b024-d48396ae1c25",
"timestamp": "2026-04-14T20:06:16.345373+00:00",
"source_trajectory_ids": [
"traj-06da564b-232b-4496-ae9d-81306a08cc7b",
"traj-6b557f04-4b89-4628-8d4f-acb8d5b060df",
"traj-7e9f9a58-1594-44aa-9712-215e130a7dd6",
"traj-8765d4ea-b4c4-45dd-8830-df92cc3f3aba",
"traj-ac14447b-6afb-4d39-bd92-8172d4f50c8e",
"traj-b70ae420-ea46-47d8-8640-f0b21e659a81",
"traj-bb4b6108-ade8-421c-96f1-f35c36677029",
"traj-c81f1a4e-7182-4560-91c7-86bdc4ccfa03",
"traj-d6c3266e-8d3e-4e42-bf5b-8522ca351241",
"traj-eca10f07-c2e4-42bd-9ec7-21c3fba82752"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-200616",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-15c39b58-4792-486c-88c2-8fa95f34f0e7",
"timestamp": "2026-04-14T21:18:36.157196+00:00",
"source_trajectory_ids": [
"traj-0d2380fb-a3a9-4c3b-bb01-4390198f0e60",
"traj-1147c420-d6bd-45a6-9071-a38f96205f7b",
"traj-436265cb-1612-4ef2-94e5-311619f97900",
"traj-4672cbe1-bc67-4378-b517-e4f0c23395c7",
"traj-4cd057fa-bca1-4172-805b-cf0aac1191ce",
"traj-7fae7ddb-e46d-411c-ae1c-b17ed44159e6",
"traj-beac32c5-da6d-48e2-aab1-140041c46a80",
"traj-c08cf9ff-2fee-4071-bb39-91955125de74",
"traj-c32944a0-6f3d-4fc4-9cb7-f8a5b581445b",
"traj-d59a5c84-eea1-44b3-b182-9f0b4119b448"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-211836",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-16240412-414a-48fb-a5de-244647601b99",
"timestamp": "2026-04-14T21:44:48.199092+00:00",
"source_trajectory_ids": [
"traj-3d852c8f-73dd-454f-a35b-4d22d5dd187e",
"traj-5d8dd2a4-854f-41dd-9f14-6a08657fc60e",
"traj-64125a25-a99f-42c4-9d76-1b68c45809a4",
"traj-6fe3e14c-b6cd-4a04-9fe3-4cfd011f880b",
"traj-94ddd7b7-7a70-45d6-986c-9a22512fb6b8",
"traj-afbbdc73-f4a9-4d42-a8d5-9f41464b0e20",
"traj-bca371df-ce7e-427c-acd3-83c712cb11db",
"traj-c4849366-5ee8-4442-80cb-fb6207f59d48",
"traj-c6a1ed31-c1d7-4147-a035-fef03423d0b6",
"traj-e9a5cbf2-4716-462c-8f00-5e75da4636a4"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-214448",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-197593f2-1928-428f-a143-d59574a1070f",
"timestamp": "2026-04-15T01:41:52.446867+00:00",
"source_trajectory_ids": [
"traj-032f9293-f5f9-4f2d-8724-4df72b6e2def",
"traj-1c8cbbb2-d4b0-427b-8009-57141775873f",
"traj-28f049b4-aac9-40d6-8e65-4f8d612fe1cb",
"traj-29337650-4610-4468-adf5-39cd2a095750",
"traj-568702f9-d5ce-440d-8056-faf70ca7492a",
"traj-76b8ddce-0f28-4fc1-8191-82a313b854e7",
"traj-d1ede161-80e7-4d3d-b09e-e65972bbbc61",
"traj-d3528eb9-0934-476e-9291-a0b616686308",
"traj-e4743774-7609-4749-bdc7-bdfe31107cd3",
"traj-eac8b576-7a44-472f-9553-b68773ac4bda"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-1a6693a9-d9aa-4fb7-9c37-8eca70db8ff2",
"timestamp": "2026-04-14T20:56:07.953209+00:00",
"source_trajectory_ids": [
"traj-1d87ed37-a6de-437b-b1f7-655e1465ae99",
"traj-59bfcf1f-5462-419c-8571-56960b954a7a",
"traj-71a16960-4bab-4e3a-8187-aff9a04774f4",
"traj-89b30f5d-96f7-4748-b44a-f03efa183c0c",
"traj-a67da73d-9e4b-4082-9f02-09c1b04a30c7",
"traj-a82d0c43-6d5d-4c2c-b4b1-9ba06a1f8433",
"traj-adb2c5dd-78a0-4a5b-98a7-1d78f8e7e680",
"traj-b5f04bf0-caf1-4523-9b30-5a094185428c",
"traj-d67e548f-de22-4a83-ba4a-9b737dbeefa0",
"traj-f840a2e0-d314-4dcc-9c02-262a92a093e8"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-205607",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-1b339815-f279-409b-ab77-c5c5c31744f7",
"timestamp": "2026-04-14T20:56:11.542333+00:00",
"source_trajectory_ids": [
"traj-02aee60f-4b45-4ee1-9341-c60be647ff1b",
"traj-0a7673fb-d561-44f6-9cb8-aa87122018a3",
"traj-441ae78a-e0c9-408e-87e4-421c9a96fc5e",
"traj-4d2d110d-4309-4728-b072-b1785e6df45a",
"traj-629ca24d-3b2f-4c8f-8be4-0b1f8bc21df7",
"traj-64f19728-5662-43f3-84da-9476b25db403",
"traj-963f8b19-2650-428c-9135-1500fd1d7ded",
"traj-c3aed0f9-1919-49a3-ab90-84d89f423d33",
"traj-e9567bfd-bec6-4836-8f23-341447fd7a9c",
"traj-ea6e5ff5-936f-4aa1-839b-2199ec7f925b"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-205611",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-1d45c6bd-7847-46d4-a3aa-953bcdce24ec",
"timestamp": "2026-04-14T21:18:36.139079+00:00",
"source_trajectory_ids": [
"traj-200f901f-aecf-43e4-a9cd-f3ebfed82ed0",
"traj-233795c8-8d47-4a3b-86f7-9d2af40b89cb",
"traj-42523abe-2654-46d6-8cce-4154ab093cf2",
"traj-49763bb6-634e-4fa0-a23b-0f537e97262d",
"traj-593e6516-7ec2-4226-83fb-65a4a5274616",
"traj-617282fd-7c85-4583-a59f-54315bbf9e40",
"traj-7f6074d8-ea0d-4d48-94f3-4a67d0ee92a5",
"traj-8a3543c1-3007-4271-9862-06ae3202f039",
"traj-9121275f-b96c-4cc5-a45d-1c50532c6409",
"traj-c73e41e8-483d-435a-bd6e-e868a445bd30"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-211836",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-1e0bf809-418e-4720-ab59-b8d7401ce94c",
"timestamp": "2026-04-14T20:30:08.746811+00:00",
"source_trajectory_ids": [
"traj-09d6c0c8-8c5b-4264-aaf4-78b6ec7689b2",
"traj-11b5e179-af57-4df4-a07e-6263f6e82ddd",
"traj-12d9e29a-03cb-4242-91ee-de30aacb0e50",
"traj-41580331-af54-47ed-9aab-2fab2fc8c3a0",
"traj-707b126a-6164-475f-81a3-4a34fe624639",
"traj-903e62d9-1478-44de-8348-4e08531a9178",
"traj-9ebcf874-21b8-453f-817f-f7038907608c",
"traj-9fc3b26a-7ba9-4d9a-a732-17db84494c48",
"traj-a16724af-e0aa-4aa3-9615-c8c3b14173a7",
"traj-b1235cd4-6b9f-4b86-bca3-39f48ee4c1ea"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-1e1d679b-3b0d-4cb9-b474-8302992df5ba",
"timestamp": "2026-04-15T01:25:33.772160+00:00",
"source_trajectory_ids": [
"traj-0091cdde-9035-4995-9b30-ba3e52a4e74b",
"traj-21d17e25-de55-46e8-b31f-0e6d6a045351",
"traj-52d9d18b-f37f-4a42-bcc8-ce7e28277942",
"traj-5f2a03a7-33d9-48f9-b1cb-bb5ac6e1f21c",
"traj-86cb57eb-74c0-4ea5-bce7-3aa1690b9599",
"traj-87e89d6e-3ef0-4ee4-ab62-c0002b4d1b22",
"traj-a7dd2fb7-6756-430e-9964-dfca0f3a6981",
"traj-aa624e2b-6012-406a-8542-2ffed00096bc",
"traj-ef61014c-791a-4535-a78f-7ab715a7c3bb",
"traj-fbab542f-9c5f-4b90-889e-f2d253862441"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-012533",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-20611e96-6b00-4a0d-9be5-5d5e968b3371",
"timestamp": "2026-04-14T21:22:14.567603+00:00",
"source_trajectory_ids": [
"traj-25fd7e3b-5c72-4b15-a847-70a35bc85f1f",
"traj-2c2d6197-5e0e-4ca8-a762-b5aca1b4d486",
"traj-36a27b22-b36b-4912-8dbe-72dd0138c06f",
"traj-590f4b56-7a29-4080-80ba-23bfc984a935",
"traj-7298713f-34a4-48bc-8e41-f0b0d6de8778",
"traj-82acfa6b-76d4-4a01-a9e5-3f989a3f2684",
"traj-8ab1b3d9-a6fa-4bf3-8d5b-5298ac85afb2",
"traj-98cfa826-215f-40a9-9fb9-7d8b41640295",
"traj-cd585938-d8b0-4773-8fe7-655cba23cbec",
"traj-ec26bcd5-3463-4a25-9ebc-b046e66020cf"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-212214",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,42 @@
{
"report_id": "report-20ea6367-8e42-4f6a-b90d-60eb441aa9f8",
"timestamp": "2026-04-14T18:31:07.921735+00:00",
"source_trajectory_ids": [
"traj-253bd144-3ad8-4dcc-951e-535f7fa444c6",
"traj-2ba9feaf-ffd1-41f8-b492-365351133a96",
"traj-35c97cf2-e5d0-4d9c-be42-d46b14f8afa7",
"traj-47b3674d-73db-41dd-b8db-472f91f864a0",
"traj-4d744d56-15bd-4e54-ba65-29f6135dda22",
"traj-4e3fcf21-0020-4585-b277-9c8a03081c06",
"traj-655aea4f-bc1d-47c3-85ac-73c8bb63d7e4",
"traj-66d29b59-21be-474b-a6a8-9d7a0e36b8bb",
"traj-8c7ed834-ada2-44f2-9a67-e7066d0bafe6",
"traj-bd4fdcd8-1577-41a3-a081-a738b17bb9c1"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-183107",
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-21a16654-d936-4393-88d7-9e0e00d98fec",
"timestamp": "2026-04-14T16:49:44.845808+00:00",
"source_trajectory_ids": [
"traj-2999497a-dba8-4215-8f44-f7371fb4c18d",
"traj-4603b0e1-ef1e-4f44-a5bf-7994eeb97fd2",
"traj-49f42054-4065-41c6-8d70-e89801df29dc",
"traj-53b375aa-ba3f-4518-973c-6c8c1b704fd1",
"traj-68124be2-5cc4-4c52-b891-fc5cb253b3ea",
"traj-828c6c7b-72ed-44ee-8628-f1bee3080ce1",
"traj-a4516393-6015-4029-910a-15955a283aec",
"traj-ba4984ba-48a3-43ac-8726-d73db56f5a5e",
"traj-ccb9f3ca-26e2-4efb-9b1a-b55a913b55cd",
"traj-f9aa9adc-232e-4f92-9161-23165cb9dca4"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-164944"
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-21e68879-c123-49e0-8af9-9f8e9dc76ecf",
"timestamp": "2026-04-14T18:58:37.102905+00:00",
"source_trajectory_ids": [
"traj-1f23a1c3-4ba3-412b-9df5-61bda0396bc8",
"traj-24c1c82b-1fac-4365-a643-faa65082b8d8",
"traj-5f848d9c-294e-4586-9951-30a03588cc26",
"traj-8bdac473-266e-454b-a2d6-267f6189850e",
"traj-b05d7433-97be-4604-bcee-a18cb1102a80",
"traj-c0a59283-e7e0-41fe-925d-79b4e076b9f6",
"traj-cd1ef62e-83f9-4b1b-99b7-ff1e1586afb9",
"traj-e2f37ecf-a075-4b1b-ad12-9c3e7be77fc7",
"traj-e3bb7c13-fe7c-462c-9f88-d7f40092669c",
"traj-e8bc452a-b3c7-4448-a994-51cc81b30730"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-185837",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-22b88101-5979-4011-b85d-c3bb3e1f84ae",
"timestamp": "2026-04-14T15:25:06.028393+00:00",
"source_trajectory_ids": [
"traj-263efcd1-4b24-4302-a9cf-5c5778297ac2",
"traj-29855290-bd18-44cb-b1d2-da2bd3eff5b3",
"traj-5d04fe16-cac2-4f5d-b469-eb4ff0c3e66a",
"traj-67d1127e-70c1-4f86-93e2-8d0e7e6df433",
"traj-8e66108b-fa8c-426e-99e9-f7df432b7436",
"traj-a0df3bda-d35b-4c76-b68e-2c9dbb47f6f2",
"traj-bc36ba31-9c1f-4902-9f79-acf7653d0e86",
"traj-c62fe68a-4ad5-403a-b747-2648ae56392b",
"traj-c74f4755-6cf3-4f1e-950e-672a946a7b4e",
"traj-ff0f3558-e0cd-49e0-974b-1b5bd9cb5af1"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-2493e5d6-4be2-49a6-8e84-6f3fda442ff5",
"timestamp": "2026-04-14T16:54:50.564245+00:00",
"source_trajectory_ids": [
"traj-0ef5e19a-7c30-45a4-979f-67d46413ee95",
"traj-11483ef1-e410-47c5-a265-53bff1968182",
"traj-59cbb530-0ae7-41e6-a033-250431a20bb8",
"traj-671f19f7-cd71-4539-83ea-5441807561c9",
"traj-6c693d47-22b0-42e1-a76f-9ba625d79a70",
"traj-97c4d19b-9aff-4f15-b1e3-c82c8da598e0",
"traj-cd8780de-7bc7-4735-acdd-e66ed407619f",
"traj-e4b2af56-8718-41c4-bd7f-6c479b1fb7f3",
"traj-e63b675d-9bba-41bf-a472-a068cf2437fd",
"traj-f10cfe93-7fe1-4c84-bfba-2cb3c3892a9e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-24f69dfe-4955-4c6a-8421-5c1bdd0bdfda",
"timestamp": "2026-04-14T21:42:45.897635+00:00",
"source_trajectory_ids": [
"traj-11726363-9ef7-47e4-9e77-4e2b1fbefbd3",
"traj-28ecbc8b-0dd9-4e4e-a4d0-cfe262c4a812",
"traj-3abe1edd-f76a-4040-a471-0ad8535ff553",
"traj-3ed7731b-def2-459e-948d-a45cd595c4de",
"traj-4620d7ac-94ad-4310-8dfe-3f1c9124ceb9",
"traj-5a041387-76c4-483c-8df9-a6ee410a3264",
"traj-6f340ce0-d606-4890-b647-ad57360f8566",
"traj-82ebfe0c-08de-4c00-9a8e-8f293191c97a",
"traj-a5442e4e-57fb-4af6-941f-90c25a3862dc",
"traj-c2c5e763-e809-4264-af82-610fbe7c5fd1"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-2522e075-f011-4379-989c-f413d768a957",
"timestamp": "2026-04-14T15:52:51.189860+00:00",
"source_trajectory_ids": [
"traj-0c96d155-112e-4658-bf90-3b35da7e7c2f",
"traj-22a09d6a-b9ee-4ff4-b324-a14cb8f33a91",
"traj-36fcb806-8f3f-44cc-99a8-1b4f6170a18e",
"traj-42da2c6e-15c2-4c40-92f3-14b5eef5e681",
"traj-6b083428-c47a-4d83-80dc-4db2c66887d7",
"traj-a9c06cd6-3332-41b9-bb21-3afc06e6f701",
"traj-b45b09b4-c348-4215-9cba-4adbe8a76410",
"traj-c7b2b172-8223-423c-abb4-79bfeb1cbe94",
"traj-cd806afc-6846-4361-9692-dff3469717a8",
"traj-d0622a9d-4e59-44be-8231-2b27a25d47ac"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-263a0d30-9096-4e1c-a406-43927ac46d80",
"timestamp": "2026-04-14T20:28:05.472990+00:00",
"source_trajectory_ids": [
"traj-02ffe167-5287-4a72-8e9e-623baef314d8",
"traj-58518476-0941-437f-86d7-80f000a35ae7",
"traj-73a97752-0bb5-4f24-92ec-8f3cec52ed4f",
"traj-77750db3-022e-4dfc-a19b-a45e2eb41923",
"traj-a7d6998f-0355-408e-acde-7f84033a7712",
"traj-b73c6762-b738-4156-bf01-38661089bd01",
"traj-d90086be-591d-4c4a-a220-6e35a125cc62",
"traj-dcada7b1-e74e-42ee-b117-aea8d121247b",
"traj-e5b873ad-8e62-4b91-a714-16eca70dbae3",
"traj-f63e8157-40e6-480a-a2d2-bd7a257636dc"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-202805",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-26782aa8-a2a0-45f9-8ac3-861fc1364431",
"timestamp": "2026-04-15T01:57:32.697736+00:00",
"source_trajectory_ids": [
"traj-0269da6e-275b-4eae-8a43-1b89a74a87c2",
"traj-28052977-cc23-4c06-9343-dce8b4ca5ee3",
"traj-3f7b8039-6d47-4ce4-9c3b-6d80d4548825",
"traj-4e37cd2f-c830-4eba-84d9-87cffe9bcec3",
"traj-74071894-0764-410c-8460-cebb98b80fa4",
"traj-8c547ed6-61ba-4c6e-a8e2-990264cf77b9",
"traj-a65f8feb-1368-43c0-a3b9-97f6a3420741",
"traj-b80a3d53-4ffe-4147-b8d6-b619fd951f58",
"traj-bb4444ec-7bd6-42e3-b9e1-4a680d368d50",
"traj-c5cea58f-f981-4f73-8f3a-e35d7f3befb7"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-015732",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-279b3b5c-bf69-4d8a-9be7-372086c295c9",
"timestamp": "2026-04-14T20:06:16.411538+00:00",
"source_trajectory_ids": [
"traj-2382eb44-3957-434e-a171-04e6ecd5a0ce",
"traj-28e66c25-3314-43ce-8a7f-911d8943ea11",
"traj-3b62b30e-9c8f-433b-bf40-16820db431aa",
"traj-8b3b0d30-f9bb-4323-9403-23970be3a4e6",
"traj-8b84c7fe-b827-4b35-8f2e-6538fbc684fb",
"traj-9cc1eef1-d47d-481f-851e-5913609c8740",
"traj-a960cca8-bcc9-4332-9523-3170ef7c5355",
"traj-b34c9f41-87f6-40f8-8d3b-0878f4d61911",
"traj-b4ba32fb-2bee-41b6-a46e-0a094079f40c",
"traj-f5dd1000-03ed-4b5a-b00f-e6437ba56426"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-2957a4db-25be-4a31-be96-bb53b60b0574",
"timestamp": "2026-04-15T01:29:18.124253+00:00",
"source_trajectory_ids": [
"traj-24875022-ace1-4d16-b802-9e19c0345039",
"traj-2adcad42-6922-4c27-b879-75aac21c94ba",
"traj-35512ca0-78e3-4d99-8efa-056013aefbbd",
"traj-60c4586a-c6ba-421c-939c-04a3c497ee3b",
"traj-64a60af0-4d68-4370-a4a0-6f5ebdc4b7ad",
"traj-8ef62528-7f24-495a-8c51-7936b30c02ec",
"traj-c52966b8-939c-493d-b528-716ca6e0c4e5",
"traj-d31381b8-70b3-44fa-9daa-053e9d517b8f",
"traj-e7852591-231f-4f0f-8032-fb872fa5e220",
"traj-eeb9b89c-6edf-4354-aafb-ce7fe0212dab"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-012918",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-2b3e115b-fae8-4813-b53d-1c8501010bf6",
"timestamp": "2026-04-14T15:53:50.791993+00:00",
"source_trajectory_ids": [
"traj-03447345-9e58-46c4-9ba0-8db3c0e720ee",
"traj-1b3c8854-3738-444e-b1ee-2ca9d728b580",
"traj-23d09f97-9f5e-4d4f-9e69-f70e66e665ce",
"traj-606fe284-63f2-40b0-88bd-fcb9a3b27738",
"traj-68c91a21-306c-462f-a9e6-f5b9b149de8e",
"traj-6ee3651f-9ccd-4d20-afc6-ac40d1a8dd9f",
"traj-7a5f901f-d5b4-41bb-a790-a9a82c521bee",
"traj-b725122c-6c00-40ae-acb0-c2ad58eaf075",
"traj-c160f961-cd03-404c-9ffa-037d1e196e9f",
"traj-ed0113b3-3c2a-4d16-b31f-8c1fcde61291"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-2bbfec49-07f0-43c8-9c0d-f9dbc33b8b53",
"timestamp": "2026-04-14T22:10:15.279833+00:00",
"source_trajectory_ids": [
"traj-0fd602e1-438a-42d6-b684-09db49c96b27",
"traj-354a350a-d325-4233-afe7-387d05eba246",
"traj-4737d84e-ffc5-4187-b37b-c1581c9197c5",
"traj-54880be9-eac7-4a8a-82c2-aee098b966a1",
"traj-5d14290d-8afc-4a98-9df0-44db13f9bc33",
"traj-659b7f39-a95a-485a-aab7-65018cc206ed",
"traj-77720324-df56-4f6f-a732-824e97d9c7fe",
"traj-ed1a3760-846c-4534-9ea7-e6f54a2e1414",
"traj-f6fef155-e568-49f9-a286-c56c6b729c0d",
"traj-f8488008-391b-4fae-9d98-b9a379eca15e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-221015",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-2ce71481-bf67-4581-b35e-65b83189c959",
"timestamp": "2026-04-14T21:22:14.626005+00:00",
"source_trajectory_ids": [
"traj-0a77ca1d-28c9-4148-b099-2990f38d701f",
"traj-51afda16-46e8-4fc6-aba5-1a02600624de",
"traj-5586372a-1b39-4028-95ae-31095cf3136d",
"traj-a1333bdd-5b03-45c7-853f-e49c1767031a",
"traj-a6a93535-fce3-4374-9cb6-0321a5a4769f",
"traj-b40704cc-e206-4da6-930c-1d0f1b7234a5",
"traj-b7c19bf6-3da3-451d-ba41-4019ef8e92d5",
"traj-c6f07968-deb4-48eb-a4ef-401339afb5fd",
"traj-d0fd2e96-e15a-4f2e-b51d-34f482772ea1",
"traj-e74aefaa-647c-4b9f-8a6c-e7cb2bbe0780"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-212214",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-2e6d5c48-47b9-4bd6-9a9b-117e9d646ccc",
"timestamp": "2026-04-14T21:18:36.299274+00:00",
"source_trajectory_ids": [
"traj-06944244-d2e8-4e6f-a49f-da5c792befce",
"traj-2a694d25-5898-4d2d-9bac-bcdc01d2d442",
"traj-4c7f18bb-78aa-4170-99e7-12e5ace54340",
"traj-5d7ed2c2-17b0-4daf-8661-51ec1da1fd60",
"traj-649669bb-b814-4114-9205-a328137d5bf7",
"traj-768ecbc8-30bf-4c05-82e6-c346736eea24",
"traj-7bb5cc17-a8e6-4c0a-b525-e2cd671187a2",
"traj-d23853f5-359e-4c3b-97e7-d239b5d7a152",
"traj-ec11358e-da16-426e-b74a-42f2e95db560",
"traj-f486a57e-e7b2-4a34-a6ed-6bfa836045be"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-211836",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-2f0f6640-8049-4de2-bbb9-71a76fd8be67",
"timestamp": "2026-04-14T15:29:35.959531+00:00",
"source_trajectory_ids": [
"traj-13fe5578-4d8a-4781-9338-1a612a1e5a06",
"traj-1ed5b4dc-8872-45f8-81a9-91b46545097b",
"traj-4e0d0d23-c5d7-4211-a6ef-31fb93bd62aa",
"traj-6728130e-69dd-4b4e-beb4-d7c0a898d962",
"traj-74c20720-f0c5-45dc-8ee1-b78a38d9b967",
"traj-c3d1a98e-86fc-491c-8ab1-acb7f890f2c9",
"traj-c7a69537-49c5-42b2-8e87-1a05699bbb15",
"traj-dddd03c8-8ec2-4571-8646-2c3dfd9eefe1",
"traj-df54d24d-cfbc-4475-8d79-c77f4c11407b",
"traj-f1e396ed-ac25-4bb1-bb8e-55fc4b405819"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-152935"
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-31835629-98b1-4a08-8a42-e80702dd3ff7",
"timestamp": "2026-04-14T22:08:19.690919+00:00",
"source_trajectory_ids": [
"traj-062ae1e2-aedc-46a1-a8e7-585f1bfd6968",
"traj-0aaadbdb-15cb-466b-9271-ecec84e0b21f",
"traj-87b00206-b80a-4572-a12b-d441e45f4374",
"traj-93bdfd26-c5b0-43d1-926d-303f3ea7d176",
"traj-95de8601-6f2b-4313-ad1f-dc248c4e6d78",
"traj-a72b7a28-3293-4d78-8a65-411a0ca6aefb",
"traj-af818f60-198b-4b46-9a36-5012b467d867",
"traj-bc6fedae-308b-491e-bbea-419817542e18",
"traj-dba716d0-5bdc-425e-8b6a-043f16e1d9b1",
"traj-e573c252-18ea-4f15-8630-568320f4d3c3"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-220819",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-319b9b10-5c39-46eb-a905-638876b20b78",
"timestamp": "2026-04-14T20:56:11.631566+00:00",
"source_trajectory_ids": [
"traj-046f3b45-5b6d-4883-801a-4b674ac9a0f6",
"traj-1fc6191a-e9e5-4b9c-9294-ab68a7992506",
"traj-4370c224-46cc-44bf-aa52-c1ae9b9884be",
"traj-520f51ad-e1ea-42c9-b402-edb618a95020",
"traj-579262b0-c64c-41fa-802f-b3800e44d890",
"traj-5e8a36bb-1586-4843-9c4b-8e981c02342a",
"traj-b1cf2655-7694-4656-94f1-0cd6a2f4e195",
"traj-b92d6fd6-6421-42e3-9a1e-d0d5ea7a3ce5",
"traj-cb26f2fe-8169-4616-b124-47594ea88495",
"traj-fd456c78-f35a-47e3-9491-d462f28ea5dd"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-31c3b5b5-84dc-4a81-91c6-d663f0856347",
"timestamp": "2026-04-14T20:57:03.309395+00:00",
"source_trajectory_ids": [
"traj-0f36d4fa-6aa7-4647-8434-939727c2c38b",
"traj-2abf9d11-6e8f-41c7-9554-ff424498b905",
"traj-43b8c849-cff6-4a05-b166-19252a8b4758",
"traj-78074052-0bf6-466c-bdfe-6cffd970494c",
"traj-7bda4651-8a18-49f1-957e-9163f264035b",
"traj-8c8c5944-1d6f-44e1-a6e8-119d8fd904d7",
"traj-91f84675-8772-44f6-8916-61f9277a9af7",
"traj-cf026710-8f03-45da-8327-9f5e5a671c24",
"traj-e11c2598-a12f-43cf-b547-98a44c373c30",
"traj-fa2448c9-d2da-43d2-802b-bb2585e5c8d4"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-205703",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-32ee1906-6846-46b2-99b6-0df8aa632f18",
"timestamp": "2026-04-14T21:42:45.766701+00:00",
"source_trajectory_ids": [
"traj-1e14ac8f-dac5-4cab-a3c6-5b4fa97fb779",
"traj-58dec6f6-4712-4747-b189-9428512d8069",
"traj-59664fbf-ce9a-4b4f-a039-2625767e85ae",
"traj-ae3d3da7-773c-48f7-8c7d-35c9f3d6cccf",
"traj-c399734a-4bbc-49f0-ae6f-c8fa23f6a482",
"traj-c3dff94e-43fd-4d04-820c-47c9b7f01dfb",
"traj-ca22da3d-09d6-493a-b338-444343e0b252",
"traj-eacacd75-cd33-40e3-874b-8032ddd42175",
"traj-f61b2282-3674-4a29-867b-0dbf664bd116",
"traj-ffd6b64c-3b24-4b83-b72b-01b083f6e4b8"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-214245",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-33a0b960-112f-4976-a8db-1b15177f7e8e",
"timestamp": "2026-04-14T20:32:37.730415+00:00",
"source_trajectory_ids": [
"traj-23a871e5-2833-48ee-b3c1-5ed94138fcaa",
"traj-3cd1b98f-d6c3-4452-bfbf-71a3cf56415c",
"traj-4e67d82a-e669-4074-8dd9-450c8dd5102a",
"traj-58dd91bb-8f28-45f6-ab96-c61aca61c671",
"traj-627cad0d-6b5d-4631-b0fa-ffd16e1435c9",
"traj-867989fb-734f-441c-8f54-7177f83bb7b9",
"traj-bdc6723e-392d-4fe3-94fb-950af73ecfbe",
"traj-d2a41298-1da9-4fc5-8ba1-4ff15425c2f4",
"traj-d7d6e4c5-b66f-4456-8105-fcdedf467877",
"traj-fcd41273-8d85-4d4d-a0aa-5313347fe699"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,44 @@
{
"report_id": "report-33cb91ff-6fc2-4cff-9e7c-7c80d67e9beb",
"timestamp": "2026-04-14T18:31:07.979291+00:00",
"source_trajectory_ids": [
"traj-1724a751-6423-4fff-b9c6-ef92845b7297",
"traj-1f6f99c3-21de-4a14-840e-180021048a34",
"traj-2733b029-d10a-4902-922a-644d329a17c1",
"traj-294aadaf-5f60-409d-80f4-c640d8d82abd",
"traj-3282276b-ea3a-40d8-babb-62fcad0fa27d",
"traj-45b4d7c4-367f-4cbc-825f-a112137275ef",
"traj-5035c348-520b-468b-8e12-5de07b0ca885",
"traj-c86af3f9-c441-4267-bd37-b8a0a2d182da",
"traj-ccbb4aaf-7cff-4711-b987-c4e61ec1a4a8",
"traj-cd5f83d9-4ef4-42e4-af07-7c3345c26fe8"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-349d27df-93ce-49a1-ad9d-9c2ecdb5f9c1",
"timestamp": "2026-04-14T20:03:02.621111+00:00",
"source_trajectory_ids": [
"traj-40ac86e5-85ee-4468-92ca-7be25e3e7442",
"traj-4c1bed8a-7db6-46f3-9ae9-1844cbbba837",
"traj-4f8e5d10-ce5d-4249-83d0-63e528af3bcd",
"traj-519e05a4-eec3-44ae-b07e-0c78565e6065",
"traj-5d84864a-c5e9-4674-a0ec-47ccedf609a9",
"traj-8fb37e36-f171-4285-8a37-905f6f7a34d5",
"traj-a0ab9293-99af-4b7b-894c-f0d6dec9fd40",
"traj-beead0f0-adcb-496a-8b73-ffe1bef4ee42",
"traj-d909fed4-7e99-46e0-a770-7d9e629cff7c",
"traj-e2d3db6a-5db2-41e8-8ecc-909f5d433324"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-36954641-b7fb-4fdd-895c-590d3ec6e0b8",
"timestamp": "2026-04-14T16:53:59.545841+00:00",
"source_trajectory_ids": [
"traj-6ba2785a-40a7-4248-9959-81d676a53741",
"traj-6cc684a4-a0f5-4068-bb18-70049e38ad2f",
"traj-750702b7-0344-4ef3-bdb6-8f62486d8788",
"traj-978cf9b1-4066-4c0b-8612-f7432a602153",
"traj-a85c7d2a-aab9-4508-bee1-4da6e793166f",
"traj-ab6fd543-950f-4b00-8a2c-6fbe49ca70d0",
"traj-b40f890b-49cc-4c2e-b16b-35cf68e30ee1",
"traj-de829d20-8677-46d6-a1c5-bd9501eab3ce",
"traj-eb695119-3ef5-4bc3-8c01-1855bab0cd0b",
"traj-f13331d8-e087-4d5a-88a6-bc9f754791a0"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-165359"
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-36b3533a-655c-4a02-b65e-850d90a1c320",
"timestamp": "2026-04-14T20:56:11.681988+00:00",
"source_trajectory_ids": [
"traj-22545cf9-c2c8-4ef9-abcd-271a216d7b39",
"traj-487aba11-f414-4f54-ab08-635e4436ce00",
"traj-652cb0d0-0132-44b7-b88b-15cc073fa6b6",
"traj-6e8fb3a1-d05c-4f21-acac-751c59695c26",
"traj-726e0d27-aadc-487a-a2c2-2245705d78bb",
"traj-996ecef9-5116-4cc9-aca0-ed85c27666bb",
"traj-a93a36a4-0c2b-441d-8b9a-8aeb61685092",
"traj-d1beb072-dee1-4ed3-bbfb-3c9462a713ca",
"traj-d58e0089-340c-4910-8c06-bfba7862d075",
"traj-fd45b279-677a-4653-bebf-784271ce95a1"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-205611",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-37a28243-ed47-4bc7-b260-9bb38b5c0f99",
"timestamp": "2026-04-14T18:27:21.104548+00:00",
"source_trajectory_ids": [
"traj-21a6856f-bdd7-4851-b9e0-219458e43cdb",
"traj-31dffa4d-dd6e-4d32-831d-41e83119f7fc",
"traj-372f8001-3343-4e51-b415-ad3231658ffe",
"traj-37658dc1-0bd6-4245-88f2-5a12b901d82f",
"traj-62dfe993-4c43-4122-9dde-39cfe6ea5fc1",
"traj-6cdaf4fa-5553-46c4-b550-3a01fd2b6371",
"traj-cafc62d9-5964-4a94-ac55-26e194aed032",
"traj-cc0843b4-d2fd-4a69-8b82-b55ad4dc8c79",
"traj-e5a7d153-7a31-4618-b117-ec13d8c192db",
"traj-f2aeb199-2ef4-4d29-a523-740d1d10aeb7"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-182721"
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-38b4ed01-cbaa-4ec2-9b31-af634d9786b1",
"timestamp": "2026-04-14T15:04:26.185363+00:00",
"source_trajectory_ids": [
"traj-5e3f3a25-8ba2-4047-9cc5-ec1072ef1eec",
"traj-68138afe-056b-4e15-b67a-cbcaf8c17ff5",
"traj-6c8c007c-7781-4b15-a369-572a00f40457",
"traj-76fbd22e-1f59-4855-afe9-ebf90f8d59e6",
"traj-7b21dec9-e7b7-4f68-a5a0-c50221ee37aa",
"traj-a967b477-d265-414f-a33e-2582a8f0e086",
"traj-b0d09d4f-d041-41ce-94aa-1b7221e182ca",
"traj-bb05f70d-64f5-49ad-bbb2-9a63bf255d5b",
"traj-e4bd70d9-0680-4385-9397-dfb3299f9be0",
"traj-f4fed21e-bf33-479b-a05e-379b6997ca42"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-150426"
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-3c6cc2dd-862a-480a-913d-5554b4058d11",
"timestamp": "2026-04-14T18:01:06.225115+00:00",
"source_trajectory_ids": [
"traj-0f44d7ff-d89a-4c71-8c9a-1302bf13c23b",
"traj-34cf1d79-5fff-4bf2-a4a0-cfb8336821a4",
"traj-43bc3505-9d70-4a13-9212-da1cfe4e09d1",
"traj-566c33fe-5f4e-4697-9166-0420d63623fb",
"traj-56ac21d8-1dcf-4525-95ea-93d3ca52647e",
"traj-787abb45-cb75-40b7-b734-71d7cf60a180",
"traj-a3da8105-84a6-459d-a28f-6892b09afcdc",
"traj-d4cbefc9-9112-490a-a27c-f07f6e3d9662",
"traj-dfda911e-a036-443f-a5dd-28c8f1d84bca",
"traj-f75507d0-c01d-44d5-aaf3-9ff5f7f6c682"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-3d4ecf12-c252-493e-8ba5-2bfe51399190",
"timestamp": "2026-04-14T16:52:07.890026+00:00",
"source_trajectory_ids": [
"traj-2d72ff63-f4d4-43e4-b7d6-a159d321ef0e",
"traj-2ebae5a7-9c72-4178-b019-3380e17dea1d",
"traj-7123a23c-15ce-400a-9aff-1e4e2251695f",
"traj-7a9be049-d77e-4bf8-9776-045cad6a88b0",
"traj-a0786cfa-9353-4740-a8f1-473809ca7cd5",
"traj-a1a1766b-f5c3-4070-ad40-590985c65ff7",
"traj-ab013496-4365-4881-b625-e466728a83e3",
"traj-d8dc62b0-35bb-4e47-b50e-44f98de2eaf4",
"traj-e0529bff-6c1c-4afd-9ff3-195690e941dc",
"traj-eb197e1a-479a-4bea-8fdc-f48d2a053b7c"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-165207"
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-3e0d3ae0-e20c-40bc-981c-3f582cfbb7b2",
"timestamp": "2026-04-14T18:06:25.522532+00:00",
"source_trajectory_ids": [
"traj-13bc1070-0b04-4664-b4e9-13400d3a9362",
"traj-4151835b-6ce4-46d5-9fdc-ee914931954a",
"traj-5a342582-6740-452b-a17c-36cb459966e8",
"traj-946fe752-e504-4791-aa5f-cb0af58f66f9",
"traj-99c0c477-db3e-4c2c-b95c-40c3489923d8",
"traj-afed1dbc-f4b5-4826-8124-a448a1ec0b86",
"traj-b0e8b9fe-261b-4673-9a17-8e3f4f64ae2e",
"traj-b2579e6a-2ee4-4572-affd-33537db667df",
"traj-cf639c55-a6a6-48e3-941d-9bc0b9bb1b88",
"traj-e3a07906-0351-4b52-a1a0-f5e1391c93e3"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-401afaba-f468-45bf-8442-2bf14c8316a2",
"timestamp": "2026-04-15T01:25:33.810966+00:00",
"source_trajectory_ids": [
"traj-13292acc-308a-43f7-9716-87c8b938eb0f",
"traj-223e79f2-f626-4ae1-a0ad-2a6d053af25c",
"traj-519063dd-7bf3-461a-875b-bb7a4ecc2893",
"traj-66938ede-2373-46f8-a459-b5f291f3bc2b",
"traj-868a893d-8fba-45ba-875d-6a6e1f2dce8e",
"traj-916f484c-13a0-415b-aefa-832c07dfcf03",
"traj-9e1cead1-15bb-4098-bf5c-8b9b810988d9",
"traj-b3dc9704-72c5-4b75-a238-ab66b22dd766",
"traj-c6ec0501-d96d-4ad8-bf88-072640e22e4d",
"traj-cee07144-c2df-407d-9c43-29a76de1a48a"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-012533",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-4105b4e5-179f-431f-9f11-b110077fb2bc",
"timestamp": "2026-04-14T21:18:36.114147+00:00",
"source_trajectory_ids": [
"traj-2fce941b-cf65-4efc-a9bc-c83672376d6e",
"traj-62d39291-7f83-4655-a5d0-c992d9ecdf04",
"traj-69975215-b8ff-4faa-b5f2-88ad26805b28",
"traj-81882b7c-ba4c-4ffc-89f4-7803c3aeee01",
"traj-8816a644-f2ef-44c1-8185-ea2cb83afb06",
"traj-9480f7c2-8853-4971-b36f-19c9f1592285",
"traj-956fdf6d-ef5a-4a7b-b32f-029f38e72533",
"traj-a1e6c947-e6e2-4f90-9a6e-22d99a656a2b",
"traj-b2d31d5b-12b7-4694-a26f-e91e1e3be8a7",
"traj-d03bb05c-acd4-452d-af83-77571b30009a"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-211836",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-4109400b-cfbb-4d5a-a26a-e0f4fc054541",
"timestamp": "2026-04-14T15:50:36.233055+00:00",
"source_trajectory_ids": [
"traj-096259f5-d76c-4c42-b42e-fa16c5d2935e",
"traj-19070f8a-b395-4564-a3f0-4cb00e20ea3c",
"traj-226fd70d-da48-4f47-9f63-b6df7efc0175",
"traj-2614cf9a-bebc-44ca-99f6-508a266e2f42",
"traj-4a954778-c76c-4c98-9923-9f97365efc12",
"traj-5b0281de-bb94-4864-85a9-3a6b10d38121",
"traj-5bd45032-16b1-438f-b3a4-ba400ac52884",
"traj-82903c13-0579-4ff4-9d16-631ae7174d9e",
"traj-9ba2db0d-281d-44dc-a50e-09df89bee6f9",
"traj-a6c6d8c3-8073-457e-b55c-48b78eead9ba"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-155036"
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-413d07cb-cf68-42a8-87fd-19fef8e752d1",
"timestamp": "2026-04-14T22:05:59.221755+00:00",
"source_trajectory_ids": [
"traj-00f15b5e-a641-42bd-b3d0-58fe2d9ab635",
"traj-0fc4a255-480c-49a2-b281-420b14c89d71",
"traj-1e601826-f496-492b-9001-033c1f4bf38f",
"traj-2055c676-3aa8-47c9-838b-a464e2599090",
"traj-35633916-ceff-4ef2-b270-260ef43f068e",
"traj-37f59692-f0db-42c7-9fb8-12a24fe65336",
"traj-5f43857c-36d8-464f-97e4-17d3532babfb",
"traj-7dc6d914-fc99-4995-a701-4c544444e421",
"traj-99143129-4966-49d8-8c79-0bae868f22e6",
"traj-f28f6c36-e9f9-4745-98a3-082eccb8e7a2"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-220559",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-41510fac-07d4-48d7-b0d3-435308de8a9b",
"timestamp": "2026-04-14T22:09:39.015784+00:00",
"source_trajectory_ids": [
"traj-0679d7fb-16f2-4815-b422-28bfad02aa05",
"traj-4cacef32-7bd5-478d-9811-3cf929fdf4cb",
"traj-72eec91d-72f8-49ad-b56f-d40b65f4cd76",
"traj-7784f333-f35b-4cc6-9258-71cb52ed5d62",
"traj-ad9737bf-684f-42df-927b-a8c239a9e63e",
"traj-d1536852-2f04-44a2-b18a-6b25acacff35",
"traj-ef00ca26-5cfc-4a06-9dcd-e6f678c85c8f",
"traj-f33cfd42-2102-4873-a3f0-5a2be2be4d69",
"traj-f74fe8d9-81b7-4d72-8514-e5bce6b23716",
"traj-f772c53c-6d53-4fa3-9147-b6642fa4a1e8"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-220939",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-43d4c045-9a5c-40d5-8b1d-1d7c6f77adb6",
"timestamp": "2026-04-14T18:57:10.528189+00:00",
"source_trajectory_ids": [
"traj-1c8080c5-67cb-43d0-80ac-b5e2ec996a3f",
"traj-3f7ac604-e2ed-445e-a8d4-dbd94524609b",
"traj-46540622-c2d7-4783-a309-3833fa1a3f70",
"traj-4e5d9253-feaa-4641-bb84-680f81e38c57",
"traj-7bca135b-7fe2-444a-b112-10570666956d",
"traj-9aec1caa-9415-45a9-ad1d-e5dddda3985b",
"traj-badf1655-c1c5-45ca-b7d5-3f3ab5593848",
"traj-bc375f1b-d8ad-459c-9f08-880f95e1b8d9",
"traj-da9c3b03-5ff3-4f35-bbe1-be521909b86e",
"traj-ec6156e1-6013-45a6-8e3b-66af0214feb7"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-185710",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-43d6e714-88cc-4a65-a101-0d295c3dd389",
"timestamp": "2026-04-14T20:58:05.550865+00:00",
"source_trajectory_ids": [
"traj-4605e012-4600-41ea-87ef-de75d36cb859",
"traj-59306aa1-bcd1-42d8-9bfd-bd8f8d26120a",
"traj-73d23896-0973-442f-87f8-0a80e64d51cb",
"traj-85d6d2cd-b787-42d1-9ed4-623353e3c13f",
"traj-afd7b74c-dd4d-4407-9223-73b0d6fdb58c",
"traj-d2c33fae-90f5-42ae-a928-75cc1f2f4475",
"traj-deb4aa39-0602-4dd7-b06c-57f7fdda2053",
"traj-ee7a8746-7cb2-416b-9f11-afefd425ed0a",
"traj-f369cb32-35a0-4ea2-92a1-f5980c79fd06",
"traj-f5d33f02-0607-4730-894e-4b06be60d7d8"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-205805",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-43e5bf98-8055-4b9f-8640-f2414224d4bf",
"timestamp": "2026-04-14T22:05:44.115652+00:00",
"source_trajectory_ids": [
"traj-04405ec0-7ca9-4465-9518-7dab5d020c30",
"traj-0c0ddc68-0063-41c0-ab91-8e966b62f705",
"traj-0f652d30-d7e1-47fa-b124-cd288a12a14c",
"traj-1ce33c0d-597a-49e6-93dc-88f069e4c302",
"traj-24e41e0a-09f1-4d0c-8899-d4bb69ac9ddf",
"traj-7ab55256-fcd2-453f-abbf-4790df4f6ca8",
"traj-82348fa8-183a-4a40-a366-b6ac6a87309a",
"traj-b2eeb3af-3de0-44a4-b183-060b3a6d81d7",
"traj-dcf0d891-e3b8-49e5-ac91-569f3ceb3a90",
"traj-eabcb8e0-3bc8-47f5-a8dc-4221362a102f"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-220544",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-45467fbb-5fdb-45fe-b4a5-293b6560c08c",
"timestamp": "2026-04-15T01:33:34.775057+00:00",
"source_trajectory_ids": [
"traj-0bd98b63-fe62-407b-a82a-22240f040427",
"traj-0d032b19-011f-48c7-9bee-508b57b44d26",
"traj-15f2455d-56db-46e2-bd41-6418ba23a463",
"traj-4781ddd9-6ee8-43a1-9047-40503b2e5fae",
"traj-9e942dcc-7508-4779-91e2-a03c1b82c597",
"traj-b09495ff-1be2-4c94-bde8-dd0ea7cfbcad",
"traj-cda9f732-c8a1-4d7f-81bc-21318c922894",
"traj-e2626858-fc8f-476a-913f-fa9b1944c6a4",
"traj-ea4fed23-c0b9-4f76-9489-967dd42ed5ec",
"traj-fd5d13e3-ee3b-468b-99ea-8e85c7e0393b"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-013334",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-45f61edc-3f4c-4c6c-822f-d4e97628aa77",
"timestamp": "2026-04-14T22:08:19.673227+00:00",
"source_trajectory_ids": [
"traj-02f093fc-763e-4d3e-bafc-bb8aeaea75f1",
"traj-0a2744e8-e06b-4ecd-b0df-fa0a1c886b23",
"traj-28d82cd2-2f61-4a7d-903c-76c29caa93a2",
"traj-36f2201d-9728-480b-8c84-b40a7062e4e6",
"traj-7bba52c5-33d5-40e6-83a8-0444853df15d",
"traj-8a29f02e-99b7-4169-bff5-061f9aaa82a3",
"traj-8f82347d-7a20-4f92-9491-6ea282ed4c9e",
"traj-d76fd602-b881-4484-afd1-ef3c2f26f839",
"traj-f000568b-7ac3-4a67-a8ce-63d1d9beb690",
"traj-ffa74e58-35c4-42dd-a83d-e454392c2914"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-220819",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-461a5c98-57e6-40c8-b2ce-5a70f64072d2",
"timestamp": "2026-04-15T01:41:52.334143+00:00",
"source_trajectory_ids": [
"traj-3493a4b4-50a6-4a28-8a28-b6811f7dd289",
"traj-363519ec-b624-4a15-857c-7dd124594ef9",
"traj-68a740ca-fdb0-4fe4-9a32-a05ea194f9eb",
"traj-73adf39a-8d2a-465b-815b-d6b59ce127f9",
"traj-7a2de94c-df1d-4b74-83c9-1170b533d845",
"traj-7dd9573a-f665-43a7-b819-cb5ed45dc137",
"traj-afaf90c3-3df5-4f20-ad12-ed790fe8d8aa",
"traj-b1e72746-d5a7-44b8-b666-aa8c48168305",
"traj-e1bc8e6c-e77a-4cb1-8175-8099e93b48de",
"traj-f98d3663-69cd-46b4-ae0a-c20bc80e86f2"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-014152",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-48ee7d3f-d744-43de-93ad-88b94206d59a",
"timestamp": "2026-04-15T02:33:47.729485+00:00",
"source_trajectory_ids": [
"traj-03f64fa4-12e6-43d3-bdd4-850386d7941f",
"traj-231b0863-7611-4fb2-9638-476e7663da5d",
"traj-552c1c6d-4bde-446e-bbf8-c762fed02e81",
"traj-55c1df2f-4e21-463f-8be8-d412eb14da62",
"traj-686ff2d2-9a3c-43e3-8b40-f96962f5647a",
"traj-6e82a8d9-15a2-4891-97c8-ecb3ec3f7192",
"traj-91c9e740-03c7-41b0-883d-b5eeef1a3cc0",
"traj-9d012535-4e80-4aed-b515-97c6a01f4d53",
"traj-ad68a77b-9601-42f2-9c42-0ca21bb7c73f",
"traj-b428fffd-fd29-488a-9d12-95db39eac38e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-023347",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,44 @@
{
"report_id": "report-4a5187ed-5a28-4ee0-8b40-2e821323693d",
"timestamp": "2026-04-14T18:51:33.158431+00:00",
"source_trajectory_ids": [
"traj-137b6353-1315-4d48-9b83-ad28569d0c96",
"traj-5bd3ab53-8268-4fe0-94a3-490a58200f6f",
"traj-60d28c42-0680-46f8-8de2-f61ec935db8f",
"traj-7886fd07-f658-4bc2-8e44-232a6aad7480",
"traj-868a1eeb-dfad-449d-a725-227ea2c01931",
"traj-950f2bf9-4a9a-4498-a7fc-79abfbc47937",
"traj-a411bae6-de2f-4f81-bc94-6e7075c24b4b",
"traj-a46a7e48-9852-4132-bc5b-44c0dcd5744b",
"traj-eb000b22-fc6f-4a47-9287-7b960627725b",
"traj-f45c3555-2524-44df-9644-979f68d3ed71"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-4b6ecd0d-81b5-4e2c-b52a-d9907a011b20",
"timestamp": "2026-04-14T18:58:16.264614+00:00",
"source_trajectory_ids": [
"traj-59f457a5-cb29-40d8-bc7d-8730e06986df",
"traj-7102877e-30e6-448b-bb99-9b0ac908a73e",
"traj-79299b5a-8e49-4ccb-8881-948903c39580",
"traj-968451f5-70ec-4d23-b040-9e638a324b78",
"traj-c28c9b70-91b0-412e-af2d-f4bd5551cee4",
"traj-c2e9306c-f40a-45e9-8954-3fc538faaf6d",
"traj-d09a7893-3785-4c50-8a70-69f3bc43173b",
"traj-d205135d-bff0-4f1b-8626-912fee42f566",
"traj-e2741ebc-dc3f-490d-9a8a-aba7d6ac5f0d",
"traj-e408ab2c-8fdb-4a61-a71d-30f9abb9ff3d"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-185816",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-4d50ee54-0bfa-4e34-926b-45900bfd3f8d",
"timestamp": "2026-04-14T20:58:05.422298+00:00",
"source_trajectory_ids": [
"traj-067e1a4c-17cd-4374-b0c6-bab2ee05aeab",
"traj-241638b5-a874-45da-9be1-cd0541337e08",
"traj-38541187-375c-438a-be39-837e2330e11a",
"traj-5be14b5b-4c9c-459f-afc9-22a5935a2cc8",
"traj-6c2e9b3a-0327-43ca-81e5-56db7ae936b7",
"traj-7025a020-2103-4fe2-baa5-a0da4c7b9cbb",
"traj-79299683-0b2d-4e4e-a124-1fa48c59ef36",
"traj-96c030f3-e898-42c0-9911-338093d1dc60",
"traj-a573418c-2c39-41cf-9440-477dea42c020",
"traj-b1f69fcc-66d9-4f33-8b73-312398f8217e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-205805",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-4dc7057d-d4f5-4250-b949-bc20d6f7521a",
"timestamp": "2026-04-15T02:33:47.693933+00:00",
"source_trajectory_ids": [
"traj-0087d4b2-4bf7-4f26-aa54-1cb943e94dd0",
"traj-21bb050c-500e-41e1-87b9-d43e9488d12c",
"traj-282b3e0e-3c53-4580-bdcb-b25d66b9f3dd",
"traj-42d8a589-60b0-4001-8165-25c36e4e6d09",
"traj-508a9891-7a54-4b4c-8dd7-943e5539100e",
"traj-510f9b87-c96a-4b30-897a-96b86c6d15c4",
"traj-6df384c0-0ce4-4049-8983-87ce2880ac89",
"traj-7b69d26f-cbd3-4b5e-ac40-44133fe58a39",
"traj-cf692ef7-f7ff-467f-85a4-dff08182e3e8",
"traj-f44fae13-f32f-41da-a739-cec74835bd37"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-023347",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-4e7caa32-18a9-456f-a773-1c67fe43ce31",
"timestamp": "2026-04-14T20:32:37.607581+00:00",
"source_trajectory_ids": [
"traj-20efc089-2454-4f47-aad0-a67f25a73279",
"traj-31875fd0-e57c-42f6-b659-3140e3f06f5b",
"traj-440f0075-1325-461f-b67c-e68605eea57e",
"traj-462b7514-5775-4ee2-a228-8923fc083277",
"traj-5eaada3f-e728-41be-a722-eaacc2343b27",
"traj-60259dde-b711-40e5-b639-b935ef71307f",
"traj-951afa2a-5840-4fc2-a770-8e5624551899",
"traj-ae15a5aa-85e9-4879-b3f5-ce1fc5882cd1",
"traj-d76ddb92-8283-4600-9081-ca6a81af9cd4",
"traj-fb2ecbaa-cbfc-4c35-8c7e-08290bb2763f"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-203237",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-4ecb8a73-0bf3-4c31-ba10-1be9db3146f9",
"timestamp": "2026-04-14T20:31:11.222850+00:00",
"source_trajectory_ids": [
"traj-0681f8e7-a761-4503-99eb-1e4bc006ec12",
"traj-0ce9f156-20c5-49a3-8b0a-1fc9e028996c",
"traj-13c2f422-b99b-4c93-b92b-35180e88519e",
"traj-2dfba0de-8e4b-4e07-b6b3-0752f278c8e9",
"traj-5c09b804-4076-41bf-ae6f-17fbc024ee42",
"traj-77c07fd7-4479-494b-bdff-0a353664e330",
"traj-a26447e5-654d-4ecd-9af9-270d8ef26e6b",
"traj-bd4660e9-a9a8-4aad-8215-cfc5708b4e04",
"traj-c059fabf-2e18-481d-a645-3718b74b9963",
"traj-dbf9d2d7-1476-4b77-8f64-9b9e0c16535f"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-203111",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-5012fdef-1b08-4522-a946-072c23b71714",
"timestamp": "2026-04-14T18:00:27.756619+00:00",
"source_trajectory_ids": [
"traj-13febbec-cc01-4c68-8895-953e3a458337",
"traj-19937555-e13c-4714-9414-1c3332af7ac8",
"traj-28634bdc-f068-476a-a40a-8318e8786aa9",
"traj-43926528-d16f-41e7-b0d5-ef6e49c1bc05",
"traj-896a8b18-30c4-4d70-98e0-e283f8fc5517",
"traj-91eb1710-444e-4c6d-90e1-aae28c98f4cf",
"traj-96e9bf84-ff75-4b6e-aa70-c328fc951b36",
"traj-a626ce77-02ac-4915-9889-4c2364adeeef",
"traj-b40efd95-f438-4215-ad9a-e46af8638c07",
"traj-fcff5db2-b6bc-46dc-b07d-d0029f88706e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-180027"
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-508eb935-fe06-4e84-92b6-a1fe22bc6159",
"timestamp": "2026-04-14T20:58:05.539426+00:00",
"source_trajectory_ids": [
"traj-0253e6ba-f504-4379-ae3d-83016e88c09d",
"traj-2144ea5b-3969-4e06-a893-330db7c757bc",
"traj-22880d82-81b8-4803-a7d8-72f7acb5712e",
"traj-4595b5b9-6e23-42f5-8a61-5fde96159580",
"traj-9c89d043-5997-4480-9de6-9262bdc02a31",
"traj-ad14e644-0b4f-4ef7-a62f-79bdea3c6222",
"traj-cf28e6e2-68f8-4351-9f0f-eb6e9cdc3cd7",
"traj-d1b53585-ba7d-4492-8164-95dd51f0fbf8",
"traj-de3972a7-1bed-44e6-adee-e4b2c7c56456",
"traj-f8bc3f68-896b-4b6f-b0f3-0a6381f70ac2"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-50e8ccdd-d716-40cf-b02c-5c349565a955",
"timestamp": "2026-04-14T20:02:20.807645+00:00",
"source_trajectory_ids": [
"traj-1304d305-b55f-4849-a6d0-df7f3e0c1fb9",
"traj-3156c560-d459-42b3-a70d-df0a6e9af578",
"traj-3cb2d518-f74a-45bc-b232-a216d3f28abc",
"traj-61a1791a-5a2c-4c7d-a4fc-e4b82952c51c",
"traj-621b385d-d516-4506-8e27-5468be804754",
"traj-abc09bf9-adce-4fcd-8c1a-a151bc749971",
"traj-b08d47a2-57d9-417f-a0fd-87661137c0e4",
"traj-b2b54604-eece-4f93-96b7-df5cbe2f11b8",
"traj-e31d9867-6180-4867-9946-c32e219ed44e",
"traj-ee895acf-27e2-4efb-868b-793b5b0f5f59"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-200220",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-51b272a3-aa2a-42a9-b406-2af6bb6c13d5",
"timestamp": "2026-04-15T01:33:34.743842+00:00",
"source_trajectory_ids": [
"traj-019b1e3d-a4d5-414c-98f2-14566d4e1a73",
"traj-638e4b82-6bb8-4f95-9112-39f1d153140f",
"traj-7c90795a-8999-4733-9e20-aed2c20d11ce",
"traj-890c85dd-37ab-4949-b72a-6dbd86b22610",
"traj-8ef247e7-fc36-47b4-9c35-7791149a4bc6",
"traj-ca8173f4-ba99-4421-a150-3c04e00c1504",
"traj-e0823914-aeec-402a-b02c-27ddf95ab381",
"traj-f7357e60-cc1d-4ca7-a7b6-b00f30d5263a",
"traj-f8c00ccd-24d1-4f0a-a4d4-808d17529466",
"traj-f9e58e88-b618-4dc2-9723-09b4cf5db05b"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-013334",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-547cf777-50f1-4848-b5c6-e79110f6b4fa",
"timestamp": "2026-04-14T21:18:36.371846+00:00",
"source_trajectory_ids": [
"traj-008e3a6c-d014-441e-a368-3a298a94b570",
"traj-11992679-5342-4506-8f5e-88df8f2e5b37",
"traj-1bd76b8d-7968-4870-adbc-7d6f4d968d4d",
"traj-3c86846f-d086-4198-984b-b34a3d9dc32f",
"traj-559b9c31-c008-4957-8774-539f3225d67b",
"traj-680bba7c-58b7-4b87-be69-3aaeeceb8de6",
"traj-99e17c4d-a8bf-4c3a-8b1e-4e16c640c8aa",
"traj-cd676023-60fa-49d1-bc8d-8b58a8152df0",
"traj-dd628bf0-b6e0-4312-a006-9fcb36cdacd3",
"traj-e10d1f31-6253-4508-a4e9-984894d56caf"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-54f51896-f163-490b-a35f-5f7921b9fcae",
"timestamp": "2026-04-14T15:52:51.142603+00:00",
"source_trajectory_ids": [
"traj-2263147a-44b3-4e96-94d2-dea2dc31cc58",
"traj-2e08b4bd-1a4d-4ae2-a8cf-355f3812ac0b",
"traj-39cf7b85-237a-4676-8d6a-716ba807446a",
"traj-4f9ac486-f0ae-49d4-b79e-e5c9370c3def",
"traj-6fbd4429-9ab3-4077-b8d0-5ff6a64965ba",
"traj-9ad2532a-4a42-4b8f-90bd-0f1d03fc7d34",
"traj-ba2fa5f5-95e5-48c8-96c0-b8f00d6a7d36",
"traj-c77a8e7a-d1fe-4881-9288-3bb4707e42d0",
"traj-dabcee54-f3d9-412d-b392-32badcbce80c",
"traj-db70effe-7b6c-491f-93c9-4892e67507c7"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-155251"
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-58eb6ade-acce-4120-87bc-17252a66f5c1",
"timestamp": "2026-04-14T22:05:44.095159+00:00",
"source_trajectory_ids": [
"traj-04176304-8400-459c-8345-1804b8a1857b",
"traj-2ee8e3e5-1274-456d-b60a-4455e6f1d688",
"traj-3c740a85-d4bc-45e4-8aa0-6ad8de199cd5",
"traj-4a69b684-5185-4792-ba8c-82ecd5ea831c",
"traj-5af6d0c4-0d32-4c1b-8003-cbc3b16af816",
"traj-7a6aa489-6c95-4c72-a1da-63acc995c51e",
"traj-9876e667-7cc5-4f93-a3f9-53ba44b6b343",
"traj-bb97b314-3287-4d08-a5be-4cfe60a70959",
"traj-be45651c-16e4-46a8-80f6-b53319a18f4c",
"traj-e1b4102d-ce4a-448d-9060-1648dae074b6"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,42 @@
{
"report_id": "report-5996831f-a897-4eec-8f40-1786539febde",
"timestamp": "2026-04-14T18:30:24.385886+00:00",
"source_trajectory_ids": [
"traj-0b57378b-d41c-4cd5-9c8b-cbb6d0cb6c6e",
"traj-1b519f5c-8226-45d9-97a9-7057df5389bd",
"traj-5062f87c-5bf2-4b62-b72e-6964492f4517",
"traj-62dc0190-fa0c-48cd-bd64-7f7d8caaffcb",
"traj-9bb3feb1-c576-4e24-8127-6ca03d2a0c08",
"traj-ca8b06b6-af43-418a-bff1-fe3323e43a01",
"traj-e042d848-7805-42f2-ad1b-8500c6e93136",
"traj-e3de23bb-643d-4833-a5c2-fe98182292ce",
"traj-ea84f194-39a1-40bf-8a70-592f80ba40e0",
"traj-ec288161-f7b1-46df-b7c4-26aa79f5e5c5"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-183024",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-5bbea27a-8808-4142-a300-a5ea9d1b8abb",
"timestamp": "2026-04-14T20:07:38.784383+00:00",
"source_trajectory_ids": [
"traj-24636cff-0df9-464a-aadc-49e7d5bb4b19",
"traj-38b267f5-2839-41fb-8600-e3eff1ebc850",
"traj-49244af8-1ff7-4381-9bb7-68279aab96a3",
"traj-59765e1c-4ebc-42fd-af01-e36389ff3e39",
"traj-7c3f75af-6df0-485a-af83-714eb5595dbc",
"traj-97a16c7c-4b65-486f-920f-b488ee581a57",
"traj-b386fe62-333b-4cc1-be14-473188c861ed",
"traj-e07c427f-bdfb-43d8-953d-e3a7e91113c2",
"traj-e6458a19-1a8e-4d61-8444-57dfb89649f1",
"traj-eea30f77-6daf-4f21-9e90-8be64b29e654"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-200738",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-5bbfa4bf-2555-42d8-bc71-2dd94bf9a1aa",
"timestamp": "2026-04-15T01:57:32.884356+00:00",
"source_trajectory_ids": [
"traj-1d68febb-363d-405a-8456-10d070a0df6f",
"traj-5314e5cf-7c86-4ace-9c2c-34b169b9e455",
"traj-5f54288b-b434-4a88-be89-e4115b32c589",
"traj-67e64768-970a-4fde-8b7a-1e5c4821d0e9",
"traj-76a7c854-ff21-4f1e-9a45-f37d288b69bb",
"traj-788a70d9-4154-4526-af64-d3572ee9f3c5",
"traj-9472520c-14be-4841-b662-3506fc829022",
"traj-bfe0c5b0-1109-471d-b5e8-383f4a6f6219",
"traj-c314335d-9b65-4ccd-b6e0-37fff704101a",
"traj-cd70da62-bdba-4e86-ab7e-346b2f439fbb"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260415-015732",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-5c909aba-8438-4c52-9ac5-aa82c8552a5c",
"timestamp": "2026-04-14T21:21:15.173091+00:00",
"source_trajectory_ids": [
"traj-0ae4d970-1f54-4fca-acf9-49d9786ed602",
"traj-2be44f9a-80d1-4985-9976-a84cdc65ec77",
"traj-54917937-5e1d-4736-9fec-011478a063d3",
"traj-6c11024c-1199-4136-9cad-ebdb70a93b1d",
"traj-74c8f20b-b1fe-4880-8311-32bf22fb2d97",
"traj-921d7a96-8875-4c2f-a1be-e4d59c99b5a2",
"traj-96bfd297-d95c-4190-bac0-01c314cedd02",
"traj-9f46c7fe-20d4-48bc-a430-4dac0a33b36d",
"traj-a9f90b8e-b3e3-4c38-b379-5bae85c0017e",
"traj-f4214286-6b97-416a-98be-2af5379bc7a1"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-5ce6674e-f6e1-4622-aba2-79ed9fb07bc9",
"timestamp": "2026-04-15T01:21:53.799961+00:00",
"source_trajectory_ids": [
"traj-1222b185-244e-46f7-a60d-f7f024819f22",
"traj-1d47bcaa-3b89-47a0-9e11-bd5b0cada785",
"traj-250b5772-1194-44f7-9c27-1eab15bf6428",
"traj-56d2f9d5-9608-4392-886e-0e7693c2ae7b",
"traj-befbea50-2481-4558-96f3-a46a4bcae55f",
"traj-d834d9a9-bb52-418a-8ac9-7ef9aac0d506",
"traj-e551dfaf-20cc-4f16-bc94-693d8ba2355b",
"traj-e5763320-3dbd-4f49-80be-3a0126e26e09",
"traj-eabda2c0-ccee-4fe5-b023-e7dc80cae38a",
"traj-f37c8ecb-eef8-41a2-93cb-7860a8341ae0"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-5d3ab2d4-362f-48ea-8e43-98794a729853",
"timestamp": "2026-04-14T20:31:11.240432+00:00",
"source_trajectory_ids": [
"traj-052c2084-bf8f-45b3-a48b-eaa9b95f5cdc",
"traj-063c87a1-bde2-43e3-ace5-e7c29a9ad296",
"traj-08ac8afd-1f85-4f80-928a-c014756ad1ad",
"traj-254ee33c-82e6-4078-9431-5f421a88eac7",
"traj-3bb69895-8479-48dc-8685-971a00d2dd42",
"traj-5271851b-e3b0-4e5d-981b-2d20551680b1",
"traj-9909611d-1af8-4657-91d2-5bb784c28df7",
"traj-d7ec1de8-c98b-4489-9802-6118696a128d",
"traj-d8d708d8-2e49-49a9-a701-6c08ec33ce8c",
"traj-e3629c94-90cd-4ade-92b6-6b12d088150e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-203111",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,42 @@
{
"report_id": "report-5f3cc25f-f580-4610-8939-f275b48348aa",
"timestamp": "2026-04-14T18:51:33.102552+00:00",
"source_trajectory_ids": [
"traj-12af88a3-cd2a-47eb-9f64-cfb6e22e54ce",
"traj-567e562b-b673-4216-a97c-e0342f30a392",
"traj-68ba5f57-66c1-442a-876b-358a1c3ec8a7",
"traj-88df2859-a5f8-41a0-a6b2-b69c7b7534e6",
"traj-a9dd0423-655e-4de1-b438-f129b88eacec",
"traj-ba9449c4-6593-416c-bb47-3aa2e47c8ec7",
"traj-bf6a9a13-af26-4ff1-8ec5-b087bbfde8d1",
"traj-c3f4305f-ca99-44e7-a009-35a3e996acd2",
"traj-e45c104e-f29b-435d-8eb0-cf7c3da2fb2d",
"traj-f71ab09f-bd40-4637-a9ba-999c1e049c47"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-185133",
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-5f961f5f-f3de-463d-8586-b770aa2e951f",
"timestamp": "2026-04-15T02:31:17.458912+00:00",
"source_trajectory_ids": [
"traj-157f8c21-719f-4ba8-8243-f22d95e30091",
"traj-1daf4a22-f63c-4119-8f98-426a42756b47",
"traj-3abf53ed-a0db-4b62-a9ee-b24cb3e74359",
"traj-4d732a6b-1a09-4547-91b0-da7c3b72f9c0",
"traj-5efe2891-e10a-44f1-8882-fa9f35ef0ff5",
"traj-6ea2a8f6-86ce-406d-ad52-54de0aabfe6a",
"traj-7653da9a-96a4-4a34-938d-8251fcf02ea4",
"traj-8b17c700-e430-4c91-928f-25db8f0d73f2",
"traj-c4efa221-68bc-4d01-8bf8-eed2268f0c7e",
"traj-ff6a9712-5857-48ce-96f4-b744d655bd18"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-6579e004-98ff-4fd0-b710-2116b47bbe9e",
"timestamp": "2026-04-15T01:25:33.889628+00:00",
"source_trajectory_ids": [
"traj-1a1d2d0d-9f79-4edf-805b-d8b4bbd920f4",
"traj-28a1f4a0-7446-4c16-886a-99013507cf20",
"traj-3501ab39-8337-47f7-9ae7-7700c41d160f",
"traj-96eff406-cf30-49aa-9ee8-e278a1a1789c",
"traj-a63dbc77-e3e2-4db7-935e-22a088879ff7",
"traj-aefe0c29-8f97-46d5-8e33-23bc714c7151",
"traj-b10077c3-22ca-46ba-9a3d-70c3474f2449",
"traj-c7ee4596-ca05-40b3-8e24-c0b6f95fb0b8",
"traj-d0429a8b-3e38-4316-9f61-09b5847908e9",
"traj-d128fdeb-ec2a-44db-b1fd-f49f63c33536"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-657d2b18-44a2-42a7-821f-5697611b403f",
"timestamp": "2026-04-14T20:54:35.829616+00:00",
"source_trajectory_ids": [
"traj-29e7080a-f38d-4eff-8885-01625f706940",
"traj-4406b1af-13c0-4edb-937e-70a4ad05e9c4",
"traj-74fc5cb4-bcf2-4400-adb4-10f29ad17c13",
"traj-86c672fc-af0b-47c3-9e29-b0ebadab6c3c",
"traj-aef7759d-0c2e-44aa-af65-f40bd4a217ce",
"traj-d087f258-1c76-47e0-b532-7effcece43eb",
"traj-d8f2b0a7-2a9c-4354-b4f1-4fd3de378881",
"traj-e392e827-019b-4679-88aa-b0ca9b9e1a37",
"traj-eddec9a7-94c9-4787-8826-bbaf84c0be35",
"traj-effafeb3-8762-41b6-8594-c1267172b81a"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 1.032,
"error_rate": 0.0,
"avg_latency_ms": 42.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": -0.592,
"error_rate_delta": 0.0,
"latency_delta_ms": -42.0,
"baseline_avg_reward": 1.032,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-205435",
"baseline_version_id": "v-baseline",
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-66aa10dc-0527-4459-bb2e-b5f4da1272c1",
"timestamp": "2026-04-14T19:21:09.831626+00:00",
"source_trajectory_ids": [
"traj-0be01236-de1b-4a17-8d26-ada21cca007a",
"traj-13ae15bb-9bcf-46d7-a8f7-318880c697b2",
"traj-488630e3-898b-4668-9f93-8e3f388bb3c0",
"traj-4e3fc1d9-87f7-4acd-8d9e-8f8caa259c16",
"traj-594da9b5-d065-43c6-8581-e1c325917c5c",
"traj-5cd271b2-b721-4cb3-9d73-35f493d076e7",
"traj-61257688-a738-4164-aeae-6b8ca5b4ccfc",
"traj-7a425e1b-ad77-42eb-bc99-e83d37f0d13c",
"traj-94d587fa-4217-4d91-8119-15c33648ed5b",
"traj-e9bbac88-b876-432a-8208-b45250af8e42"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-192109",
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,41 @@
{
"report_id": "report-66beff81-2ce9-4bf5-9d18-6518f371347c",
"timestamp": "2026-04-14T16:54:50.517635+00:00",
"source_trajectory_ids": [
"traj-20e81f4f-5c98-4f41-b892-81be69efa36c",
"traj-21e3d99b-04f5-4402-9733-f8beaaf8c044",
"traj-54727683-a607-494e-9944-a51bc38d5d22",
"traj-62e7f1b3-ca1f-439e-90ba-081637093125",
"traj-9a7b407c-622b-4adf-9143-513bd58d480e",
"traj-a9ebbf52-9235-4227-8d40-f40cd19b5231",
"traj-b3b68970-229e-40e4-a98c-11a909ba9f7d",
"traj-b786daaf-4ee7-4d79-b09e-0aec9a2b16a3",
"traj-b9b0d092-8782-4f66-beef-4d0995a32fa0",
"traj-c153d7b1-4379-439d-b808-9378fe9f054e"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": true,
"reasons": [],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": "20260414-165450"
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-679f7a61-bd73-423f-81c8-9836584ce96f",
"timestamp": "2026-04-14T15:01:27.746539+00:00",
"source_trajectory_ids": [
"traj-008e354d-cf3f-4838-885d-887add59b833",
"traj-0408386b-4086-4e8b-aab0-34092888ab20",
"traj-41487090-aab2-4c39-bb32-3f08b34253c3",
"traj-49d76619-87bd-4968-ab72-fe2cc4fd687d",
"traj-4ba6da5f-0faa-4792-ab0d-6c44ec286fc3",
"traj-4f8edddf-0ee2-49ac-8d3a-292447189a95",
"traj-6155b78f-ccdd-4141-b0ce-d2d9f3553550",
"traj-6ac43687-13a2-4987-94cf-c7032bc6a8d2",
"traj-7b19cd3d-55e0-4da2-a517-96051a53e63c",
"traj-f2ad8bea-5289-443c-b99d-6e81a5b3f33a"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-68d38c2f-d8dc-4b33-8514-8fa9410b0961",
"timestamp": "2026-04-14T20:57:28.152811+00:00",
"source_trajectory_ids": [
"traj-1c05d834-9c1d-4a43-ad8b-8c6c8087256a",
"traj-386bdc31-2972-4831-9c43-01a2aae8d9f4",
"traj-730465f5-2014-4bea-b491-4bb8fe7c64a4",
"traj-79375497-a0ac-45dd-ae4d-b09bff4be7ed",
"traj-871a56b9-b8bc-40bf-9c2c-9b6358ab53cc",
"traj-ac621263-b868-4692-ab37-7a86bff5a35d",
"traj-b077ff51-61cb-4947-a8b8-0f5f7c5ebea7",
"traj-b342a862-14e1-4635-b4b5-d8e36d10d29b",
"traj-ce5c7f40-792e-43f1-b727-31fd4fdb05e8",
"traj-f9deff53-f6e6-4bdb-a58e-16c927c90d80"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,45 @@
{
"report_id": "report-690aa1c7-7761-49c2-b0a3-9bddfb75dc47",
"timestamp": "2026-04-14T21:22:14.790781+00:00",
"source_trajectory_ids": [
"traj-0558d6b6-9b4f-4580-a6fa-534dac75f3c4",
"traj-1da973fc-88c3-4ea1-9574-3b7a1558d315",
"traj-2adae2da-c0c1-4cff-ba3d-c16500853ca6",
"traj-41302519-e96f-4a36-bd95-982f8690569e",
"traj-5c77ffb7-aee1-4b79-8e88-7d9116c70629",
"traj-77ad9e4d-6265-41e9-8af3-9cef86345cf9",
"traj-aa6c3083-3d8d-4b8f-93eb-674346ef5005",
"traj-aec8383e-152a-46c8-83ec-0fc181a93516",
"traj-c4130706-d699-4990-805a-a8a90d5b7b8d",
"traj-f0a1f252-5a21-47c6-bfdd-3ff5026b1fec"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null,
"baseline_version_id": null,
"dry_run": false
}

View File

@@ -0,0 +1,43 @@
{
"report_id": "report-6bf4158b-c9d8-4eab-ba70-6eb707d0bca1",
"timestamp": "2026-04-14T15:29:36.013045+00:00",
"source_trajectory_ids": [
"traj-1d69c6a6-e7d9-446a-911e-96fa227a3c16",
"traj-1dcf8869-c1d1-4fb0-93f0-6fc42870ef9d",
"traj-3f9baf44-61f6-4428-9e9f-8c3f007e522d",
"traj-5018de53-b5b9-4e3e-b160-00c07286de44",
"traj-5dbdcc78-ec34-4272-99b1-bd91c940a8b7",
"traj-a2a2f17f-a173-47b5-859e-bc7774081f6a",
"traj-adf886a2-770f-49bf-b3e2-c6f43d7f138e",
"traj-b2621d11-6b94-45b9-93fb-a777e0d900dc",
"traj-e5f11c2b-56d6-4b1d-b827-e2542af15171",
"traj-f152c0cc-5cc8-4ba1-836f-57bd6d8afe05"
],
"sample_count": 10,
"baseline_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"challenger_metrics": {
"task_count": 1,
"avg_reward": 0.44,
"error_rate": 0.0,
"avg_latency_ms": 0.0
},
"promotion_decision": {
"accepted": false,
"reasons": [
"Reward delta 0.0000 below minimum 1.0"
],
"metrics": {
"reward_delta": 0.0,
"error_rate_delta": 0.0,
"latency_delta_ms": 0.0,
"baseline_avg_reward": 0.44,
"challenger_avg_reward": 0.44
}
},
"promoted_version_id": null
}

Some files were not shown because too many files have changed in this diff Show More