Initial standalone memabra release
This commit is contained in:
@@ -0,0 +1,50 @@
|
||||
{
|
||||
"version_id": "20260414-143742",
|
||||
"weights": {
|
||||
"inject_memory": {
|
||||
"input_length": 43.0,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.95,
|
||||
"top_skill_success_rate": 0.9,
|
||||
"top_tool_confidence": 0.95,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"load_skill": {
|
||||
"input_length": 44.0,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.95,
|
||||
"top_skill_success_rate": 0.9,
|
||||
"top_tool_confidence": 0.95,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"call_tool": {
|
||||
"input_length": 32.0,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.9500000000000001,
|
||||
"top_skill_success_rate": 0.9000000000000001,
|
||||
"top_tool_confidence": 0.9500000000000001,
|
||||
"top_tool_risk": 0.0
|
||||
}
|
||||
},
|
||||
"feature_keys": [
|
||||
"input_length",
|
||||
"memory_count",
|
||||
"skill_count",
|
||||
"tool_count",
|
||||
"top_memory_confidence",
|
||||
"top_skill_success_rate",
|
||||
"top_tool_confidence",
|
||||
"top_tool_risk"
|
||||
],
|
||||
"metadata": {
|
||||
"avg_reward": 1.04,
|
||||
"task_count": 3,
|
||||
"source": "wrapup_workflow"
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,50 @@
|
||||
{
|
||||
"version_id": "20260414-152738",
|
||||
"weights": {
|
||||
"load_skill": {
|
||||
"input_length": 42.15803814713897,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.9499999999999997,
|
||||
"top_skill_success_rate": 0.9,
|
||||
"top_tool_confidence": 0.9499999999999997,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"call_tool": {
|
||||
"input_length": 32.0,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.95,
|
||||
"top_skill_success_rate": 0.9000000000000001,
|
||||
"top_tool_confidence": 0.95,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"inject_memory": {
|
||||
"input_length": 42.99999999999999,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.95,
|
||||
"top_skill_success_rate": 0.8999999999999999,
|
||||
"top_tool_confidence": 0.95,
|
||||
"top_tool_risk": 0.0
|
||||
}
|
||||
},
|
||||
"feature_keys": [
|
||||
"input_length",
|
||||
"memory_count",
|
||||
"skill_count",
|
||||
"tool_count",
|
||||
"top_memory_confidence",
|
||||
"top_skill_success_rate",
|
||||
"top_tool_confidence",
|
||||
"top_tool_risk"
|
||||
],
|
||||
"metadata": {
|
||||
"avg_reward": 1.04,
|
||||
"task_count": 3,
|
||||
"source": "wrapup_workflow"
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,55 @@
|
||||
{
|
||||
"version_id": "20260414-155224",
|
||||
"weights": {
|
||||
"load_skill": {
|
||||
"input_length": 42.38663484486874,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.9499999999999997,
|
||||
"top_skill_success_rate": 0.9,
|
||||
"top_tool_confidence": 0.9499999999999997,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"call_tool": {
|
||||
"input_length": 32.0,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.9500000000000001,
|
||||
"top_skill_success_rate": 0.9000000000000001,
|
||||
"top_tool_confidence": 0.9500000000000001,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"inject_memory": {
|
||||
"input_length": 41.75894988066825,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.9499999999999997,
|
||||
"top_skill_success_rate": 0.8999999999999999,
|
||||
"top_tool_confidence": 0.9499999999999997,
|
||||
"top_tool_risk": 0.0
|
||||
}
|
||||
},
|
||||
"feature_keys": [
|
||||
"input_length",
|
||||
"memory_count",
|
||||
"skill_count",
|
||||
"tool_count",
|
||||
"top_memory_confidence",
|
||||
"top_skill_success_rate",
|
||||
"top_tool_confidence",
|
||||
"top_tool_risk"
|
||||
],
|
||||
"metadata": {
|
||||
"source": "online_learning",
|
||||
"benchmark_summary": {
|
||||
"reward_delta": 0.154,
|
||||
"error_rate_delta": 0.0,
|
||||
"latency_delta_ms": -21.0,
|
||||
"baseline_avg_reward": 0.886,
|
||||
"challenger_avg_reward": 1.04
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -0,0 +1,65 @@
|
||||
{
|
||||
"version_id": "20260414-165018",
|
||||
"weights": {
|
||||
"load_skill": {
|
||||
"input_length": 41.594896331738454,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.9499999999999998,
|
||||
"top_skill_success_rate": 0.9000000000000001,
|
||||
"top_tool_confidence": 0.9499999999999998,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"call_tool": {
|
||||
"input_length": 32.85406896551724,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.95,
|
||||
"top_skill_success_rate": 0.9,
|
||||
"top_tool_confidence": 0.95,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"clarify": {
|
||||
"input_length": 51.0,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.95,
|
||||
"top_skill_success_rate": 0.9,
|
||||
"top_tool_confidence": 0.95,
|
||||
"top_tool_risk": 0.0
|
||||
},
|
||||
"inject_memory": {
|
||||
"input_length": 41.45435244161358,
|
||||
"memory_count": 1.0,
|
||||
"skill_count": 1.0,
|
||||
"tool_count": 1.0,
|
||||
"top_memory_confidence": 0.9499999999999996,
|
||||
"top_skill_success_rate": 0.8999999999999998,
|
||||
"top_tool_confidence": 0.9499999999999996,
|
||||
"top_tool_risk": 0.0
|
||||
}
|
||||
},
|
||||
"feature_keys": [
|
||||
"input_length",
|
||||
"memory_count",
|
||||
"skill_count",
|
||||
"tool_count",
|
||||
"top_memory_confidence",
|
||||
"top_skill_success_rate",
|
||||
"top_tool_confidence",
|
||||
"top_tool_risk"
|
||||
],
|
||||
"metadata": {
|
||||
"source": "online_learning",
|
||||
"benchmark_summary": {
|
||||
"reward_delta": -0.446,
|
||||
"error_rate_delta": 0.0,
|
||||
"latency_delta_ms": -21.0,
|
||||
"baseline_avg_reward": 0.886,
|
||||
"challenger_avg_reward": 0.44
|
||||
}
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user