Skip to content

Commit 8680217

Browse files
committed
chore(catalog): regenerate catalog, stats and update skill/tool files
1 parent 2ea2f4b commit 8680217

File tree

43 files changed

+1383
-66
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

43 files changed

+1383
-66
lines changed

catalog/capabilities.json

Lines changed: 172 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1329,21 +1329,147 @@
13291329
{
13301330
"id": "ops.trace.analyze",
13311331
"version": "1.0.0",
1332-
"description": "TODO define capability contract for ops.trace.analyze.",
1332+
"description": "Analyze incremental execution traces as a cognitive interpretation unit. This capability reconstructs the agent's reasoning path from runtime events, infers assumptions, identifies plausible alternatives, estimates confidence, and returns structured views such as decision graphs. It is intended to be called repeatedly during execution (update mode) and once at run closure (finalize mode), without coupling to any specific model provider.\n",
13331333
"file": "capabilities/ops.trace.analyze.yaml",
1334-
"inputs": {},
1335-
"outputs": {},
1334+
"inputs": {
1335+
"goal": {
1336+
"type": "string",
1337+
"required": true,
1338+
"description": "Declared goal of the agent run being traced."
1339+
},
1340+
"context": {
1341+
"type": "object",
1342+
"required": false,
1343+
"description": "Optional contextual constraints or environment metadata for analysis."
1344+
},
1345+
"events": {
1346+
"type": "array",
1347+
"required": true,
1348+
"description": "Ordered batch of runtime events for this analysis cycle."
1349+
},
1350+
"trace_state": {
1351+
"type": "object",
1352+
"required": false,
1353+
"description": "Inline accumulated trace state from previous cycles."
1354+
},
1355+
"trace_session_id": {
1356+
"type": "string",
1357+
"required": false,
1358+
"description": "Reference identifier for server-managed trace state."
1359+
},
1360+
"state_mode": {
1361+
"type": "string",
1362+
"required": false,
1363+
"description": "State continuity mode. Supported values are auto, inline, and reference."
1364+
},
1365+
"mode": {
1366+
"type": "string",
1367+
"required": false,
1368+
"description": "Analysis mode. Supported values are update and finalize."
1369+
},
1370+
"output_views": {
1371+
"type": "array",
1372+
"required": false,
1373+
"description": "Optional list of requested views such as decision_graph, assumptions, and summary."
1374+
}
1375+
},
1376+
"outputs": {
1377+
"trace_session_id": {
1378+
"type": "string",
1379+
"required": true,
1380+
"description": "Stable trace session id to continue analysis across calls."
1381+
},
1382+
"updated_trace_state": {
1383+
"type": "object",
1384+
"required": true,
1385+
"description": "Updated accumulated trace state for subsequent cycles."
1386+
},
1387+
"state_checksum": {
1388+
"type": "string",
1389+
"required": false,
1390+
"description": "Hash/checksum of the updated state for auditability and drift checks."
1391+
},
1392+
"trace_version": {
1393+
"type": "string",
1394+
"required": false,
1395+
"description": "Version tag of the trace state schema used in this response."
1396+
},
1397+
"decision_graph": {
1398+
"type": "object",
1399+
"required": false,
1400+
"description": "Structured graph representation of detected decisions and dependencies."
1401+
},
1402+
"assumptions": {
1403+
"type": "array",
1404+
"required": false,
1405+
"description": "Detected assumptions inferred from the analyzed execution path."
1406+
},
1407+
"alternative_paths": {
1408+
"type": "array",
1409+
"required": false,
1410+
"description": "Alternative viable paths inferred from current evidence and goal."
1411+
},
1412+
"confidence": {
1413+
"type": "number",
1414+
"required": false,
1415+
"description": "Confidence score for this analysis cycle in the range 0 to 1."
1416+
},
1417+
"risk_candidates": {
1418+
"type": "array",
1419+
"required": false,
1420+
"description": "Candidate risk findings before thresholding/monitoring."
1421+
},
1422+
"summary": {
1423+
"type": "string",
1424+
"required": false,
1425+
"description": "Human-readable summary of the current trace analysis."
1426+
}
1427+
},
13361428
"metadata": {
1337-
"tags": [],
1429+
"tags": [
1430+
"trace",
1431+
"observability",
1432+
"reasoning",
1433+
"cognitive-unit"
1434+
],
13381435
"category": null,
13391436
"status": "experimental",
1340-
"examples": []
1437+
"examples": [
1438+
{
1439+
"input": {
1440+
"goal": "Assess market expansion feasibility",
1441+
"state_mode": "inline",
1442+
"mode": "update",
1443+
"events": [
1444+
{
1445+
"type": "step_completed",
1446+
"timestamp": "2026-03-15T10:00:00Z",
1447+
"step_id": "search_market_data"
1448+
}
1449+
]
1450+
},
1451+
"output": {
1452+
"confidence": 0.71,
1453+
"assumptions": [
1454+
"Primary source is representative for target market"
1455+
],
1456+
"risk_candidates": [
1457+
"decision_without_evidence"
1458+
]
1459+
}
1460+
}
1461+
]
1462+
},
1463+
"properties": {
1464+
"deterministic": false,
1465+
"side_effects": false,
1466+
"idempotent": true
13411467
}
13421468
},
13431469
{
13441470
"id": "ops.trace.monitor",
13451471
"version": "1.0.0",
1346-
"description": "Monitor a trace against thresholds and raise alerts.",
1472+
"description": "Monitor trace state against operational thresholds as a control/governance cognitive unit. This capability does not infer new reasoning structure; instead it evaluates existing trace artifacts and emits deterministic control signals (status, risk flags, alerts, metrics) that can be used to continue, re-plan, or stop an agent workflow.\n",
13471473
"file": "capabilities/ops.trace.monitor.yaml",
13481474
"inputs": {
13491475
"trace": {
@@ -1363,17 +1489,54 @@
13631489
"required": true,
13641490
"description": "Overall monitoring status."
13651491
},
1492+
"risk_flags": {
1493+
"type": "array",
1494+
"required": false,
1495+
"description": "Thresholded risk flags derived from the trace."
1496+
},
13661497
"alerts": {
13671498
"type": "array",
13681499
"required": false,
13691500
"description": "Raised alerts."
1501+
},
1502+
"metrics": {
1503+
"type": "object",
1504+
"required": false,
1505+
"description": "Summary metrics used to evaluate thresholds."
13701506
}
13711507
},
13721508
"metadata": {
1373-
"tags": [],
1509+
"tags": [
1510+
"trace",
1511+
"monitoring",
1512+
"governance",
1513+
"cognitive-unit"
1514+
],
13741515
"category": null,
1375-
"status": "unspecified",
1376-
"examples": []
1516+
"status": "experimental",
1517+
"examples": [
1518+
{
1519+
"input": {
1520+
"trace": {
1521+
"assumptions": [
1522+
"Dataset is complete"
1523+
],
1524+
"risk_candidates": [
1525+
"goal_drift"
1526+
]
1527+
},
1528+
"thresholds": {
1529+
"max_risk_flags": 0
1530+
}
1531+
},
1532+
"output": {
1533+
"status": "blocked",
1534+
"risk_flags": [
1535+
"goal_drift"
1536+
]
1537+
}
1538+
}
1539+
]
13771540
},
13781541
"properties": {
13791542
"deterministic": true,

catalog/governance_guardrails.json

Lines changed: 10 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
{
22
"summary": {
3-
"skills_total": 31,
4-
"skills_with_metadata_issues": 31,
3+
"skills_total": 32,
4+
"skills_with_metadata_issues": 32,
55
"overlap_alerts": 0,
66
"unknown_capability_references": 0,
77
"overlap_threshold": 0.8,
@@ -26,6 +26,14 @@
2626
"missing_tags"
2727
]
2828
},
29+
{
30+
"skill_id": "agent.trace",
31+
"channel": "experimental",
32+
"issues": [
33+
"missing_use_cases",
34+
"missing_examples"
35+
]
36+
},
2937
{
3038
"skill_id": "audio.transcribe-summary",
3139
"channel": "official",

catalog/graph.json

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,14 @@
1313
],
1414
"skills": []
1515
},
16+
"agent.trace": {
17+
"capabilities": [
18+
"data.schema.validate",
19+
"ops.trace.analyze",
20+
"ops.trace.monitor"
21+
],
22+
"skills": []
23+
},
1624
"audio.transcribe-summary": {
1725
"capabilities": [
1826
"audio.transcribe",

0 commit comments

Comments
 (0)