Zion Boggan
repos/TreeTrace/examples/weather-dashboard/.treetrace/failures.json
zionboggan.com ↗
72 lines · json
History for this file →
1
{
2
  "schemaVersion": "0.3",
3
  "project": {
4
    "name": "weather-dashboard",
5
    "generatedAt": "2026-06-19T06:50:11.984Z"
6
  },
7
  "summary": {
8
    "totalFailureSignals": 2,
9
    "topFailureTypes": [
10
      {
11
        "type": "overbuilt_solution",
12
        "count": 1
13
      },
14
      {
15
        "type": "user_rejected_action",
16
        "count": 1
17
      }
18
    ],
19
    "tierCounts": {
20
      "verified": 1,
21
      "high": 0,
22
      "confirmed": 1,
23
      "inferred": 0
24
    },
25
    "models": [
26
      "assistant-model"
27
    ],
28
    "thinkingBlocks": 0,
29
    "correctionChains": 1,
30
    "evalCandidates": 2,
31
    "lessons": 2
32
  },
33
  "failures": [
34
    {
35
      "id": "failure_001",
36
      "type": "user_rejected_action",
37
      "tier": "verified",
38
      "confidence": 1,
39
      "model": null,
40
      "firstSeenNodeId": "node_003",
41
      "correctedByNodeId": null,
42
      "summary": "The user explicitly told the agent to stop or not proceed near \"No, scrap the radar map, it is too heavy.\".",
43
      "evidence": "user_text_decline (text): \"No, scrap the radar map, it is too heavy. Keep the page lightweight, just the forecast cards.\"",
44
      "lesson": "Future agents should not retry a tool action the user just declined without first explaining why the action is still worth taking. Specifically: user_text_decline (text): \"No, scrap the radar map, it is too heavy. Keep the page lightweight, just the forecast cards.\"",
45
      "evalCandidate": true
46
    },
47
    {
48
      "id": "failure_002",
49
      "type": "overbuilt_solution",
50
      "tier": "confirmed",
51
      "confidence": 0.82,
52
      "model": "assistant-model",
53
      "firstSeenNodeId": "node_002",
54
      "correctedByNodeId": "node_003",
55
      "summary": "The work appears to have overbuilt the requested shape near \"Try using leaflet for an interactive radar map layer on top of the forecast.\"; corrected by \"No, scrap the radar map, it is too heavy.\".",
56
      "evidence": "User said: \"No, scrap the radar map, it is too heavy. Keep the page lightweight, just the forecast cards.\"",
57
      "lesson": "Future agents should prefer the smallest implementation that satisfies the corrected product direction. Specifically: User said: \"No, scrap the radar map, it is too heavy. Keep the page lightweight, just the forecast cards.\"",
58
      "evalCandidate": true
59
    }
60
  ],
61
  "correctionChains": [
62
    {
63
      "id": "chain_001",
64
      "failureNodeId": "node_002",
65
      "correctionNodeId": "node_003",
66
      "resolvedNodeId": null,
67
      "failureType": "overbuilt_solution",
68
      "confidence": "high",
69
      "summary": "The work appears to have overbuilt the requested shape near \"Try using leaflet for an interactive radar map layer on top of the forecast.\"; corrected by \"No, scrap the radar map, it is too heavy.\"."
70
    }
71
  ]
72
}