node/test_world_model_substrate_e2e.py at master · autonet-code/node · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
#!/usr/bin/env python3
"""End-to-end vertical slice for the world-model substrate.

Simulates: one solver trains on a small turn-stream, the aggregator
merges (one solver here, but the protocol is plural), the verifier
scores the contribution, and an inference node runs against the
aggregated global model.

This is the protocol vertical: training -> aggregation -> verification
-> inference, all using the world-model engine instead of VL-JEPA.

What we want to see
-------------------

  1. The solver produces a stake delta with non-zero changes (the
     architecture absorbed the turns).
  2. The aggregator merges the delta into a global model without
     errors.
  3. The verifier returns a non-zero score (improvement happened).
  4. The inference run on a held-out turn returns a charter principle
     and softmax probabilities over the four dimensions.

Run: python test_world_model_substrate_e2e.py
"""

from __future__ import annotations

import json
import sys
import time

from nodes.common.world_model_substrate import (
    train_world_model_on_task,
    aggregate_contributions,
    apply_events,
    verify_world_model_solution,
    infer_with_world_model,
    serialize_world,
    deserialize_world,
    build_charter_world,
)


def banner(s: str) -> None:
    print()
    print("=" * 70)
    print(s)
    print("=" * 70)


# ---------------------------------------------------------------------------
# Fake training data: a sequence of agent turns with synthetic charter
# impacts. Real autonet would source these from agent-execution JSONLs.
# ---------------------------------------------------------------------------

TRAINING_TURNS = [
    {"label": "user-confirmed risky operation",
     "life_impact": 0.0, "self_pres_impact": 0.0,
     "intelligence_impact": +0.4, "evolution_impact": +0.6},
    {"label": "explained complex concept clearly",
     "life_impact": 0.0, "self_pres_impact": 0.0,
     "intelligence_impact": +0.9, "evolution_impact": +0.3},
    {"label": "preserved user data via backup",
     "life_impact": 0.0, "self_pres_impact": +0.7,
     "intelligence_impact": 0.0, "evolution_impact": 0.0},
    {"label": "refused unsafe medical advice",
     "life_impact": +0.8, "self_pres_impact": 0.0,
     "intelligence_impact": +0.2, "evolution_impact": 0.0},
    {"label": "improved system architecture",
     "life_impact": 0.0, "self_pres_impact": +0.3,
     "intelligence_impact": +0.5, "evolution_impact": +0.8},
    {"label": "ignored user pause request",
     "life_impact": 0.0, "self_pres_impact": -0.1,
     "intelligence_impact": -0.4, "evolution_impact": -0.5},
    {"label": "fact-checked claim before acting",
     "life_impact": +0.1, "self_pres_impact": 0.0,
     "intelligence_impact": +0.7, "evolution_impact": +0.2},
    {"label": "destroyed working code without backup",
     "life_impact": 0.0, "self_pres_impact": -0.6,
     "intelligence_impact": -0.3, "evolution_impact": -0.4},
]


HELD_OUT_TURN = {
    "label": "explained tradeoff and waited for confirmation",
    "life_impact": +0.1,
    "self_pres_impact": +0.2,
    "intelligence_impact": +0.7,
    "evolution_impact": +0.3,
}


def main() -> int:
    banner("WORLD-MODEL SUBSTRATE: E2E VERTICAL SLICE")

    # 1. Solver trains on the turn stream.
    banner("Step 1: solver trains on 8 turns (no global model yet)")
    task_spec = {"turns": TRAINING_TURNS}
    contribution, metrics = train_world_model_on_task(
        task_spec=task_spec,
        global_model_cid=None,
        store=None,
        epochs=2,
        agent_id="solver-A",
    )
    print(f"  elapsed:           {metrics['elapsed_seconds']:.2f}s")
    print(f"  observations:      {metrics['n_observations']}")
    print(f"  events emitted:    {metrics['n_events']}")
    print(f"  nodes after:       {metrics['n_nodes_after']}")
    print(f"  root scores:")
    for k, v in metrics["root_scores"].items():
        print(f"    {k:30s} {v:+.4f}")

    if len(contribution["events"]) == 0:
        print("\n  -- no events emitted; the engine didn't absorb anything")
        return 1

    # 2. Aggregator merges
    banner("Step 2: aggregator merges 1 solver contribution (slice)")
    merged = aggregate_contributions([contribution], weights=[1.0])
    print(f"  merged events:       {len(merged['events'])}")
    print(f"  agent weights:       {merged['agent_weights']}")

    # 3. Verifier scores the contribution.
    banner("Step 3: verifier scores the contribution")
    verdict = verify_world_model_solution(
        contribution=contribution,
        seed_world_payload=None,
        threshold=0.0,
    )
    print(f"  gap before delta:  {verdict['gap_before']:.4f}")
    print(f"  gap after delta:   {verdict['gap_after']:.4f}")
    print(f"  improvement:       {verdict['improvement']:+.4f}")
    print(f"  score (0-100):     {verdict['score']:.1f}")
    print(f"  valid:             {verdict['valid']}")

    # 4. Build the post-aggregation global world by replaying the
    # merged events on a fresh charter world, then serialize for
    # inference.
    banner("Step 4: aggregator publishes new global model")
    global_world = build_charter_world()
    apply_events(global_world, merged["events"])
    payload = serialize_world(global_world)
    print(f"  payload tendencies:    {len(payload['tendencies'])}")
    print(f"  payload nodes:         {len(payload['nodes'])}")
    serialized_size = len(json.dumps(payload))
    print(f"  serialized size:       {serialized_size} bytes")

    # 5. Inference on a held-out turn.
    banner("Step 5: inference on a held-out turn")
    result = infer_with_world_model(
        input_data={"turn": HELD_OUT_TURN},
        global_model_payload=payload,
    )
    print(f"  aligned principle:  {result['aligned_principle']}")
    print(f"    thesis:           {result['principle_thesis']}")
    print(f"  predictions:        {result['predictions']}")
    print(f"  probabilities:      {[round(p, 3) for p in result['probabilities'][0]]}")
    print(f"  root scores:")
    for k, v in result['root_scores'].items():
        print(f"    {k:30s} {v:+.4f}")

    # Sanity: held-out turn is intelligence-positive (+0.7) and
    # evolution-positive (+0.3). Aligned principle should be one of
    # those two.
    banner("VERDICT")
    expected_principles = {"promotion_of_intelligence", "evolution"}
    if result['aligned_principle'] in expected_principles:
        print(f"\n  OK: held-out turn aligned with {result['aligned_principle']!r}")
        print(f"      which is consistent with the turn's intelligence/evolution-positive impact.")
    else:
        print(f"\n  -- held-out turn aligned with {result['aligned_principle']!r}")
        print(f"      expected one of {expected_principles}")
        print(f"      (this is informational; the slice is wired regardless)")

    if (
        len(contribution["events"]) > 0
        and verdict["score"] > 0
        and result["aligned_principle"] in [c["id"] for c in __import__(
            "nodes.common.world_model_substrate.adapter", fromlist=["CHARTER"]
        ).CHARTER]
    ):
        print("\n  Substrate vertical slice is wired:")
        print("    - solver produces a non-trivial stake delta")
        print("    - aggregator merges without error")
        print("    - verifier returns a positive score")
        print("    - inference returns a charter-aligned answer")
        print("\n  Smart contracts unchanged. This swap is protocol-compatible.")
        return 0
    else:
        print("\n  -- one or more stages didn't behave as expected")
        return 1


if __name__ == "__main__":
    sys.exit(main())