-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathcustom_core_example.py
More file actions
174 lines (143 loc) · 5.92 KB
/
custom_core_example.py
File metadata and controls
174 lines (143 loc) · 5.92 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
#!/usr/bin/env -S uv run python
"""Example showing how to create custom core types for the cortex architecture."""
import torch
import torch.nn as nn
from cortex import (
CoreConfig,
CortexStack,
CortexStackConfig,
LSTMCoreConfig,
MemoryCore,
PassThroughScaffoldConfig,
register_core,
)
from cortex.types import MaybeState, ResetMask, Tensor
from pydantic import Field
from tensordict import TensorDict
# Step 1: Define custom core configuration.
class GRUCoreConfig(CoreConfig):
    """Configuration for a GRU core.

    Fields mirror the ``nn.GRU`` constructor arguments consumed by
    ``GRUCore.__init__``. ``core_type`` is presumably the registry
    discriminator used by the core registry — confirm against ``CoreConfig``.
    """

    # Discriminator string identifying this core type in the registry.
    core_type: str = "gru"
    # Number of stacked GRU layers (must be >= 1).
    num_layers: int = Field(default=1, ge=1)
    # Whether the GRU layers use bias weights.
    bias: bool = Field(default=True)
    # Inter-layer dropout probability; GRUCore only applies it when num_layers > 1.
    dropout: float = Field(default=0.0, ge=0.0)
# Step 2: Implement and register the custom core.
@register_core(GRUCoreConfig)
class GRUCore(MemoryCore):
    """GRU core implementation with TensorDict state management.

    Wraps a batch-first ``nn.GRU`` and keeps the recurrent hidden state in a
    TensorDict under key ``"h"`` with a *batch-first* layout of [B, L, H]
    (L = number of GRU layers). The layout is transposed to nn.GRU's native
    [L, B, H] convention only transiently inside ``forward``.
    """

    def __init__(self, cfg: GRUCoreConfig) -> None:
        """Build the underlying ``nn.GRU`` from a validated config."""
        super().__init__(hidden_size=cfg.hidden_size)
        self.cfg = cfg
        self.net = nn.GRU(
            input_size=cfg.hidden_size,
            hidden_size=cfg.hidden_size,
            num_layers=cfg.num_layers,
            bias=cfg.bias,
            # nn.GRU warns if dropout > 0 with a single layer, so zero it out.
            dropout=cfg.dropout if cfg.num_layers > 1 else 0.0,
            batch_first=True,  # Always batch-first
        )
        self.num_layers = cfg.num_layers

    def init_state(self, batch: int, *, device: torch.device, dtype: torch.dtype) -> TensorDict:
        """Return an all-zero hidden state for ``batch`` sequences."""
        # Batch-first state: [B, L, H]
        h = torch.zeros(batch, self.num_layers, self.hidden_size, device=device, dtype=dtype)
        return TensorDict({"h": h}, batch_size=[batch])

    def forward(
        self,
        x: Tensor,
        state: MaybeState,
        *,
        resets: ResetMask | None = None,
    ) -> tuple[Tensor, MaybeState]:
        """Run the GRU over ``x`` and return ``(output, new_state)``.

        ``x`` may be [B, H] (single step) or [B, T, H] (sequence); the output
        matches the input's rank. ``resets`` zeroes the *returned* state for
        the flagged batch entries — the rollout that produced ``y`` is not
        re-run, so resets affect the next call only.
        """
        # Handle state: lazily create a zero state on the first call.
        if state is None:
            batch_size = x.shape[0]  # Always batch-first
            state = self.init_state(batch_size, device=x.device, dtype=x.dtype)
        # Get state and transpose from [B, L, H] to [L, B, H] for nn.GRU
        h = state["h"].transpose(0, 1)  # [B, L, H] -> [L, B, H]
        # Handle input shape - always batch-first
        is_batched = x.dim() == 3
        if not is_batched:
            x = x.unsqueeze(1)  # Add seq dimension: [B, H] -> [B, 1, H]
        # Run GRU (always batch-first)
        y, h_new = self.net(x, h)
        # Remove seq dimension if input was not batched
        if not is_batched:
            y = y.squeeze(1)  # [B, 1, H] -> [B, H]
        # Handle resets if provided
        if resets is not None:
            # NOTE(review): only per-batch ([B]) masks are handled; a mask of
            # any other rank (e.g. per-timestep [B, T]) is silently ignored.
            if resets.dim() == 1:  # Batch-level reset
                reset_mask = resets.view(1, -1, 1)  # [B] -> [1, B, 1]
                h_new = torch.where(reset_mask, torch.zeros_like(h_new), h_new)
        # Transpose state back to batch-first: [L, B, H] -> [B, L, H]
        batch_size = x.shape[0]
        h_new_bf = h_new.transpose(0, 1)
        return y, TensorDict({"h": h_new_bf}, batch_size=[batch_size])

    def reset_state(self, state: MaybeState, mask: ResetMask) -> MaybeState:
        """Zero the hidden state of batch entries flagged in ``mask``.

        A ``None`` state is passed through unchanged (nothing to reset).
        """
        if state is None:
            return state
        h = state["h"]  # [B, L, H]
        # Prefer the TensorDict's declared batch size; fall back to the tensor.
        batch_size = state.batch_size[0] if state.batch_size else h.shape[0]
        reset_mask = mask.view(-1, 1, 1)  # [B] -> [B, 1, 1]
        h_new = torch.where(reset_mask, torch.zeros_like(h), h)
        return TensorDict({"h": h_new}, batch_size=[batch_size])
def test_custom_core():
    """Run the custom GRU core inside a mixed-core CortexStack and sanity-check shapes."""
    print("Testing Custom Core Implementation\n" + "=" * 40)

    dev = torch.device("cpu")
    dt = torch.float32
    n_batch, n_steps, width = 2, 5, 64

    # Recipe mixing stock LSTM cores with the custom GRU core.
    stack_cfg = CortexStackConfig(
        d_hidden=width,
        scaffolds=[
            PassThroughScaffoldConfig(core=LSTMCoreConfig(hidden_size=64, num_layers=1)),
            PassThroughScaffoldConfig(core=GRUCoreConfig(hidden_size=64, num_layers=2)),
            PassThroughScaffoldConfig(core=LSTMCoreConfig(hidden_size=64, num_layers=1)),
        ],
        post_norm=True,
    )

    print("Mixed Core Types Configuration:")
    print(f"  d_hidden: {stack_cfg.d_hidden}")
    print(f"  num_scaffolds: {len(stack_cfg.scaffolds)}")
    for idx, sc in enumerate(stack_cfg.scaffolds):
        if sc.core is not None:
            label = type(sc.core).__name__.replace("Config", "")
        else:
            label = "None"
        print(f"  Scaffold {idx}: {label}")
    print()

    # Building the stack resolves each core via the registry, so LSTM and GRU
    # configs are handled uniformly.
    cortex = CortexStack(stack_cfg)
    print(f"Built stack with {len(cortex.scaffolds)} scaffolds (mixed core types)")

    # Forward pass over a random batch-first sequence.
    inputs = torch.randn(n_batch, n_steps, width, device=dev, dtype=dt)
    print(f"\nInput shape: {inputs.shape}")
    carry = cortex.init_state(batch=n_batch, device=dev, dtype=dt)
    out, next_carry = cortex(inputs, carry)
    print(f"Output shape: {out.shape}")
    assert out.shape == inputs.shape, "Output shape mismatch!"

    # Walk the nested state to show per-scaffold / per-core layout.
    print("\nState structure:")
    for key in next_carry.keys():
        entry = next_carry.get(key)
        if entry is None:
            continue
        inner = next(iter(entry.keys()), None)
        if inner is None:
            continue
        print(f"  {key}: {inner} -> {list(entry[inner].keys())}")

    print("\n✓ Custom core test passed!")
    print("\n" + "=" * 40)
    print("How the core registry system works:")
    print("1. Define your CoreConfig subclass with custom parameters")
    print("2. Define your core class extending MemoryCore")
    print("3. Use @register_core(YourConfig) on your core class")
    print("4. Your core is now usable in any scaffold configuration!")
    print("\nThe system is fully extensible for both scaffolds and cores.")
if __name__ == "__main__":
    # Run the demo when executed as a script (e.g. via `uv run`).
    test_custom_core()