# File size: 20,195 Bytes
#
# b5d4048

"""
pl/core.py — Propagation Logic Core
=====================================

P / G → Q

The single primitive operator of Propagation Logic.

A loaded pattern P = (v_P, L_P) propagates through gradient field G
in context C = (Γ_C, θ_C) to produce updated pattern Q.

Everything in this module is derived from that operator.
Nothing is assumed that is not forced by the mechanism.

Key insight (PL v13, Section 2.6):
    G is not a different kind of thing from P.
    G is P occupying the gradient role contextually.
    All G is P post-boundary-imposition.
    There is no view from outside.
    This file is also P / G → Q.
"""

from __future__ import annotations
from dataclasses import dataclass, field
from typing import Any, Callable, Dict, List, Optional, Set, Tuple, Union
import math


# =============================================================================
# LOADED PATTERN
# =============================================================================

@dataclass
class Pattern:
    """
    A loaded pattern P: a designation plus its accumulated propagation history.

    Definition 2.1 (PL v13):
        P = (v_P, H_P) with v_P ∈ V, H_P a propagation history.
        V is the carrier set.
        L_P = |H_P| ≥ 0 is the informational load.
        The shorthand P = (v_P, L_P) keeps only the magnitude of H_P.

    Attributes:
        v       : designation component — what the pattern currently designates
                  (0 or 1 in logic, a number in arithmetic, a token in language,
                  a field value in physics).
        L       : informational load. L = 0 is the seed state (no history);
                  L > 0 means the pattern has already been propagated.
        history : names of the gradients the pattern has passed through,
                  oldest first. L is tracked separately as its magnitude.

    Equality compares `v` exactly and `L` within an absolute tolerance of
    1e-9; `history` is deliberately ignored.
    """
    v: Any
    L: float = 0.0
    history: List[str] = field(default_factory=list)

    def __repr__(self) -> str:
        # Only the three most recent history entries are shown to keep it short.
        h = " → ".join(self.history[-3:]) if self.history else "∅"
        return f"P(v={self.v!r}, L={self.L:.3f}, hist=[{h}])"

    def __eq__(self, other: object) -> bool:
        if not isinstance(other, Pattern):
            return False
        return self.v == other.v and abs(self.L - other.L) < 1e-9

    def __hash__(self) -> int:
        """
        Hash consistent with __eq__.

        Only `v` contributes:
          * hashing repr(v) would split values that compare equal
            (1, True and 1.0 are equal but have different reprs);
          * L is compared with a tolerance, and no rounding scheme puts every
            pair of loads closer than 1e-9 into the same bucket.
        Unhashable designations (e.g. lists) share one constant bucket so the
        pattern itself remains usable in sets and as a dict key.
        """
        try:
            return hash(self.v)
        except TypeError:
            return hash(Pattern)

    def is_seed(self) -> bool:
        """L_P = 0: no propagation history."""
        return self.L == 0.0

    def copy_with(self, v=None, L=None, history=None) -> "Pattern":
        """
        Return a new Pattern with the given fields replaced.

        An argument left as None keeps the current value, so a field cannot be
        reset to None through this method. When `history` is omitted the
        current list is copied; a list passed in explicitly is stored as-is.
        """
        return Pattern(
            v=v if v is not None else self.v,
            L=L if L is not None else self.L,
            history=history if history is not None else self.history.copy(),
        )


def seed(v: Any) -> Pattern:
    """Build a seed pattern for designation `v`: load 0.0 and an empty history."""
    return Pattern(v, 0.0)


# =============================================================================
# CONTEXT
# =============================================================================

@dataclass
class Context:
    """
    C = (Γ_C, θ_C): the gradient fields available plus a coherence threshold.

    Definition 2.2 (PL v13):
        Γ_C : the set of gradient fields available in C   (`gradients`)
        θ_C : the coherence threshold                      (`theta`)

    Quantities derived from a pattern's load L_P:
        support(P, C) = min(L_P, θ_C)
        demand(P, C)  = max(0, L_P − θ_C)

        demand = 0  → coherent   (the load fits under the threshold)
        demand > 0  → incoherent (the load exceeds the threshold)

    Theorem 2.1 (propagation rate): among incoherent patterns the rate is
    1/L_P, so patterns with a smaller load propagate faster.
    """
    gradients: List["Gradient"]
    theta: float = 1.0
    name: str = "C"

    def support(self, p: Pattern) -> float:
        """Portion of the load covered by the context: min(L_P, θ_C)."""
        load, ceiling = p.L, self.theta
        return min(load, ceiling)

    def demand(self, p: Pattern) -> float:
        """Load in excess of the threshold, floored at zero: max(0, L_P − θ_C)."""
        overshoot = p.L - self.theta
        return max(0.0, overshoot)

    def is_coherent(self, p: Pattern) -> bool:
        """True when the pattern places no demand on the context."""
        unmet = self.demand(p)
        return unmet == 0.0

    def is_valid(self, p: Pattern, designated: Set = None) -> bool:
        """
        A pattern is valid when its designation is designated AND it is coherent.

        designated: the values that count as "true" in this carrier.
        When omitted, the classical convention {1, True} is used.
        """
        accepted = {1, True, 1.0} if designated is None else designated
        if p.v not in accepted:
            return False
        return self.is_coherent(p)

    def propagation_rate(self, p: Pattern) -> float:
        """
        Theorem 2.1: rate = 1/L_P for incoherent patterns.

        Coherent patterns, and patterns whose load is not positive,
        get an infinite rate.
        """
        unbounded = float("inf")
        if self.is_coherent(p) or not p.L > 0:
            return unbounded
        return 1.0 / p.L


# =============================================================================
# GRADIENT
# =============================================================================

class Gradient:
    """
    G — a gradient field: a named designation transform with a load cost.

    In PL v13 (Section 2.6) a gradient is itself a pattern occupying the
    gradient role contextually.

    One propagation event P / G → Q produces:
        v_Q = transform(v_P)          — the designation changes
        L_Q = L_P + cost(P)           — the load accumulates
        H_Q = H_P + [G.name]          — the history records this gradient

    cost may be a constant (1.0 unless specified; 0.0 for free gradients such
    as identity) or a callable that derives the cost from the pattern.
    domain is stored for reference only; nothing in this class enforces it.
    """

    def __init__(
        self,
        name: str,
        transform: Callable[[Any], Any],
        cost: Union[float, Callable[["Pattern"], float]] = 1.0,
        domain: Optional[Set] = None,
        description: str = "",
    ):
        self.name = name
        self.description = description
        self.domain = domain          # None = any carrier
        self._transform = transform
        if callable(cost):
            self._cost_fn = cost
        else:
            # Wrap a constant so cost lookups always go through a callable.
            def _constant_cost(p, c=cost):
                return c
            self._cost_fn = _constant_cost

    def transform(self, v: Any) -> Any:
        """Map a designation through this gradient."""
        return self._transform(v)

    def cost(self, p: Pattern) -> float:
        """Load added when pattern `p` is propagated through this gradient."""
        return self._cost_fn(p)

    def propagate(self, p: Pattern) -> Pattern:
        """
        P / G → Q

        The primitive operation: returns a new pattern with the transformed
        designation, the increased load and the extended history. The input
        pattern is left untouched.
        """
        return Pattern(
            v=self._transform(p.v),
            L=p.L + self._cost_fn(p),
            history=p.history + [self.name],
        )

    def __call__(self, p: Pattern) -> Pattern:
        return self.propagate(p)

    def __repr__(self) -> str:
        return "G[{}]".format(self.name)

    def is_closed_on(self, carrier: Set) -> Tuple[bool, List]:
        """
        Check whether the transform maps every carrier element back into
        the carrier.

        Returns (is_closed, violations) where violations lists each
        (v_in, v_out) pair whose output falls outside the carrier.
        """
        images = ((v, self._transform(v)) for v in carrier)
        violations = [(v, out) for v, out in images if out not in carrier]
        return not violations, violations

    def fixed_points(self, carrier: Set) -> List:
        """Carrier elements v with G(v) = v."""
        unmoved = []
        for v in carrier:
            if self._transform(v) == v:
                unmoved.append(v)
        return unmoved

    def orbit(self, v: Any, max_steps: int = 64) -> List:
        """
        Values visited from v under repeated application of G.

        The walk ends when:
          * the transform returns to v (the list is then the full cycle),
          * the transform raises ValueError or KeyError, which is read as the
            orbit leaving the carrier (no cycle within V), or
          * max_steps applications have been made (truncated).
        In every case the values visited so far are returned, v first.
        """
        visited = [v]
        point = v
        for _ in range(max_steps):
            try:
                point = self._transform(point)
            except (ValueError, KeyError):
                break            # escaped the carrier
            if point == v:
                break            # closed the cycle
            visited.append(point)
        return visited

    def cycle_length(self, v: Any, max_steps: int = 64) -> Optional[int]:
        """
        Length of the cycle through v, or None when no cycle is found.

        None also covers an orbit that escapes the carrier (closure violation).
        """
        trail = self.orbit(v, max_steps)
        if not trail:
            return None
        try:
            # One more application from the last visited value must land on
            # the start for the trail to be a genuine cycle.
            wrap = self._transform(trail[-1])
        except (ValueError, KeyError):
            return None
        return len(trail) if wrap == trail[0] else None


# =============================================================================
# GRADIENT FAMILIES
# Standard gradient families for known carriers.
# Each family is itself a Pattern in a higher-order carrier.
# =============================================================================

# ── Classical Logic: V = {0, 1} ────────────────────────────────────────────

def G_neg() -> Gradient:
    """
    Classical negation on {0, 1}: v → 1 - v.

    No cost is passed, so the Gradient default of 1.0 per step applies.
    NOTE(review): if negation is meant to leave the load unchanged, this
    needs cost=0.0 — confirm against the specification.
    """
    def _flip(v):
        return 1 - v

    return Gradient(
        "neg",
        _flip,
        domain={0, 1},
        description="Classical negation: v → 1 - v",
    )

def G_and() -> Gradient:
    """
    Conjunction as a binary gradient.

    A tuple designation (a, b, ...) is reduced to int(a and b);
    any non-tuple designation is passed through unchanged.
    """
    def _conjoin(v):
        if not isinstance(v, tuple):
            return v
        return int(v[0] and v[1])

    return Gradient(
        "and",
        _conjoin,
        domain=None,
        description="Classical conjunction",
    )

def G_or() -> Gradient:
    """
    Disjunction as a binary gradient.

    A tuple designation (a, b, ...) is reduced to int(a or b);
    any non-tuple designation is passed through unchanged.
    """
    def _disjoin(v):
        if not isinstance(v, tuple):
            return v
        return int(v[0] or v[1])

    return Gradient(
        "or",
        _disjoin,
        domain=None,
        description="Classical disjunction",
    )

def G_id() -> Gradient:
    """
    Identity gradient: returns the designation unchanged at zero cost,
    so only the history grows when a pattern passes through it.
    """
    def _same(v):
        return v

    return Gradient(
        "id",
        _same,
        cost=0.0,
        description="Identity: v → v, zero cost",
    )

# ── Fuzzy Logic: V = {0, 0.5, 1} ───────────────────────────────────────────

def G_fuzzy_neg() -> Gradient:
    """
    Fuzzy negation: v → 1 - v, declared on the carrier {0, 0.5, 1}.

    Same formula as classical negation on a richer carrier: 0.5 maps to
    itself, so it is a fixed point and excluded middle fails there.
    """
    def _complement(v):
        return 1 - v

    return Gradient(
        "fuzzy_neg",
        _complement,
        domain={0, 0.5, 1},
        description="Fuzzy negation: v → 1-v on {0, 0.5, 1}",
    )

def G_lukasiewicz_and() -> Gradient:
    """
    Łukasiewicz conjunction.

    A tuple designation (a, b, ...) becomes max(0, a + b - 1);
    any non-tuple designation is passed through unchanged.
    """
    def _luk(v):
        if not isinstance(v, tuple):
            return v
        return max(0, v[0] + v[1] - 1)

    return Gradient(
        "luk_and",
        _luk,
        description="Łukasiewicz conjunction",
    )

# ── Arithmetic: V = ℕ, ℤ, ℚ, ℝ ─────────────────────────────────────────────

def G_succ() -> Gradient:
    """
    Successor: v → v + 1.

    Closed on all of ℕ; no finite number is mapped to itself.
    """
    def _next(v):
        return v + 1

    return Gradient(
        "succ",
        _next,
        description="Successor: v → v + 1",
    )

def G_pred() -> Gradient:
    """
    Predecessor: v → v - 1.

    Not closed on ℕ = {0, 1, 2, ...} because 0 maps to -1. In the framework
    this closure violation is what forces the extension ℕ → ℤ.
    """
    def _previous(v):
        return v - 1

    return Gradient(
        "pred",
        _previous,
        description="Predecessor: v → v - 1 (forces ℕ→ℤ extension)",
    )

def G_double() -> Gradient:
    """Doubling: v → 2v. Closed on ℤ; its image is the even integers."""
    def _twice(v):
        return 2 * v

    return Gradient(
        "double",
        _twice,
        description="Doubling: v → 2v",
    )

def G_halve() -> Gradient:
    """
    Halving: v → v / 2 (true division).

    Not closed on ℤ: odd integers map to non-integers such as 1/2.
    In the framework this closure violation forces the extension ℤ → ℚ.
    """
    def _half(v):
        return v / 2

    return Gradient(
        "halve",
        _half,
        description="Halving: v → v/2 (forces ℤ→ℚ extension)",
    )

def G_sqrt() -> Gradient:
    """
    Square root: v → v ** 0.5.

    Not closed on ℚ⁺ (√2 is irrational). In the framework this closure
    violation forces the extension ℚ → ℝ.
    """
    def _root(v):
        return pow(v, 0.5)

    return Gradient(
        "sqrt",
        _root,
        description="Square root: v → √v (forces ℚ→ℝ extension)",
    )

def G_neg_sqrt() -> Gradient:
    """
    Square root extended to negative inputs.

    For v < 0 the result is the purely imaginary complex(0, √(-v));
    otherwise it is the real root v ** 0.5. Because negative reals leave ℝ,
    the framework reads this as forcing the extension ℝ → ℂ.
    """
    def _root(v):
        if v < 0:
            return complex(0, (-v) ** 0.5)
        return v ** 0.5

    return Gradient(
        "neg_sqrt",
        _root,
        description="Negative sqrt: forces ℝ→ℂ extension",
    )

# ── Modular arithmetic ──────────────────────────────────────────────────────

def G_mod(n: int, op: str = "add1") -> Gradient:
    """
    Build a gradient for modular arithmetic on ℤ/nℤ.

    Args:
        n:  the modulus; must be at least 1.
        op: which operation to wrap —
            "add1"   v → (v + 1) mod n
            "add2"   v → (v + 2) mod n
            "neg"    v → (-v) mod n
            "double" v → (2v) mod n

    Returns:
        A Gradient named "mod{n}_{op}" whose declared domain is {0, ..., n-1}.

    Raises:
        ValueError: if n is smaller than 1 or op is not one of the names above.
    """
    # Reject a bad modulus up front: n == 0 would otherwise only fail with
    # ZeroDivisionError on first use, and n < 0 would pair an empty declared
    # domain with a transform that still produces values.
    if n < 1:
        raise ValueError(f"Modulus must be a positive integer, got {n!r}")
    ops = {
        "add1": lambda v: (v + 1) % n,
        "add2": lambda v: (v + 2) % n,
        "neg":  lambda v: (-v) % n,
        "double": lambda v: (2 * v) % n,
    }
    if op not in ops:
        raise ValueError(f"Unknown op {op!r}. Choose from {list(ops)}")
    return Gradient(
        name=f"mod{n}_{op}",
        transform=ops[op],
        domain=set(range(n)),
        description=f"Mod-{n} {op}",
    )

# ── Custom gradient ─────────────────────────────────────────────────────────

def G_custom(name: str, mapping: Dict[Any, Any], cost: float = 1.0) -> Gradient:
    """
    Build a gradient from an explicit lookup table.

    The transform returns mapping[v] and raises ValueError for any value
    that is not a key of the mapping. The declared domain is the mapping's
    key set as it stands when the gradient is built.

    This is the 'novel carrier' entry point for boundary condition
    extrapolation: any carrier, any domain.
    """
    def _lookup(v: Any) -> Any:
        if v in mapping:
            return mapping[v]
        raise ValueError(
            f"G[{name}]: value {v!r} not in mapping {set(mapping.keys())}. "
            f"Carrier extension may be required."
        )

    declared_domain = set(mapping.keys())
    summary = f"Custom gradient with mapping {mapping}"
    return Gradient(
        name=name,
        transform=_lookup,
        cost=cost,
        domain=declared_domain,
        description=summary,
    )


# =============================================================================
# GRADIENT FAMILY REGISTRY
# Standard (V, Γ) configurations and what they force.
# Used by the engine and the data generator.
# =============================================================================

# Registry of named (carrier, gradient family) configurations.
#
# Every entry carries the same five keys:
#   "description" : human-readable label
#   "carrier"     : the set V of designation values (a finite sample where
#                   the true carrier is unbounded)
#   "gradients"   : zero-argument callable returning a freshly built list of
#                   Gradient objects each time it is called
#   "designated"  : the values treated as designated for this system
#   "forced"      : list of string tags naming the properties the
#                   configuration is expected to force
KNOWN_SYSTEMS = {
    "classical_logic": {
        "description": "Classical two-valued logic",
        "carrier": {0, 1},
        "gradients": lambda: [G_neg(), G_id()],
        "designated": {1},
        "forced": ["closure", "involution", "excluded_middle", "double_negation"],
    },
    "three_valued_logic": {
        "description": "Three-valued (Łukasiewicz) logic",
        "carrier": {0, 0.5, 1},
        "gradients": lambda: [G_fuzzy_neg(), G_id()],
        "designated": {1},
        "forced": ["closure", "middle_value_fixed", "excluded_middle_fails"],
    },
    # NOTE(review): the description mentions predecessor, but only G_succ and
    # G_id are listed here. Also, succ maps 9 to 10, which lies outside this
    # finite sample — confirm how the consumer treats the sample boundary.
    "natural_numbers": {
        "description": "ℕ with successor (closed) and predecessor (not closed)",
        "carrier": set(range(10)),    # finite sample; full ℕ is unbounded
        "gradients": lambda: [G_succ(), G_id()],
        "designated": {1},
        "forced": ["closure_under_succ", "no_fixed_points_succ"],
    },
    # Predecessor on a non-negative sample: 0 maps to -1, outside the carrier.
    "integers_forced": {
        "description": "ℕ ∪ predecessor → forces ℤ",
        "carrier": {0, 1, 2, 3, 4},
        "gradients": lambda: [G_pred(), G_id()],
        "designated": {1},
        "forced": ["closure_violation", "negative_extension_forced"],
    },
    # Halving on an integer sample: odd values map to non-integers.
    "rationals_forced": {
        "description": "ℤ ∪ halving → forces ℚ",
        "carrier": {-2, -1, 0, 1, 2, 3, 4},
        "gradients": lambda: [G_halve(), G_id()],
        "designated": {1},
        "forced": ["closure_violation", "rational_extension_forced"],
    },
    # The two cyclic groups designate 0, unlike the other entries (which use 1).
    "Z4": {
        "description": "Cyclic group ℤ/4ℤ",
        "carrier": {0, 1, 2, 3},
        "gradients": lambda: [G_mod(4, "add1"), G_id()],
        "designated": {0},
        "forced": ["closure", "uniform_4_cycle", "no_fixed_points"],
    },
    "Z2": {
        "description": "Cyclic group ℤ/2ℤ (bit flip)",
        "carrier": {0, 1},
        "gradients": lambda: [G_mod(2, "add1"), G_id()],
        "designated": {0},
        "forced": ["closure", "involution"],
    },
}


# =============================================================================
# PROPAGATION CHAIN
# Records a sequence of P / G → Q steps.
# This is the training unit for the mechanism-first model.
# =============================================================================

@dataclass
class PropagationChain:
    """
    An ordered record of propagation events.

    Step 0: P_0 / G_0 → P_1
    Step 1: P_1 / G_1 → P_2
    ...
    Step n: P_n / G_n → P_{n+1}

    Each step is stored as an (input pattern, gradient, output pattern)
    triple. A chain is the training unit: the mechanism running rather than
    prose about the mechanism.
    """
    steps: List[Tuple[Pattern, Gradient, Pattern]] = field(default_factory=list)
    context: Optional[Context] = None
    carrier: Optional[Set] = None

    def add(self, p_in: Pattern, g: Gradient, p_out: Pattern):
        """Append one recorded step to this chain."""
        self.steps.append((p_in, g, p_out))

    def run(self, initial: Pattern, gradients: List[Gradient]) -> "PropagationChain":
        """
        Propagate `initial` through `gradients` in order.

        Returns a NEW chain that shares this chain's context and carrier;
        the steps already recorded on this instance are neither used
        nor modified.
        """
        result = PropagationChain(context=self.context, carrier=self.carrier)
        state = initial
        for grad in gradients:
            successor = grad.propagate(state)
            result.steps.append((state, grad, successor))
            state = successor
        return result

    def as_text(self) -> str:
        """
        Render the chain as training text, one line per step, preceded by a
        CARRIER line when a non-empty carrier is set. This is the format the
        LM learns to predict.
        """
        # Carrier elements are ordered by their string form so that
        # mixed-type carriers can still be sorted.
        header = (
            [f"CARRIER: {sorted(self.carrier, key=str)}"] if self.carrier else []
        )
        body = [
            f"STEP {idx}: P(v={src.v!r}, L={src.L:.1f}) / G[{grad.name}] "
            f"→ Q(v={dst.v!r}, L={dst.L:.1f})"
            for idx, (src, grad, dst) in enumerate(self.steps)
        ]
        return "\n".join(header + body)

    def demand_profile(self) -> List[float]:
        """
        Demand of each step's output pattern, in step order.

        Rising values mean the chain is moving away from coherence; falling
        values mean it is moving toward it. Returns an empty list when the
        chain has no context to measure against.
        """
        ctx = self.context
        if not ctx:
            return []
        profile = []
        for _src, _grad, dst in self.steps:
            profile.append(ctx.demand(dst))
        return profile

    def __len__(self) -> int:
        """Number of recorded steps."""
        return len(self.steps)

    def __repr__(self) -> str:
        count = len(self.steps)
        return f"Chain({count} steps)"