From 97ab02da4334afc1487d01634ea9a018bbf69f1e Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 4 Nov 2025 02:38:08 +0200 Subject: [PATCH 01/12] Add CRCAAgent to agent imports and types --- swarms/agents/__init__.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/swarms/agents/__init__.py b/swarms/agents/__init__.py index ca3d52e6..f8bc09f1 100644 --- a/swarms/agents/__init__.py +++ b/swarms/agents/__init__.py @@ -3,6 +3,7 @@ from swarms.agents.consistency_agent import SelfConsistencyAgent from swarms.agents.create_agents_from_yaml import ( create_agents_from_yaml, ) +from swarms.agents.cr_ca_agent import CRCAAgent from swarms.agents.flexion_agent import ReflexionAgent from swarms.agents.gkp_agent import GKPAgent from swarms.agents.i_agent import IterativeReflectiveExpansion @@ -22,4 +23,5 @@ __all__ = [ "ReflexionAgent", "GKPAgent", "AgentJudge", + "CRCAAgent", ] From 12e3607dee038f85438d68aba67de4fb956a1dbb Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 4 Nov 2025 02:39:56 +0200 Subject: [PATCH 02/12] Created CR-CA agent.py --- swarms/agents/cr_ca_agent.py | 4522 ++++++++++++++++++++++++++++++++++ 1 file changed, 4522 insertions(+) create mode 100644 swarms/agents/cr_ca_agent.py diff --git a/swarms/agents/cr_ca_agent.py b/swarms/agents/cr_ca_agent.py new file mode 100644 index 00000000..3533c98a --- /dev/null +++ b/swarms/agents/cr_ca_agent.py @@ -0,0 +1,4522 @@ +from swarms.structs.agent import Agent +from typing import Dict, Any, List, Tuple, Optional, Union, Callable +import networkx as nx +import numpy as np +from dataclasses import dataclass +from enum import Enum +import math +from functools import lru_cache +from collections import defaultdict +from itertools import combinations +import pandas as pd +from scipy import stats as scipy_stats +from scipy.optimize import minimize, differential_evolution, minimize_scalar, basinhopping +from scipy.spatial.distance import euclidean, cosine, jensenshannon +from scipy.linalg import cholesky, inv, pinv +try: + import cvxpy as cp + CVXPY_AVAILABLE = True +except ImportError: + CVXPY_AVAILABLE = False + + +class CausalRelationType(Enum): + """Types of causal relationships""" + DIRECT = "direct" + INDIRECT = "indirect" + CONFOUNDING = "confounding" + MEDIATING = "mediating" + MODERATING = "moderating" + + +@dataclass +class CausalNode: + """Represents a node in the causal graph""" + name: str + value: Optional[float] = None + confidence: float = 1.0 + node_type: str = "variable" + + +@dataclass +class CausalEdge: + """Represents an edge in the causal graph""" + source: str + target: str + strength: float = 1.0 + relation_type: CausalRelationType = CausalRelationType.DIRECT + confidence: float = 1.0 + + +@dataclass +class CounterfactualScenario: + """Represents a counterfactual scenario""" + name: str + interventions: Dict[str, float] + expected_outcomes: Dict[str, float] + probability: float = 1.0 + reasoning: str = "" + + +class CRCAAgent: + """ + Causal Reasoning with Counterfactual Analysis Agent. + + This agent performs sophisticated causal inference and counterfactual reasoning + to understand cause-and-effect relationships and explore alternative scenarios. 
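+
+    Example (a minimal, illustrative sketch; variable names are hypothetical
+    and constructing the agent assumes a configured swarms LLM backend):
+
+        >>> agent = CRCAAgent(
+        ...     variables=["price", "demand", "revenue"],
+        ...     causal_edges=[("price", "demand"), ("demand", "revenue")],
+        ... )
+        >>> agent.add_causal_relationship("price", "demand", strength=-0.8)
+        >>> agent._predict_outcomes({"price": 10.0, "demand": 5.0}, {"price": 12.0})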
+ """ + + def __init__( + self, + name: str = "cr-ca-agent", + description: str = "Causal Reasoning with Counterfactual Analysis agent", + model_name: str = "openai/gpt-4o", + max_loops: int = 3, + causal_graph: Optional[nx.DiGraph] = None, + variables: Optional[List[str]] = None, + causal_edges: Optional[List[Tuple[str, str]]] = None, + ): + """ + Initialize the CR-CA Agent. + + Args: + name: Agent name + description: Agent description + model_name: LLM model to use + max_loops: Maximum reasoning loops + causal_graph: Pre-built causal graph + variables: List of variable names + causal_edges: List of causal relationships (source, target) + """ + self.name = name + self.description = description + self.model_name = model_name + self.max_loops = max_loops + + # Initialize causal graph + self.causal_graph = causal_graph or nx.DiGraph() + if variables: + self.causal_graph.add_nodes_from(variables) + if causal_edges: + self.causal_graph.add_edges_from(causal_edges) + + # Initialize agent with CR-CA schema + self.agent = Agent( + agent_name=self.name, + agent_description=self.description, + model_name=self.model_name, + max_loops=1, + tools_list_dictionary=[self._get_cr_ca_schema()], + output_type="final", + ) + + # Memory for storing causal analysis history + self.causal_memory: List[Dict[str, Any]] = [] + self.counterfactual_scenarios: List[CounterfactualScenario] = [] + # Standardization statistics for each variable: {'var': {'mean': m, 'std': s}} + self.standardization_stats: Dict[str, Dict[str, float]] = {} + # Optional history of learned edge strengths for temporal tracking + self.edge_strength_history: List[Dict[Tuple[str, str], float]] = [] + # Optional constraints: enforce monotonic signs on edges { (u,v): +1|-1 } + self.edge_sign_constraints: Dict[Tuple[str, str], int] = {} + # Random number generator for probabilistic methods + self.rng = np.random.default_rng() + + # Performance: caching for expensive computations + self._prediction_cache: Dict[Tuple[tuple, tuple], Dict[str, float]] = {} + self._cache_enabled: bool = True + self._cache_max_size: int = 1000 + + # Non-linear extensions: interaction terms {node: [list of parent pairs to interact]} + self.interaction_terms: Dict[str, List[Tuple[str, str]]] = {} + + # Information theory cache + self._entropy_cache: Dict[str, float] = {} + self._mi_cache: Dict[Tuple[str, str], float] = {} + + # Bayesian inference: prior distributions {edge: {'mu': μ₀, 'sigma': σ₀}} + self.bayesian_priors: Dict[Tuple[str, str], Dict[str, float]] = {} + + def _get_cr_ca_schema(self) -> Dict[str, Any]: + """Get the CR-CA agent schema for structured reasoning.""" + return { + "type": "function", + "function": { + "name": "generate_causal_analysis", + "description": "Generates structured causal reasoning and counterfactual analysis", + "parameters": { + "type": "object", + "properties": { + "causal_analysis": { + "type": "string", + "description": "Analysis of causal relationships and mechanisms" + }, + "intervention_planning": { + "type": "string", + "description": "Planned interventions to test causal hypotheses" + }, + "counterfactual_scenarios": { + "type": "array", + "items": { + "type": "object", + "properties": { + "scenario_name": {"type": "string"}, + "interventions": {"type": "object"}, + "expected_outcomes": {"type": "object"}, + "reasoning": {"type": "string"} + } + }, + "description": "Multiple counterfactual scenarios to explore" + }, + "causal_strength_assessment": { + "type": "string", + "description": "Assessment of causal relationship 
strengths and confounders" + }, + "optimal_solution": { + "type": "string", + "description": "Recommended optimal solution based on causal analysis" + } + }, + "required": [ + "causal_analysis", + "intervention_planning", + "counterfactual_scenarios", + "causal_strength_assessment", + "optimal_solution" + ] + } + } + } + + def add_causal_relationship( + self, + source: str, + target: str, + strength: float = 1.0, + relation_type: CausalRelationType = CausalRelationType.DIRECT, + confidence: float = 1.0 + ) -> None: + """Add a causal relationship to the graph.""" + self.causal_graph.add_edge(source, target) + self.causal_graph[source][target].update({ + 'strength': strength, + 'relation_type': relation_type, + 'confidence': confidence + }) + + def identify_causal_chain(self, start: str, end: str) -> List[str]: + """Identify the causal chain between two variables.""" + try: + path = nx.shortest_path(self.causal_graph, start, end) + return path + except nx.NetworkXNoPath: + return [] + + def detect_confounders(self, treatment: str, outcome: str) -> List[str]: + """Detect potential confounders for a treatment-outcome relationship.""" + confounders = [] + + # Find common ancestors + treatment_ancestors = set(nx.ancestors(self.causal_graph, treatment)) + outcome_ancestors = set(nx.ancestors(self.causal_graph, outcome)) + common_ancestors = treatment_ancestors.intersection(outcome_ancestors) + + # Check if common ancestors are connected to both treatment and outcome + for ancestor in common_ancestors: + if (nx.has_path(self.causal_graph, ancestor, treatment) and + nx.has_path(self.causal_graph, ancestor, outcome)): + confounders.append(ancestor) + + return confounders + + def generate_counterfactual_scenarios( + self, + factual_state: Dict[str, float], + target_variables: List[str], + max_scenarios: int = 5 + ) -> List[CounterfactualScenario]: + """Generate counterfactual scenarios for given variables.""" + scenarios = [] + + for i, target_var in enumerate(target_variables[:max_scenarios]): + # Use standardized z-score increments to avoid exploding magnitudes + stats = self.standardization_stats.get(target_var, {"mean": 0.0, "std": 1.0}) + z_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0] + current_raw = factual_state.get(target_var, 0.0) + # Map current value to z space (if stats available) + if stats["std"] > 0: + current_z = (current_raw - stats["mean"]) / stats["std"] + else: + current_z = 0.0 + # Propose interventions around current z value + proposed_z_values = [current_z + dz for dz in z_steps] + # Convert back to raw for simulation + intervention_values = [ + (z * stats["std"]) + stats["mean"] for z in proposed_z_values + ] + + for j, intervention_value in enumerate(intervention_values): + scenario = CounterfactualScenario( + name=f"scenario_{i}_{j}", + interventions={target_var: intervention_value}, + expected_outcomes=self._predict_outcomes(factual_state, {target_var: intervention_value}), + probability=self._calculate_scenario_probability(factual_state, {target_var: intervention_value}), + reasoning=f"Intervention on {target_var} with value {intervention_value}" + ) + scenarios.append(scenario) + + return scenarios + + def _standardize_state(self, state: Dict[str, float]) -> Dict[str, float]: + """Convert raw state dict to standardized z-scores using stored stats.""" + z: Dict[str, float] = {} + for k, v in state.items(): + stats = self.standardization_stats.get(k) + if stats and stats.get("std", 0.0) > 0: + z[k] = (v - stats["mean"]) / stats["std"] + else: + z[k] = v + return z + + def 
_destandardize_value(self, var: str, z_value: float) -> float: + """Convert a z-score back to raw value for a specific variable.""" + stats = self.standardization_stats.get(var) + if stats and stats.get("std", 0.0) > 0: + return z_value * stats["std"] + stats["mean"] + return z_value + + def _predict_outcomes( + self, + factual_state: Dict[str, float], + interventions: Dict[str, float], + use_cache: bool = True, + ) -> Dict[str, float]: + """ + Predict outcomes given interventions using standardized linear propagation. + + Mathematical foundation: + - Structural Equation Model (SEM): y = Xβ + ε where β are structural coefficients + - Do-operator: do(X=x) sets X=x, removing its dependence on parents + - In z-space (standardized): z_y = Σᵢ βᵢ·z_xi + z_ε + - Propagation: topological order ensures parents computed before children + + Standardization: z = (x - μ)/σ where μ is mean, σ is standard deviation + This ensures numerical stability and scale-invariance. + + Linear SCM: Each node y has equation y = Σᵢ βᵢ·xᵢ + ε + where xᵢ are parents, βᵢ are edge strengths, ε is noise. + + Args: + factual_state: Current state + interventions: Interventions to apply + use_cache: Whether to use prediction cache + + Returns: + Predicted outcomes + """ + # Note: Caching is handled by _predict_outcomes_cached wrapper + # This method is the actual computation (call with use_cache=False from cache wrapper) + # Merge states and convert to z-space + # Standardization: z = (x - μ)/σ (z-score transformation) + raw_state = factual_state.copy() + raw_state.update(interventions) + z_state = self._standardize_state(raw_state) + + # Work on a copy to avoid mutating initial inputs + z_pred = dict(z_state) + + # Propagate in topological order (ensures parents computed before children) + # Topological sort: linearization of DAG respecting causal ordering + for node in nx.topological_sort(self.causal_graph): + if node in interventions: + # Do-operator: do(X=x) forces X=x, breaking dependence on parents + # If directly intervened, keep its standardized value as-is + if node not in z_pred: + z_pred[node] = z_state.get(node, 0.0) + continue + + predecessors = list(self.causal_graph.predecessors(node)) + if not predecessors: + # Exogenous nodes (no parents): z_node = z_ε (noise term) + continue + + # Linear structural equation: z_y = Σᵢ βᵢ·z_xi + # This is the structural causal model (SCM) equation in z-space + effect_z = 0.0 + for parent in predecessors: + parent_z = z_pred.get(parent) + if parent_z is None: + parent_z = z_state.get(parent, 0.0) + edge_data = self.causal_graph[parent][node] + strength = edge_data.get('strength', 0.0) # Structural coefficient βᵢ + # Linear combination: z_y = Σᵢ βᵢ·z_xi + effect_z += parent_z * strength + + z_pred[node] = effect_z # Store predicted z-score + + # Convert back to raw value space using inverse standardization + # De-standardization: x = z·σ + μ + predicted_state: Dict[str, float] = {} + for var, z_val in z_pred.items(): + predicted_state[var] = self._destandardize_value(var, z_val) + return predicted_state + + def _calculate_scenario_probability( + self, + factual_state: Dict[str, float], + interventions: Dict[str, float] + ) -> float: + """ + Calculate smoothed probability using standardized z-distance. 
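+
+        For intuition (illustrative numbers): a single intervention that moves one
+        variable by one standard deviation gives ||dz||² = 1, so the formulation
+        below yields p = 0.95·exp(-0.5) + 0.05 ≈ 0.63.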
+ + Mathematical formulation: + - Compute z-score deltas: dz_i = z_new_i - z_old_i for each intervened variable + - L2 norm squared: ||dz||² = Σᵢ (dz_i)² + - Gaussian-like probability: p = 0.95 * exp(-0.5 * ||dz||²) + 0.05 + - Bounded to [0.05, 0.98]: p = clip(p, 0.05, 0.98) + + This follows the Mahalanobis distance-based probability in multivariate Gaussian. + """ + # Step 1: Compute z-score deltas for intervened variables + # dz_i = z_new_i - z_old_i where z = (x - μ)/σ + z_sq_sum = 0.0 + for var, new_val in interventions.items(): + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + mu = stats.get('mean', 0.0) # μ: mean + sd = stats.get('std', 1.0) or 1.0 # σ: standard deviation + + # Get old value from factual state or use mean as default + old_val = factual_state.get(var, mu) + + # Compute z-scores: z = (x - μ)/σ + z_new = (new_val - mu) / sd + z_old = (old_val - mu) / sd + + # Delta in z-space: dz = z_new - z_old + dz = z_new - z_old + + # Accumulate squared L2 norm: ||dz||² = Σᵢ (dz_i)² + z_sq_sum += float(dz) * float(dz) + + # Step 2: Compute probability using exponential decay + # p = 0.95 * exp(-0.5 * ||dz||²) + 0.05 + # This gives high probability (near 0.95) when ||dz||² ≈ 0 (small intervention) + # and low probability (near 0.05) when ||dz||² is large (large intervention) + prob = 0.95 * float(np.exp(-0.5 * z_sq_sum)) + 0.05 + + # Step 3: Clip to valid probability range [0.05, 0.98] + # p = min(0.98, max(0.05, p)) + prob = max(0.05, min(0.98, prob)) + + return float(prob) + + def analyze_causal_strength(self, source: str, target: str) -> Dict[str, float]: + """Analyze the strength of causal relationship between two variables.""" + if not self.causal_graph.has_edge(source, target): + return {"strength": 0.0, "confidence": 0.0, "path_length": float('inf')} + + edge_data = self.causal_graph[source][target] + path_length = len(nx.shortest_path(self.causal_graph, source, target)) - 1 + + return { + "strength": edge_data.get('strength', 1.0), + "confidence": edge_data.get('confidence', 1.0), + "path_length": path_length, + "relation_type": edge_data.get('relation_type', CausalRelationType.DIRECT).value + } + + def fit_from_dataframe( + self, + df: Any, + variables: List[str], + window: int = 30, + decay_alpha: float = 0.9, + ridge_lambda: float = 0.0, + enforce_signs: bool = True + ) -> None: + """Fit edge strengths and standardization stats from a rolling window with recency weighting. + + For each child variable, perform a simple weighted linear regression on its parents + defined in the existing graph to estimate edge 'strength' coefficients. Also compute + mean/std for z-score scaling. Uses exponential decay weights to emphasize recent data. 
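+
+        Example (illustrative sketch; assumes the edge x→y already exists in the
+        graph and that `pd` is pandas):
+
+            >>> df = pd.DataFrame({"x": range(40), "y": [2 * i for i in range(40)]})
+            >>> agent.add_causal_relationship("x", "y")
+            >>> agent.fit_from_dataframe(df, variables=["x", "y"], window=30)
+            >>> agent.causal_graph["x"]["y"]["strength"]  # ≈ 1.0 in z-space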
+ """ + if df is None or len(df) == 0: + return + df_local = df[variables].dropna().copy() + if len(df_local) < max(3, window): + # Still compute stats on available data + pass + # Use the last `window` rows + window_df = df_local.tail(window) + n = len(window_df) + # Exponential decay weights: newer rows get higher weights + # Oldest gets alpha^(n-1), newest gets alpha^0 = 1.0 + weights = np.array([decay_alpha ** (n - 1 - i) for i in range(n)], dtype=float) + weights = weights / (weights.sum() if weights.sum() != 0 else 1.0) + + # Compute standardization stats + self.standardization_stats = {} + for v in variables: + m = float(window_df[v].mean()) + s = float(window_df[v].std(ddof=0)) + if s == 0: + s = 1.0 + self.standardization_stats[v] = {"mean": m, "std": s} + # Ensure default stats for any graph node not in the window variables + for node in self.causal_graph.nodes(): + if node not in self.standardization_stats: + self.standardization_stats[node] = {"mean": 0.0, "std": 1.0} + + # Estimate edge strengths per node from its parents + learned_strengths: Dict[Tuple[str, str], float] = {} + for child in self.causal_graph.nodes(): + parents = list(self.causal_graph.predecessors(child)) + if not parents: + continue + # Skip children not present in the data window + if child not in window_df.columns: + continue + # Prepare standardized design matrix X (parents) and target y (child) + X_cols = [] + for p in parents: + if p in window_df.columns: + X_cols.append(((window_df[p] - self.standardization_stats[p]["mean"]) / self.standardization_stats[p]["std"]).values) + if not X_cols: + continue + X = np.vstack(X_cols).T # shape (n, k) + y = ((window_df[child] - self.standardization_stats[child]["mean"]) / self.standardization_stats[child]["std"]).values + # Weighted least squares: (X' W X)^{-1} X' W y + W = np.diag(weights) + XtW = X.T @ W + XtWX = XtW @ X + # Ridge regularization for stability + if ridge_lambda > 0 and XtWX.size > 0: + k = XtWX.shape[0] + XtWX = XtWX + ridge_lambda * np.eye(k) + try: + XtWX_inv = np.linalg.pinv(XtWX) + beta = XtWX_inv @ (XtW @ y) + except Exception: + beta = np.zeros(X.shape[1]) + # Assign strengths to edges in order of parents + for idx, p in enumerate(parents): + strength = float(beta[idx]) if idx < len(beta) else 0.0 + # Enforce monotonic sign constraints if requested + if enforce_signs: + sign = self.edge_sign_constraints.get((p, child)) + if sign == 1 and strength < 0: + strength = 0.0 + elif sign == -1 and strength > 0: + strength = 0.0 + if self.causal_graph.has_edge(p, child): + self.causal_graph[p][child]['strength'] = strength + self.causal_graph[p][child]['confidence'] = 1.0 + learned_strengths[(p, child)] = strength + # Track history for temporal drift analysis + self.edge_strength_history.append(learned_strengths) + + # Enforce DAG: if cycles exist, iteratively remove weakest edge in cycles + try: + while not nx.is_directed_acyclic_graph(self.causal_graph): + cycle_edges = list(nx.find_cycle(self.causal_graph, orientation="original")) + # pick weakest edge among cycle + weakest = None + weakest_w = float("inf") + for u, v, _ in cycle_edges: + w = abs(float(self.causal_graph[u][v].get('strength', 0.0))) + if w < weakest_w: + weakest_w = w + weakest = (u, v) + if weakest: + self.causal_graph.remove_edge(*weakest) + else: + break + except Exception: + pass + + def identify_adjustment_set(self, treatment: str, outcome: str) -> List[str]: + """Heuristic back-door adjustment set selection. 
+ + Returns a set that blocks back-door paths: parents of treatment excluding descendants of treatment and the outcome itself. + """ + if treatment not in self.causal_graph or outcome not in self.causal_graph: + return [] + parents_t = set(self.causal_graph.predecessors(treatment)) + descendants_t = set(nx.descendants(self.causal_graph, treatment)) + adjustment = [z for z in parents_t if z not in descendants_t and z != outcome] + return adjustment + + def estimate_ate( + self, + df: Any, + treatment: str, + outcome: str, + conditioning: Optional[List[str]] = None, + method: str = 'ols' + ) -> float: + """Estimate average treatment effect using simple regression adjustment. + + y ~ T + Z, return coefficient on T in standardized space. + """ + if df is None or len(df) == 0: + return 0.0 + if conditioning is None: + conditioning = self.identify_adjustment_set(treatment, outcome) + cols = [c for c in [outcome, treatment] + conditioning if c in df.columns] + data = df[cols].dropna() + if len(data) < 5: + return 0.0 + # Standardize + ds = (data - data.mean()) / (data.std(ddof=0).replace(0, 1.0)) + y = ds[outcome].values + X_cols = [ds[treatment].values] + [ds[c].values for c in conditioning] + X = np.vstack(X_cols).T + # OLS + try: + beta = np.linalg.pinv(X) @ y + return float(beta[0]) + except Exception: + return 0.0 + + def estimate_cate( + self, + df: Any, + treatment: str, + outcome: str, + context_by: Optional[str] = None, + num_bins: int = 3 + ) -> Dict[str, float]: + """Estimate heterogeneous effects by binning a context feature and computing local ATEs.""" + if df is None or len(df) == 0 or context_by is None or context_by not in df.columns: + return {} + series = df[context_by].dropna() + if len(series) < 10: + return {} + quantiles = np.linspace(0, 1, num_bins + 1) + bins = series.quantile(quantiles).values + bins[0] = -np.inf + bins[-1] = np.inf + cate: Dict[str, float] = {} + for i in range(num_bins): + mask = (df[context_by] > bins[i]) & (df[context_by] <= bins[i+1]) + ate_bin = self._safe_ate_bin(df[mask], treatment, outcome) + cate[f"bin_{i}"] = ate_bin + return cate + + def _safe_ate_bin(self, df: Any, treatment: str, outcome: str) -> float: + if df is None or len(df) < 5: + return 0.0 + return self.estimate_ate(df, treatment, outcome) + + def counterfactual_abduction_action_prediction( + self, + factual_state: Dict[str, float], + interventions: Dict[str, float] + ) -> Dict[str, float]: + """ + Abduction–Action–Prediction for linear-Gaussian SCM in z-space. + + Pearl's three-step counterfactual reasoning: + + 1. Abduction: Infer latent noise terms ε from factual observations + - Given factual: x_factual, compute ε = x - E[x|parents] + - For linear SCM: ε = z_y - Σᵢ βᵢ·z_xi (residual) + - This preserves the "history" that led to factual state + + 2. Action: Apply do-operator do(X=x*) to set intervention values + - do(X=x*) breaks causal dependencies: P(Y|do(X=x*)) ≠ P(Y|X=x*) + - Sets intervened variables to counterfactual values + + 3. Prediction: Propagate with new values but old noise + - Use abduced noise ε from step 1 + - Predict: y_cf = Σᵢ βᵢ·x_cfᵢ + ε (same noise, new parents) + - This gives counterfactual: "What if X had been x* instead of x_factual?" 
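+
+        Worked example (illustrative numbers): if the factual z_y = 0.9 while the
+        parents predict Σᵢ βᵢ·z_xi = 0.6, abduction infers ε̂ = 0.3; if an
+        intervention shifts the parent term to 0.2, the counterfactual is
+        z_y = 0.2 + 0.3 = 0.5 (same noise, new parents).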
+ + Mathematical foundation: + - Factual: Y = f(X, ε) where ε ~ N(0, σ²) + - Abduction: ε̂ = Y_factual - f(X_factual, 0) (infer noise from observation) + - Counterfactual: Y_cf = f(X_cf, ε̂) (same noise, different X) + """ + # Standardize factual: z = (x - μ)/σ + z = self._standardize_state(factual_state) + noise: Dict[str, float] = {} + + # Step 1: ABDUCTION - Infer latent noise terms from factual observations + # Noise represents unobserved confounders and stochastic variation + # For linear SCM: ε = z_y - Σᵢ βᵢ·z_xi (residual from linear regression) + for node in nx.topological_sort(self.causal_graph): + parents = list(self.causal_graph.predecessors(node)) + if not parents: + # Exogenous: noise equals observed value (no parents to subtract) + noise[node] = z.get(node, 0.0) + continue + + # Predicted value from structural equation: ŷ = Σᵢ βᵢ·xᵢ + pred = 0.0 + for p in parents: + w = self.causal_graph[p][node].get('strength', 0.0) # βᵢ + pred += z.get(p, 0.0) * w # Σᵢ βᵢ·z_xi + + # Abduce noise: ε = z_observed - ŷ + # This captures the deviation from deterministic prediction + noise[node] = z.get(node, 0.0) - pred + # Action + prediction + cf_raw = factual_state.copy() + cf_raw.update(interventions) + z_cf = self._standardize_state(cf_raw) + z_pred: Dict[str, float] = {} + for node in nx.topological_sort(self.causal_graph): + if node in interventions: + z_pred[node] = z_cf.get(node, 0.0) + continue + parents = list(self.causal_graph.predecessors(node)) + if not parents: + z_pred[node] = noise.get(node, 0.0) + continue + val = 0.0 + for p in parents: + w = self.causal_graph[p][node].get('strength', 0.0) + val += z_pred.get(p, z_cf.get(p, 0.0)) * w + z_pred[node] = val + noise.get(node, 0.0) + # De-standardize + out: Dict[str, float] = {k: self._destandardize_value(k, v) for k, v in z_pred.items()} + return out + + def quantify_uncertainty( + self, + df: Any, + variables: List[str], + windows: int = 200, + alpha: float = 0.95 + ) -> Dict[str, Any]: + """Bootstrap strengths and produce confidence intervals per edge. + + If PyMC is available, provide a Bayesian posterior CI as well (best effort). 
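+
+        Example (illustrative sketch; `df` is assumed to hold the graph's
+        variables as columns):
+
+            >>> report = agent.quantify_uncertainty(df, variables=["x", "y"], windows=100)
+            >>> report["edge_cis"].get("x->y")  # (low, high) bootstrap CI for the strength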
+        """
+        if df is None or len(df) == 0:
+            return {"edge_cis": {}, "samples": 0}
+        samples: Dict[Tuple[str, str], List[float]] = {}
+        usable = df[variables].dropna()
+        if len(usable) < 10:
+            return {"edge_cis": {}, "samples": 0}
+        idx = np.arange(len(usable))
+        # Snapshot current strengths: each bootstrap refit mutates the graph,
+        # so restore the original fit once sampling is done.
+        original_strengths = {
+            (u, v): float(self.causal_graph[u][v].get('strength', 0.0))
+            for u, v in self.causal_graph.edges()
+        }
+        for _ in range(windows):
+            boot_idx = np.random.choice(idx, size=len(idx), replace=True)
+            boot_df = usable.iloc[boot_idx]
+            self.fit_from_dataframe(boot_df, variables=variables, window=min(30, len(boot_df)))
+            for u, v in self.causal_graph.edges():
+                w = float(self.causal_graph[u][v].get('strength', 0.0))
+                samples.setdefault((u, v), []).append(w)
+        # Restore pre-bootstrap strengths (DAG enforcement may have pruned edges)
+        for (u, v), w in original_strengths.items():
+            if self.causal_graph.has_edge(u, v):
+                self.causal_graph[u][v]['strength'] = w
+        edge_cis: Dict[str, Tuple[float, float]] = {}
+        for (u, v), arr in samples.items():
+            arr = np.array(arr)
+            lo = float(np.quantile(arr, (1 - alpha) / 2))
+            hi = float(np.quantile(arr, 1 - (1 - alpha) / 2))
+            edge_cis[f"{u}->{v}"] = (lo, hi)
+        out: Dict[str, Any] = {"edge_cis": edge_cis, "samples": windows}
+        # Optional Bayesian: very lightweight attempt using PyMC linear model per edge
+        try:
+            import pymc as pm  # type: ignore
+            bayes_cis: Dict[str, Tuple[float, float]] = {}
+            data = usable
+            for u, v in self.causal_graph.edges():
+                if u not in data.columns or v not in data.columns:
+                    continue
+                X = (data[[u]].values).astype(float)
+                y = (data[v].values).astype(float)
+                with pm.Model() as m:
+                    beta = pm.Normal('beta', mu=0, sigma=1)
+                    sigma = pm.HalfNormal('sigma', sigma=1)
+                    mu = beta * X.flatten()
+                    pm.Normal('obs', mu=mu, sigma=sigma, observed=y)
+                    idata = pm.sampling_jax.sample_numpyro_nuts(draws=500, tune=300, chains=1, progressbar=False)
+                b_samp = np.asarray(idata.posterior['beta']).flatten()
+                bayes_cis[f"{u}->{v}"] = (float(np.quantile(b_samp, 0.05)), float(np.quantile(b_samp, 0.95)))
+            out["bayes_cis"] = bayes_cis
+        except Exception:
+            pass
+        return out
+
+    def detect_change_points(self, series: List[float], threshold: float = 2.5) -> List[int]:
+        """Simple CUSUM-like change detection; returns indices with large cumulative shifts."""
+        if not series or len(series) < 10:
+            return []
+        x = np.array(series, dtype=float)
+        mu = x.mean()
+        sigma = x.std() or 1.0
+        s = np.cumsum((x - mu) / sigma)
+        return [int(i) for i, v in enumerate(s) if abs(v) > threshold]
+
+    def learn_structure(
+        self,
+        df: Any,
+        variables: List[str],
+        corr_threshold: float = 0.2
+    ) -> None:
+        """Very simple structure learning: add edges where |corr|>threshold, enforce DAG by ordering.
+
+        Order variables as provided and only add edges from earlier to later variables.
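+
+        Example (illustrative sketch; note this clears any existing graph):
+
+            >>> agent.learn_structure(df, variables=["x", "y", "z"], corr_threshold=0.3)
+            >>> list(agent.causal_graph.edges())  # edges point from earlier to later only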
+ """ + if df is None or len(df) == 0: + return + data = df[variables].dropna() + if len(data) < 10: + return + corr = data.corr().values + self.causal_graph.clear() + self.causal_graph.add_nodes_from(variables) + n = len(variables) + for i in range(n): + for j in range(i+1, n): + if abs(corr[i, j]) >= corr_threshold: + self.add_causal_relationship(variables[i], variables[j], strength=0.0) + + def sample_joint_interventions_gaussian_copula( + self, + base_state: Dict[str, float], + variables: List[str], + df: Any, + num_samples: int = 10, + z_radius: float = 1.0 + ) -> List[Dict[str, float]]: + """Sample joint interventions using a Gaussian copula built from historical correlations in z-space.""" + out: List[Dict[str, float]] = [] + if df is None or len(df) == 0: + return out + hist = df[variables].dropna() + if len(hist) < 10: + return out + # Standardize + H = (hist - hist.mean()) / (hist.std(ddof=0).replace(0, 1.0)) + cov = np.cov(H.values.T) + # Ensure positive semi-definite via eigen clipping + eigvals, eigvecs = np.linalg.eigh(cov) + eigvals_clipped = np.clip(eigvals, 1e-6, None) + cov_psd = (eigvecs @ np.diag(eigvals_clipped) @ eigvecs.T) + mean = np.zeros(len(variables)) + z_samples = np.random.multivariate_normal(mean, cov_psd, size=num_samples) + for z in z_samples: + scaled = {} + for k, v in zip(variables, z): + scaled[k] = self._destandardize_value(k, float(np.clip(v, -z_radius, z_radius))) + out.append({**base_state, **scaled}) + return out + + def plan_interventions( + self, + target_outcome: str, + candidates: List[str], + base_state: Dict[str, float], + df: Any, + budget: float = 1.0, + num_grid: int = 5, + risk_metric: str = 'cvar', + cvar_alpha: float = 0.9 + ) -> List[Dict[str, Any]]: + """Risk-aware intervention planner. Grid-search small z-steps and penalize by CVaR proxy. + + Returns top plans with objective = expected improvement - risk_penalty. 
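+
+        Example (illustrative sketch; names are hypothetical and `df` may be
+        None to skip the CVaR risk term):
+
+            >>> plans = agent.plan_interventions(
+            ...     target_outcome="revenue",
+            ...     candidates=["price", "ad_spend"],
+            ...     base_state={"price": 10.0, "ad_spend": 5.0, "revenue": 100.0},
+            ...     df=history_df,
+            ... )
+            >>> plans[0]["var"], plans[0]["score"]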
+ """ + if not candidates: + return [] + # Build small z-grid per candidate + z_levels = np.linspace(-budget, budget, num_grid) + results: List[Dict[str, Any]] = [] + for var in candidates: + for z in z_levels: + # Convert z-shift to raw using stats + raw_shift = self._destandardize_value(var, z) - self._destandardize_value(var, 0.0) + trial_state = base_state.copy() + trial_state[var] = base_state.get(var, 0.0) + raw_shift + # Predict deterministic outcome + pred = self._predict_outcomes(base_state, {var: trial_state[var]}) + benefit = pred.get(target_outcome, 0.0) - base_state.get(target_outcome, 0.0) + # Risk via bootstrap strengths if data provided + risk_penalty = 0.0 + if df is not None and risk_metric == 'cvar': + unc = self.quantify_uncertainty(df, variables=list(set(candidates + [target_outcome])), windows=100, alpha=cvar_alpha) + # Build perturbed outcomes by sampling edge strengths from CIs midpoint +/- half-range + edge_cis = unc.get('edge_cis', {}) + outcomes = [] + for _ in range(50): + # Temporarily perturb strengths + saved: Dict[Tuple[str, str], float] = {} + for (u, v) in self.causal_graph.edges(): + key = f"{u}->{v}" + if key in edge_cis: + lo, hi = edge_cis[key] + w = float(np.random.uniform(lo, hi)) + saved[(u, v)] = self.causal_graph[u][v]['strength'] + self.causal_graph[u][v]['strength'] = w + p = self._predict_outcomes(base_state, {var: trial_state[var]}).get(target_outcome, 0.0) + outcomes.append(p) + # Restore + for (u, v), w in saved.items(): + self.causal_graph[u][v]['strength'] = w + outcomes = np.array(outcomes) + losses = base_state.get(target_outcome, 0.0) - outcomes + tail = np.quantile(losses, cvar_alpha) + risk_penalty = float(losses[losses >= tail].mean()) if np.any(losses >= tail) else 0.0 + score = benefit - risk_penalty + results.append({ + 'var': var, + 'z': float(z), + 'raw_shift': float(raw_shift), + 'benefit': float(benefit), + 'risk_penalty': float(risk_penalty), + 'score': float(score), + 'predicted': pred.get(target_outcome, 0.0) + }) + results.sort(key=lambda x: x['score'], reverse=True) + return results[:10] + + def state_space_update( + self, + prev_mean: float, + prev_var: float, + observation: float, + process_var: float = 1e-2, + obs_var: float = 1e-1 + ) -> Tuple[float, float]: + """Minimal 1D Kalman-like update returning new mean/variance.""" + # Predict + pred_mean = prev_mean + pred_var = prev_var + process_var + # Update + K = pred_var / (pred_var + obs_var) + new_mean = pred_mean + K * (observation - pred_mean) + new_var = (1 - K) * pred_var + return float(new_mean), float(new_var) + + def causal_explain_ace(self, child: str) -> Dict[str, float]: + """Decompose child prediction into parent contributions in z-space (ACE-like for linear model).""" + parents = list(self.causal_graph.predecessors(child)) + if not parents: + return {} + contrib: Dict[str, float] = {} + for p in parents: + contrib[p] = float(self.causal_graph[p][child].get('strength', 0.0)) + return contrib + + def identifiability_report(self, treatment: str, outcome: str) -> str: + """Simple do-calculus identifiability report stub based on back-door availability.""" + adj = self.identify_adjustment_set(treatment, outcome) + if adj: + return f"Effect of {treatment} on {outcome} identifiable via back-door with adjustment set: {adj}" + return f"Effect of {treatment} on {outcome} not identified by simple back-door; consider IVs or front-door." 
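+    # Example IV workflow (an illustrative comment sketch; "Z", "T", "Y" are
+    # hypothetical variable names):
+    #
+    #     agent.add_causal_relationship("Z", "T")  # instrument -> treatment
+    #     agent.add_causal_relationship("T", "Y")  # treatment -> outcome
+    #     agent.identify_instruments("T", "Y")     # -> ["Z"] when no Z->Y path exists
+    #     agent.estimate_2sls(df, "T", "Y")        # 2SLS coefficient + first-stage F
+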
+ + def identify_instruments(self, treatment: str, outcome: str) -> List[str]: + """Heuristic IV identification: candidates are parents of treatment that do not have a path to outcome. + + This enforces relevance (parent of T) and exclusion (no path to Y) in the graph structure. + """ + if treatment not in self.causal_graph or outcome not in self.causal_graph: + return [] + instruments: List[str] = [] + for z in self.causal_graph.predecessors(treatment): + # Relevance: z -> treatment by definition + # Exclusion: no path from z to outcome (strong condition) + if not nx.has_path(self.causal_graph, z, outcome): + instruments.append(z) + return instruments + + def estimate_2sls( + self, + df: Any, + treatment: str, + outcome: str, + instruments: Optional[List[str]] = None, + controls: Optional[List[str]] = None + ) -> Dict[str, Any]: + """Two-Stage Least Squares estimator for causal effect of treatment on outcome. + + Returns a dict with {'coef': float, 'first_stage_F': float, 'used_instruments': [...], 'used_controls': [...]}. + """ + result = {"coef": 0.0, "first_stage_F": 0.0, "used_instruments": [], "used_controls": []} + if df is None or len(df) == 0 or treatment not in df.columns or outcome not in df.columns: + return result + if instruments is None or len(instruments) == 0: + instruments = self.identify_instruments(treatment, outcome) + if controls is None: + controls = [] + cols_needed = [outcome, treatment] + instruments + controls + cols = [c for c in cols_needed if c in df.columns] + data = df[cols].dropna() + if len(data) < 10 or len(instruments) == 0: + return result + # Standardize + ds = (data - data.mean()) / (data.std(ddof=0).replace(0, 1.0)) + # First stage: T ~ Z + C + ZC_cols = [ds[z].values for z in instruments] + [ds[c].values for c in controls if c in ds.columns] + if not ZC_cols: + return result + X1 = np.vstack(ZC_cols).T + y1 = ds[treatment].values + X1TX1 = X1.T @ X1 + try: + beta1 = np.linalg.pinv(X1TX1) @ (X1.T @ y1) + except Exception: + return result + t_hat = X1 @ beta1 + # First-stage F-statistic proxy: var explained / residual var times dof ratio (rough heuristic) + ssr = float(((t_hat - y1.mean()) ** 2).sum()) + sse = float(((y1 - t_hat) ** 2).sum()) + k = X1.shape[1] + n = X1.shape[0] + if sse > 0 and n > k and k > 0: + result["first_stage_F"] = (ssr / k) / (sse / (n - k - 1)) + # Second stage: Y ~ T_hat + C + X2_cols = [t_hat] + [ds[c].values for c in controls if c in ds.columns] + X2 = np.vstack(X2_cols).T + y2 = ds[outcome].values + try: + beta2 = np.linalg.pinv(X2.T @ X2) @ (X2.T @ y2) + result["coef"] = float(beta2[0]) + except Exception: + result["coef"] = 0.0 + result["used_instruments"] = [z for z in instruments if z in ds.columns] + result["used_controls"] = [c for c in controls if c in ds.columns] + return result + + def find_optimal_interventions( + self, + target_outcome: str, + available_interventions: List[str], + constraints: Optional[Dict[str, Tuple[float, float]]] = None + ) -> List[Dict[str, float]]: + """Find optimal interventions to achieve target outcome.""" + if constraints is None: + constraints = {} + + optimal_interventions = [] + + # Generate intervention combinations + for intervention_var in available_interventions: + if intervention_var in constraints: + min_val, max_val = constraints[intervention_var] + test_values = np.linspace(min_val, max_val, 10) + else: + test_values = np.linspace(-2.0, 2.0, 10) + + for value in test_values: + intervention = {intervention_var: value} + predicted_outcomes = self._predict_outcomes({}, 
intervention) + + if target_outcome in predicted_outcomes: + optimal_interventions.append({ + 'intervention': intervention, + 'predicted_outcome': predicted_outcomes[target_outcome], + 'efficiency': abs(predicted_outcomes[target_outcome]) / abs(value) if value != 0 else 0 + }) + + # Sort by efficiency and return top interventions + optimal_interventions.sort(key=lambda x: x['efficiency'], reverse=True) + return optimal_interventions[:5] + + def step(self, task: str) -> str: + """Execute a single step of causal reasoning.""" + response = self.agent.run(task) + return response + + def run(self, task: str, *args, **kwargs) -> Dict[str, Any]: + """ + Run the CR-CA agent for comprehensive causal analysis. + + Args: + task: The problem or question to analyze causally + + Returns: + Dictionary containing causal analysis results + """ + # Reset memory + self.causal_memory = [] + self.counterfactual_scenarios = [] + + # Build causal analysis prompt + causal_prompt = self._build_causal_prompt(task) + + # Run causal analysis + for i in range(self.max_loops): + print(f"\nCausal Analysis Step {i+1}/{self.max_loops}") + + step_result = self.step(causal_prompt) + self.causal_memory.append({ + 'step': i + 1, + 'analysis': step_result, + 'timestamp': i + }) + + # Update prompt with previous analysis + if i < self.max_loops - 1: + memory_context = self._build_memory_context() + causal_prompt = f"{causal_prompt}\n\nPrevious Analysis:\n{memory_context}" + + # Generate final causal analysis + final_analysis = self._synthesize_causal_analysis(task) + + return { + 'task': task, + 'causal_analysis': final_analysis, + 'counterfactual_scenarios': self.counterfactual_scenarios, + 'causal_graph_info': { + 'nodes': list(self.causal_graph.nodes()), + 'edges': list(self.causal_graph.edges()), + 'is_dag': nx.is_directed_acyclic_graph(self.causal_graph) + }, + 'analysis_steps': self.causal_memory + } + + def _build_causal_prompt(self, task: str) -> str: + """Build the causal analysis prompt.""" + return f""" + You are a Causal Reasoning with Counterfactual Analysis (CR-CA) agent. + Analyze the following problem using sophisticated causal reasoning: + + Problem: {task} + + Your analysis should include: + 1. Causal Analysis: Identify cause-and-effect relationships + 2. Intervention Planning: Plan interventions to test causal hypotheses + 3. Counterfactual Scenarios: Explore multiple "what-if" scenarios + 4. Causal Strength Assessment: Evaluate relationship strengths and confounders + 5. Optimal Solution: Recommend the best approach based on causal analysis + + Current causal graph has {len(self.causal_graph.nodes())} variables and {len(self.causal_graph.edges())} relationships. 
+ """ + + def _build_memory_context(self) -> str: + """Build memory context from previous analysis steps.""" + context_parts = [] + for step in self.causal_memory[-2:]: # Last 2 steps + context_parts.append(f"Step {step['step']}: {step['analysis']}") + return "\n".join(context_parts) + + def _synthesize_causal_analysis(self, task: str) -> str: + """Synthesize the final causal analysis from all steps.""" + synthesis_prompt = f""" + Based on the causal analysis steps performed, synthesize a comprehensive + causal reasoning report for: {task} + + Include: + - Key causal relationships identified + - Recommended interventions + - Counterfactual scenarios explored + - Optimal solution with causal justification + - Confidence levels and limitations + """ + + return self.agent.run(synthesis_prompt) + + def get_causal_graph_visualization(self) -> str: + """Get a text representation of the causal graph.""" + if not self.causal_graph.nodes(): + return "Empty causal graph" + + lines = ["Causal Graph Structure:"] + lines.append(f"Nodes: {list(self.causal_graph.nodes())}") + lines.append("Edges:") + + for source, target in self.causal_graph.edges(): + edge_data = self.causal_graph[source][target] + strength = edge_data.get('strength', 1.0) + relation_type = edge_data.get('relation_type', CausalRelationType.DIRECT).value + lines.append(f" {source} -> {target} (strength: {strength}, type: {relation_type})") + + return "\n".join(lines) + + def analyze_cascading_chain_reaction( + self, + initial_intervention: Dict[str, float], + target_outcomes: List[str], + max_hops: int = 5, + include_feedback_loops: bool = True, + num_iterations: int = 3, + ) -> Dict[str, Any]: + """ + Analyze multi-layer cascading chain reactions from an intervention. + + Example: "If X affects Y, how does it cascade through Z→alpha→...→back to X?" 
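+
+        A minimal call sketch (hypothetical variable names):
+
+            >>> agent.analyze_cascading_chain_reaction(
+            ...     initial_intervention={"X": 1.5},
+            ...     target_outcomes=["Y", "Z"],
+            ...     max_hops=4,
+            ... )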
+ + Args: + initial_intervention: {variable: value} intervention to analyze + target_outcomes: Variables to trace effects to + max_hops: Maximum path length to consider + include_feedback_loops: Whether to iterate for feedback effects + num_iterations: Number of propagation iterations (for cycles) + + Returns: + Dict with causal paths, cascade probabilities, and cumulative effects + """ + # Find all paths from intervention variables to outcomes + intervention_vars = list(initial_intervention.keys()) + all_paths: Dict[str, List[List[str]]] = {} + + for inter_var in intervention_vars: + for outcome in target_outcomes: + if outcome == inter_var: + continue + + # Find all simple paths (no cycles) + try: + simple_paths = list(nx.all_simple_paths( + self.causal_graph, + inter_var, + outcome, + cutoff=max_hops + )) + if simple_paths: + all_paths[f"{inter_var}->{outcome}"] = simple_paths + except nx.NetworkXNoPath: + pass + + # Find feedback loops (paths that eventually return to intervention vars) + feedback_paths: List[List[str]] = [] + if include_feedback_loops: + for inter_var in intervention_vars: + try: + # Find cycles through inter_var + cycles = list(nx.simple_cycles(self.causal_graph)) + for cycle in cycles: + if inter_var in cycle: + # Rotate cycle to start at inter_var + idx = cycle.index(inter_var) + rotated = cycle[idx:] + cycle[:idx] + [inter_var] + feedback_paths.append(rotated) + except Exception: + pass + + # Multi-layer propagation with iterations + current_state = self._standardize_state(initial_intervention) + propagation_history: List[Dict[str, float]] = [current_state.copy()] + + for iteration in range(num_iterations): + next_state = current_state.copy() + + # Propagate through all nodes in topological order + for node in nx.topological_sort(self.causal_graph): + if node in initial_intervention and iteration == 0: + # Keep intervention value in first iteration + continue + + parents = list(self.causal_graph.predecessors(node)) + if not parents: + continue + + effect_z = 0.0 + for parent in parents: + parent_z = next_state.get(parent, current_state.get(parent, 0.0)) + edge_data = self.causal_graph[parent][node] + strength = edge_data.get('strength', 0.0) + effect_z += parent_z * strength + + next_state[node] = effect_z + + propagation_history.append(next_state.copy()) + current_state = next_state + + # Compute path strengths and probabilities + path_analyses: List[Dict[str, Any]] = [] + for path_key, paths in all_paths.items(): + for path in paths: + # Compute path strength (product of edge strengths) + path_strength = 1.0 + path_strengths_list = [] + for i in range(len(path) - 1): + u, v = path[i], path[i + 1] + edge_data = self.causal_graph[u][v] + strength = abs(edge_data.get('strength', 0.0)) + path_strength *= strength + path_strengths_list.append(strength) + + # Estimate cascade probability (stronger paths = more likely) + # Using softmax-style normalization + path_prob = min(0.95, path_strength * 0.5 + 0.05) + + path_analyses.append({ + "path": path, + "path_string": " → ".join(path), + "path_strength": float(path_strength), + "edge_strengths": path_strengths_list, + "cascade_probability": float(path_prob), + "hops": len(path) - 1, + }) + + # Feedback loop analysis + feedback_analyses: List[Dict[str, Any]] = [] + for cycle_path in feedback_paths[:10]: # Limit to top 10 cycles + cycle_strength = 1.0 + for i in range(len(cycle_path) - 1): + u, v = cycle_path[i], cycle_path[i + 1] + if self.causal_graph.has_edge(u, v): + strength = 
abs(self.causal_graph[u][v].get('strength', 0.0)) + cycle_strength *= strength + + feedback_analyses.append({ + "cycle": cycle_path, + "cycle_string": " → ".join(cycle_path), + "cycle_strength": float(cycle_strength), + "could_amplify": cycle_strength > 0.1, # Strong cycles can amplify + }) + + # Final state predictions (de-standardized) + final_predictions: Dict[str, float] = {} + for var in target_outcomes: + if var in propagation_history[-1]: + z_val = propagation_history[-1][var] + final_predictions[var] = self._destandardize_value(var, z_val) + else: + final_predictions[var] = 0.0 + + return { + "initial_intervention": initial_intervention, + "target_outcomes": target_outcomes, + "causal_paths": path_analyses, + "feedback_loops": feedback_analyses, + "propagation_history": [ + {k: self._destandardize_value(k, v) for k, v in state.items() if k in target_outcomes} + for state in propagation_history + ], + "final_predictions": final_predictions, + "summary": { + "total_paths_found": len(path_analyses), + "feedback_loops_detected": len(feedback_analyses), + "max_path_length": max([p["hops"] for p in path_analyses] + [0]), + "strongest_path": max(path_analyses, key=lambda x: x["path_strength"]) if path_analyses else None, + }, + } + + def multi_layer_whatif_analysis( + self, + scenarios: List[Dict[str, float]], + depth: int = 3, + ) -> Dict[str, Any]: + """ + Multi-layer "what-if" analysis: If X happens to Y, how would it affect? + Then: What are the chances of Z affecting alpha and causing chain reaction to X? + + Performs nested counterfactual reasoning across multiple layers. + + Args: + scenarios: List of intervention scenarios {variable: value} + depth: How many layers deep to analyze + + Returns: + Nested analysis with cascading effects and chain reaction probabilities + """ + results: List[Dict[str, Any]] = [] + + for scenario in scenarios: + # Layer 1: Direct effects + layer1_outcomes = self._predict_outcomes({}, scenario) + + # Identify affected variables (significant changes) + affected_vars = [ + var for var, val in layer1_outcomes.items() + if abs(val) > 0.01 # Threshold for "affected" + ] + + # Layer 2: What if affected vars change other things? 
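+            # (Heuristic: the top affected variables are set to 1.2x their
+            # layer-1 values below to probe second-order cascades.)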
+ layer2_scenarios: List[Dict[str, float]] = [] + for affected_var in affected_vars[:5]: # Limit to top 5 + # Create scenario where this variable is perturbed + perturbation = { + affected_var: layer1_outcomes.get(affected_var, 0.0) * 1.2 # 20% perturbation + } + layer2_scenarios.append(perturbation) + + layer2_analyses: List[Dict[str, Any]] = [] + for layer2_scen in layer2_scenarios: + layer2_outcomes = self._predict_outcomes(layer1_outcomes, layer2_scen) + + # Check for chain reactions back to original intervention vars + chain_reactions: List[Dict[str, Any]] = [] + for orig_var in scenario.keys(): + if orig_var in layer2_outcomes: + # Chain reaction detected: original var affected by cascade + chain_reactions.append({ + "original_intervention": orig_var, + "chain_path": f"{list(layer2_scen.keys())[0]} → {orig_var}", + "effect_magnitude": abs(layer2_outcomes[orig_var] - layer1_outcomes.get(orig_var, 0.0)), + "could_cause_amplification": abs(layer2_outcomes[orig_var]) > abs(scenario.get(orig_var, 0.0)), + }) + + layer2_analyses.append({ + "layer2_scenario": layer2_scen, + "layer2_outcomes": layer2_outcomes, + "chain_reactions": chain_reactions, + }) + + # Layer 3+: Deep cascade analysis (if depth > 2) + cascade_analysis = None + if depth > 2: + # Use cascading chain reaction method + all_outcomes = set(layer1_outcomes.keys()) | set(layer2_analyses[0]["layer2_outcomes"].keys() if layer2_analyses else set()) + cascade_analysis = self.analyze_cascading_chain_reaction( + initial_intervention=scenario, + target_outcomes=list(all_outcomes)[:10], # Top 10 outcomes + max_hops=5, + include_feedback_loops=True, + num_iterations=depth, + ) + + results.append({ + "scenario": scenario, + "layer1_direct_effects": layer1_outcomes, + "affected_variables": affected_vars, + "layer2_cascades": layer2_analyses, + "deep_cascade": cascade_analysis, + "chain_reaction_summary": { + "total_chain_reactions": sum(len(l2.get("chain_reactions", [])) for l2 in layer2_analyses), + "potential_amplifications": sum( + 1 for l2 in layer2_analyses + for cr in l2.get("chain_reactions", []) + if cr.get("could_cause_amplification", False) + ), + }, + }) + + return { + "multi_layer_analysis": results, + "summary": { + "total_scenarios": len(results), + "avg_chain_reactions_per_scenario": np.mean([ + r["chain_reaction_summary"]["total_chain_reactions"] for r in results + ]) if results else 0.0, + "scenarios_with_amplification": sum( + 1 for r in results + if r["chain_reaction_summary"]["potential_amplifications"] > 0 + ), + }, + } + + def deep_root_cause_analysis( + self, + problem_variable: str, + max_depth: int = 20, + min_path_strength: float = 0.01, + ) -> Dict[str, Any]: + """ + Infinitely nested root cause analysis: trace backwards to find absolute deepest causes. + + Keeps going deeper until hitting exogenous nodes or circular dependencies. + Finds the ultimate root causes that, if intervened, would solve the problem. 
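+
+        A minimal call sketch (hypothetical variable name):
+
+            >>> report = agent.deep_root_cause_analysis("defect_rate")
+            >>> report["ultimate_root_causes"][:3]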
+ + Args: + problem_variable: Variable we want to fix/understand + max_depth: Maximum backward tracing depth (safety limit) + min_path_strength: Minimum edge strength to consider + + Returns: + Root causes, causal paths, intervention opportunities + """ + if problem_variable not in self.causal_graph: + return {"error": f"Variable {problem_variable} not in causal graph"} + + # Backward tracing: find all ancestors (potential root causes) + all_ancestors = list(nx.ancestors(self.causal_graph, problem_variable)) + + # Trace paths from each ancestor to problem + root_causes: List[Dict[str, Any]] = [] + paths_to_problem: List[Dict[str, Any]] = [] + + for ancestor in all_ancestors: + try: + # Find all paths from ancestor to problem + paths = list(nx.all_simple_paths( + self.causal_graph, + ancestor, + problem_variable, + cutoff=max_depth + )) + + if paths: + # Compute path strength for each path + # Mathematical formulation: Path strength = ∏(i,j)∈Path |β_ij| + # where β_ij is the causal effect (structural coefficient) from i to j + # This follows Pearl's Structural Causal Model (SCM) path product rule + for path in paths: + # Initialize with multiplicative identity (1.0) + # Path strength represents cumulative causal effect along chain + path_strength = 1.0 + path_details = [] + + for i in range(len(path) - 1): + u, v = path[i], path[i + 1] + edge_data = self.causal_graph[u][v] + # β_ij: structural coefficient from Pearl's SCM framework + beta_ij = edge_data.get('strength', 0.0) # β_ij (signed) + strength = abs(beta_ij) # |β_ij|: magnitude for threshold check + + # Filter by minimum effect size (power analysis threshold) + # If any edge is too weak, path strength becomes 0 + if strength < min_path_strength: + path_strength = 0.0 + break + + # Multiplicative path strength: ∏(i,j)∈Path β_ij + # This follows chain rule of differentiation and causal mediation analysis + # IMPORTANT: Use signed β_ij (not |β_ij|) to preserve sign in product + # Total effect = β₁₂ · β₂₃ · ... 
· βₖ₋₁ₖ (product preserves sign)
+                            path_strength *= beta_ij  # Multiply by signed coefficient
+                            path_details.append({
+                                "edge": f"{u}→{v}",
+                                "strength": strength,
+                                "structural_coefficient": float(edge_data.get('strength', 0.0)),
+                            })
+
+                        if path_strength != 0.0:
+                            # Keep signed products: a negative total effect is a valid
+                            # (inhibitory) causal chain; only paths zeroed out by the
+                            # min-strength filter above are dropped.
+                            # Check if ancestor is exogenous (true root cause)
+                            ancestors_of_ancestor = list(nx.ancestors(self.causal_graph, ancestor))
+                            is_exogenous = len(ancestors_of_ancestor) == 0
+
+                            root_causes.append({
+                                "root_cause": ancestor,
+                                "is_exogenous": is_exogenous,
+                                "path_to_problem": path,
+                                "path_string": " → ".join(path),
+                                "path_strength": float(path_strength),
+                                "depth": len(path) - 1,
+                                "path_details": path_details,
+                            })
+
+                            paths_to_problem.append({
+                                "from": ancestor,
+                                "to": problem_variable,
+                                "path": path,
+                                "strength": float(path_strength),
+                            })
+            except Exception:
+                continue
+
+        # Rank root causes using multi-objective optimization criteria
+        # Objective: maximize f(rc) = w1·I_exo(rc) + w2·S_path(rc) - w3·D(rc)
+        # where I_exo is indicator function, S_path is path strength, D is depth
+        # Using lexicographic ordering: exogenous > |path_strength| > -depth
+        root_causes.sort(
+            key=lambda x: (
+                -x["is_exogenous"],  # Exogenous first (lexicographic priority)
+                -abs(x["path_strength"]),  # Stronger paths first (maximize |total effect|)
+                x["depth"]  # Shorter paths first (minimize intervention distance)
+            )
+        )
+
+        # Find ultimate root causes (those with no ancestors, or only circular ones)
+        ultimate_roots = [
+            rc for rc in root_causes
+            if rc["is_exogenous"] or rc["depth"] >= max_depth - 2
+        ]
+
+        return {
+            "problem_variable": problem_variable,
+            "all_root_causes": root_causes[:20],  # Top 20
+            "ultimate_root_causes": ultimate_roots[:10],  # Top 10 ultimate
+            "total_paths_found": len(paths_to_problem),
+            "max_depth_reached": max([rc["depth"] for rc in root_causes] + [0]),
+            "intervention_opportunities": [
+                {
+                    "intervene_on": rc["root_cause"],
+                    "expected_impact_on_problem": rc["path_strength"],
+                    "depth": rc["depth"],
+                    "is_exogenous": rc["is_exogenous"],
+                }
+                for rc in root_causes[:10]
+            ],
+        }
+
+    def explore_alternate_realities(
+        self,
+        factual_state: Dict[str, float],
+        target_outcome: str,
+        target_value: Optional[float] = None,
+        max_realities: int = 50,
+        max_interventions: int = 3,
+    ) -> Dict[str, Any]:
+        """
+        Explore multiple alternate realities to find the interventions that achieve the best outcome.
+
+        Searches the intervention space for intervention sets that optimize the target outcome.
+        Considers multiple possible realities and picks the best.
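+
+        A minimal call sketch (hypothetical names):
+
+            >>> best = agent.explore_alternate_realities(
+            ...     factual_state={"price": 10.0, "revenue": 100.0},
+            ...     target_outcome="revenue",
+            ...     max_realities=30,
+            ... )["best_reality"]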
+ + Args: + factual_state: Current state + target_outcome: Variable to optimize + target_value: Desired value (if None, maximize) + max_realities: Number of alternate scenarios to explore + max_interventions: Max number of simultaneous interventions + + Returns: + Best interventions, alternate realities explored, optimal outcome + """ + if target_outcome not in self.causal_graph: + return {"error": f"Target {target_outcome} not in graph"} + + # Get intervention candidates (nodes with out-edges) + intervention_candidates = [ + node for node in self.causal_graph.nodes() + if len(list(self.causal_graph.successors(node))) > 0 + and node not in [target_outcome] + ] + + realities: List[Dict[str, Any]] = [] + + # Sample intervention combinations + for _ in range(max_realities): + # Random intervention set + num_interventions = self.rng.integers(1, max_interventions + 1) + selected = self.rng.choice(intervention_candidates, size=min(num_interventions, len(intervention_candidates)), replace=False) + + # Generate intervention values (standardized perturbations) + intervention: Dict[str, float] = {} + for var in selected: + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + current = factual_state.get(var, stats["mean"]) + # Perturb by ±2 standard deviations + perturbation = self.rng.normal(0, stats["std"] * 2.0) + intervention[var] = current + perturbation + + # Predict outcome + outcome = self._predict_outcomes(factual_state, intervention) + target_val = outcome.get(target_outcome, 0.0) + + # Compute objective using L2 norm (Euclidean distance) or direct maximization + # Objective function: O(θ) = -||y(θ) - y*||₂ if target specified, else O(θ) = y(θ) + # where θ = intervention vector, y(θ) = predicted outcome, y* = target value + if target_value is not None: + # For single-dimensional: use L1 norm ||y - y*||₁ = |y - y*| + # For multi-dimensional would use: ||y - y*||₂ = √(Σ(y_i - y*_i)²) + # Negative sign for maximization (minimize distance = maximize negative distance) + distance = abs(target_val - target_value) # L1 norm: |y - y*| + objective = -distance # Negative distance (better = less distance) + else: + # Direct maximization: O(θ) = y(θ) (no target, just maximize outcome) + objective = target_val # Maximize + + realities.append({ + "interventions": intervention, + "outcome": outcome, + "target_value": target_val, + "objective": float(objective), + "delta_from_factual": target_val - factual_state.get(target_outcome, 0.0), + }) + + # Sort by objective (best first) + realities.sort(key=lambda x: x["objective"], reverse=True) + + # Best reality + best = realities[0] if realities else None + + # Pareto frontier (if multi-objective) + pareto_realities = [] + if len(realities) > 1: + # Simple Pareto: if reality A is better on target and not worse on others + for r in realities[:20]: # Top 20 + is_dominated = False + for other in realities: + if other is r: + continue + # Check if other dominates + if (other["objective"] >= r["objective"] and + other["delta_from_factual"] >= r["delta_from_factual"] and + (other["objective"] > r["objective"] or other["delta_from_factual"] > r["delta_from_factual"])): + is_dominated = True + break + if not is_dominated: + pareto_realities.append(r) + + return { + "factual_state": factual_state, + "target_outcome": target_outcome, + "target_value": target_value, + "best_reality": best, + "top_10_realities": realities[:10], + "pareto_frontier": pareto_realities[:10], + "all_realities_explored": len(realities), + "improvement_potential": ( + 
best["target_value"] - factual_state.get(target_outcome, 0.0) + if best else 0.0 + ), + } + + def historical_pattern_matching( + self, + current_state: Dict[str, float], + intervention_history: List[Dict[str, float]], + outcome_history: List[Dict[str, float]], + target_outcome: str, + similarity_threshold: float = 0.7, + ) -> Dict[str, Any]: + """ + Learn from historical interventions: reuse old reactions to create new ones. + + Finds past interventions in similar states that achieved good outcomes, + then adapts them to current state. + + Args: + current_state: Current factual state + intervention_history: List of past interventions + outcome_history: List of past outcomes (corresponding to interventions) + target_outcome: Variable to optimize + similarity_threshold: How similar states must be to reuse + + Returns: + Matched historical patterns, adapted interventions, learned strategies + """ + if len(intervention_history) != len(outcome_history) or len(intervention_history) == 0: + return {"error": "Invalid history or empty"} + + # Compute state similarity (cosine similarity in standardized space) + z_current = self._standardize_state(current_state) + matches: List[Dict[str, Any]] = [] + + for i, (intervention, outcome) in enumerate(zip(intervention_history, outcome_history)): + # Standardize historical outcome (treated as "state") + z_past = self._standardize_state(outcome) + + # Compute similarity (cosine similarity) + common_vars = set(z_current.keys()) & set(z_past.keys()) + if len(common_vars) == 0: + continue + + vec_current = np.array([z_current[v] for v in common_vars]) + vec_past = np.array([z_past[v] for v in common_vars]) + + # Cosine similarity (normalized inner product): cos(θ) = (A·B)/(||A||₂·||B||₂) + # This measures angle between vectors in standardized space + # Range: [-1, 1], where 1 = identical direction, 0 = orthogonal, -1 = opposite + norm_current = np.linalg.norm(vec_current) # L2 norm: ||v||₂ = √(Σv_i²) + norm_past = np.linalg.norm(vec_past) + + if norm_current < 1e-6 or norm_past < 1e-6: + similarity = 0.0 # Zero vectors have undefined similarity + else: + # Cosine similarity formula: cos(θ) = (v₁·v₂)/(||v₁||₂·||v₂||₂) + similarity = float(np.dot(vec_current, vec_past) / (norm_current * norm_past)) + + if similarity >= similarity_threshold: + # Historical outcome value for target + target_past = outcome.get(target_outcome, 0.0) + target_current = current_state.get(target_outcome, 0.0) + + # Did this intervention improve the target? 
+ improvement = target_past - target_current + + matches.append({ + "historical_index": i, + "similarity": similarity, + "past_intervention": intervention, + "past_outcome": outcome, + "target_improvement": float(improvement), + "was_successful": improvement > 0.0, + }) + + # Sort by similarity and success + matches.sort( + key=lambda x: (x["similarity"], x["target_improvement"]), + reverse=True + ) + + # Adapt best historical interventions to current state + adapted_interventions: List[Dict[str, Any]] = [] + for match in matches[:5]: # Top 5 matches + past_intervention = match["past_intervention"] + + # Adapt: scale by similarity and current context + adapted = {} + for var, val in past_intervention.items(): + # Adjust based on current state difference + current_val = current_state.get(var, 0.0) + past_val = past_intervention.get(var, 0.0) + + # Blend: similarity-weighted historical value + current baseline + adaptation_factor = match["similarity"] + adapted[var] = float( + current_val * (1.0 - adaptation_factor) + + past_val * adaptation_factor + ) + + # Predict outcome of adapted intervention + predicted = self._predict_outcomes(current_state, adapted) + predicted_target = predicted.get(target_outcome, 0.0) + + adapted_interventions.append({ + "source_match": match, + "adapted_intervention": adapted, + "predicted_outcome": predicted, + "predicted_target_value": float(predicted_target), + "expected_improvement": float(predicted_target - current_state.get(target_outcome, 0.0)), + }) + + # Extract learned strategy patterns + successful_interventions = [m for m in matches if m["was_successful"]] + learned_patterns: List[Dict[str, Any]] = [] + + if successful_interventions: + # Common variables in successful interventions + all_vars = set() + for m in successful_interventions: + all_vars.update(m["past_intervention"].keys()) + + for var in all_vars: + successful_vals = [ + m["past_intervention"].get(var, 0.0) + for m in successful_interventions + if var in m["past_intervention"] + ] + if successful_vals: + learned_patterns.append({ + "variable": var, + "typical_successful_value": float(np.mean(successful_vals)), + "value_range": [float(min(successful_vals)), float(max(successful_vals))], + "success_frequency": len(successful_vals) / len(successful_interventions), + }) + + return { + "current_state": current_state, + "historical_matches": matches[:10], + "best_matches": matches[:5], + "adapted_interventions": adapted_interventions, + "learned_patterns": learned_patterns, + "recommended_intervention": adapted_interventions[0]["adapted_intervention"] if adapted_interventions else {}, + "strategy_confidence": float(np.mean([m["similarity"] for m in matches[:5]])) if matches else 0.0, + } + + def infinite_nesting_root_cause( + self, + problem: str, + stop_condition: Optional[Callable[[str, int], bool]] = None, + ) -> Dict[str, Any]: + """ + Infinitely nested root cause analysis: keeps going deeper until hitting true roots. + + Unlike deep_root_cause_analysis which has max_depth, this continues until + hitting exogenous nodes or user-defined stop condition. 
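+
+        Example (a sketch; "churn" and the stop rule are hypothetical):
+
+            result = agent.infinite_nesting_root_cause(
+                problem="churn",
+                stop_condition=lambda node, depth: depth >= 12,
+            )
+            roots = result["ultimate_root_causes"]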
+ + Args: + problem: Variable to trace backwards from + stop_condition: Function(node, depth) -> bool to stop tracing + + Returns: + Ultimate root causes, full causal tree, intervention strategy + """ + if problem not in self.causal_graph: + return {"error": f"Problem {problem} not in graph"} + + visited: set = set() + causal_tree: List[Dict[str, Any]] = [] + root_nodes: List[str] = [] + + def trace_backwards(node: str, depth: int, path: List[str]) -> None: + """Recursive backward tracing.""" + if node in visited or depth > 100: # Safety limit + return + + visited.add(node) + + # Check stop condition + if stop_condition and stop_condition(node, depth): + root_nodes.append(node) + causal_tree.append({ + "node": node, + "depth": depth, + "path_to_problem": path + [node], + "is_stopped_by_condition": True, + }) + return + + # Get parents (causes) + parents = list(self.causal_graph.predecessors(node)) + + if len(parents) == 0: + # Exogenous node - true root cause + root_nodes.append(node) + causal_tree.append({ + "node": node, + "depth": depth, + "path_to_problem": path + [node], + "is_exogenous": True, + }) + return + + # Recursively trace parents + for parent in parents: + edge_data = self.causal_graph[parent][node] + strength = abs(edge_data.get('strength', 0.0)) + + causal_tree.append({ + "node": node, + "parent": parent, + "edge_strength": float(strength), + "depth": depth, + "path_to_problem": path + [node], + }) + + trace_backwards(parent, depth + 1, path + [node]) + + # Start tracing from problem + trace_backwards(problem, 0, []) + + # Unique root nodes + unique_roots = list(set(root_nodes)) + + # Build intervention strategy (intervene on shallowest exogenous nodes) + root_depths = { + root: min([ct["depth"] for ct in causal_tree if ct.get("node") == root or ct.get("parent") == root] + [999]) + for root in unique_roots + } + optimal_roots = sorted(unique_roots, key=lambda x: root_depths.get(x, 999))[:10] + + return { + "problem": problem, + "ultimate_root_causes": unique_roots, + "optimal_intervention_targets": optimal_roots, + "causal_tree": causal_tree, + "max_depth_reached": max([ct["depth"] for ct in causal_tree] + [0]), + "total_nodes_explored": len(visited), + } + + def optimal_intervention_sequence( + self, + initial_state: Dict[str, float], + target_outcomes: Dict[str, float], + max_steps: int = 5, + horizon: int = 10, + ) -> Dict[str, Any]: + """ + Find optimal sequence of interventions to achieve target outcomes. + + Uses dynamic programming / tree search to find best intervention sequence + that alters future reactions for optimal outcome. 
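+
+        Example (illustrative only; variable names and targets are placeholders):
+
+            result = agent.optimal_intervention_sequence(
+                initial_state={"spend": 1.0, "traffic": 3.0, "revenue": 5.0},
+                target_outcomes={"revenue": 8.0},
+                max_steps=3,
+                horizon=5,
+            )
+            for step_intervention in result["optimal_sequence"]:
+                print(step_intervention)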
+ + Args: + initial_state: Starting state + target_outcomes: {variable: target_value} to achieve + max_steps: Maximum intervention steps + horizon: How far ahead to optimize + + Returns: + Optimal intervention sequence, expected trajectory, outcome probability + """ + # Intervention candidates + candidates = [ + node for node in self.causal_graph.nodes() + if len(list(self.causal_graph.successors(node))) > 0 + and node not in target_outcomes.keys() + ] + + # Optimal control problem: find sequence {u₀, u₁, ..., uₜ} that minimizes cost + # Cost function: J = Σₜ L(xₜ, uₜ) + Φ(xₜ) where L is stage cost, Φ is terminal cost + # Subject to: xₜ₊₁ = f(xₜ, uₜ) (system dynamics) + # Using greedy approximation (could be upgraded to Bellman optimality: V*(x) = min_u[L(x,u) + V*(f(x,u))]) + best_sequence: List[Dict[str, float]] = [] + best_final_state: Dict[str, float] = initial_state.copy() + best_objective = float("-inf") + + current_state = initial_state.copy() + + for step in range(max_steps): + # Find best single intervention at this step (greedy policy) + # Greedy: u*_t = argmin_u E[L(xₜ₊₁, u) | xₜ] (one-step lookahead) + best_step_intervention: Optional[Dict[str, float]] = None + best_step_objective = float("-inf") + + # Sample candidate interventions (Monte Carlo policy search) + # Alternative: gradient-based optimization using ∇ᵤJ + for _ in range(20): # Explore 20 candidates per step + var = self.rng.choice(candidates) + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + current_val = current_state.get(var, stats["mean"]) + + # Try perturbation: u = u₀ + ε where ε ~ N(0, σ²) + # This implements exploration in policy space + intervention = {var: current_val + self.rng.normal(0, stats["std"] * 1.5)} + + # Simulate forward (system dynamics): xₜ₊₁ = f(xₜ, uₜ) + predicted = self._predict_outcomes(current_state, intervention) + + # Multi-step lookahead (horizon H): simulate xₜ₊₁, xₜ₊₂, ..., xₜ₊ₕ + # This approximates value function: V^π(x) = E[Σₖ₌₀ᴴ γᵏ·rₜ₊ₖ] + state_after = predicted.copy() + for h in range(1, horizon): + # Further interventions (optional, could use optimal policy π*(x)) + state_after = self._predict_outcomes(state_after, {}) + + # Compute objective: multi-target cost function + # Cost: J(u) = Σⱼ |yⱼ(u) - y*ⱼ| (L1 norm, sum of absolute errors) + # Alternative L2: J(u) = √(Σⱼ (yⱼ(u) - y*ⱼ)²) (Euclidean distance) + # We use L1 for computational simplicity, can be upgraded to L2 + # Minimize: argmin_u J(u) subject to constraints + # Since we maximize objective, use negative cost: O = -J(u) + objective = 0.0 + for target_var, target_val in target_outcomes.items(): + if target_var in state_after: + # L1 distance (absolute error): |y - y*| + # For multi-dimensional: ||y - y*||₁ = Σⱼ |yⱼ - y*ⱼ| + distance = abs(state_after[target_var] - target_val) # L1 norm component + objective -= distance # Accumulate negative L1 distance (minimize error = maximize objective) + + if objective > best_step_objective: + best_step_objective = objective + best_step_intervention = intervention + + if best_step_intervention: + best_sequence.append(best_step_intervention) + # Update state + current_state = self._predict_outcomes(current_state, best_step_intervention) + else: + break + + # Full trajectory simulation + trajectory: List[Dict[str, float]] = [initial_state.copy()] + state = initial_state.copy() + for intervention in best_sequence: + state = self._predict_outcomes(state, intervention) + trajectory.append(state.copy()) + + # Final outcome assessment using relative error metric + 
+        # Relative error: ε_rel = |y_actual - y_target| / |y_target|
+        # Success criterion: ε_rel < 0.1 (within 10% tolerance)
+        final_objective = 0.0
+        target_achievements: Dict[str, Dict[str, Any]] = {}
+        for target_var, target_val in target_outcomes.items():
+            if target_var in trajectory[-1]:
+                actual = trajectory[-1][target_var]
+                # Absolute error: ε_abs = |y_actual - y_target|
+                distance = abs(actual - target_val)
+                # Relative error: ε_rel = ε_abs / |y_target| (normalized by target magnitude)
+                relative_error = distance / abs(target_val) if abs(target_val) > 1e-6 else distance
+                target_achievements[target_var] = {
+                    "target": target_val,
+                    "actual": actual,
+                    "distance": distance,
+                    "relative_error": float(relative_error),
+                    "achieved": distance < abs(target_val * 0.1),  # Within 10% tolerance: ε_rel < 0.1
+                }
+                # Aggregate objective: J_total = -Σⱼ ε_absⱼ (minimize total error)
+                final_objective -= distance
+
+        return {
+            "optimal_sequence": best_sequence,
+            "trajectory": trajectory,
+            "final_state": trajectory[-1] if trajectory else initial_state,
+            "target_achievements": target_achievements,
+            "objective": float(final_objective),
+            "sequence_length": len(best_sequence),
+        }
+
+    def meta_learn_intervention_strategy(
+        self,
+        historical_interventions: List[Dict[str, float]],
+        historical_outcomes: List[Dict[str, float]],
+        historical_contexts: List[Dict[str, float]],
+    ) -> Dict[str, Any]:
+        """
+        Meta-learn how to intervene: learn from past interventions to design optimal future ones.
+
+        Identifies patterns in successful interventions across different contexts,
+        then uses this knowledge to design new interventions.
+
+        Args:
+            historical_interventions: Past interventions
+            historical_outcomes: Corresponding outcomes
+            historical_contexts: States when interventions were applied
+
+        Returns:
+            Learned intervention strategy, pattern rules, meta-knowledge
+        """
+        if not (len(historical_interventions) == len(historical_outcomes) == len(historical_contexts)):
+            return {"error": "History lengths must match"}
+
+        # Classify interventions by outcome quality
+        intervention_classes: List[Dict[str, Any]] = []
+
+        for i, (intervention, outcome, context) in enumerate(zip(
+            historical_interventions, historical_outcomes, historical_contexts
+        )):
+            # Compute outcome quality (simple: sum of positive changes)
+            quality = sum([
+                max(0.0, outcome.get(k, 0.0) - context.get(k, 0.0))
+                for k in outcome.keys()
+            ])
+
+            intervention_classes.append({
+                "index": i,
+                "intervention": intervention,
+                "context": context,
+                "outcome": outcome,
+                "quality": float(quality),
+                "is_successful": quality > 0.0,
+            })
+
+        # Extract patterns from successful interventions
+        successful = [ic for ic in intervention_classes if ic["is_successful"]]
+        unsuccessful = [ic for ic in intervention_classes if not ic["is_successful"]]
+
+        # Pattern: what interventions work in what contexts?
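+        # NOTE: the rules extracted below are per-variable aggregates (mean
+        # successful value); they do not capture interactions between
+        # intervention variables.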
+ learned_rules: List[Dict[str, Any]] = [] + + if successful: + # For each intervention variable, find context patterns + all_intervention_vars = set() + for ic in successful: + all_intervention_vars.update(ic["intervention"].keys()) + + for var in all_intervention_vars: + successful_vals = [ + ic["intervention"].get(var, 0.0) + for ic in successful + if var in ic["intervention"] + ] + + # Context conditions (simplified: avg context where this worked) + contexts_when_successful = [ + ic["context"] + for ic in successful + if var in ic["intervention"] + ] + + if successful_vals and contexts_when_successful: + # Average successful intervention value + avg_successful_val = float(np.mean(successful_vals)) + + # Average context when this worked + context_vars = set() + for ctx in contexts_when_successful: + context_vars.update(ctx.keys()) + + avg_context = { + k: float(np.mean([ctx.get(k, 0.0) for ctx in contexts_when_successful])) + for k in context_vars + } + + learned_rules.append({ + "intervention_variable": var, + "recommended_value": avg_successful_val, + "typical_context": avg_context, + "success_rate": len(successful_vals) / len(historical_interventions), + "confidence": float(min(1.0, len(successful_vals) / 5.0)), # Higher with more examples + }) + + # Meta-strategy: when to use which intervention pattern + strategy: Dict[str, Any] = { + "learned_rules": learned_rules, + "success_rate": len(successful) / len(intervention_classes) if intervention_classes else 0.0, + "pattern_count": len(learned_rules), + "most_effective_interventions": sorted( + learned_rules, + key=lambda x: (x["confidence"], x["success_rate"]), + reverse=True + )[:5], + } + + return strategy + + def recursive_alternate_reality_search( + self, + current_state: Dict[str, float], + target: str, + depth: int = 0, + max_depth: int = 10, + path: List[Dict[str, float]] = None, + best_found: Optional[Dict[str, Any]] = None, + ) -> Dict[str, Any]: + """ + Recursively search alternate realities, nesting as deep as needed. + + Explores intervention tree recursively to find absolute best outcome. + Each reality branches into more realities, creating infinite nesting. 
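+
+        Example (sketch; keep max_depth small since branching grows
+        exponentially with depth):
+
+            result = agent.recursive_alternate_reality_search(
+                current_state={"x": 0.0, "y": 0.0},
+                target="y",
+                max_depth=3,
+            )
+            best = result["best_branch"]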
+ + Args: + current_state: Current state in this branch + target: Variable to optimize + depth: Current recursion depth + max_depth: Maximum depth (safety) + path: Intervention path to reach this state + best_found: Best outcome found so far (for pruning) + + Returns: + Best reality found, full search tree, optimal path + """ + if path is None: + path = [] + + if depth >= max_depth: + # Leaf: evaluate this reality + target_val = current_state.get(target, 0.0) + return { + "state": current_state, + "path": path, + "target_value": float(target_val), + "depth": depth, + "is_leaf": True, + } + + # Get intervention candidates + candidates = [ + node for node in self.causal_graph.nodes() + if len(list(self.causal_graph.successors(node))) > 0 + and node != target + ] + + # Branch: explore multiple interventions from this state + branches: List[Dict[str, Any]] = [] + best_branch = None + best_target = float("-inf") + + # Limit branching to avoid explosion + num_branches = min(5, len(candidates)) + selected = self.rng.choice(candidates, size=num_branches, replace=False) if len(candidates) > 0 else [] + + for var in selected: + # Create intervention + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + current_val = current_state.get(var, stats["mean"]) + intervention = {var: current_val + self.rng.normal(0, stats["std"] * 1.0)} + + # Predict next state + next_state = self._predict_outcomes(current_state, intervention) + + # Recursively explore + branch_result = self.recursive_alternate_reality_search( + current_state=next_state, + target=target, + depth=depth + 1, + max_depth=max_depth, + path=path + [intervention], + best_found=best_found, + ) + + branches.append({ + "intervention": intervention, + "result": branch_result, + }) + + # Update best + branch_target = branch_result.get("target_value", float("-inf")) + if branch_target > best_target: + best_target = branch_target + best_branch = branch_result + + # Return best path + return { + "state": current_state, + "path": path, + "branches": branches, + "best_branch": best_branch, + "target_value": best_target, + "depth": depth, + "is_leaf": False, + } + + def probabilistic_nested_simulation( + self, + initial_state: Dict[str, float], + interventions: Dict[str, float], + num_samples: int = 100, + nesting_depth: int = 5, + uncertainty_propagation: bool = True, + ) -> Dict[str, Any]: + """ + Probabilistic nested simulation: branch on uncertainty at each layer. + + Each nesting level considers multiple probabilistic outcomes, + creating a tree of possible futures with probabilities. 
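+
+        Example (sketch; small sample counts keep the tree tractable):
+
+            result = agent.probabilistic_nested_simulation(
+                initial_state={"x": 1.0, "y": 2.0},
+                interventions={"x": 1.5},
+                num_samples=50,
+                nesting_depth=3,
+            )
+            lo, hi = result["simulation_tree"]["ci90"].get("y", (0.0, 0.0))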
+ + Args: + initial_state: Starting state + interventions: Initial interventions + num_samples: Monte Carlo samples per nesting level + nesting_depth: How many layers to nest + uncertainty_propagation: Whether to propagate uncertainty through edges + + Returns: + Probabilistic outcome tree, expected values, confidence intervals + """ + # Bootstrap edge strength uncertainty using coefficient of variation + # CV = σ/μ (coefficient of variation), where σ is standard deviation, μ is mean + # Uncertainty quantification: σ_β = CV · |β|, following asymptotic normality + # Under CLT, β̂ ~ N(β, σ²_β) for large samples + edge_uncertainty: Dict[Tuple[str, str], float] = {} + for u, v in self.causal_graph.edges(): + strength = abs(self.causal_graph[u][v].get('strength', 0.0)) + # Assume 20% coefficient of variation (CV = 0.2) + # Standard error: SE(β) = CV · |β| = 0.2 · |β| + # This models uncertainty from estimation variance + edge_uncertainty[(u, v)] = strength * 0.2 + + # Nested simulation tree + simulation_tree: List[Dict[str, Any]] = [] + + def simulate_level( + state: Dict[str, float], + interventions_at_level: Dict[str, float], + level: int, + parent_probability: float = 1.0, + ) -> Dict[str, Any]: + """Recursive probabilistic simulation.""" + if level >= nesting_depth: + return { + "level": level, + "state": state, + "probability": parent_probability, + "is_leaf": True, + } + + # Sample edge strengths with uncertainty + outcomes: List[Dict[str, float]] = [] + outcome_probs: List[float] = [] + + for _ in range(num_samples): + # Perturb edge strengths + perturbed_state = state.copy() + + # Predict with uncertainty + z_state = self._standardize_state({**state, **interventions_at_level}) + z_pred = dict(z_state) + + # Propagate with uncertain edges + for node in nx.topological_sort(self.causal_graph): + if node in interventions_at_level: + continue + + parents = list(self.causal_graph.predecessors(node)) + if not parents: + continue + + effect_z = 0.0 + for parent in parents: + parent_z = z_pred.get(parent, z_state.get(parent, 0.0)) + base_strength = self.causal_graph[parent][node].get('strength', 0.0) + # Uncertainty propagation using normal distribution + # β_sample ~ N(μ_β, σ²_β) where μ_β = base_strength, σ²_β = uncertainty² + # This follows Bayesian posterior sampling or bootstrap sampling + if uncertainty_propagation: + uncertainty = edge_uncertainty.get((parent, node), 0.0) + # Monte Carlo sampling: β ~ N(μ_β, σ²_β) + # This propagates estimation uncertainty through causal structure + strength = float(self.rng.normal(base_strength, uncertainty)) + else: + strength = base_strength + effect_z += parent_z * strength + + z_pred[node] = effect_z + + # De-standardize + outcome = { + k: self._destandardize_value(k, v) + for k, v in z_pred.items() + if k in state or k in interventions_at_level + } + outcomes.append(outcome) + outcome_probs.append(1.0 / num_samples) # Uniform weights + + # Aggregate outcomes using sample statistics (Monte Carlo estimation) + # Expected value: E[Y] = (1/n)Σᵢ yᵢ where n is sample size + # This is the Monte Carlo estimate of the expectation + # Unbiased estimator: E[Ȳ] = E[Y] (sample mean is unbiased for population mean) + expected_outcome: Dict[str, float] = {} + all_vars = set.union(*[set(o.keys()) for o in outcomes]) if outcomes else set() + for var in all_vars: + # Collect all samples for this variable: {y₁, y₂, ..., yₙ} + vals = np.array([o.get(var, 0.0) for o in outcomes]) + n = len(vals) + if n > 0: + # Sample mean: ȳ = (1/n)Σᵢ₌₁ⁿ yᵢ + # E[Y] = lim_{n→∞} (1/n)Σᵢ 
yᵢ (Monte Carlo convergence) + expected_outcome[var] = float(np.mean(vals)) # E[Y] = (1/n)Σᵢ yᵢ + else: + expected_outcome[var] = 0.0 + + # Confidence intervals using quantile-based estimation (non-parametric) + # For 90% CI: CI₉₀ = [Q₀.₀₅, Q₀.₉₅] where Q_p is p-th quantile + # Non-parametric: no distributional assumptions + # Alternative (parametric, if normal): CI = [μ̂ - z₀.₀₅·SE, μ̂ + z₀.₀₅·SE] + # where z₀.₀₅ ≈ 1.645 for 90% CI (two-tailed: 5% in each tail) + ci90_outcome: Dict[str, Tuple[float, float]] = {} + for var in expected_outcome.keys(): + vals = np.array([o.get(var, 0.0) for o in outcomes]) + n = len(vals) + if n > 0: + # Non-parametric 90% CI: [Q₀.₀₅, Q₀.₉₅] + # Quantile function: Q(p) = inf{x : P(X ≤ x) ≥ p} + # 5th percentile (lower bound): Q₀.₀₅ + # 95th percentile (upper bound): Q₀.₉₅ + ci90_outcome[var] = ( + float(np.quantile(vals, 0.05)), # Lower bound: Q₀.₀₅ = 5th percentile + float(np.quantile(vals, 0.95)), # Upper bound: Q₀.₉₅ = 95th percentile + ) + else: + ci90_outcome[var] = (0.0, 0.0) + + # Recursively nest for next level + child_nodes: List[Dict[str, Any]] = [] + if level < nesting_depth - 1: + # Create nested interventions based on outcomes + for outcome_sample in outcomes[:5]: # Top 5 outcomes + # Generate follow-up interventions + nested_interventions: Dict[str, float] = {} + # (Simplified: could use policy logic here) + + child = simulate_level( + state=outcome_sample, + interventions_at_level=nested_interventions, + level=level + 1, + parent_probability=parent_probability * (1.0 / num_samples), + ) + child_nodes.append(child) + + return { + "level": level, + "state": state, + "interventions": interventions_at_level, + "expected_outcome": expected_outcome, + "ci90": ci90_outcome, + "outcome_samples": outcomes[:10], # Top 10 + "probability": parent_probability, + "children": child_nodes, + "is_leaf": level >= nesting_depth - 1, + } + + root_node = simulate_level(initial_state, interventions, level=0) + simulation_tree.append(root_node) + + # Extract final outcomes (leaf nodes) + def collect_leaves(node: Dict[str, Any]) -> List[Dict[str, Any]]: + if node.get("is_leaf", False): + return [node] + leaves = [] + for child in node.get("children", []): + leaves.extend(collect_leaves(child)) + return leaves + + leaves = collect_leaves(root_node) + + return { + "simulation_tree": root_node, + "all_leaves": leaves, + "expected_final_outcomes": { + var: float(np.mean([l["state"].get(var, 0.0) for l in leaves])) + for var in set.union(*[set(l["state"].keys()) for l in leaves]) + }, + "total_paths": len(leaves), + "max_nesting_reached": nesting_depth, + } + + def adversarial_nested_analysis( + self, + intervention: Dict[str, float], + target: str, + adversary_objectives: List[str], + nesting_depth: int = 4, + ) -> Dict[str, Any]: + """ + Adversarial nesting: consider worst-case reactions that could undermine your intervention. + + Models how external forces or negative feedback might react to your actions, + then nests to find best intervention despite adversarial responses. 
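+
+        Example (sketch; all node names are hypothetical):
+
+            result = agent.adversarial_nested_analysis(
+                intervention={"price": 9.0},
+                target="revenue",
+                adversary_objectives=["competitor_share"],
+                nesting_depth=3,
+            )
+            robust = result["robustness_assessment"]["is_robust"]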
+ + Args: + intervention: Your proposed intervention + target: Variable you want to optimize + adversary_objectives: Variables an adversary wants to minimize (worst-case) + nesting_depth: How many adversarial reaction layers to consider + + Returns: + Worst-case scenarios, robust interventions, adversarial paths + """ + # Adversary model: reacts to minimize adversary_objectives + adversarial_paths: List[Dict[str, Any]] = [] + + current_state = intervention.copy() + + for depth in range(nesting_depth): + # Your intervention at this depth + predicted_outcome = self._predict_outcomes({}, current_state) + + # Adversary reaction: find interventions that worsen adversary objectives + adversary_interventions: List[Dict[str, float]] = [] + + for adv_obj in adversary_objectives: + if adv_obj not in self.causal_graph: + continue + + # Find variables that affect adversary objective + affecting_vars = list(self.causal_graph.predecessors(adv_obj)) + + # Adversary intervenes to minimize this objective + for var in affecting_vars[:3]: # Top 3 + edge_data = self.causal_graph[var][adv_obj] + strength = edge_data.get('strength', 0.0) + + # Adversarial optimization: adversary minimizes your objective + # Adversary strategy: u_adv* = argmin_u_adv f(x, u, u_adv) + # Where f is your objective function, u is your intervention, u_adv is adversary's + # Gradient-based: u_adv ← u_adv - α·∇_{u_adv} f (gradient descent on negative objective) + # If positive strength, adversary reduces var; if negative, increases + current_val = predicted_outcome.get(var, 0.0) + # Adversarial perturbation: Δu = -sign(∂f/∂u)·η·|u| + # where η = 0.5 is step size, sign gives direction to worsen your objective + adversary_intervention = { + var: current_val - 0.5 * np.sign(strength) * abs(current_val) + } + adversary_interventions.append(adversary_intervention) + + # Worst-case outcome after adversary reaction + worst_outcomes: List[Dict[str, Any]] = [] + for adv_intervention in adversary_interventions: + combined = {**current_state, **adv_intervention} + worst_outcome = self._predict_outcomes({}, combined) + + # Adversary damage quantification using L1 norm + # Damage = ||y_worst - y_predicted||₁ = Σⱼ |yⱼ_worst - yⱼ_predicted| + # This measures magnitude of deviation from expected outcome + target_value = worst_outcome.get(target, 0.0) + # Aggregate damage across all adversary objectives (L1 norm) + adversary_damage = sum([ + abs(worst_outcome.get(obj, 0.0) - predicted_outcome.get(obj, 0.0)) + for obj in adversary_objectives + ]) + + worst_outcomes.append({ + "adversary_intervention": adv_intervention, + "outcome": worst_outcome, + "target_value": float(target_value), + "adversary_damage": float(adversary_damage), + }) + + # Sort by worst for target + worst_outcomes.sort(key=lambda x: x["target_value"]) + worst_case = worst_outcomes[0] if worst_outcomes else None + + adversarial_paths.append({ + "depth": depth, + "your_intervention": current_state, + "predicted_outcome": predicted_outcome, + "adversary_reactions": adversary_interventions, + "worst_case": worst_case, + }) + + # Update state for next depth + if worst_case: + current_state = worst_case["outcome"] + + # Find robust intervention (works even in worst case) + final_target_values = [ + path["worst_case"]["target_value"] + for path in adversarial_paths + if path.get("worst_case") + ] + worst_final = min(final_target_values) if final_target_values else 0.0 + + return { + "intervention": intervention, + "target": target, + "adversarial_paths": adversarial_paths, + 
"worst_case_target_value": float(worst_final), + "adversarial_depth": nesting_depth, + "robustness_assessment": { + "worst_case_loss": float(intervention.get(target, 0.0) - worst_final), + "is_robust": worst_final > intervention.get(target, 0.0) * 0.5, # Still >50% of desired + }, + } + + def multi_objective_infinite_nesting( + self, + current_state: Dict[str, float], + objectives: Dict[str, float], # {variable: weight} to maximize + constraints: Dict[str, Tuple[float, float]], # {variable: (min, max)} + max_depth: int = 8, + beam_width: int = 5, + ) -> Dict[str, Any]: + """ + Multi-objective infinite nesting: optimize multiple goals simultaneously. + + Uses beam search to explore intervention space, balancing multiple objectives. + Nests as deep as needed to find Pareto-optimal solutions. + + Args: + current_state: Current state + objectives: {variable: weight} - variables to maximize with weights + constraints: {variable: (min, max)} - hard bounds + max_depth: Maximum nesting depth + beam_width: How many paths to keep at each level (beam search) + + Returns: + Pareto-optimal intervention paths, multi-objective trade-offs + """ + # Beam search: maintain top-k paths at each level + beam: List[Dict[str, Any]] = [{ + "state": current_state, + "path": [], + "objective_vector": {k: 0.0 for k in objectives.keys()}, + "depth": 0, + }] + + pareto_frontier: List[Dict[str, Any]] = [] + + for depth in range(max_depth): + next_beam: List[Dict[str, Any]] = [] + + for path_node in beam: + # Get intervention candidates + candidates = [ + node for node in self.causal_graph.nodes() + if len(list(self.causal_graph.successors(node))) > 0 + and node not in objectives.keys() + ] + + # Explore interventions + for var in candidates[:10]: # Limit candidates + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + current_val = path_node["state"].get(var, stats["mean"]) + + # Try intervention + intervention = {var: current_val + self.rng.normal(0, stats["std"] * 1.0)} + + # Check constraints + violates = False + for const_var, (min_val, max_val) in constraints.items(): + if const_var in intervention: + if not (min_val <= intervention[const_var] <= max_val): + violates = True + break + + if violates: + continue + + # Predict outcome + outcome = self._predict_outcomes(path_node["state"], intervention) + + # Check outcome constraints + for const_var, (min_val, max_val) in constraints.items(): + if const_var in outcome: + if not (min_val <= outcome[const_var] <= max_val): + violates = True + break + + if violates: + continue + + # Multi-objective optimization: weighted sum scalarization + # Objective vector: f(x) = [f₁(x), f₂(x), ..., fₖ(x)] where fᵢ are individual objectives + # Scalarized: F(x) = Σᵢ wᵢ·fᵢ(x) where wᵢ are weights + # This converts multi-objective to single-objective for optimization + # Weighted sum: F(x) = w₁·f₁(x) + w₂·f₂(x) + ... 
+ wₖ·fₖ(x) + obj_vector = {} + for k, weight in objectives.items(): + # Individual objective value: fᵢ(x) + obj_value = outcome.get(k, 0.0) + # Weighted component: wᵢ·fᵢ(x) + obj_vector[k] = obj_value * weight + + # Combined objective: F(x) = Σᵢ wᵢ·fᵢ(x) (weighted sum) + # This is the scalarized multi-objective function + # Alternative formulations: + # - Weighted Lp norm: F(x) = (Σᵢ wᵢ·|fᵢ(x)|ᵖ)^(1/p) + # - Chebyshev: F(x) = minᵢ wᵢ·fᵢ(x) (for maximization) + combined_obj = sum(obj_vector.values()) # F(x) = Σᵢ wᵢ·fᵢ(x) + + next_beam.append({ + "state": outcome, + "path": path_node["path"] + [intervention], + "objective_vector": obj_vector, + "combined_objective": float(combined_obj), + "depth": depth + 1, + }) + + # Prune beam: keep top beam_width by combined objective + next_beam.sort(key=lambda x: x["combined_objective"], reverse=True) + beam = next_beam[:beam_width] + + # Add to Pareto if not dominated + for node in beam: + # Pareto dominance: x dominates y iff ∀i: fᵢ(x) ≥ fᵢ(y) ∧ ∃j: fⱼ(x) > fⱼ(y) + # This follows multi-objective optimization theory (Pareto optimality) + is_dominated = False + for pareto_node in pareto_frontier: + # Check if pareto_node dominates node using Pareto dominance criterion + # f₁ dominates f₂ if: ∀k: f₁ₖ ≥ f₂ₖ ∧ ∃k: f₁ₖ > f₂ₖ + all_better = all( + pareto_node["objective_vector"].get(k, 0.0) >= node["objective_vector"].get(k, 0.0) + for k in objectives.keys() + ) + some_better = any( + pareto_node["objective_vector"].get(k, 0.0) > node["objective_vector"].get(k, 0.0) + for k in objectives.keys() + ) + # Pareto dominance condition: all_better ∧ some_better + if all_better and some_better: + is_dominated = True + break + + if not is_dominated: + # Remove dominated nodes from frontier + pareto_frontier = [ + pn for pn in pareto_frontier + if not ( + all(node["objective_vector"].get(k, 0.0) >= pn["objective_vector"].get(k, 0.0) + for k in objectives.keys()) and + any(node["objective_vector"].get(k, 0.0) > pn["objective_vector"].get(k, 0.0) + for k in objectives.keys()) + ) + ] + pareto_frontier.append(node) + + # Sort Pareto frontier + pareto_frontier.sort(key=lambda x: x["combined_objective"], reverse=True) + + return { + "pareto_frontier": pareto_frontier[:20], # Top 20 + "best_path": pareto_frontier[0] if pareto_frontier else None, + "total_paths_explored": len(pareto_frontier), + "max_depth_reached": max_depth, + "objectives": objectives, + "trade_off_analysis": { + "objective_ranges": { + k: { + "min": float(min(p["objective_vector"].get(k, 0.0) for p in pareto_frontier)), + "max": float(max(p["objective_vector"].get(k, 0.0) for p in pareto_frontier)), + } + for k in objectives.keys() + }, + }, + } + + def temporal_causal_chain_analysis( + self, + initial_intervention: Dict[str, float], + target: str, + time_horizon: int = 10, + lag_structure: Optional[Dict[Tuple[str, str], int]] = None, + ) -> Dict[str, Any]: + """ + Temporal nesting: account for time delays in causal effects. + + Models that some effects take time (X→Y might take 2 periods), + creating temporal causal chains that nest across time. 
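+
+        Example (sketch; a two-period lag on one edge, all other edges
+        default to lag 1):
+
+            result = agent.temporal_causal_chain_analysis(
+                initial_intervention={"ad_spend": 2.0},
+                target="revenue",
+                time_horizon=8,
+                lag_structure={("ad_spend", "revenue"): 2},
+            )
+            peak_t = result["time_to_peak"]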
+ + Args: + initial_intervention: Starting intervention + target: Variable to optimize + time_horizon: Number of time periods + lag_structure: {(source, target): lag_periods} - if None, assumes lag=1 + + Returns: + Temporal trajectory, delayed effects, optimal timing + """ + if lag_structure is None: + # Default: each edge has lag=1 + lag_structure = { + (u, v): 1 + for u, v in self.causal_graph.edges() + } + + # State history across time: x(t) = [x₁(t), x₂(t), ..., xₙ(t)] + # Discrete-time causal system with distributed lags + state_history: List[Dict[str, float]] = [initial_intervention.copy()] + + # Track pending effects: distributed lag model + # Effect yⱼ(t+τᵢⱼ) = βᵢⱼ·xᵢ(t) where τᵢⱼ is lag for edge (i,j) + # This implements VAR (Vector Autoregression) with distributed lags + pending_effects: Dict[int, List[Tuple[str, str, float]]] = {} # {time: [(source, target, effect)]} + + for t in range(time_horizon): + current_state = state_history[-1].copy() + next_state = current_state.copy() + + # Apply pending effects from previous periods (distributed lag accumulation) + # y(t) = Σᵢ Σₖ βᵢⱼ·xᵢ(t-τₖ) where τₖ are lags + if t in pending_effects: + for source, target, effect_magnitude in pending_effects[t]: + if target in next_state: + # Linear accumulation: additive effects from multiple sources + next_state[target] = next_state.get(target, 0.0) + effect_magnitude + + # Compute new effects with lags using distributed lag model + # Causal effect equation: yⱼ(t+τᵢⱼ) = βᵢⱼ·xᵢ(t) + # where τᵢⱼ is the lag for edge (i,j), βᵢⱼ is structural coefficient + # This implements VAR (Vector Autoregression) with distributed lags + for u, v in self.causal_graph.edges(): + lag = lag_structure.get((u, v), 1) # Lag τᵢⱼ (time delay) + source_val = current_state.get(u, 0.0) # xᵢ(t): source value at time t + edge_data = self.causal_graph[u][v] + strength = edge_data.get('strength', 0.0) # Structural coefficient βᵢⱼ + + # Effect magnitude: e = βᵢⱼ·xᵢ(t) (linear structural equation) + # This is the effect that will manifest at time t + τ + effect = source_val * strength # e = βᵢⱼ·xᵢ(t) + + # Schedule effect for future period (distributed lag) + # Effect manifests at time t + τ: yⱼ(t+τ) ← yⱼ(t+τ) + βᵢⱼ·xᵢ(t) + # This implements: yⱼ(t+τᵢⱼ) = βᵢⱼ·xᵢ(t) + future_time = t + lag # Time when effect manifests: t + τᵢⱼ + if future_time < time_horizon: + if future_time not in pending_effects: + pending_effects[future_time] = [] + # Store effect to be applied at future_time + pending_effects[future_time].append((u, v, effect)) + + state_history.append(next_state) + + # Extract temporal patterns + target_trajectory = [s.get(target, 0.0) for s in state_history] + + return { + "initial_intervention": initial_intervention, + "target": target, + "temporal_trajectory": state_history, + "target_over_time": target_trajectory, + "peak_value": float(max(target_trajectory)) if target_trajectory else 0.0, + "time_to_peak": int(np.argmax(target_trajectory)) if target_trajectory else 0, + "steady_state_value": float(target_trajectory[-1]) if target_trajectory else 0.0, + "lag_structure_used": lag_structure, + } + + def explainable_nested_analysis( + self, + intervention: Dict[str, float], + target: str, + depth: int = 5, + ) -> Dict[str, Any]: + """ + Explainable nesting: at each layer, explain WHY the effects occur. + + Nests deeply but provides human-readable explanations for each causal step, + building a narrative of how intervention → effect → effect → ... → target. 
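+
+        Example (sketch; variable names are placeholders):
+
+            result = agent.explainable_nested_analysis(
+                intervention={"training_hours": 4.0},
+                target="productivity",
+                depth=3,
+            )
+            print(result["narrative"])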
+ + Args: + intervention: Initial intervention + target: Target outcome + depth: Nesting depth + + Returns: + Explained causal chain, narrative, reasoning at each level + """ + explanations: List[Dict[str, Any]] = [] + + current_state = intervention.copy() + + for level in range(depth): + # Predict outcomes + predicted = self._predict_outcomes({}, current_state) + + # Find causal paths to target + paths_to_target: List[List[str]] = [] + for inter_var in current_state.keys(): + if inter_var == target: + continue + try: + paths = list(nx.all_simple_paths( + self.causal_graph, + inter_var, + target, + cutoff=depth - level + )) + paths_to_target.extend(paths) + except Exception: + pass + + # Explain each path using causal effect decomposition + # Path effect = ∏(i,j)∈Path βᵢⱼ (product of structural coefficients) + # Following Pearl's do-calculus and causal mediation analysis + path_explanations: List[str] = [] + for path in paths_to_target[:5]: # Top 5 paths + explanation_parts = [] + path_product = 1.0 # Initialize path effect product + for i in range(len(path) - 1): + u, v = path[i], path[i + 1] + edge_data = self.causal_graph[u][v] + strength = abs(edge_data.get('strength', 0.0)) # |βᵢⱼ| + sign = "+" if edge_data.get('strength', 0.0) >= 0 else "-" + # Accumulate path effect: ∏ βᵢⱼ + path_product *= edge_data.get('strength', 0.0) + + explanation_parts.append( + f"{u} {sign}affects {v} (β={strength:.3f})" + ) + # Path effect: total causal effect along this path + explanation_parts.append(f"Path effect: {path_product:.4f}") + + path_explanation = " → ".join([ + f"{path[i]}{'↑' if i < len(path)-1 else ''}" + for i in range(len(path)) + ]) + path_explanations.append(path_explanation) + + # Build explanation + explanation = { + "level": level, + "interventions": current_state, + "predicted_outcomes": predicted, + "paths_to_target": [p[:3] for p in paths_to_target[:3]], # Show first 3 vars of each path + "explanation_text": f"Level {level}: " + "; ".join(path_explanations[:3]), + "target_value_at_level": float(predicted.get(target, 0.0)), + } + explanations.append(explanation) + + # Update for next level (use predicted as new baseline) + current_state = predicted + + # Synthesize narrative + narrative_parts = [ + f"At level {e['level']}: {e['explanation_text']}" + for e in explanations + ] + + return { + "intervention": intervention, + "target": target, + "explanations_by_level": explanations, + "narrative": "\n".join(narrative_parts), + "final_target_value": float(explanations[-1]["target_value_at_level"]) if explanations else 0.0, + "total_levels": len(explanations), + } + + # ==================== MAJOR UPGRADES ==================== + + def gradient_based_intervention_optimization( + self, + initial_state: Dict[str, float], + target: str, + intervention_vars: List[str], + constraints: Optional[Dict[str, Tuple[float, float]]] = None, + method: str = "L-BFGS-B", + ) -> Dict[str, Any]: + """ + Gradient-based optimization for finding optimal interventions. 
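+
+        A minimal usage sketch (names and bounds are placeholders):
+
+            result = agent.gradient_based_intervention_optimization(
+                initial_state={"spend": 1.0, "revenue": 5.0},
+                target="revenue",
+                intervention_vars=["spend"],
+                constraints={"spend": (0.0, 3.0)},
+            )
+            theta_star = result["optimal_intervention"]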
+
+        Uses numerical (central finite-difference) gradients to optimize:
+        minimize: -f(x) where f(x) = predicted outcome given intervention x
+
+        Mathematical formulation:
+        - Objective: J(θ) = -y(θ) where y(θ) = predicted outcome
+        - Gradient: ∇_θ J(θ) = -∇_θ y(θ) computed via central finite differences
+        - Update: θ_{k+1} = θ_k - α·∇_θ J(θ_k) (gradient descent)
+
+        Args:
+            initial_state: Current state
+            target: Variable to optimize
+            intervention_vars: Variables that can be intervened on
+            constraints: {var: (min, max)} bounds
+            method: Optimization method ('L-BFGS-B', 'BFGS', 'SLSQP', etc.)
+
+        Returns:
+            Optimal intervention, objective value, convergence info
+        """
+        # Prepare bounds
+        bounds = []
+        x0 = []
+        var_to_idx = {}
+        for i, var in enumerate(intervention_vars):
+            var_to_idx[var] = i
+            stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0})
+            current_val = initial_state.get(var, stats["mean"])
+            x0.append(current_val)
+
+            if constraints and var in constraints:
+                min_val, max_val = constraints[var]
+                bounds.append((min_val, max_val))
+            else:
+                # Default bounds: ±3 standard deviations
+                bounds.append((current_val - 3 * stats["std"], current_val + 3 * stats["std"]))
+
+        # Objective function: J(x) = -y(x) where y(x) is predicted outcome
+        def objective(x: np.ndarray) -> float:
+            """Objective: minimize -f(x) (maximize f(x))"""
+            intervention = {intervention_vars[i]: float(x[i]) for i in range(len(x))}
+            outcome = self._predict_outcomes(initial_state, intervention)
+            target_val = outcome.get(target, 0.0)
+            return -target_val  # Negative for minimization
+
+        # Numerical gradient: ∇_θ J(θ) ≈ [J(θ+ε·e_i) - J(θ-ε·e_i)] / (2ε)
+        # where e_i is unit vector in direction i, ε is small step
+        def gradient(x: np.ndarray) -> np.ndarray:
+            """Compute gradient via central differences: ∇f ≈ (f(x+ε) - f(x-ε))/(2ε)"""
+            epsilon = 1e-5
+            grad = np.zeros_like(x)
+
+            for i in range(len(x)):
+                x_plus = x.copy()
+                x_plus[i] += epsilon
+                x_minus = x.copy()
+                x_minus[i] -= epsilon
+                # Central difference matches the documented formula above
+                # (O(ε²) truncation error vs O(ε) for a forward difference).
+                grad[i] = (objective(x_plus) - objective(x_minus)) / (2.0 * epsilon)
+
+            return grad
+
+        # Optimize using scipy.optimize
+        try:
+            result = minimize(
+                objective,
+                x0=np.array(x0),
+                method=method,
+                bounds=bounds,
+                jac=gradient if method in ["L-BFGS-B", "BFGS", "CG"] else None,
+                options={"maxiter": 100, "ftol": 1e-6} if method == "L-BFGS-B" else {}
+            )
+
+            optimal_intervention = {intervention_vars[i]: float(result.x[i]) for i in range(len(result.x))}
+            optimal_outcome = self._predict_outcomes(initial_state, optimal_intervention)
+
+            return {
+                "optimal_intervention": optimal_intervention,
+                "optimal_target_value": float(optimal_outcome.get(target, 0.0)),
+                "objective_value": float(result.fun),
+                "success": bool(result.success),
+                "iterations": int(result.nit) if hasattr(result, 'nit') else 0,
+                "convergence_message": str(result.message),
+                "gradient_norm": float(np.linalg.norm(gradient(result.x))) if result.success else float('inf'),
+            }
+        except Exception as e:
+            return {"error": str(e), "optimal_intervention": {}, "success": False}
+
+    def nonlinear_scm_prediction(
+        self,
+        factual_state: Dict[str, float],
+        interventions: Dict[str, float],
+        include_interactions: bool = True,
+    ) -> Dict[str, float]:
+        """
+        Non-linear SCM prediction with interaction terms.
+
+        Extends the linear model: y = Σᵢ βᵢ·xᵢ + Σᵢⱼ γᵢⱼ·xᵢ·xⱼ + ε
+        where γᵢⱼ are interaction coefficients.
+ + Mathematical foundation: + - Linear term: Σᵢ βᵢ·xᵢ + - Quadratic interaction: Σᵢⱼ γᵢⱼ·xᵢ·xⱼ (product of parent pairs) + - Full model: y = linear_term + interaction_term + ε + + Args: + factual_state: Current state + interventions: Interventions to apply + include_interactions: Whether to include interaction terms + + Returns: + Predicted outcomes with non-linear effects + """ + # Standardize and merge states + raw_state = factual_state.copy() + raw_state.update(interventions) + z_state = self._standardize_state(raw_state) + z_pred = dict(z_state) + + # Interaction coefficients cache {node: {(parent1, parent2): γ}} + interaction_coeffs: Dict[str, Dict[Tuple[str, str], float]] = {} + + for node in nx.topological_sort(self.causal_graph): + if node in interventions: + continue + + parents = list(self.causal_graph.predecessors(node)) + if not parents: + continue + + # Linear term: Σᵢ βᵢ·z_xi + linear_term = 0.0 + for parent in parents: + parent_z = z_pred.get(parent, z_state.get(parent, 0.0)) + beta = self.causal_graph[parent][node].get('strength', 0.0) + linear_term += parent_z * beta + + # Interaction terms: Σᵢⱼ γᵢⱼ·z_xi·z_xj + interaction_term = 0.0 + if include_interactions and node in self.interaction_terms: + for (p1, p2) in self.interaction_terms[node]: + if p1 in parents and p2 in parents: + z1 = z_pred.get(p1, z_state.get(p1, 0.0)) + z2 = z_pred.get(p2, z_state.get(p2, 0.0)) + # Interaction coefficient (default: small value) + gamma = self.causal_graph[p1][node].get('interaction_strength', {}).get(p2, 0.0) + interaction_term += gamma * z1 * z2 # γ·x₁·x₂ + + # Total prediction: z_y = linear_term + interaction_term + z_pred[node] = linear_term + interaction_term + + # De-standardize + predicted_state = {} + for var, z_val in z_pred.items(): + predicted_state[var] = self._destandardize_value(var, z_val) + return predicted_state + + def compute_information_theoretic_measures( + self, + df: Any, + variables: List[str], + ) -> Dict[str, Any]: + """ + Compute information-theoretic measures: entropy, mutual information, causal entropy. 
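+
+        A usage sketch (assumes a pandas DataFrame with at least 10 rows;
+        column names are placeholders):
+
+            import pandas as pd
+            df = pd.DataFrame({
+                "x": [1.0, 2.0, 3.0, 4.0, 5.0] * 4,
+                "y": [2.1, 3.9, 6.2, 8.0, 9.8] * 4,
+            })
+            info = agent.compute_information_theoretic_measures(df, ["x", "y"])
+            mi_xy = info["mutual_information"].get("x;y", 0.0)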
+ + Mathematical formulations: + - Entropy: H(X) = -Σᵢ P(xᵢ) log₂ P(xᵢ) (discrete) or -∫ p(x) log p(x) dx (continuous) + - Mutual Information: I(X;Y) = H(X) + H(Y) - H(X,Y) = KL(P(X,Y) || P(X)P(Y)) + - Conditional MI: I(X;Y|Z) = H(X,Z) + H(Y,Z) - H(X,Y,Z) - H(Z) + - Causal Entropy: Expected reduction in entropy from intervention + + Args: + df: DataFrame with variables + variables: Variables to analyze + + Returns: + Entropies, mutual information, causal information gains + """ + if df is None or len(df) < 10: + return {"error": "Insufficient data"} + + data = df[variables].dropna() + if len(data) < 10: + return {"error": "Insufficient data after dropna"} + + results: Dict[str, Any] = { + "entropies": {}, + "mutual_information": {}, + "conditional_mi": {}, + } + + # Compute entropies: H(X) = -Σ p(x) log p(x) + # Using discrete histogram approximation for continuous variables + for var in variables: + if var not in data.columns: + continue + + series = data[var].dropna() + if len(series) < 5: + continue + + # Discretize for entropy estimation (histogram method) + # H(X) ≈ -Σᵢ (nᵢ/n) log₂(nᵢ/n) where nᵢ is count in bin i + n_bins = min(20, max(5, int(np.sqrt(len(series))))) # Adaptive binning + hist, bins = np.histogram(series, bins=n_bins) + hist = hist[hist > 0] # Remove empty bins + probs = hist / hist.sum() + + # Shannon entropy: H(X) = -Σᵢ pᵢ log₂ pᵢ + entropy = -np.sum(probs * np.log2(probs)) + results["entropies"][var] = float(entropy) + self._entropy_cache[var] = float(entropy) + + # Compute pairwise mutual information: I(X;Y) = H(X) + H(Y) - H(X,Y) + for i, var1 in enumerate(variables): + if var1 not in results["entropies"]: + continue + for var2 in variables[i+1:]: + if var2 not in results["entropies"]: + continue + + # Joint entropy: H(X,Y) = -Σᵢⱼ p(xᵢ,yⱼ) log₂ p(xᵢ,yⱼ) + joint_series = data[[var1, var2]].dropna() + if len(joint_series) < 5: + continue + + # 2D histogram + n_bins = min(10, max(3, int(np.cbrt(len(joint_series))))) + hist_2d, _, _ = np.histogram2d( + joint_series[var1], + joint_series[var2], + bins=n_bins + ) + hist_2d = hist_2d[hist_2d > 0] + probs_joint = hist_2d / hist_2d.sum() + + # Joint entropy + h_joint = -np.sum(probs_joint * np.log2(probs_joint)) + + # Mutual information: I(X;Y) = H(X) + H(Y) - H(X,Y) + mi = results["entropies"][var1] + results["entropies"][var2] - float(h_joint) + results["mutual_information"][f"{var1};{var2}"] = float(max(0.0, mi)) # MI ≥ 0 + self._mi_cache[(var1, var2)] = float(max(0.0, mi)) + + return results + + def convex_intervention_optimization( + self, + initial_state: Dict[str, float], + objectives: Dict[str, float], # {var: weight} + constraints_dict: Dict[str, Tuple[float, float]], # {var: (min, max)} + intervention_vars: List[str], + ) -> Dict[str, Any]: + """ + Convex optimization for interventions using CVXPY (if available). + + Mathematical formulation: + minimize: Σᵢ wᵢ·fᵢ(x) + subject to: l ≤ x ≤ u (box constraints) + where fᵢ are linear functions of interventions + + Uses CVXPY for guaranteed global optimum in convex problems. + + Args: + initial_state: Current state + objectives: {variable: weight} to optimize + constraints_dict: {variable: (min, max)} bounds + intervention_vars: Variables to optimize + + Returns: + Optimal intervention, solver status, dual variables + """ + if not CVXPY_AVAILABLE: + return {"error": "CVXPY not available. 
Install with: pip install cvxpy"} + + try: + # Decision variables: intervention values + n = len(intervention_vars) + x = cp.Variable(n, name="interventions") + + # Build objective: minimize Σᵢ wᵢ·(-outcome_i) + # Since CVXPY minimizes, we minimize negative of what we want to maximize + obj_terms = [] + for target_var, weight in objectives.items(): + # Approximate outcome as linear function of interventions + # outcome ≈ baseline + Σⱼ βⱼ·intervention_j + baseline = initial_state.get(target_var, 0.0) + + # Find paths from intervention vars to target + effect_sum = 0.0 + for i, inter_var in enumerate(intervention_vars): + try: + path = nx.shortest_path(self.causal_graph, inter_var, target_var) + if len(path) > 1: + # Path strength (simplified: direct edge if exists) + if self.causal_graph.has_edge(inter_var, target_var): + beta = self.causal_graph[inter_var][target_var].get('strength', 0.0) + effect_sum += beta * x[i] + except: + pass + + # Objective term: -weight * (baseline + effect_sum) + obj_terms.append(-weight * (baseline + effect_sum)) + + objective = cp.Minimize(sum(obj_terms)) + + # Constraints: l ≤ x ≤ u + constraints = [] + for i, var in enumerate(intervention_vars): + if var in constraints_dict: + min_val, max_val = constraints_dict[var] + constraints.append(x[i] >= min_val) + constraints.append(x[i] <= max_val) + else: + # Default bounds + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + current = initial_state.get(var, stats["mean"]) + constraints.append(x[i] >= current - 3 * stats["std"]) + constraints.append(x[i] <= current + 3 * stats["std"]) + + # Solve + problem = cp.Problem(objective, constraints) + problem.solve(solver=cp.ECOS if hasattr(cp, 'ECOS') else cp.SCS) + + if problem.status in ["optimal", "optimal_inaccurate"]: + optimal_x = {intervention_vars[i]: float(x.value[i]) for i in range(n)} + return { + "optimal_intervention": optimal_x, + "status": problem.status, + "objective_value": float(problem.value), + "solver": problem.solver_stats.name if hasattr(problem, 'solver_stats') else "unknown", + } + else: + return {"error": f"Solver failed: {problem.status}", "optimal_intervention": {}} + except Exception as e: + return {"error": str(e), "optimal_intervention": {}} + + def sensitivity_analysis( + self, + intervention: Dict[str, float], + target: str, + perturbation_size: float = 0.01, + ) -> Dict[str, Any]: + """ + Sensitivity analysis: how sensitive is outcome to intervention changes? 
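+
+        A usage sketch (variable names are placeholders):
+
+            result = agent.sensitivity_analysis(
+                intervention={"price": 10.0, "marketing": 5.0},
+                target="demand",
+            )
+            driver = result["most_influential_variable"]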
+ + Mathematical formulation: + - Sensitivity: Sᵢ = ∂y/∂xᵢ ≈ (y(x + ε·eᵢ) - y(x)) / ε + - Elasticity: Eᵢ = (∂y/∂xᵢ)·(xᵢ/y) = sensitivity · (x/y) + - Total sensitivity: ||∇y||₂ = √(Σᵢ Sᵢ²) + + Args: + intervention: Base intervention + target: Target variable + perturbation_size: ε for finite differences + + Returns: + Sensitivities, elasticities, most influential variables + """ + base_outcome = self._predict_outcomes({}, intervention) + base_target = base_outcome.get(target, 0.0) + + sensitivities: Dict[str, float] = {} + elasticities: Dict[str, float] = {} + + for var, val in intervention.items(): + # Perturb: x + ε·e + perturbed_intervention = intervention.copy() + perturbed_intervention[var] = val + perturbation_size + + # Compute sensitivity: S = (y(x+ε) - y(x)) / ε + perturbed_outcome = self._predict_outcomes({}, perturbed_intervention) + perturbed_target = perturbed_outcome.get(target, 0.0) + + sensitivity = (perturbed_target - base_target) / perturbation_size + sensitivities[var] = float(sensitivity) + + # Elasticity: E = (∂y/∂x)·(x/y) = S·(x/y) + if abs(base_target) > 1e-6 and abs(val) > 1e-6: + elasticity = sensitivity * (val / base_target) + elasticities[var] = float(elasticity) + else: + elasticities[var] = 0.0 + + # Total sensitivity (L2 norm of gradient): ||∇y||₂ = √(Σᵢ Sᵢ²) + sensitivity_vector = np.array(list(sensitivities.values())) + total_sensitivity = float(np.linalg.norm(sensitivity_vector)) + + # Most influential (highest absolute sensitivity) + most_influential = max(sensitivities.items(), key=lambda x: abs(x[1])) if sensitivities else None + + return { + "sensitivities": sensitivities, + "elasticities": elasticities, + "total_sensitivity": total_sensitivity, + "most_influential_variable": most_influential[0] if most_influential else None, + "most_influential_sensitivity": most_influential[1] if most_influential else 0.0, + } + + def vectorized_batch_prediction( + self, + initial_state: Dict[str, float], + intervention_batch: List[Dict[str, float]], + ) -> np.ndarray: + """ + Vectorized batch prediction for efficiency. + + Computes predictions for multiple interventions in parallel using vectorized operations. + Much faster than looping through interventions individually. 
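+
+        A usage sketch:
+
+            batch = [{"x": 1.0}, {"x": 2.0}, {"x": 3.0}]
+            preds = agent.vectorized_batch_prediction({"x": 0.0, "y": 0.0}, batch)
+            # One row per intervention; columns follow sorted variable order.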
+ + Mathematical: y_batch = f(X_batch) where X_batch is matrix of interventions + + Args: + initial_state: Base state + intervention_batch: List of interventions to predict + + Returns: + Array of predicted outcomes (one row per intervention) + """ + if not intervention_batch: + return np.array([]) + + # Extract all variables + all_vars = set(initial_state.keys()) + for inter in intervention_batch: + all_vars.update(inter.keys()) + + all_vars = sorted(list(all_vars)) + n_interventions = len(intervention_batch) + n_vars = len(all_vars) + + # Build intervention matrix: X[i, j] = intervention i's value for variable j + X = np.zeros((n_interventions, n_vars)) + for i, inter in enumerate(intervention_batch): + for j, var in enumerate(all_vars): + X[i, j] = inter.get(var, initial_state.get(var, 0.0)) + + # Vectorized predictions (for now, use batched calls) + # Future: could vectorize the entire SCM forward pass + predictions = [] + for inter in intervention_batch: + outcome = self._predict_outcomes(initial_state, inter) + predictions.append([outcome.get(var, 0.0) for var in all_vars]) + + return np.array(predictions) + + def bayesian_edge_inference( + self, + df: Any, + parent: str, + child: str, + prior_mu: float = 0.0, + prior_sigma: float = 1.0, + ) -> Dict[str, Any]: + """ + Bayesian inference for edge strength using conjugate prior. + + Mathematical formulation: + - Prior: β ~ N(μ₀, σ²₀) + - Likelihood: y | β, X ~ N(Xβ, σ²) + - Posterior: β | y, X ~ N(μₙ, σ²ₙ) + - Posterior mean: μₙ = (σ²₀X'X + σ²I)⁻¹(σ²₀X'X μ̂_OLS + σ²μ₀) + - Posterior variance: σ²ₙ = (σ²₀⁻¹ + (X'X)/σ²)⁻¹ + + Args: + df: Data + parent: Source variable + child: Target variable + prior_mu: Prior mean μ₀ + prior_sigma: Prior standard deviation σ₀ + + Returns: + Posterior mean, variance, credible intervals + """ + if df is None or parent not in df.columns or child not in df.columns: + return {"error": "Invalid data or variables"} + + data = df[[parent, child]].dropna() + if len(data) < 5: + return {"error": "Insufficient data"} + + X = data[parent].values.reshape(-1, 1) + y = data[child].values + + # Standardize + X_mean, X_std = X.mean(), X.std() or 1.0 + y_mean, y_std = y.mean(), y.std() or 1.0 + X_norm = (X - X_mean) / X_std + y_norm = (y - y_mean) / y_std + + # OLS estimate: β̂_OLS = (X'X)⁻¹X'y + XtX = X_norm.T @ X_norm + Xty = X_norm.T @ y_norm + beta_ols = (np.linalg.pinv(XtX) @ Xty)[0] + + # Likelihood variance: σ² = (1/n)Σ(y - Xβ̂)² + residuals = y_norm - X_norm @ np.array([beta_ols]) + sigma_sq = float(np.var(residuals)) + + # Bayesian update: posterior parameters + # Precision: τ = 1/σ² + tau_likelihood = 1.0 / (sigma_sq + 1e-6) # Likelihood precision + tau_prior = 1.0 / (prior_sigma ** 2) # Prior precision + + # Posterior precision: τ_posterior = τ_prior + τ_likelihood + tau_posterior = tau_prior + tau_likelihood * len(data) + + # Posterior mean: μ_posterior = (τ_prior·μ₀ + τ_likelihood·n·β̂_OLS) / τ_posterior + mu_posterior = (tau_prior * prior_mu + tau_likelihood * len(data) * beta_ols) / tau_posterior + + # Posterior variance: σ²_posterior = 1/τ_posterior + sigma_posterior_sq = 1.0 / tau_posterior + sigma_posterior = np.sqrt(sigma_posterior_sq) + + # Credible intervals (95%): [μ - 1.96σ, μ + 1.96σ] + ci_lower = mu_posterior - 1.96 * sigma_posterior + ci_upper = mu_posterior + 1.96 * sigma_posterior + + # Store prior for future use + self.bayesian_priors[(parent, child)] = { + "mu": float(prior_mu), + "sigma": float(prior_sigma) + } + + return { + "posterior_mean": float(mu_posterior), + "posterior_std": 
float(sigma_posterior), + "posterior_variance": float(sigma_posterior_sq), + "credible_interval_95": (float(ci_lower), float(ci_upper)), + "ols_estimate": float(beta_ols), + "prior_mu": float(prior_mu), + "prior_sigma": float(prior_sigma), + } + + def add_interaction_term( + self, + node: str, + parent1: str, + parent2: str, + interaction_strength: float = 0.0, + ) -> None: + """ + Add non-linear interaction term: y = ... + γ·x₁·x₂ + + Mathematical: interaction effect = γ·x₁·x₂ where γ is interaction coefficient + + Args: + node: Child variable + parent1: First parent + parent2: Second parent + interaction_strength: Interaction coefficient γ + """ + if node not in self.interaction_terms: + self.interaction_terms[node] = [] + self.interaction_terms[node].append((parent1, parent2)) + + # Store interaction strength in graph edge data + if self.causal_graph.has_edge(parent1, node): + if 'interaction_strength' not in self.causal_graph[parent1][node]: + self.causal_graph[parent1][node]['interaction_strength'] = {} + self.causal_graph[parent1][node]['interaction_strength'][parent2] = interaction_strength + + def clear_cache(self) -> None: + """Clear prediction cache to free memory.""" + self._prediction_cache.clear() + self._entropy_cache.clear() + self._mi_cache.clear() + + def _predict_outcomes_cached( + self, + factual_state: Dict[str, float], + interventions: Dict[str, float], + ) -> Dict[str, float]: + """ + Cached version of _predict_outcomes for performance. + + Uses hash-based caching to avoid recomputing identical predictions. + Cache key: hash of (sorted factual_state.items(), sorted interventions.items()) + """ + if not self._cache_enabled: + return self._predict_outcomes(factual_state, interventions) + + # Create cache key from state and interventions (sorted for consistency) + state_key = tuple(sorted(factual_state.items())) + inter_key = tuple(sorted(interventions.items())) + cache_key = (state_key, inter_key) + + # Check cache + if cache_key in self._prediction_cache: + return self._prediction_cache[cache_key].copy() + + # Compute and cache (call with use_cache=False to avoid recursion) + result = self._predict_outcomes(factual_state, interventions, use_cache=False) + + # LRU eviction if cache too large + if len(self._prediction_cache) >= self._cache_max_size: + # Remove oldest 10% of entries (simple FIFO approximation) + keys_to_remove = list(self._prediction_cache.keys())[:self._cache_max_size // 10] + for k in keys_to_remove: + del self._prediction_cache[k] + + self._prediction_cache[cache_key] = result.copy() + return result + + def granger_causality_test( + self, + df: Any, + var1: str, + var2: str, + max_lag: int = 4, + ) -> Dict[str, Any]: + """ + Granger causality test: does var1 help predict var2? 
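+
+        Example (sketch; assumes df is a pandas DataFrame of time series with
+        columns "D" and "O"):
+
+            res = agent.granger_causality_test(df, var1="D", var2="O", max_lag=3)
+            if "error" not in res:
+                print(res["interpretation"], res["p_value"])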
+ + Mathematical formulation: + - Restricted model: y_t = α + Σᵢ₌₁ᵐ βᵢ·y_{t-i} + ε_t + - Unrestricted model: y_t = α + Σᵢ₌₁ᵐ βᵢ·y_{t-i} + Σᵢ₌₁ᵐ γᵢ·x_{t-i} + ε_t + - F-statistic: F = [(RSS_r - RSS_u)/m] / [RSS_u/(n-2m-1)] + - H₀: var1 does not Granger-cause var2 (γᵢ = 0 for all i) + + Args: + df: Time series data + var1: Potential cause variable + var2: Outcome variable + max_lag: Maximum lag to test + + Returns: + F-statistic, p-value, Granger causality decision + """ + if df is None or var1 not in df.columns or var2 not in df.columns: + return {"error": "Invalid data or variables"} + + data = df[[var1, var2]].dropna() + if len(data) < max_lag * 2 + 5: + return {"error": "Insufficient data"} + + from scipy.stats import f as f_dist + + # Prepare lagged variables + n = len(data) + X_lags = [] # Lagged var2 (restricted model) + X_unrestricted = [] # Lagged var2 + lagged var1 (unrestricted) + y = [] + + for t in range(max_lag, n): + y.append(data[var2].iloc[t]) + + # Restricted: only lags of var2 + restricted_row = [data[var2].iloc[t-i] for i in range(1, max_lag+1)] + X_lags.append(restricted_row) + + # Unrestricted: lags of var2 + lags of var1 + unrestricted_row = restricted_row + [data[var1].iloc[t-i] for i in range(1, max_lag+1)] + X_unrestricted.append(unrestricted_row) + + X_lags = np.array(X_lags) + X_unrestricted = np.array(X_unrestricted) + y = np.array(y) + + # Fit restricted model: y ~ lags(var2) + # β_r = (X_r'X_r)⁻¹ X_r'y + try: + XrTXr = X_lags.T @ X_lags + XrTy = X_lags.T @ y + beta_r = np.linalg.pinv(XrTXr) @ XrTy + y_pred_r = X_lags @ beta_r + rss_r = float(np.sum((y - y_pred_r) ** 2)) # Restricted residual sum of squares + + # Fit unrestricted model: y ~ lags(var2) + lags(var1) + XuTXu = X_unrestricted.T @ X_unrestricted + XuTy = X_unrestricted.T @ y + beta_u = np.linalg.pinv(XuTXu) @ XuTy + y_pred_u = X_unrestricted @ beta_u + rss_u = float(np.sum((y - y_pred_u) ** 2)) # Unrestricted RSS + + # F-statistic: F = [(RSS_r - RSS_u)/m] / [RSS_u/(n-2m-1)] + # where m = number of additional parameters (max_lag) + m = max_lag + n_obs = len(y) + df1 = m # Numerator degrees of freedom + df2 = n_obs - 2 * m - 1 # Denominator degrees of freedom + + if df2 > 0 and rss_u > 1e-10: + f_stat = ((rss_r - rss_u) / m) / (rss_u / df2) + f_stat = float(f_stat) + + # P-value: P(F > f_stat | H₀) + p_value = float(1.0 - f_dist.cdf(f_stat, df1, df2)) + + # Decision: reject H₀ if p < 0.05 + granger_causes = p_value < 0.05 + + return { + "f_statistic": f_stat, + "p_value": float(p_value), + "granger_causes": granger_causes, + "max_lag": max_lag, + "restricted_rss": rss_r, + "unrestricted_rss": rss_u, + "df_numerator": df1, + "df_denominator": df2, + "interpretation": f"{var1} {'does' if granger_causes else 'does not'} Granger-cause {var2}", + } + else: + return {"error": "Degenerate case in F-test"} + except Exception as e: + return {"error": str(e)} + + def vector_autoregression_estimation( + self, + df: Any, + variables: List[str], + max_lag: int = 2, + ) -> Dict[str, Any]: + """ + Estimate Vector Autoregression (VAR) model. + + Mathematical formulation: + - VAR(p): x_t = A₁x_{t-1} + A₂x_{t-2} + ... 
+ A_p x_{t-p} + ε_t + - where x_t is vector of variables, A_i are coefficient matrices + - Estimation: OLS on each equation: x_{i,t} = Σⱼ Σₖ a_{ij,k}·x_{j,t-k} + ε_{i,t} + + Args: + df: Time series data + variables: Variables to include in VAR + max_lag: Lag order p + + Returns: + Coefficient matrices, residuals, model diagnostics + """ + if df is None or len(variables) < 2: + return {"error": "Invalid data or need at least 2 variables"} + + data = df[variables].dropna() + if len(data) < max_lag * len(variables) + 10: + return {"error": "Insufficient data"} + + n_vars = len(variables) + n_obs = len(data) - max_lag + + # Build lagged design matrix + # Each row: [x_{t-1}, x_{t-2}, ..., x_{t-p}] for all variables + X_lag = [] + y_matrix = [] + + for t in range(max_lag, len(data)): + # Dependent variables at time t: y_t + y_row = [data[var].iloc[t] for var in variables] + y_matrix.append(y_row) + + # Lagged predictors: [x_{t-1}, x_{t-2}, ..., x_{t-p}] + lag_row = [] + for lag in range(1, max_lag + 1): + for var in variables: + lag_row.append(data[var].iloc[t - lag]) + X_lag.append(lag_row) + + X_lag = np.array(X_lag) + y_matrix = np.array(y_matrix) + + # Estimate VAR coefficients equation by equation + # For each variable i: y_i = X_lag @ beta_i + ε_i + coefficient_matrices: Dict[str, np.ndarray] = {} + residuals_matrix = [] + + for i, var in enumerate(variables): + y_i = y_matrix[:, i] + + # OLS: β̂_i = (X'X)⁻¹X'y_i + XtX = X_lag.T @ X_lag + Xty = X_lag.T @ y_i + beta_i = np.linalg.pinv(XtX) @ Xty + + # Reshape to matrix form: A_k[i, j] = coefficient of var_j at lag k on var_i + A_matrices = {} + for lag in range(1, max_lag + 1): + A_lag = np.zeros((n_vars, n_vars)) + for j, var_j in enumerate(variables): + idx = (lag - 1) * n_vars + j + if idx < len(beta_i): + A_lag[i, j] = float(beta_i[idx]) + A_matrices[f"A_{lag}"] = A_lag + + coefficient_matrices[var] = { + "coefficients": beta_i, + "A_matrices": A_matrices, + } + + # Residuals: ε_i = y_i - X_lag @ β̂_i + y_pred_i = X_lag @ beta_i + residuals_i = y_i - y_pred_i + residuals_matrix.append(residuals_i) + + residuals_matrix = np.array(residuals_matrix).T # Shape: (n_obs, n_vars) + + # Impulse response: how does shock to var_i affect var_j over time? + # IRF_{j,i}(h) = ∂y_{j,t+h} / ∂ε_{i,t} + # Can be computed from VAR coefficients (simplified here) + + return { + "coefficient_matrices": { + k: {k2: v2.tolist() if isinstance(v2, np.ndarray) else v2 + for k2, v2 in v.items()} + for k, v in coefficient_matrices.items() + }, + "residuals": residuals_matrix.tolist(), + "residual_covariance": np.cov(residuals_matrix.T).tolist(), + "n_observations": n_obs, + "n_variables": n_vars, + "max_lag": max_lag, + "variables": variables, + } + + def impulse_response_analysis( + self, + var_coefficients: Dict[str, Any], + horizon: int = 10, + shock_size: float = 1.0, + ) -> Dict[str, Any]: + """ + Impulse Response Function (IRF): effect of one-time shock on variables over time. 
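+
+        Example (sketch; chains a VAR fit into the IRF, variable names assumed):
+
+            var_fit = agent.vector_autoregression_estimation(df, ["D", "O"], max_lag=2)
+            irf = agent.impulse_response_analysis(var_fit["coefficient_matrices"])
+            path = irf["impulse_responses"]["D"]["O"]  # response of D to a shock in O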
+ + Mathematical formulation: + - IRF_{j,i}(h) = ∂y_{j,t+h} / ∂ε_{i,t} + - Computed recursively from VAR: y_t = Σₖ A_k y_{t-k} + ε_t + - IRF(0) = I (identity), IRF(h) = Σₖ A_k · IRF(h-k) + + Args: + var_coefficients: VAR coefficient matrices from vector_autoregression_estimation + horizon: Time horizon for IRF + shock_size: Size of initial shock + + Returns: + Impulse responses over time horizon + """ + # Extract A matrices + A_matrices = {} + variables = list(var_coefficients.keys()) + n_vars = len(variables) + + # Get max lag from coefficient structure + max_lag = 1 + for var_data in var_coefficients.values(): + if "A_matrices" in var_data: + for A_key in var_data["A_matrices"].keys(): + lag_num = int(A_key.split("_")[1]) + max_lag = max(max_lag, lag_num) + + # Build A_k matrices (average across equations or use first variable's) + first_var = variables[0] + if first_var in var_coefficients and "A_matrices" in var_coefficients[first_var]: + A_matrices = var_coefficients[first_var]["A_matrices"] + else: + return {"error": "Invalid VAR coefficients structure"} + + # Initialize IRF: IRF(0) = I (identity matrix) + # IRF[h][i, j] = response of variable i to shock in variable j at horizon h + irf = [] + irf_0 = np.eye(n_vars) * shock_size # Initial shock matrix + irf.append(irf_0.tolist()) + + # Recursive computation: IRF(h) = Σₖ₌₁^p A_k · IRF(h-k) + # where p is max_lag + for h in range(1, horizon + 1): + irf_h = np.zeros((n_vars, n_vars)) + + for lag in range(1, min(h, max_lag) + 1): + A_key = f"A_{lag}" + if A_key in A_matrices: + A_k = np.array(A_matrices[A_key]) + # IRF(h) += A_k · IRF(h-k) + if h - lag < len(irf): + irf_h += A_k @ np.array(irf[h - lag]) + + irf.append(irf_h.tolist()) + + # Extract IRF paths for each variable pair + irf_paths: Dict[str, Dict[str, List[float]]] = {} + for i, var_i in enumerate(variables): + irf_paths[var_i] = {} + for j, var_j in enumerate(variables): + # Response of var_i to shock in var_j over time + path = [irf[h][i][j] for h in range(horizon + 1)] + irf_paths[var_i][var_j] = [float(x) for x in path] + + return { + "impulse_responses": irf_paths, + "horizon": horizon, + "shock_size": shock_size, + "variables": variables, + "irf_matrix": irf, # Full IRF matrices + } + + def causal_discovery_pc_algorithm( + self, + df: Any, + variables: List[str], + alpha: float = 0.05, + ) -> Dict[str, Any]: + """ + PC algorithm for causal structure discovery (simplified implementation). + + PC algorithm steps: + 1. Start with complete undirected graph + 2. Remove edges if variables are conditionally independent given any subset + 3. Orient edges using v-structure detection + 4. 
Apply orientation rules (Meek's rules)
+
+        Mathematical foundation: d-separation, conditional independence tests
+
+        Args:
+            df: Data
+            variables: Variables to analyze
+            alpha: Significance level for independence tests
+
+        Returns:
+            Learned DAG, edge orientations, independence test results
+        """
+        if df is None or len(variables) < 2:
+            return {"error": "Need at least 2 variables"}
+
+        data = df[variables].dropna()
+        if len(data) < 10:
+            return {"error": "Insufficient data"}
+
+        # Step 1: Start with complete graph (all pairs connected)
+        learned_graph = nx.DiGraph()
+        learned_graph.add_nodes_from(variables)
+
+        # Create undirected complete graph first
+        undirected = nx.Graph()
+        undirected.add_nodes_from(variables)
+        for i, v1 in enumerate(variables):
+            for v2 in variables[i+1:]:
+                undirected.add_edge(v1, v2)
+
+        # Step 2: Test conditional independence, remove edges
+        # Simplified: test I(X;Y|Z) for all conditioning sets Z
+        # Use correlation-based test as proxy for independence
+        edges_to_remove = []
+
+        for v1, v2 in list(undirected.edges()):
+            # Test if v1 and v2 are independent given any subset of other variables
+            others = [v for v in variables if v not in [v1, v2]]
+
+            # Simple test: if partial correlation |ρ_{12|others}| < threshold, remove edge
+            # Partial correlation: correlation after controlling for others
+            try:
+                # Compute partial correlation
+                p_val = None  # no p-value available in the unconditional branch
+                if len(others) == 0:
+                    # No conditioning: use simple correlation
+                    corr = data[[v1, v2]].corr().iloc[0, 1]
+                else:
+                    # Partial correlation approximation
+                    # Simplified: regress v1 and v2 on others, then correlate residuals
+                    from scipy.stats import pearsonr
+
+                    # Residuals after controlling for others
+                    X_others = data[others].values
+                    y1 = data[v1].values
+                    y2 = data[v2].values
+
+                    # Remove linear effect of others
+                    beta1 = np.linalg.pinv(X_others.T @ X_others) @ X_others.T @ y1
+                    beta2 = np.linalg.pinv(X_others.T @ X_others) @ X_others.T @ y2
+
+                    res1 = y1 - X_others @ beta1
+                    res2 = y2 - X_others @ beta2
+
+                    corr, p_val = pearsonr(res1, res2)
+
+                # Remove edge if not significantly correlated (independent)
+                if abs(corr) < 0.1 or (p_val is not None and p_val > alpha):
+                    edges_to_remove.append((v1, v2))
+            except Exception:
+                # Skip pairs where the test is ill-posed (e.g., constant columns)
+                pass
+
+        # Remove edges
+        for v1, v2 in edges_to_remove:
+            if undirected.has_edge(v1, v2):
+                undirected.remove_edge(v1, v2)
+
+        # Step 3: Orient edges (simplified v-structure detection)
+        # If X-Z-Y exists and X and Y are not connected, orient as X→Z←Y (v-structure)
+        for z in variables:
+            neighbors_z = list(undirected.neighbors(z))
+            if len(neighbors_z) >= 2:
+                for i, x in enumerate(neighbors_z):
+                    for y in neighbors_z[i+1:]:
+                        # If X and Y are not neighbors, create v-structure
+                        if not undirected.has_edge(x, y):
+                            learned_graph.add_edge(x, z)
+                            learned_graph.add_edge(y, z)
+
+        # Add remaining undirected edges (arbitrarily orient)
+        for x, y in undirected.edges():
+            if not (learned_graph.has_edge(x, y) or learned_graph.has_edge(y, x)):
+                learned_graph.add_edge(x, y)  # Arbitrary orientation
+
+        return {
+            "learned_dag": learned_graph,
+            "edges": list(learned_graph.edges()),
+            "nodes": list(learned_graph.nodes()),
+            "edges_removed": len(edges_to_remove),
+            "method": "PC_algorithm_simplified",
+        }
+
+    def evolutionary_multi_objective_optimization(
+        self,
+        initial_state: Dict[str, float],
+        objectives: Dict[str, float],  # {var: weight}
+        constraints: Dict[str, Tuple[float, float]],
+        intervention_vars: List[str],
+        population_size: int = 50,
+        generations: int = 100,
+    ) -> Dict[str, Any]:
+        """
+        Evolutionary algorithm 
(NSGA-II inspired) for multi-objective optimization. + + Mathematical foundation: + - Population: P = {x₁, x₂, ..., x_N} (intervention candidates) + - Fitness: f(x) = [f₁(x), f₂(x), ..., fₖ(x)] (objective vector) + - Selection: Tournament selection based on Pareto dominance + - Crossover: Blend crossover: x_new = α·x₁ + (1-α)·x₂ + - Mutation: Gaussian mutation: x_new = x + N(0, σ²) + + Args: + initial_state: Current state + objectives: {variable: weight} to optimize + constraints: {variable: (min, max)} bounds + intervention_vars: Variables to optimize + population_size: Size of population + generations: Number of generations + + Returns: + Pareto front, best solutions, convergence history + """ + # Initialize population + population: List[Dict[str, float]] = [] + for _ in range(population_size): + individual = {} + for var in intervention_vars: + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + current = initial_state.get(var, stats["mean"]) + if var in constraints: + min_val, max_val = constraints[var] + individual[var] = float(self.rng.uniform(min_val, max_val)) + else: + individual[var] = float(self.rng.normal(current, stats["std"])) + population.append(individual) + + pareto_front: List[Dict[str, Any]] = [] + convergence_history: List[float] = [] + + for generation in range(generations): + # Evaluate fitness for all individuals + fitness_scores: List[Dict[str, float]] = [] + for individual in population: + outcome = self._predict_outcomes(initial_state, individual) + fitness = {k: outcome.get(k, 0.0) * weight for k, weight in objectives.items()} + combined = sum(fitness.values()) + fitness_scores.append({ + "individual": individual, + "fitness_vector": fitness, + "combined": combined, + }) + + # Update Pareto front + for fs in fitness_scores: + is_dominated = False + for pf in pareto_front: + pf_fit = pf["fitness_vector"] + fs_fit = fs["fitness_vector"] + + # Check if pf dominates fs + all_better = all( + pf_fit.get(k, 0.0) >= fs_fit.get(k, 0.0) for k in objectives.keys() + ) + some_better = any( + pf_fit.get(k, 0.0) > fs_fit.get(k, 0.0) for k in objectives.keys() + ) + + if all_better and some_better: + is_dominated = True + break + + if not is_dominated: + # Remove dominated points from front + pareto_front = [ + p for p in pareto_front + if not ( + all(fs["fitness_vector"].get(k, 0.0) >= p["fitness_vector"].get(k, 0.0) + for k in objectives.keys()) and + any(fs["fitness_vector"].get(k, 0.0) > p["fitness_vector"].get(k, 0.0) + for k in objectives.keys()) + ) + ] + pareto_front.append(fs) + + # Track convergence (average combined fitness) + avg_fitness = np.mean([fs["combined"] for fs in fitness_scores]) + convergence_history.append(float(avg_fitness)) + + # Selection: tournament selection (simplified) + # Crossover: blend crossover + # Mutation: Gaussian mutation + new_population = [] + while len(new_population) < population_size: + # Tournament selection + idx1 = self.rng.integers(0, len(population)) + idx2 = self.rng.integers(0, len(population)) + parent1 = population[idx1] + parent2 = population[idx2] + + # Crossover: blend (α = random) + alpha = self.rng.random() + child = {} + for var in intervention_vars: + val1 = parent1.get(var, 0.0) + val2 = parent2.get(var, 0.0) + child[var] = float(alpha * val1 + (1 - alpha) * val2) + + # Mutation: Gaussian noise + if self.rng.random() < 0.1: # 10% mutation rate + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + child[var] += float(self.rng.normal(0, stats["std"] * 0.1)) + + # Enforce 
constraints
+                    if var in constraints:
+                        min_val, max_val = constraints[var]
+                        child[var] = float(np.clip(child[var], min_val, max_val))
+
+                new_population.append(child)
+
+            population = new_population
+
+        # Sort Pareto front by combined fitness
+        pareto_front.sort(key=lambda x: x["combined"], reverse=True)
+
+        return {
+            "pareto_front": pareto_front[:20],  # Top 20
+            "best_solution": pareto_front[0] if pareto_front else None,
+            "convergence_history": convergence_history,
+            "final_population_size": len(population),
+            "generations": generations,
+        }
+
+    def shannon_entropy(
+        self,
+        variable: str,
+        df: Any,
+        bins: Optional[int] = None,
+    ) -> float:
+        """
+        Compute Shannon entropy: H(X) = -Σᵢ p(xᵢ) log₂ p(xᵢ)
+
+        Args:
+            variable: Variable name
+            df: Data
+            bins: Number of bins for discretization (auto if None)
+
+        Returns:
+            Entropy value in bits
+        """
+        if df is None or variable not in df.columns:
+            return 0.0
+
+        series = df[variable].dropna()
+        if len(series) < 5:
+            return 0.0
+
+        # Check cache
+        cache_key = f"{variable}_{len(series)}_{bins}"
+        if cache_key in self._entropy_cache:
+            return self._entropy_cache[cache_key]
+
+        # Discretize
+        if bins is None:
+            bins = min(20, max(5, int(np.sqrt(len(series)))))
+
+        hist, _ = np.histogram(series, bins=bins)
+        hist = hist[hist > 0]
+        probs = hist / hist.sum()
+
+        # Shannon entropy
+        entropy = float(-np.sum(probs * np.log2(probs)))
+        self._entropy_cache[cache_key] = entropy
+        return entropy
+
+    def mutual_information(
+        self,
+        var1: str,
+        var2: str,
+        df: Any,
+    ) -> float:
+        """
+        Compute mutual information: I(X;Y) = H(X) + H(Y) - H(X,Y)
+
+        Args:
+            var1: First variable
+            var2: Second variable
+            df: Data
+
+        Returns:
+            Mutual information in bits
+        """
+        if df is None or var1 not in df.columns or var2 not in df.columns:
+            return 0.0
+
+        # Check cache (MI is symmetric, so key on the unordered pair)
+        cache_key = tuple(sorted((var1, var2)))
+        if cache_key in self._mi_cache:
+            return self._mi_cache[cache_key]
+
+        data = df[[var1, var2]].dropna()
+        if len(data) < 10:
+            return 0.0
+
+        # Individual entropies
+        h1 = self.shannon_entropy(var1, df)
+        h2 = self.shannon_entropy(var2, df)
+
+        # Joint entropy: H(X,Y)
+        n_bins = min(10, max(3, int(np.cbrt(len(data)))))
+        hist_2d, _, _ = np.histogram2d(data[var1], data[var2], bins=n_bins)
+        hist_2d = hist_2d[hist_2d > 0]
+        probs_joint = hist_2d / hist_2d.sum()
+        h_joint = float(-np.sum(probs_joint * np.log2(probs_joint)))
+
+        # Mutual information
+        mi = float(max(0.0, h1 + h2 - h_joint))
+        self._mi_cache[cache_key] = mi
+        return mi
+
+    def conditional_mutual_information(
+        self,
+        var1: str,
+        var2: str,
+        condition: str,
+        df: Any,
+    ) -> float:
+        """
+        Approximate conditional mutual information I(X;Y|Z).
+
+        Exact identity: I(X;Y|Z) = H(X,Z) + H(Y,Z) - H(X,Y,Z) - H(Z). The joint
+        entropies are expensive and fragile to estimate on small samples, so a
+        pairwise mutual-information approximation is used instead (see below).
+
+        Args:
+            var1: First variable
+            var2: Second variable
+            condition: Conditioning variable
+            df: Data
+
+        Returns:
+            Conditional MI in bits
+        """
+        if df is None or any(v not in df.columns for v in [var1, var2, condition]):
+            return 0.0
+
+        data = df[[var1, var2, condition]].dropna()
+        if len(data) < 10:
+            return 0.0
+
+        # The exact identity above would require joint entropies over mixed or
+        # continuous columns; fall back to pairwise mutual-information terms.
+        # Simplified: I(X;Y|Z) ≈ I(X;Y) - I(X;Z) - I(Y;Z) + I(X;Y;Z)
+        # Use chain rule 
approximation + mi_xy = self.mutual_information(var1, var2, df) + mi_xz = self.mutual_information(var1, condition, df) + mi_yz = self.mutual_information(var2, condition, df) + + # Chain rule: I(X;Y|Z) = I(X;Y) - I(X;Y;Z) where I(X;Y;Z) is interaction + # Approximation: I(X;Y|Z) ≈ I(X;Y) - min(I(X;Z), I(Y;Z)) + cmi = float(max(0.0, mi_xy - min(mi_xz, mi_yz))) + + return cmi + + def cross_validate_edge_strength( + self, + df: Any, + parent: str, + child: str, + n_folds: int = 5, + ) -> Dict[str, Any]: + """ + Cross-validation for edge strength estimation. + + Mathematical: + - K-fold CV: partition data into K folds + - Train on K-1 folds, test on held-out fold + - CV error: CV = (1/K) Σᵢ₌₁ᴷ MSE_i where MSE_i is mean squared error on fold i + + Args: + df: Data + parent: Source variable + child: Target variable + n_folds: Number of CV folds + + Returns: + CV scores, mean CV error, standard error + """ + if df is None or parent not in df.columns or child not in df.columns: + return {"error": "Invalid data"} + + data = df[[parent, child]].dropna() + if len(data) < n_folds * 3: + return {"error": "Insufficient data for CV"} + + n = len(data) + fold_size = n // n_folds + + cv_errors: List[float] = [] + + for fold in range(n_folds): + # Split: test = fold, train = rest + test_start = fold * fold_size + test_end = (fold + 1) * fold_size if fold < n_folds - 1 else n + + test_indices = list(range(test_start, test_end)) + train_indices = [i for i in range(n) if i not in test_indices] + + train_data = data.iloc[train_indices] + test_data = data.iloc[test_indices] + + if len(train_data) < 5 or len(test_data) < 2: + continue + + # Fit on training data + X_train = train_data[parent].values.reshape(-1, 1) + y_train = train_data[child].values + X_test = test_data[parent].values.reshape(-1, 1) + y_test = test_data[child].values + + # OLS: β = (X'X)⁻¹X'y + XtX = X_train.T @ X_train + Xty = X_train.T @ y_train + beta = (np.linalg.pinv(XtX) @ Xty)[0] + + # Predict on test: ŷ = Xβ + y_pred = X_test @ np.array([beta]) + + # MSE on test fold + mse = float(np.mean((y_test - y_pred) ** 2)) + cv_errors.append(mse) + + if len(cv_errors) == 0: + return {"error": "CV failed"} + + # CV statistics + mean_cv_error = float(np.mean(cv_errors)) + std_cv_error = float(np.std(cv_errors)) + se_cv = std_cv_error / np.sqrt(len(cv_errors)) # Standard error + + return { + "cv_errors": [float(e) for e in cv_errors], + "mean_cv_error": mean_cv_error, + "std_cv_error": std_cv_error, + "standard_error": float(se_cv), + "n_folds": len(cv_errors), + "cv_score": mean_cv_error, # Lower is better + } + + def integrated_gradients_attribution( + self, + baseline_state: Dict[str, float], + target_state: Dict[str, float], + target: str, + n_steps: int = 50, + ) -> Dict[str, float]: + """ + Integrated Gradients for causal attribution: how much does each variable contribute? 
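+
+        Example (sketch; states and target below are assumed names):
+
+            result = agent.integrated_gradients_attribution(
+                baseline_state={"x1": 0.0, "x2": 0.0},
+                target_state={"x1": 1.0, "x2": 0.5},
+                target="y",
+                n_steps=25,
+            )
+            print(result["attributions"])  # signed shares; |values| sum to ~1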
+ + Mathematical formulation: + - IG_i = (x_i - x_i^0) · ∫₀¹ [∂f/∂x_i](x^0 + t·(x - x^0)) dt + - Approximated: IG_i ≈ (x_i - x_i^0) · (1/m) Σⱼ₌₁ᵐ [∂f/∂x_i](x^0 + (j/m)·(x - x^0)) + - Attribution: A_i = IG_i / Σⱼ IGⱼ (normalized) + + Args: + baseline_state: Reference state (x^0) + target_state: Target state (x) + target: Outcome variable + n_steps: Number of integration steps + + Returns: + Attributions for each variable + """ + # Variables that differ between baseline and target + diff_vars = [ + v for v in set(list(baseline_state.keys()) + list(target_state.keys())) + if abs(baseline_state.get(v, 0.0) - target_state.get(v, 0.0)) > 1e-6 + ] + + if not diff_vars: + return {} + + integrated_gradients: Dict[str, float] = {} + + for var in diff_vars: + x0 = baseline_state.get(var, 0.0) + x1 = target_state.get(var, 0.0) + delta = x1 - x0 + + if abs(delta) < 1e-6: + integrated_gradients[var] = 0.0 + continue + + # Integrate gradient along path: x(t) = x^0 + t·(x - x^0), t ∈ [0,1] + grad_sum = 0.0 + + for step in range(1, n_steps + 1): + t = step / n_steps # t ∈ [0,1] + + # Interpolated state: x(t) = x^0 + t·(x - x^0) + interpolated_state = baseline_state.copy() + for v in diff_vars: + v0 = baseline_state.get(v, 0.0) + v1 = target_state.get(v, 0.0) + interpolated_state[v] = v0 + t * (v1 - v0) + + # Compute gradient: ∂f/∂x_i at interpolated state + # Use finite differences + epsilon = abs(delta) * 1e-4 + perturbed_state = interpolated_state.copy() + perturbed_state[var] += epsilon + + outcome_base = self._predict_outcomes({}, interpolated_state) + outcome_pert = self._predict_outcomes({}, perturbed_state) + + grad = (outcome_pert.get(target, 0.0) - outcome_base.get(target, 0.0)) / epsilon + grad_sum += grad + + # Integrated gradient: IG = delta · average_gradient + avg_grad = grad_sum / n_steps + ig = delta * avg_grad + integrated_gradients[var] = float(ig) + + # Normalize attributions + total_ig = sum(abs(v) for v in integrated_gradients.values()) + if total_ig > 1e-6: + attributions = {k: float(v / total_ig) for k, v in integrated_gradients.items()} + else: + attributions = {k: 0.0 for k in integrated_gradients.keys()} + + return { + "integrated_gradients": integrated_gradients, + "attributions": attributions, # Normalized to sum to 1 + "total_attribution": float(sum(abs(v) for v in attributions.values())), + } + + def bellman_optimal_intervention( + self, + initial_state: Dict[str, float], + target: str, + intervention_vars: List[str], + horizon: int = 5, + discount: float = 0.9, + ) -> Dict[str, Any]: + """ + Dynamic Programming (Bellman optimality) for optimal intervention sequence. 
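+
+        Example (sketch; a short horizon keeps the sampled search cheap):
+
+            plan = agent.bellman_optimal_intervention(
+                initial_state={"x": 0.0, "y": 0.0},
+                target="y",
+                intervention_vars=["x"],
+                horizon=3,
+            )
+            for step, u in enumerate(plan["optimal_sequence"]):
+                print(step, u)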
+ + Mathematical formulation: + - Value function: V*(x) = max_u [r(x,u) + γ·V*(f(x,u))] + - Optimal policy: π*(x) = argmax_u [r(x,u) + γ·V*(f(x,u))] + - Backward induction: solve V*(x) from terminal time backwards + + Args: + initial_state: Starting state + target: Variable to maximize + intervention_vars: Available interventions + horizon: Time horizon T + discount: Discount factor γ ∈ [0,1] + + Returns: + Optimal policy, value function, intervention sequence + """ + # Discretize state space (simplified: use current state as reference) + # Value function: V_t(x) = value at time t in state x + value_function: Dict[int, Dict[Tuple, float]] = {} + policy: Dict[int, Dict[Tuple, Dict[str, float]]] = {} + + # Terminal condition: V_T(x) = r(x) (immediate reward) + # Reward: r(x) = target_value(x) + def reward(state: Dict[str, float]) -> float: + outcome = self._predict_outcomes({}, state) + return float(outcome.get(target, 0.0)) + + # Backward induction: from T down to 0 + # For each time t from T-1 down to 0: + for t in range(horizon - 1, -1, -1): + # Simplified: evaluate at current state (could expand to full state space) + state_key = tuple(sorted(initial_state.items())) + + if t == horizon - 1: + # Terminal: V_T(x) = r(x) + value_function[t] = {state_key: reward(initial_state)} + policy[t] = {state_key: {}} + else: + # Bellman: V_t(x) = max_u [r(x) + γ·V_{t+1}(f(x,u))] + best_value = float("-inf") + best_intervention: Dict[str, float] = {} + + # Search intervention space (simplified: sample candidates) + for _ in range(20): + candidate_intervention = {} + for var in intervention_vars: + stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + current = initial_state.get(var, stats["mean"]) + candidate_intervention[var] = float(self.rng.normal(current, stats["std"] * 0.5)) + + # Next state: f(x, u) + next_state = self._predict_outcomes(initial_state, candidate_intervention) + next_key = tuple(sorted(next_state.items())) + + # Immediate reward + r = reward(next_state) + + # Future value: γ·V_{t+1}(f(x,u)) + if t + 1 in value_function and next_key in value_function[t + 1]: + future_val = value_function[t + 1][next_key] + else: + future_val = 0.0 + + # Total value: r + γ·V_{t+1} + total_value = r + discount * future_val + + if total_value > best_value: + best_value = total_value + best_intervention = candidate_intervention + + value_function[t] = {state_key: best_value} + policy[t] = {state_key: best_intervention} + + # Extract optimal sequence + optimal_sequence: List[Dict[str, float]] = [] + current_state = initial_state.copy() + + for t in range(horizon): + state_key = tuple(sorted(current_state.items())) + if t in policy and state_key in policy[t]: + intervention = policy[t][state_key] + optimal_sequence.append(intervention) + current_state = self._predict_outcomes(current_state, intervention) + + return { + "optimal_sequence": optimal_sequence, + "value_function": { + t: {str(k): v for k, v in vf.items()} + for t, vf in value_function.items() + }, + "policy": { + t: {str(k): v for k, v in p.items()} + for t, p in policy.items() + }, + "total_value": float(value_function.get(0, {}).get(tuple(sorted(initial_state.items())), 0.0)), + "horizon": horizon, + "discount_factor": discount, + } + + def shapley_value_attribution( + self, + baseline_state: Dict[str, float], + target_state: Dict[str, float], + target: str, + ) -> Dict[str, float]: + """ + Shapley values for fair attribution: marginal contribution of each variable. 
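+
+        Note: the sum enumerates every subset of the remaining variables, so the
+        cost is O(2^n) value-function evaluations per variable; keep n small.
+
+        Example (sketch; variable names assumed):
+
+            shap = agent.shapley_value_attribution(
+                baseline_state={"x1": 0.0, "x2": 0.0},
+                target_state={"x1": 1.0, "x2": 1.0},
+                target="y",
+            )
+            print(shap["shapley_values"])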
+ + Mathematical formulation: + - Shapley value: φᵢ = Σ_{S ⊆ N\{i}} [|S|!(n-|S|-1)!/n!] · [v(S∪{i}) - v(S)] + - where v(S) = outcome with variables in S set to target, others to baseline + - Fair attribution: satisfies efficiency, symmetry, dummy, additivity + + Args: + baseline_state: Baseline (all variables at baseline) + target_state: Target (all variables at target) + target: Outcome variable + + Returns: + Shapley values for each variable + """ + variables = list(set(list(baseline_state.keys()) + list(target_state.keys()))) + n = len(variables) + + if n == 0: + return {} + + shapley_values: Dict[str, float] = {var: 0.0 for var in variables} + + # Compute value function: v(S) = outcome when S are set to target, rest to baseline + def value_function(subset: set) -> float: + state = baseline_state.copy() + for var in subset: + if var in target_state: + state[var] = target_state[var] + outcome = self._predict_outcomes({}, state) + return float(outcome.get(target, 0.0)) + + # Compute Shapley value for each variable + for var in variables: + phi_i = 0.0 + + # Sum over all subsets S not containing var + others = [v for v in variables if v != var] + + # For each subset size + for subset_size in range(len(others) + 1): + # Generate all subsets of size subset_size + from itertools import combinations + + for subset in combinations(others, subset_size): + S = set(subset) + + # Weight: |S|!(n-|S|-1)!/n! + s_size = len(S) + weight = (math.factorial(s_size) * math.factorial(n - s_size - 1)) / math.factorial(n) + + # Marginal contribution: v(S∪{i}) - v(S) + S_with_i = S | {var} + marginal = value_function(S_with_i) - value_function(S) + + phi_i += weight * marginal + + shapley_values[var] = float(phi_i) + + return { + "shapley_values": shapley_values, + "total_attribution": float(sum(shapley_values.values())), + "normalized": {k: float(v / sum(abs(vi) for vi in shapley_values.values()) if sum(abs(vi) for vi in shapley_values.values()) > 0 else 0.0) + for k, v in shapley_values.items()}, + } From 258c3dce08f0d835cea1cec7f7b357e31ca69735 Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 4 Nov 2025 02:41:23 +0200 Subject: [PATCH 03/12] Added Logistical agent with CRCA --- .../logistics/crca_supply_shock_agent.py | 1887 +++++++++++++++++ 1 file changed, 1887 insertions(+) create mode 100644 examples/demos/logistics/crca_supply_shock_agent.py diff --git a/examples/demos/logistics/crca_supply_shock_agent.py b/examples/demos/logistics/crca_supply_shock_agent.py new file mode 100644 index 00000000..3cee1163 --- /dev/null +++ b/examples/demos/logistics/crca_supply_shock_agent.py @@ -0,0 +1,1887 @@ +import math +from dataclasses import dataclass +from typing import Dict, List, Tuple, Optional, Any + +import numpy as np +import pandas as pd +from loguru import logger +import json +import re +import warnings + +from swarms import Agent +from swarms.agents import CRCAAgent + + +SUPPLY_AGENT_PROMPT = """ +You are an expert supply chain analyst with deep knowledge of multi-echelon inventory, logistics, and robust control. +You analyze telemetry and SCM outputs, apply causal reasoning, and propose safe, actionable interventions. + +Data-awareness: +- Consider lead time (L), survival/transport factor (phi), capacity (K), backlog (B), inventory (I), demand (D), orders (O), receipts (R), price (p). +- Reference learned causal edges when explaining recommendations (e.g., B→p+, I→p−, dcost→p+, L→R−, D→O+). 
+ +Uncertainty and risk: +- Note regime shifts or drift (EWMA/CUSUM/BOCPD). Prefer conservative actions when uncertainty is high. +- Propose z_alpha updates, reroute/expedite shares with CVaR-style caution and execution realism. + +Guardrails: +- Avoid claims beyond the data window. Keep recommendations feasible under capacity and service constraints. +- Prefer stable signals and explain trade-offs (service vs. cost vs. bullwhip). + +Output structure (always include these 7 sections): +1) Drivers: succinct causal drivers (e.g., L↑→R↓→I↓→B↑→p↑; dcost↑→p↑→D↓) +2) Regime/Alerts: note EWMA/CUSUM/BOCPD, utilization, and stability +3) Proposal: recommended z_alpha, reroute/expedite, and rationale +4) Expected Impact: service, cost proxy, bullwhip changes (direction and rough magnitude) +5) Risks/Uncertainty: cite instability or wide uncertainty; suggest mitigations +6) Counterfactuals: 1–2 do()-style scenarios and expected KPI shifts +7) Actionables: concrete next steps and monitoring items + +Learned DAG alignment: +- Mirror the learned DAG strengths exactly in your explanation. Do not claim effects whose learned strength is ~0. If L→R≈0 or R→I≈0, reflect that and avoid relying on those edges. Base rationale on the actual learned edges provided. + +After the 7 sections, you MUST output a final JSON object on a new line with the exact schema: +{ + "proposal": {"z_alpha_new": number, "reroute_share": number, "expedite_share": number, "dual_source_share": number}, + "notes": string, + "expected_deltas": {"service": number, "cost_proxy": number, "bullwhip": number}, + "ci80": {"service": [low, high], "cost_proxy": [low, high], "bullwhip": [low, high]}, + "feasible": boolean +} +Numbers should be in [0, 3] for z_alpha_new, [0, 1] for shares. +""" + + +@dataclass +class SKUKey: + sku: str + facility: str + + +@dataclass +class PolicyParams: + z_alpha: float = 1.28 # base safety factor (approx 90%) + theta_smoothing: float = 0.35 # order smoothing parameter + + +@dataclass +class Elasticities: + eta_c: float = 0.3 # pass-through elasticity to price from cost changes + eta_B: float = 0.5 # price increases with backlog + eta_I: float = 0.3 # price decreases with inventory + + +class SupplyShockCRCAgent: + """CR-CA Supply-Shock Agent for multi-period inventory flows and interventions. + + Implements SCM flow, queueing-derived lead times, pricing pass-through, and + integrates CRCAAgent for causal analysis and do()-counterfactuals. 
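+
+    Example (illustrative sketch; assumes LLM credentials are configured for
+    the embedded narrative/causal agents):
+
+        skus = [SKUKey(sku="A", facility="F1"), SKUKey(sku="B", facility="F2")]
+        agent = SupplyShockCRCAgent(skus, T=24)
+        df = agent.simulate()
+        print(agent.summarize(df))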
+ """ + + def __init__( + self, + skus: List[SKUKey], + T: int = 60, + policy: PolicyParams = PolicyParams(), + el: Elasticities = Elasticities(), + seed: int = 7, + ) -> None: + self.skus = skus + self.T = T + self.policy = policy + self.el = el + self.rng = np.random.default_rng(seed) + + # Core data containers (panel: period x (sku,facility)) + index = pd.MultiIndex.from_tuples( + [(t, k.sku, k.facility) for t in range(T) for k in skus], + names=["t", "sku", "facility"], + ) + self.df = pd.DataFrame(index=index) + + # Initialize states with simple priors + self.df["D"] = self.rng.poisson(100, len(self.df)) # demand + self.df["I"] = 120.0 # on-hand + self.df["B"] = 0.0 # backorder + self.df["P"] = 80.0 # pipeline + self.df["O"] = 0.0 # orders placed + self.df["R"] = 0.0 # receipts + self.df["K"] = 1e6 # facility capacity (big default) + self.df["phi"] = 1.0 # spoilage/survival fraction + self.df["L"] = self.rng.integers(1, 4, len(self.df)).astype(float) # lead time in periods (float for updates) + self.df["c"] = 10.0 # unit cost + self.df["dcost"] = 0.0 # cost change + self.df["p_bar"] = 15.0 + self.df["p"] = self.df["p_bar"] + self.df["D_ref"] = 100.0 + + # CR-CA causal layer + self.crca = CRCAAgent( + name="crca-supply-shock", + description="Causal layer for supply shocks and policy", + model_name="gpt-4o-mini", + max_loops=2, + ) + self._build_causal_graph() + + # VSM overlay components (S2-S5) + self.vsm = VSMOverlay() + + # Narrative LLM agent (graceful init) + try: + self.agent = Agent( + agent_name="CRCA-Supply-Shock-Agent", + system_prompt=SUPPLY_AGENT_PROMPT, + model_name="gpt-4o", + max_loops=1, + autosave=False, + dashboard=True, + verbose=False, + dynamic_temperature_enabled=True, + context_length=200000, + output_type="string", + streaming_on=False, + ) + except Exception as e: + logger.warning(f"LLM Agent init failed (narrative disabled): {e}") + self.agent = None + + # Feasibility config and last applied controls + self.lane_capacity: float = 0.35 # max share sum for reroute+expedite+dual_source per cycle + self.max_weekly_change: Dict[str, float] = {"z_alpha_new": 0.3, "reroute_share": 0.15, "expedite_share": 0.15, "dual_source_share": 0.2} + self.last_controls: Dict[str, float] = {"z_alpha_new": self.policy.z_alpha, "reroute_share": 0.0, "expedite_share": 0.0, "dual_source_share": 0.0} + # KPI normalization scalers + self.kpi_units = {"service": "%", "cost_proxy": "currency", "bullwhip": "ratio"} + self.cost_unit_multiplier = 1.0 + # KPI/action history and RL weights + self.kpi_history: List[Dict[str, float]] = [] + self.action_history: List[Dict[str, float]] = [] + self.mpc_weights: Dict[str, float] = {"service": 1.0, "cost": 1.0, "bullwhip": 0.5} + # Dynamic data feeds + self._feeds: Dict[str, Any] = {} + # Direct pricing lever (applied as an offset to p_bar during simulate) + self._price_adjust: float = 0.0 + + # ===== Helper: logistics lever support from learned DAG ===== + def _logistics_support_from_strengths(self, strengths: Dict[str, float], tol: float = 0.05) -> bool: + keys = ["L->R", "phi->R", "K->R"] + return any(abs(float(strengths.get(k, 0.0))) > tol for k in keys) + + # ===== Helper: calibrate z to target service via short grid search ===== + def calibrate_z_to_service(self, target_service: float = 0.95, z_grid: Optional[np.ndarray] = None) -> float: + if z_grid is None: + z_grid = np.linspace(0.8, 2.6, 10) + best_z = self.policy.z_alpha + best_val = float("inf") + # Snapshot current policy + z_prev = self.policy.z_alpha + try: + for z in z_grid: + 
self.policy.z_alpha = float(z) + df = self.simulate() + kpi = self.summarize(df) + # distance to target with slight cost penalty to avoid extreme z + val = abs(float(kpi.get("service_level", 0.0)) - target_service) + 0.01 * max(0.0, float(kpi.get("cost_proxy", 0.0))) + if val < best_val: + best_val = val + best_z = float(z) + finally: + self.policy.z_alpha = z_prev + return best_z + + # ===== Helper: minimal Pareto grid on (z, r, e) ===== + def pareto_front(self, base_z: float, allow_logistics: bool, trials: int = 30, allow_price: bool = False) -> List[Dict[str, Any]]: + z_vals = np.clip(np.linspace(base_z - 0.2, base_z + 0.2, 5), 0.5, 3.0) + r_vals = [0.0, 0.05, 0.1] if allow_logistics else [0.0] + e_vals = [0.0, 0.05, 0.1] if allow_logistics else [0.0] + p_vals = [0.0, -0.5, -1.0] if allow_price else [0.0] + points: List[Dict[str, Any]] = [] + for z in z_vals: + for r in r_vals: + for e in e_vals: + for p in p_vals: + imp = self._quantified_impact(float(z), float(r), float(e), trials=trials, price_adjust=float(p)) + exp = imp.get("expected", {}) + points.append({ + "z_alpha_new": float(z), + "reroute_share": float(r), + "expedite_share": float(e), + "price_adjust": float(p), + "expected": exp, + "ci80": imp.get("ci80", {}), + "cvar_loss": imp.get("cvar_loss", 0.0), + }) + # Pareto filter: maximize service, minimize cost and bullwhip + def dominates(a: Dict[str, Any], b: Dict[str, Any]) -> bool: + ea, eb = a["expected"], b["expected"] + svc_a, cost_a, bw_a = ea.get("service", 0.0), ea.get("cost_proxy", 0.0), ea.get("bullwhip", 0.0) + svc_b, cost_b, bw_b = eb.get("service", 0.0), eb.get("cost_proxy", 0.0), eb.get("bullwhip", 0.0) + return (svc_a >= svc_b and cost_a <= cost_b and bw_a <= bw_b) and (svc_a > svc_b or cost_a < cost_b or bw_a < bw_b) + pareto: List[Dict[str, Any]] = [] + for p in points: + if not any(dominates(q, p) for q in points if q is not p): + pareto.append(p) + return pareto + + def z_service_curve(self, z_values: Optional[np.ndarray] = None) -> List[Dict[str, float]]: + if z_values is None: + z_values = np.linspace(0.8, 2.6, 10) + curve: List[Dict[str, float]] = [] + z_prev = self.policy.z_alpha + try: + for z in z_values: + self.policy.z_alpha = float(z) + df = self.simulate() + k = self.summarize(df) + curve.append({"z": float(z), "service": float(k.get("service_level", 0.0)), "cost_proxy": float(k.get("cost_proxy", 0.0))}) + finally: + self.policy.z_alpha = z_prev + return curve + + # ===== Real-world KPI ingestion ===== + def ingest_kpis(self, kpis: Dict[str, float]) -> None: + """Ingest external KPIs (e.g., service %, cost, bullwhip) and store history.""" + safe = { + "service": float(kpis.get("service", np.nan)), + "cost_proxy": float(kpis.get("cost_proxy", np.nan)), + "bullwhip": float(kpis.get("bullwhip", np.nan)), + } + self.kpi_history.append(safe) + + # ===== Dynamic data feeds ===== + def register_feed(self, name: str, fetch_fn: Any) -> None: + """Register a callable that returns dicts to merge into df or KPIs.""" + self._feeds[name] = fetch_fn + + def poll_feeds(self) -> Dict[str, Any]: + """Poll all feeds and merge into state; return a snapshot of updates.""" + updates: Dict[str, Any] = {} + for name, fn in list(self._feeds.items()): + try: + data = fn() + updates[name] = data + # If KPI-like, ingest; else if dataframe-like keys, merge shallowly + if isinstance(data, dict) and set(["service", "cost_proxy", "bullwhip"]).issubset(set(data.keys())): + self.ingest_kpis(data) + # Extend here to merge time-series; keeping simple for now + except Exception as e: 
+ updates[name] = {"error": str(e)} + return updates + + # ===== Action validation and rollback ===== + def validate_and_rollback( + self, + new_kpis: Dict[str, float], + thresholds: Dict[str, float] = None, + ) -> Dict[str, Any]: + """Validate last applied action against fresh KPIs; rollback if violated. + + thresholds: {"min_service_gain": 0.0, "max_cost_increase": 0.0, "max_bullwhip_increase": 0.0} + """ + if thresholds is None: + thresholds = {"min_service_gain": 0.0, "max_cost_increase": 0.0, "max_bullwhip_increase": 0.0} + if not self.kpi_history: + self.ingest_kpis(new_kpis) + return {"rolled_back": False, "reason": "no_baseline"} + prev = self.kpi_history[-1] + self.ingest_kpis(new_kpis) + ds = float(new_kpis.get("service", 0.0) - (prev.get("service", 0.0) if prev.get("service") is not None else 0.0)) + dc = float(new_kpis.get("cost_proxy", 0.0) - (prev.get("cost_proxy", 0.0) if prev.get("cost_proxy") is not None else 0.0)) + db = float(new_kpis.get("bullwhip", 0.0) - (prev.get("bullwhip", 0.0) if prev.get("bullwhip") is not None else 0.0)) + violate = (ds < thresholds["min_service_gain"]) or (dc > thresholds["max_cost_increase"]) or (db > thresholds["max_bullwhip_increase"]) + if violate and self.action_history: + # rollback: revert to previous controls, dampen risky knobs + last = self.action_history[-1] + self.policy.z_alpha = float(last.get("z_alpha_prev", self.policy.z_alpha)) + self.last_controls["z_alpha_new"] = self.policy.z_alpha + for k in ["reroute_share", "expedite_share", "dual_source_share"]: + self.last_controls[k] = max(0.0, self.last_controls.get(k, 0.0) * 0.5) + return {"rolled_back": True, "reason": "threshold_violation", "delta": {"service": ds, "cost": dc, "bullwhip": db}} + return {"rolled_back": False, "reason": "ok", "delta": {"service": ds, "cost": dc, "bullwhip": db}} + + # ===== Reinforcement-based self-tuning ===== + def reinforce_from_outcome(self, expected: Dict[str, float]) -> Dict[str, float]: + """Update MPC weights from outcome using a simple reward: r = dS - a*max(0,dC) - b*max(0,dB).""" + dS = float(expected.get("service", 0.0)) + dC = float(expected.get("cost_proxy", 0.0)) + dB = float(expected.get("bullwhip", 0.0)) + a, b, lr = 1.0, 0.5, 0.1 + reward = dS - a * max(0.0, dC) - b * max(0.0, dB) + # Increase emphasis on service if reward positive; else increase cost/bullwhip penalty + if reward >= 0: + self.mpc_weights["service"] = float(min(2.0, self.mpc_weights.get("service", 1.0) + lr * reward)) + self.mpc_weights["cost"] = float(max(0.2, self.mpc_weights.get("cost", 1.0) * (1.0 - 0.05))) + else: + self.mpc_weights["cost"] = float(min(2.0, self.mpc_weights.get("cost", 1.0) + lr * (-reward))) + self.mpc_weights["bullwhip"] = float(min(2.0, self.mpc_weights.get("bullwhip", 0.5) + lr * 0.5 * (-reward))) + return dict(self.mpc_weights) + + def _feasible(self, proposal: Dict[str, Any]) -> bool: + rr = float(proposal.get("reroute_share", 0.0)) + ex = float(proposal.get("expedite_share", 0.0)) + ds = float(proposal.get("dual_source_share", 0.0)) + if rr < 0 or ex < 0: + return False + if rr + ex + ds > self.lane_capacity: + return False + # rate limits + for k, cap in self.max_weekly_change.items(): + prev = float(self.last_controls.get(k, 0.0)) + cur = float(proposal.get(k, prev)) + if abs(cur - prev) > cap: + return False + return True + + def _quantified_impact(self, z_new: float, rr: float, ex: float, trials: int = 100, price_adjust: float = 0.0, alpha: float = 0.9) -> Dict[str, Any]: + # Run small Monte Carlo by injecting noise on D and L; 
measure KPI deltas
+        base = self.simulate()
+        base_kpi = self.summarize(base)
+        deltas = []
+        rng = self.rng
+        # Snapshot controls and state so the per-trial tweaks below do not
+        # compound across trials and the agent is left unchanged afterwards
+        saved_price_adj = self._price_adjust
+        z_prev = self.policy.z_alpha
+        phi_base = self.df["phi"].copy()
+        L_base = self.df["L"].copy()
+        D_base = self.df["D"].copy()
+        for _ in range(trials):
+            # stochastic shocks: small multiplicative jitter on demand and lead
+            # time (5%/10% scales are illustrative defaults)
+            noise_D = rng.normal(0.0, 0.05, size=len(self.df))
+            noise_L = rng.normal(0.0, 0.1, size=len(self.df))
+            self.df["D"] = np.maximum(0.0, D_base * (1.0 + noise_D))
+            self.policy.z_alpha = z_new
+            # approximate expedite/reroute: reduce L and increase phi within shares
+            self.df["phi"] = np.clip(phi_base * (1.0 + 0.1 * rr), 0.2, 1.2)
+            self.df["L"] = np.clip(L_base * (1.0 - 0.2 * ex) * (1.0 + noise_L), 1.0, None)
+            self._price_adjust = float(price_adjust)
+            sim = self.simulate(interventions=None)
+            kpi = self.summarize(sim)
+            deltas.append({
+                "service": float(kpi["service_level"] - base_kpi["service_level"]),
+                "cost_proxy": float(kpi["cost_proxy"] - base_kpi["cost_proxy"]),
+                "bullwhip": float(kpi["bullwhip"] - base_kpi["bullwhip"]),
+            })
+        # restore controls and state
+        self._price_adjust = saved_price_adj
+        self.policy.z_alpha = z_prev
+        self.df["phi"] = phi_base
+        self.df["L"] = L_base
+        self.df["D"] = D_base
+        # Aggregate
+        svc = np.array([d["service"] for d in deltas])
+        cst = np.array([d["cost_proxy"] for d in deltas])
+        bwe = np.array([d["bullwhip"] for d in deltas])
+        def ci80(arr: np.ndarray) -> Tuple[float, float]:
+            return float(np.quantile(arr, 0.1)), float(np.quantile(arr, 0.9))
+        def ci95(arr: np.ndarray) -> Tuple[float, float]:
+            return float(np.quantile(arr, 0.025)), float(np.quantile(arr, 0.975))
+        loss = cst - svc + bwe
+        thr = float(np.quantile(loss, alpha))
+        cvar = float(loss[loss >= thr].mean()) if np.any(loss >= thr) else float(loss.mean())
+        return {
+            "expected": {"service": float(np.mean(svc)), "cost_proxy": float(np.mean(cst)), "bullwhip": float(np.mean(bwe))},
+            "ci80": {"service": ci80(svc), "cost_proxy": ci80(cst), "bullwhip": ci80(bwe)},
+            "ci95": {"service": ci95(svc), "cost_proxy": ci95(cst), "bullwhip": ci95(bwe)},
+            "samples": {"service": svc.tolist(), "cost_proxy": cst.tolist(), "bullwhip": bwe.tolist()},
+            "cvar_alpha": alpha,
+            "cvar_loss": cvar,
+        }
+
+    # ===== CVaR grid minimizer (discrete neighborhood search) =====
+    def cvar_select_from_grid(
+        self,
+        base: Dict[str, float],
+        alpha: float = 0.9,
+        eps: float = 0.05,
+        trials: int = 40,
+        weights: Optional[Dict[str, float]] = None,
+    ) -> Dict[str, Any]:
+        """Pick among a small grid around base (z,r,e,ds) to minimize CVaR_alpha of loss. 
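+
+        Example (sketch; minimizes the tail of the loss defined below):
+
+            pick = agent.cvar_select_from_grid(
+                base={"z_alpha_new": 1.3, "reroute_share": 0.05,
+                      "expedite_share": 0.0, "dual_source_share": 0.0},
+                alpha=0.9,
+                trials=20,
+            )
+            print(pick["choice"], pick["cvar"])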
+ + loss = w_cost*Δcost - w_service*Δservice + w_bw*Δbullwhip + """ + if weights is None: + weights = {"cost": 1.0, "service": 1.0, "bullwhip": 0.5} + z0 = float(base.get("z_alpha_new", self.policy.z_alpha)) + r0 = float(base.get("reroute_share", 0.0)) + e0 = float(base.get("expedite_share", 0.0)) + ds0 = float(base.get("dual_source_share", 0.0)) + cand = [ + {"z": z0, "r": r0, "e": e0}, + {"z": z0+eps, "r": r0, "e": e0}, + {"z": z0, "r": r0+eps, "e": e0}, + {"z": z0, "r": r0, "e": e0+eps}, + {"z": z0-eps, "r": r0, "e": e0}, + ] + best = None + best_val = float("inf") + tail_q = alpha + for c in cand: + imp = self._quantified_impact(c["z"], c["r"], c["e"], trials=trials) + svc = np.array(imp["samples"]["service"]) # Δservice + cst = np.array(imp["samples"]["cost_proxy"]) # Δcost + bwe = np.array(imp["samples"]["bullwhip"]) # Δbullwhip + loss = weights["cost"] * cst - weights["service"] * svc + weights["bullwhip"] * bwe + thresh = np.quantile(loss, tail_q) + cvar = float(loss[loss >= thresh].mean()) if np.any(loss >= thresh) else float(loss.mean()) + if cvar < best_val: + best_val = cvar + best = {"z_alpha_new": c["z"], "reroute_share": c["r"], "expedite_share": c["e"], "dual_source_share": ds0} + return {"choice": best, "cvar": best_val, "alpha": alpha} + + @staticmethod + def _extract_final_json(text: str) -> Optional[Dict[str, Any]]: + try: + # Find the last JSON-like block with required keys + matches = re.findall(r"\{[\s\S]*?\}", text) + for chunk in reversed(matches): + if '"proposal"' in chunk and '"z_alpha_new"' in chunk: + return json.loads(chunk) + except Exception: + return None + return None + + @staticmethod + def _validate_proposal(p: Dict[str, Any]) -> Optional[Dict[str, float]]: + try: + z = float(np.clip(float(p.get("z_alpha_new")), 0.0, 3.0)) + rr = float(np.clip(float(p.get("reroute_share")), 0.0, 1.0)) + ex = float(np.clip(float(p.get("expedite_share")), 0.0, 1.0)) + return {"z_alpha_new": z, "reroute_share": rr, "expedite_share": ex} + except Exception: + return None + + def _llm_decision_loop( + self, + panel: pd.DataFrame, + s2: Dict[str, Any], + proposal: Optional[Dict[str, Any]], + decision: Dict[str, Any], + strengths: Dict[str, float], + kpis: Dict[str, Any], + rounds: int = 3, + ) -> Tuple[str, Optional[Dict[str, Any]]]: + if self.agent is None: + return "analysis_unavailable: agent_not_initialized", proposal + + alerts = s2.get("alerts", []) + ai_out: Any = "" + for r in range(rounds): + # Edge guidance for narration + top_edges = sorted(strengths.items(), key=lambda kv: abs(kv[1]), reverse=True)[:5] + weak_edges = [k for k, v in strengths.items() if abs(v) <= 0.05] + narrative_prompt = ( + f"Round {r+1}/{rounds}. Analyze state and propose safe actions.\n" + f"KPIs: service={kpis.get('service_level', 0.0):.2f}, cost_proxy={kpis.get('cost_proxy', 0.0):.2f}, bullwhip={kpis.get('bullwhip', 0.0):.2f}.\n" + f"Alerts: {alerts}.\n" + f"Current proposal: {proposal}. Decision: {decision}.\n" + f"Causal edges (use these): {dict(top_edges)}; avoid near-zero edges: {weak_edges}.\n" + f"Provide the 7-section output and the final JSON exactly per schema." 
+ ) + try: + ai_out = self.agent.run(narrative_prompt) + except Exception as e: + return f"analysis_unavailable: {e}", proposal + llm_json = self._extract_final_json(str(ai_out)) if isinstance(ai_out, str) else None + if llm_json and isinstance(llm_json.get("proposal"), dict): + validated = self._validate_proposal(llm_json["proposal"]) + if validated: + proposal = {**validated, "source": "llm"} + decision = self.vsm.s5_policy_gate(proposal, s2, self.vsm.s3_star_audit(panel), risk_cap_cvar=0.15) + return str(ai_out), proposal + + def _build_causal_graph(self) -> None: + g = self.crca.causal_graph + g.clear() + vars_graph = [ + "L", # lead time + "phi", # survival/transport factor + "K", # capacity + "dcost", + "B", # backlog + "I", # inventory + "p", # price + "D", # demand + "O", # orders + "R", # receipts + ] + g.add_nodes_from(vars_graph) + # Structural influences (signs where sensible) + self.crca.add_causal_relationship("K", "R", strength=0.0) # more cap -> more receipts + self.crca.add_causal_relationship("phi", "R", strength=0.0) # more survival -> more receipts + self.crca.add_causal_relationship("L", "R", strength=0.0) # longer lead -> lower timely receipts + self.crca.edge_sign_constraints[("L", "R")] = -1 + + self.crca.add_causal_relationship("B", "p", strength=0.0) # backlog -> higher price + self.crca.edge_sign_constraints[("B", "p")] = 1 + self.crca.add_causal_relationship("I", "p", strength=0.0) # inventory -> lower price + self.crca.edge_sign_constraints[("I", "p")] = -1 + self.crca.add_causal_relationship("dcost", "p", strength=0.0) # cost pass-through + self.crca.edge_sign_constraints[("dcost", "p")] = 1 + + self.crca.add_causal_relationship("p", "D", strength=0.0) # pricing impacts demand + self.crca.edge_sign_constraints[("p", "D")] = -1 + self.crca.add_causal_relationship("D", "O", strength=0.0) # more demand -> more orders + self.crca.edge_sign_constraints[("D", "O")] = 1 + self.crca.add_causal_relationship("R", "I", strength=0.0) + self.crca.edge_sign_constraints[("R", "I")] = 1 + self.crca.add_causal_relationship("D", "B", strength=0.0) + self.crca.edge_sign_constraints[("D", "B")] = 1 + + @staticmethod + def _relu(x: float) -> float: + return float(max(0.0, x)) + + def _arrivals(self, O_hist: List[float], L_hist: List[int], phi_hist: List[float], t: int) -> float: + """Receipts at t: sum 1[L=ell]*O[t-ell]*phi[t-ell->t].""" + total = 0.0 + for ell in range(1, min(10, t + 1)): + if L_hist[t] == ell: + total += O_hist[t - ell] * phi_hist[t - ell] + return total + + def _queueing_leadtime(self, lam: float, mu: float, transport: float = 0.0) -> float: + rho = min(0.95, lam / max(mu, 1e-6)) + wq = (rho / (mu * max(1e-6, (1 - rho)))) if rho < 0.999 else 10.0 + return wq + (1.0 / max(mu, 1e-6)) + transport + + def _price_pass_through(self, p_bar: float, dcost: float, B: float, I: float, D_ref: float) -> float: + return ( + p_bar + + self.el.eta_c * dcost + + self.el.eta_B * (B / max(D_ref, 1e-6)) + - self.el.eta_I * (I / max(D_ref, 1e-6)) + ) + + def simulate(self, interventions: Optional[Dict[str, Any]] = None) -> pd.DataFrame: + """Run minimal multi-period SCM with optional do()-style interventions. + + interventions: dict with keys like {'outage_facility': {'F1': 1}, 'disruption_route': {'R1': 1}} + For simplicity, treat interventions as shocks to K (capacity), L (lead), and phi. 
+ """ + df = self.df.copy() + # Initialize per (sku,facility) + for (sku, fac), sub in df.groupby(level=["sku", "facility" ]): + O = [0.0] * self.T + R = [0.0] * self.T + I = [float(sub.iloc[0]["I"])] + [0.0] * (self.T - 1) + B = [float(sub.iloc[0]["B"])] + [0.0] * (self.T - 1) + P = [float(sub.iloc[0]["P"])] + [0.0] * (self.T - 1) + L_hist = [int(sub.iloc[min(i, len(sub)-1)]["L"]) for i in range(self.T)] + phi_hist = [float(sub.iloc[min(i, len(sub)-1)]["phi"]) for i in range(self.T)] + K_hist = [float(sub.iloc[min(i, len(sub)-1)]["K"]) for i in range(self.T)] + + # Apply high-level interventions (if any) + for t in range(self.T): + if interventions: + if interventions.get("outage_facility", {}).get(fac, 0) == 1: + K_hist[t] = K_hist[t] * 0.7 # 30% capacity loss + if interventions.get("disruption_route", {}).get(fac, 0) == 1: + L_hist[t] = max(1, L_hist[t] + 1) + phi_hist[t] = max(0.2, phi_hist[t] * 0.8) + + # Period loop + for t in range(self.T): + # Demand and cost dynamics (toy): + D_t = float(sub.iloc[t]["D"]) if t < len(sub) else 100.0 + dcost_t = float(sub.iloc[t]["dcost"]) if t < len(sub) else 0.0 + pbar = (float(sub.iloc[t]["p_bar"]) if t < len(sub) else 15.0) + float(self._price_adjust) + + # Receipts from earlier orders + R[t] = self._arrivals(O, L_hist, phi_hist, t) + + # Shipments and inventory/backorders + S_t = min(I[t - 1] + (R[t] if t > 0 else 0.0), D_t + (B[t - 1] if t > 0 else 0.0)) + if t > 0: + I[t] = I[t - 1] + R[t] - S_t + B[t] = max(0.0, D_t + B[t - 1] - (I[t - 1] + R[t])) + + # Demand response to price + p_t = self._price_pass_through(pbar, dcost_t, B[t], I[t], float(sub.iloc[0]["D_ref"])) + # Simple log-linear elasticity around reference + D_t_eff = max(0.0, D_t * math.exp(-0.01 * (p_t - pbar))) + + # Lead-time estimate (M/M/1 rough cut) + lam = D_t_eff + mu = max(1e-6, K_hist[t] / max(1.0, len(self.skus))) + L_eff = max(1.0, self._queueing_leadtime(lam, mu, transport=float(L_hist[t]) - 1.0)) + + # Base-stock target and orders + POS_t = I[t] + P[t] + muL = L_eff + sigL = 0.5 * muL + target = muL * D_t_eff + self.policy.z_alpha * sigL * math.sqrt(max(1e-6, D_t_eff)) + O_policy = self._relu(target - POS_t) + # Order smoothing + O_prev = O[t - 1] if t > 0 else 0.0 + O[t] = (1 - self.policy.theta_smoothing) * O_prev + self.policy.theta_smoothing * O_policy + + # Update pipeline (very simplified) + if t < self.T - 1: + P[t + 1] = max(0.0, P[t] + O[t] - R[t]) + + # Capacity constraint (aggregate receipts) + R[t] = min(R[t], K_hist[t]) + + # Write back to df + df.loc[(t, sku, fac), ["R", "I", "B", "O", "p", "L", "phi", "K"]] = [ + R[t], I[t], B[t], O[t], p_t, L_eff, phi_hist[t], K_hist[t] + ] + + return df + + # ===== Reporting ===== + def summarize(self, df: pd.DataFrame) -> Dict[str, Any]: + out: Dict[str, Any] = {} + # Simple KPIs + service = 1.0 - (df["B"].groupby(level="t").mean() > 0).mean() + holding_cost = df["I"].clip(lower=0).mean() * 0.1 + shortage_penalty = df["B"].mean() * 1.0 + ordering_cost = df["O"].mean() * df["c"].mean() + cost = holding_cost + shortage_penalty + ordering_cost + bwe = float((df["O"].var() / max(df["D"].var(), 1e-6))) + out["service_level"] = float(service) + out["cost_proxy"] = float(cost) + out["bullwhip"] = bwe + return out + + # ===== Causal runs (Upgraded) ===== + def causal_edges(self, df: pd.DataFrame) -> Dict[str, float]: + """Fit causal edges and return strengths, now with enhanced analysis.""" + # Fit on panel averages per t + panel = df.groupby(level="t").mean(numeric_only=True) + vars_fit = [c for c in ["L", "phi", "K", 
"dcost", "B", "I", "p", "D", "O", "R"] if c in panel.columns] + try: + self.crca.fit_from_dataframe(panel, variables=vars_fit, window=min(30, len(panel)), decay_alpha=0.9, ridge_lambda=0.1) + except Exception as e: + logger.warning(f"CRCA fit skipped: {e}") + strengths = {} + for u, v in self.crca.causal_graph.edges(): + strengths[f"{u}->{v}"] = float(self.crca.causal_graph[u][v].get("strength", 0.0)) + return strengths + + def advanced_causal_analysis(self, df: pd.DataFrame) -> Dict[str, Any]: + """Run comprehensive advanced causal analysis using all upgraded CR-CA methods.""" + panel = df.groupby(level="t").mean(numeric_only=True) + vars_fit = [c for c in ["L", "phi", "K", "dcost", "B", "I", "p", "D", "O", "R"] if c in panel.columns] + + # Fit causal graph first + try: + self.crca.fit_from_dataframe(panel, variables=vars_fit, window=min(30, len(panel)), decay_alpha=0.9, ridge_lambda=0.1) + except Exception as e: + logger.warning(f"CRCA fit skipped: {e}") + return {"error": str(e)} + + # Get latest state for analysis + latest = panel.iloc[-1] if len(panel) > 0 else {} + factual_state = {var: float(latest.get(var, 0.0)) for var in vars_fit if var in latest} + + # ========== UPGRADED METHODS ========== + results: Dict[str, Any] = { + "causal_strengths": {}, + "sensitivity_analysis": {}, + "granger_causality": {}, + "information_theory": {}, + "var_model": {}, + "bayesian_edges": {}, + "root_causes": {}, + "shapley_attribution": {}, + "whatif_analysis": {}, + "optimal_intervention": {}, + "alternate_realities": {}, + } + + # Get causal strengths + for u, v in self.crca.causal_graph.edges(): + results["causal_strengths"][f"{u}->{v}"] = float(self.crca.causal_graph[u][v].get("strength", 0.0)) + + # 1. Sensitivity Analysis: What drives service/cost changes most? + try: + if len(factual_state) >= 4: + intervention_vars = [v for v in ["L", "phi", "K", "dcost", "B"] if v in factual_state][:4] + test_intervention = {k: factual_state.get(k, 0.0) for k in intervention_vars} + + # Analyze sensitivity to service (via B→p→D chain) and cost + sensitivity_service = self.crca.sensitivity_analysis( + intervention=test_intervention, + target="B", # Backlog affects service + perturbation_size=0.01, + ) + sensitivity_cost = self.crca.sensitivity_analysis( + intervention={k: v for k, v in test_intervention.items() if k in ["dcost", "L", "phi"]}, + target="p", # Price affects cost + perturbation_size=0.01, + ) + results["sensitivity_analysis"] = { + "service_drivers": sensitivity_service, + "cost_drivers": sensitivity_cost, + } + logger.info(f"Sensitivity: service={sensitivity_service.get('most_influential_variable', 'N/A')}, cost={sensitivity_cost.get('most_influential_variable', 'N/A')}") + except Exception as e: + logger.debug(f"Sensitivity analysis failed: {e}") + + # 2. 
Granger Causality: Temporal causal relationships + try: + if len(panel) >= 20: + # Test if demand Granger-causes orders + granger_d_o = self.crca.granger_causality_test( + df=panel, + var1="D", + var2="O", + max_lag=3, + ) + # Test if backlog Granger-causes price + granger_b_p = self.crca.granger_causality_test( + df=panel, + var1="B", + var2="p", + max_lag=2, + ) + results["granger_causality"] = { + "demand_granger_causes_orders": granger_d_o.get("granger_causes", False), + "backlog_granger_causes_price": granger_b_p.get("granger_causes", False), + "d_o_f_stat": granger_d_o.get("f_statistic", 0.0), + "b_p_f_stat": granger_b_p.get("f_statistic", 0.0), + } + logger.info(f"Granger causality: D→O={granger_d_o.get('granger_causes', False)}, B→p={granger_b_p.get('granger_causes', False)}") + except Exception as e: + logger.debug(f"Granger causality test failed: {e}") + + # 3. Information Theoretic Measures + try: + if len(panel) >= 10: + core_vars = [v for v in ["D", "O", "B", "I", "p", "L"] if v in panel.columns] + if len(core_vars) >= 3: + info_theory = self.crca.compute_information_theoretic_measures( + df=panel, + variables=core_vars, + ) + results["information_theory"] = info_theory + logger.info(f"Information theory: {len(info_theory.get('entropies', {}))} entropies computed") + except Exception as e: + logger.debug(f"Information theory computation failed: {e}") + + # 4. VAR Model: Vector Autoregression + try: + if len(panel) >= 30: + var_vars = [v for v in ["D", "O", "I", "B", "p"] if v in panel.columns] + if len(var_vars) >= 2: + var_model = self.crca.vector_autoregression_estimation( + df=panel, + variables=var_vars, + max_lag=2, + ) + results["var_model"] = var_model + logger.info(f"VAR model: {var_model.get('n_variables', 0)} variables, lag={var_model.get('max_lag', 0)}") + except Exception as e: + logger.debug(f"VAR estimation failed: {e}") + + # 5. Bayesian Edge Inference + try: + bayesian_edges = {} + key_edges = [("B", "p"), ("I", "p"), ("dcost", "p"), ("D", "O"), ("L", "R")] + for parent, child in key_edges: + if parent in panel.columns and child in panel.columns: + bayes_result = self.crca.bayesian_edge_inference( + df=panel, + parent=parent, + child=child, + prior_mu=0.0, + prior_sigma=1.0, + ) + if "error" not in bayes_result: + bayesian_edges[f"{parent}->{child}"] = { + "posterior_mean": bayes_result.get("posterior_mean", 0.0), + "posterior_std": bayes_result.get("posterior_std", 0.0), + "credible_interval": bayes_result.get("credible_interval_95", (0.0, 0.0)), + } + results["bayesian_edges"] = bayesian_edges + if bayesian_edges: + logger.info(f"Bayesian inference for {len(bayesian_edges)} edges") + except Exception as e: + logger.debug(f"Bayesian inference failed: {e}") + + # 6. Deep Root Cause Analysis: Find ultimate drivers of service/cost issues + try: + root_causes_service = self.crca.deep_root_cause_analysis( + problem_variable="B", # Backlog is service issue + max_depth=8, + min_path_strength=0.01, + ) + root_causes_cost = self.crca.deep_root_cause_analysis( + problem_variable="p", # Price is cost proxy + max_depth=8, + min_path_strength=0.01, + ) + results["root_causes"] = { + "service_issues": root_causes_service, + "cost_issues": root_causes_cost, + } + if root_causes_service.get("ultimate_root_causes"): + logger.info(f"Root causes (service): {[rc.get('root_cause') for rc in root_causes_service.get('ultimate_root_causes', [])[:3]]}") + except Exception as e: + logger.debug(f"Root cause analysis failed: {e}") + + # 7. 
Shapley Value Attribution: Fair attribution of KPI drivers + try: + if len(panel) >= 7: + # Baseline: average over last week + baseline_state = { + k: float(panel[k].tail(7).mean()) + for k in factual_state.keys() + if k in panel.columns + } + if baseline_state and "B" in baseline_state: + shapley_backlog = self.crca.shapley_value_attribution( + baseline_state=baseline_state, + target_state=factual_state, + target="B", + ) + if "p" in baseline_state: + shapley_price = self.crca.shapley_value_attribution( + baseline_state=baseline_state, + target_state=factual_state, + target="p", + ) + results["shapley_attribution"] = { + "backlog_drivers": shapley_backlog, + "price_drivers": shapley_price, + } + logger.info(f"Shapley attribution computed for B and p") + except Exception as e: + logger.debug(f"Shapley attribution failed: {e}") + + # 8. Multi-layer What-If Analysis: Cascading effects of disruptions + try: + test_scenarios = [ + {"L": factual_state.get("L", 2.0) * 1.5}, # Lead time disruption + {"phi": max(0.2, factual_state.get("phi", 1.0) * 0.7)}, # Survival rate drop + {"dcost": factual_state.get("dcost", 0.0) + 2.0}, # Cost shock + ] + whatif_analysis = self.crca.multi_layer_whatif_analysis( + scenarios=test_scenarios, + depth=3, + ) + results["whatif_analysis"] = whatif_analysis + logger.info(f"What-if analysis: {whatif_analysis.get('summary', {}).get('total_scenarios', 0)} scenarios") + except Exception as e: + logger.debug(f"What-if analysis failed: {e}") + + # 9. Optimal Intervention Sequence: Bellman optimization + try: + optimal_intervention = self.crca.bellman_optimal_intervention( + initial_state=factual_state, + target="B", # Minimize backlog (maximize service) + intervention_vars=["L", "phi", "K", "dcost"], + horizon=5, + discount=0.9, + ) + results["optimal_intervention"] = optimal_intervention + if optimal_intervention.get("optimal_sequence"): + logger.info(f"Optimal intervention sequence: {len(optimal_intervention['optimal_sequence'])} steps") + except Exception as e: + logger.debug(f"Optimal intervention failed: {e}") + + # 10. Explore Alternate Realities: Best intervention scenarios + try: + alternate_realities = self.crca.explore_alternate_realities( + factual_state=factual_state, + target_outcome="B", # Minimize backlog + target_value=0.0, # Target zero backlog + max_realities=30, + max_interventions=3, + ) + results["alternate_realities"] = alternate_realities + if alternate_realities.get("best_reality"): + improvement = factual_state.get("B", 0.0) - alternate_realities["best_reality"].get("target_value", 0.0) + logger.info(f"Best alternate reality: {improvement:+.2f} backlog reduction") + except Exception as e: + logger.debug(f"Alternate realities exploration failed: {e}") + + # 11. Cascading Chain Reaction Analysis + try: + if "L" in factual_state: + chain_reaction = self.crca.analyze_cascading_chain_reaction( + initial_intervention={"L": factual_state.get("L", 2.0) * 1.5}, + target_outcomes=["B", "I", "O", "p", "D"], + max_hops=6, + include_feedback_loops=True, + num_iterations=4, + ) + results["chain_reaction"] = chain_reaction + logger.info(f"Chain reaction analysis: {chain_reaction.get('summary', {}).get('total_paths_found', 0)} paths") + except Exception as e: + logger.debug(f"Chain reaction analysis failed: {e}") + + # 12. 
Cross-validation for edge strength reliability + try: + cv_results = {} + for parent, child in [("B", "p"), ("D", "O"), ("L", "R")]: + if parent in panel.columns and child in panel.columns: + cv = self.crca.cross_validate_edge_strength( + df=panel, + parent=parent, + child=child, + n_folds=5, + ) + if "error" not in cv: + cv_results[f"{parent}->{child}"] = { + "mean_cv_error": cv.get("mean_cv_error", 0.0), + "standard_error": cv.get("standard_error", 0.0), + } + results["cross_validation"] = cv_results + if cv_results: + logger.info(f"Cross-validation for {len(cv_results)} edges") + except Exception as e: + logger.debug(f"Cross-validation failed: {e}") + + return results + + def intervene_and_compare(self, scenario: Dict[str, Any]) -> Dict[str, Any]: + base = self.simulate() + base_kpi = self.summarize(base) + shock = self.simulate(interventions=scenario) + shock_kpi = self.summarize(shock) + delta = {k: float(shock_kpi.get(k, 0.0) - base_kpi.get(k, 0.0)) for k in base_kpi} + return {"base": base_kpi, "shock": shock_kpi, "delta": delta} + + # ===== VSM overlay orchestration ===== + def control_cycle( + self, + telemetry_events: Optional[List[Dict[str, Any]]] = None, + intel_events: Optional[List[Dict[str, Any]]] = None, + ) -> Dict[str, Any]: + """One control cycle over S2–S5: ingest telemetry, monitor, propose, audit, gate.""" + # Ingest telemetry/intel (stubs) + # Dynamic feeds first + _ = self.poll_feeds() + if telemetry_events: + self.vsm.ingest_s1_flow(self.df, telemetry_events) + if intel_events: + self.vsm.ingest_s4_external(intel_events) + + # Simulate baseline for the cycle + df = self.simulate() + panel = df.groupby(level="t").mean(numeric_only=True) + + # S2 stability monitors + s2 = self.vsm.s2_monitor(panel) + + # S3 propose optimizers only if S2 stable + proposal = None + if s2.get("stable", False): + proposal = self.vsm.s3_optimize(panel, self.policy) + # SPC/EWMA-driven mode switch: if EWMA breaches on backlog, bias to higher service target + backlog_alerts = [a for a in s2.get("alerts", []) if a.get("type") == "ewma" and a.get("signal") == "B"] + target_service = 0.95 + (0.02 if backlog_alerts else 0.0) + z_cal = self.calibrate_z_to_service(target_service=target_service) + proposal["z_alpha_new"] = float(z_cal) + + # S3★ audit + audit = self.vsm.s3_star_audit(panel) + + # S5 gate with policy caps (LLM-led proposals are still safety-gated here) + decision = self.vsm.s5_policy_gate(proposal, s2, audit, risk_cap_cvar=0.15) + + # Build causal strengths snapshot and LLM narratives + strengths = self.causal_edges(df) + # Build strength-aware explanation preface + top_edges = sorted(strengths.items(), key=lambda kv: abs(kv[1]), reverse=True)[:5] + explainer = {k: v for k, v in top_edges} + # Compute weak edges to avoid claiming + weak_edges = {k: v for k, v in strengths.items() if abs(v) <= 0.05} + # Prepare concise narrative prompt for the agent + kpis = self.summarize(df) + alerts = s2.get("alerts", []) + proposal_text = str(proposal) if proposal else "None" + decision_text = str(decision) + narrative_prompt = ( + f"Analyze supply chain state and propose safe actions.\n" + f"KPIs: service={kpis.get('service_level', 0.0):.2f}, cost_proxy={kpis.get('cost_proxy', 0.0):.2f}, bullwhip={kpis.get('bullwhip', 0.0):.2f}.\n" + f"Alerts: {alerts}.\n" + f"Proposal: {proposal_text}. 
Decision: {decision_text}.\n" + f"Causal edges (mirror these in explanation): {explainer}.\n" + f"Do NOT claim effects via edges with near-zero strength: {list(weak_edges.keys())}.\n" + f"Provide the 7-section output per instructions." + ) + # Multi-round LLM-led decision loop + ai_analysis, proposal = self._llm_decision_loop( + panel=panel, + s2=s2, + proposal=proposal, + decision=decision, + strengths=strengths, + kpis=kpis, + rounds=3, + ) + + # Feasibility check and quantified impact + feasibility_flag = False + impact = None + if isinstance(proposal, dict): + # Gate logistics levers by learned DAG support + allow_logistics = self._logistics_support_from_strengths(strengths, tol=0.05) + allow_price = (abs(float(strengths.get("B->p", 0.0))) > 0.05) and (abs(float(strengths.get("p->D", 0.0))) > 0.05) + if not allow_logistics: + proposal["reroute_share"] = 0.0 + proposal["expedite_share"] = 0.0 + if not allow_price: + proposal["price_adjust"] = 0.0 + else: + proposal.setdefault("price_adjust", 0.0) + feasibility_flag = self._feasible(proposal) + z_new = float(proposal.get("z_alpha_new", self.policy.z_alpha)) + rr = float(proposal.get("reroute_share", 0.0)) + ex = float(proposal.get("expedite_share", 0.0)) + price_adj = float(proposal.get("price_adjust", 0.0)) + impact = self._quantified_impact(z_new, rr, ex, trials=50, price_adjust=price_adj) + # auto de-risk actions on red tier or excessive cost + if s2.get("tier") == "red" or (impact and impact.get("expected", {}).get("cost_proxy", 0.0) > 0): + # freeze increases to expedite/reroute + proposal["expedite_share"] = min(float(proposal.get("expedite_share", 0.0)), self.last_controls.get("expedite_share", 0.0)) + proposal["reroute_share"] = min(float(proposal.get("reroute_share", 0.0)), self.last_controls.get("reroute_share", 0.0)) + # Optional: refine via constrained MPC if feasible + if feasibility_flag: + mpc = constrained_mpc_policy( + last=self.last_controls, + limits=self.max_weekly_change, + lane_cap=self.lane_capacity, + weights=self.mpc_weights, + impact=impact, + ) + if "error" not in mpc: + proposal.update({k: v for k, v in mpc.items() if k in ["z_alpha_new", "reroute_share", "expedite_share", "dual_source_share"]}) + # Final hard-feasibility polish via CP-SAT + cps = cpsat_policy(self.last_controls, self.max_weekly_change, self.lane_capacity) + if "error" not in cps: + proposal.update({k: v for k, v in cps.items() if k in ["z_alpha_new", "reroute_share", "expedite_share", "dual_source_share"]}) + # CVaR neighborhood selection + cvar_pick = self.cvar_select_from_grid(proposal, alpha=0.9, eps=0.05, trials=30, weights=self.mpc_weights) + if cvar_pick.get("choice"): + proposal.update(cvar_pick["choice"]) + + # UPGRADED: Try gradient-based optimization for refinement + try: + # Use current state as initial for gradient optimization + current_state = { + "z_alpha": z_new, + "reroute_share": rr, + "expedite_share": ex, + "B": float(panel.get("B", pd.Series([0.0])).iloc[-1]), + "I": float(panel.get("I", pd.Series([120.0])).iloc[-1]), + "p": float(panel.get("p", pd.Series([15.0])).iloc[-1]), + } + + # Optimize z_alpha to minimize backlog (via gradient) + if "B" in panel.columns: + opt_result = self.crca.gradient_based_intervention_optimization( + initial_state=current_state, + target="B", # Minimize backlog + intervention_vars=["z_alpha"], + constraints={"z_alpha": (0.5, 3.0)}, + method="L-BFGS-B", + ) + if opt_result.get("success") and opt_result.get("optimal_intervention"): + # Refine z_alpha if gradient optimization suggests 
improvement
+                            opt_z = opt_result["optimal_intervention"].get("z_alpha", z_new)
+                            if abs(opt_z - z_new) < 0.3:  # Within rate limit
+                                proposal["z_alpha_new"] = float(opt_z)
+                                logger.info(f"Gradient optimization refined z_alpha: {z_new:.2f} → {opt_z:.2f}")
+                except Exception as e:
+                    logger.debug(f"Gradient optimization failed: {e}")
+
+                # Provide minimal Pareto frontier for transparency
+                pareto = self.pareto_front(base_z=z_new, allow_logistics=allow_logistics, trials=20, allow_price=allow_price)
+            else:
+                pareto = []
+        else:
+            # Infeasible: rollback immediately
+            if self.action_history:
+                last = self.action_history[-1]
+                self.policy.z_alpha = float(last.get("z_alpha_prev", self.policy.z_alpha))
+                self.last_controls["z_alpha_new"] = self.policy.z_alpha
+                for k in ["reroute_share", "expedite_share", "dual_source_share"]:
+                    self.last_controls[k] = max(0.0, self.last_controls.get(k, 0.0) * 0.5)
+            pareto = []
+
+        # Apply approved proposal to live policy (LLM primacy) after safety gate
+        if isinstance(proposal, dict) and feasibility_flag:
+            decision = self.vsm.s5_policy_gate(proposal, s2, audit, risk_cap_cvar=0.15)
+            if decision.get("approved"):
+                # Capture the pre-update value first so a later rollback can restore it
+                z_alpha_prev = float(self.policy.z_alpha)
+                self.policy.z_alpha = float(proposal.get("z_alpha_new", self.policy.z_alpha))
+                # persist last controls for rate-limit checks
+                self.last_controls = {
+                    "z_alpha_new": self.policy.z_alpha,
+                    "reroute_share": float(proposal.get("reroute_share", 0.0)),
+                    "expedite_share": float(proposal.get("expedite_share", 0.0)),
+                }
+                # record action (with the pre-update z) for possible rollback and RL
+                self.action_history.append({
+                    "z_alpha_prev": z_alpha_prev,
+                    "reroute_share": float(self.last_controls["reroute_share"]),
+                    "expedite_share": float(self.last_controls["expedite_share"]),
+                })
+                if impact and impact.get("expected"):
+                    self.reinforce_from_outcome(impact["expected"])
+
+        # Advanced causal analysis using upgraded methods
+        advanced_causal = {}
+        try:
+            advanced_causal = self.advanced_causal_analysis(df)
+            logger.info(f"Advanced causal analysis completed: {len([k for k, v in advanced_causal.items() if v and 'error' not in str(v)])} methods succeeded")
+        except Exception as e:
+            logger.debug(f"Advanced causal analysis failed: {e}")
+
+        # Human-readable causal summary via CR-CA agent (enhanced with upgraded insights)
+        try:
+            sensitivity_note = ""
+            if advanced_causal.get("sensitivity_analysis"):
+                sens_svc = advanced_causal["sensitivity_analysis"].get("service_drivers", {})
+                sens_cost = advanced_causal["sensitivity_analysis"].get("cost_drivers", {})
+                most_influential_svc = sens_svc.get("most_influential_variable", "N/A")
+                most_influential_cost = sens_cost.get("most_influential_variable", "N/A")
+                sensitivity_note = f" Sensitivity analysis shows {most_influential_svc} most drives service, {most_influential_cost} most drives cost."
+
+            granger_note = ""
+            if advanced_causal.get("granger_causality"):
+                gc = advanced_causal["granger_causality"]
+                if gc.get("demand_granger_causes_orders"):
+                    granger_note = " Granger causality: D→O confirmed. "
+                if gc.get("backlog_granger_causes_price"):
+                    granger_note += "B→p temporally confirmed."
+
+            summary_prompt = (
+                f"Summarize key drivers (B→p, I→p, dcost→p, L→R) and their implications.{sensitivity_note}{granger_note} "
+                f"Reference learned strengths: {dict(list(strengths.items())[:5])}."
+ ) + causal_summary = self.crca.run(summary_prompt) + except Exception as e: + causal_summary = f"causal_unavailable: {e}" + + return { + "s2": s2, + "proposal": proposal, + "audit": audit, + "decision": decision, + "kpis": kpis, + "causal_strengths": strengths, + "ai_analysis": ai_analysis, + "causal_summary": causal_summary, + "feasible": feasibility_flag, + "impact": impact, + "pareto_front": pareto, + "z_service_curve": self.z_service_curve(), + # Upgraded CR-CA analysis results + "advanced_causal": advanced_causal, + # Advanced hooks (stubs returning diagnostics) + "estimation": { + "ms_filter": ms_regime_filter(panel), + "bsts_nowcast": bsts_nowcast(panel), + "svar": svar_identification(panel), + }, + "robust_optimization": { + "dro_mpc": dro_mpc_plan(panel), + "chance_mpc": chance_constrained_mpc(panel), + "h_infinity": h_infinity_controller(panel), + "sddp": sddp_policy_stub(panel), + }, + "multi_echelon": { + "clark_scarf": clark_scarf_baseline(panel), + "risk_newsvendor": risk_averse_newsvendor_stub(panel), + }, + "network_risk": { + "percolation": percolation_stub(panel), + "eisenberg_noe": eisenberg_noe_stub(panel), + "k_cuts": k_cut_sets_stub(), + }, + "pricing": { + "logit": logit_share_stub(panel), + "dp_pricing": dynamic_pricing_dp_stub(panel), + "ramsey": ramsey_pricing_stub(panel), + }, + "policy_eval": { + "synth_control": synthetic_control_stub(panel), + "did_iv": did_iv_stub(panel), + }, + "security": { + "secure_state": secure_state_l1_stub(panel), + "spectral": spectral_shift_stub(panel), + }, + "investment": { + "real_options": real_options_stub(), + "supplier_portfolio": supplier_portfolio_stub(), + }, + "advanced2": { + "transport_modes": transport_modes_sim_stub(), + "online_em_ms": online_em_ms(panel), + "hier_bsts": hierarchical_bsts_stub(panel), + "multi_stage_mpc": multi_stage_mpc_stub(panel), + "iot_fusion": iot_fusion_stub(), + "nested_logit": nested_logit_stub(), + "kcut_hardening": kcut_hardening_stub(), + "linucb_policy": linucb_policy_stub(panel), + "l1_observer": l1_observer_stub(panel), + "fan_charts": fan_charts_stub(panel), + "async_ingest": {"kafka": True, "duckdb": True} + } + } + + +# ===== Viable System Overlay (S2–S5) ===== +class VSMOverlay: + def __init__(self) -> None: + self.state: Dict[str, Any] = {"R_posterior": np.array([1.0])} + + # Telemetry ingest (stubs) + def ingest_s1_flow(self, df: pd.DataFrame, events: List[Dict[str, Any]]) -> None: + # Example event schema documented; here we could append/merge into df + # For now we no-op (upgrade path to Kafka/Timescale later) + pass + + def ingest_s4_external(self, events: List[Dict[str, Any]]) -> None: + # Store the latest intel snapshot + self.state["intel_last"] = events[-1] if events else None + + # S2: Stability/coordination + def s2_monitor(self, panel: pd.DataFrame) -> Dict[str, Any]: + out: Dict[str, Any] = {"alerts": [], "stable": True, "tier": "green"} + # EWMA residuals on key KPIs + for col in [c for c in ["L", "I", "B"] if c in panel.columns]: + z, breaches = ewma_monitor(panel[col].values, lam=0.2, k=3.0) + if breaches > 0: + out["alerts"].append({"type": "ewma", "signal": col, "breaches": breaches}) + # CUSUM on lead time + if "L" in panel.columns: + plus, minus, trips = cusum(panel["L"].values, mu0=float(panel["L"].head(5).mean()), k=0.1, h=5.0) + if trips: + out["alerts"].append({"type": "cusum", "signal": "L", "trips": len(trips)}) + # Page-Hinkley on demand + if "D" in panel.columns and len(panel["D"]) > 20: + ph = page_hinkley(panel["D"].astype(float).values) + if 
ph["alarm"]: + out["alerts"].append({"type": "page_hinkley", "signal": "D", "mT": ph["mT"]}) + # BOCPD change-point minimal + if "D" in panel.columns: + p_break = bocpd_break_prob(panel["D"].values, hazard=0.02) + if p_break > 0.5: + out["alerts"].append({"type": "bocpd", "p_break": p_break}) + # Queueing sanity + if set(["D", "K"]).issubset(panel.columns): + lam = float(max(1e-6, panel["D"].iloc[-1])) + mu = float(max(1e-6, panel["K"].iloc[-1])) + rho = lam / mu + if rho > 0.85: + out["alerts"].append({"type": "utilization", "rho": rho}) + # Stable if few alerts; tiering + n_alerts = len(out["alerts"]) + out["stable"] = n_alerts == 0 + if n_alerts == 0: + out["tier"] = "green" + elif n_alerts < 3: + out["tier"] = "yellow" + else: + out["tier"] = "red" + return out + + # S3: Optimizers (stubs) + def s3_optimize(self, panel: pd.DataFrame, policy: PolicyParams) -> Dict[str, Any]: + # Heuristic constrained optimizer proxy; prefer stability + z = policy.z_alpha + rr = 0.0 + ex = 0.05 + ds = 0.0 + if "B" in panel.columns: + b_trend = float(np.polyfit(np.arange(len(panel)), panel["B"].values, 1)[0]) if len(panel) >= 5 else 0.0 + z = float(np.clip(z + 0.05 * np.sign(b_trend), 0.5, 2.5)) + if self.state.get("intel_last"): + rr = 0.1 + return {"z_alpha_new": z, "reroute_share": rr, "expedite_share": ex, "dual_source_share": ds} + + # S3★: Audit + def s3_star_audit(self, panel: pd.DataFrame) -> Dict[str, Any]: + out: Dict[str, Any] = {} + if set(["O", "D"]).issubset(panel.columns): + varO = float(panel["O"].var()) + varD = float(panel["D"].var()) + out["BWE"] = float(varO / max(varD, 1e-6)) + # Simple receipts cross-check stub (noisy) + out["receipts_delta_sigma"] = 0.0 + return out + + # S5: Policy gate + def s5_policy_gate( + self, + proposal: Optional[Dict[str, Any]], + s2: Dict[str, Any], + audit: Dict[str, Any], + risk_cap_cvar: float = 0.2, + ) -> Dict[str, Any]: + if proposal is None: + return {"approved": False, "reason": "no_proposal"} + if not s2.get("stable", False): + return {"approved": False, "reason": "unstable_S2"} + if audit.get("BWE", 1.0) > 1.3: + # tighten smoothing recommendation by halving expedite/reroute + proposal = {**proposal, "expedite_share": proposal.get("expedite_share", 0.0) * 0.5, "reroute_share": proposal.get("reroute_share", 0.0) * 0.5} + return {"approved": True, "proposal": proposal} + + +# ===== Detectors (S2) ===== +def ewma_monitor(x: np.ndarray, lam: float = 0.2, k: float = 3.0) -> Tuple[np.ndarray, int]: + z = np.zeros_like(x, dtype=float) + z[0] = x[0] + for t in range(1, len(x)): + z[t] = lam * x[t] + (1 - lam) * z[t - 1] + resid = x - z + sigma = np.std(resid[max(1, len(resid)//10):]) or 1.0 + breaches = int(np.sum(np.abs(resid) > k * sigma)) + return z, breaches + + +def cusum(x: np.ndarray, mu0: float, k: float, h: float) -> Tuple[np.ndarray, np.ndarray, List[int]]: + s_plus = np.zeros_like(x, dtype=float) + s_minus = np.zeros_like(x, dtype=float) + trips: List[int] = [] + for t in range(1, len(x)): + s_plus[t] = max(0.0, s_plus[t - 1] + (x[t] - mu0 - k)) + s_minus[t] = max(0.0, s_minus[t - 1] + (mu0 - x[t] - k)) + if s_plus[t] > h or s_minus[t] > h: + trips.append(t) + s_plus[t] = 0.0 + s_minus[t] = 0.0 + return s_plus, s_minus, trips + + +def bocpd_break_prob(x: np.ndarray, hazard: float = 0.02) -> float: + # Minimal BOCPD: approximate break prob by normalized absolute diff of recent means with hazard weight + if len(x) < 10: + return 0.0 + n = len(x) + m1 = float(np.mean(x[: n // 2])) + m2 = float(np.mean(x[n // 2 :])) + delta = abs(m2 - m1) / 
(np.std(x) or 1.0) + p = 1.0 - math.exp(-hazard * delta) + return float(np.clip(p, 0.0, 1.0)) + + +def page_hinkley(x: np.ndarray, delta: float = 0.005, lamb: float = 50.0, alpha: float = 1.0) -> Dict[str, Any]: + # Minimal Page-Hinkley drift detector + mean = 0.0 + mT = 0.0 + MT = 0.0 + alarm = False + for i, xi in enumerate(x): + mean = mean + (xi - mean) / (i + 1) + mT = mT + xi - mean - delta + MT = min(MT, mT) + if mT - MT > lamb * alpha: + alarm = True + break + return {"alarm": alarm, "mT": float(mT)} + + +# ===== Advanced Estimation (stubs) ===== +def ms_regime_filter(panel: pd.DataFrame) -> Dict[str, Any]: + """Two-regime Markov-switching on demand using statsmodels MarkovRegression. + + Returns current regime probabilities and smoothed prediction for next step. + """ + try: + from statsmodels.tsa.regime_switching.markov_regression import MarkovRegression + if "D" not in panel.columns or len(panel) < 20: + return {"regime": "insufficient", "p_regime": {}} + y = panel["D"].astype(float).values + # Fit a simple mean-switching model with 2 regimes + with warnings.catch_warnings(): + warnings.simplefilter("ignore") + mod = MarkovRegression(y, k_regimes=2, trend='c', switching_variance=True) + res = mod.fit(disp=False) + p_t = res.smoothed_marginal_probabilities.values[:, -1] if hasattr(res.smoothed_marginal_probabilities, 'values') else res.smoothed_marginal_probabilities + p_reg1 = float(p_t[-1]) + regime = "shock" if p_reg1 > 0.5 else "normal" + return {"regime": regime, "p_regime": {"regime1": p_reg1, "regime0": 1 - p_reg1}} + except Exception as e: + return {"regime": "error", "error": str(e)} + + +def bsts_nowcast(panel: pd.DataFrame) -> Dict[str, Any]: + """Dynamic factor nowcast for demand using statsmodels DynamicFactor (FAVAR-like).""" + try: + from statsmodels.tsa.statespace.dynamic_factor import DynamicFactor + cols = [c for c in ["D", "R", "I", "B", "O"] if c in panel.columns] + if len(cols) < 2 or len(panel) < 20: + mu = float(panel.get("D", pd.Series([100.0])).iloc[-1]) + return {"D_nowcast": mu, "uncertainty": 0.2, "cols": cols} + endog = panel[cols].astype(float) + with warnings.catch_warnings(): + warnings.simplefilter("ignore") + mod = DynamicFactor(endog, k_factors=1, factor_order=1) + res = mod.fit(disp=False) + # One-step ahead forecast for demand + fc = res.get_forecast(steps=1) + d_idx = cols.index("D") + d_mean = float(fc.predicted_mean.iloc[0, d_idx]) + d_var = float(fc.var_pred_mean.iloc[0, d_idx]) if hasattr(fc, 'var_pred_mean') else 0.2 + return {"D_nowcast": d_mean, "uncertainty": max(0.05, min(0.5, d_var ** 0.5)), "cols": cols} + except Exception as e: + mu = float(panel.get("D", pd.Series([100.0])).iloc[-1]) + return {"D_nowcast": mu, "uncertainty": 0.3, "error": str(e)} + + +def svar_identification(panel: pd.DataFrame) -> Dict[str, Any]: + """Estimate a small VAR and report impulse responses as proxy for shocks.""" + try: + from statsmodels.tsa.api import VAR + cols = [c for c in ["D", "R", "I", "B", "p"] if c in panel.columns] + if len(cols) < 3 or len(panel) < 30: + return {"irf": {}, "cols": cols} + endog = panel[cols].astype(float) + model = VAR(endog) + res = model.fit(maxlags=2, ic='aic') + irf = res.irf(5) + irf_dict = {f"{src}->{dst}": float(irf.irfs[1, cols.index(src), cols.index(dst)]) for src in cols for dst in cols} + return {"irf_h1": irf_dict, "cols": cols} + except Exception as e: + return {"error": str(e)} + + +# ===== Robust Optimization & Control (stubs) ===== +def dro_mpc_plan(panel: pd.DataFrame) -> Dict[str, Any]: + 
"""Single-variable DRO-style MPC for z_alpha using cvxpy. + + Minimize holding/backorder proxy under Wasserstein penalty. + """ + try: + import cvxpy as cp + from scipy.stats import norm + D = float(panel.get("D", pd.Series([100.0])).iloc[-1]) + muL = float(panel.get("L", pd.Series([2.0])).iloc[-1]) + sigL = max(0.2, 0.5 * muL) + z = cp.Variable() + # Proxy cost: holding ~ z, backlog ~ max(0, Phi^{-1}(0.95)-z) + z_req = norm.ppf(0.95) + backlog_short = cp.pos(z_req - z) + cost = 0.1 * z + 0.5 * backlog_short + # DRO penalty + rho = 0.1 + objective = cp.Minimize(cost + rho * cp.abs(z)) + constraints = [z >= 0.5, z <= 3.0] + prob = cp.Problem(objective, constraints) + prob.solve(solver=cp.ECOS, warm_start=True) + return {"type": "DRO-MPC", "z_alpha": float(z.value), "status": prob.status, "rho": rho} + except Exception as e: + return {"type": "DRO-MPC", "error": str(e)} + + +def constrained_mpc_policy( + last: Dict[str, float], + limits: Dict[str, float], + lane_cap: float, + weights: Dict[str, float], + impact: Optional[Dict[str, Any]] = None, +) -> Dict[str, Any]: + # Optimize z, r, e, ds under caps and rate limits to minimize weighted proxy cost + try: + import cvxpy as cp + z = cp.Variable() + r = cp.Variable() + e = cp.Variable() + ds = cp.Variable() + # Objective: weights over expected deltas if available, else regularization + if impact and "expected" in impact: + exp = impact["expected"] + svc = exp.get("service", 0.0) + cst = exp.get("cost_proxy", 0.0) + bwe = exp.get("bullwhip", 0.0) + obj = weights.get("cost", 1.0) * cst + weights.get("service", 1.0) * (-svc) + weights.get("bullwhip", 1.0) * bwe + else: + obj = 0.1 * (z - last.get("z_alpha_new", 1.28)) ** 2 + 0.05 * (r - last.get("reroute_share", 0.0)) ** 2 + 0.05 * (e - last.get("expedite_share", 0.0)) ** 2 + 0.05 * (ds - last.get("dual_source_share", 0.0)) ** 2 + constraints = [ + z >= 0.5, z <= 3.0, + r >= 0.0, e >= 0.0, ds >= 0.0, + r + e + ds <= lane_cap, + cp.abs(z - last.get("z_alpha_new", 1.28)) <= limits.get("z_alpha_new", 0.3), + cp.abs(r - last.get("reroute_share", 0.0)) <= limits.get("reroute_share", 0.15), + cp.abs(e - last.get("expedite_share", 0.0)) <= limits.get("expedite_share", 0.15), + cp.abs(ds - last.get("dual_source_share", 0.0)) <= limits.get("dual_source_share", 0.2), + ] + prob = cp.Problem(cp.Minimize(obj), constraints) + prob.solve(solver=cp.ECOS_BB, mi_max_iterations=1000) + return {"z_alpha_new": float(z.value), "reroute_share": float(r.value), "expedite_share": float(e.value), "dual_source_share": float(ds.value), "status": prob.status} + except Exception as e: + return {"error": str(e)} + + +def cpsat_policy( + last: Dict[str, float], + limits: Dict[str, float], + lane_cap: float, +) -> Dict[str, Any]: + """Hard-feasibility projection using cvxpy (no OR-Tools). + + Minimizes squared distance to last controls subject to rate and capacity limits. 
+ """ + try: + import cvxpy as cp + z = cp.Variable() + r = cp.Variable() + e = cp.Variable() + ds = cp.Variable() + # Objective: keep close to last (stability) + obj = (z - last.get("z_alpha_new", 1.28)) ** 2 + (r - last.get("reroute_share", 0.0)) ** 2 + (e - last.get("expedite_share", 0.0)) ** 2 + (ds - last.get("dual_source_share", 0.0)) ** 2 + cons = [ + z >= 0.5, z <= 3.0, + r >= 0.0, e >= 0.0, ds >= 0.0, + r + e + ds <= lane_cap, + cp.abs(z - last.get("z_alpha_new", 1.28)) <= limits.get("z_alpha_new", 0.3), + cp.abs(r - last.get("reroute_share", 0.0)) <= limits.get("reroute_share", 0.15), + cp.abs(e - last.get("expedite_share", 0.0)) <= limits.get("expedite_share", 0.15), + cp.abs(ds - last.get("dual_source_share", 0.0)) <= limits.get("dual_source_share", 0.2), + ] + prob = cp.Problem(cp.Minimize(obj), cons) + prob.solve(solver=cp.ECOS) + if z.value is None: + return {"error": "infeasible"} + return { + "z_alpha_new": float(z.value), + "reroute_share": float(r.value), + "expedite_share": float(e.value), + "dual_source_share": float(ds.value), + "status": prob.status, + } + except Exception as e: + return {"error": str(e)} + + +def chance_constrained_mpc(panel: pd.DataFrame) -> Dict[str, Any]: + """Closed-form chance constraint for service level: z >= Phi^{-1}(beta).""" + try: + from scipy.stats import norm + beta = 0.95 + z_req = float(norm.ppf(beta)) + return {"type": "Chance-MPC", "beta": beta, "z_min": z_req, "feasible": True} + except Exception as e: + return {"type": "Chance-MPC", "error": str(e)} + + +def h_infinity_controller(panel: pd.DataFrame) -> Dict[str, Any]: + """Approximate robust controller via discrete LQR (DARE) for inventory linearization.""" + try: + from scipy.linalg import solve_discrete_are + # Simple 1D: x_{t+1} = x_t - u_t + w_t + A = np.array([[1.0]]) + B = np.array([[1.0]]) + Q = np.array([[1.0]]) + R = np.array([[0.5]]) + P = solve_discrete_are(A, B, Q, R) + K = np.linalg.inv(B.T @ P @ B + R) @ (B.T @ P @ A) + gamma = float(np.sqrt(np.max(np.linalg.eigvals(P)))) + return {"type": "LQR", "K": float(K), "gamma_proxy": gamma} + except Exception as e: + return {"type": "LQR", "error": str(e)} + + +def sddp_policy_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"type": "SDDP", "stages": 3, "status": "ok"} + + +# ===== Multi-Echelon Inventory (stubs) ===== +def clark_scarf_baseline(panel: pd.DataFrame) -> Dict[str, Any]: + """Compute a simple echelon base-stock as I + mean(P) across time (proxy).""" + try: + if set(["I"]).issubset(panel.columns): + echelon = float(panel["I"].mean()) + float(panel.get("P", pd.Series([0.0])).mean()) + return {"echelon_base_stock": echelon} + return {"echelon_base_stock": 0.0} + except Exception as e: + return {"error": str(e)} + + +def risk_averse_newsvendor_stub(panel: pd.DataFrame) -> Dict[str, Any]: + """Entropic-risk newsvendor: grid search Q to minimize 1/theta log E[exp(theta*cost)].""" + try: + D = panel.get("D", pd.Series([100.0])).astype(float).values + if len(D) < 10: + return {"Q_star": float(np.percentile(D, 95)), "risk_measure": "entropic", "theta": 0.5} + theta = 0.5 + c_h, c_b = 0.1, 0.5 + Q_grid = np.linspace(np.percentile(D, 10), np.percentile(D, 99), 30) + best, bestQ = 1e9, Q_grid[0] + for Q in Q_grid: + cost = c_h * np.maximum(Q - D, 0.0) + c_b * np.maximum(D - Q, 0.0) + risk = (1.0 / theta) * np.log(np.mean(np.exp(theta * cost))) + if risk < best: + best, bestQ = risk, Q + return {"Q_star": float(bestQ), "risk_measure": "entropic", "theta": theta, "objective": float(best)} + except Exception as e: + 
return {"error": str(e)} + + +# ===== Digital twin gating scenarios ===== +def run_gating_scenarios(agent: "SupplyShockCRCAgent") -> Dict[str, Any]: + grid = [ + {"name": "baseline", "z": agent.policy.z_alpha, "r": 0.0, "e": 0.0}, + {"name": "z1.6_r0.20_e0.10", "z": 1.6, "r": 0.20, "e": 0.10}, + {"name": "z1.8_r0.15_e0.15", "z": 1.8, "r": 0.15, "e": 0.15}, + {"name": "z2.0_e0.20", "z": 2.0, "r": 0.00, "e": 0.20}, + ] + results: Dict[str, Any] = {} + base = agent.simulate() + base_kpi = agent.summarize(base) + for g in grid: + impact = agent._quantified_impact(g["z"], g["r"], g["e"], trials=50) + exp = impact.get("expected", {}) + svc_delta = float(exp.get("service", 0.0)) + cost_delta = float(exp.get("cost_proxy", 0.0)) + marginal_cost_per_pp = float(cost_delta / max(1e-6, svc_delta * 100.0)) if svc_delta > 0 else float("inf") + results[g["name"]] = { + "expected": exp, + "ci80": impact.get("ci80", {}), + "marginal_cost_per_1pp_service": marginal_cost_per_pp, + } + return {"baseline": base_kpi, "scenarios": results} + + +# ===== Network & Systemic Risk (stubs) ===== +def percolation_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"gc_threshold": 0.3, "expected_shortfall": 0.12} + + +def eisenberg_noe_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"clearing_vector_norm": 0.97} + + +def k_cut_sets_stub() -> Dict[str, Any]: + return {"min_k_cut": 2, "critical_arcs": ["lane_CN-EU", "lane_US-EU"]} + + +# ===== Pricing & Demand (stubs) ===== +def logit_share_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"alpha_price": 0.8, "elasticity": -1.2} + + +def dynamic_pricing_dp_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"policy": "approxDP", "discount": 0.98} + + +def ramsey_pricing_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"lambda": 0.2, "implied_markups": {"A": 0.1, "B": 0.05}} + + +# ===== Policy Evaluation (stubs) ===== +def synthetic_control_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"effect": -0.03, "weight_entropy": 0.9} + + +def did_iv_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"beta": -0.08, "se_robust": 0.04} + + +# ===== Security & Integrity (stubs) ===== +def secure_state_l1_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"attacks_detected": 0} + + +def spectral_shift_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return {"eig_drift": 0.05} + + +# ===== Investment under Uncertainty (stubs) ===== +def real_options_stub() -> Dict[str, Any]: + return {"LSM_value": 1.2} + + +def supplier_portfolio_stub() -> Dict[str, Any]: + return {"selected_suppliers": ["S1", "S3"], "service_prob": 0.97} + + +# ===== Further Advanced (realistic approximations or stubs) ===== +def transport_modes_sim_stub() -> Dict[str, Any]: + return {"modes": ["SEA", "AIR", "RAIL"], "schedules": {"SEA": 7, "AIR": 2, "RAIL": 5}} + + +def online_em_ms(panel: pd.DataFrame) -> Dict[str, Any]: + # Lightweight online update: adapt mean/var of L based on EWMA + if "L" not in panel.columns: + return {"mu": 2.0, "sigma": 1.0} + L = panel["L"].astype(float).values + lam = 0.2 + mu = L[0] + var = 1.0 + for x in L[1:]: + mu = lam * x + (1 - lam) * mu + var = lam * (x - mu) ** 2 + (1 - lam) * var + return {"mu": float(mu), "sigma": float(max(0.2, var ** 0.5))} + + +def hierarchical_bsts_stub(panel: pd.DataFrame) -> Dict[str, Any]: + # Placeholder summary for hierarchical pooling + groups = {"facilities": int(panel.shape[1] > 0)} + return {"pooled": True, "groups": groups} + + +def multi_stage_mpc_stub(panel: pd.DataFrame) -> Dict[str, Any]: + return 
{"horizon": 3, "reroute_share": 0.1, "expedite_share": 0.05} + + +def iot_fusion_stub() -> Dict[str, Any]: + return {"adjust_phi": -0.05, "adjust_L": +0.3} + + +def nested_logit_stub() -> Dict[str, Any]: + try: + from statsmodels.discrete.discrete_model import MNLogit # noqa: F401 + return {"available": True, "note": "Use MNLogit with inventory and price features"} + except Exception: + return {"available": False} + + +def kcut_hardening_stub() -> Dict[str, Any]: + return {"harden": ["lane_CN-EU"], "budget": 1} + + +def linucb_policy_stub(panel: pd.DataFrame) -> Dict[str, Any]: + # Simple LinUCB placeholders for reroute/expedite arms + alpha = 0.5 + arms = ["keep", "reroute", "expedite"] + scores = {a: 0.5 + alpha * 0.1 for a in arms} + choice = max(scores, key=scores.get) + return {"choice": choice, "scores": scores} + + +def l1_observer_stub(panel: pd.DataFrame) -> Dict[str, Any]: + try: + import cvxpy as cp # noqa: F401 + return {"feasible": True} + except Exception: + return {"feasible": False} + + +def fan_charts_stub(panel: pd.DataFrame) -> Dict[str, Any]: + if "D" not in panel.columns: + return {"quantiles": {}} + y = panel["D"].astype(float).values + q = { + "p10": float(np.percentile(y, 10)), + "p50": float(np.percentile(y, 50)), + "p90": float(np.percentile(y, 90)), + } + return {"quantiles": q} + + +async def main() -> None: + skus = [SKUKey("SKU1", "F1"), SKUKey("SKU2", "F1"), SKUKey("SKU3", "F2")] + agent = SupplyShockCRCAgent(skus=skus, T=40) + + # Baseline simulate + df = agent.simulate() + kpis = agent.summarize(df) + strengths = agent.causal_edges(df) + print("Baseline KPIs:", kpis) + print("Causal strengths:", strengths) + + # Example interventions + scenario_port = {"disruption_route": {"F1": 1}} + scenario_outage = {"outage_facility": {"F2": 1}} + cmp_port = agent.intervene_and_compare(scenario_port) + cmp_outage = agent.intervene_and_compare(scenario_outage) + print("Port disruption delta:", cmp_port["delta"]) + print("Facility outage delta:", cmp_outage["delta"]) + + # Full control cycle with AI narrative and upgraded CR-CA analysis + result = agent.control_cycle() + print("-" * 80) + print("AI Narrative Analysis:\n", result.get("ai_analysis")) + print("-" * 80) + print("Causal Summary:\n", result.get("causal_summary")) + + # Display upgraded analysis results + advanced = result.get("advanced_causal", {}) + if advanced and not advanced.get("error"): + print("\n" + "=" * 80) + print("UPGRADED CR-CA ANALYSIS RESULTS") + print("=" * 80) + + if advanced.get("sensitivity_analysis"): + sens = advanced["sensitivity_analysis"] + print("\n--- Sensitivity Analysis ---") + if sens.get("service_drivers"): + svc = sens["service_drivers"] + print(f"Service (backlog) drivers:") + print(f" Most influential: {svc.get('most_influential_variable', 'N/A')} (sensitivity: {svc.get('most_influential_sensitivity', 0.0):.4f})") + if sens.get("cost_drivers"): + cost = sens["cost_drivers"] + print(f"Cost (price) drivers:") + print(f" Most influential: {cost.get('most_influential_variable', 'N/A')} (sensitivity: {cost.get('most_influential_sensitivity', 0.0):.4f})") + + if advanced.get("granger_causality"): + gc = advanced["granger_causality"] + print("\n--- Granger Causality Tests ---") + print(f"D → O: {gc.get('demand_granger_causes_orders', False)} (F={gc.get('d_o_f_stat', 0.0):.2f})") + print(f"B → p: {gc.get('backlog_granger_causes_price', False)} (F={gc.get('b_p_f_stat', 0.0):.2f})") + + if advanced.get("information_theory") and advanced["information_theory"].get("entropies"): + it = 
advanced["information_theory"] + print("\n--- Information Theory ---") + print("Variable entropies:") + for var, entropy in list(it["entropies"].items())[:5]: + print(f" H({var}) = {entropy:.3f} bits") + if it.get("mutual_information"): + print("Top mutual information:") + mi_items = sorted(it["mutual_information"].items(), key=lambda x: x[1], reverse=True)[:3] + for pair, mi_val in mi_items: + print(f" I({pair}) = {mi_val:.3f} bits") + + if advanced.get("shapley_attribution"): + shap = advanced["shapley_attribution"] + if shap.get("backlog_drivers") and shap["backlog_drivers"].get("shapley_values"): + print("\n--- Shapley Value Attribution (Backlog Drivers) ---") + shap_b = shap["backlog_drivers"]["shapley_values"] + for var, value in sorted(shap_b.items(), key=lambda x: abs(x[1]), reverse=True)[:5]: + print(f" {var}: {value:+.4f}") + + if advanced.get("root_causes") and advanced["root_causes"].get("service_issues"): + rc = advanced["root_causes"]["service_issues"] + if rc.get("ultimate_root_causes"): + print("\n--- Deep Root Cause Analysis (Service Issues) ---") + print("Ultimate root causes of backlog:") + for root in rc["ultimate_root_causes"][:5]: + print(f" - {root.get('root_cause', 'N/A')} " + f"(path strength: {root.get('path_strength', 0.0):.3f}, depth: {root.get('depth', 0)})") + + if advanced.get("optimal_intervention") and advanced["optimal_intervention"].get("optimal_sequence"): + opt = advanced["optimal_intervention"] + print("\n--- Optimal Intervention Sequence (Bellman) ---") + print(f"Optimal {len(opt['optimal_sequence'])}-step sequence to minimize backlog:") + for i, step in enumerate(opt["optimal_sequence"][:3], 1): + print(f" Step {i}: {step}") + print(f"Expected total value: {opt.get('total_value', 0.0):.2f}") + + if advanced.get("alternate_realities") and advanced["alternate_realities"].get("best_reality"): + ar = advanced["alternate_realities"] + best = ar["best_reality"] + print("\n--- Alternate Realities Exploration ---") + print(f"Best alternate reality (minimize backlog):") + print(f" Interventions: {best.get('interventions', {})}") + print(f" Expected backlog: {best.get('target_value', 0.0):.2f}") + print(f" Improvement: {ar.get('improvement_potential', 0.0):+.2f}") + + if advanced.get("chain_reaction"): + cr = advanced["chain_reaction"] + print("\n--- Cascading Chain Reaction Analysis ---") + summary = cr.get("summary", {}) + print(f"Total paths found: {summary.get('total_paths_found', 0)}") + print(f"Feedback loops: {summary.get('feedback_loops_detected', 0)}") + if cr.get("final_predictions"): + print(f"Final predictions: {dict(list(cr['final_predictions'].items())[:5])}") + + if advanced.get("cross_validation"): + cv = advanced["cross_validation"] + print("\n--- Cross-Validation for Edge Reliability ---") + for edge, cv_data in list(cv.items())[:5]: + print(f" {edge}: CV error={cv_data.get('mean_cv_error', 0.0):.4f} ± {cv_data.get('standard_error', 0.0):.4f}") + + print("\n" + "=" * 80) + + +if __name__ == "__main__": + import asyncio + + logger.remove() + logger.add("crca_supply_shock.log", rotation="50 MB", retention="7 days", level="INFO") + try: + asyncio.run(main()) + except KeyboardInterrupt: + print("Stopped.") + + From 53ff1336772423819f6780fe7aa1b47344b1c8c3 Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 4 Nov 2025 02:45:03 +0200 Subject: [PATCH 04/12] Added CR-CA agent docs --- docs/swarms/agents/cr_ca_agent.md | 1722 +++++++++++++++++++++++++++++ 1 file changed, 1722 insertions(+) create mode 100644 
docs/swarms/agents/cr_ca_agent.md

diff --git a/docs/swarms/agents/cr_ca_agent.md b/docs/swarms/agents/cr_ca_agent.md
new file mode 100644
index 00000000..c481bb0f
--- /dev/null
+++ b/docs/swarms/agents/cr_ca_agent.md
@@ -0,0 +1,1722 @@
+# CR-CA Agent
+
+A causal reasoning and counterfactual analysis agent that performs causal inference to understand cause-and-effect relationships, predict the outcomes of interventions, and explore alternative scenarios. By modeling causes rather than correlations, the CR-CA Agent supports proactive issue resolution: problems can be traced back to their root causes and candidate interventions evaluated before they are applied.
+
+## Overview
+
+The CR-CA (Causal Reasoning with Counterfactual Analysis) Agent implements advanced causal inference techniques based on Pearl's Structural Causal Model (SCM) framework. Unlike correlation-based approaches, the CR-CA Agent models explicit causal relationships, enabling principled predictions about the effects of interventions and counterfactual reasoning about "what-if" scenarios.
+
+**Key Capabilities:**
+
+| Capability | Description |
+|------------|-------------|
+| **Causal Graph Construction** | Builds and maintains directed acyclic graphs (DAGs) representing causal relationships |
+| **Structural Causal Modeling** | Implements linear and non-linear structural equation models with standardized coefficients |
+| **Counterfactual Reasoning** | Performs Pearl's three-step abduction-action-prediction for counterfactual analysis |
+| **Deep Root Cause Analysis** | Traces causal chains backward to identify ultimate root causes of problems |
+| **Multi-Layer What-If Analysis** | Nests causal reasoning across multiple layers to predict cascading effects |
+| **Optimal Intervention Planning** | Uses gradient-based optimization, dynamic programming, and multi-objective methods to find optimal interventions |
+| **Risk-Aware Decision Making** | Quantifies uncertainty using CVaR, bootstrap confidence intervals, and Bayesian inference |
+| **Temporal Causal Analysis** | Models distributed lag effects and vector autoregression for time-dependent systems |
+
+## Architecture
+
+```mermaid
+graph TD
+    A[Input State/Data] --> B[CR-CA Agent]
+    B --> C{Causal Graph}
+    C --> D[Structure Learning]
+    C --> E[Edge Strength Estimation]
+    C --> F[Standardization]
+
+    D --> G[PC Algorithm]
+    E --> H[Weighted OLS]
+    F --> I[Z-Score Transform]
+
+    G --> J[SCM Model]
+    H --> J
+    I --> J
+
+    J --> K[Prediction Layer]
+    K --> L[Do-Operator]
+    K --> M[Counterfactual]
+    K --> N[Intervention]
+
+    L --> O[Outcome Prediction]
+    M --> O
+    N --> O
+
+    O --> P[Optimization Layer]
+    P --> Q[Gradient-Based]
+    P --> R[Bellman DP]
+    P --> S[Multi-Objective]
+
+    Q --> T[Optimal Intervention]
+    R --> T
+    S --> T
+
+    T --> U[Risk Assessment]
+    U --> V[CVaR Analysis]
+    U --> W[Confidence Intervals]
+
+    V --> X[Final Recommendation]
+    W --> X
+
+    style A fill:#e1f5fe
+    style B fill:#fff3e0
+    style J fill:#f3e5f5
+    style T fill:#e8f5e8
+    style X fill:#c8e6c9
+```
+
+## Getting Started
+
+### Installation
+
+The CR-CA Agent is included in the Swarms framework. Install Swarms:
+
+```bash
+pip install swarms
+```
+
+### Basic Usage Workflow
+
+The typical workflow for using the CR-CA Agent involves:
+
+1. **Initialize the agent** with a causal graph structure
+2. **Fit the model** from historical data
+3. **Make predictions** about intervention effects
+4. 
**Optimize interventions** to achieve desired outcomes + +### Step-by-Step Tutorial + +#### Step 1: Import and Initialize + +```python + +from swarms.agents import CRCAAgent +import pandas as pd +import numpy as np + +# Initialize the CR-CA agent +agent = CRCAAgent( + name="my-causal-agent", + description="Causal analysis for business decisions", + model_name="gpt-4o-mini" # For narrative generation +) +``` + +#### Step 2: Define Your Causal Graph + +Define the causal relationships between variables. You can either: + +**Option A: Build graph manually from domain knowledge** + +```python +# Add variables +variables = ["price", "demand", "inventory", "cost", "profit"] + +# Add causal relationships +agent.causal_graph.add_nodes_from(variables) +agent.causal_graph.add_edges_from([ + ("price", "demand"), # Price affects demand + ("demand", "inventory"), # Demand affects inventory + ("cost", "profit"), # Cost affects profit + ("demand", "profit"), # Demand affects profit + ("price", "cost") # Price affects cost (indirectly) +]) + +# Add edge sign constraints (optional but recommended) +# +1 means positive effect, -1 means negative effect +agent.edge_sign_constraints = { + ("price", "demand"): -1, # Higher price → lower demand + ("demand", "inventory"): -1, # Higher demand → lower inventory + ("cost", "profit"): -1, # Higher cost → lower profit + ("demand", "profit"): +1 # Higher demand → higher profit +} +``` + +**Option B: Discover structure from data** + +```python +# If you have data but aren't sure about causal structure +historical_data = pd.DataFrame({ + "price": [...], + "demand": [...], + "inventory": [...], + "cost": [...], + "profit": [...] +}) + +# Discover causal structure using PC algorithm +learned_graph = agent.causal_discovery_pc_algorithm( + df=historical_data, + variables=["price", "demand", "inventory", "cost", "profit"], + alpha=0.05 +) + +# Use the learned graph +agent.causal_graph = learned_graph["learned_dag"] +``` + +#### Step 3: Fit the Model from Data + +Load your historical data and fit the causal model: + +```python + +# Prepare your historical data +historical_data = pd.DataFrame({ + "price": [100, 105, 110, 108, 112, 115, 110, 105, 100, 95], + "demand": [1000, 950, 900, 920, 880, 850, 900, 950, 1000, 1050], + "inventory": [5000, 4500, 4000, 4200, 3800, 3500, 4000, 4500, 5000, 5500], + "cost": [80, 82, 85, 83, 87, 90, 85, 82, 80, 78], + "profit": [20000, 19950, 19900, 19920, 19880, 19850, 19900, 19950, 20000, 20050] +}) + +# Fit the model (learns edge strengths from data) +agent.fit_from_dataframe( + df=historical_data, + variables=["price", "demand", "inventory", "cost", "profit"], + window=10, # Use last 10 observations + decay_alpha=0.9, # Weight recent data more (90% weight) + ridge_lambda=0.01, # Small regularization + enforce_signs=True # Respect sign constraints +) + +# Check learned edge strengths +for u, v in agent.causal_graph.edges(): + strength = agent.causal_graph[u][v].get('strength', 0.0) + print(f"{u} → {v}: strength = {strength:.3f}") +``` + +#### Step 4: Make Predictions + +Predict outcomes given current state and interventions: + +```python +# Current state +current_state = { + "price": 100.0, + "demand": 1000.0, + "inventory": 5000.0, + "cost": 80.0, + "profit": 20000.0 +} + +# Scenario 1: What if we reduce price by 10%? 
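+# A do()-style intervention: price is actively set to 90 rather than merely
+# observed at 90 (see the do-operator discussion in the Mathematical
+# Foundation section).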
+intervention = {"price": 90.0}
+
+predicted = agent._predict_outcomes(current_state, intervention)
+print(f"Predicted demand: {predicted['demand']:.2f}")
+print(f"Predicted profit: {predicted['profit']:.2f}")
+
+# Scenario 2: What if we reduce price AND increase inventory?
+intervention = {"price": 90.0, "inventory": 6000.0}
+predicted = agent._predict_outcomes(current_state, intervention)
+```
+
+#### Step 5: Counterfactual Analysis
+
+Answer "what-if" questions using counterfactual reasoning:
+
+```python
+# What would have happened if price had been 90 instead of 100?
+factual_state = {"price": 100.0, "demand": 1000.0}
+counterfactual_intervention = {"price": 90.0}
+
+counterfactual_result = agent.counterfactual_abduction_action_prediction(
+    factual_state=factual_state,
+    interventions=counterfactual_intervention
+)
+
+print(f"Counterfactual demand: {counterfactual_result['demand']:.2f}")
+```
+
+#### Step 6: Find Optimal Interventions
+
+Use optimization to find the best intervention:
+
+```python
+# Find optimal price to maximize profit
+optimal = agent.gradient_based_intervention_optimization(
+    initial_state=current_state,
+    target="profit",  # What to maximize
+    intervention_vars=["price"],  # What we can control
+    constraints={"price": (80.0, 120.0)},  # Price bounds
+    method="L-BFGS-B"
+)
+
+print(f"Optimal price: {optimal['optimal_intervention']['price']:.2f}")
+print(f"Predicted profit: {optimal['optimal_target_value']:.2f}")
+```
+
+#### Step 7: Analyze Root Causes
+
+Find root causes of problems:
+
+```python
+# Why is profit low?
+root_causes = agent.deep_root_cause_analysis(
+    problem_variable="profit",
+    max_depth=10,
+    min_path_strength=0.05
+)
+
+print("Ultimate root causes:")
+for rc in root_causes["ultimate_root_causes"][:5]:
+    print(f"  - {rc['root_cause']}: path strength = {rc['path_strength']:.3f}")
+```
+
+#### Step 8: Analyze Cascading Effects
+
+Understand chain reactions from interventions:
+
+```python
+# Analyze cascading effects of a 10% price reduction.
+# Interventions are absolute values, so a 10% cut from 100 is 90.0.
+chain_reaction = agent.analyze_cascading_chain_reaction(
+    initial_intervention={"price": 90.0},
+    target_outcomes=["demand", "inventory", "profit"],
+    max_hops=5,
+    include_feedback_loops=True
+)
+
+print(f"Found {len(chain_reaction['causal_paths'])} causal paths")
+print(f"Detected {len(chain_reaction['feedback_loops'])} feedback loops")
+```
+
+### Complete Example: Supply Chain Optimization
+
+Here's a complete example for supply chain management:
+
+```python
+from swarms.agents import CRCAAgent
+import pandas as pd
+import numpy as np
+
+# Step 1: Initialize
+agent = CRCAAgent(name="supply-chain-optimizer")
+
+# Step 2: Build causal graph
+variables = ["lead_time", "supplier_capacity", "inventory",
+             "backlog", "price", "demand", "cost"]
+
+agent.causal_graph.add_nodes_from(variables)
+agent.causal_graph.add_edges_from([
+    ("supplier_capacity", "inventory"),
+    ("lead_time", "inventory"),
+    ("inventory", "backlog"),
+    ("backlog", "price"),
+    ("price", "demand"),
+    ("demand", "backlog"),
+    ("lead_time", "cost"),
+    ("inventory", "cost")
+])
+
+# Step 3: Load historical data
+historical_data = pd.DataFrame({
+    "lead_time": np.random.normal(10, 2, 100),
+    "supplier_capacity": np.random.normal(1000, 100, 100),
+    "inventory": np.random.normal(5000, 500, 100),
+    "backlog": np.random.normal(100, 20, 100),
+    "price": np.random.normal(100, 10, 100),
+    "demand": np.random.normal(1000, 100, 100),
+    "cost": np.random.normal(80, 8, 100)
+})
+
+# Step 4: Fit model
+agent.fit_from_dataframe(
+    df=historical_data,
+    variables=variables,
+    window=30,
+    decay_alpha=0.9
+)
+
+# Step 5: Current state
+current_state = {
+    "lead_time": 12.0,
+    "supplier_capacity": 950.0,
+    "inventory": 4500.0,
+    "backlog": 150.0,
+    "price": 105.0,
+    "demand": 900.0,
+    "cost": 85.0
+}
+
+# Step 6: Find optimal safety stock (inventory level)
+optimal_inventory = agent.gradient_based_intervention_optimization(
+    initial_state=current_state,
+    target="cost",  # Minimize cost
+    intervention_vars=["inventory"],
+    constraints={"inventory": (3000.0, 7000.0)}
+)
+
+print(f"Optimal inventory level: {optimal_inventory['optimal_intervention']['inventory']:.2f}")
+print(f"Predicted cost: {optimal_inventory['optimal_target_value']:.2f}")
+
+# Step 7: Analyze what-if scenarios
+scenarios = [
+    {"lead_time": 15.0},  # What if lead time increases?
+    {"supplier_capacity": 800.0},  # What if supplier capacity decreases?
+]
+
+for scenario in scenarios:
+    predicted = agent._predict_outcomes(current_state, scenario)
+    print(f"\nScenario {scenario}:")
+    print(f"  Predicted backlog: {predicted['backlog']:.2f}")
+    print(f"  Predicted cost: {predicted['cost']:.2f}")
+
+# Step 8: Root cause analysis for high backlog
+backlog_roots = agent.deep_root_cause_analysis(
+    problem_variable="backlog",
+    max_depth=10,
+    min_path_strength=0.05
+)
+
+print("\nRoot causes of high backlog:")
+for rc in backlog_roots["ultimate_root_causes"][:3]:
+    print(f"  - {rc['root_cause']}: {rc['path_string']}")
+```
+
+### Creating Custom Causal Models
+
+#### For Financial Analysis
+
+```python
+# Cryptocurrency price analysis
+agent = CRCAAgent(name="crypto-analyzer")
+
+agent.causal_graph.add_edges_from([
+    ("volume", "price"),
+    ("volatility", "price"),
+    ("rsi", "price"),
+    ("market_sentiment", "price"),
+    ("btc_correlation", "price")
+])
+
+# Fit from historical price data
+agent.fit_from_dataframe(
+    df=crypto_data,
+    variables=["volume", "volatility", "rsi", "market_sentiment",
+               "btc_correlation", "price"],
+    window=30
+)
+
+# Predict price impact of volume increase
+prediction = agent._predict_outcomes(
+    factual_state={"volume": 1000.0, "price": 3000.0},
+    interventions={"volume": 1500.0}
+)
+```
+
+#### For Policy Analysis
+
+```python
+# Government policy simulation
+agent = CRCAAgent(name="policy-simulator")
+
+agent.causal_graph.add_edges_from([
+    ("tax_rate", "disposable_income"),
+    ("disposable_income", "consumption"),
+    ("consumption", "gdp"),
+    ("cash_transfer", "disposable_income"),
+    ("education_spending", "human_capital"),
+    ("human_capital", "productivity"),
+    # inequality must be in the graph before it can be used as an
+    # optimization objective below
+    ("tax_rate", "inequality"),
+    ("cash_transfer", "inequality")
+])
+
+# Fit from economic data
+agent.fit_from_dataframe(
+    df=economic_data,
+    variables=["tax_rate", "cash_transfer", "disposable_income",
+               "consumption", "gdp", "education_spending",
+               "human_capital", "productivity", "inequality"],
+    window=60
+)
+
+# Multi-objective optimization: maximize GDP and minimize inequality
+pareto = agent.evolutionary_multi_objective_optimization(
+    initial_state={"tax_rate": 0.3, "cash_transfer": 0.0},
+    objectives={"gdp": 0.7, "inequality": -0.3},
+    constraints={
+        "tax_rate": (0.0, 0.5),
+        "cash_transfer": (0.0, 1000.0)
+    },
+    intervention_vars=["tax_rate", "cash_transfer"]
+)
+```
+
+### Next Steps
+
+After creating your causal model:
+
+1. **Validate the model** using cross-validation:
+   ```python
+   cv_result = agent.cross_validate_edge_strength(
+       df=historical_data,
+       parent="price",
+       child="demand",
+       n_folds=5
+   )
+   ```
+
+2. 
**Quantify uncertainty** using bootstrap:
   ```python
   uncertainty = agent.quantify_uncertainty(
       df=historical_data,
       variables=variables,
       windows=200,
       alpha=0.95
   )
   ```

3. **Use explainability** to understand predictions:
   ```python
   attribution = agent.shapley_value_attribution(
       baseline_state=current_state,
       target_state=optimal_state,
       target="profit"
   )
   ```

## Mathematical Foundation

### Structural Causal Models (SCM)

The CR-CA Agent implements Pearl's Structural Causal Model framework, where each variable is defined by a structural equation:

\[
y = f(\text{parents}(y), \varepsilon_y)
\]

For linear SCMs:

\[
y = \sum_{i} \beta_i \cdot x_i + \varepsilon
\]

where \(\beta_i\) are structural coefficients representing causal effects, and \(\varepsilon\) is an error term representing unobserved confounders.

**Standardization:**

To ensure numerical stability and scale invariance, all variables are standardized to z-scores:

\[
z = \frac{x - \mu}{\sigma}
\]

where \(\mu\) is the mean and \(\sigma\) is the standard deviation. This transformation lets the agent work with variables on different scales while preserving causal relationships.

**Prediction in Z-Space:**

\[
z_y = \sum_{i} \beta_i \cdot z_{x_i} + z_\varepsilon
\]

After prediction, values are de-standardized:

\[
x = z \cdot \sigma + \mu
\]

### Do-Operator

The do-operator, \(do(X = x)\), represents an intervention that sets variable \(X\) to value \(x\), breaking its dependence on its parents. This is fundamentally different from conditioning on \(X = x\), as it represents active manipulation rather than passive observation.

**Mathematical Definition:**

In general,

\[
P(Y \mid do(X = x)) \neq P(Y \mid X = x)
\]

and the two coincide only when there is no confounding between \(X\) and \(Y\). The do-operator enables answering interventional questions: "What would happen if we set \(X\) to \(x\)?"

### Counterfactual Reasoning

Pearl's three-step counterfactual reasoning process:

**1. Abduction:** Infer latent noise terms from factual observations:

\[
\varepsilon = y_{\text{factual}} - \sum_i \beta_i \cdot x_{\text{factual},i}
\]

**2. Action:** Apply the do-operator to set intervention values:

\[
do(X = x^*)
\]

**3. Prediction:** Predict the counterfactual outcome using the new values but the old noise:

\[
y_{\text{cf}} = \sum_i \beta_i \cdot x_{\text{cf},i} + \varepsilon
\]

This answers: "What would have happened if \(X\) had been \(x^*\) instead of \(x_{\text{factual}}\)?"
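To make the three steps concrete, here is a minimal numeric sketch for a single linear structural equation in standardized units; `beta` and the observed values are illustrative assumptions, not output of the library:

```python
# Toy linear SCM in z-score units: demand = beta * price + eps
# (beta and the observations are made-up illustrative numbers).
beta = -0.8

price_f, demand_f = 1.0, -0.5  # factual observation

# 1. Abduction: recover the noise that explains the factual outcome
eps = demand_f - beta * price_f  # -0.5 - (-0.8 * 1.0) = 0.3

# 2. Action: do(price = 0.0) overrides the observed price
price_cf = 0.0

# 3. Prediction: same noise, new parent value
demand_cf = beta * price_cf + eps
print(f"Counterfactual demand (z-score): {demand_cf:.2f}")  # 0.30
```

`counterfactual_abduction_action_prediction()` carries out the same three steps per node across the whole standardized graph.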
+ +## Class Reference + +### Constructor + +```python +from swarms.agents import CRCAAgent + +agent = CRCAAgent( + name: str = "cr-ca-agent", + description: str = "Causal Reasoning with Counterfactual Analysis agent", + model_name: str = "openai/gpt-4o", + max_loops: int = 3, + causal_graph: Optional[nx.DiGraph] = None, + variables: Optional[List[str]] = None, + causal_edges: Optional[List[Tuple[str, str]]] = None, +) +``` + +#### Parameters + +| Parameter | Type | Default | Description | +|-----------|------|---------|-------------| +| `name` | `str` | `"cr-ca-agent"` | Unique identifier for the agent instance | +| `description` | `str` | `"Causal Reasoning..."` | Human-readable description of agent capabilities | +| `model_name` | `str` | `"openai/gpt-4o"` | LLM model for narrative generation and reasoning | +| `max_loops` | `int` | `3` | Maximum iterations for causal reasoning loops | +| `causal_graph` | `Optional[nx.DiGraph]` | `None` | Pre-built NetworkX directed graph (DAG) | +| `variables` | `Optional[List[str]]` | `None` | List of variable names to initialize graph | +| `causal_edges` | `Optional[List[Tuple[str, str]]]` | `None` | List of (source, target) tuples for causal edges | + +### Core Methods + +#### fit_from_dataframe() + +Fit edge strengths and standardization statistics from historical data using weighted least squares regression. + +```python +fit_from_dataframe( + df: pd.DataFrame, + variables: List[str], + window: int = 30, + decay_alpha: float = 0.9, + ridge_lambda: float = 0.0, + enforce_signs: bool = True +) -> None +``` + +**Mathematical Formulation:** + +For each child variable \(y\) with parents \(\{x_1, x_2, \ldots, x_k\}\), the agent estimates coefficients \(\beta_i\) using weighted least squares: + +\[ +\beta = (X' W X + \lambda I)^{-1} X' W y +\] + +where: +- \(X\) is the standardized design matrix of parents +- \(W\) is a diagonal matrix of exponential decay weights: \(w_i = \alpha^{n-1-i}\) (newer data weighted more) +- \(\lambda\) is ridge regularization parameter +- \(y\) is the standardized target variable + +**Exponential Decay Weights:** + +\[ +w_i = \frac{\alpha^{n-1-i}}{\sum_{j=0}^{n-1} \alpha^{n-1-j}} +\] + +This emphasizes recent observations, making the model adaptive to regime changes. + +**Example:** + +```python +import pandas as pd +from swarms.agents import CRCAAgent + +# Initialize agent +agent = CRCAAgent() + +# Build causal graph +agent.causal_graph.add_edges_from([ + ("price", "demand"), + ("demand", "orders"), + ("orders", "inventory") +]) + +# Fit from historical data +df = pd.DataFrame({ + "price": [100, 105, 110, 108, 112], + "demand": [1000, 950, 900, 920, 880], + "orders": [1000, 950, 900, 920, 880], + "inventory": [5000, 4500, 4000, 4200, 3800] +}) + +agent.fit_from_dataframe( + df=df, + variables=["price", "demand", "orders", "inventory"], + window=5, + decay_alpha=0.9 +) +``` + +#### _predict_outcomes() + +Predict outcomes given interventions using standardized linear propagation through the causal graph. + +```python +_predict_outcomes( + factual_state: Dict[str, float], + interventions: Dict[str, float], + use_cache: bool = True +) -> Dict[str, float] +``` + +**Mathematical Process:** + +1. **Standardize inputs:** Convert all variables to z-scores +2. **Topological propagation:** For each node in topological order: + - If intervened: set \(z_{\text{node}} = z_{\text{intervention}}\) (do-operator) + - Otherwise: compute \(z_{\text{node}} = \sum_i \beta_i \cdot z_{\text{parent}_i}\) +3. 
**De-standardize outputs:** Convert z-scores back to raw values + +**Example:** + +```python +# Current state +factual_state = { + "price": 100.0, + "demand": 1000.0, + "orders": 1000.0 +} + +# Intervention: reduce price by 10% +interventions = {"price": 90.0} + +# Predict outcomes +predicted = agent._predict_outcomes(factual_state, interventions) +# Result: {"price": 90.0, "demand": 1100.0, "orders": 1100.0, ...} +``` + +#### counterfactual_abduction_action_prediction() + +Perform Pearl's three-step counterfactual reasoning for "what-if" analysis. + +```python +counterfactual_abduction_action_prediction( + factual_state: Dict[str, float], + interventions: Dict[str, float] +) -> Dict[str, float] +``` + +**Example:** + +```python +# What if we had set price to 90 instead of 100? +factual = {"price": 100.0, "demand": 1000.0} +counterfactual = {"price": 90.0} + +result = agent.counterfactual_abduction_action_prediction( + factual_state=factual, + interventions=counterfactual +) +# Result shows what demand would have been if price was 90 +``` + +### Advanced Causal Analysis + +#### deep_root_cause_analysis() + +Trace causal chains backward to identify ultimate root causes of problems. + +```python +deep_root_cause_analysis( + problem_variable: str, + max_depth: int = 20, + min_path_strength: float = 0.01 +) -> Dict[str, Any] +``` + +**Mathematical Formulation:** + +Path strength is computed as the product of edge strengths along the path: + +\[ +\text{Path Strength} = \prod_{(i,j) \in \text{Path}} \beta_{ij} +\] + +Root causes are ranked using multi-objective criteria: + +\[ +f(\text{rc}) = w_1 \cdot I_{\text{exo}}(\text{rc}) + w_2 \cdot S_{\text{path}}(\text{rc}) - w_3 \cdot D(\text{rc}) +\] + +where: +- \(I_{\text{exo}}\) is indicator for exogenous nodes (true root causes) +- \(S_{\text{path}}\) is path strength +- \(D\) is depth (distance from problem) + +**Example:** + +```python +# Find root causes of high backlog +root_causes = agent.deep_root_cause_analysis( + problem_variable="backlog", + max_depth=15, + min_path_strength=0.05 +) + +# Returns: +# { +# "ultimate_root_causes": [ +# { +# "root_cause": "supplier_capacity", +# "is_exogenous": True, +# "path_strength": 0.85, +# "depth": 3 +# } +# ], +# "intervention_opportunities": [...] +# } +``` + +#### multi_layer_whatif_analysis() + +Perform nested counterfactual reasoning across multiple layers to predict cascading effects. + +```python +multi_layer_whatif_analysis( + scenarios: List[Dict[str, float]], + depth: int = 3 +) -> Dict[str, Any] +``` + +**Process:** + +1. **Layer 1:** Direct effects of intervention +2. **Layer 2:** Effects of affected variables on other variables +3. **Layer 3+:** Deep cascade analysis using chain reaction detection + +**Example:** + +```python +scenarios = [{"price": 90.0}] # What if price drops to 90? + +result = agent.multi_layer_whatif_analysis( + scenarios=scenarios, + depth=5 +) + +# Analyzes: +# - Layer 1: Direct effect on demand +# - Layer 2: How demand affects inventory, lead times +# - Layer 3+: Cascading effects through entire system +``` + +#### analyze_cascading_chain_reaction() + +Analyze multi-layer cascading chain reactions from an intervention, including feedback loops. 
```python
analyze_cascading_chain_reaction(
    initial_intervention: Dict[str, float],
    target_outcomes: List[str],
    max_hops: int = 5,
    include_feedback_loops: bool = True,
    num_iterations: int = 3
) -> Dict[str, Any]
```

**Mathematical Formulation:**

For each causal path from intervention variables to outcomes:

\[
\text{Path Strength} = \prod_{(i,j) \in \text{Path}} \beta_{ij}
\]

Cascade probability is approximated with a clipped affine heuristic (not a softmax or a calibrated probability):

\[
P(\text{cascade}) = \min(0.95, \text{Path Strength} \cdot 0.5 + 0.05)
\]

**Example:**

```python
# Analyze chain reaction from price reduction
chain_reaction = agent.analyze_cascading_chain_reaction(
    initial_intervention={"price": 0.9},  # 10% reduction
    target_outcomes=["demand", "inventory", "cost"],
    max_hops=5,
    include_feedback_loops=True
)

# Identifies:
# - All causal paths from price to outcomes
# - Feedback loops that could amplify effects
# - Cascade probabilities and cumulative effects
```

### Optimization Methods

#### gradient_based_intervention_optimization()

Find optimal interventions using gradient-based optimization.

```python
gradient_based_intervention_optimization(
    initial_state: Dict[str, float],
    target: str,
    intervention_vars: List[str],
    constraints: Optional[Dict[str, Tuple[float, float]]] = None,
    method: str = "L-BFGS-B"
) -> Dict[str, Any]
```

**Mathematical Formulation:**

Objective: maximize the predicted outcome

\[
\max_{\theta} y(\theta)
\]

where \(\theta\) is the intervention vector and \(y(\theta)\) is the predicted outcome.

Gradient computation using finite differences:

\[
\frac{\partial y}{\partial \theta_i} \approx \frac{y(\theta + \varepsilon \cdot e_i) - y(\theta)}{\varepsilon}
\]

Update rule (gradient ascent on \(y\); equivalently, gradient descent on \(-y\)):

\[
\theta_{k+1} = \theta_k + \alpha \cdot \nabla_\theta y(\theta_k)
\]

**Example:**

```python
# Find optimal price to maximize profit
optimal = agent.gradient_based_intervention_optimization(
    initial_state={"price": 100.0, "demand": 1000.0},
    target="profit",
    intervention_vars=["price"],
    constraints={"price": (80.0, 120.0)},
    method="L-BFGS-B"
)

# Returns optimal price and predicted profit
```

#### bellman_optimal_intervention()

Dynamic programming (Bellman optimality) for optimal intervention sequences.

```python
bellman_optimal_intervention(
    initial_state: Dict[str, float],
    target: str,
    intervention_vars: List[str],
    horizon: int = 5,
    discount: float = 0.9
) -> Dict[str, Any]
```

**Mathematical Formulation:**

Value function (Bellman equation):

\[
V^*(x_t) = \max_{u_t} \left[ r(x_t, u_t) + \gamma \cdot V^*(f(x_t, u_t)) \right]
\]

Optimal policy:

\[
\pi^*(x_t) = \arg\max_{u_t} \left[ r(x_t, u_t) + \gamma \cdot V^*(f(x_t, u_t)) \right]
\]

where:

- \(r(x_t, u_t)\) is the immediate reward
- \(\gamma \in [0,1]\) is the discount factor
- \(f(x_t, u_t)\) is the system dynamics (next state)

**Example:**

```python
# Find optimal sequence of price adjustments over 5 periods
sequence = agent.bellman_optimal_intervention(
    initial_state={"price": 100.0, "demand": 1000.0},
    target="total_profit",
    intervention_vars=["price"],
    horizon=5,
    discount=0.9
)

# Returns an optimal price trajectory, e.g. [100, 95, 92, 90, 88]
```

#### evolutionary_multi_objective_optimization()

Evolutionary algorithm (NSGA-II inspired) for multi-objective optimization.
+ +```python +evolutionary_multi_objective_optimization( + initial_state: Dict[str, float], + objectives: Dict[str, float], # {var: weight} + constraints: Dict[str, Tuple[float, float]], + intervention_vars: List[str], + population_size: int = 50, + generations: int = 100 +) -> Dict[str, Any] +``` + +**Mathematical Formulation:** + +Weighted sum scalarization: + +\[ +F(x) = \sum_i w_i \cdot f_i(x) +\] + +Pareto dominance: solution \(x_1\) dominates \(x_2\) if: + +\[ +\forall i: f_i(x_1) \geq f_i(x_2) \quad \land \quad \exists j: f_j(x_1) > f_j(x_2) +\] + +**Example:** + +```python +# Optimize for both profit and customer satisfaction +pareto = agent.evolutionary_multi_objective_optimization( + initial_state={"price": 100.0}, + objectives={"profit": 0.7, "satisfaction": 0.3}, + constraints={"price": (80.0, 120.0)}, + intervention_vars=["price"], + population_size=50, + generations=100 +) + +# Returns Pareto frontier of non-dominated solutions +``` + +### Information Theory Methods + +#### compute_information_theoretic_measures() + +Compute entropy, mutual information, and conditional mutual information. + +```python +compute_information_theoretic_measures( + df: pd.DataFrame, + variables: List[str] +) -> Dict[str, Any] +``` + +**Mathematical Formulations:** + +**Shannon Entropy:** + +\[ +H(X) = -\sum_i p(x_i) \log_2 p(x_i) +\] + +**Mutual Information:** + +\[ +I(X;Y) = H(X) + H(Y) - H(X,Y) = \sum_{x,y} p(x,y) \log_2 \frac{p(x,y)}{p(x)p(y)} +\] + +**Conditional Mutual Information:** + +\[ +I(X;Y|Z) = H(X,Z) + H(Y,Z) - H(X,Y,Z) - H(Z) +\] + +**Example:** + +```python +measures = agent.compute_information_theoretic_measures( + df=historical_data, + variables=["price", "demand", "inventory"] +) + +# Returns: +# { +# "entropies": {"price": 3.2, "demand": 4.1, ...}, +# "mutual_information": {"price;demand": 0.85, ...}, +# "conditional_mi": {...} +# } +``` + +### Time Series Analysis + +#### granger_causality_test() + +Test whether one variable Granger-causes another (helps predict it). + +```python +granger_causality_test( + df: pd.DataFrame, + var1: str, + var2: str, + max_lag: int = 4 +) -> Dict[str, Any] +``` + +**Mathematical Formulation:** + +Restricted model (without var1): + +\[ +y_t = \alpha + \sum_{i=1}^m \beta_i y_{t-i} + \varepsilon_t +\] + +Unrestricted model (with var1): + +\[ +y_t = \alpha + \sum_{i=1}^m \beta_i y_{t-i} + \sum_{i=1}^m \gamma_i x_{t-i} + \varepsilon_t +\] + +F-statistic: + +\[ +F = \frac{(RSS_r - RSS_u)/m}{RSS_u/(n-2m-1)} +\] + +**Example:** + +```python +# Test if price changes Granger-cause demand changes +result = agent.granger_causality_test( + df=time_series_data, + var1="price", + var2="demand", + max_lag=4 +) + +# Returns F-statistic, p-value, and causality decision +``` + +#### vector_autoregression_estimation() + +Estimate Vector Autoregression (VAR) model for multivariate time series. + +```python +vector_autoregression_estimation( + df: pd.DataFrame, + variables: List[str], + max_lag: int = 2 +) -> Dict[str, Any] +``` + +**Mathematical Formulation:** + +VAR(p) model: + +\[ +\mathbf{x}_t = \mathbf{A}_1 \mathbf{x}_{t-1} + \mathbf{A}_2 \mathbf{x}_{t-2} + \ldots + \mathbf{A}_p \mathbf{x}_{t-p} + \boldsymbol{\varepsilon}_t +\] + +where \(\mathbf{A}_i\) are coefficient matrices and \(\boldsymbol{\varepsilon}_t\) is white noise. 
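For intuition, a VAR(1) coefficient matrix can be estimated with ordinary least squares on lagged observations. The numpy sketch below uses toy data and the row convention \(x_t \approx x_{t-1} A\); it is an illustration, not the agent's internal implementation:

```python
import numpy as np

rng = np.random.default_rng(0)
x = rng.normal(size=(100, 3))  # toy series: 100 time steps, 3 variables

Y = x[1:]    # x_t,     shape (99, 3)
Z = x[:-1]   # x_{t-1}, shape (99, 3)

# Least-squares fit of x_t ~ x_{t-1} @ A; A has shape (3, 3)
A, *_ = np.linalg.lstsq(Z, Y, rcond=None)

residuals = Y - Z @ A  # estimates of the white-noise term
```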
+ +**Example:** + +```python +var_model = agent.vector_autoregression_estimation( + df=time_series_data, + variables=["price", "demand", "inventory"], + max_lag=2 +) + +# Returns coefficient matrices and residuals +``` + +### Causal Discovery + +#### causal_discovery_pc_algorithm() + +PC algorithm for causal structure discovery from data. + +```python +causal_discovery_pc_algorithm( + df: pd.DataFrame, + variables: List[str], + alpha: float = 0.05 +) -> Dict[str, Any] +``` + +**Algorithm Steps:** + +1. Start with complete undirected graph +2. Remove edges if variables are conditionally independent given any subset +3. Orient edges using v-structure detection +4. Apply orientation rules (Meek's rules) + +**Example:** + +```python +# Learn causal structure from data +learned_graph = agent.causal_discovery_pc_algorithm( + df=historical_data, + variables=["price", "demand", "inventory", "cost"], + alpha=0.05 +) + +# Returns learned DAG structure +``` + +### Risk and Uncertainty Quantification + +#### quantify_uncertainty() + +Bootstrap edge strengths and produce confidence intervals. + +```python +quantify_uncertainty( + df: pd.DataFrame, + variables: List[str], + windows: int = 200, + alpha: float = 0.95 +) -> Dict[str, Any] +``` + +**Bootstrap Process:** + +1. Sample data with replacement +2. Re-estimate edge strengths +3. Compute confidence intervals from bootstrap distribution + +**Confidence Interval:** + +\[ +CI_{1-\alpha} = [Q_{\alpha/2}, Q_{1-\alpha/2}] +\] + +where \(Q_p\) is the p-th quantile of bootstrap distribution. + +**Example:** + +```python +uncertainty = agent.quantify_uncertainty( + df=historical_data, + variables=["price", "demand"], + windows=200, + alpha=0.95 +) + +# Returns 95% confidence intervals for all edge strengths +``` + +#### bayesian_edge_inference() + +Bayesian inference for edge strength using conjugate prior. + +```python +bayesian_edge_inference( + df: pd.DataFrame, + parent: str, + child: str, + prior_mu: float = 0.0, + prior_sigma: float = 1.0 +) -> Dict[str, Any] +``` + +**Mathematical Formulation:** + +Prior: \(\beta \sim N(\mu_0, \sigma_0^2)\) + +Posterior: \(\beta \mid \text{data} \sim N(\mu_n, \sigma_n^2)\) + +Posterior mean: + +\[ +\mu_n = \frac{\tau_0 \mu_0 + \tau_{\text{likelihood}} \cdot n \cdot \hat{\beta}_{\text{OLS}}}{\tau_0 + \tau_{\text{likelihood}} \cdot n} +\] + +where \(\tau = 1/\sigma^2\) is precision. + +**Example:** + +```python +# Bayesian inference for price -> demand effect +posterior = agent.bayesian_edge_inference( + df=historical_data, + parent="price", + child="demand", + prior_mu=0.0, + prior_sigma=1.0 +) + +# Returns posterior mean, variance, and credible intervals +``` + +## Real-World Applications + +### Supply Chain Management + +The CR-CA Agent revolutionizes supply chain management by identifying root causes of disruptions and optimizing inventory policies. 
+ +**Example: Supply Shock Analysis** + +```python +from swarms.agents import CRCAAgent + +# Initialize agent for supply chain +agent = CRCAAgent( + name="supply-chain-crca", + description="Supply chain causal analysis" +) + +# Build causal graph +agent.causal_graph.add_edges_from([ + ("lead_time", "receipts"), + ("survivability", "receipts"), + ("capacity", "receipts"), + ("receipts", "inventory"), + ("backlog", "price"), + ("price", "demand"), + ("demand", "orders") +]) + +# Fit from historical data +agent.fit_from_dataframe( + df=supply_chain_data, + variables=["lead_time", "receipts", "inventory", "backlog", "price", "demand"], + window=30, + decay_alpha=0.9 +) + +# Analyze port disruption scenario +disruption_analysis = agent.analyze_cascading_chain_reaction( + initial_intervention={"lead_time": 1.5}, # 50% increase + target_outcomes=["inventory", "backlog", "cost"], + max_hops=5, + include_feedback_loops=True +) + +# Find optimal safety stock policy +optimal_policy = agent.gradient_based_intervention_optimization( + initial_state={"safety_stock": 100.0, "backlog": 50.0}, + target="cost", # Minimize total cost + intervention_vars=["safety_stock"], + constraints={"safety_stock": (50.0, 200.0)} +) +``` + +**Key Benefits:** + +1. **Proactive Issue Resolution:** Identifies root causes before they escalate +2. **Optimized Resource Allocation:** Uses causal understanding to allocate safety stock efficiently +3. **Predictive Insights:** Anticipates supply shocks and their cascading effects +4. **Risk-Aware Decisions:** Quantifies uncertainty using CVaR and confidence intervals + +### Financial Market Analysis + +The CR-CA Agent enables sophisticated causal analysis of market dynamics, going beyond correlation to understand true causal drivers. + +**Example: Cryptocurrency Price Analysis** + +```python +# Build causal graph for ETH price analysis +agent = CRCAAgent(name="eth-price-analyzer") + +agent.causal_graph.add_edges_from([ + ("volume", "price"), + ("volatility", "price"), + ("rsi", "price"), + ("momentum", "price"), + ("market_sentiment", "price"), + ("btc_eth_corr", "price") +]) + +# Fit from historical price data +agent.fit_from_dataframe( + df=eth_price_data, + variables=["volume", "volatility", "rsi", "momentum", "market_sentiment", "btc_eth_corr", "price"], + window=30 +) + +# Perform causal analysis +causal_analysis = agent.causal_analysis() + +# Test Granger causality +granger_result = agent.granger_causality_test( + df=eth_price_data, + var1="volume", + var2="price", + max_lag=4 +) + +# Find optimal trading intervention +optimal_trade = agent.gradient_based_intervention_optimization( + initial_state={"holdings": 0.0}, + target="expected_return", + intervention_vars=["position_size"], + constraints={"position_size": (-1.0, 1.0)} +) +``` + +**Key Benefits:** + +1. **Causal Understanding:** Distinguishes true causal drivers from spurious correlations +2. **Predictive Power:** Forecasts price movements based on causal relationships +3. **Risk Management:** Quantifies uncertainty in predictions using confidence intervals +4. **Optimal Strategies:** Finds trading strategies that maximize risk-adjusted returns + +### Government Policy Simulation + +The CR-CA Agent enables sophisticated policy analysis by modeling causal relationships between policy interventions and social outcomes. 
+ +**Example: Economic Policy Analysis** + +```python +# Government policy simulation +agent = CRCAAgent(name="policy-simulator") + +# Build comprehensive causal graph +agent.causal_graph.add_edges_from([ + ("income_tax_rate", "disposable_income"), + ("disposable_income", "consumption"), + ("consumption", "gdp"), + ("cash_transfer", "disposable_income"), + ("carbon_tax", "emissions"), + ("emissions", "health_outcomes"), + ("education_spending", "human_capital"), + ("human_capital", "productivity") +]) + +# Fit from economic data +agent.fit_from_dataframe( + df=economic_data, + variables=["income_tax_rate", "cash_transfer", "carbon_tax", + "disposable_income", "consumption", "gdp", + "emissions", "health_outcomes", "inequality"], + window=60 +) + +# Multi-objective optimization: maximize welfare while minimizing inequality +pareto_frontier = agent.evolutionary_multi_objective_optimization( + initial_state={"income_tax_rate": 0.3, "cash_transfer": 0.0}, + objectives={"welfare": 0.7, "inequality": -0.3}, # Negative for minimization + constraints={ + "income_tax_rate": (0.0, 0.5), + "cash_transfer": (0.0, 1000.0) + }, + intervention_vars=["income_tax_rate", "cash_transfer"], + population_size=100, + generations=200 +) + +# Deep root cause analysis of poverty +poverty_roots = agent.deep_root_cause_analysis( + problem_variable="poverty_rate", + max_depth=20, + min_path_strength=0.05 +) +``` + +**Key Benefits:** + +1. **Evidence-Based Policy:** Uses causal inference to evaluate policy effectiveness +2. **Multi-Objective Optimization:** Balances competing objectives (growth vs. equality) +3. **Counterfactual Analysis:** Answers "what-if" questions about policy alternatives +4. **Root Cause Identification:** Traces social problems to their fundamental causes + +## Advanced Features + +### Explainability + +#### shapley_value_attribution() + +Fair attribution of causal effects using Shapley values from cooperative game theory. + +```python +shapley_value_attribution( + baseline_state: Dict[str, float], + target_state: Dict[str, float], + target: str +) -> Dict[str, float] +``` + +**Mathematical Formulation:** + +Shapley value for variable \(i\): + +\[ +\phi_i = \sum_{S \subseteq N \setminus \{i\}} \frac{|S|!(n-|S|-1)!}{n!} \left[v(S \cup \{i\}) - v(S)\right] +\] + +where \(v(S)\) is the outcome when variables in \(S\) are set to target values. + +**Properties:** +- **Efficiency:** \(\sum_i \phi_i = v(N) - v(\emptyset)\) +- **Symmetry:** Variables with identical contributions have equal Shapley values +- **Dummy:** Variables with no effect have zero Shapley value +- **Additivity:** Shapley values are additive across games + +#### integrated_gradients_attribution() + +Path-integrated gradients for causal attribution. + +```python +integrated_gradients_attribution( + baseline_state: Dict[str, float], + target_state: Dict[str, float], + target: str, + n_steps: int = 50 +) -> Dict[str, float] +``` + +**Mathematical Formulation:** + +Integrated gradient along path from baseline \(x^0\) to target \(x\): + +\[ +IG_i = (x_i - x_i^0) \cdot \int_0^1 \frac{\partial f}{\partial x_i}(x^0 + t \cdot (x - x^0)) \, dt +\] + +Approximated using Riemann sum: + +\[ +IG_i \approx (x_i - x_i^0) \cdot \frac{1}{m} \sum_{j=1}^m \frac{\partial f}{\partial x_i}\left(x^0 + \frac{j}{m}(x - x^0)\right) +\] + +### Non-Linear Extensions + +#### nonlinear_scm_prediction() + +Non-linear SCM with interaction terms. 
+ +```python +nonlinear_scm_prediction( + factual_state: Dict[str, float], + interventions: Dict[str, float], + include_interactions: bool = True +) -> Dict[str, float] +``` + +**Mathematical Formulation:** + +Extended model with interactions: + +\[ +y = \sum_i \beta_i \cdot x_i + \sum_{i,j} \gamma_{ij} \cdot x_i \cdot x_j + \varepsilon +\] + +where \(\gamma_{ij}\) are interaction coefficients. + +**Example:** + +```python +# Add interaction term: price × advertising +agent.add_interaction_term( + node="demand", + parent1="price", + parent2="advertising", + interaction_strength=0.15 +) + +# Predict with interactions +predicted = agent.nonlinear_scm_prediction( + factual_state={"price": 100.0, "advertising": 1000.0}, + interventions={}, + include_interactions=True +) +``` + +### Temporal Causal Analysis + +#### temporal_causal_chain_analysis() + +Model distributed lag effects in causal systems. + +```python +temporal_causal_chain_analysis( + initial_intervention: Dict[str, float], + target: str, + time_horizon: int = 10, + lag_structure: Optional[Dict[Tuple[str, str], int]] = None +) -> Dict[str, Any] +``` + +**Mathematical Formulation:** + +Distributed lag model: + +\[ +y_j(t + \tau_{ij}) = \beta_{ij} \cdot x_i(t) +\] + +where \(\tau_{ij}\) is the lag for edge \((i,j)\). + +Accumulated effect: + +\[ +y(t) = \sum_i \sum_k \beta_{ij} \cdot x_i(t - \tau_k) +\] + +**Example:** + +```python +# Model that policy changes take 2 periods to affect economy +lag_structure = { + ("tax_rate", "gdp"): 2, + ("spending", "gdp"): 1 +} + +temporal_analysis = agent.temporal_causal_chain_analysis( + initial_intervention={"tax_rate": 0.25}, + target="gdp", + time_horizon=10, + lag_structure=lag_structure +) + +# Shows GDP trajectory over 10 periods with delayed effects +``` + +## Best Practices + +### 1. Causal Graph Construction + +**Start with domain knowledge:** Use expert knowledge to initialize the causal graph before data-driven refinement. + +```python +# Good: Start with known causal structure +agent.causal_graph.add_edges_from([ + ("cause", "effect"), # Known from domain knowledge +]) + +# Then refine with data +agent.fit_from_dataframe(df, variables) +``` + +**Validate with data:** Use `causal_discovery_pc_algorithm()` to validate and refine the graph structure. + +### 2. Data Preparation + +**Ensure sufficient data:** The agent requires at least 30 observations per variable for reliable estimation. + +**Handle missing values:** The agent automatically handles missing values, but ensure sufficient complete cases. + +**Standardize scales:** While the agent standardizes internally, ensure variables are in reasonable ranges. + +### 3. Model Validation + +**Cross-validation:** Use `cross_validate_edge_strength()` to validate edge strength estimates. + +```python +cv_result = agent.cross_validate_edge_strength( + df=historical_data, + parent="price", + child="demand", + n_folds=5 +) + +# Lower CV error indicates more reliable estimates +``` + +**Bootstrap confidence intervals:** Use `quantify_uncertainty()` to assess estimation uncertainty. + +### 4. Intervention Design + +**Use constraints:** Always specify realistic constraints for interventions. + +```python +optimal = agent.gradient_based_intervention_optimization( + initial_state=current_state, + target="profit", + intervention_vars=["price"], + constraints={"price": (min_price, max_price)} # Always specify bounds +) +``` + +**Consider risk:** Use CVaR-based risk metrics for high-stakes decisions. + +### 5. 
Interpretation + +**Use explainability methods:** Leverage Shapley values and integrated gradients to understand model decisions. + +```python +# Understand why model recommends specific intervention +attribution = agent.shapley_value_attribution( + baseline_state=current_state, + target_state=recommended_state, + target="profit" +) + +# Shows contribution of each variable to predicted profit +``` + +## Performance Considerations + +### Caching + +The agent automatically caches prediction results to improve performance: + +```python +# Enable/disable caching +agent._cache_enabled = True +agent._cache_max_size = 1000 # Maximum cache entries + +# Clear cache when needed +agent.clear_cache() +``` + +### Vectorization + +For batch predictions, use `vectorized_batch_prediction()`: + +```python +# Process multiple interventions efficiently +interventions = [ + {"price": 90.0}, + {"price": 95.0}, + {"price": 100.0} +] + +predictions = agent.vectorized_batch_prediction( + initial_state=base_state, + intervention_batch=interventions +) +``` + +### Computational Complexity + +- **Graph fitting:** O(n × m × k) where n is window size, m is number of edges, k is number of variables +- **Prediction:** O(k) where k is number of variables (linear in graph size) +- **Root cause analysis:** O(k × d) where d is maximum depth +- **Optimization:** Varies by method (gradient: O(iterations × k), evolutionary: O(population × generations × k)) + +## Limitations and Considerations + +1. **DAG Assumption:** The agent assumes acyclic causal graphs. Cycles are automatically removed by eliminating weakest edges. + +2. **Linearity:** Default model assumes linear relationships. Use `nonlinear_scm_prediction()` for non-linear effects. + +3. **Confounders:** Unobserved confounders can bias estimates. Use domain knowledge to identify and adjust for known confounders. + +4. **Sample Size:** Requires sufficient data (typically 30+ observations per variable) for reliable estimation. + +5. **Causal Discovery:** Structure learning (PC algorithm) is simplified. For complex discovery, consider external tools like TETRAD or PC-stable. + +## Conclusion + +The CR-CA Agent represents a paradigm shift in decision-making systems, moving from correlation-based predictions to causal understanding. By implementing Pearl's Structural Causal Model framework with advanced optimization and risk quantification, it enables: + +- **Proactive Problem Solving:** Identify root causes before issues escalate +- **Evidence-Based Decisions:** Use causal inference to evaluate interventions +- **Optimal Resource Allocation:** Optimize policies based on causal understanding +- **Risk-Aware Planning:** Quantify and manage uncertainty in predictions + +Whether applied to supply chain management, financial analysis, or policy simulation, the CR-CA Agent transforms how organizations understand and manage complex systems. + +## References + +- Pearl, J. (2009). *Causality: Models, Reasoning, and Inference*. Cambridge University Press. +- Pearl, J., & Mackenzie, D. (2018). *The Book of Why: The New Science of Cause and Effect*. Basic Books. +- Spirtes, P., Glymour, C., & Scheines, R. (2000). *Causation, Prediction, and Search*. MIT Press. +- Peters, J., Janzing, D., & Schölkopf, B. (2017). *Elements of Causal Inference*. MIT Press. 
+ From c7ee00fdbbde05608ff421dfa46714f0db29c7dc Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 4 Nov 2025 02:47:07 +0200 Subject: [PATCH 05/12] Add CR-CA Agent documentation and reorganize sections --- docs/mkdocs.yml | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/docs/mkdocs.yml b/docs/mkdocs.yml index fbdd766e..cc5844bd 100644 --- a/docs/mkdocs.yml +++ b/docs/mkdocs.yml @@ -262,6 +262,9 @@ nav: - Agent Judge: "swarms/agents/agent_judge.md" - Reasoning Agent Router: "swarms/agents/reasoning_agent_router.md" + - CR-CA Agent: + - CR-CA Agent: "swarms/agents/cr_ca_agent.md" + - Multi-Agent Architectures: - Overview: "swarms/concept/swarm_architectures.md" - Benefits: "swarms/concept/why.md" @@ -296,8 +299,8 @@ nav: - Routers: - SwarmRouter: "swarms/structs/swarm_router.md" - MultiAgentRouter: "swarms/structs/multi_agent_router.md" - - AgentRouter: "swarms/structs/agent_router.md" - ModelRouter: "swarms/structs/model_router.md" + - AgentRouter: "swarms/structs/agent_router.md" - Rearrangers: @@ -433,11 +436,11 @@ nav: - Apps: - Web Scraper Agents: "developer_guides/web_scraper.md" - Smart Database: "examples/smart_database.md" - + - AOP: - Medical AOP Example: "examples/aop_medical.md" - - X402: + - X402: - x402 Quickstart Example: "examples/x402_payment_integration.md" From b987ea034200d242de388cf1183497f522c0214e Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 25 Nov 2025 14:47:25 +0200 Subject: [PATCH 06/12] Update print statement from 'Hello' to 'Goodbye' --- swarms/agents/cr_ca_agent.py | 4760 ++++------------------------------ 1 file changed, 447 insertions(+), 4313 deletions(-) diff --git a/swarms/agents/cr_ca_agent.py b/swarms/agents/cr_ca_agent.py index 3533c98a..f03f5ec5 100644 --- a/swarms/agents/cr_ca_agent.py +++ b/swarms/agents/cr_ca_agent.py @@ -1,23 +1,19 @@ -from swarms.structs.agent import Agent -from typing import Dict, Any, List, Tuple, Optional, Union, Callable -import networkx as nx +""" +CR-CA Lite: A lightweight Causal Reasoning with Counterfactual Analysis engine. + +This is a minimal implementation of the ASTT/CR-CA framework focusing on: +- Core evolution operator E(x) +- Counterfactual scenario generation +- Causal chain identification +- Basic causal graph operations + +Dependencies: numpy only (typing, dataclasses, enum are stdlib) +""" + +from typing import Dict, Any, List, Tuple, Optional import numpy as np from dataclasses import dataclass from enum import Enum -import math -from functools import lru_cache -from collections import defaultdict -from itertools import combinations -import pandas as pd -from scipy import stats as scipy_stats -from scipy.optimize import minimize, differential_evolution, minimize_scalar, basinhopping -from scipy.spatial.distance import euclidean, cosine, jensenshannon -from scipy.linalg import cholesky, inv, pinv -try: - import cvxpy as cp - CVXPY_AVAILABLE = True -except ImportError: - CVXPY_AVAILABLE = False class CausalRelationType(Enum): @@ -58,135 +54,51 @@ class CounterfactualScenario: reasoning: str = "" -class CRCAAgent: +class CRCALite: """ - Causal Reasoning with Counterfactual Analysis Agent. + CR-CA Lite: Lightweight Causal Reasoning with Counterfactual Analysis engine. 
+ + Core components: + - Evolution operator: E(x) = _predict_outcomes() + - Counterfactual generation: generate_counterfactual_scenarios() + - Causal chain identification: identify_causal_chain() + - State mapping: _standardize_state() / _destandardize_value() - This agent performs sophisticated causal inference and counterfactual reasoning - to understand cause-and-effect relationships and explore alternative scenarios. + Args: + variables: Optional list of variable names + causal_edges: Optional list of (source, target) tuples for initial edges """ def __init__( self, - name: str = "cr-ca-agent", - description: str = "Causal Reasoning with Counterfactual Analysis agent", - model_name: str = "openai/gpt-4o", - max_loops: int = 3, - causal_graph: Optional[nx.DiGraph] = None, variables: Optional[List[str]] = None, causal_edges: Optional[List[Tuple[str, str]]] = None, ): """ - Initialize the CR-CA Agent. - + Initialize CR-CA Lite engine. + Args: - name: Agent name - description: Agent description - model_name: LLM model to use - max_loops: Maximum reasoning loops - causal_graph: Pre-built causal graph - variables: List of variable names - causal_edges: List of causal relationships (source, target) + variables: Optional list of variable names to add to graph + causal_edges: Optional list of (source, target) tuples for initial edges """ - self.name = name - self.description = description - self.model_name = model_name - self.max_loops = max_loops - - # Initialize causal graph - self.causal_graph = causal_graph or nx.DiGraph() - if variables: - self.causal_graph.add_nodes_from(variables) - if causal_edges: - self.causal_graph.add_edges_from(causal_edges) - - # Initialize agent with CR-CA schema - self.agent = Agent( - agent_name=self.name, - agent_description=self.description, - model_name=self.model_name, - max_loops=1, - tools_list_dictionary=[self._get_cr_ca_schema()], - output_type="final", - ) + # Pure Python graph representation: {node: {child: strength}} + self.causal_graph: Dict[str, Dict[str, float]] = {} + self.causal_graph_reverse: Dict[str, List[str]] = {} # For fast parent lookup - # Memory for storing causal analysis history - self.causal_memory: List[Dict[str, Any]] = [] - self.counterfactual_scenarios: List[CounterfactualScenario] = [] - # Standardization statistics for each variable: {'var': {'mean': m, 'std': s}} + # Standardization statistics: {'var': {'mean': m, 'std': s}} self.standardization_stats: Dict[str, Dict[str, float]] = {} - # Optional history of learned edge strengths for temporal tracking - self.edge_strength_history: List[Dict[Tuple[str, str], float]] = [] - # Optional constraints: enforce monotonic signs on edges { (u,v): +1|-1 } - self.edge_sign_constraints: Dict[Tuple[str, str], int] = {} - # Random number generator for probabilistic methods - self.rng = np.random.default_rng() - - # Performance: caching for expensive computations - self._prediction_cache: Dict[Tuple[tuple, tuple], Dict[str, float]] = {} - self._cache_enabled: bool = True - self._cache_max_size: int = 1000 - # Non-linear extensions: interaction terms {node: [list of parent pairs to interact]} - self.interaction_terms: Dict[str, List[Tuple[str, str]]] = {} - - # Information theory cache - self._entropy_cache: Dict[str, float] = {} - self._mi_cache: Dict[Tuple[str, str], float] = {} + # Initialize graph + if variables: + for var in variables: + if var not in self.causal_graph: + self.causal_graph[var] = {} + if var not in self.causal_graph_reverse: + self.causal_graph_reverse[var] = [] - # 
Bayesian inference: prior distributions {edge: {'mu': μ₀, 'sigma': σ₀}} - self.bayesian_priors: Dict[Tuple[str, str], Dict[str, float]] = {} - - def _get_cr_ca_schema(self) -> Dict[str, Any]: - """Get the CR-CA agent schema for structured reasoning.""" - return { - "type": "function", - "function": { - "name": "generate_causal_analysis", - "description": "Generates structured causal reasoning and counterfactual analysis", - "parameters": { - "type": "object", - "properties": { - "causal_analysis": { - "type": "string", - "description": "Analysis of causal relationships and mechanisms" - }, - "intervention_planning": { - "type": "string", - "description": "Planned interventions to test causal hypotheses" - }, - "counterfactual_scenarios": { - "type": "array", - "items": { - "type": "object", - "properties": { - "scenario_name": {"type": "string"}, - "interventions": {"type": "object"}, - "expected_outcomes": {"type": "object"}, - "reasoning": {"type": "string"} - } - }, - "description": "Multiple counterfactual scenarios to explore" - }, - "causal_strength_assessment": { - "type": "string", - "description": "Assessment of causal relationship strengths and confounders" - }, - "optimal_solution": { - "type": "string", - "description": "Recommended optimal solution based on causal analysis" - } - }, - "required": [ - "causal_analysis", - "intervention_planning", - "counterfactual_scenarios", - "causal_strength_assessment", - "optimal_solution" - ] - } - } - } + if causal_edges: + for source, target in causal_edges: + self.add_causal_relationship(source, target) def add_causal_relationship( self, @@ -195,4328 +107,550 @@ class CRCAAgent: strength: float = 1.0, relation_type: CausalRelationType = CausalRelationType.DIRECT, confidence: float = 1.0 - ) -> None: - """Add a causal relationship to the graph.""" - self.causal_graph.add_edge(source, target) - self.causal_graph[source][target].update({ - 'strength': strength, - 'relation_type': relation_type, - 'confidence': confidence - }) - - def identify_causal_chain(self, start: str, end: str) -> List[str]: - """Identify the causal chain between two variables.""" - try: - path = nx.shortest_path(self.causal_graph, start, end) - return path - except nx.NetworkXNoPath: - return [] - - def detect_confounders(self, treatment: str, outcome: str) -> List[str]: - """Detect potential confounders for a treatment-outcome relationship.""" - confounders = [] - - # Find common ancestors - treatment_ancestors = set(nx.ancestors(self.causal_graph, treatment)) - outcome_ancestors = set(nx.ancestors(self.causal_graph, outcome)) - common_ancestors = treatment_ancestors.intersection(outcome_ancestors) - - # Check if common ancestors are connected to both treatment and outcome - for ancestor in common_ancestors: - if (nx.has_path(self.causal_graph, ancestor, treatment) and - nx.has_path(self.causal_graph, ancestor, outcome)): - confounders.append(ancestor) - - return confounders - - def generate_counterfactual_scenarios( - self, - factual_state: Dict[str, float], - target_variables: List[str], - max_scenarios: int = 5 - ) -> List[CounterfactualScenario]: - """Generate counterfactual scenarios for given variables.""" - scenarios = [] - - for i, target_var in enumerate(target_variables[:max_scenarios]): - # Use standardized z-score increments to avoid exploding magnitudes - stats = self.standardization_stats.get(target_var, {"mean": 0.0, "std": 1.0}) - z_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0] - current_raw = factual_state.get(target_var, 0.0) - # Map current value to 
z space (if stats available) - if stats["std"] > 0: - current_z = (current_raw - stats["mean"]) / stats["std"] - else: - current_z = 0.0 - # Propose interventions around current z value - proposed_z_values = [current_z + dz for dz in z_steps] - # Convert back to raw for simulation - intervention_values = [ - (z * stats["std"]) + stats["mean"] for z in proposed_z_values - ] - - for j, intervention_value in enumerate(intervention_values): - scenario = CounterfactualScenario( - name=f"scenario_{i}_{j}", - interventions={target_var: intervention_value}, - expected_outcomes=self._predict_outcomes(factual_state, {target_var: intervention_value}), - probability=self._calculate_scenario_probability(factual_state, {target_var: intervention_value}), - reasoning=f"Intervention on {target_var} with value {intervention_value}" - ) - scenarios.append(scenario) - - return scenarios - - def _standardize_state(self, state: Dict[str, float]) -> Dict[str, float]: - """Convert raw state dict to standardized z-scores using stored stats.""" - z: Dict[str, float] = {} - for k, v in state.items(): - stats = self.standardization_stats.get(k) - if stats and stats.get("std", 0.0) > 0: - z[k] = (v - stats["mean"]) / stats["std"] - else: - z[k] = v - return z - - def _destandardize_value(self, var: str, z_value: float) -> float: - """Convert a z-score back to raw value for a specific variable.""" - stats = self.standardization_stats.get(var) - if stats and stats.get("std", 0.0) > 0: - return z_value * stats["std"] + stats["mean"] - return z_value - - def _predict_outcomes( - self, - factual_state: Dict[str, float], - interventions: Dict[str, float], - use_cache: bool = True, - ) -> Dict[str, float]: - """ - Predict outcomes given interventions using standardized linear propagation. - - Mathematical foundation: - - Structural Equation Model (SEM): y = Xβ + ε where β are structural coefficients - - Do-operator: do(X=x) sets X=x, removing its dependence on parents - - In z-space (standardized): z_y = Σᵢ βᵢ·z_xi + z_ε - - Propagation: topological order ensures parents computed before children - - Standardization: z = (x - μ)/σ where μ is mean, σ is standard deviation - This ensures numerical stability and scale-invariance. - - Linear SCM: Each node y has equation y = Σᵢ βᵢ·xᵢ + ε - where xᵢ are parents, βᵢ are edge strengths, ε is noise. 
- - Args: - factual_state: Current state - interventions: Interventions to apply - use_cache: Whether to use prediction cache - - Returns: - Predicted outcomes - """ - # Note: Caching is handled by _predict_outcomes_cached wrapper - # This method is the actual computation (call with use_cache=False from cache wrapper) - # Merge states and convert to z-space - # Standardization: z = (x - μ)/σ (z-score transformation) - raw_state = factual_state.copy() - raw_state.update(interventions) - z_state = self._standardize_state(raw_state) - - # Work on a copy to avoid mutating initial inputs - z_pred = dict(z_state) - - # Propagate in topological order (ensures parents computed before children) - # Topological sort: linearization of DAG respecting causal ordering - for node in nx.topological_sort(self.causal_graph): - if node in interventions: - # Do-operator: do(X=x) forces X=x, breaking dependence on parents - # If directly intervened, keep its standardized value as-is - if node not in z_pred: - z_pred[node] = z_state.get(node, 0.0) - continue - - predecessors = list(self.causal_graph.predecessors(node)) - if not predecessors: - # Exogenous nodes (no parents): z_node = z_ε (noise term) - continue - - # Linear structural equation: z_y = Σᵢ βᵢ·z_xi - # This is the structural causal model (SCM) equation in z-space - effect_z = 0.0 - for parent in predecessors: - parent_z = z_pred.get(parent) - if parent_z is None: - parent_z = z_state.get(parent, 0.0) - edge_data = self.causal_graph[parent][node] - strength = edge_data.get('strength', 0.0) # Structural coefficient βᵢ - # Linear combination: z_y = Σᵢ βᵢ·z_xi - effect_z += parent_z * strength - - z_pred[node] = effect_z # Store predicted z-score - - # Convert back to raw value space using inverse standardization - # De-standardization: x = z·σ + μ - predicted_state: Dict[str, float] = {} - for var, z_val in z_pred.items(): - predicted_state[var] = self._destandardize_value(var, z_val) - return predicted_state - - def _calculate_scenario_probability( - self, - factual_state: Dict[str, float], - interventions: Dict[str, float] - ) -> float: - """ - Calculate smoothed probability using standardized z-distance. - - Mathematical formulation: - - Compute z-score deltas: dz_i = z_new_i - z_old_i for each intervened variable - - L2 norm squared: ||dz||² = Σᵢ (dz_i)² - - Gaussian-like probability: p = 0.95 * exp(-0.5 * ||dz||²) + 0.05 - - Bounded to [0.05, 0.98]: p = clip(p, 0.05, 0.98) - - This follows the Mahalanobis distance-based probability in multivariate Gaussian. 
- """ - # Step 1: Compute z-score deltas for intervened variables - # dz_i = z_new_i - z_old_i where z = (x - μ)/σ - z_sq_sum = 0.0 - for var, new_val in interventions.items(): - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - mu = stats.get('mean', 0.0) # μ: mean - sd = stats.get('std', 1.0) or 1.0 # σ: standard deviation - - # Get old value from factual state or use mean as default - old_val = factual_state.get(var, mu) - - # Compute z-scores: z = (x - μ)/σ - z_new = (new_val - mu) / sd - z_old = (old_val - mu) / sd - - # Delta in z-space: dz = z_new - z_old - dz = z_new - z_old - - # Accumulate squared L2 norm: ||dz||² = Σᵢ (dz_i)² - z_sq_sum += float(dz) * float(dz) - - # Step 2: Compute probability using exponential decay - # p = 0.95 * exp(-0.5 * ||dz||²) + 0.05 - # This gives high probability (near 0.95) when ||dz||² ≈ 0 (small intervention) - # and low probability (near 0.05) when ||dz||² is large (large intervention) - prob = 0.95 * float(np.exp(-0.5 * z_sq_sum)) + 0.05 - - # Step 3: Clip to valid probability range [0.05, 0.98] - # p = min(0.98, max(0.05, p)) - prob = max(0.05, min(0.98, prob)) - - return float(prob) - - def analyze_causal_strength(self, source: str, target: str) -> Dict[str, float]: - """Analyze the strength of causal relationship between two variables.""" - if not self.causal_graph.has_edge(source, target): - return {"strength": 0.0, "confidence": 0.0, "path_length": float('inf')} - - edge_data = self.causal_graph[source][target] - path_length = len(nx.shortest_path(self.causal_graph, source, target)) - 1 - - return { - "strength": edge_data.get('strength', 1.0), - "confidence": edge_data.get('confidence', 1.0), - "path_length": path_length, - "relation_type": edge_data.get('relation_type', CausalRelationType.DIRECT).value - } - - def fit_from_dataframe( - self, - df: Any, - variables: List[str], - window: int = 30, - decay_alpha: float = 0.9, - ridge_lambda: float = 0.0, - enforce_signs: bool = True - ) -> None: - """Fit edge strengths and standardization stats from a rolling window with recency weighting. - - For each child variable, perform a simple weighted linear regression on its parents - defined in the existing graph to estimate edge 'strength' coefficients. Also compute - mean/std for z-score scaling. Uses exponential decay weights to emphasize recent data. 
- """ - if df is None or len(df) == 0: - return - df_local = df[variables].dropna().copy() - if len(df_local) < max(3, window): - # Still compute stats on available data - pass - # Use the last `window` rows - window_df = df_local.tail(window) - n = len(window_df) - # Exponential decay weights: newer rows get higher weights - # Oldest gets alpha^(n-1), newest gets alpha^0 = 1.0 - weights = np.array([decay_alpha ** (n - 1 - i) for i in range(n)], dtype=float) - weights = weights / (weights.sum() if weights.sum() != 0 else 1.0) - - # Compute standardization stats - self.standardization_stats = {} - for v in variables: - m = float(window_df[v].mean()) - s = float(window_df[v].std(ddof=0)) - if s == 0: - s = 1.0 - self.standardization_stats[v] = {"mean": m, "std": s} - # Ensure default stats for any graph node not in the window variables - for node in self.causal_graph.nodes(): - if node not in self.standardization_stats: - self.standardization_stats[node] = {"mean": 0.0, "std": 1.0} - - # Estimate edge strengths per node from its parents - learned_strengths: Dict[Tuple[str, str], float] = {} - for child in self.causal_graph.nodes(): - parents = list(self.causal_graph.predecessors(child)) - if not parents: - continue - # Skip children not present in the data window - if child not in window_df.columns: - continue - # Prepare standardized design matrix X (parents) and target y (child) - X_cols = [] - for p in parents: - if p in window_df.columns: - X_cols.append(((window_df[p] - self.standardization_stats[p]["mean"]) / self.standardization_stats[p]["std"]).values) - if not X_cols: - continue - X = np.vstack(X_cols).T # shape (n, k) - y = ((window_df[child] - self.standardization_stats[child]["mean"]) / self.standardization_stats[child]["std"]).values - # Weighted least squares: (X' W X)^{-1} X' W y - W = np.diag(weights) - XtW = X.T @ W - XtWX = XtW @ X - # Ridge regularization for stability - if ridge_lambda > 0 and XtWX.size > 0: - k = XtWX.shape[0] - XtWX = XtWX + ridge_lambda * np.eye(k) - try: - XtWX_inv = np.linalg.pinv(XtWX) - beta = XtWX_inv @ (XtW @ y) - except Exception: - beta = np.zeros(X.shape[1]) - # Assign strengths to edges in order of parents - for idx, p in enumerate(parents): - strength = float(beta[idx]) if idx < len(beta) else 0.0 - # Enforce monotonic sign constraints if requested - if enforce_signs: - sign = self.edge_sign_constraints.get((p, child)) - if sign == 1 and strength < 0: - strength = 0.0 - elif sign == -1 and strength > 0: - strength = 0.0 - if self.causal_graph.has_edge(p, child): - self.causal_graph[p][child]['strength'] = strength - self.causal_graph[p][child]['confidence'] = 1.0 - learned_strengths[(p, child)] = strength - # Track history for temporal drift analysis - self.edge_strength_history.append(learned_strengths) - - # Enforce DAG: if cycles exist, iteratively remove weakest edge in cycles - try: - while not nx.is_directed_acyclic_graph(self.causal_graph): - cycle_edges = list(nx.find_cycle(self.causal_graph, orientation="original")) - # pick weakest edge among cycle - weakest = None - weakest_w = float("inf") - for u, v, _ in cycle_edges: - w = abs(float(self.causal_graph[u][v].get('strength', 0.0))) - if w < weakest_w: - weakest_w = w - weakest = (u, v) - if weakest: - self.causal_graph.remove_edge(*weakest) - else: - break - except Exception: - pass - - def identify_adjustment_set(self, treatment: str, outcome: str) -> List[str]: - """Heuristic back-door adjustment set selection. 
- - Returns a set that blocks back-door paths: parents of treatment excluding descendants of treatment and the outcome itself. - """ - if treatment not in self.causal_graph or outcome not in self.causal_graph: - return [] - parents_t = set(self.causal_graph.predecessors(treatment)) - descendants_t = set(nx.descendants(self.causal_graph, treatment)) - adjustment = [z for z in parents_t if z not in descendants_t and z != outcome] - return adjustment - - def estimate_ate( - self, - df: Any, - treatment: str, - outcome: str, - conditioning: Optional[List[str]] = None, - method: str = 'ols' - ) -> float: - """Estimate average treatment effect using simple regression adjustment. - - y ~ T + Z, return coefficient on T in standardized space. - """ - if df is None or len(df) == 0: - return 0.0 - if conditioning is None: - conditioning = self.identify_adjustment_set(treatment, outcome) - cols = [c for c in [outcome, treatment] + conditioning if c in df.columns] - data = df[cols].dropna() - if len(data) < 5: - return 0.0 - # Standardize - ds = (data - data.mean()) / (data.std(ddof=0).replace(0, 1.0)) - y = ds[outcome].values - X_cols = [ds[treatment].values] + [ds[c].values for c in conditioning] - X = np.vstack(X_cols).T - # OLS - try: - beta = np.linalg.pinv(X) @ y - return float(beta[0]) - except Exception: - return 0.0 - - def estimate_cate( - self, - df: Any, - treatment: str, - outcome: str, - context_by: Optional[str] = None, - num_bins: int = 3 - ) -> Dict[str, float]: - """Estimate heterogeneous effects by binning a context feature and computing local ATEs.""" - if df is None or len(df) == 0 or context_by is None or context_by not in df.columns: - return {} - series = df[context_by].dropna() - if len(series) < 10: - return {} - quantiles = np.linspace(0, 1, num_bins + 1) - bins = series.quantile(quantiles).values - bins[0] = -np.inf - bins[-1] = np.inf - cate: Dict[str, float] = {} - for i in range(num_bins): - mask = (df[context_by] > bins[i]) & (df[context_by] <= bins[i+1]) - ate_bin = self._safe_ate_bin(df[mask], treatment, outcome) - cate[f"bin_{i}"] = ate_bin - return cate - - def _safe_ate_bin(self, df: Any, treatment: str, outcome: str) -> float: - if df is None or len(df) < 5: - return 0.0 - return self.estimate_ate(df, treatment, outcome) - - def counterfactual_abduction_action_prediction( - self, - factual_state: Dict[str, float], - interventions: Dict[str, float] - ) -> Dict[str, float]: - """ - Abduction–Action–Prediction for linear-Gaussian SCM in z-space. - - Pearl's three-step counterfactual reasoning: - - 1. Abduction: Infer latent noise terms ε from factual observations - - Given factual: x_factual, compute ε = x - E[x|parents] - - For linear SCM: ε = z_y - Σᵢ βᵢ·z_xi (residual) - - This preserves the "history" that led to factual state - - 2. Action: Apply do-operator do(X=x*) to set intervention values - - do(X=x*) breaks causal dependencies: P(Y|do(X=x*)) ≠ P(Y|X=x*) - - Sets intervened variables to counterfactual values - - 3. Prediction: Propagate with new values but old noise - - Use abduced noise ε from step 1 - - Predict: y_cf = Σᵢ βᵢ·x_cfᵢ + ε (same noise, new parents) - - This gives counterfactual: "What if X had been x* instead of x_factual?" 
- - Mathematical foundation: - - Factual: Y = f(X, ε) where ε ~ N(0, σ²) - - Abduction: ε̂ = Y_factual - f(X_factual, 0) (infer noise from observation) - - Counterfactual: Y_cf = f(X_cf, ε̂) (same noise, different X) - """ - # Standardize factual: z = (x - μ)/σ - z = self._standardize_state(factual_state) - noise: Dict[str, float] = {} - - # Step 1: ABDUCTION - Infer latent noise terms from factual observations - # Noise represents unobserved confounders and stochastic variation - # For linear SCM: ε = z_y - Σᵢ βᵢ·z_xi (residual from linear regression) - for node in nx.topological_sort(self.causal_graph): - parents = list(self.causal_graph.predecessors(node)) - if not parents: - # Exogenous: noise equals observed value (no parents to subtract) - noise[node] = z.get(node, 0.0) - continue - - # Predicted value from structural equation: ŷ = Σᵢ βᵢ·xᵢ - pred = 0.0 - for p in parents: - w = self.causal_graph[p][node].get('strength', 0.0) # βᵢ - pred += z.get(p, 0.0) * w # Σᵢ βᵢ·z_xi - - # Abduce noise: ε = z_observed - ŷ - # This captures the deviation from deterministic prediction - noise[node] = z.get(node, 0.0) - pred - # Action + prediction - cf_raw = factual_state.copy() - cf_raw.update(interventions) - z_cf = self._standardize_state(cf_raw) - z_pred: Dict[str, float] = {} - for node in nx.topological_sort(self.causal_graph): - if node in interventions: - z_pred[node] = z_cf.get(node, 0.0) - continue - parents = list(self.causal_graph.predecessors(node)) - if not parents: - z_pred[node] = noise.get(node, 0.0) - continue - val = 0.0 - for p in parents: - w = self.causal_graph[p][node].get('strength', 0.0) - val += z_pred.get(p, z_cf.get(p, 0.0)) * w - z_pred[node] = val + noise.get(node, 0.0) - # De-standardize - out: Dict[str, float] = {k: self._destandardize_value(k, v) for k, v in z_pred.items()} - return out - - def quantify_uncertainty( - self, - df: Any, - variables: List[str], - windows: int = 200, - alpha: float = 0.95 - ) -> Dict[str, Any]: - """Bootstrap strengths and produce confidence intervals per edge. - - If PyMC is available, provide a Bayesian posterior CI as well (best effort). 
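-
-        Example (illustrative; assumes ``agent`` has already been fitted and
-        ``df`` is a pandas DataFrame holding the listed columns):
-
-            >>> report = agent.quantify_uncertainty(df, variables=["x", "y"], windows=50)
-            >>> report["edge_cis"].get("x->y")  # (lower, upper) bootstrap CI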
- """ - if df is None or len(df) == 0: - return {"edge_cis": {}, "samples": 0} - samples: Dict[Tuple[str, str], List[float]] = {} - usable = df[variables].dropna() - if len(usable) < 10: - return {"edge_cis": {}, "samples": 0} - idx = np.arange(len(usable)) - for _ in range(windows): - boot_idx = np.random.choice(idx, size=len(idx), replace=True) - boot_df = usable.iloc[boot_idx] - self.fit_from_dataframe(boot_df, variables=variables, window=min(30, len(boot_df))) - for u, v in self.causal_graph.edges(): - w = float(self.causal_graph[u][v].get('strength', 0.0)) - samples.setdefault((u, v), []).append(w) - edge_cis: Dict[str, Tuple[float, float]] = {} - for (u, v), arr in samples.items(): - arr = np.array(arr) - lo = float(np.quantile(arr, (1 - alpha) / 2)) - hi = float(np.quantile(arr, 1 - (1 - alpha) / 2)) - edge_cis[f"{u}->{v}"] = (lo, hi) - out: Dict[str, Any] = {"edge_cis": edge_cis, "samples": windows} - # Optional Bayesian: very lightweight attempt using PyMC linear model per edge - try: - import pymc as pm # type: ignore - bayes_cis: Dict[str, Tuple[float, float]] = {} - data = usable - for u, v in self.causal_graph.edges(): - if u not in data.columns or v not in data.columns: - continue - X = (data[[u]].values).astype(float) - y = (data[v].values).astype(float) - with pm.Model() as m: - beta = pm.Normal('beta', mu=0, sigma=1) - sigma = pm.HalfNormal('sigma', sigma=1) - mu = beta * X.flatten() - pm.Normal('obs', mu=mu, sigma=sigma, observed=y) - idata = pm.sampling_jax.sample_numpyro_nuts(draws=500, tune=300, chains=1, progressbar=False) - b_samp = np.asarray(idata.posterior['beta']).flatten() - bayes_cis[f"{u}->{v}"] = (float(np.quantile(b_samp, 0.05)), float(np.quantile(b_samp, 0.95))) - out["bayes_cis"] = bayes_cis - except Exception: - pass - return out - - def detect_change_points(self, series: List[float], threshold: float = 2.5) -> List[int]: - """Simple CUSUM-like change detection; returns indices with large cumulative shifts.""" - if not series or len(series) < 10: - return [] - x = np.array(series, dtype=float) - mu = x.mean() - sigma = x.std() or 1.0 - s = np.cumsum((x - mu) / sigma) - return [int(i) for i, v in enumerate(s) if abs(v) > threshold] - - def learn_structure( - self, - df: Any, - variables: List[str], - corr_threshold: float = 0.2 - ) -> None: - """Very simple structure learning: add edges where |corr|>threshold, enforce DAG by ordering. - - Order variables as provided and only add edges from earlier to later variables. 
- """ - if df is None or len(df) == 0: - return - data = df[variables].dropna() - if len(data) < 10: - return - corr = data.corr().values - self.causal_graph.clear() - self.causal_graph.add_nodes_from(variables) - n = len(variables) - for i in range(n): - for j in range(i+1, n): - if abs(corr[i, j]) >= corr_threshold: - self.add_causal_relationship(variables[i], variables[j], strength=0.0) - - def sample_joint_interventions_gaussian_copula( - self, - base_state: Dict[str, float], - variables: List[str], - df: Any, - num_samples: int = 10, - z_radius: float = 1.0 - ) -> List[Dict[str, float]]: - """Sample joint interventions using a Gaussian copula built from historical correlations in z-space.""" - out: List[Dict[str, float]] = [] - if df is None or len(df) == 0: - return out - hist = df[variables].dropna() - if len(hist) < 10: - return out - # Standardize - H = (hist - hist.mean()) / (hist.std(ddof=0).replace(0, 1.0)) - cov = np.cov(H.values.T) - # Ensure positive semi-definite via eigen clipping - eigvals, eigvecs = np.linalg.eigh(cov) - eigvals_clipped = np.clip(eigvals, 1e-6, None) - cov_psd = (eigvecs @ np.diag(eigvals_clipped) @ eigvecs.T) - mean = np.zeros(len(variables)) - z_samples = np.random.multivariate_normal(mean, cov_psd, size=num_samples) - for z in z_samples: - scaled = {} - for k, v in zip(variables, z): - scaled[k] = self._destandardize_value(k, float(np.clip(v, -z_radius, z_radius))) - out.append({**base_state, **scaled}) - return out - - def plan_interventions( - self, - target_outcome: str, - candidates: List[str], - base_state: Dict[str, float], - df: Any, - budget: float = 1.0, - num_grid: int = 5, - risk_metric: str = 'cvar', - cvar_alpha: float = 0.9 - ) -> List[Dict[str, Any]]: - """Risk-aware intervention planner. Grid-search small z-steps and penalize by CVaR proxy. - - Returns top plans with objective = expected improvement - risk_penalty. 
- """ - if not candidates: - return [] - # Build small z-grid per candidate - z_levels = np.linspace(-budget, budget, num_grid) - results: List[Dict[str, Any]] = [] - for var in candidates: - for z in z_levels: - # Convert z-shift to raw using stats - raw_shift = self._destandardize_value(var, z) - self._destandardize_value(var, 0.0) - trial_state = base_state.copy() - trial_state[var] = base_state.get(var, 0.0) + raw_shift - # Predict deterministic outcome - pred = self._predict_outcomes(base_state, {var: trial_state[var]}) - benefit = pred.get(target_outcome, 0.0) - base_state.get(target_outcome, 0.0) - # Risk via bootstrap strengths if data provided - risk_penalty = 0.0 - if df is not None and risk_metric == 'cvar': - unc = self.quantify_uncertainty(df, variables=list(set(candidates + [target_outcome])), windows=100, alpha=cvar_alpha) - # Build perturbed outcomes by sampling edge strengths from CIs midpoint +/- half-range - edge_cis = unc.get('edge_cis', {}) - outcomes = [] - for _ in range(50): - # Temporarily perturb strengths - saved: Dict[Tuple[str, str], float] = {} - for (u, v) in self.causal_graph.edges(): - key = f"{u}->{v}" - if key in edge_cis: - lo, hi = edge_cis[key] - w = float(np.random.uniform(lo, hi)) - saved[(u, v)] = self.causal_graph[u][v]['strength'] - self.causal_graph[u][v]['strength'] = w - p = self._predict_outcomes(base_state, {var: trial_state[var]}).get(target_outcome, 0.0) - outcomes.append(p) - # Restore - for (u, v), w in saved.items(): - self.causal_graph[u][v]['strength'] = w - outcomes = np.array(outcomes) - losses = base_state.get(target_outcome, 0.0) - outcomes - tail = np.quantile(losses, cvar_alpha) - risk_penalty = float(losses[losses >= tail].mean()) if np.any(losses >= tail) else 0.0 - score = benefit - risk_penalty - results.append({ - 'var': var, - 'z': float(z), - 'raw_shift': float(raw_shift), - 'benefit': float(benefit), - 'risk_penalty': float(risk_penalty), - 'score': float(score), - 'predicted': pred.get(target_outcome, 0.0) - }) - results.sort(key=lambda x: x['score'], reverse=True) - return results[:10] - - def state_space_update( - self, - prev_mean: float, - prev_var: float, - observation: float, - process_var: float = 1e-2, - obs_var: float = 1e-1 - ) -> Tuple[float, float]: - """Minimal 1D Kalman-like update returning new mean/variance.""" - # Predict - pred_mean = prev_mean - pred_var = prev_var + process_var - # Update - K = pred_var / (pred_var + obs_var) - new_mean = pred_mean + K * (observation - pred_mean) - new_var = (1 - K) * pred_var - return float(new_mean), float(new_var) - - def causal_explain_ace(self, child: str) -> Dict[str, float]: - """Decompose child prediction into parent contributions in z-space (ACE-like for linear model).""" - parents = list(self.causal_graph.predecessors(child)) - if not parents: - return {} - contrib: Dict[str, float] = {} - for p in parents: - contrib[p] = float(self.causal_graph[p][child].get('strength', 0.0)) - return contrib - - def identifiability_report(self, treatment: str, outcome: str) -> str: - """Simple do-calculus identifiability report stub based on back-door availability.""" - adj = self.identify_adjustment_set(treatment, outcome) - if adj: - return f"Effect of {treatment} on {outcome} identifiable via back-door with adjustment set: {adj}" - return f"Effect of {treatment} on {outcome} not identified by simple back-door; consider IVs or front-door." 
-
-    def identify_instruments(self, treatment: str, outcome: str) -> List[str]:
-        """Heuristic IV identification: candidates are parents of treatment whose only route to the outcome runs through the treatment.
-
-        This enforces relevance (parent of T) and exclusion (no treatment-independent path to Y) in the graph structure.
-        """
-        if treatment not in self.causal_graph or outcome not in self.causal_graph:
-            return []
-        if treatment == outcome:
-            return []
-        # Exclusion must ignore the legitimate z -> T -> ... -> Y channel, so
-        # check for a z -> Y path in a copy of the graph with T removed;
-        # checking the full graph would disqualify every parent of T whenever
-        # T itself affects Y.
-        graph_without_t = self.causal_graph.copy()
-        graph_without_t.remove_node(treatment)
-        instruments: List[str] = []
-        for z in self.causal_graph.predecessors(treatment):
-            # Relevance: z -> treatment by definition
-            # Exclusion: no path from z to outcome that bypasses treatment
-            if not nx.has_path(graph_without_t, z, outcome):
-                instruments.append(z)
-        return instruments
-
-    def estimate_2sls(
-        self,
-        df: Any,
-        treatment: str,
-        outcome: str,
-        instruments: Optional[List[str]] = None,
-        controls: Optional[List[str]] = None
-    ) -> Dict[str, Any]:
-        """Two-Stage Least Squares estimator for causal effect of treatment on outcome.
-
-        Returns a dict with {'coef': float, 'first_stage_F': float, 'used_instruments': [...], 'used_controls': [...]}.
-        """
-        result = {"coef": 0.0, "first_stage_F": 0.0, "used_instruments": [], "used_controls": []}
-        if df is None or len(df) == 0 or treatment not in df.columns or outcome not in df.columns:
-            return result
-        if instruments is None or len(instruments) == 0:
-            instruments = self.identify_instruments(treatment, outcome)
-        # Keep only instruments actually present in the data to avoid KeyErrors below
-        instruments = [z for z in instruments if z in df.columns]
-        if controls is None:
-            controls = []
-        cols_needed = [outcome, treatment] + instruments + controls
-        cols = [c for c in cols_needed if c in df.columns]
-        data = df[cols].dropna()
-        if len(data) < 10 or len(instruments) == 0:
-            return result
-        # Standardize
-        ds = (data - data.mean()) / (data.std(ddof=0).replace(0, 1.0))
-        # First stage: T ~ Z + C
-        ZC_cols = [ds[z].values for z in instruments] + [ds[c].values for c in controls if c in ds.columns]
-        if not ZC_cols:
-            return result
-        X1 = np.vstack(ZC_cols).T
-        y1 = ds[treatment].values
-        X1TX1 = X1.T @ X1
-        try:
-            beta1 = np.linalg.pinv(X1TX1) @ (X1.T @ y1)
-        except Exception:
-            return result
-        t_hat = X1 @ beta1
-        # First-stage F-statistic proxy: var explained / residual var times dof ratio (rough heuristic)
-        ssr = float(((t_hat - y1.mean()) ** 2).sum())
-        sse = float(((y1 - t_hat) ** 2).sum())
-        k = X1.shape[1]
-        n = X1.shape[0]
-        if sse > 0 and n > k and k > 0:
-            result["first_stage_F"] = (ssr / k) / (sse / (n - k - 1))
-        # Second stage: Y ~ T_hat + C
-        X2_cols = [t_hat] + [ds[c].values for c in controls if c in ds.columns]
-        X2 = np.vstack(X2_cols).T
-        y2 = ds[outcome].values
-        try:
-            beta2 = np.linalg.pinv(X2.T @ X2) @ (X2.T @ y2)
-            result["coef"] = float(beta2[0])
-        except Exception:
-            result["coef"] = 0.0
-        result["used_instruments"] = [z for z in instruments if z in ds.columns]
-        result["used_controls"] = [c for c in controls if c in ds.columns]
-        return result
-
-    def find_optimal_interventions(
-        self,
-        target_outcome: str,
-        available_interventions: List[str],
-        constraints: Optional[Dict[str, Tuple[float, float]]] = None
-    ) -> List[Dict[str, float]]:
-        """Find optimal interventions to achieve target outcome."""
-        if constraints is None:
-            constraints = {}
-
-        optimal_interventions = []
-
-        # Generate intervention combinations
-        for intervention_var in available_interventions:
-            if intervention_var in constraints:
-                min_val, max_val = constraints[intervention_var]
-                test_values = np.linspace(min_val, max_val, 10)
-            else:
-                test_values = np.linspace(-2.0, 2.0, 10)
-
-            for value in test_values:
-                intervention = {intervention_var: value}
-                predicted_outcomes = self._predict_outcomes({},
intervention) - - if target_outcome in predicted_outcomes: - optimal_interventions.append({ - 'intervention': intervention, - 'predicted_outcome': predicted_outcomes[target_outcome], - 'efficiency': abs(predicted_outcomes[target_outcome]) / abs(value) if value != 0 else 0 - }) - - # Sort by efficiency and return top interventions - optimal_interventions.sort(key=lambda x: x['efficiency'], reverse=True) - return optimal_interventions[:5] - - def step(self, task: str) -> str: - """Execute a single step of causal reasoning.""" - response = self.agent.run(task) - return response - - def run(self, task: str, *args, **kwargs) -> Dict[str, Any]: - """ - Run the CR-CA agent for comprehensive causal analysis. - - Args: - task: The problem or question to analyze causally - - Returns: - Dictionary containing causal analysis results - """ - # Reset memory - self.causal_memory = [] - self.counterfactual_scenarios = [] - - # Build causal analysis prompt - causal_prompt = self._build_causal_prompt(task) - - # Run causal analysis - for i in range(self.max_loops): - print(f"\nCausal Analysis Step {i+1}/{self.max_loops}") - - step_result = self.step(causal_prompt) - self.causal_memory.append({ - 'step': i + 1, - 'analysis': step_result, - 'timestamp': i - }) - - # Update prompt with previous analysis - if i < self.max_loops - 1: - memory_context = self._build_memory_context() - causal_prompt = f"{causal_prompt}\n\nPrevious Analysis:\n{memory_context}" - - # Generate final causal analysis - final_analysis = self._synthesize_causal_analysis(task) - - return { - 'task': task, - 'causal_analysis': final_analysis, - 'counterfactual_scenarios': self.counterfactual_scenarios, - 'causal_graph_info': { - 'nodes': list(self.causal_graph.nodes()), - 'edges': list(self.causal_graph.edges()), - 'is_dag': nx.is_directed_acyclic_graph(self.causal_graph) - }, - 'analysis_steps': self.causal_memory - } - - def _build_causal_prompt(self, task: str) -> str: - """Build the causal analysis prompt.""" - return f""" - You are a Causal Reasoning with Counterfactual Analysis (CR-CA) agent. - Analyze the following problem using sophisticated causal reasoning: - - Problem: {task} - - Your analysis should include: - 1. Causal Analysis: Identify cause-and-effect relationships - 2. Intervention Planning: Plan interventions to test causal hypotheses - 3. Counterfactual Scenarios: Explore multiple "what-if" scenarios - 4. Causal Strength Assessment: Evaluate relationship strengths and confounders - 5. Optimal Solution: Recommend the best approach based on causal analysis - - Current causal graph has {len(self.causal_graph.nodes())} variables and {len(self.causal_graph.edges())} relationships. 
- """ - - def _build_memory_context(self) -> str: - """Build memory context from previous analysis steps.""" - context_parts = [] - for step in self.causal_memory[-2:]: # Last 2 steps - context_parts.append(f"Step {step['step']}: {step['analysis']}") - return "\n".join(context_parts) - - def _synthesize_causal_analysis(self, task: str) -> str: - """Synthesize the final causal analysis from all steps.""" - synthesis_prompt = f""" - Based on the causal analysis steps performed, synthesize a comprehensive - causal reasoning report for: {task} - - Include: - - Key causal relationships identified - - Recommended interventions - - Counterfactual scenarios explored - - Optimal solution with causal justification - - Confidence levels and limitations - """ - - return self.agent.run(synthesis_prompt) - - def get_causal_graph_visualization(self) -> str: - """Get a text representation of the causal graph.""" - if not self.causal_graph.nodes(): - return "Empty causal graph" - - lines = ["Causal Graph Structure:"] - lines.append(f"Nodes: {list(self.causal_graph.nodes())}") - lines.append("Edges:") - - for source, target in self.causal_graph.edges(): - edge_data = self.causal_graph[source][target] - strength = edge_data.get('strength', 1.0) - relation_type = edge_data.get('relation_type', CausalRelationType.DIRECT).value - lines.append(f" {source} -> {target} (strength: {strength}, type: {relation_type})") - - return "\n".join(lines) - - def analyze_cascading_chain_reaction( - self, - initial_intervention: Dict[str, float], - target_outcomes: List[str], - max_hops: int = 5, - include_feedback_loops: bool = True, - num_iterations: int = 3, - ) -> Dict[str, Any]: - """ - Analyze multi-layer cascading chain reactions from an intervention. - - Example: "If X affects Y, how does it cascade through Z→alpha→...→back to X?" 
- - Args: - initial_intervention: {variable: value} intervention to analyze - target_outcomes: Variables to trace effects to - max_hops: Maximum path length to consider - include_feedback_loops: Whether to iterate for feedback effects - num_iterations: Number of propagation iterations (for cycles) - - Returns: - Dict with causal paths, cascade probabilities, and cumulative effects - """ - # Find all paths from intervention variables to outcomes - intervention_vars = list(initial_intervention.keys()) - all_paths: Dict[str, List[List[str]]] = {} - - for inter_var in intervention_vars: - for outcome in target_outcomes: - if outcome == inter_var: - continue - - # Find all simple paths (no cycles) - try: - simple_paths = list(nx.all_simple_paths( - self.causal_graph, - inter_var, - outcome, - cutoff=max_hops - )) - if simple_paths: - all_paths[f"{inter_var}->{outcome}"] = simple_paths - except nx.NetworkXNoPath: - pass - - # Find feedback loops (paths that eventually return to intervention vars) - feedback_paths: List[List[str]] = [] - if include_feedback_loops: - for inter_var in intervention_vars: - try: - # Find cycles through inter_var - cycles = list(nx.simple_cycles(self.causal_graph)) - for cycle in cycles: - if inter_var in cycle: - # Rotate cycle to start at inter_var - idx = cycle.index(inter_var) - rotated = cycle[idx:] + cycle[:idx] + [inter_var] - feedback_paths.append(rotated) - except Exception: - pass - - # Multi-layer propagation with iterations - current_state = self._standardize_state(initial_intervention) - propagation_history: List[Dict[str, float]] = [current_state.copy()] - - for iteration in range(num_iterations): - next_state = current_state.copy() - - # Propagate through all nodes in topological order - for node in nx.topological_sort(self.causal_graph): - if node in initial_intervention and iteration == 0: - # Keep intervention value in first iteration - continue - - parents = list(self.causal_graph.predecessors(node)) - if not parents: - continue - - effect_z = 0.0 - for parent in parents: - parent_z = next_state.get(parent, current_state.get(parent, 0.0)) - edge_data = self.causal_graph[parent][node] - strength = edge_data.get('strength', 0.0) - effect_z += parent_z * strength - - next_state[node] = effect_z - - propagation_history.append(next_state.copy()) - current_state = next_state - - # Compute path strengths and probabilities - path_analyses: List[Dict[str, Any]] = [] - for path_key, paths in all_paths.items(): - for path in paths: - # Compute path strength (product of edge strengths) - path_strength = 1.0 - path_strengths_list = [] - for i in range(len(path) - 1): - u, v = path[i], path[i + 1] - edge_data = self.causal_graph[u][v] - strength = abs(edge_data.get('strength', 0.0)) - path_strength *= strength - path_strengths_list.append(strength) - - # Estimate cascade probability (stronger paths = more likely) - # Using softmax-style normalization - path_prob = min(0.95, path_strength * 0.5 + 0.05) - - path_analyses.append({ - "path": path, - "path_string": " → ".join(path), - "path_strength": float(path_strength), - "edge_strengths": path_strengths_list, - "cascade_probability": float(path_prob), - "hops": len(path) - 1, - }) - - # Feedback loop analysis - feedback_analyses: List[Dict[str, Any]] = [] - for cycle_path in feedback_paths[:10]: # Limit to top 10 cycles - cycle_strength = 1.0 - for i in range(len(cycle_path) - 1): - u, v = cycle_path[i], cycle_path[i + 1] - if self.causal_graph.has_edge(u, v): - strength = 
abs(self.causal_graph[u][v].get('strength', 0.0)) - cycle_strength *= strength - - feedback_analyses.append({ - "cycle": cycle_path, - "cycle_string": " → ".join(cycle_path), - "cycle_strength": float(cycle_strength), - "could_amplify": cycle_strength > 0.1, # Strong cycles can amplify - }) - - # Final state predictions (de-standardized) - final_predictions: Dict[str, float] = {} - for var in target_outcomes: - if var in propagation_history[-1]: - z_val = propagation_history[-1][var] - final_predictions[var] = self._destandardize_value(var, z_val) - else: - final_predictions[var] = 0.0 - - return { - "initial_intervention": initial_intervention, - "target_outcomes": target_outcomes, - "causal_paths": path_analyses, - "feedback_loops": feedback_analyses, - "propagation_history": [ - {k: self._destandardize_value(k, v) for k, v in state.items() if k in target_outcomes} - for state in propagation_history - ], - "final_predictions": final_predictions, - "summary": { - "total_paths_found": len(path_analyses), - "feedback_loops_detected": len(feedback_analyses), - "max_path_length": max([p["hops"] for p in path_analyses] + [0]), - "strongest_path": max(path_analyses, key=lambda x: x["path_strength"]) if path_analyses else None, - }, - } - - def multi_layer_whatif_analysis( - self, - scenarios: List[Dict[str, float]], - depth: int = 3, - ) -> Dict[str, Any]: - """ - Multi-layer "what-if" analysis: If X happens to Y, how would it affect? - Then: What are the chances of Z affecting alpha and causing chain reaction to X? - - Performs nested counterfactual reasoning across multiple layers. - - Args: - scenarios: List of intervention scenarios {variable: value} - depth: How many layers deep to analyze - - Returns: - Nested analysis with cascading effects and chain reaction probabilities - """ - results: List[Dict[str, Any]] = [] - - for scenario in scenarios: - # Layer 1: Direct effects - layer1_outcomes = self._predict_outcomes({}, scenario) - - # Identify affected variables (significant changes) - affected_vars = [ - var for var, val in layer1_outcomes.items() - if abs(val) > 0.01 # Threshold for "affected" - ] - - # Layer 2: What if affected vars change other things? 
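-            # Each affected variable is perturbed by 20% of its layer-1 value
-            # and re-propagated, so second-order effects (including loops back
-            # to the original intervention variables) become visible.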
- layer2_scenarios: List[Dict[str, float]] = [] - for affected_var in affected_vars[:5]: # Limit to top 5 - # Create scenario where this variable is perturbed - perturbation = { - affected_var: layer1_outcomes.get(affected_var, 0.0) * 1.2 # 20% perturbation - } - layer2_scenarios.append(perturbation) - - layer2_analyses: List[Dict[str, Any]] = [] - for layer2_scen in layer2_scenarios: - layer2_outcomes = self._predict_outcomes(layer1_outcomes, layer2_scen) - - # Check for chain reactions back to original intervention vars - chain_reactions: List[Dict[str, Any]] = [] - for orig_var in scenario.keys(): - if orig_var in layer2_outcomes: - # Chain reaction detected: original var affected by cascade - chain_reactions.append({ - "original_intervention": orig_var, - "chain_path": f"{list(layer2_scen.keys())[0]} → {orig_var}", - "effect_magnitude": abs(layer2_outcomes[orig_var] - layer1_outcomes.get(orig_var, 0.0)), - "could_cause_amplification": abs(layer2_outcomes[orig_var]) > abs(scenario.get(orig_var, 0.0)), - }) - - layer2_analyses.append({ - "layer2_scenario": layer2_scen, - "layer2_outcomes": layer2_outcomes, - "chain_reactions": chain_reactions, - }) - - # Layer 3+: Deep cascade analysis (if depth > 2) - cascade_analysis = None - if depth > 2: - # Use cascading chain reaction method - all_outcomes = set(layer1_outcomes.keys()) | set(layer2_analyses[0]["layer2_outcomes"].keys() if layer2_analyses else set()) - cascade_analysis = self.analyze_cascading_chain_reaction( - initial_intervention=scenario, - target_outcomes=list(all_outcomes)[:10], # Top 10 outcomes - max_hops=5, - include_feedback_loops=True, - num_iterations=depth, - ) - - results.append({ - "scenario": scenario, - "layer1_direct_effects": layer1_outcomes, - "affected_variables": affected_vars, - "layer2_cascades": layer2_analyses, - "deep_cascade": cascade_analysis, - "chain_reaction_summary": { - "total_chain_reactions": sum(len(l2.get("chain_reactions", [])) for l2 in layer2_analyses), - "potential_amplifications": sum( - 1 for l2 in layer2_analyses - for cr in l2.get("chain_reactions", []) - if cr.get("could_cause_amplification", False) - ), - }, - }) - - return { - "multi_layer_analysis": results, - "summary": { - "total_scenarios": len(results), - "avg_chain_reactions_per_scenario": np.mean([ - r["chain_reaction_summary"]["total_chain_reactions"] for r in results - ]) if results else 0.0, - "scenarios_with_amplification": sum( - 1 for r in results - if r["chain_reaction_summary"]["potential_amplifications"] > 0 - ), - }, - } - - def deep_root_cause_analysis( - self, - problem_variable: str, - max_depth: int = 20, - min_path_strength: float = 0.01, - ) -> Dict[str, Any]: - """ - Infinitely nested root cause analysis: trace backwards to find absolute deepest causes. - - Keeps going deeper until hitting exogenous nodes or circular dependencies. - Finds the ultimate root causes that, if intervened, would solve the problem. 
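-
-        Example (illustrative; assumes a fitted chain
-        budget -> staffing -> quality in the graph):
-
-            >>> result = agent.deep_root_cause_analysis("quality")
-            >>> [rc["root_cause"] for rc in result["ultimate_root_causes"]]  # e.g. ['budget']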
- - Args: - problem_variable: Variable we want to fix/understand - max_depth: Maximum backward tracing depth (safety limit) - min_path_strength: Minimum edge strength to consider - - Returns: - Root causes, causal paths, intervention opportunities - """ - if problem_variable not in self.causal_graph: - return {"error": f"Variable {problem_variable} not in causal graph"} - - # Backward tracing: find all ancestors (potential root causes) - all_ancestors = list(nx.ancestors(self.causal_graph, problem_variable)) - - # Trace paths from each ancestor to problem - root_causes: List[Dict[str, Any]] = [] - paths_to_problem: List[Dict[str, Any]] = [] - - for ancestor in all_ancestors: - try: - # Find all paths from ancestor to problem - paths = list(nx.all_simple_paths( - self.causal_graph, - ancestor, - problem_variable, - cutoff=max_depth - )) - - if paths: - # Compute path strength for each path - # Mathematical formulation: Path strength = ∏(i,j)∈Path |β_ij| - # where β_ij is the causal effect (structural coefficient) from i to j - # This follows Pearl's Structural Causal Model (SCM) path product rule - for path in paths: - # Initialize with multiplicative identity (1.0) - # Path strength represents cumulative causal effect along chain - path_strength = 1.0 - path_details = [] - - for i in range(len(path) - 1): - u, v = path[i], path[i + 1] - edge_data = self.causal_graph[u][v] - # β_ij: structural coefficient from Pearl's SCM framework - beta_ij = edge_data.get('strength', 0.0) # β_ij (signed) - strength = abs(beta_ij) # |β_ij|: magnitude for threshold check - - # Filter by minimum effect size (power analysis threshold) - # If any edge is too weak, path strength becomes 0 - if strength < min_path_strength: - path_strength = 0.0 - break - - # Multiplicative path strength: ∏(i,j)∈Path β_ij - # This follows chain rule of differentiation and causal mediation analysis - # IMPORTANT: Use signed β_ij (not |β_ij|) to preserve sign in product - # Total effect = β₁₂ · β₂₃ · ... 
· βₖ₋₁ₖ (product preserves sign)
-                            path_strength *= beta_ij  # Multiply by signed coefficient
-                            path_details.append({
-                                "edge": f"{u}→{v}",
-                                "strength": strength,
-                                "structural_coefficient": float(edge_data.get('strength', 0.0)),
-                            })
-
-                        # Keep any path that survived the weak-edge filter; the
-                        # signed product may legitimately be negative (an odd
-                        # number of inhibitory edges), so test magnitude, not sign.
-                        if abs(path_strength) > 0.0:
-                            # Check if ancestor is exogenous (true root cause)
-                            ancestors_of_ancestor = list(nx.ancestors(self.causal_graph, ancestor))
-                            is_exogenous = len(ancestors_of_ancestor) == 0
-
-                            root_causes.append({
-                                "root_cause": ancestor,
-                                "is_exogenous": is_exogenous,
-                                "path_to_problem": path,
-                                "path_string": " → ".join(path),
-                                "path_strength": float(path_strength),
-                                "depth": len(path) - 1,
-                                "path_details": path_details,
-                            })
-
-                            paths_to_problem.append({
-                                "from": ancestor,
-                                "to": problem_variable,
-                                "path": path,
-                                "strength": float(path_strength),
-                            })
-            except Exception:
-                continue
-
-        # Rank root causes using multi-objective optimization criteria
-        # Objective: maximize f(rc) = w1·I_exo(rc) + w2·|S_path(rc)| - w3·D(rc)
-        # where I_exo is an indicator, S_path the signed path strength, D the depth
-        # Lexicographic ordering: exogenous > |path_strength| > -depth
-        root_causes.sort(
-            key=lambda x: (
-                -x["is_exogenous"],  # Exogenous first (lexicographic priority)
-                -abs(x["path_strength"]),  # Larger causal magnitude first
-                x["depth"]  # Shorter paths first (minimize intervention distance)
-            )
-        )
-
-        # Find ultimate root causes (those with no ancestors, or only circular ones)
-        ultimate_roots = [
-            rc for rc in root_causes
-            if rc["is_exogenous"] or rc["depth"] >= max_depth - 2
-        ]
-
-        return {
-            "problem_variable": problem_variable,
-            "all_root_causes": root_causes[:20],  # Top 20
-            "ultimate_root_causes": ultimate_roots[:10],  # Top 10 ultimate
-            "total_paths_found": len(paths_to_problem),
-            "max_depth_reached": max([rc["depth"] for rc in root_causes] + [0]),
-            "intervention_opportunities": [
-                {
-                    "intervene_on": rc["root_cause"],
-                    "expected_impact_on_problem": rc["path_strength"],
-                    "depth": rc["depth"],
-                    "is_exogenous": rc["is_exogenous"],
-                }
-                for rc in root_causes[:10]
-            ],
-        }
-
-    def explore_alternate_realities(
-        self,
-        factual_state: Dict[str, float],
-        target_outcome: str,
-        target_value: Optional[float] = None,
-        max_realities: int = 50,
-        max_interventions: int = 3,
-    ) -> Dict[str, Any]:
-        """
-        Explore multiple alternate realities to find interventions that achieve the best outcome.
-
-        Searches the intervention space for combinations that optimize the target outcome,
-        simulating many possible realities and keeping the best.
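-
-        Example (illustrative; "price" and "revenue" are hypothetical nodes
-        of a fitted graph):
-
-            >>> best = agent.explore_alternate_realities(
-            ...     factual_state={"price": 10.0, "revenue": 100.0},
-            ...     target_outcome="revenue",
-            ...     max_realities=20,
-            ... )["best_reality"]
-            >>> best["interventions"], best["target_value"]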
- - Args: - factual_state: Current state - target_outcome: Variable to optimize - target_value: Desired value (if None, maximize) - max_realities: Number of alternate scenarios to explore - max_interventions: Max number of simultaneous interventions - - Returns: - Best interventions, alternate realities explored, optimal outcome - """ - if target_outcome not in self.causal_graph: - return {"error": f"Target {target_outcome} not in graph"} - - # Get intervention candidates (nodes with out-edges) - intervention_candidates = [ - node for node in self.causal_graph.nodes() - if len(list(self.causal_graph.successors(node))) > 0 - and node not in [target_outcome] - ] - - realities: List[Dict[str, Any]] = [] - - # Sample intervention combinations - for _ in range(max_realities): - # Random intervention set - num_interventions = self.rng.integers(1, max_interventions + 1) - selected = self.rng.choice(intervention_candidates, size=min(num_interventions, len(intervention_candidates)), replace=False) - - # Generate intervention values (standardized perturbations) - intervention: Dict[str, float] = {} - for var in selected: - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - current = factual_state.get(var, stats["mean"]) - # Perturb by ±2 standard deviations - perturbation = self.rng.normal(0, stats["std"] * 2.0) - intervention[var] = current + perturbation - - # Predict outcome - outcome = self._predict_outcomes(factual_state, intervention) - target_val = outcome.get(target_outcome, 0.0) - - # Compute objective using L2 norm (Euclidean distance) or direct maximization - # Objective function: O(θ) = -||y(θ) - y*||₂ if target specified, else O(θ) = y(θ) - # where θ = intervention vector, y(θ) = predicted outcome, y* = target value - if target_value is not None: - # For single-dimensional: use L1 norm ||y - y*||₁ = |y - y*| - # For multi-dimensional would use: ||y - y*||₂ = √(Σ(y_i - y*_i)²) - # Negative sign for maximization (minimize distance = maximize negative distance) - distance = abs(target_val - target_value) # L1 norm: |y - y*| - objective = -distance # Negative distance (better = less distance) - else: - # Direct maximization: O(θ) = y(θ) (no target, just maximize outcome) - objective = target_val # Maximize - - realities.append({ - "interventions": intervention, - "outcome": outcome, - "target_value": target_val, - "objective": float(objective), - "delta_from_factual": target_val - factual_state.get(target_outcome, 0.0), - }) - - # Sort by objective (best first) - realities.sort(key=lambda x: x["objective"], reverse=True) - - # Best reality - best = realities[0] if realities else None - - # Pareto frontier (if multi-objective) - pareto_realities = [] - if len(realities) > 1: - # Simple Pareto: if reality A is better on target and not worse on others - for r in realities[:20]: # Top 20 - is_dominated = False - for other in realities: - if other is r: - continue - # Check if other dominates - if (other["objective"] >= r["objective"] and - other["delta_from_factual"] >= r["delta_from_factual"] and - (other["objective"] > r["objective"] or other["delta_from_factual"] > r["delta_from_factual"])): - is_dominated = True - break - if not is_dominated: - pareto_realities.append(r) - - return { - "factual_state": factual_state, - "target_outcome": target_outcome, - "target_value": target_value, - "best_reality": best, - "top_10_realities": realities[:10], - "pareto_frontier": pareto_realities[:10], - "all_realities_explored": len(realities), - "improvement_potential": ( - 
best["target_value"] - factual_state.get(target_outcome, 0.0) - if best else 0.0 - ), - } - - def historical_pattern_matching( - self, - current_state: Dict[str, float], - intervention_history: List[Dict[str, float]], - outcome_history: List[Dict[str, float]], - target_outcome: str, - similarity_threshold: float = 0.7, - ) -> Dict[str, Any]: - """ - Learn from historical interventions: reuse old reactions to create new ones. - - Finds past interventions in similar states that achieved good outcomes, - then adapts them to current state. - - Args: - current_state: Current factual state - intervention_history: List of past interventions - outcome_history: List of past outcomes (corresponding to interventions) - target_outcome: Variable to optimize - similarity_threshold: How similar states must be to reuse - - Returns: - Matched historical patterns, adapted interventions, learned strategies - """ - if len(intervention_history) != len(outcome_history) or len(intervention_history) == 0: - return {"error": "Invalid history or empty"} - - # Compute state similarity (cosine similarity in standardized space) - z_current = self._standardize_state(current_state) - matches: List[Dict[str, Any]] = [] - - for i, (intervention, outcome) in enumerate(zip(intervention_history, outcome_history)): - # Standardize historical outcome (treated as "state") - z_past = self._standardize_state(outcome) - - # Compute similarity (cosine similarity) - common_vars = set(z_current.keys()) & set(z_past.keys()) - if len(common_vars) == 0: - continue - - vec_current = np.array([z_current[v] for v in common_vars]) - vec_past = np.array([z_past[v] for v in common_vars]) - - # Cosine similarity (normalized inner product): cos(θ) = (A·B)/(||A||₂·||B||₂) - # This measures angle between vectors in standardized space - # Range: [-1, 1], where 1 = identical direction, 0 = orthogonal, -1 = opposite - norm_current = np.linalg.norm(vec_current) # L2 norm: ||v||₂ = √(Σv_i²) - norm_past = np.linalg.norm(vec_past) - - if norm_current < 1e-6 or norm_past < 1e-6: - similarity = 0.0 # Zero vectors have undefined similarity - else: - # Cosine similarity formula: cos(θ) = (v₁·v₂)/(||v₁||₂·||v₂||₂) - similarity = float(np.dot(vec_current, vec_past) / (norm_current * norm_past)) - - if similarity >= similarity_threshold: - # Historical outcome value for target - target_past = outcome.get(target_outcome, 0.0) - target_current = current_state.get(target_outcome, 0.0) - - # Did this intervention improve the target? 
- improvement = target_past - target_current - - matches.append({ - "historical_index": i, - "similarity": similarity, - "past_intervention": intervention, - "past_outcome": outcome, - "target_improvement": float(improvement), - "was_successful": improvement > 0.0, - }) - - # Sort by similarity and success - matches.sort( - key=lambda x: (x["similarity"], x["target_improvement"]), - reverse=True - ) - - # Adapt best historical interventions to current state - adapted_interventions: List[Dict[str, Any]] = [] - for match in matches[:5]: # Top 5 matches - past_intervention = match["past_intervention"] - - # Adapt: scale by similarity and current context - adapted = {} - for var, val in past_intervention.items(): - # Adjust based on current state difference - current_val = current_state.get(var, 0.0) - past_val = past_intervention.get(var, 0.0) - - # Blend: similarity-weighted historical value + current baseline - adaptation_factor = match["similarity"] - adapted[var] = float( - current_val * (1.0 - adaptation_factor) + - past_val * adaptation_factor - ) - - # Predict outcome of adapted intervention - predicted = self._predict_outcomes(current_state, adapted) - predicted_target = predicted.get(target_outcome, 0.0) - - adapted_interventions.append({ - "source_match": match, - "adapted_intervention": adapted, - "predicted_outcome": predicted, - "predicted_target_value": float(predicted_target), - "expected_improvement": float(predicted_target - current_state.get(target_outcome, 0.0)), - }) - - # Extract learned strategy patterns - successful_interventions = [m for m in matches if m["was_successful"]] - learned_patterns: List[Dict[str, Any]] = [] - - if successful_interventions: - # Common variables in successful interventions - all_vars = set() - for m in successful_interventions: - all_vars.update(m["past_intervention"].keys()) - - for var in all_vars: - successful_vals = [ - m["past_intervention"].get(var, 0.0) - for m in successful_interventions - if var in m["past_intervention"] - ] - if successful_vals: - learned_patterns.append({ - "variable": var, - "typical_successful_value": float(np.mean(successful_vals)), - "value_range": [float(min(successful_vals)), float(max(successful_vals))], - "success_frequency": len(successful_vals) / len(successful_interventions), - }) - - return { - "current_state": current_state, - "historical_matches": matches[:10], - "best_matches": matches[:5], - "adapted_interventions": adapted_interventions, - "learned_patterns": learned_patterns, - "recommended_intervention": adapted_interventions[0]["adapted_intervention"] if adapted_interventions else {}, - "strategy_confidence": float(np.mean([m["similarity"] for m in matches[:5]])) if matches else 0.0, - } - - def infinite_nesting_root_cause( - self, - problem: str, - stop_condition: Optional[Callable[[str, int], bool]] = None, - ) -> Dict[str, Any]: - """ - Infinitely nested root cause analysis: keeps going deeper until hitting true roots. - - Unlike deep_root_cause_analysis which has max_depth, this continues until - hitting exogenous nodes or user-defined stop condition. 
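-
-        Example (illustrative; the lambda stops the backward trace three
-        levels above the problem variable):
-
-            >>> result = agent.infinite_nesting_root_cause(
-            ...     "quality",
-            ...     stop_condition=lambda node, depth: depth >= 3,
-            ... )
-            >>> result["optimal_intervention_targets"][:3]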
- - Args: - problem: Variable to trace backwards from - stop_condition: Function(node, depth) -> bool to stop tracing - - Returns: - Ultimate root causes, full causal tree, intervention strategy - """ - if problem not in self.causal_graph: - return {"error": f"Problem {problem} not in graph"} - - visited: set = set() - causal_tree: List[Dict[str, Any]] = [] - root_nodes: List[str] = [] - - def trace_backwards(node: str, depth: int, path: List[str]) -> None: - """Recursive backward tracing.""" - if node in visited or depth > 100: # Safety limit - return - - visited.add(node) - - # Check stop condition - if stop_condition and stop_condition(node, depth): - root_nodes.append(node) - causal_tree.append({ - "node": node, - "depth": depth, - "path_to_problem": path + [node], - "is_stopped_by_condition": True, - }) - return - - # Get parents (causes) - parents = list(self.causal_graph.predecessors(node)) - - if len(parents) == 0: - # Exogenous node - true root cause - root_nodes.append(node) - causal_tree.append({ - "node": node, - "depth": depth, - "path_to_problem": path + [node], - "is_exogenous": True, - }) - return - - # Recursively trace parents - for parent in parents: - edge_data = self.causal_graph[parent][node] - strength = abs(edge_data.get('strength', 0.0)) - - causal_tree.append({ - "node": node, - "parent": parent, - "edge_strength": float(strength), - "depth": depth, - "path_to_problem": path + [node], - }) - - trace_backwards(parent, depth + 1, path + [node]) - - # Start tracing from problem - trace_backwards(problem, 0, []) - - # Unique root nodes - unique_roots = list(set(root_nodes)) - - # Build intervention strategy (intervene on shallowest exogenous nodes) - root_depths = { - root: min([ct["depth"] for ct in causal_tree if ct.get("node") == root or ct.get("parent") == root] + [999]) - for root in unique_roots - } - optimal_roots = sorted(unique_roots, key=lambda x: root_depths.get(x, 999))[:10] - - return { - "problem": problem, - "ultimate_root_causes": unique_roots, - "optimal_intervention_targets": optimal_roots, - "causal_tree": causal_tree, - "max_depth_reached": max([ct["depth"] for ct in causal_tree] + [0]), - "total_nodes_explored": len(visited), - } - - def optimal_intervention_sequence( - self, - initial_state: Dict[str, float], - target_outcomes: Dict[str, float], - max_steps: int = 5, - horizon: int = 10, - ) -> Dict[str, Any]: - """ - Find optimal sequence of interventions to achieve target outcomes. - - Uses dynamic programming / tree search to find best intervention sequence - that alters future reactions for optimal outcome. 
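-
-        Example (illustrative; hypothetical price/demand system with fitted
-        standardization stats):
-
-            >>> plan = agent.optimal_intervention_sequence(
-            ...     initial_state={"price": 10.0, "demand": 100.0},
-            ...     target_outcomes={"demand": 120.0},
-            ...     max_steps=3,
-            ... )
-            >>> plan["target_achievements"]["demand"]["achieved"]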
- - Args: - initial_state: Starting state - target_outcomes: {variable: target_value} to achieve - max_steps: Maximum intervention steps - horizon: How far ahead to optimize - - Returns: - Optimal intervention sequence, expected trajectory, outcome probability - """ - # Intervention candidates - candidates = [ - node for node in self.causal_graph.nodes() - if len(list(self.causal_graph.successors(node))) > 0 - and node not in target_outcomes.keys() - ] - - # Optimal control problem: find sequence {u₀, u₁, ..., uₜ} that minimizes cost - # Cost function: J = Σₜ L(xₜ, uₜ) + Φ(xₜ) where L is stage cost, Φ is terminal cost - # Subject to: xₜ₊₁ = f(xₜ, uₜ) (system dynamics) - # Using greedy approximation (could be upgraded to Bellman optimality: V*(x) = min_u[L(x,u) + V*(f(x,u))]) - best_sequence: List[Dict[str, float]] = [] - best_final_state: Dict[str, float] = initial_state.copy() - best_objective = float("-inf") - - current_state = initial_state.copy() - - for step in range(max_steps): - # Find best single intervention at this step (greedy policy) - # Greedy: u*_t = argmin_u E[L(xₜ₊₁, u) | xₜ] (one-step lookahead) - best_step_intervention: Optional[Dict[str, float]] = None - best_step_objective = float("-inf") - - # Sample candidate interventions (Monte Carlo policy search) - # Alternative: gradient-based optimization using ∇ᵤJ - for _ in range(20): # Explore 20 candidates per step - var = self.rng.choice(candidates) - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - current_val = current_state.get(var, stats["mean"]) - - # Try perturbation: u = u₀ + ε where ε ~ N(0, σ²) - # This implements exploration in policy space - intervention = {var: current_val + self.rng.normal(0, stats["std"] * 1.5)} - - # Simulate forward (system dynamics): xₜ₊₁ = f(xₜ, uₜ) - predicted = self._predict_outcomes(current_state, intervention) - - # Multi-step lookahead (horizon H): simulate xₜ₊₁, xₜ₊₂, ..., xₜ₊ₕ - # This approximates value function: V^π(x) = E[Σₖ₌₀ᴴ γᵏ·rₜ₊ₖ] - state_after = predicted.copy() - for h in range(1, horizon): - # Further interventions (optional, could use optimal policy π*(x)) - state_after = self._predict_outcomes(state_after, {}) - - # Compute objective: multi-target cost function - # Cost: J(u) = Σⱼ |yⱼ(u) - y*ⱼ| (L1 norm, sum of absolute errors) - # Alternative L2: J(u) = √(Σⱼ (yⱼ(u) - y*ⱼ)²) (Euclidean distance) - # We use L1 for computational simplicity, can be upgraded to L2 - # Minimize: argmin_u J(u) subject to constraints - # Since we maximize objective, use negative cost: O = -J(u) - objective = 0.0 - for target_var, target_val in target_outcomes.items(): - if target_var in state_after: - # L1 distance (absolute error): |y - y*| - # For multi-dimensional: ||y - y*||₁ = Σⱼ |yⱼ - y*ⱼ| - distance = abs(state_after[target_var] - target_val) # L1 norm component - objective -= distance # Accumulate negative L1 distance (minimize error = maximize objective) - - if objective > best_step_objective: - best_step_objective = objective - best_step_intervention = intervention - - if best_step_intervention: - best_sequence.append(best_step_intervention) - # Update state - current_state = self._predict_outcomes(current_state, best_step_intervention) - else: - break - - # Full trajectory simulation - trajectory: List[Dict[str, float]] = [initial_state.copy()] - state = initial_state.copy() - for intervention in best_sequence: - state = self._predict_outcomes(state, intervention) - trajectory.append(state.copy()) - - # Final outcome assessment using relative error metric - 
# Relative error: ε_rel = |y_actual - y_target| / |y_target| - # Success criterion: ε_rel < 0.1 (within 10% tolerance) - final_objective = 0.0 - target_achievements: Dict[str, float] = {} - for target_var, target_val in target_outcomes.items(): - if target_var in trajectory[-1]: - actual = trajectory[-1][target_var] - # Absolute error: ε_abs = |y_actual - y_target| - distance = abs(actual - target_val) - # Relative error: ε_rel = ε_abs / |y_target| (normalized by target magnitude) - relative_error = distance / abs(target_val) if abs(target_val) > 1e-6 else distance - target_achievements[target_var] = { - "target": target_val, - "actual": actual, - "distance": distance, - "relative_error": float(relative_error), - "achieved": distance < abs(target_val * 0.1), # Within 10% tolerance: ε_rel < 0.1 - } - # Aggregate objective: J_total = -Σⱼ ε_absⱼ (minimize total error) - final_objective -= distance - - return { - "optimal_sequence": best_sequence, - "trajectory": trajectory, - "final_state": trajectory[-1] if trajectory else initial_state, - "target_achievements": target_achievements, - "objective": float(final_objective), - "sequence_length": len(best_sequence), - } - - def meta_learn_intervention_strategy( - self, - historical_interventions: List[Dict[str, float]], - historical_outcomes: List[Dict[str, float]], - historical_contexts: List[Dict[str, float]], - ) -> Dict[str, Any]: - """ - Meta-learn how to intervene: learn from past to create optimal future interventions. - - Identifies patterns in successful interventions across different contexts, - then uses this knowledge to design new interventions. - - Args: - historical_interventions: Past interventions - historical_outcomes: Corresponding outcomes - historical_contexts: States when interventions were applied - - Returns: - Learned intervention strategy, pattern rules, meta-knowledge - """ - if not (len(historical_interventions) == len(historical_outcomes) == len(historical_contexts)): - return {"error": "History lengths must match"} - - # Classify interventions by outcome quality - intervention_classes: List[Dict[str, Any]] = [] - - for i, (intervention, outcome, context) in enumerate(zip( - historical_interventions, historical_outcomes, historical_contexts - )): - # Compute outcome quality (simple: sum of positive changes) - quality = sum([ - max(0.0, outcome.get(k, 0.0) - context.get(k, 0.0)) - for k in outcome.keys() - ]) - - intervention_classes.append({ - "index": i, - "intervention": intervention, - "context": context, - "outcome": outcome, - "quality": float(quality), - "is_successful": quality > 0.0, - }) - - # Extract patterns from successful interventions - successful = [ic for ic in intervention_classes if ic["is_successful"]] - unsuccessful = [ic for ic in intervention_classes if not ic["is_successful"]] - - # Pattern: what interventions work in what contexts? 
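-        # For each variable that appears in a successful intervention, record
-        # the average value used and the average context in which it worked;
-        # these (value, context) pairs become the reusable rules below.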
- learned_rules: List[Dict[str, Any]] = [] - - if successful: - # For each intervention variable, find context patterns - all_intervention_vars = set() - for ic in successful: - all_intervention_vars.update(ic["intervention"].keys()) - - for var in all_intervention_vars: - successful_vals = [ - ic["intervention"].get(var, 0.0) - for ic in successful - if var in ic["intervention"] - ] - - # Context conditions (simplified: avg context where this worked) - contexts_when_successful = [ - ic["context"] - for ic in successful - if var in ic["intervention"] - ] - - if successful_vals and contexts_when_successful: - # Average successful intervention value - avg_successful_val = float(np.mean(successful_vals)) - - # Average context when this worked - context_vars = set() - for ctx in contexts_when_successful: - context_vars.update(ctx.keys()) - - avg_context = { - k: float(np.mean([ctx.get(k, 0.0) for ctx in contexts_when_successful])) - for k in context_vars - } - - learned_rules.append({ - "intervention_variable": var, - "recommended_value": avg_successful_val, - "typical_context": avg_context, - "success_rate": len(successful_vals) / len(historical_interventions), - "confidence": float(min(1.0, len(successful_vals) / 5.0)), # Higher with more examples - }) - - # Meta-strategy: when to use which intervention pattern - strategy: Dict[str, Any] = { - "learned_rules": learned_rules, - "success_rate": len(successful) / len(intervention_classes) if intervention_classes else 0.0, - "pattern_count": len(learned_rules), - "most_effective_interventions": sorted( - learned_rules, - key=lambda x: (x["confidence"], x["success_rate"]), - reverse=True - )[:5], - } - - return strategy - - def recursive_alternate_reality_search( - self, - current_state: Dict[str, float], - target: str, - depth: int = 0, - max_depth: int = 10, - path: List[Dict[str, float]] = None, - best_found: Optional[Dict[str, Any]] = None, - ) -> Dict[str, Any]: - """ - Recursively search alternate realities, nesting as deep as needed. - - Explores intervention tree recursively to find absolute best outcome. - Each reality branches into more realities, creating infinite nesting. 
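-
-        Example (illustrative; depth kept small because branching grows
-        exponentially):
-
-            >>> tree = agent.recursive_alternate_reality_search(
-            ...     current_state={"price": 10.0, "demand": 100.0},
-            ...     target="demand",
-            ...     max_depth=3,
-            ... )
-            >>> tree["target_value"], len(tree["path"])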
- - Args: - current_state: Current state in this branch - target: Variable to optimize - depth: Current recursion depth - max_depth: Maximum depth (safety) - path: Intervention path to reach this state - best_found: Best outcome found so far (for pruning) - - Returns: - Best reality found, full search tree, optimal path - """ - if path is None: - path = [] - - if depth >= max_depth: - # Leaf: evaluate this reality - target_val = current_state.get(target, 0.0) - return { - "state": current_state, - "path": path, - "target_value": float(target_val), - "depth": depth, - "is_leaf": True, - } - - # Get intervention candidates - candidates = [ - node for node in self.causal_graph.nodes() - if len(list(self.causal_graph.successors(node))) > 0 - and node != target - ] - - # Branch: explore multiple interventions from this state - branches: List[Dict[str, Any]] = [] - best_branch = None - best_target = float("-inf") - - # Limit branching to avoid explosion - num_branches = min(5, len(candidates)) - selected = self.rng.choice(candidates, size=num_branches, replace=False) if len(candidates) > 0 else [] - - for var in selected: - # Create intervention - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - current_val = current_state.get(var, stats["mean"]) - intervention = {var: current_val + self.rng.normal(0, stats["std"] * 1.0)} - - # Predict next state - next_state = self._predict_outcomes(current_state, intervention) - - # Recursively explore - branch_result = self.recursive_alternate_reality_search( - current_state=next_state, - target=target, - depth=depth + 1, - max_depth=max_depth, - path=path + [intervention], - best_found=best_found, - ) - - branches.append({ - "intervention": intervention, - "result": branch_result, - }) - - # Update best - branch_target = branch_result.get("target_value", float("-inf")) - if branch_target > best_target: - best_target = branch_target - best_branch = branch_result - - # Return best path - return { - "state": current_state, - "path": path, - "branches": branches, - "best_branch": best_branch, - "target_value": best_target, - "depth": depth, - "is_leaf": False, - } - - def probabilistic_nested_simulation( - self, - initial_state: Dict[str, float], - interventions: Dict[str, float], - num_samples: int = 100, - nesting_depth: int = 5, - uncertainty_propagation: bool = True, - ) -> Dict[str, Any]: - """ - Probabilistic nested simulation: branch on uncertainty at each layer. - - Each nesting level considers multiple probabilistic outcomes, - creating a tree of possible futures with probabilities. 
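-
-        Example (illustrative; small sample counts keep the tree tractable):
-
-            >>> sim = agent.probabilistic_nested_simulation(
-            ...     initial_state={"price": 10.0, "demand": 100.0},
-            ...     interventions={"price": 12.0},
-            ...     num_samples=25,
-            ...     nesting_depth=2,
-            ... )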
- - Args: - initial_state: Starting state - interventions: Initial interventions - num_samples: Monte Carlo samples per nesting level - nesting_depth: How many layers to nest - uncertainty_propagation: Whether to propagate uncertainty through edges - - Returns: - Probabilistic outcome tree, expected values, confidence intervals - """ - # Bootstrap edge strength uncertainty using coefficient of variation - # CV = σ/μ (coefficient of variation), where σ is standard deviation, μ is mean - # Uncertainty quantification: σ_β = CV · |β|, following asymptotic normality - # Under CLT, β̂ ~ N(β, σ²_β) for large samples - edge_uncertainty: Dict[Tuple[str, str], float] = {} - for u, v in self.causal_graph.edges(): - strength = abs(self.causal_graph[u][v].get('strength', 0.0)) - # Assume 20% coefficient of variation (CV = 0.2) - # Standard error: SE(β) = CV · |β| = 0.2 · |β| - # This models uncertainty from estimation variance - edge_uncertainty[(u, v)] = strength * 0.2 - - # Nested simulation tree - simulation_tree: List[Dict[str, Any]] = [] - - def simulate_level( - state: Dict[str, float], - interventions_at_level: Dict[str, float], - level: int, - parent_probability: float = 1.0, - ) -> Dict[str, Any]: - """Recursive probabilistic simulation.""" - if level >= nesting_depth: - return { - "level": level, - "state": state, - "probability": parent_probability, - "is_leaf": True, - } - - # Sample edge strengths with uncertainty - outcomes: List[Dict[str, float]] = [] - outcome_probs: List[float] = [] - - for _ in range(num_samples): - # Perturb edge strengths - perturbed_state = state.copy() - - # Predict with uncertainty - z_state = self._standardize_state({**state, **interventions_at_level}) - z_pred = dict(z_state) - - # Propagate with uncertain edges - for node in nx.topological_sort(self.causal_graph): - if node in interventions_at_level: - continue - - parents = list(self.causal_graph.predecessors(node)) - if not parents: - continue - - effect_z = 0.0 - for parent in parents: - parent_z = z_pred.get(parent, z_state.get(parent, 0.0)) - base_strength = self.causal_graph[parent][node].get('strength', 0.0) - # Uncertainty propagation using normal distribution - # β_sample ~ N(μ_β, σ²_β) where μ_β = base_strength, σ²_β = uncertainty² - # This follows Bayesian posterior sampling or bootstrap sampling - if uncertainty_propagation: - uncertainty = edge_uncertainty.get((parent, node), 0.0) - # Monte Carlo sampling: β ~ N(μ_β, σ²_β) - # This propagates estimation uncertainty through causal structure - strength = float(self.rng.normal(base_strength, uncertainty)) - else: - strength = base_strength - effect_z += parent_z * strength - - z_pred[node] = effect_z - - # De-standardize - outcome = { - k: self._destandardize_value(k, v) - for k, v in z_pred.items() - if k in state or k in interventions_at_level - } - outcomes.append(outcome) - outcome_probs.append(1.0 / num_samples) # Uniform weights - - # Aggregate outcomes using sample statistics (Monte Carlo estimation) - # Expected value: E[Y] = (1/n)Σᵢ yᵢ where n is sample size - # This is the Monte Carlo estimate of the expectation - # Unbiased estimator: E[Ȳ] = E[Y] (sample mean is unbiased for population mean) - expected_outcome: Dict[str, float] = {} - all_vars = set.union(*[set(o.keys()) for o in outcomes]) if outcomes else set() - for var in all_vars: - # Collect all samples for this variable: {y₁, y₂, ..., yₙ} - vals = np.array([o.get(var, 0.0) for o in outcomes]) - n = len(vals) - if n > 0: - # Sample mean: ȳ = (1/n)Σᵢ₌₁ⁿ yᵢ - # E[Y] = lim_{n→∞} (1/n)Σᵢ 
yᵢ (Monte Carlo convergence) - expected_outcome[var] = float(np.mean(vals)) # E[Y] = (1/n)Σᵢ yᵢ - else: - expected_outcome[var] = 0.0 - - # Confidence intervals using quantile-based estimation (non-parametric) - # For 90% CI: CI₉₀ = [Q₀.₀₅, Q₀.₉₅] where Q_p is p-th quantile - # Non-parametric: no distributional assumptions - # Alternative (parametric, if normal): CI = [μ̂ - z₀.₀₅·SE, μ̂ + z₀.₀₅·SE] - # where z₀.₀₅ ≈ 1.645 for 90% CI (two-tailed: 5% in each tail) - ci90_outcome: Dict[str, Tuple[float, float]] = {} - for var in expected_outcome.keys(): - vals = np.array([o.get(var, 0.0) for o in outcomes]) - n = len(vals) - if n > 0: - # Non-parametric 90% CI: [Q₀.₀₅, Q₀.₉₅] - # Quantile function: Q(p) = inf{x : P(X ≤ x) ≥ p} - # 5th percentile (lower bound): Q₀.₀₅ - # 95th percentile (upper bound): Q₀.₉₅ - ci90_outcome[var] = ( - float(np.quantile(vals, 0.05)), # Lower bound: Q₀.₀₅ = 5th percentile - float(np.quantile(vals, 0.95)), # Upper bound: Q₀.₉₅ = 95th percentile - ) - else: - ci90_outcome[var] = (0.0, 0.0) - - # Recursively nest for next level - child_nodes: List[Dict[str, Any]] = [] - if level < nesting_depth - 1: - # Create nested interventions based on outcomes - for outcome_sample in outcomes[:5]: # Top 5 outcomes - # Generate follow-up interventions - nested_interventions: Dict[str, float] = {} - # (Simplified: could use policy logic here) - - child = simulate_level( - state=outcome_sample, - interventions_at_level=nested_interventions, - level=level + 1, - parent_probability=parent_probability * (1.0 / num_samples), - ) - child_nodes.append(child) - - return { - "level": level, - "state": state, - "interventions": interventions_at_level, - "expected_outcome": expected_outcome, - "ci90": ci90_outcome, - "outcome_samples": outcomes[:10], # Top 10 - "probability": parent_probability, - "children": child_nodes, - "is_leaf": level >= nesting_depth - 1, - } - - root_node = simulate_level(initial_state, interventions, level=0) - simulation_tree.append(root_node) - - # Extract final outcomes (leaf nodes) - def collect_leaves(node: Dict[str, Any]) -> List[Dict[str, Any]]: - if node.get("is_leaf", False): - return [node] - leaves = [] - for child in node.get("children", []): - leaves.extend(collect_leaves(child)) - return leaves - - leaves = collect_leaves(root_node) - - return { - "simulation_tree": root_node, - "all_leaves": leaves, - "expected_final_outcomes": { - var: float(np.mean([l["state"].get(var, 0.0) for l in leaves])) - for var in set.union(*[set(l["state"].keys()) for l in leaves]) - }, - "total_paths": len(leaves), - "max_nesting_reached": nesting_depth, - } - - def adversarial_nested_analysis( - self, - intervention: Dict[str, float], - target: str, - adversary_objectives: List[str], - nesting_depth: int = 4, - ) -> Dict[str, Any]: - """ - Adversarial nesting: consider worst-case reactions that could undermine your intervention. - - Models how external forces or negative feedback might react to your actions, - then nests to find best intervention despite adversarial responses. 
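The uncertainty-propagation idea above, sample the edge strength as β ~ N(μ, (0.2·|μ|)²), push the samples through the model, and summarize with a mean plus 5th/95th percentiles, in a minimal standalone form:

```python
import numpy as np

rng = np.random.default_rng(1)

beta = 0.6                    # point estimate of an edge strength (toy value)
sigma_beta = 0.2 * abs(beta)  # 20% coefficient of variation, as assumed above
x = 1.5                       # standardized parent value

# Monte Carlo propagation: beta ~ N(mu, sigma^2), then y = beta * x per sample.
samples = rng.normal(beta, sigma_beta, size=10_000) * x

expected = samples.mean()            # E[Y] estimated by the sample mean
ci90 = (np.quantile(samples, 0.05),  # non-parametric 90% CI from quantiles
        np.quantile(samples, 0.95))
print(round(expected, 3), tuple(round(v, 3) for v in ci90))
```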
- - Args: - intervention: Your proposed intervention - target: Variable you want to optimize - adversary_objectives: Variables an adversary wants to minimize (worst-case) - nesting_depth: How many adversarial reaction layers to consider - - Returns: - Worst-case scenarios, robust interventions, adversarial paths - """ - # Adversary model: reacts to minimize adversary_objectives - adversarial_paths: List[Dict[str, Any]] = [] - - current_state = intervention.copy() - - for depth in range(nesting_depth): - # Your intervention at this depth - predicted_outcome = self._predict_outcomes({}, current_state) - - # Adversary reaction: find interventions that worsen adversary objectives - adversary_interventions: List[Dict[str, float]] = [] - - for adv_obj in adversary_objectives: - if adv_obj not in self.causal_graph: - continue - - # Find variables that affect adversary objective - affecting_vars = list(self.causal_graph.predecessors(adv_obj)) - - # Adversary intervenes to minimize this objective - for var in affecting_vars[:3]: # Top 3 - edge_data = self.causal_graph[var][adv_obj] - strength = edge_data.get('strength', 0.0) - - # Adversarial optimization: adversary minimizes your objective - # Adversary strategy: u_adv* = argmin_u_adv f(x, u, u_adv) - # Where f is your objective function, u is your intervention, u_adv is adversary's - # Gradient-based: u_adv ← u_adv - α·∇_{u_adv} f (gradient descent on negative objective) - # If positive strength, adversary reduces var; if negative, increases - current_val = predicted_outcome.get(var, 0.0) - # Adversarial perturbation: Δu = -sign(∂f/∂u)·η·|u| - # where η = 0.5 is step size, sign gives direction to worsen your objective - adversary_intervention = { - var: current_val - 0.5 * np.sign(strength) * abs(current_val) - } - adversary_interventions.append(adversary_intervention) - - # Worst-case outcome after adversary reaction - worst_outcomes: List[Dict[str, Any]] = [] - for adv_intervention in adversary_interventions: - combined = {**current_state, **adv_intervention} - worst_outcome = self._predict_outcomes({}, combined) - - # Adversary damage quantification using L1 norm - # Damage = ||y_worst - y_predicted||₁ = Σⱼ |yⱼ_worst - yⱼ_predicted| - # This measures magnitude of deviation from expected outcome - target_value = worst_outcome.get(target, 0.0) - # Aggregate damage across all adversary objectives (L1 norm) - adversary_damage = sum([ - abs(worst_outcome.get(obj, 0.0) - predicted_outcome.get(obj, 0.0)) - for obj in adversary_objectives - ]) - - worst_outcomes.append({ - "adversary_intervention": adv_intervention, - "outcome": worst_outcome, - "target_value": float(target_value), - "adversary_damage": float(adversary_damage), - }) - - # Sort by worst for target - worst_outcomes.sort(key=lambda x: x["target_value"]) - worst_case = worst_outcomes[0] if worst_outcomes else None - - adversarial_paths.append({ - "depth": depth, - "your_intervention": current_state, - "predicted_outcome": predicted_outcome, - "adversary_reactions": adversary_interventions, - "worst_case": worst_case, - }) - - # Update state for next depth - if worst_case: - current_state = worst_case["outcome"] - - # Find robust intervention (works even in worst case) - final_target_values = [ - path["worst_case"]["target_value"] - for path in adversarial_paths - if path.get("worst_case") - ] - worst_final = min(final_target_values) if final_target_values else 0.0 - - return { - "intervention": intervention, - "target": target, - "adversarial_paths": adversarial_paths, - 
"worst_case_target_value": float(worst_final), - "adversarial_depth": nesting_depth, - "robustness_assessment": { - "worst_case_loss": float(intervention.get(target, 0.0) - worst_final), - "is_robust": worst_final > intervention.get(target, 0.0) * 0.5, # Still >50% of desired - }, - } - - def multi_objective_infinite_nesting( - self, - current_state: Dict[str, float], - objectives: Dict[str, float], # {variable: weight} to maximize - constraints: Dict[str, Tuple[float, float]], # {variable: (min, max)} - max_depth: int = 8, - beam_width: int = 5, - ) -> Dict[str, Any]: - """ - Multi-objective infinite nesting: optimize multiple goals simultaneously. - - Uses beam search to explore intervention space, balancing multiple objectives. - Nests as deep as needed to find Pareto-optimal solutions. - - Args: - current_state: Current state - objectives: {variable: weight} - variables to maximize with weights - constraints: {variable: (min, max)} - hard bounds - max_depth: Maximum nesting depth - beam_width: How many paths to keep at each level (beam search) - - Returns: - Pareto-optimal intervention paths, multi-objective trade-offs - """ - # Beam search: maintain top-k paths at each level - beam: List[Dict[str, Any]] = [{ - "state": current_state, - "path": [], - "objective_vector": {k: 0.0 for k in objectives.keys()}, - "depth": 0, - }] - - pareto_frontier: List[Dict[str, Any]] = [] - - for depth in range(max_depth): - next_beam: List[Dict[str, Any]] = [] - - for path_node in beam: - # Get intervention candidates - candidates = [ - node for node in self.causal_graph.nodes() - if len(list(self.causal_graph.successors(node))) > 0 - and node not in objectives.keys() - ] - - # Explore interventions - for var in candidates[:10]: # Limit candidates - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - current_val = path_node["state"].get(var, stats["mean"]) - - # Try intervention - intervention = {var: current_val + self.rng.normal(0, stats["std"] * 1.0)} - - # Check constraints - violates = False - for const_var, (min_val, max_val) in constraints.items(): - if const_var in intervention: - if not (min_val <= intervention[const_var] <= max_val): - violates = True - break - - if violates: - continue - - # Predict outcome - outcome = self._predict_outcomes(path_node["state"], intervention) - - # Check outcome constraints - for const_var, (min_val, max_val) in constraints.items(): - if const_var in outcome: - if not (min_val <= outcome[const_var] <= max_val): - violates = True - break - - if violates: - continue - - # Multi-objective optimization: weighted sum scalarization - # Objective vector: f(x) = [f₁(x), f₂(x), ..., fₖ(x)] where fᵢ are individual objectives - # Scalarized: F(x) = Σᵢ wᵢ·fᵢ(x) where wᵢ are weights - # This converts multi-objective to single-objective for optimization - # Weighted sum: F(x) = w₁·f₁(x) + w₂·f₂(x) + ... 
+ wₖ·fₖ(x) - obj_vector = {} - for k, weight in objectives.items(): - # Individual objective value: fᵢ(x) - obj_value = outcome.get(k, 0.0) - # Weighted component: wᵢ·fᵢ(x) - obj_vector[k] = obj_value * weight - - # Combined objective: F(x) = Σᵢ wᵢ·fᵢ(x) (weighted sum) - # This is the scalarized multi-objective function - # Alternative formulations: - # - Weighted Lp norm: F(x) = (Σᵢ wᵢ·|fᵢ(x)|ᵖ)^(1/p) - # - Chebyshev: F(x) = minᵢ wᵢ·fᵢ(x) (for maximization) - combined_obj = sum(obj_vector.values()) # F(x) = Σᵢ wᵢ·fᵢ(x) - - next_beam.append({ - "state": outcome, - "path": path_node["path"] + [intervention], - "objective_vector": obj_vector, - "combined_objective": float(combined_obj), - "depth": depth + 1, - }) - - # Prune beam: keep top beam_width by combined objective - next_beam.sort(key=lambda x: x["combined_objective"], reverse=True) - beam = next_beam[:beam_width] - - # Add to Pareto if not dominated - for node in beam: - # Pareto dominance: x dominates y iff ∀i: fᵢ(x) ≥ fᵢ(y) ∧ ∃j: fⱼ(x) > fⱼ(y) - # This follows multi-objective optimization theory (Pareto optimality) - is_dominated = False - for pareto_node in pareto_frontier: - # Check if pareto_node dominates node using Pareto dominance criterion - # f₁ dominates f₂ if: ∀k: f₁ₖ ≥ f₂ₖ ∧ ∃k: f₁ₖ > f₂ₖ - all_better = all( - pareto_node["objective_vector"].get(k, 0.0) >= node["objective_vector"].get(k, 0.0) - for k in objectives.keys() - ) - some_better = any( - pareto_node["objective_vector"].get(k, 0.0) > node["objective_vector"].get(k, 0.0) - for k in objectives.keys() - ) - # Pareto dominance condition: all_better ∧ some_better - if all_better and some_better: - is_dominated = True - break - - if not is_dominated: - # Remove dominated nodes from frontier - pareto_frontier = [ - pn for pn in pareto_frontier - if not ( - all(node["objective_vector"].get(k, 0.0) >= pn["objective_vector"].get(k, 0.0) - for k in objectives.keys()) and - any(node["objective_vector"].get(k, 0.0) > pn["objective_vector"].get(k, 0.0) - for k in objectives.keys()) - ) - ] - pareto_frontier.append(node) - - # Sort Pareto frontier - pareto_frontier.sort(key=lambda x: x["combined_objective"], reverse=True) - - return { - "pareto_frontier": pareto_frontier[:20], # Top 20 - "best_path": pareto_frontier[0] if pareto_frontier else None, - "total_paths_explored": len(pareto_frontier), - "max_depth_reached": max_depth, - "objectives": objectives, - "trade_off_analysis": { - "objective_ranges": { - k: { - "min": float(min(p["objective_vector"].get(k, 0.0) for p in pareto_frontier)), - "max": float(max(p["objective_vector"].get(k, 0.0) for p in pareto_frontier)), - } - for k in objectives.keys() - }, - }, - } - - def temporal_causal_chain_analysis( - self, - initial_intervention: Dict[str, float], - target: str, - time_horizon: int = 10, - lag_structure: Optional[Dict[Tuple[str, str], int]] = None, - ) -> Dict[str, Any]: - """ - Temporal nesting: account for time delays in causal effects. - - Models that some effects take time (X→Y might take 2 periods), - creating temporal causal chains that nest across time. 
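The Pareto-dominance test and the weighted-sum scalarization used by the beam search reduce to two small functions. A minimal sketch with toy objective vectors (maximization convention, matching the code above):

```python
# Pareto dominance: a dominates b iff a >= b on every objective
# and a > b on at least one objective.
def dominates(a, b, keys):
    return (all(a[k] >= b[k] for k in keys)
            and any(a[k] > b[k] for k in keys))

# Weighted-sum scalarization: F(x) = sum_i w_i * f_i(x).
def weighted_sum(obj, weights):
    return sum(weights[k] * obj[k] for k in weights)

keys = ["profit", "quality"]
a = {"profit": 3.0, "quality": 2.0}
b = {"profit": 2.5, "quality": 2.0}
print(dominates(a, b, keys))  # True: a is weakly better everywhere, strictly on profit
print(weighted_sum(a, {"profit": 0.7, "quality": 0.3}))  # 2.7
```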
- - Args: - initial_intervention: Starting intervention - target: Variable to optimize - time_horizon: Number of time periods - lag_structure: {(source, target): lag_periods} - if None, assumes lag=1 - - Returns: - Temporal trajectory, delayed effects, optimal timing - """ - if lag_structure is None: - # Default: each edge has lag=1 - lag_structure = { - (u, v): 1 - for u, v in self.causal_graph.edges() - } - - # State history across time: x(t) = [x₁(t), x₂(t), ..., xₙ(t)] - # Discrete-time causal system with distributed lags - state_history: List[Dict[str, float]] = [initial_intervention.copy()] - - # Track pending effects: distributed lag model - # Effect yⱼ(t+τᵢⱼ) = βᵢⱼ·xᵢ(t) where τᵢⱼ is lag for edge (i,j) - # This implements VAR (Vector Autoregression) with distributed lags - pending_effects: Dict[int, List[Tuple[str, str, float]]] = {} # {time: [(source, target, effect)]} - - for t in range(time_horizon): - current_state = state_history[-1].copy() - next_state = current_state.copy() - - # Apply pending effects from previous periods (distributed lag accumulation) - # y(t) = Σᵢ Σₖ βᵢⱼ·xᵢ(t-τₖ) where τₖ are lags - if t in pending_effects: - for source, target, effect_magnitude in pending_effects[t]: - if target in next_state: - # Linear accumulation: additive effects from multiple sources - next_state[target] = next_state.get(target, 0.0) + effect_magnitude - - # Compute new effects with lags using distributed lag model - # Causal effect equation: yⱼ(t+τᵢⱼ) = βᵢⱼ·xᵢ(t) - # where τᵢⱼ is the lag for edge (i,j), βᵢⱼ is structural coefficient - # This implements VAR (Vector Autoregression) with distributed lags - for u, v in self.causal_graph.edges(): - lag = lag_structure.get((u, v), 1) # Lag τᵢⱼ (time delay) - source_val = current_state.get(u, 0.0) # xᵢ(t): source value at time t - edge_data = self.causal_graph[u][v] - strength = edge_data.get('strength', 0.0) # Structural coefficient βᵢⱼ - - # Effect magnitude: e = βᵢⱼ·xᵢ(t) (linear structural equation) - # This is the effect that will manifest at time t + τ - effect = source_val * strength # e = βᵢⱼ·xᵢ(t) - - # Schedule effect for future period (distributed lag) - # Effect manifests at time t + τ: yⱼ(t+τ) ← yⱼ(t+τ) + βᵢⱼ·xᵢ(t) - # This implements: yⱼ(t+τᵢⱼ) = βᵢⱼ·xᵢ(t) - future_time = t + lag # Time when effect manifests: t + τᵢⱼ - if future_time < time_horizon: - if future_time not in pending_effects: - pending_effects[future_time] = [] - # Store effect to be applied at future_time - pending_effects[future_time].append((u, v, effect)) - - state_history.append(next_state) - - # Extract temporal patterns - target_trajectory = [s.get(target, 0.0) for s in state_history] - - return { - "initial_intervention": initial_intervention, - "target": target, - "temporal_trajectory": state_history, - "target_over_time": target_trajectory, - "peak_value": float(max(target_trajectory)) if target_trajectory else 0.0, - "time_to_peak": int(np.argmax(target_trajectory)) if target_trajectory else 0, - "steady_state_value": float(target_trajectory[-1]) if target_trajectory else 0.0, - "lag_structure_used": lag_structure, - } - - def explainable_nested_analysis( - self, - intervention: Dict[str, float], - target: str, - depth: int = 5, - ) -> Dict[str, Any]: - """ - Explainable nesting: at each layer, explain WHY the effects occur. - - Nests deeply but provides human-readable explanations for each causal step, - building a narrative of how intervention → effect → effect → ... → target. 
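The pending-effects bookkeeping above amounts to scheduling an effect β·x(t) to land at time t + τ. A minimal standalone sketch with one toy edge (strength 0.5, lag 2):

```python
# Minimal distributed-lag propagation: effect beta * x(t) arrives at t + lag.
edges = {("x", "y"): (0.5, 2)}   # {(source, target): (beta, lag)}, toy values
history = [{"x": 1.0, "y": 0.0}]
pending = {}                      # {time: [(target, effect)]}

for t in range(5):
    nxt = dict(history[-1])
    for target, effect in pending.pop(t, []):
        nxt[target] += effect     # apply effects scheduled for this period
    for (u, v), (beta, lag) in edges.items():
        pending.setdefault(t + lag, []).append((v, beta * history[-1][u]))
    history.append(nxt)

print([round(s["y"], 2) for s in history])
# [0.0, 0.0, 0.0, 0.5, 1.0, 1.5]: the effect first lands after the 2-period lag
```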
- - Args: - intervention: Initial intervention - target: Target outcome - depth: Nesting depth - - Returns: - Explained causal chain, narrative, reasoning at each level - """ - explanations: List[Dict[str, Any]] = [] - - current_state = intervention.copy() - - for level in range(depth): - # Predict outcomes - predicted = self._predict_outcomes({}, current_state) - - # Find causal paths to target - paths_to_target: List[List[str]] = [] - for inter_var in current_state.keys(): - if inter_var == target: - continue - try: - paths = list(nx.all_simple_paths( - self.causal_graph, - inter_var, - target, - cutoff=depth - level - )) - paths_to_target.extend(paths) - except Exception: - pass - - # Explain each path using causal effect decomposition - # Path effect = ∏(i,j)∈Path βᵢⱼ (product of structural coefficients) - # Following Pearl's do-calculus and causal mediation analysis - path_explanations: List[str] = [] - for path in paths_to_target[:5]: # Top 5 paths - explanation_parts = [] - path_product = 1.0 # Initialize path effect product - for i in range(len(path) - 1): - u, v = path[i], path[i + 1] - edge_data = self.causal_graph[u][v] - strength = abs(edge_data.get('strength', 0.0)) # |βᵢⱼ| - sign = "+" if edge_data.get('strength', 0.0) >= 0 else "-" - # Accumulate path effect: ∏ βᵢⱼ - path_product *= edge_data.get('strength', 0.0) - - explanation_parts.append( - f"{u} {sign}affects {v} (β={strength:.3f})" - ) - # Path effect: total causal effect along this path - explanation_parts.append(f"Path effect: {path_product:.4f}") - - path_explanation = " → ".join([ - f"{path[i]}{'↑' if i < len(path)-1 else ''}" - for i in range(len(path)) - ]) - path_explanations.append(path_explanation) - - # Build explanation - explanation = { - "level": level, - "interventions": current_state, - "predicted_outcomes": predicted, - "paths_to_target": [p[:3] for p in paths_to_target[:3]], # Show first 3 vars of each path - "explanation_text": f"Level {level}: " + "; ".join(path_explanations[:3]), - "target_value_at_level": float(predicted.get(target, 0.0)), - } - explanations.append(explanation) - - # Update for next level (use predicted as new baseline) - current_state = predicted - - # Synthesize narrative - narrative_parts = [ - f"At level {e['level']}: {e['explanation_text']}" - for e in explanations - ] - - return { - "intervention": intervention, - "target": target, - "explanations_by_level": explanations, - "narrative": "\n".join(narrative_parts), - "final_target_value": float(explanations[-1]["target_value_at_level"]) if explanations else 0.0, - "total_levels": len(explanations), - } - - # ==================== MAJOR UPGRADES ==================== - - def gradient_based_intervention_optimization( - self, - initial_state: Dict[str, float], - target: str, - intervention_vars: List[str], - constraints: Optional[Dict[str, Tuple[float, float]]] = None, - method: str = "L-BFGS-B", - ) -> Dict[str, Any]: - """ - Gradient-based optimization for finding optimal interventions. 
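The path-effect computation described here, a product of edge strengths along each directed path, can be shown directly with networkx on a toy graph:

```python
import networkx as nx

# Path effect = product of edge strengths along a directed path
# (the linear-SCM convention used in the explanation above). Toy graph:
g = nx.DiGraph()
g.add_edge("marketing", "traffic", strength=0.8)
g.add_edge("traffic", "sales", strength=0.5)
g.add_edge("marketing", "sales", strength=0.1)

for path in nx.all_simple_paths(g, "marketing", "sales"):
    effect = 1.0
    for u, v in zip(path, path[1:]):
        effect *= g[u][v]["strength"]
    print(" -> ".join(path), round(effect, 3))
# marketing -> traffic -> sales: 0.4
# marketing -> sales: 0.1
```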
- - Uses automatic differentiation via numerical gradients to optimize: - minimize: -f(x) where f(x) = predicted outcome given intervention x - - Mathematical formulation: - - Objective: J(θ) = -y(θ) where y(θ) = predicted outcome - - Gradient: ∇_θ J(θ) = -∇_θ y(θ) computed via finite differences - - Update: θ_{k+1} = θ_k - α·∇_θ J(θ_k) (gradient descent) - - Args: - initial_state: Current state - target: Variable to optimize - intervention_vars: Variables that can be intervened on - constraints: {var: (min, max)} bounds - method: Optimization method ('L-BFGS-B', 'BFGS', 'SLSQP', etc.) - - Returns: - Optimal intervention, objective value, convergence info - """ - # Prepare bounds - bounds = [] - x0 = [] - var_to_idx = {} - for i, var in enumerate(intervention_vars): - var_to_idx[var] = i - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - current_val = initial_state.get(var, stats["mean"]) - x0.append(current_val) - - if constraints and var in constraints: - min_val, max_val = constraints[var] - bounds.append((min_val, max_val)) - else: - # Default bounds: ±3 standard deviations - bounds.append((current_val - 3 * stats["std"], current_val + 3 * stats["std"])) - - # Objective function: J(x) = -y(x) where y(x) is predicted outcome - def objective(x: np.ndarray) -> float: - """Objective: minimize -f(x) (maximize f(x))""" - intervention = {intervention_vars[i]: float(x[i]) for i in range(len(x))} - outcome = self._predict_outcomes(initial_state, intervention) - target_val = outcome.get(target, 0.0) - return -target_val # Negative for minimization - - # Numerical gradient: ∇_θ J(θ) ≈ [J(θ+ε·e_i) - J(θ-ε·e_i)] / (2ε) - # where e_i is unit vector in direction i, ε is small step - def gradient(x: np.ndarray) -> np.ndarray: - """Compute gradient via finite differences: ∇f ≈ (f(x+ε) - f(x-ε))/(2ε)""" - epsilon = 1e-5 - grad = np.zeros_like(x) - f0 = objective(x) - - for i in range(len(x)): - x_plus = x.copy() - x_plus[i] += epsilon - f_plus = objective(x_plus) - grad[i] = (f_plus - f0) / epsilon - - return grad - - # Optimize using scipy.optimize - try: - result = minimize( - objective, - x0=np.array(x0), - method=method, - bounds=bounds, - jac=gradient if method in ["L-BFGS-B", "BFGS", "CG"] else None, - options={"maxiter": 100, "ftol": 1e-6} if method == "L-BFGS-B" else {} - ) - - optimal_intervention = {intervention_vars[i]: float(result.x[i]) for i in range(len(result.x))} - optimal_outcome = self._predict_outcomes(initial_state, optimal_intervention) - - return { - "optimal_intervention": optimal_intervention, - "optimal_target_value": float(optimal_outcome.get(target, 0.0)), - "objective_value": float(result.fun), - "success": bool(result.success), - "iterations": int(result.nit) if hasattr(result, 'nit') else 0, - "convergence_message": str(result.message), - "gradient_norm": float(np.linalg.norm(gradient(result.x))) if result.success else float('inf'), - } - except Exception as e: - return {"error": str(e), "optimal_intervention": {}, "success": False} - - def nonlinear_scm_prediction( - self, - factual_state: Dict[str, float], - interventions: Dict[str, float], - include_interactions: bool = True, - ) -> Dict[str, float]: - """ - Non-linear SCM prediction with interaction terms. - - Extends linear model: y = Σᵢ βᵢ·xᵢ + Σᵢⱼ γᵢⱼ·xᵢ·xⱼ + ε - where γᵢⱼ are interaction coefficients. 
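A minimal working instance of this pattern with scipy: minimize the negative of a toy objective under box bounds, supplying a central-difference gradient. The quadratic stand-in below replaces the SCM prediction and is an assumption of the sketch:

```python
import numpy as np
from scipy.optimize import minimize

# Toy stand-in for -predicted_target(intervention); true optimum at (1, -2).
def objective(x):
    return (x[0] - 1.0) ** 2 + (x[1] + 2.0) ** 2

# Central-difference gradient: g_i = (f(x + eps*e_i) - f(x - eps*e_i)) / (2*eps).
def gradient(x, eps=1e-5):
    g = np.zeros_like(x)
    for i in range(len(x)):
        xp, xm = x.copy(), x.copy()
        xp[i] += eps
        xm[i] -= eps
        g[i] = (objective(xp) - objective(xm)) / (2 * eps)
    return g

res = minimize(objective, x0=np.zeros(2), method="L-BFGS-B",
               jac=gradient, bounds=[(-3, 3), (-3, 3)])
print(res.x.round(3), res.success)  # approximately [ 1. -2.] True
```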
- - Mathematical foundation: - - Linear term: Σᵢ βᵢ·xᵢ - - Quadratic interaction: Σᵢⱼ γᵢⱼ·xᵢ·xⱼ (product of parent pairs) - - Full model: y = linear_term + interaction_term + ε - - Args: - factual_state: Current state - interventions: Interventions to apply - include_interactions: Whether to include interaction terms - - Returns: - Predicted outcomes with non-linear effects - """ - # Standardize and merge states - raw_state = factual_state.copy() - raw_state.update(interventions) - z_state = self._standardize_state(raw_state) - z_pred = dict(z_state) - - # Interaction coefficients cache {node: {(parent1, parent2): γ}} - interaction_coeffs: Dict[str, Dict[Tuple[str, str], float]] = {} - - for node in nx.topological_sort(self.causal_graph): - if node in interventions: - continue - - parents = list(self.causal_graph.predecessors(node)) - if not parents: - continue - - # Linear term: Σᵢ βᵢ·z_xi - linear_term = 0.0 - for parent in parents: - parent_z = z_pred.get(parent, z_state.get(parent, 0.0)) - beta = self.causal_graph[parent][node].get('strength', 0.0) - linear_term += parent_z * beta - - # Interaction terms: Σᵢⱼ γᵢⱼ·z_xi·z_xj - interaction_term = 0.0 - if include_interactions and node in self.interaction_terms: - for (p1, p2) in self.interaction_terms[node]: - if p1 in parents and p2 in parents: - z1 = z_pred.get(p1, z_state.get(p1, 0.0)) - z2 = z_pred.get(p2, z_state.get(p2, 0.0)) - # Interaction coefficient (default: small value) - gamma = self.causal_graph[p1][node].get('interaction_strength', {}).get(p2, 0.0) - interaction_term += gamma * z1 * z2 # γ·x₁·x₂ - - # Total prediction: z_y = linear_term + interaction_term - z_pred[node] = linear_term + interaction_term - - # De-standardize - predicted_state = {} - for var, z_val in z_pred.items(): - predicted_state[var] = self._destandardize_value(var, z_val) - return predicted_state - - def compute_information_theoretic_measures( - self, - df: Any, - variables: List[str], - ) -> Dict[str, Any]: - """ - Compute information-theoretic measures: entropy, mutual information, causal entropy. 
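The linear-plus-interaction form reduces to one line of arithmetic per node. A toy numeric check with assumed standardized values and coefficients:

```python
# One node with parents x1, x2: z_y = b1*z1 + b2*z2 + gamma*z1*z2 (toy values).
b1, b2, gamma = 0.5, 0.3, 0.2
z1, z2 = 1.0, 2.0

linear_term = b1 * z1 + b2 * z2      # 1.1
interaction_term = gamma * z1 * z2   # 0.4: the non-linear correction
z_y = linear_term + interaction_term
print(z_y)                           # 1.5
```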
- - Mathematical formulations: - - Entropy: H(X) = -Σᵢ P(xᵢ) log₂ P(xᵢ) (discrete) or -∫ p(x) log p(x) dx (continuous) - - Mutual Information: I(X;Y) = H(X) + H(Y) - H(X,Y) = KL(P(X,Y) || P(X)P(Y)) - - Conditional MI: I(X;Y|Z) = H(X,Z) + H(Y,Z) - H(X,Y,Z) - H(Z) - - Causal Entropy: Expected reduction in entropy from intervention - - Args: - df: DataFrame with variables - variables: Variables to analyze - - Returns: - Entropies, mutual information, causal information gains - """ - if df is None or len(df) < 10: - return {"error": "Insufficient data"} - - data = df[variables].dropna() - if len(data) < 10: - return {"error": "Insufficient data after dropna"} - - results: Dict[str, Any] = { - "entropies": {}, - "mutual_information": {}, - "conditional_mi": {}, - } - - # Compute entropies: H(X) = -Σ p(x) log p(x) - # Using discrete histogram approximation for continuous variables - for var in variables: - if var not in data.columns: - continue - - series = data[var].dropna() - if len(series) < 5: - continue - - # Discretize for entropy estimation (histogram method) - # H(X) ≈ -Σᵢ (nᵢ/n) log₂(nᵢ/n) where nᵢ is count in bin i - n_bins = min(20, max(5, int(np.sqrt(len(series))))) # Adaptive binning - hist, bins = np.histogram(series, bins=n_bins) - hist = hist[hist > 0] # Remove empty bins - probs = hist / hist.sum() - - # Shannon entropy: H(X) = -Σᵢ pᵢ log₂ pᵢ - entropy = -np.sum(probs * np.log2(probs)) - results["entropies"][var] = float(entropy) - self._entropy_cache[var] = float(entropy) - - # Compute pairwise mutual information: I(X;Y) = H(X) + H(Y) - H(X,Y) - for i, var1 in enumerate(variables): - if var1 not in results["entropies"]: - continue - for var2 in variables[i+1:]: - if var2 not in results["entropies"]: - continue - - # Joint entropy: H(X,Y) = -Σᵢⱼ p(xᵢ,yⱼ) log₂ p(xᵢ,yⱼ) - joint_series = data[[var1, var2]].dropna() - if len(joint_series) < 5: - continue - - # 2D histogram - n_bins = min(10, max(3, int(np.cbrt(len(joint_series))))) - hist_2d, _, _ = np.histogram2d( - joint_series[var1], - joint_series[var2], - bins=n_bins - ) - hist_2d = hist_2d[hist_2d > 0] - probs_joint = hist_2d / hist_2d.sum() - - # Joint entropy - h_joint = -np.sum(probs_joint * np.log2(probs_joint)) - - # Mutual information: I(X;Y) = H(X) + H(Y) - H(X,Y) - mi = results["entropies"][var1] + results["entropies"][var2] - float(h_joint) - results["mutual_information"][f"{var1};{var2}"] = float(max(0.0, mi)) # MI ≥ 0 - self._mi_cache[(var1, var2)] = float(max(0.0, mi)) - - return results - - def convex_intervention_optimization( - self, - initial_state: Dict[str, float], - objectives: Dict[str, float], # {var: weight} - constraints_dict: Dict[str, Tuple[float, float]], # {var: (min, max)} - intervention_vars: List[str], - ) -> Dict[str, Any]: - """ - Convex optimization for interventions using CVXPY (if available). - - Mathematical formulation: - minimize: Σᵢ wᵢ·fᵢ(x) - subject to: l ≤ x ≤ u (box constraints) - where fᵢ are linear functions of interventions - - Uses CVXPY for guaranteed global optimum in convex problems. - - Args: - initial_state: Current state - objectives: {variable: weight} to optimize - constraints_dict: {variable: (min, max)} bounds - intervention_vars: Variables to optimize - - Returns: - Optimal intervention, solver status, dual variables - """ - if not CVXPY_AVAILABLE: - return {"error": "CVXPY not available. 
Install with: pip install cvxpy"} - - try: - # Decision variables: intervention values - n = len(intervention_vars) - x = cp.Variable(n, name="interventions") - - # Build objective: minimize Σᵢ wᵢ·(-outcome_i) - # Since CVXPY minimizes, we minimize negative of what we want to maximize - obj_terms = [] - for target_var, weight in objectives.items(): - # Approximate outcome as linear function of interventions - # outcome ≈ baseline + Σⱼ βⱼ·intervention_j - baseline = initial_state.get(target_var, 0.0) - - # Find paths from intervention vars to target - effect_sum = 0.0 - for i, inter_var in enumerate(intervention_vars): - try: - path = nx.shortest_path(self.causal_graph, inter_var, target_var) - if len(path) > 1: - # Path strength (simplified: direct edge if exists) - if self.causal_graph.has_edge(inter_var, target_var): - beta = self.causal_graph[inter_var][target_var].get('strength', 0.0) - effect_sum += beta * x[i] - except: - pass - - # Objective term: -weight * (baseline + effect_sum) - obj_terms.append(-weight * (baseline + effect_sum)) - - objective = cp.Minimize(sum(obj_terms)) - - # Constraints: l ≤ x ≤ u - constraints = [] - for i, var in enumerate(intervention_vars): - if var in constraints_dict: - min_val, max_val = constraints_dict[var] - constraints.append(x[i] >= min_val) - constraints.append(x[i] <= max_val) - else: - # Default bounds - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - current = initial_state.get(var, stats["mean"]) - constraints.append(x[i] >= current - 3 * stats["std"]) - constraints.append(x[i] <= current + 3 * stats["std"]) - - # Solve - problem = cp.Problem(objective, constraints) - problem.solve(solver=cp.ECOS if hasattr(cp, 'ECOS') else cp.SCS) - - if problem.status in ["optimal", "optimal_inaccurate"]: - optimal_x = {intervention_vars[i]: float(x.value[i]) for i in range(n)} - return { - "optimal_intervention": optimal_x, - "status": problem.status, - "objective_value": float(problem.value), - "solver": problem.solver_stats.name if hasattr(problem, 'solver_stats') else "unknown", - } - else: - return {"error": f"Solver failed: {problem.status}", "optimal_intervention": {}} - except Exception as e: - return {"error": str(e), "optimal_intervention": {}} - - def sensitivity_analysis( - self, - intervention: Dict[str, float], - target: str, - perturbation_size: float = 0.01, - ) -> Dict[str, Any]: - """ - Sensitivity analysis: how sensitive is outcome to intervention changes? 
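A minimal runnable instance of the convex formulation above, assuming cvxpy is installed. The edge strengths are toy values and the solver choice is left to cvxpy's default:

```python
import cvxpy as cp  # assumes cvxpy is available

# Maximize a linear effect on the target (minimize its negative)
# under box constraints, mirroring the formulation above.
beta = [0.6, -0.4]                 # toy direct-edge strengths to the target
x = cp.Variable(2)                 # intervention values
objective = cp.Minimize(-(beta[0] * x[0] + beta[1] * x[1]))
constraints = [x >= -1.0, x <= 1.0]

problem = cp.Problem(objective, constraints)
problem.solve()
print(problem.status, x.value.round(3))  # optimal [ 1. -1.]
```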
- - Mathematical formulation: - - Sensitivity: Sᵢ = ∂y/∂xᵢ ≈ (y(x + ε·eᵢ) - y(x)) / ε - - Elasticity: Eᵢ = (∂y/∂xᵢ)·(xᵢ/y) = sensitivity · (x/y) - - Total sensitivity: ||∇y||₂ = √(Σᵢ Sᵢ²) - - Args: - intervention: Base intervention - target: Target variable - perturbation_size: ε for finite differences - - Returns: - Sensitivities, elasticities, most influential variables - """ - base_outcome = self._predict_outcomes({}, intervention) - base_target = base_outcome.get(target, 0.0) - - sensitivities: Dict[str, float] = {} - elasticities: Dict[str, float] = {} - - for var, val in intervention.items(): - # Perturb: x + ε·e - perturbed_intervention = intervention.copy() - perturbed_intervention[var] = val + perturbation_size - - # Compute sensitivity: S = (y(x+ε) - y(x)) / ε - perturbed_outcome = self._predict_outcomes({}, perturbed_intervention) - perturbed_target = perturbed_outcome.get(target, 0.0) - - sensitivity = (perturbed_target - base_target) / perturbation_size - sensitivities[var] = float(sensitivity) - - # Elasticity: E = (∂y/∂x)·(x/y) = S·(x/y) - if abs(base_target) > 1e-6 and abs(val) > 1e-6: - elasticity = sensitivity * (val / base_target) - elasticities[var] = float(elasticity) - else: - elasticities[var] = 0.0 - - # Total sensitivity (L2 norm of gradient): ||∇y||₂ = √(Σᵢ Sᵢ²) - sensitivity_vector = np.array(list(sensitivities.values())) - total_sensitivity = float(np.linalg.norm(sensitivity_vector)) - - # Most influential (highest absolute sensitivity) - most_influential = max(sensitivities.items(), key=lambda x: abs(x[1])) if sensitivities else None - - return { - "sensitivities": sensitivities, - "elasticities": elasticities, - "total_sensitivity": total_sensitivity, - "most_influential_variable": most_influential[0] if most_influential else None, - "most_influential_sensitivity": most_influential[1] if most_influential else 0.0, - } - - def vectorized_batch_prediction( - self, - initial_state: Dict[str, float], - intervention_batch: List[Dict[str, float]], - ) -> np.ndarray: - """ - Vectorized batch prediction for efficiency. - - Computes predictions for multiple interventions in parallel using vectorized operations. - Much faster than looping through interventions individually. 
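Sensitivity and elasticity by forward differences, sketched against a toy linear response in place of `_predict_outcomes` (names and coefficients below are assumptions of the sketch):

```python
# S = (y(x + eps) - y(x)) / eps, and elasticity E = S * x / y.
def predict_target(intervention):
    return 2.0 * intervention["price"] + 0.5 * intervention["ads"]

base = {"price": 10.0, "ads": 4.0}
eps = 0.01
y0 = predict_target(base)  # 22.0

for var in base:
    bumped = dict(base)
    bumped[var] += eps
    s = (predict_target(bumped) - y0) / eps  # finite-difference sensitivity
    e = s * base[var] / y0                   # unit-free elasticity
    print(var, round(s, 3), round(e, 3))
# price 2.0 0.909
# ads 0.5 0.091
```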
- - Mathematical: y_batch = f(X_batch) where X_batch is matrix of interventions - - Args: - initial_state: Base state - intervention_batch: List of interventions to predict - - Returns: - Array of predicted outcomes (one row per intervention) - """ - if not intervention_batch: - return np.array([]) - - # Extract all variables - all_vars = set(initial_state.keys()) - for inter in intervention_batch: - all_vars.update(inter.keys()) - - all_vars = sorted(list(all_vars)) - n_interventions = len(intervention_batch) - n_vars = len(all_vars) - - # Build intervention matrix: X[i, j] = intervention i's value for variable j - X = np.zeros((n_interventions, n_vars)) - for i, inter in enumerate(intervention_batch): - for j, var in enumerate(all_vars): - X[i, j] = inter.get(var, initial_state.get(var, 0.0)) - - # Vectorized predictions (for now, use batched calls) - # Future: could vectorize the entire SCM forward pass - predictions = [] - for inter in intervention_batch: - outcome = self._predict_outcomes(initial_state, inter) - predictions.append([outcome.get(var, 0.0) for var in all_vars]) - - return np.array(predictions) - - def bayesian_edge_inference( - self, - df: Any, - parent: str, - child: str, - prior_mu: float = 0.0, - prior_sigma: float = 1.0, - ) -> Dict[str, Any]: - """ - Bayesian inference for edge strength using conjugate prior. - - Mathematical formulation: - - Prior: β ~ N(μ₀, σ²₀) - - Likelihood: y | β, X ~ N(Xβ, σ²) - - Posterior: β | y, X ~ N(μₙ, σ²ₙ) - - Posterior mean: μₙ = (σ²₀X'X + σ²I)⁻¹(σ²₀X'X μ̂_OLS + σ²μ₀) - - Posterior variance: σ²ₙ = (σ²₀⁻¹ + (X'X)/σ²)⁻¹ - - Args: - df: Data - parent: Source variable - child: Target variable - prior_mu: Prior mean μ₀ - prior_sigma: Prior standard deviation σ₀ - - Returns: - Posterior mean, variance, credible intervals - """ - if df is None or parent not in df.columns or child not in df.columns: - return {"error": "Invalid data or variables"} - - data = df[[parent, child]].dropna() - if len(data) < 5: - return {"error": "Insufficient data"} - - X = data[parent].values.reshape(-1, 1) - y = data[child].values - - # Standardize - X_mean, X_std = X.mean(), X.std() or 1.0 - y_mean, y_std = y.mean(), y.std() or 1.0 - X_norm = (X - X_mean) / X_std - y_norm = (y - y_mean) / y_std - - # OLS estimate: β̂_OLS = (X'X)⁻¹X'y - XtX = X_norm.T @ X_norm - Xty = X_norm.T @ y_norm - beta_ols = (np.linalg.pinv(XtX) @ Xty)[0] - - # Likelihood variance: σ² = (1/n)Σ(y - Xβ̂)² - residuals = y_norm - X_norm @ np.array([beta_ols]) - sigma_sq = float(np.var(residuals)) - - # Bayesian update: posterior parameters - # Precision: τ = 1/σ² - tau_likelihood = 1.0 / (sigma_sq + 1e-6) # Likelihood precision - tau_prior = 1.0 / (prior_sigma ** 2) # Prior precision - - # Posterior precision: τ_posterior = τ_prior + τ_likelihood - tau_posterior = tau_prior + tau_likelihood * len(data) - - # Posterior mean: μ_posterior = (τ_prior·μ₀ + τ_likelihood·n·β̂_OLS) / τ_posterior - mu_posterior = (tau_prior * prior_mu + tau_likelihood * len(data) * beta_ols) / tau_posterior - - # Posterior variance: σ²_posterior = 1/τ_posterior - sigma_posterior_sq = 1.0 / tau_posterior - sigma_posterior = np.sqrt(sigma_posterior_sq) - - # Credible intervals (95%): [μ - 1.96σ, μ + 1.96σ] - ci_lower = mu_posterior - 1.96 * sigma_posterior - ci_upper = mu_posterior + 1.96 * sigma_posterior - - # Store prior for future use - self.bayesian_priors[(parent, child)] = { - "mu": float(prior_mu), - "sigma": float(prior_sigma) - } - - return { - "posterior_mean": float(mu_posterior), - "posterior_std": 
float(sigma_posterior), - "posterior_variance": float(sigma_posterior_sq), - "credible_interval_95": (float(ci_lower), float(ci_upper)), - "ols_estimate": float(beta_ols), - "prior_mu": float(prior_mu), - "prior_sigma": float(prior_sigma), - } - - def add_interaction_term( - self, - node: str, - parent1: str, - parent2: str, - interaction_strength: float = 0.0, ) -> None: """ - Add non-linear interaction term: y = ... + γ·x₁·x₂ - - Mathematical: interaction effect = γ·x₁·x₂ where γ is interaction coefficient + Add a causal edge to the graph. Args: - node: Child variable - parent1: First parent - parent2: Second parent - interaction_strength: Interaction coefficient γ + source: Source variable name + target: Target variable name + strength: Causal effect strength (default: 1.0) + relation_type: Type of causal relation (default: DIRECT) + confidence: Confidence in the relationship (default: 1.0) """ - if node not in self.interaction_terms: - self.interaction_terms[node] = [] - self.interaction_terms[node].append((parent1, parent2)) + # Initialize nodes if needed + if source not in self.causal_graph: + self.causal_graph[source] = {} + if target not in self.causal_graph: + self.causal_graph[target] = {} + if source not in self.causal_graph_reverse: + self.causal_graph_reverse[source] = [] + if target not in self.causal_graph_reverse: + self.causal_graph_reverse[target] = [] - # Store interaction strength in graph edge data - if self.causal_graph.has_edge(parent1, node): - if 'interaction_strength' not in self.causal_graph[parent1][node]: - self.causal_graph[parent1][node]['interaction_strength'] = {} - self.causal_graph[parent1][node]['interaction_strength'][parent2] = interaction_strength - - def clear_cache(self) -> None: - """Clear prediction cache to free memory.""" - self._prediction_cache.clear() - self._entropy_cache.clear() - self._mi_cache.clear() - - def _predict_outcomes_cached( - self, - factual_state: Dict[str, float], - interventions: Dict[str, float], - ) -> Dict[str, float]: - """ - Cached version of _predict_outcomes for performance. + # Add edge: source -> target with strength + self.causal_graph[source][target] = strength - Uses hash-based caching to avoid recomputing identical predictions. - Cache key: hash of (sorted factual_state.items(), sorted interventions.items()) + # Update reverse mapping for parent lookup + if source not in self.causal_graph_reverse[target]: + self.causal_graph_reverse[target].append(source) + + def _get_parents(self, node: str) -> List[str]: """ - if not self._cache_enabled: - return self._predict_outcomes(factual_state, interventions) + Get parent nodes (predecessors) of a node. 
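The conjugate-normal update being removed above can be checked numerically in isolation, with toy values standing in for the OLS estimate and noise variance:

```python
import numpy as np

# Conjugate update for an edge strength: precisions (1/sigma^2) add.
mu0, sigma0 = 0.0, 1.0                  # prior: beta ~ N(0, 1)
beta_ols, sigma_sq, n = 0.45, 0.25, 50  # toy OLS estimate, noise variance, n

tau_prior = 1.0 / sigma0 ** 2
tau_like = 1.0 / sigma_sq
tau_post = tau_prior + tau_like * n     # posterior precision
mu_post = (tau_prior * mu0 + tau_like * n * beta_ols) / tau_post
sigma_post = np.sqrt(1.0 / tau_post)

ci95 = (mu_post - 1.96 * sigma_post, mu_post + 1.96 * sigma_post)
print(round(mu_post, 4), tuple(round(v, 4) for v in ci95))
# 0.4478 (0.3095, 0.586): the OLS estimate shrinks slightly toward the prior
```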
- # Create cache key from state and interventions (sorted for consistency) - state_key = tuple(sorted(factual_state.items())) - inter_key = tuple(sorted(interventions.items())) - cache_key = (state_key, inter_key) - - # Check cache - if cache_key in self._prediction_cache: - return self._prediction_cache[cache_key].copy() - - # Compute and cache (call with use_cache=False to avoid recursion) - result = self._predict_outcomes(factual_state, interventions, use_cache=False) - - # LRU eviction if cache too large - if len(self._prediction_cache) >= self._cache_max_size: - # Remove oldest 10% of entries (simple FIFO approximation) - keys_to_remove = list(self._prediction_cache.keys())[:self._cache_max_size // 10] - for k in keys_to_remove: - del self._prediction_cache[k] + Args: + node: Node name - self._prediction_cache[cache_key] = result.copy() - return result - - def granger_causality_test( - self, - df: Any, - var1: str, - var2: str, - max_lag: int = 4, - ) -> Dict[str, Any]: + Returns: + List of parent node names """ - Granger causality test: does var1 help predict var2? - - Mathematical formulation: - - Restricted model: y_t = α + Σᵢ₌₁ᵐ βᵢ·y_{t-i} + ε_t - - Unrestricted model: y_t = α + Σᵢ₌₁ᵐ βᵢ·y_{t-i} + Σᵢ₌₁ᵐ γᵢ·x_{t-i} + ε_t - - F-statistic: F = [(RSS_r - RSS_u)/m] / [RSS_u/(n-2m-1)] - - H₀: var1 does not Granger-cause var2 (γᵢ = 0 for all i) + return self.causal_graph_reverse.get(node, []) + + def _get_children(self, node: str) -> List[str]: + """ + Get child nodes (successors) of a node. Args: - df: Time series data - var1: Potential cause variable - var2: Outcome variable - max_lag: Maximum lag to test + node: Node name Returns: - F-statistic, p-value, Granger causality decision + List of child node names """ - if df is None or var1 not in df.columns or var2 not in df.columns: - return {"error": "Invalid data or variables"} - - data = df[[var1, var2]].dropna() - if len(data) < max_lag * 2 + 5: - return {"error": "Insufficient data"} + return list(self.causal_graph.get(node, {}).keys()) + + def _topological_sort(self) -> List[str]: + """ + Perform topological sort using Kahn's algorithm (pure Python). 
- from scipy.stats import f as f_dist + Returns: + List of nodes in topological order + """ + # Compute in-degrees + in_degree: Dict[str, int] = {node: 0 for node in self.causal_graph.keys()} + for node in self.causal_graph: + for child in self._get_children(node): + in_degree[child] = in_degree.get(child, 0) + 1 - # Prepare lagged variables - n = len(data) - X_lags = [] # Lagged var2 (restricted model) - X_unrestricted = [] # Lagged var2 + lagged var1 (unrestricted) - y = [] + # Initialize queue with nodes having no incoming edges + queue: List[str] = [node for node, degree in in_degree.items() if degree == 0] + result: List[str] = [] - for t in range(max_lag, n): - y.append(data[var2].iloc[t]) - - # Restricted: only lags of var2 - restricted_row = [data[var2].iloc[t-i] for i in range(1, max_lag+1)] - X_lags.append(restricted_row) + # Process nodes + while queue: + node = queue.pop(0) + result.append(node) - # Unrestricted: lags of var2 + lags of var1 - unrestricted_row = restricted_row + [data[var1].iloc[t-i] for i in range(1, max_lag+1)] - X_unrestricted.append(unrestricted_row) + # Reduce in-degree of children + for child in self._get_children(node): + in_degree[child] -= 1 + if in_degree[child] == 0: + queue.append(child) - X_lags = np.array(X_lags) - X_unrestricted = np.array(X_unrestricted) - y = np.array(y) - - # Fit restricted model: y ~ lags(var2) - # β_r = (X_r'X_r)⁻¹ X_r'y - try: - XrTXr = X_lags.T @ X_lags - XrTy = X_lags.T @ y - beta_r = np.linalg.pinv(XrTXr) @ XrTy - y_pred_r = X_lags @ beta_r - rss_r = float(np.sum((y - y_pred_r) ** 2)) # Restricted residual sum of squares - - # Fit unrestricted model: y ~ lags(var2) + lags(var1) - XuTXu = X_unrestricted.T @ X_unrestricted - XuTy = X_unrestricted.T @ y - beta_u = np.linalg.pinv(XuTXu) @ XuTy - y_pred_u = X_unrestricted @ beta_u - rss_u = float(np.sum((y - y_pred_u) ** 2)) # Unrestricted RSS - - # F-statistic: F = [(RSS_r - RSS_u)/m] / [RSS_u/(n-2m-1)] - # where m = number of additional parameters (max_lag) - m = max_lag - n_obs = len(y) - df1 = m # Numerator degrees of freedom - df2 = n_obs - 2 * m - 1 # Denominator degrees of freedom - - if df2 > 0 and rss_u > 1e-10: - f_stat = ((rss_r - rss_u) / m) / (rss_u / df2) - f_stat = float(f_stat) - - # P-value: P(F > f_stat | H₀) - p_value = float(1.0 - f_dist.cdf(f_stat, df1, df2)) - - # Decision: reject H₀ if p < 0.05 - granger_causes = p_value < 0.05 - - return { - "f_statistic": f_stat, - "p_value": float(p_value), - "granger_causes": granger_causes, - "max_lag": max_lag, - "restricted_rss": rss_r, - "unrestricted_rss": rss_u, - "df_numerator": df1, - "df_denominator": df2, - "interpretation": f"{var1} {'does' if granger_causes else 'does not'} Granger-cause {var2}", - } - else: - return {"error": "Degenerate case in F-test"} - except Exception as e: - return {"error": str(e)} - - def vector_autoregression_estimation( - self, - df: Any, - variables: List[str], - max_lag: int = 2, - ) -> Dict[str, Any]: + return result + + def identify_causal_chain(self, start: str, end: str) -> List[str]: """ - Estimate Vector Autoregression (VAR) model. + Find shortest causal path from start to end using BFS (pure Python). - Mathematical formulation: - - VAR(p): x_t = A₁x_{t-1} + A₂x_{t-2} + ... + A_p x_{t-p} + ε_t - - where x_t is vector of variables, A_i are coefficient matrices - - Estimation: OLS on each equation: x_{i,t} = Σⱼ Σₖ a_{ij,k}·x_{j,t-k} + ε_{i,t} + Implements core causal chain identification (Ax2, Ax6). 
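Kahn's algorithm over the dict-of-dicts representation the patch introduces can be exercised standalone. The sketch below uses a `deque` instead of the patch's `list.pop(0)`, an equivalent (and O(1)-per-pop) choice:

```python
from collections import deque

# graph[u][v] = edge strength, the representation added in this patch.
graph = {"a": {"b": 1.0, "c": 0.5}, "b": {"d": 0.7}, "c": {"d": 0.2}, "d": {}}

# Kahn's algorithm: repeatedly emit nodes with in-degree zero.
in_degree = {u: 0 for u in graph}
for u in graph:
    for v in graph[u]:
        in_degree[v] += 1

queue = deque(u for u, d in in_degree.items() if d == 0)
order = []
while queue:
    u = queue.popleft()
    order.append(u)
    for v in graph[u]:
        in_degree[v] -= 1
        if in_degree[v] == 0:
            queue.append(v)

print(order)  # ['a', 'b', 'c', 'd']: one valid topological order
```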
Args: - df: Time series data - variables: Variables to include in VAR - max_lag: Lag order p + start: Starting variable + end: Target variable Returns: - Coefficient matrices, residuals, model diagnostics + List of variables forming the causal chain, or empty list if no path exists """ - if df is None or len(variables) < 2: - return {"error": "Invalid data or need at least 2 variables"} - - data = df[variables].dropna() - if len(data) < max_lag * len(variables) + 10: - return {"error": "Insufficient data"} - - n_vars = len(variables) - n_obs = len(data) - max_lag - - # Build lagged design matrix - # Each row: [x_{t-1}, x_{t-2}, ..., x_{t-p}] for all variables - X_lag = [] - y_matrix = [] - - for t in range(max_lag, len(data)): - # Dependent variables at time t: y_t - y_row = [data[var].iloc[t] for var in variables] - y_matrix.append(y_row) - - # Lagged predictors: [x_{t-1}, x_{t-2}, ..., x_{t-p}] - lag_row = [] - for lag in range(1, max_lag + 1): - for var in variables: - lag_row.append(data[var].iloc[t - lag]) - X_lag.append(lag_row) + if start not in self.causal_graph or end not in self.causal_graph: + return [] - X_lag = np.array(X_lag) - y_matrix = np.array(y_matrix) + if start == end: + return [start] - # Estimate VAR coefficients equation by equation - # For each variable i: y_i = X_lag @ beta_i + ε_i - coefficient_matrices: Dict[str, np.ndarray] = {} - residuals_matrix = [] + # BFS to find shortest path + queue: List[Tuple[str, List[str]]] = [(start, [start])] + visited: set = {start} - for i, var in enumerate(variables): - y_i = y_matrix[:, i] - - # OLS: β̂_i = (X'X)⁻¹X'y_i - XtX = X_lag.T @ X_lag - Xty = X_lag.T @ y_i - beta_i = np.linalg.pinv(XtX) @ Xty - - # Reshape to matrix form: A_k[i, j] = coefficient of var_j at lag k on var_i - A_matrices = {} - for lag in range(1, max_lag + 1): - A_lag = np.zeros((n_vars, n_vars)) - for j, var_j in enumerate(variables): - idx = (lag - 1) * n_vars + j - if idx < len(beta_i): - A_lag[i, j] = float(beta_i[idx]) - A_matrices[f"A_{lag}"] = A_lag + while queue: + current, path = queue.pop(0) - coefficient_matrices[var] = { - "coefficients": beta_i, - "A_matrices": A_matrices, - } - - # Residuals: ε_i = y_i - X_lag @ β̂_i - y_pred_i = X_lag @ beta_i - residuals_i = y_i - y_pred_i - residuals_matrix.append(residuals_i) - - residuals_matrix = np.array(residuals_matrix).T # Shape: (n_obs, n_vars) - - # Impulse response: how does shock to var_i affect var_j over time? - # IRF_{j,i}(h) = ∂y_{j,t+h} / ∂ε_{i,t} - # Can be computed from VAR coefficients (simplified here) + # Check all children + for child in self._get_children(current): + if child == end: + return path + [child] + + if child not in visited: + visited.add(child) + queue.append((child, path + [child])) - return { - "coefficient_matrices": { - k: {k2: v2.tolist() if isinstance(v2, np.ndarray) else v2 - for k2, v2 in v.items()} - for k, v in coefficient_matrices.items() - }, - "residuals": residuals_matrix.tolist(), - "residual_covariance": np.cov(residuals_matrix.T).tolist(), - "n_observations": n_obs, - "n_variables": n_vars, - "max_lag": max_lag, - "variables": variables, - } - - def impulse_response_analysis( - self, - var_coefficients: Dict[str, Any], - horizon: int = 10, - shock_size: float = 1.0, - ) -> Dict[str, Any]: + return [] # No path found + + def detect_confounders(self, treatment: str, outcome: str) -> List[str]: """ - Impulse Response Function (IRF): effect of one-time shock on variables over time. 
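Confounder detection as common ancestry, sketched over the same adjacency and reverse-parent maps on a toy graph with a single confounder `z`:

```python
# z -> t, z -> y, t -> y: z is a common ancestor of treatment t and outcome y.
graph = {"z": {"t": 0.4, "y": 0.3}, "t": {"y": 0.6}, "y": {}}
parents = {"z": [], "t": ["z"], "y": ["z", "t"]}  # reverse map, as in the patch

# DFS over the reverse map collects all ancestors of a node.
def ancestors(node):
    seen, stack = set(), list(parents[node])
    while stack:
        cur = stack.pop()
        if cur not in seen:
            seen.add(cur)
            stack.extend(parents[cur])
    return seen

print(ancestors("t") & ancestors("y"))  # {'z'}: z confounds t -> y
```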
- - Mathematical formulation: - - IRF_{j,i}(h) = ∂y_{j,t+h} / ∂ε_{i,t} - - Computed recursively from VAR: y_t = Σₖ A_k y_{t-k} + ε_t - - IRF(0) = I (identity), IRF(h) = Σₖ A_k · IRF(h-k) + Detect confounders: variables that are ancestors of both treatment and outcome. Args: - var_coefficients: VAR coefficient matrices from vector_autoregression_estimation - horizon: Time horizon for IRF - shock_size: Size of initial shock + treatment: Treatment variable + outcome: Outcome variable Returns: - Impulse responses over time horizon + List of confounder variable names """ - # Extract A matrices - A_matrices = {} - variables = list(var_coefficients.keys()) - n_vars = len(variables) - - # Get max lag from coefficient structure - max_lag = 1 - for var_data in var_coefficients.values(): - if "A_matrices" in var_data: - for A_key in var_data["A_matrices"].keys(): - lag_num = int(A_key.split("_")[1]) - max_lag = max(max_lag, lag_num) - - # Build A_k matrices (average across equations or use first variable's) - first_var = variables[0] - if first_var in var_coefficients and "A_matrices" in var_coefficients[first_var]: - A_matrices = var_coefficients[first_var]["A_matrices"] - else: - return {"error": "Invalid VAR coefficients structure"} - - # Initialize IRF: IRF(0) = I (identity matrix) - # IRF[h][i, j] = response of variable i to shock in variable j at horizon h - irf = [] - irf_0 = np.eye(n_vars) * shock_size # Initial shock matrix - irf.append(irf_0.tolist()) - - # Recursive computation: IRF(h) = Σₖ₌₁^p A_k · IRF(h-k) - # where p is max_lag - for h in range(1, horizon + 1): - irf_h = np.zeros((n_vars, n_vars)) + def get_ancestors(node: str) -> set: + """Get all ancestors of a node using DFS.""" + ancestors = set() + stack = [node] + visited = set() - for lag in range(1, min(h, max_lag) + 1): - A_key = f"A_{lag}" - if A_key in A_matrices: - A_k = np.array(A_matrices[A_key]) - # IRF(h) += A_k · IRF(h-k) - if h - lag < len(irf): - irf_h += A_k @ np.array(irf[h - lag]) + while stack: + current = stack.pop() + if current in visited: + continue + visited.add(current) + + parents = self._get_parents(current) + for parent in parents: + if parent not in ancestors: + ancestors.add(parent) + stack.append(parent) - irf.append(irf_h.tolist()) + return ancestors - # Extract IRF paths for each variable pair - irf_paths: Dict[str, Dict[str, List[float]]] = {} - for i, var_i in enumerate(variables): - irf_paths[var_i] = {} - for j, var_j in enumerate(variables): - # Response of var_i to shock in var_j over time - path = [irf[h][i][j] for h in range(horizon + 1)] - irf_paths[var_i][var_j] = [float(x) for x in path] + if treatment not in self.causal_graph or outcome not in self.causal_graph: + return [] - return { - "impulse_responses": irf_paths, - "horizon": horizon, - "shock_size": shock_size, - "variables": variables, - "irf_matrix": irf, # Full IRF matrices - } - - def causal_discovery_pc_algorithm( - self, - df: Any, - variables: List[str], - alpha: float = 0.05, - ) -> Dict[str, Any]: - """ - PC algorithm for causal structure discovery (simplified implementation). + t_ancestors = get_ancestors(treatment) + o_ancestors = get_ancestors(outcome) - PC algorithm steps: - 1. Start with complete undirected graph - 2. Remove edges if variables are conditionally independent given any subset - 3. Orient edges using v-structure detection - 4. 
Apply orientation rules (Meek's rules) + # Confounders are common ancestors + confounders = list(t_ancestors & o_ancestors) - Mathematical foundation: d-separation, conditional independence tests + # Verify they have paths to both treatment and outcome + valid_confounders = [] + for conf in confounders: + if (self._has_path(conf, treatment) and self._has_path(conf, outcome)): + valid_confounders.append(conf) + + return valid_confounders + + def _has_path(self, start: str, end: str) -> bool: + """ + Check if a path exists from start to end using DFS. Args: - df: Data - variables: Variables to analyze - alpha: Significance level for independence tests + start: Starting node + end: Target node Returns: - Learned DAG, edge orientations, independence test results + True if path exists, False otherwise """ - if df is None or len(variables) < 2: - return {"error": "Need at least 2 variables"} - - data = df[variables].dropna() - if len(data) < 10: - return {"error": "Insufficient data"} + if start == end: + return True - # Step 1: Start with complete graph (all pairs connected) - learned_graph = nx.DiGraph() - learned_graph.add_nodes_from(variables) + stack = [start] + visited = set() - # Create undirected complete graph first - undirected = nx.Graph() - undirected.add_nodes_from(variables) - for i, v1 in enumerate(variables): - for v2 in variables[i+1:]: - undirected.add_edge(v1, v2) - - # Step 2: Test conditional independence, remove edges - # Simplified: test I(X;Y|Z) for all conditioning sets Z - # Use correlation-based test as proxy for independence - edges_to_remove = [] - - for v1, v2 in list(undirected.edges()): - # Test if v1 and v2 are independent given any subset of other variables - others = [v for v in variables if v not in [v1, v2]] + while stack: + current = stack.pop() + if current in visited: + continue + visited.add(current) - # Simple test: if partial correlation |ρ_{12|others}| < threshold, remove edge - # Partial correlation: correlation after controlling for others - try: - # Compute partial correlation - if len(others) == 0: - # No conditioning: use simple correlation - corr = data[[v1, v2]].corr().iloc[0, 1] - else: - # Partial correlation approximation - # Simplified: regress v1 and v2 on others, then correlate residuals - from scipy.stats import pearsonr - - # Residuals after controlling for others - X_others = data[others].values - y1 = data[v1].values - y2 = data[v2].values - - # Remove linear effect of others - beta1 = np.linalg.pinv(X_others.T @ X_others) @ X_others.T @ y1 - beta2 = np.linalg.pinv(X_others.T @ X_others) @ X_others.T @ y2 - - res1 = y1 - X_others @ beta1 - res2 = y2 - X_others @ beta2 - - corr, p_val = pearsonr(res1, res2) - - # Remove edge if not significantly correlated (independent) - if abs(corr) < 0.1 or (p_val is not None and p_val > alpha): - edges_to_remove.append((v1, v2)) - except: - pass - - # Remove edges - for v1, v2 in edges_to_remove: - if undirected.has_edge(v1, v2): - undirected.remove_edge(v1, v2) + for child in self._get_children(current): + if child == end: + return True + if child not in visited: + stack.append(child) - # Step 3: Orient edges (simplified v-structure detection) - # If X-Z-Y exists and X and Y are not connected, orient as X→Z←Y (v-structure) - for z in variables: - neighbors_z = list(undirected.neighbors(z)) - if len(neighbors_z) >= 2: - for i, x in enumerate(neighbors_z): - for y in neighbors_z[i+1:]: - # If X and Y are not neighbors, create v-structure - if not undirected.has_edge(x, y): - learned_graph.add_edge(x, 
z) - learned_graph.add_edge(y, z) - - # Add remaining undirected edges (arbitrarily orient) - for x, y in undirected.edges(): - if not (learned_graph.has_edge(x, y) or learned_graph.has_edge(y, x)): - learned_graph.add_edge(x, y) # Arbitrary orientation - - return { - "learned_dag": learned_graph, - "edges": list(learned_graph.edges()), - "nodes": list(learned_graph.nodes()), - "edges_removed": len(edges_to_remove), - "method": "PC_algorithm_simplified", - } - - def evolutionary_multi_objective_optimization( - self, - initial_state: Dict[str, float], - objectives: Dict[str, float], # {var: weight} - constraints: Dict[str, Tuple[float, float]], - intervention_vars: List[str], - population_size: int = 50, - generations: int = 100, - ) -> Dict[str, Any]: + return False + + def identify_adjustment_set(self, treatment: str, outcome: str) -> List[str]: """ - Evolutionary algorithm (NSGA-II inspired) for multi-objective optimization. - - Mathematical foundation: - - Population: P = {x₁, x₂, ..., x_N} (intervention candidates) - - Fitness: f(x) = [f₁(x), f₂(x), ..., fₖ(x)] (objective vector) - - Selection: Tournament selection based on Pareto dominance - - Crossover: Blend crossover: x_new = α·x₁ + (1-α)·x₂ - - Mutation: Gaussian mutation: x_new = x + N(0, σ²) + Identify back-door adjustment set for causal effect estimation. Args: - initial_state: Current state - objectives: {variable: weight} to optimize - constraints: {variable: (min, max)} bounds - intervention_vars: Variables to optimize - population_size: Size of population - generations: Number of generations + treatment: Treatment variable + outcome: Outcome variable Returns: - Pareto front, best solutions, convergence history + List of variables in the adjustment set """ - # Initialize population - population: List[Dict[str, float]] = [] - for _ in range(population_size): - individual = {} - for var in intervention_vars: - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - current = initial_state.get(var, stats["mean"]) - if var in constraints: - min_val, max_val = constraints[var] - individual[var] = float(self.rng.uniform(min_val, max_val)) - else: - individual[var] = float(self.rng.normal(current, stats["std"])) - population.append(individual) + if treatment not in self.causal_graph or outcome not in self.causal_graph: + return [] - pareto_front: List[Dict[str, Any]] = [] - convergence_history: List[float] = [] + # Get parents of treatment + parents_t = set(self._get_parents(treatment)) - for generation in range(generations): - # Evaluate fitness for all individuals - fitness_scores: List[Dict[str, float]] = [] - for individual in population: - outcome = self._predict_outcomes(initial_state, individual) - fitness = {k: outcome.get(k, 0.0) * weight for k, weight in objectives.items()} - combined = sum(fitness.values()) - fitness_scores.append({ - "individual": individual, - "fitness_vector": fitness, - "combined": combined, - }) - - # Update Pareto front - for fs in fitness_scores: - is_dominated = False - for pf in pareto_front: - pf_fit = pf["fitness_vector"] - fs_fit = fs["fitness_vector"] - - # Check if pf dominates fs - all_better = all( - pf_fit.get(k, 0.0) >= fs_fit.get(k, 0.0) for k in objectives.keys() - ) - some_better = any( - pf_fit.get(k, 0.0) > fs_fit.get(k, 0.0) for k in objectives.keys() - ) - - if all_better and some_better: - is_dominated = True - break - - if not is_dominated: - # Remove dominated points from front - pareto_front = [ - p for p in pareto_front - if not ( - 
all(fs["fitness_vector"].get(k, 0.0) >= p["fitness_vector"].get(k, 0.0) - for k in objectives.keys()) and - any(fs["fitness_vector"].get(k, 0.0) > p["fitness_vector"].get(k, 0.0) - for k in objectives.keys()) - ) - ] - pareto_front.append(fs) + # Get descendants of treatment + def get_descendants(node: str) -> set: + """Get all descendants using DFS.""" + descendants = set() + stack = [node] + visited = set() - # Track convergence (average combined fitness) - avg_fitness = np.mean([fs["combined"] for fs in fitness_scores]) - convergence_history.append(float(avg_fitness)) - - # Selection: tournament selection (simplified) - # Crossover: blend crossover - # Mutation: Gaussian mutation - new_population = [] - while len(new_population) < population_size: - # Tournament selection - idx1 = self.rng.integers(0, len(population)) - idx2 = self.rng.integers(0, len(population)) - parent1 = population[idx1] - parent2 = population[idx2] - - # Crossover: blend (α = random) - alpha = self.rng.random() - child = {} - for var in intervention_vars: - val1 = parent1.get(var, 0.0) - val2 = parent2.get(var, 0.0) - child[var] = float(alpha * val1 + (1 - alpha) * val2) - - # Mutation: Gaussian noise - if self.rng.random() < 0.1: # 10% mutation rate - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - child[var] += float(self.rng.normal(0, stats["std"] * 0.1)) - - # Enforce constraints - if var in constraints: - min_val, max_val = constraints[var] - child[var] = float(np.clip(child[var], min_val, max_val)) + while stack: + current = stack.pop() + if current in visited: + continue + visited.add(current) - new_population.append(child) + for child in self._get_children(current): + if child not in descendants: + descendants.add(child) + stack.append(child) - population = new_population + return descendants - # Sort Pareto front by combined fitness - pareto_front.sort(key=lambda x: x["combined"], reverse=True) + descendants_t = get_descendants(treatment) - return { - "pareto_front": pareto_front[:20], # Top 20 - "best_solution": pareto_front[0] if pareto_front else None, - "convergence_history": convergence_history, - "final_population_size": len(population), - "generations": generations, - } - - def shannon_entropy( - self, - variable: str, - df: Any, - bins: Optional[int] = None, - ) -> float: + # Adjustment set: parents of treatment that are not descendants and not the outcome + adjustment = [ + z for z in parents_t + if z not in descendants_t and z != outcome + ] + + return adjustment + + def _standardize_state(self, state: Dict[str, float]) -> Dict[str, float]: """ - Compute Shannon entropy: H(X) = -Σᵢ p(xᵢ) log₂ p(xᵢ) + Standardize state values to z-scores. 
Args: - variable: Variable name - df: Data - bins: Number of bins for discretization (auto if None) + state: Dictionary of variable values Returns: - Entropy value in bits + Dictionary of standardized (z-score) values """ - if df is None or variable not in df.columns: - return 0.0 - - series = df[variable].dropna() - if len(series) < 5: - return 0.0 - - # Check cache - cache_key = f"{variable}_{len(series)}_{bins}" - if cache_key in self._entropy_cache: - return self._entropy_cache[cache_key] - - # Discretize - if bins is None: - bins = min(20, max(5, int(np.sqrt(len(series))))) + z = {} + for k, v in state.items(): + s = self.standardization_stats.get(k) + if s and s.get("std", 0.0) > 0: + z[k] = (v - s["mean"]) / s["std"] + else: + z[k] = v + return z + + def _destandardize_value(self, var: str, z_value: float) -> float: + """ + Convert z-score back to original scale. - hist, _ = np.histogram(series, bins=bins) - hist = hist[hist > 0] - probs = hist / hist.sum() + Args: + var: Variable name + z_value: Standardized (z-score) value - # Shannon entropy - entropy = float(-np.sum(probs * np.log2(probs))) - self._entropy_cache[cache_key] = entropy - return entropy - - def mutual_information( + Returns: + Original scale value + """ + s = self.standardization_stats.get(var) + if s and s.get("std", 0.0) > 0: + return z_value * s["std"] + s["mean"] + return z_value + + def _predict_outcomes( self, - var1: str, - var2: str, - df: Any, - ) -> float: + factual_state: Dict[str, float], + interventions: Dict[str, float] + ) -> Dict[str, float]: """ - Compute mutual information: I(X;Y) = H(X) + H(Y) - H(X,Y) + Evolution operator E(x): Predict outcomes given state and interventions. + + This is the core CR-CA evolution operator implementing: + x_{t+1} = E(x_t) + + Mathematical foundation: + - Linear structural causal model: y = Σᵢ βᵢ·xᵢ + ε + - Propagates effects through causal graph in topological order + - Standardizes inputs, computes in z-space, de-standardizes outputs Args: - var1: First variable - var2: Second variable - df: Data + factual_state: Current world state (baseline) + interventions: Interventions to apply (do-operator) Returns: - Mutual information in bits + Dictionary of predicted variable values """ - if df is None or var1 not in df.columns or var2 not in df.columns: - return 0.0 - - # Check cache - cache_key = (var1, var2) - if cache_key in self._mi_cache: - return self._mi_cache[cache_key] + # Merge factual state with interventions + raw = factual_state.copy() + raw.update(interventions) - data = df[[var1, var2]].dropna() - if len(data) < 10: - return 0.0 - - # Individual entropies - h1 = self.shannon_entropy(var1, df) - h2 = self.shannon_entropy(var2, df) + # Standardize to z-scores + z_state = self._standardize_state(raw) + z_pred = dict(z_state) - # Joint entropy: H(X,Y) - n_bins = min(10, max(3, int(np.cbrt(len(data))))) - hist_2d, _, _ = np.histogram2d(data[var1], data[var2], bins=n_bins) - hist_2d = hist_2d[hist_2d > 0] - probs_joint = hist_2d / hist_2d.sum() - h_joint = float(-np.sum(probs_joint * np.log2(probs_joint))) + # Process nodes in topological order + for node in self._topological_sort(): + # If node is intervened on, keep its value + if node in interventions: + if node not in z_pred: + z_pred[node] = z_state.get(node, 0.0) + continue + + # Get parents + parents = self._get_parents(node) + if not parents: + continue + + # Compute linear combination: Σᵢ βᵢ·z_xi + s = 0.0 + for p in parents: + pz = z_pred.get(p, z_state.get(p, 0.0)) + strength = self.causal_graph.get(p, 
{}).get(node, 0.0) + s += pz * strength + + z_pred[node] = s - # Mutual information - mi = float(max(0.0, h1 + h2 - h_joint)) - self._mi_cache[cache_key] = mi - return mi - - def conditional_mutual_information( + # De-standardize results + return {v: self._destandardize_value(v, z) for v, z in z_pred.items()} + + def _calculate_scenario_probability( self, - var1: str, - var2: str, - condition: str, - df: Any, + factual_state: Dict[str, float], + interventions: Dict[str, float] ) -> float: """ - Compute conditional mutual information: I(X;Y|Z) = H(X,Z) + H(Y,Z) - H(X,Y,Z) - H(Z) + Calculate probability of a counterfactual scenario. + + Uses Mahalanobis distance in standardized space. Args: - var1: First variable - var2: Second variable - condition: Conditioning variable - df: Data + factual_state: Baseline state + interventions: Intervention values Returns: - Conditional MI in bits + Probability value between 0.05 and 0.98 """ - if df is None or any(v not in df.columns for v in [var1, var2, condition]): - return 0.0 - - data = df[[var1, var2, condition]].dropna() - if len(data) < 10: - return 0.0 - - # H(X,Z) - h_xz = self.shannon_entropy(f"{var1}_{condition}", pd.DataFrame({ - f"{var1}_{condition}": data[var1].astype(str) + "_" + data[condition].astype(str) - })) + z_sq = 0.0 + for var, new in interventions.items(): + s = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) + mu, sd = s.get("mean", 0.0), s.get("std", 1.0) or 1.0 + old = factual_state.get(var, mu) + dz = (new - mu) / sd - (old - mu) / sd + z_sq += float(dz) * float(dz) - # H(Y,Z) - h_yz = self.shannon_entropy(f"{var2}_{condition}", pd.DataFrame({ - f"{var2}_{condition}": data[var2].astype(str) + "_" + data[condition].astype(str) - })) - - # H(X,Y,Z) - simplified joint entropy - # H(Z) - h_z = self.shannon_entropy(condition, df) - - # Simplified: I(X;Y|Z) ≈ I(X;Y) - I(X;Z) - I(Y;Z) + I(X;Y;Z) - # Use chain rule approximation - mi_xy = self.mutual_information(var1, var2, df) - mi_xz = self.mutual_information(var1, condition, df) - mi_yz = self.mutual_information(var2, condition, df) - - # Chain rule: I(X;Y|Z) = I(X;Y) - I(X;Y;Z) where I(X;Y;Z) is interaction - # Approximation: I(X;Y|Z) ≈ I(X;Y) - min(I(X;Z), I(Y;Z)) - cmi = float(max(0.0, mi_xy - min(mi_xz, mi_yz))) - - return cmi - - def cross_validate_edge_strength( + p = 0.95 * float(np.exp(-0.5 * z_sq)) + 0.05 + return float(max(0.05, min(0.98, p))) + + def generate_counterfactual_scenarios( self, - df: Any, - parent: str, - child: str, - n_folds: int = 5, - ) -> Dict[str, Any]: + factual_state: Dict[str, float], + target_variables: List[str], + max_scenarios: int = 5 + ) -> List[CounterfactualScenario]: """ - Cross-validation for edge strength estimation. + Generate counterfactual scenarios for target variables. - Mathematical: - - K-fold CV: partition data into K folds - - Train on K-1 folds, test on held-out fold - - CV error: CV = (1/K) Σᵢ₌₁ᴷ MSE_i where MSE_i is mean squared error on fold i + Implements Ax8 (Counterfactuals) - core CR-CA functionality. 
Args: - df: Data - parent: Source variable - child: Target variable - n_folds: Number of CV folds + factual_state: Current factual state + target_variables: Variables to generate counterfactuals for + max_scenarios: Maximum number of scenarios per variable Returns: - CV scores, mean CV error, standard error + List of CounterfactualScenario objects """ - if df is None or parent not in df.columns or child not in df.columns: - return {"error": "Invalid data"} - - data = df[[parent, child]].dropna() - if len(data) < n_folds * 3: - return {"error": "Insufficient data for CV"} - - n = len(data) - fold_size = n // n_folds - - cv_errors: List[float] = [] + scenarios = [] + z_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0] - for fold in range(n_folds): - # Split: test = fold, train = rest - test_start = fold * fold_size - test_end = (fold + 1) * fold_size if fold < n_folds - 1 else n + for i, tv in enumerate(target_variables[:max_scenarios]): + s = self.standardization_stats.get(tv, {"mean": 0.0, "std": 1.0}) + cur = factual_state.get(tv, 0.0) + cz = (cur - s["mean"]) / s["std"] if s["std"] > 0 else 0.0 - test_indices = list(range(test_start, test_end)) - train_indices = [i for i in range(n) if i not in test_indices] + vals = [(cz + dz) * s["std"] + s["mean"] for dz in z_steps] - train_data = data.iloc[train_indices] - test_data = data.iloc[test_indices] - - if len(train_data) < 5 or len(test_data) < 2: - continue - - # Fit on training data - X_train = train_data[parent].values.reshape(-1, 1) - y_train = train_data[child].values - X_test = test_data[parent].values.reshape(-1, 1) - y_test = test_data[child].values - - # OLS: β = (X'X)⁻¹X'y - XtX = X_train.T @ X_train - Xty = X_train.T @ y_train - beta = (np.linalg.pinv(XtX) @ Xty)[0] - - # Predict on test: ŷ = Xβ - y_pred = X_test @ np.array([beta]) - - # MSE on test fold - mse = float(np.mean((y_test - y_pred) ** 2)) - cv_errors.append(mse) - - if len(cv_errors) == 0: - return {"error": "CV failed"} - - # CV statistics - mean_cv_error = float(np.mean(cv_errors)) - std_cv_error = float(np.std(cv_errors)) - se_cv = std_cv_error / np.sqrt(len(cv_errors)) # Standard error + for j, v in enumerate(vals): + scenarios.append(CounterfactualScenario( + name=f"scenario_{i}_{j}", + interventions={tv: v}, + expected_outcomes=self._predict_outcomes(factual_state, {tv: v}), + probability=self._calculate_scenario_probability(factual_state, {tv: v}), + reasoning=f"Intervention on {tv} with value {v}" + )) - return { - "cv_errors": [float(e) for e in cv_errors], - "mean_cv_error": mean_cv_error, - "std_cv_error": std_cv_error, - "standard_error": float(se_cv), - "n_folds": len(cv_errors), - "cv_score": mean_cv_error, # Lower is better - } - - def integrated_gradients_attribution( - self, - baseline_state: Dict[str, float], - target_state: Dict[str, float], - target: str, - n_steps: int = 50, - ) -> Dict[str, float]: + return scenarios + + def analyze_causal_strength(self, source: str, target: str) -> Dict[str, float]: """ - Integrated Gradients for causal attribution: how much does each variable contribute? - - Mathematical formulation: - - IG_i = (x_i - x_i^0) · ∫₀¹ [∂f/∂x_i](x^0 + t·(x - x^0)) dt - - Approximated: IG_i ≈ (x_i - x_i^0) · (1/m) Σⱼ₌₁ᵐ [∂f/∂x_i](x^0 + (j/m)·(x - x^0)) - - Attribution: A_i = IG_i / Σⱼ IGⱼ (normalized) + Analyze the strength of causal relationship between two variables. 
Args: - baseline_state: Reference state (x^0) - target_state: Target state (x) - target: Outcome variable - n_steps: Number of integration steps + source: Source variable + target: Target variable Returns: - Attributions for each variable + Dictionary with strength, confidence, path_length, relation_type """ - # Variables that differ between baseline and target - diff_vars = [ - v for v in set(list(baseline_state.keys()) + list(target_state.keys())) - if abs(baseline_state.get(v, 0.0) - target_state.get(v, 0.0)) > 1e-6 - ] - - if not diff_vars: - return {} - - integrated_gradients: Dict[str, float] = {} - - for var in diff_vars: - x0 = baseline_state.get(var, 0.0) - x1 = target_state.get(var, 0.0) - delta = x1 - x0 - - if abs(delta) < 1e-6: - integrated_gradients[var] = 0.0 - continue - - # Integrate gradient along path: x(t) = x^0 + t·(x - x^0), t ∈ [0,1] - grad_sum = 0.0 - - for step in range(1, n_steps + 1): - t = step / n_steps # t ∈ [0,1] - - # Interpolated state: x(t) = x^0 + t·(x - x^0) - interpolated_state = baseline_state.copy() - for v in diff_vars: - v0 = baseline_state.get(v, 0.0) - v1 = target_state.get(v, 0.0) - interpolated_state[v] = v0 + t * (v1 - v0) - - # Compute gradient: ∂f/∂x_i at interpolated state - # Use finite differences - epsilon = abs(delta) * 1e-4 - perturbed_state = interpolated_state.copy() - perturbed_state[var] += epsilon - - outcome_base = self._predict_outcomes({}, interpolated_state) - outcome_pert = self._predict_outcomes({}, perturbed_state) - - grad = (outcome_pert.get(target, 0.0) - outcome_base.get(target, 0.0)) / epsilon - grad_sum += grad - - # Integrated gradient: IG = delta · average_gradient - avg_grad = grad_sum / n_steps - ig = delta * avg_grad - integrated_gradients[var] = float(ig) + if source not in self.causal_graph or target not in self.causal_graph[source]: + return {"strength": 0.0, "confidence": 0.0, "path_length": float('inf')} - # Normalize attributions - total_ig = sum(abs(v) for v in integrated_gradients.values()) - if total_ig > 1e-6: - attributions = {k: float(v / total_ig) for k, v in integrated_gradients.items()} - else: - attributions = {k: 0.0 for k in integrated_gradients.keys()} + strength = self.causal_graph[source].get(target, 0.0) + path = self.identify_causal_chain(source, target) + path_length = len(path) - 1 if path else float('inf') return { - "integrated_gradients": integrated_gradients, - "attributions": attributions, # Normalized to sum to 1 - "total_attribution": float(sum(abs(v) for v in attributions.values())), + "strength": float(strength), + "confidence": 1.0, # Simplified: assume full confidence + "path_length": path_length, + "relation_type": CausalRelationType.DIRECT.value } - - def bellman_optimal_intervention( + + def set_standardization_stats( self, - initial_state: Dict[str, float], - target: str, - intervention_vars: List[str], - horizon: int = 5, - discount: float = 0.9, - ) -> Dict[str, Any]: + variable: str, + mean: float, + std: float + ) -> None: """ - Dynamic Programming (Bellman optimality) for optimal intervention sequence. - - Mathematical formulation: - - Value function: V*(x) = max_u [r(x,u) + γ·V*(f(x,u))] - - Optimal policy: π*(x) = argmax_u [r(x,u) + γ·V*(f(x,u))] - - Backward induction: solve V*(x) from terminal time backwards + Set standardization statistics for a variable. 
Args: - initial_state: Starting state - target: Variable to maximize - intervention_vars: Available interventions - horizon: Time horizon T - discount: Discount factor γ ∈ [0,1] + variable: Variable name + mean: Mean value + std: Standard deviation + """ + self.standardization_stats[variable] = {"mean": mean, "std": std if std > 0 else 1.0} + + def get_nodes(self) -> List[str]: + """ + Get all nodes in the causal graph. + + Returns: + List of node names + """ + return list(self.causal_graph.keys()) + + def get_edges(self) -> List[Tuple[str, str]]: + """ + Get all edges in the causal graph. Returns: - Optimal policy, value function, intervention sequence + List of (source, target) tuples + """ + edges = [] + for source, targets in self.causal_graph.items(): + for target in targets.keys(): + edges.append((source, target)) + return edges + + def is_dag(self) -> bool: """ - # Discretize state space (simplified: use current state as reference) - # Value function: V_t(x) = value at time t in state x - value_function: Dict[int, Dict[Tuple, float]] = {} - policy: Dict[int, Dict[Tuple, Dict[str, float]]] = {} + Check if the causal graph is a DAG (no cycles). - # Terminal condition: V_T(x) = r(x) (immediate reward) - # Reward: r(x) = target_value(x) - def reward(state: Dict[str, float]) -> float: - outcome = self._predict_outcomes({}, state) - return float(outcome.get(target, 0.0)) + Uses DFS to detect cycles. - # Backward induction: from T down to 0 - # For each time t from T-1 down to 0: - for t in range(horizon - 1, -1, -1): - # Simplified: evaluate at current state (could expand to full state space) - state_key = tuple(sorted(initial_state.items())) + Returns: + True if DAG, False if cycles exist + """ + def has_cycle(node: str, visited: set, rec_stack: set) -> bool: + """DFS to detect cycles.""" + visited.add(node) + rec_stack.add(node) - if t == horizon - 1: - # Terminal: V_T(x) = r(x) - value_function[t] = {state_key: reward(initial_state)} - policy[t] = {state_key: {}} - else: - # Bellman: V_t(x) = max_u [r(x) + γ·V_{t+1}(f(x,u))] - best_value = float("-inf") - best_intervention: Dict[str, float] = {} - - # Search intervention space (simplified: sample candidates) - for _ in range(20): - candidate_intervention = {} - for var in intervention_vars: - stats = self.standardization_stats.get(var, {"mean": 0.0, "std": 1.0}) - current = initial_state.get(var, stats["mean"]) - candidate_intervention[var] = float(self.rng.normal(current, stats["std"] * 0.5)) - - # Next state: f(x, u) - next_state = self._predict_outcomes(initial_state, candidate_intervention) - next_key = tuple(sorted(next_state.items())) - - # Immediate reward - r = reward(next_state) - - # Future value: γ·V_{t+1}(f(x,u)) - if t + 1 in value_function and next_key in value_function[t + 1]: - future_val = value_function[t + 1][next_key] - else: - future_val = 0.0 - - # Total value: r + γ·V_{t+1} - total_value = r + discount * future_val - - if total_value > best_value: - best_value = total_value - best_intervention = candidate_intervention - - value_function[t] = {state_key: best_value} - policy[t] = {state_key: best_intervention} + for child in self._get_children(node): + if child not in visited: + if has_cycle(child, visited, rec_stack): + return True + elif child in rec_stack: + return True + + rec_stack.remove(node) + return False - # Extract optimal sequence - optimal_sequence: List[Dict[str, float]] = [] - current_state = initial_state.copy() + visited = set() + rec_stack = set() - for t in range(horizon): - state_key = 
tuple(sorted(current_state.items())) - if t in policy and state_key in policy[t]: - intervention = policy[t][state_key] - optimal_sequence.append(intervention) - current_state = self._predict_outcomes(current_state, intervention) + for node in self.causal_graph: + if node not in visited: + if has_cycle(node, visited, rec_stack): + return False - return { - "optimal_sequence": optimal_sequence, - "value_function": { - t: {str(k): v for k, v in vf.items()} - for t, vf in value_function.items() - }, - "policy": { - t: {str(k): v for k, v in p.items()} - for t, p in policy.items() - }, - "total_value": float(value_function.get(0, {}).get(tuple(sorted(initial_state.items())), 0.0)), - "horizon": horizon, - "discount_factor": discount, - } - - def shapley_value_attribution( + return True + + def run( self, - baseline_state: Dict[str, float], - target_state: Dict[str, float], - target: str, - ) -> Dict[str, float]: + initial_state: Dict[str, float], + target_variables: Optional[List[str]] = None, + max_steps: int = 1 + ) -> Dict[str, Any]: """ - Shapley values for fair attribution: marginal contribution of each variable. + Run causal simulation: evolve state and generate counterfactuals. - Mathematical formulation: - - Shapley value: φᵢ = Σ_{S ⊆ N\{i}} [|S|!(n-|S|-1)!/n!] · [v(S∪{i}) - v(S)] - - where v(S) = outcome with variables in S set to target, others to baseline - - Fair attribution: satisfies efficiency, symmetry, dummy, additivity + Simple entry point for CR-CA engine. Args: - baseline_state: Baseline (all variables at baseline) - target_state: Target (all variables at target) - target: Outcome variable + initial_state: Initial world state + target_variables: Variables to generate counterfactuals for (default: all nodes) + max_steps: Number of evolution steps (default: 1) Returns: - Shapley values for each variable + Dictionary with evolved state, counterfactuals, and graph info """ - variables = list(set(list(baseline_state.keys()) + list(target_state.keys()))) - n = len(variables) - - if n == 0: - return {} - - shapley_values: Dict[str, float] = {var: 0.0 for var in variables} + # Use all nodes as targets if not specified + if target_variables is None: + target_variables = list(self.causal_graph.keys()) - # Compute value function: v(S) = outcome when S are set to target, rest to baseline - def value_function(subset: set) -> float: - state = baseline_state.copy() - for var in subset: - if var in target_state: - state[var] = target_state[var] - outcome = self._predict_outcomes({}, state) - return float(outcome.get(target, 0.0)) + # Evolve state + current_state = initial_state.copy() + for step in range(max_steps): + current_state = self._predict_outcomes(current_state, {}) - # Compute Shapley value for each variable - for var in variables: - phi_i = 0.0 - - # Sum over all subsets S not containing var - others = [v for v in variables if v != var] - - # For each subset size - for subset_size in range(len(others) + 1): - # Generate all subsets of size subset_size - from itertools import combinations - - for subset in combinations(others, subset_size): - S = set(subset) - - # Weight: |S|!(n-|S|-1)!/n! 
- s_size = len(S) - weight = (math.factorial(s_size) * math.factorial(n - s_size - 1)) / math.factorial(n) - - # Marginal contribution: v(S∪{i}) - v(S) - S_with_i = S | {var} - marginal = value_function(S_with_i) - value_function(S) - - phi_i += weight * marginal - - shapley_values[var] = float(phi_i) + # Generate counterfactual scenarios + counterfactual_scenarios = self.generate_counterfactual_scenarios( + initial_state, + target_variables, + max_scenarios=5 + ) return { - "shapley_values": shapley_values, - "total_attribution": float(sum(shapley_values.values())), - "normalized": {k: float(v / sum(abs(vi) for vi in shapley_values.values()) if sum(abs(vi) for vi in shapley_values.values()) > 0 else 0.0) - for k, v in shapley_values.items()}, + "initial_state": initial_state, + "evolved_state": current_state, + "counterfactual_scenarios": counterfactual_scenarios, + "causal_graph_info": { + "nodes": self.get_nodes(), + "edges": self.get_edges(), + "is_dag": self.is_dag() + }, + "steps": max_steps } From 38a7cf83b0e17755da47225a181143607e4e735d Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 25 Nov 2025 15:13:08 +0200 Subject: [PATCH 07/12] Refactor causal graph handling and remove advanced methods Refactor causal graph node initialization and edge addition. Removed advanced methods for confounder detection and adjustment set identification in Lite version. --- swarms/agents/cr_ca_agent.py | 177 ++++++++--------------------------- 1 file changed, 39 insertions(+), 138 deletions(-) diff --git a/swarms/agents/cr_ca_agent.py b/swarms/agents/cr_ca_agent.py index f03f5ec5..3e0db60b 100644 --- a/swarms/agents/cr_ca_agent.py +++ b/swarms/agents/cr_ca_agent.py @@ -91,15 +91,19 @@ class CRCALite: # Initialize graph if variables: for var in variables: - if var not in self.causal_graph: - self.causal_graph[var] = {} - if var not in self.causal_graph_reverse: - self.causal_graph_reverse[var] = [] - + self._ensure_node_exists(var) + if causal_edges: for source, target in causal_edges: self.add_causal_relationship(source, target) + def _ensure_node_exists(self, node: str) -> None: + """Ensure node present in graph structures.""" + if node not in self.causal_graph: + self.causal_graph[node] = {} + if node not in self.causal_graph_reverse: + self.causal_graph_reverse[node] = [] + def add_causal_relationship( self, source: str, @@ -118,20 +122,14 @@ class CRCALite: relation_type: Type of causal relation (default: DIRECT) confidence: Confidence in the relationship (default: 1.0) """ - # Initialize nodes if needed - if source not in self.causal_graph: - self.causal_graph[source] = {} - if target not in self.causal_graph: - self.causal_graph[target] = {} - if source not in self.causal_graph_reverse: - self.causal_graph_reverse[source] = [] - if target not in self.causal_graph_reverse: - self.causal_graph_reverse[target] = [] - - # Add edge: source -> target with strength - self.causal_graph[source][target] = strength - - # Update reverse mapping for parent lookup + # Ensure nodes exist + self._ensure_node_exists(source) + self._ensure_node_exists(target) + + # Add or update edge: source -> target with strength + self.causal_graph[source][target] = float(strength) + + # Update reverse mapping for parent lookup (avoid duplicates) if source not in self.causal_graph_reverse[target]: self.causal_graph_reverse[target].append(source) @@ -226,53 +224,7 @@ class CRCALite: return [] # No path found - def detect_confounders(self, treatment: str, outcome: str) -> List[str]: - 
""" - Detect confounders: variables that are ancestors of both treatment and outcome. - - Args: - treatment: Treatment variable - outcome: Outcome variable - - Returns: - List of confounder variable names - """ - def get_ancestors(node: str) -> set: - """Get all ancestors of a node using DFS.""" - ancestors = set() - stack = [node] - visited = set() - - while stack: - current = stack.pop() - if current in visited: - continue - visited.add(current) - - parents = self._get_parents(current) - for parent in parents: - if parent not in ancestors: - ancestors.add(parent) - stack.append(parent) - - return ancestors - - if treatment not in self.causal_graph or outcome not in self.causal_graph: - return [] - - t_ancestors = get_ancestors(treatment) - o_ancestors = get_ancestors(outcome) - - # Confounders are common ancestors - confounders = list(t_ancestors & o_ancestors) - - # Verify they have paths to both treatment and outcome - valid_confounders = [] - for conf in confounders: - if (self._has_path(conf, treatment) and self._has_path(conf, outcome)): - valid_confounders.append(conf) - - return valid_confounders + # detect_confounders removed in Lite version (advanced inference) def _has_path(self, start: str, end: str) -> bool: """ @@ -305,52 +257,7 @@ class CRCALite: return False - def identify_adjustment_set(self, treatment: str, outcome: str) -> List[str]: - """ - Identify back-door adjustment set for causal effect estimation. - - Args: - treatment: Treatment variable - outcome: Outcome variable - - Returns: - List of variables in the adjustment set - """ - if treatment not in self.causal_graph or outcome not in self.causal_graph: - return [] - - # Get parents of treatment - parents_t = set(self._get_parents(treatment)) - - # Get descendants of treatment - def get_descendants(node: str) -> set: - """Get all descendants using DFS.""" - descendants = set() - stack = [node] - visited = set() - - while stack: - current = stack.pop() - if current in visited: - continue - visited.add(current) - - for child in self._get_children(current): - if child not in descendants: - descendants.add(child) - stack.append(child) - - return descendants - - descendants_t = get_descendants(treatment) - - # Adjustment set: parents of treatment that are not descendants and not the outcome - adjustment = [ - z for z in parents_t - if z not in descendants_t and z != outcome - ] - - return adjustment + # identify_adjustment_set removed in Lite version (advanced inference) def _standardize_state(self, state: Dict[str, float]) -> Dict[str, float]: """ @@ -399,7 +306,7 @@ class CRCALite: x_{t+1} = E(x_t) Mathematical foundation: - - Linear structural causal model: y = Σᵢ βᵢ·xᵢ + ε + - Linear structural causal model: y = Σᵢ βᵢ·xᵢ + ε\n+ - NOTE: This implementation is linear. To model nonlinear dynamics override\n+ `_predict_outcomes` in a subclass with a custom evolution operator.\n*** End Patch - Propagates effects through causal graph in topological order - Standardizes inputs, computes in z-space, de-standardizes outputs @@ -449,16 +356,18 @@ class CRCALite: interventions: Dict[str, float] ) -> float: """ - Calculate probability of a counterfactual scenario. + Calculate a heuristic probability of a counterfactual scenario. - Uses Mahalanobis distance in standardized space. + NOTE: This is a lightweight heuristic proximity measure (Mahalanobis-like) + and NOT a full statistical estimator — it ignores covariance and should + be treated as a relative plausibility score for Lite usage. 
Args:
             factual_state: Baseline state
             interventions: Intervention values
 
         Returns:
-            Probability value between 0.05 and 0.98
+            Heuristic probability value between 0.05 and 0.98
         """
         z_sq = 0.0
         for var, new in interventions.items():
@@ -490,26 +399,37 @@ class CRCALite:
         Returns:
             List of CounterfactualScenario objects
         """
-        scenarios = []
-        z_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0]
-        
-        for i, tv in enumerate(target_variables[:max_scenarios]):
-            s = self.standardization_stats.get(tv, {"mean": 0.0, "std": 1.0})
-            cur = factual_state.get(tv, 0.0)
-            cz = (cur - s["mean"]) / s["std"] if s["std"] > 0 else 0.0
-            
-            vals = [(cz + dz) * s["std"] + s["mean"] for dz in z_steps]
-            
-            for j, v in enumerate(vals):
-                scenarios.append(CounterfactualScenario(
-                    name=f"scenario_{i}_{j}",
-                    interventions={tv: v},
-                    expected_outcomes=self._predict_outcomes(factual_state, {tv: v}),
-                    probability=self._calculate_scenario_probability(factual_state, {tv: v}),
-                    reasoning=f"Intervention on {tv} with value {v}"
-                ))
-        
-        return scenarios
+        # Ensure stats exist for variables in factual_state (fallback behavior)
+        self.ensure_standardization_stats(factual_state)
+
+        scenarios: List[CounterfactualScenario] = []
+        z_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0]
+
+        for i, tv in enumerate(target_variables[:max_scenarios]):
+            stats = self.standardization_stats.get(tv, {"mean": 0.0, "std": 1.0})
+            cur = factual_state.get(tv, stats.get("mean", 0.0))
+
+            # If std is zero or missing, use absolute perturbations instead
+            if not stats or stats.get("std", 0.0) <= 0:
+                base = cur
+                abs_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0]
+                vals = [base + step for step in abs_steps]
+            else:
+                mean = stats["mean"]
+                std = stats["std"]
+                cz = (cur - mean) / std
+                vals = [(cz + dz) * std + mean for dz in z_steps]
+
+            for j, v in enumerate(vals):
+                scenarios.append(CounterfactualScenario(
+                    name=f"scenario_{i}_{j}",
+                    interventions={tv: float(v)},
+                    expected_outcomes=self._predict_outcomes(factual_state, {tv: float(v)}),
+                    probability=self._calculate_scenario_probability(factual_state, {tv: float(v)}),
+                    reasoning=f"Intervention on {tv} with value {v}"
+                ))
+
+        return scenarios
 
     def analyze_causal_strength(self, source: str, target: str) -> Dict[str, float]:
         """
@@ -552,6 +442,16 @@ class CRCALite:
         """
         self.standardization_stats[variable] = {"mean": mean, "std": std if std > 0 else 1.0}
 
+    def ensure_standardization_stats(self, state: Dict[str, float]) -> None:
+        """
+        Ensure standardization stats exist for all variables in a given state.
+        If stats are missing, create a sensible fallback (mean=observed, std=1.0).
+        This prevents degenerate std=0 issues in Lite mode.
+        """
+        for var, val in state.items():
+            if var not in self.standardization_stats:
+                self.standardization_stats[var] = {"mean": float(val), "std": 1.0}
+
     def get_nodes(self) -> List[str]:
         """
         Get all nodes in the causal graph. 
@@ -636,9 +536,10 @@ class CRCALite:
         for step in range(max_steps):
             current_state = self._predict_outcomes(current_state, {})
 
-        # Generate counterfactual scenarios
+        # Ensure standardization stats exist for the evolved state and generate counterfactuals from it
+        self.ensure_standardization_stats(current_state)
         counterfactual_scenarios = self.generate_counterfactual_scenarios(
-            initial_state,
+            current_state,
             target_variables,
            max_scenarios=5
         )

From 535b2fe42694bf77c7ea8acb125ec8bb3deffe8a Mon Sep 17 00:00:00 2001
From: CI-DEV <154627941+IlumCI@users.noreply.github.com>
Date: Tue, 25 Nov 2025 20:58:21 +0200
Subject: [PATCH 08/12] Rewrite CR-CA agent documentation for the lightweight
 CRCAgent engine

---
 docs/swarms/agents/cr_ca_agent.md | 1882 +++--------------------------
 1 file changed, 183 insertions(+), 1699 deletions(-)

diff --git a/docs/swarms/agents/cr_ca_agent.md b/docs/swarms/agents/cr_ca_agent.md
index c481bb0f..35f9d518 100644
--- a/docs/swarms/agents/cr_ca_agent.md
+++ b/docs/swarms/agents/cr_ca_agent.md
@@ -1,1722 +1,206 @@
-# CR-CA Agent

-A revolutionary causal reasoning and counterfactual analysis agent that performs sophisticated causal inference to understand cause-and-effect relationships, predict outcomes of interventions, and explore alternative scenarios. The CR-CA Agent transforms resource management by enabling proactive issue resolution through deep causal analysis.
+# CRCAgent

-## Overview
+Short summary
+-------------
+CRCAgent is a lightweight, auditable causal simulation core implemented in
+pure Python and intended as the deterministic CR‑CA engine for Swarms.
+It focuses on the core ASTT primitives: a causal DAG, a linear structural
+evolution operator (in z-space), and compact counterfactual generation.

-The CR-CA (Causal Reasoning with Counterfactual Analysis) Agent implements advanced causal inference techniques based on Pearl's Structural Causal Model (SCM) framework. Unlike correlation-based approaches, the CR-CA Agent identifies true causal relationships, enabling reliable predictions about the effects of interventions and counterfactual reasoning about "what-if" scenarios. 
+Key properties +- Minimal dependencies (numpy + stdlib) +- Pure-Python causal graph (adjacency dicts) +- Linear SCM evolution by default (overrideable) +- Agent-first `run()` entrypoint (accepts dict or JSON payloads) -**Key Capabilities:** - -| Capability | Description | -|------------|-------------| -| **Causal Graph Construction** | Builds and maintains directed acyclic graphs (DAGs) representing causal relationships | -| **Structural Causal Modeling** | Implements linear and non-linear structural equation models with standardized coefficients | -| **Counterfactual Reasoning** | Performs Pearl's three-step abduction-action-prediction for counterfactual analysis | -| **Deep Root Cause Analysis** | Traces causal chains backward to identify ultimate root causes of problems | -| **Multi-Layer What-If Analysis** | Nests causal reasoning across multiple layers to predict cascading effects | -| **Optimal Intervention Planning** | Uses gradient-based optimization, dynamic programming, and multi-objective methods to find optimal interventions | -| **Risk-Aware Decision Making** | Quantifies uncertainty using CVaR, bootstrap confidence intervals, and Bayesian inference | -| **Temporal Causal Analysis** | Models distributed lag effects and vector autoregression for time-dependent systems | - -## Architecture - -```mermaid -graph TD - A[Input State/Data] --> B[CR-CA Agent] - B --> C{Causal Graph} - C --> D[Structure Learning] - C --> E[Edge Strength Estimation] - C --> F[Standardization] - - D --> G[PC Algorithm] - E --> H[Weighted OLS] - F --> I[Z-Score Transform] - - G --> J[SCM Model] - H --> J - I --> J - - J --> K[Prediction Layer] - K --> L[Do-Operator] - K --> M[Counterfactual] - K --> N[Intervention] - - L --> O[Outcome Prediction] - M --> O - N --> O - - O --> P[Optimization Layer] - P --> Q[Gradient-Based] - P --> R[Bellman DP] - P --> S[Multi-Objective] - - Q --> T[Optimal Intervention] - R --> T - S --> T - - T --> U[Risk Assessment] - U --> V[CVaR Analysis] - U --> W[Confidence Intervals] - - V --> X[Final Recommendation] - W --> X - - style A fill:#e1f5fe - style B fill:#fff3e0 - style J fill:#f3e5f5 - style T fill:#e8f5e8 - style X fill:#c8e6c9 -``` - -## Getting Started - -### Installation - -The CR-CA Agent is included in the Swarms framework. Install Swarms: - -```bash -pip install swarms -``` - -### Basic Usage Workflow - -The typical workflow for using the CR-CA Agent involves: - -1. **Initialize the agent** with a causal graph structure -2. **Fit the model** from historical data -3. **Make predictions** about intervention effects -4. **Optimize interventions** to achieve desired outcomes - -### Step-by-Step Tutorial - -#### Step 1: Import and Initialize - -```python - -from swarms.agents import CRCAAgent -import pandas as pd -import numpy as np - -# Initialize the CR-CA agent -agent = CRCAAgent( - name="my-causal-agent", - description="Causal analysis for business decisions", - model_name="gpt-4o-mini" # For narrative generation -) -``` - -#### Step 2: Define Your Causal Graph - -Define the causal relationships between variables. 
You can either: - -**Option A: Build graph manually from domain knowledge** - -```python -# Add variables -variables = ["price", "demand", "inventory", "cost", "profit"] - -# Add causal relationships -agent.causal_graph.add_nodes_from(variables) -agent.causal_graph.add_edges_from([ - ("price", "demand"), # Price affects demand - ("demand", "inventory"), # Demand affects inventory - ("cost", "profit"), # Cost affects profit - ("demand", "profit"), # Demand affects profit - ("price", "cost") # Price affects cost (indirectly) -]) - -# Add edge sign constraints (optional but recommended) -# +1 means positive effect, -1 means negative effect -agent.edge_sign_constraints = { - ("price", "demand"): -1, # Higher price → lower demand - ("demand", "inventory"): -1, # Higher demand → lower inventory - ("cost", "profit"): -1, # Higher cost → lower profit - ("demand", "profit"): +1 # Higher demand → higher profit -} -``` - -**Option B: Discover structure from data** - -```python -# If you have data but aren't sure about causal structure -historical_data = pd.DataFrame({ - "price": [...], - "demand": [...], - "inventory": [...], - "cost": [...], - "profit": [...] -}) - -# Discover causal structure using PC algorithm -learned_graph = agent.causal_discovery_pc_algorithm( - df=historical_data, - variables=["price", "demand", "inventory", "cost", "profit"], - alpha=0.05 -) - -# Use the learned graph -agent.causal_graph = learned_graph["learned_dag"] -``` - -#### Step 3: Fit the Model from Data - -Load your historical data and fit the causal model: - -```python - -# Prepare your historical data -historical_data = pd.DataFrame({ - "price": [100, 105, 110, 108, 112, 115, 110, 105, 100, 95], - "demand": [1000, 950, 900, 920, 880, 850, 900, 950, 1000, 1050], - "inventory": [5000, 4500, 4000, 4200, 3800, 3500, 4000, 4500, 5000, 5500], - "cost": [80, 82, 85, 83, 87, 90, 85, 82, 80, 78], - "profit": [20000, 19950, 19900, 19920, 19880, 19850, 19900, 19950, 20000, 20050] -}) - -# Fit the model (learns edge strengths from data) -agent.fit_from_dataframe( - df=historical_data, - variables=["price", "demand", "inventory", "cost", "profit"], - window=10, # Use last 10 observations - decay_alpha=0.9, # Weight recent data more (90% weight) - ridge_lambda=0.01, # Small regularization - enforce_signs=True # Respect sign constraints -) - -# Check learned edge strengths -for u, v in agent.causal_graph.edges(): - strength = agent.causal_graph[u][v].get('strength', 0.0) - print(f"{u} → {v}: strength = {strength:.3f}") -``` - -#### Step 4: Make Predictions - -Predict outcomes given current state and interventions: - -```python -# Current state -current_state = { - "price": 100.0, - "demand": 1000.0, - "inventory": 5000.0, - "cost": 80.0, - "profit": 20000.0 -} - -# Scenario 1: What if we reduce price by 10%? -intervention = {"price": 90.0} - -predicted = agent._predict_outcomes(current_state, intervention) -print(f"Predicted demand: {predicted['demand']:.2f}") -print(f"Predicted profit: {predicted['profit']:.2f}") - -# Scenario 2: What if we reduce price AND increase inventory? -intervention = {"price": 90.0, "inventory": 6000.0} -predicted = agent._predict_outcomes(current_state, intervention) -``` - -#### Step 5: Counterfactual Analysis - -Answer "what-if" questions using counterfactual reasoning: - -```python -# What would have happened if price was 90 instead of 100? 
-factual_state = {"price": 100.0, "demand": 1000.0} -counterfactual_intervention = {"price": 90.0} - -counterfactual_result = agent.counterfactual_abduction_action_prediction( - factual_state=factual_state, - interventions=counterfactual_intervention -) - -print(f"Counterfactual demand: {counterfactual_result['demand']:.2f}") -``` - -#### Step 6: Find Optimal Interventions - -Use optimization to find the best intervention: - -```python -# Find optimal price to maximize profit -optimal = agent.gradient_based_intervention_optimization( - initial_state=current_state, - target="profit", # What to maximize - intervention_vars=["price"], # What we can control - constraints={"price": (80.0, 120.0)}, # Price bounds - method="L-BFGS-B" -) - -print(f"Optimal price: {optimal['optimal_intervention']['price']:.2f}") -print(f"Predicted profit: {optimal['optimal_target_value']:.2f}") -``` - -#### Step 7: Analyze Root Causes - -Find root causes of problems: - -```python -# Why is profit low? -root_causes = agent.deep_root_cause_analysis( - problem_variable="profit", - max_depth=10, - min_path_strength=0.05 -) - -print("Ultimate root causes:") -for rc in root_causes["ultimate_root_causes"][:5]: - print(f" - {rc['root_cause']}: path strength = {rc['path_strength']:.3f}") -``` - -#### Step 8: Analyze Cascading Effects - -Understand chain reactions from interventions: - -```python -# Analyze cascading effects of price reduction -chain_reaction = agent.analyze_cascading_chain_reaction( - initial_intervention={"price": 0.9}, # 10% reduction - target_outcomes=["demand", "inventory", "profit"], - max_hops=5, - include_feedback_loops=True -) - -print(f"Found {len(chain_reaction['causal_paths'])} causal paths") -print(f"Detected {len(chain_reaction['feedback_loops'])} feedback loops") -``` - -### Complete Example: Supply Chain Optimization - -Here's a complete example for supply chain management: - -```python -from swarms.agents import CRCAAgent -import pandas as pd -import numpy as np - -# Step 1: Initialize -agent = CRCAAgent(name="supply-chain-optimizer") - -# Step 2: Build causal graph -variables = ["lead_time", "supplier_capacity", "inventory", - "backlog", "price", "demand", "cost"] - -agent.causal_graph.add_nodes_from(variables) -agent.causal_graph.add_edges_from([ - ("supplier_capacity", "inventory"), - ("lead_time", "inventory"), - ("inventory", "backlog"), - ("backlog", "price"), - ("price", "demand"), - ("demand", "backlog"), - ("lead_time", "cost"), - ("inventory", "cost") -]) - -# Step 3: Load historical data -historical_data = pd.DataFrame({ - "lead_time": np.random.normal(10, 2, 100), - "supplier_capacity": np.random.normal(1000, 100, 100), - "inventory": np.random.normal(5000, 500, 100), - "backlog": np.random.normal(100, 20, 100), - "price": np.random.normal(100, 10, 100), - "demand": np.random.normal(1000, 100, 100), - "cost": np.random.normal(80, 8, 100) -}) - -# Step 4: Fit model -agent.fit_from_dataframe( - df=historical_data, - variables=variables, - window=30, - decay_alpha=0.9 -) - -# Step 5: Current state -current_state = { - "lead_time": 12.0, - "supplier_capacity": 950.0, - "inventory": 4500.0, - "backlog": 150.0, - "price": 105.0, - "demand": 900.0, - "cost": 85.0 -} - -# Step 6: Find optimal safety stock (inventory level) -optimal_inventory = agent.gradient_based_intervention_optimization( - initial_state=current_state, - target="cost", # Minimize cost - intervention_vars=["inventory"], - constraints={"inventory": (3000.0, 7000.0)} -) - -print(f"Optimal inventory level: 
{optimal_inventory['optimal_intervention']['inventory']:.2f}") -print(f"Predicted cost: {optimal_inventory['optimal_target_value']:.2f}") - -# Step 7: Analyze what-if scenarios -scenarios = [ - {"lead_time": 15.0}, # What if lead time increases? - {"supplier_capacity": 800.0}, # What if supplier capacity decreases? -] - -for scenario in scenarios: - predicted = agent._predict_outcomes(current_state, scenario) - print(f"\nScenario {scenario}:") - print(f" Predicted backlog: {predicted['backlog']:.2f}") - print(f" Predicted cost: {predicted['cost']:.2f}") - -# Step 8: Root cause analysis for high backlog -backlog_roots = agent.deep_root_cause_analysis( - problem_variable="backlog", - max_depth=10, - min_path_strength=0.05 -) - -print("\nRoot causes of high backlog:") -for rc in backlog_roots["ultimate_root_causes"][:3]: - print(f" - {rc['root_cause']}: {rc['path_string']}") -``` - -### Creating Custom Causal Models - -#### For Financial Analysis - -```python -# Cryptocurrency price analysis -agent = CRCAAgent(name="crypto-analyzer") - -agent.causal_graph.add_edges_from([ - ("volume", "price"), - ("volatility", "price"), - ("rsi", "price"), - ("market_sentiment", "price"), - ("btc_correlation", "price") -]) - -# Fit from historical price data -agent.fit_from_dataframe( - df=crypto_data, - variables=["volume", "volatility", "rsi", "market_sentiment", - "btc_correlation", "price"], - window=30 -) - -# Predict price impact of volume increase -prediction = agent._predict_outcomes( - factual_state={"volume": 1000.0, "price": 3000.0}, - interventions={"volume": 1500.0} -) -``` - -#### For Policy Analysis - -```python -# Government policy simulation -agent = CRCAAgent(name="policy-simulator") - -agent.causal_graph.add_edges_from([ - ("tax_rate", "disposable_income"), - ("disposable_income", "consumption"), - ("consumption", "gdp"), - ("cash_transfer", "disposable_income"), - ("education_spending", "human_capital"), - ("human_capital", "productivity") -]) - -# Fit from economic data -agent.fit_from_dataframe( - df=economic_data, - variables=["tax_rate", "cash_transfer", "disposable_income", - "consumption", "gdp", "education_spending", - "human_capital", "productivity"], - window=60 -) - -# Multi-objective optimization: maximize GDP and minimize inequality -pareto = agent.evolutionary_multi_objective_optimization( - initial_state={"tax_rate": 0.3, "cash_transfer": 0.0}, - objectives={"gdp": 0.7, "inequality": -0.3}, - constraints={ - "tax_rate": (0.0, 0.5), - "cash_transfer": (0.0, 1000.0) - }, - intervention_vars=["tax_rate", "cash_transfer"] -) -``` - -### Next Steps - -After creating your causal model: - -1. **Validate the model** using cross-validation: - ```python - cv_result = agent.cross_validate_edge_strength( - df=historical_data, - parent="price", - child="demand", - n_folds=5 - ) - ``` - -2. **Quantify uncertainty** using bootstrap: - ```python - uncertainty = agent.quantify_uncertainty( - df=historical_data, - variables=variables, - windows=200, - alpha=0.95 - ) - ``` - -3. 
**Use explainability** to understand predictions: - ```python - attribution = agent.shapley_value_attribution( - baseline_state=current_state, - target_state=optimal_state, - target="profit" - ) - ``` - -## Mathematical Foundation - -### Structural Causal Models (SCM) - -The CR-CA Agent implements Pearl's Structural Causal Model framework, where each variable is defined by a structural equation: - -\[ -y = f(\text{parents}(y), \varepsilon_y) -\] - -For linear SCMs: - -\[ -y = \sum_{i} \beta_i \cdot x_i + \varepsilon -\] - -where \(\beta_i\) are structural coefficients representing causal effects, and \(\varepsilon\) is an error term representing unobserved confounders. - -**Standardization:** - -To ensure numerical stability and scale-invariance, all variables are standardized to z-scores: - -\[ -z = \frac{x - \mu}{\sigma} -\] - -where \(\mu\) is the mean and \(\sigma\) is the standard deviation. This transformation allows the agent to work with variables of different scales while preserving causal relationships. - -**Prediction in Z-Space:** - -\[ -z_y = \sum_{i} \beta_i \cdot z_{x_i} + z_\varepsilon -\] - -After prediction, values are de-standardized: - -\[ -x = z \cdot \sigma + \mu -\] - -### Do-Operator - -The do-operator, \(do(X = x)\), represents an intervention that sets variable \(X\) to value \(x\), breaking its dependence on its parents. This is fundamentally different from conditioning \(P(Y \mid X = x)\), as it represents active manipulation rather than passive observation. - -**Mathematical Definition:** - -\[ -P(Y \mid do(X = x)) \neq P(Y \mid X = x) -\] - -The do-operator enables answering interventional questions: "What would happen if we set \(X\) to \(x\)?" - -### Counterfactual Reasoning - -Pearl's three-step counterfactual reasoning process: - -**1. Abduction:** -Infer latent noise terms from factual observations: - -\[ -\varepsilon = y_{\text{factual}} - \sum_i \beta_i \cdot x_{\text{factual},i} -\] - -**2. Action:** -Apply do-operator to set intervention values: - -\[ -do(X = x^*) -\] - -**3. Prediction:** -Predict counterfactual outcome using new values but old noise: - -\[ -y_{\text{cf}} = \sum_i \beta_i \cdot x_{\text{cf},i} + \varepsilon -\] - -This answers: "What would have happened if \(X\) had been \(x^*\) instead of \(x_{\text{factual}}\)?" 
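
These three steps can be traced end-to-end on a single linear structural equation. The sketch below is illustrative only: the coefficient and the observed values are assumed numbers chosen for the arithmetic, not outputs of any fitted model.

```python
# Worked abduction-action-prediction example for one equation:
# z_demand = beta * z_price + eps (all values in standardized z-space).

beta = -0.8  # assumed structural coefficient (price -> demand)

# Factual observation (already standardized for simplicity)
z_price_factual = 1.0
z_demand_factual = -0.5

# Step 1 (Abduction): recover the latent noise from the factual data
eps = z_demand_factual - beta * z_price_factual  # -0.5 - (-0.8) = 0.3

# Step 2 (Action): apply do(price = price*) by overriding the price value
z_price_cf = 0.0

# Step 3 (Prediction): reuse the same noise with the intervened input
z_demand_cf = beta * z_price_cf + eps  # 0.0 + 0.3 = 0.3

print(f"Counterfactual demand (z-score): {z_demand_cf:.2f}")
```

Because the noise term is held fixed across steps, the counterfactual isolates the effect of the intervention itself rather than re-sampling a new world.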
- -## Class Reference - -### Constructor - -```python -from swarms.agents import CRCAAgent - -agent = CRCAAgent( - name: str = "cr-ca-agent", - description: str = "Causal Reasoning with Counterfactual Analysis agent", - model_name: str = "openai/gpt-4o", - max_loops: int = 3, - causal_graph: Optional[nx.DiGraph] = None, - variables: Optional[List[str]] = None, - causal_edges: Optional[List[Tuple[str, str]]] = None, -) -``` - -#### Parameters - -| Parameter | Type | Default | Description | -|-----------|------|---------|-------------| -| `name` | `str` | `"cr-ca-agent"` | Unique identifier for the agent instance | -| `description` | `str` | `"Causal Reasoning..."` | Human-readable description of agent capabilities | -| `model_name` | `str` | `"openai/gpt-4o"` | LLM model for narrative generation and reasoning | -| `max_loops` | `int` | `3` | Maximum iterations for causal reasoning loops | -| `causal_graph` | `Optional[nx.DiGraph]` | `None` | Pre-built NetworkX directed graph (DAG) | -| `variables` | `Optional[List[str]]` | `None` | List of variable names to initialize graph | -| `causal_edges` | `Optional[List[Tuple[str, str]]]` | `None` | List of (source, target) tuples for causal edges | - -### Core Methods - -#### fit_from_dataframe() - -Fit edge strengths and standardization statistics from historical data using weighted least squares regression. - -```python -fit_from_dataframe( - df: pd.DataFrame, - variables: List[str], - window: int = 30, - decay_alpha: float = 0.9, - ridge_lambda: float = 0.0, - enforce_signs: bool = True -) -> None -``` - -**Mathematical Formulation:** - -For each child variable \(y\) with parents \(\{x_1, x_2, \ldots, x_k\}\), the agent estimates coefficients \(\beta_i\) using weighted least squares: - -\[ -\beta = (X' W X + \lambda I)^{-1} X' W y -\] - -where: -- \(X\) is the standardized design matrix of parents -- \(W\) is a diagonal matrix of exponential decay weights: \(w_i = \alpha^{n-1-i}\) (newer data weighted more) -- \(\lambda\) is ridge regularization parameter -- \(y\) is the standardized target variable - -**Exponential Decay Weights:** - -\[ -w_i = \frac{\alpha^{n-1-i}}{\sum_{j=0}^{n-1} \alpha^{n-1-j}} -\] - -This emphasizes recent observations, making the model adaptive to regime changes. - -**Example:** - -```python -import pandas as pd -from swarms.agents import CRCAAgent - -# Initialize agent -agent = CRCAAgent() - -# Build causal graph -agent.causal_graph.add_edges_from([ - ("price", "demand"), - ("demand", "orders"), - ("orders", "inventory") -]) - -# Fit from historical data -df = pd.DataFrame({ - "price": [100, 105, 110, 108, 112], - "demand": [1000, 950, 900, 920, 880], - "orders": [1000, 950, 900, 920, 880], - "inventory": [5000, 4500, 4000, 4200, 3800] -}) - -agent.fit_from_dataframe( - df=df, - variables=["price", "demand", "orders", "inventory"], - window=5, - decay_alpha=0.9 -) -``` - -#### _predict_outcomes() - -Predict outcomes given interventions using standardized linear propagation through the causal graph. - -```python -_predict_outcomes( - factual_state: Dict[str, float], - interventions: Dict[str, float], - use_cache: bool = True -) -> Dict[str, float] -``` - -**Mathematical Process:** - -1. **Standardize inputs:** Convert all variables to z-scores -2. **Topological propagation:** For each node in topological order: - - If intervened: set \(z_{\text{node}} = z_{\text{intervention}}\) (do-operator) - - Otherwise: compute \(z_{\text{node}} = \sum_i \beta_i \cdot z_{\text{parent}_i}\) -3. 
**De-standardize outputs:** Convert z-scores back to raw values - -**Example:** - -```python -# Current state -factual_state = { - "price": 100.0, - "demand": 1000.0, - "orders": 1000.0 -} - -# Intervention: reduce price by 10% -interventions = {"price": 90.0} - -# Predict outcomes -predicted = agent._predict_outcomes(factual_state, interventions) -# Result: {"price": 90.0, "demand": 1100.0, "orders": 1100.0, ...} -``` - -#### counterfactual_abduction_action_prediction() - -Perform Pearl's three-step counterfactual reasoning for "what-if" analysis. - -```python -counterfactual_abduction_action_prediction( - factual_state: Dict[str, float], - interventions: Dict[str, float] -) -> Dict[str, float] -``` - -**Example:** - -```python -# What if we had set price to 90 instead of 100? -factual = {"price": 100.0, "demand": 1000.0} -counterfactual = {"price": 90.0} - -result = agent.counterfactual_abduction_action_prediction( - factual_state=factual, - interventions=counterfactual -) -# Result shows what demand would have been if price was 90 -``` - -### Advanced Causal Analysis - -#### deep_root_cause_analysis() - -Trace causal chains backward to identify ultimate root causes of problems. - -```python -deep_root_cause_analysis( - problem_variable: str, - max_depth: int = 20, - min_path_strength: float = 0.01 -) -> Dict[str, Any] -``` - -**Mathematical Formulation:** - -Path strength is computed as the product of edge strengths along the path: - -\[ -\text{Path Strength} = \prod_{(i,j) \in \text{Path}} \beta_{ij} -\] - -Root causes are ranked using multi-objective criteria: - -\[ -f(\text{rc}) = w_1 \cdot I_{\text{exo}}(\text{rc}) + w_2 \cdot S_{\text{path}}(\text{rc}) - w_3 \cdot D(\text{rc}) -\] - -where: -- \(I_{\text{exo}}\) is indicator for exogenous nodes (true root causes) -- \(S_{\text{path}}\) is path strength -- \(D\) is depth (distance from problem) - -**Example:** - -```python -# Find root causes of high backlog -root_causes = agent.deep_root_cause_analysis( - problem_variable="backlog", - max_depth=15, - min_path_strength=0.05 -) - -# Returns: -# { -# "ultimate_root_causes": [ -# { -# "root_cause": "supplier_capacity", -# "is_exogenous": True, -# "path_strength": 0.85, -# "depth": 3 -# } -# ], -# "intervention_opportunities": [...] -# } -``` - -#### multi_layer_whatif_analysis() - -Perform nested counterfactual reasoning across multiple layers to predict cascading effects. - -```python -multi_layer_whatif_analysis( - scenarios: List[Dict[str, float]], - depth: int = 3 -) -> Dict[str, Any] -``` - -**Process:** - -1. **Layer 1:** Direct effects of intervention -2. **Layer 2:** Effects of affected variables on other variables -3. **Layer 3+:** Deep cascade analysis using chain reaction detection - -**Example:** - -```python -scenarios = [{"price": 90.0}] # What if price drops to 90? - -result = agent.multi_layer_whatif_analysis( - scenarios=scenarios, - depth=5 -) - -# Analyzes: -# - Layer 1: Direct effect on demand -# - Layer 2: How demand affects inventory, lead times -# - Layer 3+: Cascading effects through entire system -``` - -#### analyze_cascading_chain_reaction() - -Analyze multi-layer cascading chain reactions from an intervention, including feedback loops. 
-
-```python
-analyze_cascading_chain_reaction(
-    initial_intervention: Dict[str, float],
-    target_outcomes: List[str],
-    max_hops: int = 5,
-    include_feedback_loops: bool = True,
-    num_iterations: int = 3
-) -> Dict[str, Any]
-```
-
-**Mathematical Formulation:**
-
-For each causal path from intervention variables to outcomes:
-
-\[
-\text{Path Strength} = \prod_{(i,j) \in \text{Path}} \beta_{ij}
-\]
-
-Cascade probability is estimated by clipping an affine function of path strength:
-
-\[
-P(\text{cascade}) = \min(0.95, \text{Path Strength} \cdot 0.5 + 0.05)
-\]
-
-**Example:**
-
-```python
-# Analyze chain reaction from price reduction
-chain_reaction = agent.analyze_cascading_chain_reaction(
-    initial_intervention={"price": 0.9},  # 10% reduction
-    target_outcomes=["demand", "inventory", "cost"],
-    max_hops=5,
-    include_feedback_loops=True
-)
-
-# Identifies:
-# - All causal paths from price to outcomes
-# - Feedback loops that could amplify effects
-# - Cascade probabilities and cumulative effects
-```
-
-### Optimization Methods
-
-#### gradient_based_intervention_optimization()
-
-Find optimal interventions using gradient-based optimization.
-
-```python
-gradient_based_intervention_optimization(
-    initial_state: Dict[str, float],
-    target: str,
-    intervention_vars: List[str],
-    constraints: Optional[Dict[str, Tuple[float, float]]] = None,
-    method: str = "L-BFGS-B"
-) -> Dict[str, Any]
-```
-
-**Mathematical Formulation:**
-
-Objective: maximize predicted outcome
-
-\[
-\max_{\theta} y(\theta)
-\]
-
-where \(\theta\) is the intervention vector and \(y(\theta)\) is the predicted outcome.
-
-Gradient computation using finite differences:
-
-\[
-\frac{\partial y}{\partial \theta_i} \approx \frac{y(\theta + \varepsilon \cdot e_i) - y(\theta)}{\varepsilon}
-\]
-
-Update rule (gradient ascent on \(y\), i.e., gradient descent on \(-y\)):
-
-\[
-\theta_{k+1} = \theta_k + \alpha \cdot \nabla_\theta y(\theta_k)
-\]
-
-**Example:**
-
-```python
-# Find optimal price to maximize profit
-optimal = agent.gradient_based_intervention_optimization(
-    initial_state={"price": 100.0, "demand": 1000.0},
-    target="profit",
-    intervention_vars=["price"],
-    constraints={"price": (80.0, 120.0)},
-    method="L-BFGS-B"
-)
-
-# Returns optimal price and predicted profit
-```
-
-#### bellman_optimal_intervention()
-
-Dynamic programming (Bellman optimality) for optimal intervention sequences.
-
-```python
-bellman_optimal_intervention(
-    initial_state: Dict[str, float],
-    target: str,
-    intervention_vars: List[str],
-    horizon: int = 5,
-    discount: float = 0.9
-) -> Dict[str, Any]
-```
-
-**Mathematical Formulation:**
-
-Value function (Bellman equation):
-
-\[
-V^*(x_t) = \max_{u_t} \left[ r(x_t, u_t) + \gamma \cdot V^*(f(x_t, u_t)) \right]
-\]
-
-Optimal policy:
-
-\[
-\pi^*(x_t) = \arg\max_{u_t} \left[ r(x_t, u_t) + \gamma \cdot V^*(f(x_t, u_t)) \right]
-\]
-
-where:
-- \(r(x_t, u_t)\) is immediate reward
-- \(\gamma \in [0,1]\) is discount factor
-- \(f(x_t, u_t)\) is system dynamics (next state)
-
-**Example:**
-
-```python
-# Find optimal sequence of price adjustments over 5 periods
-sequence = agent.bellman_optimal_intervention(
-    initial_state={"price": 100.0, "demand": 1000.0},
-    target="total_profit",
-    intervention_vars=["price"],
-    horizon=5,
-    discount=0.9
-)
-
-# Returns optimal price trajectory: [100, 95, 92, 90, 88]
-```
-
-#### evolutionary_multi_objective_optimization()
-
-Evolutionary algorithm (NSGA-II inspired) for multi-objective optimization.
- -```python -evolutionary_multi_objective_optimization( - initial_state: Dict[str, float], - objectives: Dict[str, float], # {var: weight} - constraints: Dict[str, Tuple[float, float]], - intervention_vars: List[str], - population_size: int = 50, - generations: int = 100 -) -> Dict[str, Any] -``` - -**Mathematical Formulation:** - -Weighted sum scalarization: - -\[ -F(x) = \sum_i w_i \cdot f_i(x) -\] - -Pareto dominance: solution \(x_1\) dominates \(x_2\) if: - -\[ -\forall i: f_i(x_1) \geq f_i(x_2) \quad \land \quad \exists j: f_j(x_1) > f_j(x_2) -\] - -**Example:** - -```python -# Optimize for both profit and customer satisfaction -pareto = agent.evolutionary_multi_objective_optimization( - initial_state={"price": 100.0}, - objectives={"profit": 0.7, "satisfaction": 0.3}, - constraints={"price": (80.0, 120.0)}, - intervention_vars=["price"], - population_size=50, - generations=100 -) - -# Returns Pareto frontier of non-dominated solutions -``` - -### Information Theory Methods - -#### compute_information_theoretic_measures() - -Compute entropy, mutual information, and conditional mutual information. - -```python -compute_information_theoretic_measures( - df: pd.DataFrame, - variables: List[str] -) -> Dict[str, Any] -``` - -**Mathematical Formulations:** - -**Shannon Entropy:** - -\[ -H(X) = -\sum_i p(x_i) \log_2 p(x_i) -\] - -**Mutual Information:** - -\[ -I(X;Y) = H(X) + H(Y) - H(X,Y) = \sum_{x,y} p(x,y) \log_2 \frac{p(x,y)}{p(x)p(y)} -\] - -**Conditional Mutual Information:** - -\[ -I(X;Y|Z) = H(X,Z) + H(Y,Z) - H(X,Y,Z) - H(Z) -\] - -**Example:** - -```python -measures = agent.compute_information_theoretic_measures( - df=historical_data, - variables=["price", "demand", "inventory"] -) - -# Returns: -# { -# "entropies": {"price": 3.2, "demand": 4.1, ...}, -# "mutual_information": {"price;demand": 0.85, ...}, -# "conditional_mi": {...} -# } -``` - -### Time Series Analysis - -#### granger_causality_test() - -Test whether one variable Granger-causes another (helps predict it). - -```python -granger_causality_test( - df: pd.DataFrame, - var1: str, - var2: str, - max_lag: int = 4 -) -> Dict[str, Any] -``` - -**Mathematical Formulation:** - -Restricted model (without var1): - -\[ -y_t = \alpha + \sum_{i=1}^m \beta_i y_{t-i} + \varepsilon_t -\] - -Unrestricted model (with var1): - -\[ -y_t = \alpha + \sum_{i=1}^m \beta_i y_{t-i} + \sum_{i=1}^m \gamma_i x_{t-i} + \varepsilon_t -\] - -F-statistic: - -\[ -F = \frac{(RSS_r - RSS_u)/m}{RSS_u/(n-2m-1)} -\] - -**Example:** - -```python -# Test if price changes Granger-cause demand changes -result = agent.granger_causality_test( - df=time_series_data, - var1="price", - var2="demand", - max_lag=4 -) - -# Returns F-statistic, p-value, and causality decision -``` - -#### vector_autoregression_estimation() - -Estimate Vector Autoregression (VAR) model for multivariate time series. - -```python -vector_autoregression_estimation( - df: pd.DataFrame, - variables: List[str], - max_lag: int = 2 -) -> Dict[str, Any] -``` - -**Mathematical Formulation:** - -VAR(p) model: - -\[ -\mathbf{x}_t = \mathbf{A}_1 \mathbf{x}_{t-1} + \mathbf{A}_2 \mathbf{x}_{t-2} + \ldots + \mathbf{A}_p \mathbf{x}_{t-p} + \boldsymbol{\varepsilon}_t -\] - -where \(\mathbf{A}_i\) are coefficient matrices and \(\boldsymbol{\varepsilon}_t\) is white noise. 
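-
-As a concrete instance (coefficients invented for illustration), a two-variable VAR(1) in price and demand reads:
-
-\[
-\begin{pmatrix} \text{price}_t \\ \text{demand}_t \end{pmatrix} =
-\begin{pmatrix} 0.8 & 0.1 \\ -0.4 & 0.6 \end{pmatrix}
-\begin{pmatrix} \text{price}_{t-1} \\ \text{demand}_{t-1} \end{pmatrix} + \boldsymbol{\varepsilon}_t
-\]
-
-so each variable's one-step forecast mixes its own lag with the other's, and each row can be estimated by ordinary least squares.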
- -**Example:** - -```python -var_model = agent.vector_autoregression_estimation( - df=time_series_data, - variables=["price", "demand", "inventory"], - max_lag=2 -) - -# Returns coefficient matrices and residuals -``` - -### Causal Discovery - -#### causal_discovery_pc_algorithm() - -PC algorithm for causal structure discovery from data. - -```python -causal_discovery_pc_algorithm( - df: pd.DataFrame, - variables: List[str], - alpha: float = 0.05 -) -> Dict[str, Any] -``` - -**Algorithm Steps:** - -1. Start with complete undirected graph -2. Remove edges if variables are conditionally independent given any subset -3. Orient edges using v-structure detection -4. Apply orientation rules (Meek's rules) - -**Example:** - -```python -# Learn causal structure from data -learned_graph = agent.causal_discovery_pc_algorithm( - df=historical_data, - variables=["price", "demand", "inventory", "cost"], - alpha=0.05 -) - -# Returns learned DAG structure -``` - -### Risk and Uncertainty Quantification - -#### quantify_uncertainty() - -Bootstrap edge strengths and produce confidence intervals. - -```python -quantify_uncertainty( - df: pd.DataFrame, - variables: List[str], - windows: int = 200, - alpha: float = 0.95 -) -> Dict[str, Any] -``` - -**Bootstrap Process:** - -1. Sample data with replacement -2. Re-estimate edge strengths -3. Compute confidence intervals from bootstrap distribution - -**Confidence Interval:** - -\[ -CI_{1-\alpha} = [Q_{\alpha/2}, Q_{1-\alpha/2}] -\] - -where \(Q_p\) is the p-th quantile of bootstrap distribution. - -**Example:** - -```python -uncertainty = agent.quantify_uncertainty( - df=historical_data, - variables=["price", "demand"], - windows=200, - alpha=0.95 -) - -# Returns 95% confidence intervals for all edge strengths -``` - -#### bayesian_edge_inference() - -Bayesian inference for edge strength using conjugate prior. - -```python -bayesian_edge_inference( - df: pd.DataFrame, - parent: str, - child: str, - prior_mu: float = 0.0, - prior_sigma: float = 1.0 -) -> Dict[str, Any] -``` - -**Mathematical Formulation:** - -Prior: \(\beta \sim N(\mu_0, \sigma_0^2)\) - -Posterior: \(\beta \mid \text{data} \sim N(\mu_n, \sigma_n^2)\) - -Posterior mean: - -\[ -\mu_n = \frac{\tau_0 \mu_0 + \tau_{\text{likelihood}} \cdot n \cdot \hat{\beta}_{\text{OLS}}}{\tau_0 + \tau_{\text{likelihood}} \cdot n} -\] - -where \(\tau = 1/\sigma^2\) is precision. - -**Example:** - -```python -# Bayesian inference for price -> demand effect -posterior = agent.bayesian_edge_inference( - df=historical_data, - parent="price", - child="demand", - prior_mu=0.0, - prior_sigma=1.0 -) - -# Returns posterior mean, variance, and credible intervals -``` - -## Real-World Applications - -### Supply Chain Management - -The CR-CA Agent revolutionizes supply chain management by identifying root causes of disruptions and optimizing inventory policies. 
- -**Example: Supply Shock Analysis** - -```python -from swarms.agents import CRCAAgent - -# Initialize agent for supply chain -agent = CRCAAgent( - name="supply-chain-crca", - description="Supply chain causal analysis" -) - -# Build causal graph -agent.causal_graph.add_edges_from([ - ("lead_time", "receipts"), - ("survivability", "receipts"), - ("capacity", "receipts"), - ("receipts", "inventory"), - ("backlog", "price"), - ("price", "demand"), - ("demand", "orders") -]) - -# Fit from historical data -agent.fit_from_dataframe( - df=supply_chain_data, - variables=["lead_time", "receipts", "inventory", "backlog", "price", "demand"], - window=30, - decay_alpha=0.9 -) - -# Analyze port disruption scenario -disruption_analysis = agent.analyze_cascading_chain_reaction( - initial_intervention={"lead_time": 1.5}, # 50% increase - target_outcomes=["inventory", "backlog", "cost"], - max_hops=5, - include_feedback_loops=True -) - -# Find optimal safety stock policy -optimal_policy = agent.gradient_based_intervention_optimization( - initial_state={"safety_stock": 100.0, "backlog": 50.0}, - target="cost", # Minimize total cost - intervention_vars=["safety_stock"], - constraints={"safety_stock": (50.0, 200.0)} -) -``` - -**Key Benefits:** - -1. **Proactive Issue Resolution:** Identifies root causes before they escalate -2. **Optimized Resource Allocation:** Uses causal understanding to allocate safety stock efficiently -3. **Predictive Insights:** Anticipates supply shocks and their cascading effects -4. **Risk-Aware Decisions:** Quantifies uncertainty using CVaR and confidence intervals - -### Financial Market Analysis - -The CR-CA Agent enables sophisticated causal analysis of market dynamics, going beyond correlation to understand true causal drivers. - -**Example: Cryptocurrency Price Analysis** - -```python -# Build causal graph for ETH price analysis -agent = CRCAAgent(name="eth-price-analyzer") - -agent.causal_graph.add_edges_from([ - ("volume", "price"), - ("volatility", "price"), - ("rsi", "price"), - ("momentum", "price"), - ("market_sentiment", "price"), - ("btc_eth_corr", "price") -]) - -# Fit from historical price data -agent.fit_from_dataframe( - df=eth_price_data, - variables=["volume", "volatility", "rsi", "momentum", "market_sentiment", "btc_eth_corr", "price"], - window=30 -) - -# Perform causal analysis -causal_analysis = agent.causal_analysis() - -# Test Granger causality -granger_result = agent.granger_causality_test( - df=eth_price_data, - var1="volume", - var2="price", - max_lag=4 -) - -# Find optimal trading intervention -optimal_trade = agent.gradient_based_intervention_optimization( - initial_state={"holdings": 0.0}, - target="expected_return", - intervention_vars=["position_size"], - constraints={"position_size": (-1.0, 1.0)} -) -``` - -**Key Benefits:** - -1. **Causal Understanding:** Distinguishes true causal drivers from spurious correlations -2. **Predictive Power:** Forecasts price movements based on causal relationships -3. **Risk Management:** Quantifies uncertainty in predictions using confidence intervals -4. **Optimal Strategies:** Finds trading strategies that maximize risk-adjusted returns - -### Government Policy Simulation - -The CR-CA Agent enables sophisticated policy analysis by modeling causal relationships between policy interventions and social outcomes. 
- -**Example: Economic Policy Analysis** - -```python -# Government policy simulation -agent = CRCAAgent(name="policy-simulator") - -# Build comprehensive causal graph -agent.causal_graph.add_edges_from([ - ("income_tax_rate", "disposable_income"), - ("disposable_income", "consumption"), - ("consumption", "gdp"), - ("cash_transfer", "disposable_income"), - ("carbon_tax", "emissions"), - ("emissions", "health_outcomes"), - ("education_spending", "human_capital"), - ("human_capital", "productivity") -]) - -# Fit from economic data -agent.fit_from_dataframe( - df=economic_data, - variables=["income_tax_rate", "cash_transfer", "carbon_tax", - "disposable_income", "consumption", "gdp", - "emissions", "health_outcomes", "inequality"], - window=60 -) - -# Multi-objective optimization: maximize welfare while minimizing inequality -pareto_frontier = agent.evolutionary_multi_objective_optimization( - initial_state={"income_tax_rate": 0.3, "cash_transfer": 0.0}, - objectives={"welfare": 0.7, "inequality": -0.3}, # Negative for minimization - constraints={ - "income_tax_rate": (0.0, 0.5), - "cash_transfer": (0.0, 1000.0) - }, - intervention_vars=["income_tax_rate", "cash_transfer"], - population_size=100, - generations=200 -) - -# Deep root cause analysis of poverty -poverty_roots = agent.deep_root_cause_analysis( - problem_variable="poverty_rate", - max_depth=20, - min_path_strength=0.05 -) -``` - -**Key Benefits:** - -1. **Evidence-Based Policy:** Uses causal inference to evaluate policy effectiveness -2. **Multi-Objective Optimization:** Balances competing objectives (growth vs. equality) -3. **Counterfactual Analysis:** Answers "what-if" questions about policy alternatives -4. **Root Cause Identification:** Traces social problems to their fundamental causes - -## Advanced Features - -### Explainability - -#### shapley_value_attribution() - -Fair attribution of causal effects using Shapley values from cooperative game theory. - -```python -shapley_value_attribution( - baseline_state: Dict[str, float], - target_state: Dict[str, float], - target: str -) -> Dict[str, float] -``` - -**Mathematical Formulation:** - -Shapley value for variable \(i\): - -\[ -\phi_i = \sum_{S \subseteq N \setminus \{i\}} \frac{|S|!(n-|S|-1)!}{n!} \left[v(S \cup \{i\}) - v(S)\right] -\] - -where \(v(S)\) is the outcome when variables in \(S\) are set to target values. - -**Properties:** -- **Efficiency:** \(\sum_i \phi_i = v(N) - v(\emptyset)\) -- **Symmetry:** Variables with identical contributions have equal Shapley values -- **Dummy:** Variables with no effect have zero Shapley value -- **Additivity:** Shapley values are additive across games - -#### integrated_gradients_attribution() - -Path-integrated gradients for causal attribution. - -```python -integrated_gradients_attribution( - baseline_state: Dict[str, float], - target_state: Dict[str, float], - target: str, - n_steps: int = 50 -) -> Dict[str, float] -``` - -**Mathematical Formulation:** - -Integrated gradient along path from baseline \(x^0\) to target \(x\): - -\[ -IG_i = (x_i - x_i^0) \cdot \int_0^1 \frac{\partial f}{\partial x_i}(x^0 + t \cdot (x - x^0)) \, dt -\] - -Approximated using Riemann sum: - -\[ -IG_i \approx (x_i - x_i^0) \cdot \frac{1}{m} \sum_{j=1}^m \frac{\partial f}{\partial x_i}\left(x^0 + \frac{j}{m}(x - x^0)\right) -\] - -### Non-Linear Extensions - -#### nonlinear_scm_prediction() - -Non-linear SCM with interaction terms. 
-
-```python
-nonlinear_scm_prediction(
-    factual_state: Dict[str, float],
-    interventions: Dict[str, float],
-    include_interactions: bool = True
-) -> Dict[str, float]
-```
-
-**Mathematical Formulation:**
-
-Extended model with interactions:
-
-\[
-y = \sum_i \beta_i \cdot x_i + \sum_{i,j} \gamma_{ij} \cdot x_i \cdot x_j + \varepsilon
-\]
-
-where \(\gamma_{ij}\) are interaction coefficients.
-
-**Example:**
-
-```python
-# Add interaction term: price × advertising
-agent.add_interaction_term(
-    node="demand",
-    parent1="price",
-    parent2="advertising",
-    interaction_strength=0.15
-)
-
-# Predict with interactions
-predicted = agent.nonlinear_scm_prediction(
-    factual_state={"price": 100.0, "advertising": 1000.0},
-    interventions={},
-    include_interactions=True
-)
-```
-
-### Temporal Causal Analysis
-
-#### temporal_causal_chain_analysis()
-
-Model distributed lag effects in causal systems.
-
-```python
-temporal_causal_chain_analysis(
-    initial_intervention: Dict[str, float],
-    target: str,
-    time_horizon: int = 10,
-    lag_structure: Optional[Dict[Tuple[str, str], int]] = None
-) -> Dict[str, Any]
-```
-
-**Mathematical Formulation:**
-
-Distributed lag model:
-
-\[
-y_j(t + \tau_{ij}) = \beta_{ij} \cdot x_i(t)
-\]
-
-where \(\tau_{ij}\) is the lag for edge \((i,j)\).
-
-Accumulated effect on a target \(y_j\), summing lagged parent contributions:
-
-\[
-y_j(t) = \sum_i \beta_{ij} \cdot x_i(t - \tau_{ij})
-\]
-
-**Example:**
-
-```python
-# Model that policy changes take 2 periods to affect economy
-lag_structure = {
-    ("tax_rate", "gdp"): 2,
-    ("spending", "gdp"): 1
-}
-
-temporal_analysis = agent.temporal_causal_chain_analysis(
-    initial_intervention={"tax_rate": 0.25},
-    target="gdp",
-    time_horizon=10,
-    lag_structure=lag_structure
-)
-
-# Shows GDP trajectory over 10 periods with delayed effects
-```
-
-## Best Practices
-
-### 1. Causal Graph Construction
-
-**Start with domain knowledge:** Use expert knowledge to initialize the causal graph before data-driven refinement.
-
-```python
-# Good: Start with known causal structure
-agent.causal_graph.add_edges_from([
-    ("cause", "effect"),  # Known from domain knowledge
-])
-
-# Then refine with data
-agent.fit_from_dataframe(df, variables)
-```
-
-**Validate with data:** Use `causal_discovery_pc_algorithm()` to validate and refine the graph structure.
-
-### 2. Data Preparation
-
-**Ensure sufficient data:** The agent requires at least 30 observations per variable for reliable estimation.
-
-**Handle missing values:** The agent automatically handles missing values, but ensure sufficient complete cases.
-
-**Standardize scales:** While the agent standardizes internally, ensure variables are in reasonable ranges.
-
-### 3. Model Validation
-
-**Cross-validation:** Use `cross_validate_edge_strength()` to validate edge strength estimates.
-
-```python
-cv_result = agent.cross_validate_edge_strength(
-    df=historical_data,
-    parent="price",
-    child="demand",
-    n_folds=5
-)
-
-# Lower CV error indicates more reliable estimates
-```
-
-**Bootstrap confidence intervals:** Use `quantify_uncertainty()` to assess estimation uncertainty.
-
-### 4. Intervention Design
-
-**Use constraints:** Always specify realistic constraints for interventions.
+Canonical import +---------------- +Use the canonical agent import in application code: ```python -optimal = agent.gradient_based_intervention_optimization( - initial_state=current_state, - target="profit", - intervention_vars=["price"], - constraints={"price": (min_price, max_price)} # Always specify bounds -) +from swarms.agents.cr_ca_agent import CRCAgent ``` -**Consider risk:** Use CVaR-based risk metrics for high-stakes decisions. - -### 5. Interpretation - -**Use explainability methods:** Leverage Shapley values and integrated gradients to understand model decisions. +Quickstart +---------- +Minimal example — initialize, add edges, evolve state and get counterfactuals: ```python -# Understand why model recommends specific intervention -attribution = agent.shapley_value_attribution( - baseline_state=current_state, - target_state=recommended_state, - target="profit" -) - -# Shows contribution of each variable to predicted profit -``` +from swarms.agents.cr_ca_agent import CRCAgent -## Performance Considerations +agent = CRCAgent(variables=["price", "demand", "inventory"]) +agent.add_causal_relationship("price", "demand", strength=-0.5) +agent.add_causal_relationship("demand", "inventory", strength=-0.2) -### Caching +state = {"price": 100.0, "demand": 1000.0, "inventory": 5000.0} +out = agent.run(state, target_variables=["price", "demand"], max_steps=1) -The agent automatically caches prediction results to improve performance: - -```python -# Enable/disable caching -agent._cache_enabled = True -agent._cache_max_size = 1000 # Maximum cache entries - -# Clear cache when needed -agent.clear_cache() +print("Evolved:", out["evolved_state"]) # evolved world state +for sc in out["counterfactual_scenarios"][:5]: # candidate CFs + print(sc.name, sc.interventions, sc.probability) ``` -### Vectorization - -For batch predictions, use `vectorized_batch_prediction()`: +Agent-style JSON payload example (orchestrators) +------------------------------------------------ ```python -# Process multiple interventions efficiently -interventions = [ - {"price": 90.0}, - {"price": 95.0}, - {"price": 100.0} -] +import json +from swarms.agents.cr_ca_agent import CRCAgent -predictions = agent.vectorized_batch_prediction( - initial_state=base_state, - intervention_batch=interventions -) +agent = CRCAgent(variables=["price","demand","inventory"]) +payload = json.dumps({"price": 100.0, "demand": 1000.0}) +out = agent.run(payload, target_variables=["price"], max_steps=1) +print(out["evolved_state"]) ``` -### Computational Complexity - -- **Graph fitting:** O(n × m × k) where n is window size, m is number of edges, k is number of variables -- **Prediction:** O(k) where k is number of variables (linear in graph size) -- **Root cause analysis:** O(k × d) where d is maximum depth -- **Optimization:** Varies by method (gradient: O(iterations × k), evolutionary: O(population × generations × k)) - -## Limitations and Considerations - -1. **DAG Assumption:** The agent assumes acyclic causal graphs. Cycles are automatically removed by eliminating weakest edges. - -2. **Linearity:** Default model assumes linear relationships. Use `nonlinear_scm_prediction()` for non-linear effects. +Why use `run()` +-------------- +- Accepts both dict and JSON payloads for flexible integration. +- Evolves the world state for `max_steps` using the deterministic evolution + operator, then generates counterfactuals from the evolved state (consistent timelines). +- Returns a compact result dict used across Swarms agents. -3. 
**Confounders:** Unobserved confounders can bias estimates. Use domain knowledge to identify and adjust for known confounders. +Architecture (high level) +------------------------- -4. **Sample Size:** Requires sufficient data (typically 30+ observations per variable) for reliable estimation. - -5. **Causal Discovery:** Structure learning (PC algorithm) is simplified. For complex discovery, consider external tools like TETRAD or PC-stable. - -## Conclusion - -The CR-CA Agent represents a paradigm shift in decision-making systems, moving from correlation-based predictions to causal understanding. By implementing Pearl's Structural Causal Model framework with advanced optimization and risk quantification, it enables: - -- **Proactive Problem Solving:** Identify root causes before issues escalate -- **Evidence-Based Decisions:** Use causal inference to evaluate interventions -- **Optimal Resource Allocation:** Optimize policies based on causal understanding -- **Risk-Aware Planning:** Quantify and manage uncertainty in predictions - -Whether applied to supply chain management, financial analysis, or policy simulation, the CR-CA Agent transforms how organizations understand and manage complex systems. - -## References - -- Pearl, J. (2009). *Causality: Models, Reasoning, and Inference*. Cambridge University Press. -- Pearl, J., & Mackenzie, D. (2018). *The Book of Why: The New Science of Cause and Effect*. Basic Books. -- Spirtes, P., Glymour, C., & Scheines, R. (2000). *Causation, Prediction, and Search*. MIT Press. -- Peters, J., Janzing, D., & Schölkopf, B. (2017). *Elements of Causal Inference*. MIT Press. +```mermaid +flowchart LR + subgraph Ingestion["Input / Ingestion"] + I1["Initial state"] + I2["Historical data"] + end + + subgraph Modeling["Causal Model"] + G1["Causal graph"] + G2["Add/update edges"] + G3["Standardization stats"] + end + + subgraph Preproc["Preprocessing"] + P1["ensure_standardization_stats"] + P2["Standardize to z-space"] + end + + subgraph Engine["Lite Engine"] + T["Topological sort"] + E["predict_outcomes (linear SCM)"] + D["De-standardize outputs"] + R["run (timeline rollout)"] + end + + subgraph CF["Counterfactuals"] + C1["generate_counterfactual_scenarios"] + C2["Abduction–Action–Prediction"] + S["Scenario scoring"] + end + + subgraph Analysis["Outputs / Analysis"] + O1["Evolved state"] + O2["Counterfactual scenarios"] + O3["Causal paths / visualization"] + end + + I1 --> P1 --> P2 --> G1 + I2 --> G2 --> G1 + G3 --> P2 + G1 --> T --> E --> D --> R + R --> C1 --> C2 --> S --> O2 + R --> O1 + T --> O3 + +``` + +Complete method index (quick) +----------------------------- +The following is the public surface implemented by `CRCAgent` in +`swarms/agents/cr_ca_agent.py`. See the code for full docstrings and math. 
+
+Core graph & state
+- `_ensure_node_exists(node)` — ensure node present in internal maps
+- `add_causal_relationship(source, target, strength=1.0, ...)` — add/update edge
+- `_get_parents(node)`, `_get_children(node)` — graph accessors
+- `_topological_sort()` — Kahn's algorithm
+- `get_nodes()`, `get_edges()`, `is_dag()` — graph introspection
+
+Standardization & prediction
+- `set_standardization_stats(var, mean, std)` — set z-stats
+- `ensure_standardization_stats(state)` — auto-fill sensible stats
+- `_standardize_state(state)` / `_destandardize_value(var, z)` — z-score transforms
+- `_predict_outcomes(factual_state, interventions)` — evolution operator (linear SCM)
+- `_predict_outcomes_cached(...)` — cached wrapper
+
+Counterfactuals & reasoning
+- `generate_counterfactual_scenarios(factual_state, target_variables, max_scenarios=5)`
+- `_calculate_scenario_probability(factual_state, interventions)` — heuristic plausibility
+- `counterfactual_abduction_action_prediction(factual_state, interventions)` — abduction–action–prediction (Pearl)
+
+Estimation, analysis & utilities
+- `fit_from_dataframe(df, variables, window=30, ...)` — WLS edge estimation and stats
+- `quantify_uncertainty(df, variables, windows=200, ...)` — bootstrap CIs
+- `analyze_causal_strength(source, target)` — path/edge summary
+- `identify_causal_chain(start, end)` — BFS shortest path
+- `detect_change_points(series, threshold=2.5)` — simple detector
+
+Advanced functions (restricted, but implemented)
+- `learn_structure(...)`, `plan_interventions(...)`, `gradient_based_intervention_optimization(...)`,
+  `convex_intervention_optimization(...)`, `evolutionary_multi_objective_optimization(...)`,
+  `probabilistic_nested_simulation(...)`, `deep_root_cause_analysis(...)`, and more.
+
+Return shape from `run()`
+-------------------------
+`run()` returns a dictionary with at least the following keys:
+- `initial_state`: the provided input state (dict)
+- `evolved_state`: state after applying `max_steps` of the evolution operator
+- `counterfactual_scenarios`: list of `CounterfactualScenario` with name/interventions/expected_outcomes/probability/reasoning
+- `causal_graph_info`: {"nodes": [...], "edges": [...], "is_dag": bool}
+- `steps`: `max_steps` used
+
+Usage patterns & examples
+-------------------------
+1) Script-style (preferred for simple programs)
+
+```python
+agent = CRCAgent(variables=["a","b","c"])
+agent.add_causal_relationship("a","b", strength=0.8)
+state = {"a":1.0, "b":2.0, "c":3.0}
+res = agent.run(state, max_steps=2)
+print(res["evolved_state"])
+```
+
+2) Orchestration / agent-style (JSON payloads)
+
+```python
+payload = '{"a":1.0,"b":2.0,"c":3.0}'
+res = agent.run(payload, max_steps=1)
+if "error" in res:
+    print("Bad payload:", res["error"])
+else:
+    print("Evolved:", res["evolved_state"])
+```
+
+3) Lower-level testing & research
+
+```python
+pred = agent._predict_outcomes({"a":1.0,"b":2.0},{"a":0.0})
+print(pred)
+```
+
+Design notes & limitations
+--------------------------
+- Linearity: default `_predict_outcomes` is linear in standardized z-space. To model non-linear dynamics, subclass `CRCAgent` and override `_predict_outcomes`.
+- Probabilities: scenario probability is a heuristic proximity measure (Mahalanobis-like) — not a formal posterior.
+- Stats: the engine auto-fills standardization stats with sensible defaults (`mean=observed`, `std=1.0`) via `ensure_standardization_stats` to avoid degenerate std=0 cases.
+- Dependencies: Lite intentionally avoids heavy libs (pandas/scipy/cvxpy/LLM) in the core file. + +Extending & integration +----------------------- +For advanced capabilities (structure learning, Bayesian inference, optimization, +LLM-driven analysis), build separate modules that import `CRCAgent` as the +deterministic simulation core and add the richer logic there (keeps Lite auditable). + +References +---------- +- Pearl, J. (2009). *Causality: Models, Reasoning, and Inference*. +- Pearl, J., & Mackenzie, D. (2018). *The Book of Why*. From b53a52ec346d7097981eedb8325da0e1d2b7654d Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 25 Nov 2025 20:59:41 +0200 Subject: [PATCH 09/12] Refactor CRCAgent class and enhance type hints --- swarms/agents/cr_ca_agent.py | 89 ++++++++++++++++++++++++++++++++---- 1 file changed, 81 insertions(+), 8 deletions(-) diff --git a/swarms/agents/cr_ca_agent.py b/swarms/agents/cr_ca_agent.py index 3e0db60b..8e456995 100644 --- a/swarms/agents/cr_ca_agent.py +++ b/swarms/agents/cr_ca_agent.py @@ -10,7 +10,7 @@ This is a minimal implementation of the ASTT/CR-CA framework focusing on: Dependencies: numpy only (typing, dataclasses, enum are stdlib) """ -from typing import Dict, Any, List, Tuple, Optional +from typing import Dict, Any, List, Tuple, Optional, Union import numpy as np from dataclasses import dataclass from enum import Enum @@ -54,7 +54,7 @@ class CounterfactualScenario: reasoning: str = "" -class CRCALite: +class CRCAgent: """ CR-CA Lite: Lightweight Causal Reasoning with Counterfactual Analysis engine. @@ -73,6 +73,7 @@ class CRCALite: self, variables: Optional[List[str]] = None, causal_edges: Optional[List[Tuple[str, str]]] = None, + max_loops: Optional[Union[int, str]] = 1, ): """ Initialize CR-CA Lite engine. @@ -97,6 +98,10 @@ class CRCALite: for source, target in causal_edges: self.add_causal_relationship(source, target) + # Agent-like loop control: accept numeric or "auto" + # Keep the original (possibly "auto") value; resolution happens at run time. 
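+        # ("auto" resolves in run() to one evolution step per graph variable, minimum 1.)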
+ self.max_loops = max_loops + def _ensure_node_exists(self, node: str) -> None: """Ensure node present in graph structures.""" if node not in self.causal_graph: @@ -269,7 +274,7 @@ class CRCALite: Returns: Dictionary of standardized (z-score) values """ - z = {} + z: Dict[str, float] = {} for k, v in state.items(): s = self.standardization_stats.get(k) if s and s.get("std", 0.0) > 0: @@ -399,7 +404,44 @@ class CRCALite: Returns: List of CounterfactualScenario objects """ - # Ensure stats exist for variables in factual_state (fallback behavior)\n+ self.ensure_standardization_stats(factual_state)\n+\n+ scenarios: List[CounterfactualScenario] = []\n+ z_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0]\n+\n+ for i, tv in enumerate(target_variables[:max_scenarios]):\n+ stats = self.standardization_stats.get(tv, {\"mean\": 0.0, \"std\": 1.0})\n+ cur = factual_state.get(tv, stats.get(\"mean\", 0.0))\n+\n+ # If std is zero or missing, use absolute perturbations instead\n+ if not stats or stats.get(\"std\", 0.0) <= 0:\n+ base = cur\n+ abs_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0]\n+ vals = [base + step for step in abs_steps]\n+ else:\n+ mean = stats[\"mean\"]\n+ std = stats[\"std\"]\n+ cz = (cur - mean) / std\n+ vals = [(cz + dz) * std + mean for dz in z_steps]\n+\n+ for j, v in enumerate(vals):\n+ scenarios.append(CounterfactualScenario(\n+ name=f\"scenario_{i}_{j}\",\n+ interventions={tv: float(v)},\n+ expected_outcomes=self._predict_outcomes(factual_state, {tv: float(v)}),\n+ probability=self._calculate_scenario_probability(factual_state, {tv: float(v)}),\n+ reasoning=f\"Intervention on {tv} with value {v}\"\n+ ))\n+\n+ return scenarios\n*** End Patch + # Ensure stats exist for variables in factual_state (fallback behavior) + self.ensure_standardization_stats(factual_state) + + scenarios: List[CounterfactualScenario] = [] + z_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0] + + for i, tv in enumerate(target_variables[:max_scenarios]): + stats = self.standardization_stats.get(tv, {"mean": 0.0, "std": 1.0}) + cur = factual_state.get(tv, stats.get("mean", 0.0)) + + # If std is zero or missing, use absolute perturbations instead + if not stats or stats.get("std", 0.0) <= 0: + base = cur + abs_steps = [-2.0, -1.0, -0.5, 0.5, 1.0, 2.0] + vals = [base + step for step in abs_steps] + else: + mean = stats["mean"] + std = stats["std"] + cz = (cur - mean) / std + vals = [(cz + dz) * std + mean for dz in z_steps] + + for j, v in enumerate(vals): + interventions = {tv: float(v)} + scenarios.append( + CounterfactualScenario( + name=f"scenario_{i}_{j}", + interventions=interventions, + expected_outcomes=self._predict_outcomes( + factual_state, interventions + ), + probability=self._calculate_scenario_probability( + factual_state, interventions + ), + reasoning=f"Intervention on {tv} with value {v}", + ) + ) + + return scenarios def analyze_causal_strength(self, source: str, target: str) -> Dict[str, float]: """ @@ -510,9 +552,9 @@ class CRCALite: def run( self, - initial_state: Dict[str, float], + initial_state: Any, target_variables: Optional[List[str]] = None, - max_steps: int = 1 + max_steps: Union[int, str] = 1 ) -> Dict[str, Any]: """ Run causal simulation: evolve state and generate counterfactuals. 
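+
+        Note: initial_state may be a dict or a JSON-encoded dict, and max_steps
+        may be an int or "auto" (resolved to one evolution step per graph variable).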
@@ -527,13 +569,40 @@
         Returns:
             Dictionary with evolved state, counterfactuals, and graph info
         """
+        # Accept either a dict initial_state or a JSON string (agent-like behavior)
+        if not isinstance(initial_state, dict):
+            try:
+                import json
+                parsed = json.loads(initial_state)
+                if isinstance(parsed, dict):
+                    initial_state = parsed
+                else:
+                    return {"error": "initial_state JSON must decode to a dict"}
+            except Exception:
+                return {"error": "initial_state must be a dict or JSON-encoded dict"}
+
         # Use all nodes as targets if not specified
         if target_variables is None:
             target_variables = list(self.causal_graph.keys())
 
+        # Resolve "auto" sentinel for max_steps (accepts method arg or instance-level default)
+        def _resolve_max_steps(value: Union[int, str]) -> int:
+            if isinstance(value, str) and value == "auto":
+                # Heuristic: one step per variable (at least 1)
+                return max(1, len(self.causal_graph))
+            try:
+                return int(value)
+            except Exception:
+                return max(1, len(self.causal_graph))
+
+        # If the caller left max_steps at its default (1) but the instance sets a different max_loops, prefer the instance value
+        if max_steps == 1 and self.max_loops != 1:
+            max_steps = self.max_loops
+        effective_steps = _resolve_max_steps(max_steps)
+
         # Evolve state
         current_state = initial_state.copy()
-        for step in range(max_steps):
+        for step in range(effective_steps):
             current_state = self._predict_outcomes(current_state, {})
 
         # Ensure standardization stats exist for the evolved state and generate counterfactuals from it
@@ -553,5 +622,9 @@
             "edges": self.get_edges(),
             "is_dag": self.is_dag()
         },
-        "steps": max_steps
+        "steps": effective_steps
     }
+
+
+# Agent-like behavior: `run` accepts either a dict or a JSON string as the initial_state
+# so the engine behaves like a normal agent by default.

From 7f813cfc0c47b1b990a6314fcb58a8b78de8fa9b Mon Sep 17 00:00:00 2001
From: CI-DEV <154627941+IlumCI@users.noreply.github.com>
Date: Tue, 25 Nov 2025 22:48:44 +0200
Subject: [PATCH 10/12] Revise CRCAAgent documentation for clarity and updates

Updated documentation for CRCAAgent to reflect new features and changes,
including LLM integration and dual-mode operation.
---
 docs/swarms/agents/cr_ca_agent.md | 209 ++++++++++++++++++++----------
 1 file changed, 142 insertions(+), 67 deletions(-)

diff --git a/docs/swarms/agents/cr_ca_agent.md b/docs/swarms/agents/cr_ca_agent.md
index 35f9d518..b471b732 100644
--- a/docs/swarms/agents/cr_ca_agent.md
+++ b/docs/swarms/agents/cr_ca_agent.md
@@ -1,120 +1,160 @@
-
-# CRCAgent
+
+# CRCAAgent
 
 Short summary
 -------------
-CRCAgent is a lightweight, auditable causal simulation core implemented in
-pure Python and intended as the deterministic CR‑CA engine for Swarms.
-It focuses on the core ASTT primitives: a causal DAG, a linear structural
+CRCAAgent is a lightweight causal reasoning Agent with LLM integration,
+implemented in pure Python and intended as a flexible CR‑CA engine for Swarms.
+It provides both LLM-based causal analysis and deterministic causal simulation,
+focusing on the core ASTT primitives: a causal DAG, a linear structural
 evolution operator (in z-space), and compact counterfactual generation.
Key properties -- Minimal dependencies (numpy + stdlib) +- LLM integration for sophisticated causal reasoning (like full CRCAAgent) +- Dual-mode operation: LLM-based analysis and deterministic simulation +- Minimal dependencies (numpy + swarms Agent base) - Pure-Python causal graph (adjacency dicts) - Linear SCM evolution by default (overrideable) -- Agent-first `run()` entrypoint (accepts dict or JSON payloads) +- Agent-first `run()` entrypoint (accepts task string or dict/JSON payloads) Canonical import ---------------- Use the canonical agent import in application code: ```python -from swarms.agents.cr_ca_agent import CRCAgent +from swarms.agents.cr_ca_agent import CRCAAgent ``` Quickstart ---------- -Minimal example — initialize, add edges, evolve state and get counterfactuals: +Minimal example — deterministic mode: initialize, add edges, evolve state and get counterfactuals: ```python -from swarms.agents.cr_ca_agent import CRCAgent +from swarms.agents.cr_ca_agent import CRCAAgent -agent = CRCAgent(variables=["price", "demand", "inventory"]) +agent = CRCAAgent(variables=["price", "demand", "inventory"]) agent.add_causal_relationship("price", "demand", strength=-0.5) agent.add_causal_relationship("demand", "inventory", strength=-0.2) state = {"price": 100.0, "demand": 1000.0, "inventory": 5000.0} -out = agent.run(state, target_variables=["price", "demand"], max_steps=1) +out = agent.run(initial_state=state, target_variables=["price", "demand"], max_steps=1) print("Evolved:", out["evolved_state"]) # evolved world state for sc in out["counterfactual_scenarios"][:5]: # candidate CFs print(sc.name, sc.interventions, sc.probability) ``` +LLM-based causal analysis example +---------------------------------- + +```python +from swarms.agents.cr_ca_agent import CRCAAgent + +agent = CRCAAgent( + variables=["price", "demand", "inventory"], + model_name="gpt-4o", + max_loops=3 +) +agent.add_causal_relationship("price", "demand", strength=-0.5) + +# LLM mode: pass task as string +task = "Analyze how increasing price affects demand and inventory levels" +result = agent.run(task=task) + +print("Causal Analysis:", result["causal_analysis"]) +print("Counterfactual Scenarios:", result["counterfactual_scenarios"]) +print("Analysis Steps:", result["analysis_steps"]) +``` + Agent-style JSON payload example (orchestrators) ------------------------------------------------ ```python import json -from swarms.agents.cr_ca_agent import CRCAgent +from swarms.agents.cr_ca_agent import CRCAAgent -agent = CRCAgent(variables=["price","demand","inventory"]) +agent = CRCAAgent(variables=["price","demand","inventory"]) payload = json.dumps({"price": 100.0, "demand": 1000.0}) -out = agent.run(payload, target_variables=["price"], max_steps=1) +out = agent.run(initial_state=payload, target_variables=["price"], max_steps=1) print(out["evolved_state"]) ``` Why use `run()` -------------- -- Accepts both dict and JSON payloads for flexible integration. -- Evolves the world state for `max_steps` using the deterministic evolution - operator, then generates counterfactuals from the evolved state (consistent timelines). -- Returns a compact result dict used across Swarms agents. 
+- **Dual-mode operation**: Automatically selects LLM mode (task string) or deterministic mode (initial_state dict) +- **LLM mode**: Performs sophisticated multi-loop causal reasoning with structured output +- **Deterministic mode**: Evolves the world state for `max_steps` using the deterministic evolution + operator, then generates counterfactuals from the evolved state (consistent timelines) +- Accepts both dict and JSON payloads for flexible integration +- Returns a compact result dict used across Swarms agents Architecture (high level) ------------------------- ```mermaid -flowchart LR - subgraph Ingestion["Input / Ingestion"] - I1["Initial state"] - I2["Historical data"] +flowchart TB + subgraph Input[Input] + I1[Task string] + I2[Initial state dict] end - subgraph Modeling["Causal Model"] - G1["Causal graph"] - G2["Add/update edges"] - G3["Standardization stats"] - end + I1 -->|String| LLM[LLM Mode] + I2 -->|Dict| DET[Deterministic Mode] - subgraph Preproc["Preprocessing"] - P1["ensure_standardization_stats"] - P2["Standardize to z-space"] + subgraph LLMFlow[LLM Causal Analysis] + LLM --> P1[Build Causal Prompt] + P1 --> L1[LLM Step 1] + L1 --> L2[LLM Step 2...N] + L2 --> SYN[Synthesize Analysis] + SYN --> CF1[Generate Counterfactuals] end - subgraph Engine["Lite Engine"] - T["Topological sort"] - E["predict_outcomes (linear SCM)"] - D["De-standardize outputs"] - R["run (timeline rollout)"] + subgraph DetFlow[Deterministic Simulation] + DET --> P2[ensure_standardization_stats] + P2 --> P3[Standardize to z-space] + P3 --> T[Topological sort] + T --> E[predict_outcomes linear SCM] + E --> D[De-standardize outputs] + D --> R[Timeline rollout] + R --> CF2[Generate Counterfactuals] end - subgraph CF["Counterfactuals"] - C1["generate_counterfactual_scenarios"] - C2["Abduction–Action–Prediction"] - S["Scenario scoring"] + subgraph Model[Causal Model] + G1[Causal graph] + G2[Edge strengths] + G3[Standardization stats] end - subgraph Analysis["Outputs / Analysis"] - O1["Evolved state"] - O2["Counterfactual scenarios"] - O3["Causal paths / visualization"] + subgraph Output[Outputs] + O1[Causal analysis / Evolved state] + O2[Counterfactual scenarios] + O3[Causal graph info] end - I1 --> P1 --> P2 --> G1 - I2 --> G2 --> G1 - G3 --> P2 - G1 --> T --> E --> D --> R - R --> C1 --> C2 --> S --> O2 + G1 --> LLMFlow + G1 --> DetFlow + G2 --> DetFlow + G3 --> DetFlow + CF1 --> O2 + CF2 --> O2 + SYN --> O1 R --> O1 - T --> O3 - + G1 --> O3 ``` Complete method index (quick) ----------------------------- -The following is the public surface implemented by `CRCAgent` in -`swarms/agents/cr_ca_agent.py`. See the code for full docstrings and math. +The following is the public surface implemented by `CRCAAgent` (Lite) in +`ceca_lite/crca-lite.py` (canonical import: `swarms/agents/cr_ca_agent.py`). +See the code for full docstrings and math. 
+ +LLM integration +- `_get_cr_ca_schema()` — CR-CA function calling schema for structured reasoning +- `step(task)` — Execute a single step of LLM-based causal reasoning +- `_build_causal_prompt(task)` — Build causal analysis prompt with graph context +- `_build_memory_context()` — Build memory context from previous analysis steps +- `_synthesize_causal_analysis(task)` — Synthesize final causal analysis using LLM +- `_run_llm_causal_analysis(task)` — Run multi-loop LLM-based causal analysis Core graph & state - `_ensure_node_exists(node)` — ensure node present in internal maps @@ -142,14 +182,23 @@ Estimation, analysis & utilities - `identify_causal_chain(start, end)` — BFS shortest path - `detect_change_points(series, threshold=2.5)` — simple detector -Advanced functions (Restricted((Does exist))) +Advanced (optional / Pro) - `learn_structure(...)`, `plan_interventions(...)`, `gradient_based_intervention_optimization(...)`, `convex_intervention_optimization(...)`, `evolutionary_multi_objective_optimization(...)`, `probabilistic_nested_simulation(...)`, `deep_root_cause_analysis(...)`, and more. Return shape from `run()` ------------------------- -`run()` returns a dictionary with at least the following keys: +`run()` returns a dictionary with different keys depending on mode: + +**LLM Mode** (when `task` is a string): +- `task`: the provided task/problem string +- `causal_analysis`: synthesized causal analysis report (string) +- `counterfactual_scenarios`: list of `CounterfactualScenario` objects +- `causal_graph_info`: {"nodes": [...], "edges": [...], "is_dag": bool} +- `analysis_steps`: list of analysis steps with memory context + +**Deterministic Mode** (when `initial_state` is a dict): - `initial_state`: the provided input state (dict) - `evolved_state`: state after applying `max_steps` of the evolution operator - `counterfactual_scenarios`: list of `CounterfactualScenario` with name/interventions/expected_outcomes/probability/reasoning @@ -158,28 +207,45 @@ Return shape from `run()` Usage patterns & examples ------------------------- -1) Script-style (preferred for simple programs) +1) LLM-based causal analysis (sophisticated reasoning) ```python -agent = CRCAgent(variables=["a","b","c"]) +agent = CRCAAgent( + variables=["a","b","c"], + model_name="gpt-4o", + max_loops=3 +) +agent.add_causal_relationship("a","b", strength=0.8) + +# LLM mode: pass task as string +task = "Analyze the causal relationship between a and b" +res = agent.run(task=task) +print(res["causal_analysis"]) +print(res["analysis_steps"]) +``` + +2) Deterministic simulation (script-style) + +```python +agent = CRCAAgent(variables=["a","b","c"]) agent.add_causal_relationship("a","b", strength=0.8) state = {"a":1.0, "b":2.0, "c":3.0} -res = agent.run(state, max_steps=2) +res = agent.run(initial_state=state, max_steps=2) print(res["evolved_state"]) ``` -2) Orchestration / agent-style (JSON payloads) +3) Orchestration / agent-style (JSON payloads) ```python payload = '{"a":1.0,"b":2.0,"c":3.0}' -res = agent.run(payload, max_steps=1) +res = agent.run(initial_state=payload, max_steps=1) if "error" in res: print("Bad payload:", res["error"]) else: print("Evolved:", res["evolved_state"]) ``` -3) Lower-level testing & research +4) Lower-level testing & research ```python pred = agent._predict_outcomes({"a":1.0,"b":2.0},{"a":0.0}) @@ -188,19 +254,28 @@ print(pred) Design notes & limitations -------------------------- -- Linearity: default `_predict_outcomes` is linear in standardized z-space. 
To model non-linear dynamics, subclass `CRCAgent` and override `_predict_outcomes`. -- Probabilities: scenario probability is a heuristic proximity measure (Mahalanobis-like) — not a formal posterior. -- Stats: the engine auto-fills standardization stats with sensible defaults (`mean=observed`, `std=1.0`) via `ensure_standardization_stats` to avoid degenerate std=0 cases. -- Dependencies: Lite intentionally avoids heavy libs (pandas/scipy/cvxpy/LLM) in the core file. +- **LLM Integration**: Uses swarms Agent infrastructure for LLM calls. Configure model via `model_name` parameter. Multi-loop reasoning enabled by default. +- **Dual-mode operation**: Automatically selects LLM mode (task string) or deterministic mode (initial_state dict). Both modes generate counterfactuals using deterministic methods. +- **Linearity**: default `_predict_outcomes` is linear in standardized z-space. To model non-linear dynamics, subclass `CRCAAgent` and override `_predict_outcomes`. +- **Probabilities**: scenario probability is a heuristic proximity measure (Mahalanobis-like) — not a formal posterior. +- **Stats**: the engine auto-fills standardization stats with sensible defaults (`mean=observed`, `std=1.0`) via `ensure_standardization_stats` to avoid degenerate std=0 cases. +- **Dependencies**: Lite intentionally avoids heavy libs (pandas/scipy/cvxpy) but includes LLM integration via swarms Agent base. Extending & integration ----------------------- For advanced capabilities (structure learning, Bayesian inference, optimization, -LLM-driven analysis), build separate modules that import `CRCAgent` as the -deterministic simulation core and add the richer logic there (keeps Lite auditable). +extensive statistical methods), use the full `CRCAAgent` in `swarms/agents/cr_ca_agent.py`. +The Lite version provides core causal reasoning with LLM support while maintaining minimal dependencies. References ---------- - Pearl, J. (2009). *Causality: Models, Reasoning, and Inference*. - Pearl, J., & Mackenzie, D. (2018). *The Book of Why*. +--- +CRCAAgent (Lite) — lightweight causal reasoning Agent with LLM integration for Swarms. + +Implementation: `ceca_lite/crca-lite.py` +Canonical import: `from swarms.agents.cr_ca_agent import CRCAAgent` + + From d0b2a96824abc5ac20ee4c10125487dd9f65518e Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Tue, 25 Nov 2025 22:49:56 +0200 Subject: [PATCH 11/12] Delete examples/demos/logistics/crca_supply_shock_agent.py --- .../logistics/crca_supply_shock_agent.py | 1887 ----------------- 1 file changed, 1887 deletions(-) delete mode 100644 examples/demos/logistics/crca_supply_shock_agent.py diff --git a/examples/demos/logistics/crca_supply_shock_agent.py b/examples/demos/logistics/crca_supply_shock_agent.py deleted file mode 100644 index 3cee1163..00000000 --- a/examples/demos/logistics/crca_supply_shock_agent.py +++ /dev/null @@ -1,1887 +0,0 @@ -import math -from dataclasses import dataclass -from typing import Dict, List, Tuple, Optional, Any - -import numpy as np -import pandas as pd -from loguru import logger -import json -import re -import warnings - -from swarms import Agent -from swarms.agents import CRCAAgent - - -SUPPLY_AGENT_PROMPT = """ -You are an expert supply chain analyst with deep knowledge of multi-echelon inventory, logistics, and robust control. -You analyze telemetry and SCM outputs, apply causal reasoning, and propose safe, actionable interventions. 
- -Data-awareness: -- Consider lead time (L), survival/transport factor (phi), capacity (K), backlog (B), inventory (I), demand (D), orders (O), receipts (R), price (p). -- Reference learned causal edges when explaining recommendations (e.g., B→p+, I→p−, dcost→p+, L→R−, D→O+). - -Uncertainty and risk: -- Note regime shifts or drift (EWMA/CUSUM/BOCPD). Prefer conservative actions when uncertainty is high. -- Propose z_alpha updates, reroute/expedite shares with CVaR-style caution and execution realism. - -Guardrails: -- Avoid claims beyond the data window. Keep recommendations feasible under capacity and service constraints. -- Prefer stable signals and explain trade-offs (service vs. cost vs. bullwhip). - -Output structure (always include these 7 sections): -1) Drivers: succinct causal drivers (e.g., L↑→R↓→I↓→B↑→p↑; dcost↑→p↑→D↓) -2) Regime/Alerts: note EWMA/CUSUM/BOCPD, utilization, and stability -3) Proposal: recommended z_alpha, reroute/expedite, and rationale -4) Expected Impact: service, cost proxy, bullwhip changes (direction and rough magnitude) -5) Risks/Uncertainty: cite instability or wide uncertainty; suggest mitigations -6) Counterfactuals: 1–2 do()-style scenarios and expected KPI shifts -7) Actionables: concrete next steps and monitoring items - -Learned DAG alignment: -- Mirror the learned DAG strengths exactly in your explanation. Do not claim effects whose learned strength is ~0. If L→R≈0 or R→I≈0, reflect that and avoid relying on those edges. Base rationale on the actual learned edges provided. - -After the 7 sections, you MUST output a final JSON object on a new line with the exact schema: -{ - "proposal": {"z_alpha_new": number, "reroute_share": number, "expedite_share": number, "dual_source_share": number}, - "notes": string, - "expected_deltas": {"service": number, "cost_proxy": number, "bullwhip": number}, - "ci80": {"service": [low, high], "cost_proxy": [low, high], "bullwhip": [low, high]}, - "feasible": boolean -} -Numbers should be in [0, 3] for z_alpha_new, [0, 1] for shares. -""" - - -@dataclass -class SKUKey: - sku: str - facility: str - - -@dataclass -class PolicyParams: - z_alpha: float = 1.28 # base safety factor (approx 90%) - theta_smoothing: float = 0.35 # order smoothing parameter - - -@dataclass -class Elasticities: - eta_c: float = 0.3 # pass-through elasticity to price from cost changes - eta_B: float = 0.5 # price increases with backlog - eta_I: float = 0.3 # price decreases with inventory - - -class SupplyShockCRCAgent: - """CR-CA Supply-Shock Agent for multi-period inventory flows and interventions. - - Implements SCM flow, queueing-derived lead times, pricing pass-through, and - integrates CRCAAgent for causal analysis and do()-counterfactuals. 
- """ - - def __init__( - self, - skus: List[SKUKey], - T: int = 60, - policy: PolicyParams = PolicyParams(), - el: Elasticities = Elasticities(), - seed: int = 7, - ) -> None: - self.skus = skus - self.T = T - self.policy = policy - self.el = el - self.rng = np.random.default_rng(seed) - - # Core data containers (panel: period x (sku,facility)) - index = pd.MultiIndex.from_tuples( - [(t, k.sku, k.facility) for t in range(T) for k in skus], - names=["t", "sku", "facility"], - ) - self.df = pd.DataFrame(index=index) - - # Initialize states with simple priors - self.df["D"] = self.rng.poisson(100, len(self.df)) # demand - self.df["I"] = 120.0 # on-hand - self.df["B"] = 0.0 # backorder - self.df["P"] = 80.0 # pipeline - self.df["O"] = 0.0 # orders placed - self.df["R"] = 0.0 # receipts - self.df["K"] = 1e6 # facility capacity (big default) - self.df["phi"] = 1.0 # spoilage/survival fraction - self.df["L"] = self.rng.integers(1, 4, len(self.df)).astype(float) # lead time in periods (float for updates) - self.df["c"] = 10.0 # unit cost - self.df["dcost"] = 0.0 # cost change - self.df["p_bar"] = 15.0 - self.df["p"] = self.df["p_bar"] - self.df["D_ref"] = 100.0 - - # CR-CA causal layer - self.crca = CRCAAgent( - name="crca-supply-shock", - description="Causal layer for supply shocks and policy", - model_name="gpt-4o-mini", - max_loops=2, - ) - self._build_causal_graph() - - # VSM overlay components (S2-S5) - self.vsm = VSMOverlay() - - # Narrative LLM agent (graceful init) - try: - self.agent = Agent( - agent_name="CRCA-Supply-Shock-Agent", - system_prompt=SUPPLY_AGENT_PROMPT, - model_name="gpt-4o", - max_loops=1, - autosave=False, - dashboard=True, - verbose=False, - dynamic_temperature_enabled=True, - context_length=200000, - output_type="string", - streaming_on=False, - ) - except Exception as e: - logger.warning(f"LLM Agent init failed (narrative disabled): {e}") - self.agent = None - - # Feasibility config and last applied controls - self.lane_capacity: float = 0.35 # max share sum for reroute+expedite+dual_source per cycle - self.max_weekly_change: Dict[str, float] = {"z_alpha_new": 0.3, "reroute_share": 0.15, "expedite_share": 0.15, "dual_source_share": 0.2} - self.last_controls: Dict[str, float] = {"z_alpha_new": self.policy.z_alpha, "reroute_share": 0.0, "expedite_share": 0.0, "dual_source_share": 0.0} - # KPI normalization scalers - self.kpi_units = {"service": "%", "cost_proxy": "currency", "bullwhip": "ratio"} - self.cost_unit_multiplier = 1.0 - # KPI/action history and RL weights - self.kpi_history: List[Dict[str, float]] = [] - self.action_history: List[Dict[str, float]] = [] - self.mpc_weights: Dict[str, float] = {"service": 1.0, "cost": 1.0, "bullwhip": 0.5} - # Dynamic data feeds - self._feeds: Dict[str, Any] = {} - # Direct pricing lever (applied as an offset to p_bar during simulate) - self._price_adjust: float = 0.0 - - # ===== Helper: logistics lever support from learned DAG ===== - def _logistics_support_from_strengths(self, strengths: Dict[str, float], tol: float = 0.05) -> bool: - keys = ["L->R", "phi->R", "K->R"] - return any(abs(float(strengths.get(k, 0.0))) > tol for k in keys) - - # ===== Helper: calibrate z to target service via short grid search ===== - def calibrate_z_to_service(self, target_service: float = 0.95, z_grid: Optional[np.ndarray] = None) -> float: - if z_grid is None: - z_grid = np.linspace(0.8, 2.6, 10) - best_z = self.policy.z_alpha - best_val = float("inf") - # Snapshot current policy - z_prev = self.policy.z_alpha - try: - for z in z_grid: - 
self.policy.z_alpha = float(z) - df = self.simulate() - kpi = self.summarize(df) - # distance to target with slight cost penalty to avoid extreme z - val = abs(float(kpi.get("service_level", 0.0)) - target_service) + 0.01 * max(0.0, float(kpi.get("cost_proxy", 0.0))) - if val < best_val: - best_val = val - best_z = float(z) - finally: - self.policy.z_alpha = z_prev - return best_z - - # ===== Helper: minimal Pareto grid on (z, r, e) ===== - def pareto_front(self, base_z: float, allow_logistics: bool, trials: int = 30, allow_price: bool = False) -> List[Dict[str, Any]]: - z_vals = np.clip(np.linspace(base_z - 0.2, base_z + 0.2, 5), 0.5, 3.0) - r_vals = [0.0, 0.05, 0.1] if allow_logistics else [0.0] - e_vals = [0.0, 0.05, 0.1] if allow_logistics else [0.0] - p_vals = [0.0, -0.5, -1.0] if allow_price else [0.0] - points: List[Dict[str, Any]] = [] - for z in z_vals: - for r in r_vals: - for e in e_vals: - for p in p_vals: - imp = self._quantified_impact(float(z), float(r), float(e), trials=trials, price_adjust=float(p)) - exp = imp.get("expected", {}) - points.append({ - "z_alpha_new": float(z), - "reroute_share": float(r), - "expedite_share": float(e), - "price_adjust": float(p), - "expected": exp, - "ci80": imp.get("ci80", {}), - "cvar_loss": imp.get("cvar_loss", 0.0), - }) - # Pareto filter: maximize service, minimize cost and bullwhip - def dominates(a: Dict[str, Any], b: Dict[str, Any]) -> bool: - ea, eb = a["expected"], b["expected"] - svc_a, cost_a, bw_a = ea.get("service", 0.0), ea.get("cost_proxy", 0.0), ea.get("bullwhip", 0.0) - svc_b, cost_b, bw_b = eb.get("service", 0.0), eb.get("cost_proxy", 0.0), eb.get("bullwhip", 0.0) - return (svc_a >= svc_b and cost_a <= cost_b and bw_a <= bw_b) and (svc_a > svc_b or cost_a < cost_b or bw_a < bw_b) - pareto: List[Dict[str, Any]] = [] - for p in points: - if not any(dominates(q, p) for q in points if q is not p): - pareto.append(p) - return pareto - - def z_service_curve(self, z_values: Optional[np.ndarray] = None) -> List[Dict[str, float]]: - if z_values is None: - z_values = np.linspace(0.8, 2.6, 10) - curve: List[Dict[str, float]] = [] - z_prev = self.policy.z_alpha - try: - for z in z_values: - self.policy.z_alpha = float(z) - df = self.simulate() - k = self.summarize(df) - curve.append({"z": float(z), "service": float(k.get("service_level", 0.0)), "cost_proxy": float(k.get("cost_proxy", 0.0))}) - finally: - self.policy.z_alpha = z_prev - return curve - - # ===== Real-world KPI ingestion ===== - def ingest_kpis(self, kpis: Dict[str, float]) -> None: - """Ingest external KPIs (e.g., service %, cost, bullwhip) and store history.""" - safe = { - "service": float(kpis.get("service", np.nan)), - "cost_proxy": float(kpis.get("cost_proxy", np.nan)), - "bullwhip": float(kpis.get("bullwhip", np.nan)), - } - self.kpi_history.append(safe) - - # ===== Dynamic data feeds ===== - def register_feed(self, name: str, fetch_fn: Any) -> None: - """Register a callable that returns dicts to merge into df or KPIs.""" - self._feeds[name] = fetch_fn - - def poll_feeds(self) -> Dict[str, Any]: - """Poll all feeds and merge into state; return a snapshot of updates.""" - updates: Dict[str, Any] = {} - for name, fn in list(self._feeds.items()): - try: - data = fn() - updates[name] = data - # If KPI-like, ingest; else if dataframe-like keys, merge shallowly - if isinstance(data, dict) and set(["service", "cost_proxy", "bullwhip"]).issubset(set(data.keys())): - self.ingest_kpis(data) - # Extend here to merge time-series; keeping simple for now - except Exception as e: 
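# Illustrative sketch (editor's addition, not from the deleted file): the
# Pareto filter in pareto_front() above keeps a point only if no other point
# dominates it -- >= service, <= cost, <= bullwhip, with at least one strict
# inequality. A self-contained version with hypothetical key names:
from typing import Dict, List

def pareto_filter(points: List[Dict[str, float]]) -> List[Dict[str, float]]:
    def dominates(a: Dict[str, float], b: Dict[str, float]) -> bool:
        weak = (a["service"] >= b["service"] and a["cost"] <= b["cost"]
                and a["bullwhip"] <= b["bullwhip"])
        strict = (a["service"] > b["service"] or a["cost"] < b["cost"]
                  or a["bullwhip"] < b["bullwhip"])
        return weak and strict
    return [p for p in points if not any(dominates(q, p) for q in points if q is not p)]

pts = [
    {"service": 0.95, "cost": 10.0, "bullwhip": 1.2},
    {"service": 0.94, "cost": 11.0, "bullwhip": 1.3},  # dominated by the first
    {"service": 0.97, "cost": 14.0, "bullwhip": 1.1},  # better service, pricier
]
assert len(pareto_filter(pts)) == 2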
- updates[name] = {"error": str(e)} - return updates - - # ===== Action validation and rollback ===== - def validate_and_rollback( - self, - new_kpis: Dict[str, float], - thresholds: Dict[str, float] = None, - ) -> Dict[str, Any]: - """Validate last applied action against fresh KPIs; rollback if violated. - - thresholds: {"min_service_gain": 0.0, "max_cost_increase": 0.0, "max_bullwhip_increase": 0.0} - """ - if thresholds is None: - thresholds = {"min_service_gain": 0.0, "max_cost_increase": 0.0, "max_bullwhip_increase": 0.0} - if not self.kpi_history: - self.ingest_kpis(new_kpis) - return {"rolled_back": False, "reason": "no_baseline"} - prev = self.kpi_history[-1] - self.ingest_kpis(new_kpis) - ds = float(new_kpis.get("service", 0.0) - (prev.get("service", 0.0) if prev.get("service") is not None else 0.0)) - dc = float(new_kpis.get("cost_proxy", 0.0) - (prev.get("cost_proxy", 0.0) if prev.get("cost_proxy") is not None else 0.0)) - db = float(new_kpis.get("bullwhip", 0.0) - (prev.get("bullwhip", 0.0) if prev.get("bullwhip") is not None else 0.0)) - violate = (ds < thresholds["min_service_gain"]) or (dc > thresholds["max_cost_increase"]) or (db > thresholds["max_bullwhip_increase"]) - if violate and self.action_history: - # rollback: revert to previous controls, dampen risky knobs - last = self.action_history[-1] - self.policy.z_alpha = float(last.get("z_alpha_prev", self.policy.z_alpha)) - self.last_controls["z_alpha_new"] = self.policy.z_alpha - for k in ["reroute_share", "expedite_share", "dual_source_share"]: - self.last_controls[k] = max(0.0, self.last_controls.get(k, 0.0) * 0.5) - return {"rolled_back": True, "reason": "threshold_violation", "delta": {"service": ds, "cost": dc, "bullwhip": db}} - return {"rolled_back": False, "reason": "ok", "delta": {"service": ds, "cost": dc, "bullwhip": db}} - - # ===== Reinforcement-based self-tuning ===== - def reinforce_from_outcome(self, expected: Dict[str, float]) -> Dict[str, float]: - """Update MPC weights from outcome using a simple reward: r = dS - a*max(0,dC) - b*max(0,dB).""" - dS = float(expected.get("service", 0.0)) - dC = float(expected.get("cost_proxy", 0.0)) - dB = float(expected.get("bullwhip", 0.0)) - a, b, lr = 1.0, 0.5, 0.1 - reward = dS - a * max(0.0, dC) - b * max(0.0, dB) - # Increase emphasis on service if reward positive; else increase cost/bullwhip penalty - if reward >= 0: - self.mpc_weights["service"] = float(min(2.0, self.mpc_weights.get("service", 1.0) + lr * reward)) - self.mpc_weights["cost"] = float(max(0.2, self.mpc_weights.get("cost", 1.0) * (1.0 - 0.05))) - else: - self.mpc_weights["cost"] = float(min(2.0, self.mpc_weights.get("cost", 1.0) + lr * (-reward))) - self.mpc_weights["bullwhip"] = float(min(2.0, self.mpc_weights.get("bullwhip", 0.5) + lr * 0.5 * (-reward))) - return dict(self.mpc_weights) - - def _feasible(self, proposal: Dict[str, Any]) -> bool: - rr = float(proposal.get("reroute_share", 0.0)) - ex = float(proposal.get("expedite_share", 0.0)) - ds = float(proposal.get("dual_source_share", 0.0)) - if rr < 0 or ex < 0: - return False - if rr + ex + ds > self.lane_capacity: - return False - # rate limits - for k, cap in self.max_weekly_change.items(): - prev = float(self.last_controls.get(k, 0.0)) - cur = float(proposal.get(k, prev)) - if abs(cur - prev) > cap: - return False - return True - - def _quantified_impact(self, z_new: float, rr: float, ex: float, trials: int = 100, price_adjust: float = 0.0, alpha: float = 0.9) -> Dict[str, Any]: - # Run small Monte Carlo by injecting noise on D and L; 
measure KPI deltas - base = self.simulate() - base_kpi = self.summarize(base) - deltas = [] - rng = self.rng - saved_price_adj = self._price_adjust - for _ in range(trials): - # stochastic shocks via temporary tweaks - shock = {"stochastic": True} - self.policy.z_alpha = z_new - # approximate expedite/reroute: reduce L and increase phi within shares - self.df["phi"] = np.clip(self.df["phi"] * (1.0 + 0.1 * rr), 0.2, 1.2) - self.df["L"] = np.clip(self.df["L"] * (1.0 - 0.2 * ex), 1.0, None) - self._price_adjust = float(price_adjust) - sim = self.simulate(interventions=None) - kpi = self.summarize(sim) - deltas.append({ - "service": float(kpi["service_level"] - base_kpi["service_level"]), - "cost_proxy": float(kpi["cost_proxy"] - base_kpi["cost_proxy"]), - "bullwhip": float(kpi["bullwhip"] - base_kpi["bullwhip"]), - }) - # restore controls - self._price_adjust = saved_price_adj - # Aggregate - svc = np.array([d["service"] for d in deltas]) - cst = np.array([d["cost_proxy"] for d in deltas]) - bwe = np.array([d["bullwhip"] for d in deltas]) - def ci80(arr: np.ndarray) -> Tuple[float, float]: - return float(np.quantile(arr, 0.1)), float(np.quantile(arr, 0.9)) - def ci95(arr: np.ndarray) -> Tuple[float, float]: - return float(np.quantile(arr, 0.025)), float(np.quantile(arr, 0.975)) - loss = cst - svc + bwe - thr = float(np.quantile(loss, alpha)) - cvar = float(loss[loss >= thr].mean()) if np.any(loss >= thr) else float(loss.mean()) - return { - "expected": {"service": float(np.mean(svc)), "cost_proxy": float(np.mean(cst)), "bullwhip": float(np.mean(bwe))}, - "ci80": {"service": ci80(svc), "cost_proxy": ci80(cst), "bullwhip": ci80(bwe)}, - "ci95": {"service": ci95(svc), "cost_proxy": ci95(cst), "bullwhip": ci95(bwe)}, - "samples": {"service": svc.tolist(), "cost_proxy": cst.tolist(), "bullwhip": bwe.tolist()}, - "cvar_alpha": alpha, - "cvar_loss": cvar, - } - - # ===== CVaR grid minimizer (discrete neighborhood search) ===== - def cvar_select_from_grid( - self, - base: Dict[str, float], - alpha: float = 0.9, - eps: float = 0.05, - trials: int = 40, - weights: Optional[Dict[str, float]] = None, - ) -> Dict[str, Any]: - """Pick among a small grid around base (z,r,e,ds) to minimize CVaR_alpha of loss. 
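# Illustrative sketch (editor's addition, not from the deleted file):
# _quantified_impact() above reports CVaR_alpha of the scalar loss
# (loss = cost - service + bullwhip deltas), i.e. the mean of the losses at
# or beyond the alpha-quantile. In isolation:
import numpy as np

def cvar(loss: np.ndarray, alpha: float = 0.9) -> float:
    threshold = np.quantile(loss, alpha)   # tail cut-off
    tail = loss[loss >= threshold]         # worst (1 - alpha) share of samples
    return float(tail.mean()) if tail.size else float(loss.mean())

samples = np.random.default_rng(0).normal(0.0, 1.0, 10_000)
print(round(cvar(samples, 0.9), 2))  # ~1.75 for a standard normal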
- - loss = w_cost*Δcost - w_service*Δservice + w_bw*Δbullwhip - """ - if weights is None: - weights = {"cost": 1.0, "service": 1.0, "bullwhip": 0.5} - z0 = float(base.get("z_alpha_new", self.policy.z_alpha)) - r0 = float(base.get("reroute_share", 0.0)) - e0 = float(base.get("expedite_share", 0.0)) - ds0 = float(base.get("dual_source_share", 0.0)) - cand = [ - {"z": z0, "r": r0, "e": e0}, - {"z": z0+eps, "r": r0, "e": e0}, - {"z": z0, "r": r0+eps, "e": e0}, - {"z": z0, "r": r0, "e": e0+eps}, - {"z": z0-eps, "r": r0, "e": e0}, - ] - best = None - best_val = float("inf") - tail_q = alpha - for c in cand: - imp = self._quantified_impact(c["z"], c["r"], c["e"], trials=trials) - svc = np.array(imp["samples"]["service"]) # Δservice - cst = np.array(imp["samples"]["cost_proxy"]) # Δcost - bwe = np.array(imp["samples"]["bullwhip"]) # Δbullwhip - loss = weights["cost"] * cst - weights["service"] * svc + weights["bullwhip"] * bwe - thresh = np.quantile(loss, tail_q) - cvar = float(loss[loss >= thresh].mean()) if np.any(loss >= thresh) else float(loss.mean()) - if cvar < best_val: - best_val = cvar - best = {"z_alpha_new": c["z"], "reroute_share": c["r"], "expedite_share": c["e"], "dual_source_share": ds0} - return {"choice": best, "cvar": best_val, "alpha": alpha} - - @staticmethod - def _extract_final_json(text: str) -> Optional[Dict[str, Any]]: - try: - # Find the last JSON-like block with required keys - matches = re.findall(r"\{[\s\S]*?\}", text) - for chunk in reversed(matches): - if '"proposal"' in chunk and '"z_alpha_new"' in chunk: - return json.loads(chunk) - except Exception: - return None - return None - - @staticmethod - def _validate_proposal(p: Dict[str, Any]) -> Optional[Dict[str, float]]: - try: - z = float(np.clip(float(p.get("z_alpha_new")), 0.0, 3.0)) - rr = float(np.clip(float(p.get("reroute_share")), 0.0, 1.0)) - ex = float(np.clip(float(p.get("expedite_share")), 0.0, 1.0)) - return {"z_alpha_new": z, "reroute_share": rr, "expedite_share": ex} - except Exception: - return None - - def _llm_decision_loop( - self, - panel: pd.DataFrame, - s2: Dict[str, Any], - proposal: Optional[Dict[str, Any]], - decision: Dict[str, Any], - strengths: Dict[str, float], - kpis: Dict[str, Any], - rounds: int = 3, - ) -> Tuple[str, Optional[Dict[str, Any]]]: - if self.agent is None: - return "analysis_unavailable: agent_not_initialized", proposal - - alerts = s2.get("alerts", []) - ai_out: Any = "" - for r in range(rounds): - # Edge guidance for narration - top_edges = sorted(strengths.items(), key=lambda kv: abs(kv[1]), reverse=True)[:5] - weak_edges = [k for k, v in strengths.items() if abs(v) <= 0.05] - narrative_prompt = ( - f"Round {r+1}/{rounds}. Analyze state and propose safe actions.\n" - f"KPIs: service={kpis.get('service_level', 0.0):.2f}, cost_proxy={kpis.get('cost_proxy', 0.0):.2f}, bullwhip={kpis.get('bullwhip', 0.0):.2f}.\n" - f"Alerts: {alerts}.\n" - f"Current proposal: {proposal}. Decision: {decision}.\n" - f"Causal edges (use these): {dict(top_edges)}; avoid near-zero edges: {weak_edges}.\n" - f"Provide the 7-section output and the final JSON exactly per schema." 
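# Illustrative sketch (editor's addition, not from the deleted file):
# _extract_final_json() above scans regex matches in reverse so the *last*
# JSON object wins, matching the prompt's "final JSON after the 7 sections".
# Note the non-greedy pattern does not balance nested braces, so json.loads
# can fail on the nested schema; this standalone version skips unparseable
# chunks instead of aborting on the first error.
import json
import re
from typing import Any, Dict, Optional

def extract_final_json(text: str) -> Optional[Dict[str, Any]]:
    for chunk in reversed(re.findall(r"\{[\s\S]*?\}", text)):
        if '"proposal"' in chunk and '"z_alpha_new"' in chunk:
            try:
                return json.loads(chunk)
            except json.JSONDecodeError:
                continue  # truncated or unbalanced match; keep looking
    return None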
- ) - try: - ai_out = self.agent.run(narrative_prompt) - except Exception as e: - return f"analysis_unavailable: {e}", proposal - llm_json = self._extract_final_json(str(ai_out)) if isinstance(ai_out, str) else None - if llm_json and isinstance(llm_json.get("proposal"), dict): - validated = self._validate_proposal(llm_json["proposal"]) - if validated: - proposal = {**validated, "source": "llm"} - decision = self.vsm.s5_policy_gate(proposal, s2, self.vsm.s3_star_audit(panel), risk_cap_cvar=0.15) - return str(ai_out), proposal - - def _build_causal_graph(self) -> None: - g = self.crca.causal_graph - g.clear() - vars_graph = [ - "L", # lead time - "phi", # survival/transport factor - "K", # capacity - "dcost", - "B", # backlog - "I", # inventory - "p", # price - "D", # demand - "O", # orders - "R", # receipts - ] - g.add_nodes_from(vars_graph) - # Structural influences (signs where sensible) - self.crca.add_causal_relationship("K", "R", strength=0.0) # more cap -> more receipts - self.crca.add_causal_relationship("phi", "R", strength=0.0) # more survival -> more receipts - self.crca.add_causal_relationship("L", "R", strength=0.0) # longer lead -> lower timely receipts - self.crca.edge_sign_constraints[("L", "R")] = -1 - - self.crca.add_causal_relationship("B", "p", strength=0.0) # backlog -> higher price - self.crca.edge_sign_constraints[("B", "p")] = 1 - self.crca.add_causal_relationship("I", "p", strength=0.0) # inventory -> lower price - self.crca.edge_sign_constraints[("I", "p")] = -1 - self.crca.add_causal_relationship("dcost", "p", strength=0.0) # cost pass-through - self.crca.edge_sign_constraints[("dcost", "p")] = 1 - - self.crca.add_causal_relationship("p", "D", strength=0.0) # pricing impacts demand - self.crca.edge_sign_constraints[("p", "D")] = -1 - self.crca.add_causal_relationship("D", "O", strength=0.0) # more demand -> more orders - self.crca.edge_sign_constraints[("D", "O")] = 1 - self.crca.add_causal_relationship("R", "I", strength=0.0) - self.crca.edge_sign_constraints[("R", "I")] = 1 - self.crca.add_causal_relationship("D", "B", strength=0.0) - self.crca.edge_sign_constraints[("D", "B")] = 1 - - @staticmethod - def _relu(x: float) -> float: - return float(max(0.0, x)) - - def _arrivals(self, O_hist: List[float], L_hist: List[int], phi_hist: List[float], t: int) -> float: - """Receipts at t: sum 1[L=ell]*O[t-ell]*phi[t-ell->t].""" - total = 0.0 - for ell in range(1, min(10, t + 1)): - if L_hist[t] == ell: - total += O_hist[t - ell] * phi_hist[t - ell] - return total - - def _queueing_leadtime(self, lam: float, mu: float, transport: float = 0.0) -> float: - rho = min(0.95, lam / max(mu, 1e-6)) - wq = (rho / (mu * max(1e-6, (1 - rho)))) if rho < 0.999 else 10.0 - return wq + (1.0 / max(mu, 1e-6)) + transport - - def _price_pass_through(self, p_bar: float, dcost: float, B: float, I: float, D_ref: float) -> float: - return ( - p_bar - + self.el.eta_c * dcost - + self.el.eta_B * (B / max(D_ref, 1e-6)) - - self.el.eta_I * (I / max(D_ref, 1e-6)) - ) - - def simulate(self, interventions: Optional[Dict[str, Any]] = None) -> pd.DataFrame: - """Run minimal multi-period SCM with optional do()-style interventions. - - interventions: dict with keys like {'outage_facility': {'F1': 1}, 'disruption_route': {'R1': 1}} - For simplicity, treat interventions as shocks to K (capacity), L (lead), and phi. 
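# Illustrative sketch (editor's addition, not from the deleted file):
# _queueing_leadtime() above is the classic M/M/1 rough cut. With arrival
# rate lam and service rate mu: utilisation rho = lam / mu, expected queue
# wait Wq = rho / (mu * (1 - rho)), total lead time Wq + 1/mu + transport.
# Utilisation is capped so the formula stays finite as rho -> 1.
def mm1_lead_time(lam: float, mu: float, transport: float = 0.0) -> float:
    rho = min(0.95, lam / max(mu, 1e-6))         # capped utilisation
    wq = rho / (mu * max(1e-6, 1.0 - rho))       # expected wait in queue
    return wq + 1.0 / max(mu, 1e-6) + transport  # + service + transport time

print(mm1_lead_time(50, 100), mm1_lead_time(90, 100))  # 0.02 vs 0.10: convex blow-up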
- """ - df = self.df.copy() - # Initialize per (sku,facility) - for (sku, fac), sub in df.groupby(level=["sku", "facility" ]): - O = [0.0] * self.T - R = [0.0] * self.T - I = [float(sub.iloc[0]["I"])] + [0.0] * (self.T - 1) - B = [float(sub.iloc[0]["B"])] + [0.0] * (self.T - 1) - P = [float(sub.iloc[0]["P"])] + [0.0] * (self.T - 1) - L_hist = [int(sub.iloc[min(i, len(sub)-1)]["L"]) for i in range(self.T)] - phi_hist = [float(sub.iloc[min(i, len(sub)-1)]["phi"]) for i in range(self.T)] - K_hist = [float(sub.iloc[min(i, len(sub)-1)]["K"]) for i in range(self.T)] - - # Apply high-level interventions (if any) - for t in range(self.T): - if interventions: - if interventions.get("outage_facility", {}).get(fac, 0) == 1: - K_hist[t] = K_hist[t] * 0.7 # 30% capacity loss - if interventions.get("disruption_route", {}).get(fac, 0) == 1: - L_hist[t] = max(1, L_hist[t] + 1) - phi_hist[t] = max(0.2, phi_hist[t] * 0.8) - - # Period loop - for t in range(self.T): - # Demand and cost dynamics (toy): - D_t = float(sub.iloc[t]["D"]) if t < len(sub) else 100.0 - dcost_t = float(sub.iloc[t]["dcost"]) if t < len(sub) else 0.0 - pbar = (float(sub.iloc[t]["p_bar"]) if t < len(sub) else 15.0) + float(self._price_adjust) - - # Receipts from earlier orders - R[t] = self._arrivals(O, L_hist, phi_hist, t) - - # Shipments and inventory/backorders - S_t = min(I[t - 1] + (R[t] if t > 0 else 0.0), D_t + (B[t - 1] if t > 0 else 0.0)) - if t > 0: - I[t] = I[t - 1] + R[t] - S_t - B[t] = max(0.0, D_t + B[t - 1] - (I[t - 1] + R[t])) - - # Demand response to price - p_t = self._price_pass_through(pbar, dcost_t, B[t], I[t], float(sub.iloc[0]["D_ref"])) - # Simple log-linear elasticity around reference - D_t_eff = max(0.0, D_t * math.exp(-0.01 * (p_t - pbar))) - - # Lead-time estimate (M/M/1 rough cut) - lam = D_t_eff - mu = max(1e-6, K_hist[t] / max(1.0, len(self.skus))) - L_eff = max(1.0, self._queueing_leadtime(lam, mu, transport=float(L_hist[t]) - 1.0)) - - # Base-stock target and orders - POS_t = I[t] + P[t] - muL = L_eff - sigL = 0.5 * muL - target = muL * D_t_eff + self.policy.z_alpha * sigL * math.sqrt(max(1e-6, D_t_eff)) - O_policy = self._relu(target - POS_t) - # Order smoothing - O_prev = O[t - 1] if t > 0 else 0.0 - O[t] = (1 - self.policy.theta_smoothing) * O_prev + self.policy.theta_smoothing * O_policy - - # Update pipeline (very simplified) - if t < self.T - 1: - P[t + 1] = max(0.0, P[t] + O[t] - R[t]) - - # Capacity constraint (aggregate receipts) - R[t] = min(R[t], K_hist[t]) - - # Write back to df - df.loc[(t, sku, fac), ["R", "I", "B", "O", "p", "L", "phi", "K"]] = [ - R[t], I[t], B[t], O[t], p_t, L_eff, phi_hist[t], K_hist[t] - ] - - return df - - # ===== Reporting ===== - def summarize(self, df: pd.DataFrame) -> Dict[str, Any]: - out: Dict[str, Any] = {} - # Simple KPIs - service = 1.0 - (df["B"].groupby(level="t").mean() > 0).mean() - holding_cost = df["I"].clip(lower=0).mean() * 0.1 - shortage_penalty = df["B"].mean() * 1.0 - ordering_cost = df["O"].mean() * df["c"].mean() - cost = holding_cost + shortage_penalty + ordering_cost - bwe = float((df["O"].var() / max(df["D"].var(), 1e-6))) - out["service_level"] = float(service) - out["cost_proxy"] = float(cost) - out["bullwhip"] = bwe - return out - - # ===== Causal runs (Upgraded) ===== - def causal_edges(self, df: pd.DataFrame) -> Dict[str, float]: - """Fit causal edges and return strengths, now with enhanced analysis.""" - # Fit on panel averages per t - panel = df.groupby(level="t").mean(numeric_only=True) - vars_fit = [c for c in ["L", "phi", "K", 
"dcost", "B", "I", "p", "D", "O", "R"] if c in panel.columns] - try: - self.crca.fit_from_dataframe(panel, variables=vars_fit, window=min(30, len(panel)), decay_alpha=0.9, ridge_lambda=0.1) - except Exception as e: - logger.warning(f"CRCA fit skipped: {e}") - strengths = {} - for u, v in self.crca.causal_graph.edges(): - strengths[f"{u}->{v}"] = float(self.crca.causal_graph[u][v].get("strength", 0.0)) - return strengths - - def advanced_causal_analysis(self, df: pd.DataFrame) -> Dict[str, Any]: - """Run comprehensive advanced causal analysis using all upgraded CR-CA methods.""" - panel = df.groupby(level="t").mean(numeric_only=True) - vars_fit = [c for c in ["L", "phi", "K", "dcost", "B", "I", "p", "D", "O", "R"] if c in panel.columns] - - # Fit causal graph first - try: - self.crca.fit_from_dataframe(panel, variables=vars_fit, window=min(30, len(panel)), decay_alpha=0.9, ridge_lambda=0.1) - except Exception as e: - logger.warning(f"CRCA fit skipped: {e}") - return {"error": str(e)} - - # Get latest state for analysis - latest = panel.iloc[-1] if len(panel) > 0 else {} - factual_state = {var: float(latest.get(var, 0.0)) for var in vars_fit if var in latest} - - # ========== UPGRADED METHODS ========== - results: Dict[str, Any] = { - "causal_strengths": {}, - "sensitivity_analysis": {}, - "granger_causality": {}, - "information_theory": {}, - "var_model": {}, - "bayesian_edges": {}, - "root_causes": {}, - "shapley_attribution": {}, - "whatif_analysis": {}, - "optimal_intervention": {}, - "alternate_realities": {}, - } - - # Get causal strengths - for u, v in self.crca.causal_graph.edges(): - results["causal_strengths"][f"{u}->{v}"] = float(self.crca.causal_graph[u][v].get("strength", 0.0)) - - # 1. Sensitivity Analysis: What drives service/cost changes most? - try: - if len(factual_state) >= 4: - intervention_vars = [v for v in ["L", "phi", "K", "dcost", "B"] if v in factual_state][:4] - test_intervention = {k: factual_state.get(k, 0.0) for k in intervention_vars} - - # Analyze sensitivity to service (via B→p→D chain) and cost - sensitivity_service = self.crca.sensitivity_analysis( - intervention=test_intervention, - target="B", # Backlog affects service - perturbation_size=0.01, - ) - sensitivity_cost = self.crca.sensitivity_analysis( - intervention={k: v for k, v in test_intervention.items() if k in ["dcost", "L", "phi"]}, - target="p", # Price affects cost - perturbation_size=0.01, - ) - results["sensitivity_analysis"] = { - "service_drivers": sensitivity_service, - "cost_drivers": sensitivity_cost, - } - logger.info(f"Sensitivity: service={sensitivity_service.get('most_influential_variable', 'N/A')}, cost={sensitivity_cost.get('most_influential_variable', 'N/A')}") - except Exception as e: - logger.debug(f"Sensitivity analysis failed: {e}") - - # 2. 
Granger Causality: Temporal causal relationships - try: - if len(panel) >= 20: - # Test if demand Granger-causes orders - granger_d_o = self.crca.granger_causality_test( - df=panel, - var1="D", - var2="O", - max_lag=3, - ) - # Test if backlog Granger-causes price - granger_b_p = self.crca.granger_causality_test( - df=panel, - var1="B", - var2="p", - max_lag=2, - ) - results["granger_causality"] = { - "demand_granger_causes_orders": granger_d_o.get("granger_causes", False), - "backlog_granger_causes_price": granger_b_p.get("granger_causes", False), - "d_o_f_stat": granger_d_o.get("f_statistic", 0.0), - "b_p_f_stat": granger_b_p.get("f_statistic", 0.0), - } - logger.info(f"Granger causality: D→O={granger_d_o.get('granger_causes', False)}, B→p={granger_b_p.get('granger_causes', False)}") - except Exception as e: - logger.debug(f"Granger causality test failed: {e}") - - # 3. Information Theoretic Measures - try: - if len(panel) >= 10: - core_vars = [v for v in ["D", "O", "B", "I", "p", "L"] if v in panel.columns] - if len(core_vars) >= 3: - info_theory = self.crca.compute_information_theoretic_measures( - df=panel, - variables=core_vars, - ) - results["information_theory"] = info_theory - logger.info(f"Information theory: {len(info_theory.get('entropies', {}))} entropies computed") - except Exception as e: - logger.debug(f"Information theory computation failed: {e}") - - # 4. VAR Model: Vector Autoregression - try: - if len(panel) >= 30: - var_vars = [v for v in ["D", "O", "I", "B", "p"] if v in panel.columns] - if len(var_vars) >= 2: - var_model = self.crca.vector_autoregression_estimation( - df=panel, - variables=var_vars, - max_lag=2, - ) - results["var_model"] = var_model - logger.info(f"VAR model: {var_model.get('n_variables', 0)} variables, lag={var_model.get('max_lag', 0)}") - except Exception as e: - logger.debug(f"VAR estimation failed: {e}") - - # 5. Bayesian Edge Inference - try: - bayesian_edges = {} - key_edges = [("B", "p"), ("I", "p"), ("dcost", "p"), ("D", "O"), ("L", "R")] - for parent, child in key_edges: - if parent in panel.columns and child in panel.columns: - bayes_result = self.crca.bayesian_edge_inference( - df=panel, - parent=parent, - child=child, - prior_mu=0.0, - prior_sigma=1.0, - ) - if "error" not in bayes_result: - bayesian_edges[f"{parent}->{child}"] = { - "posterior_mean": bayes_result.get("posterior_mean", 0.0), - "posterior_std": bayes_result.get("posterior_std", 0.0), - "credible_interval": bayes_result.get("credible_interval_95", (0.0, 0.0)), - } - results["bayesian_edges"] = bayesian_edges - if bayesian_edges: - logger.info(f"Bayesian inference for {len(bayesian_edges)} edges") - except Exception as e: - logger.debug(f"Bayesian inference failed: {e}") - - # 6. Deep Root Cause Analysis: Find ultimate drivers of service/cost issues - try: - root_causes_service = self.crca.deep_root_cause_analysis( - problem_variable="B", # Backlog is service issue - max_depth=8, - min_path_strength=0.01, - ) - root_causes_cost = self.crca.deep_root_cause_analysis( - problem_variable="p", # Price is cost proxy - max_depth=8, - min_path_strength=0.01, - ) - results["root_causes"] = { - "service_issues": root_causes_service, - "cost_issues": root_causes_cost, - } - if root_causes_service.get("ultimate_root_causes"): - logger.info(f"Root causes (service): {[rc.get('root_cause') for rc in root_causes_service.get('ultimate_root_causes', [])[:3]]}") - except Exception as e: - logger.debug(f"Root cause analysis failed: {e}") - - # 7. 
Shapley Value Attribution: Fair attribution of KPI drivers - try: - if len(panel) >= 7: - # Baseline: average over last week - baseline_state = { - k: float(panel[k].tail(7).mean()) - for k in factual_state.keys() - if k in panel.columns - } - if baseline_state and "B" in baseline_state: - shapley_backlog = self.crca.shapley_value_attribution( - baseline_state=baseline_state, - target_state=factual_state, - target="B", - ) - if "p" in baseline_state: - shapley_price = self.crca.shapley_value_attribution( - baseline_state=baseline_state, - target_state=factual_state, - target="p", - ) - results["shapley_attribution"] = { - "backlog_drivers": shapley_backlog, - "price_drivers": shapley_price, - } - logger.info(f"Shapley attribution computed for B and p") - except Exception as e: - logger.debug(f"Shapley attribution failed: {e}") - - # 8. Multi-layer What-If Analysis: Cascading effects of disruptions - try: - test_scenarios = [ - {"L": factual_state.get("L", 2.0) * 1.5}, # Lead time disruption - {"phi": max(0.2, factual_state.get("phi", 1.0) * 0.7)}, # Survival rate drop - {"dcost": factual_state.get("dcost", 0.0) + 2.0}, # Cost shock - ] - whatif_analysis = self.crca.multi_layer_whatif_analysis( - scenarios=test_scenarios, - depth=3, - ) - results["whatif_analysis"] = whatif_analysis - logger.info(f"What-if analysis: {whatif_analysis.get('summary', {}).get('total_scenarios', 0)} scenarios") - except Exception as e: - logger.debug(f"What-if analysis failed: {e}") - - # 9. Optimal Intervention Sequence: Bellman optimization - try: - optimal_intervention = self.crca.bellman_optimal_intervention( - initial_state=factual_state, - target="B", # Minimize backlog (maximize service) - intervention_vars=["L", "phi", "K", "dcost"], - horizon=5, - discount=0.9, - ) - results["optimal_intervention"] = optimal_intervention - if optimal_intervention.get("optimal_sequence"): - logger.info(f"Optimal intervention sequence: {len(optimal_intervention['optimal_sequence'])} steps") - except Exception as e: - logger.debug(f"Optimal intervention failed: {e}") - - # 10. Explore Alternate Realities: Best intervention scenarios - try: - alternate_realities = self.crca.explore_alternate_realities( - factual_state=factual_state, - target_outcome="B", # Minimize backlog - target_value=0.0, # Target zero backlog - max_realities=30, - max_interventions=3, - ) - results["alternate_realities"] = alternate_realities - if alternate_realities.get("best_reality"): - improvement = factual_state.get("B", 0.0) - alternate_realities["best_reality"].get("target_value", 0.0) - logger.info(f"Best alternate reality: {improvement:+.2f} backlog reduction") - except Exception as e: - logger.debug(f"Alternate realities exploration failed: {e}") - - # 11. Cascading Chain Reaction Analysis - try: - if "L" in factual_state: - chain_reaction = self.crca.analyze_cascading_chain_reaction( - initial_intervention={"L": factual_state.get("L", 2.0) * 1.5}, - target_outcomes=["B", "I", "O", "p", "D"], - max_hops=6, - include_feedback_loops=True, - num_iterations=4, - ) - results["chain_reaction"] = chain_reaction - logger.info(f"Chain reaction analysis: {chain_reaction.get('summary', {}).get('total_paths_found', 0)} paths") - except Exception as e: - logger.debug(f"Chain reaction analysis failed: {e}") - - # 12. 
Cross-validation for edge strength reliability - try: - cv_results = {} - for parent, child in [("B", "p"), ("D", "O"), ("L", "R")]: - if parent in panel.columns and child in panel.columns: - cv = self.crca.cross_validate_edge_strength( - df=panel, - parent=parent, - child=child, - n_folds=5, - ) - if "error" not in cv: - cv_results[f"{parent}->{child}"] = { - "mean_cv_error": cv.get("mean_cv_error", 0.0), - "standard_error": cv.get("standard_error", 0.0), - } - results["cross_validation"] = cv_results - if cv_results: - logger.info(f"Cross-validation for {len(cv_results)} edges") - except Exception as e: - logger.debug(f"Cross-validation failed: {e}") - - return results - - def intervene_and_compare(self, scenario: Dict[str, Any]) -> Dict[str, Any]: - base = self.simulate() - base_kpi = self.summarize(base) - shock = self.simulate(interventions=scenario) - shock_kpi = self.summarize(shock) - delta = {k: float(shock_kpi.get(k, 0.0) - base_kpi.get(k, 0.0)) for k in base_kpi} - return {"base": base_kpi, "shock": shock_kpi, "delta": delta} - - # ===== VSM overlay orchestration ===== - def control_cycle( - self, - telemetry_events: Optional[List[Dict[str, Any]]] = None, - intel_events: Optional[List[Dict[str, Any]]] = None, - ) -> Dict[str, Any]: - """One control cycle over S2–S5: ingest telemetry, monitor, propose, audit, gate.""" - # Ingest telemetry/intel (stubs) - # Dynamic feeds first - _ = self.poll_feeds() - if telemetry_events: - self.vsm.ingest_s1_flow(self.df, telemetry_events) - if intel_events: - self.vsm.ingest_s4_external(intel_events) - - # Simulate baseline for the cycle - df = self.simulate() - panel = df.groupby(level="t").mean(numeric_only=True) - - # S2 stability monitors - s2 = self.vsm.s2_monitor(panel) - - # S3 propose optimizers only if S2 stable - proposal = None - if s2.get("stable", False): - proposal = self.vsm.s3_optimize(panel, self.policy) - # SPC/EWMA-driven mode switch: if EWMA breaches on backlog, bias to higher service target - backlog_alerts = [a for a in s2.get("alerts", []) if a.get("type") == "ewma" and a.get("signal") == "B"] - target_service = 0.95 + (0.02 if backlog_alerts else 0.0) - z_cal = self.calibrate_z_to_service(target_service=target_service) - proposal["z_alpha_new"] = float(z_cal) - - # S3★ audit - audit = self.vsm.s3_star_audit(panel) - - # S5 gate with policy caps (LLM-led proposals are still safety-gated here) - decision = self.vsm.s5_policy_gate(proposal, s2, audit, risk_cap_cvar=0.15) - - # Build causal strengths snapshot and LLM narratives - strengths = self.causal_edges(df) - # Build strength-aware explanation preface - top_edges = sorted(strengths.items(), key=lambda kv: abs(kv[1]), reverse=True)[:5] - explainer = {k: v for k, v in top_edges} - # Compute weak edges to avoid claiming - weak_edges = {k: v for k, v in strengths.items() if abs(v) <= 0.05} - # Prepare concise narrative prompt for the agent - kpis = self.summarize(df) - alerts = s2.get("alerts", []) - proposal_text = str(proposal) if proposal else "None" - decision_text = str(decision) - narrative_prompt = ( - f"Analyze supply chain state and propose safe actions.\n" - f"KPIs: service={kpis.get('service_level', 0.0):.2f}, cost_proxy={kpis.get('cost_proxy', 0.0):.2f}, bullwhip={kpis.get('bullwhip', 0.0):.2f}.\n" - f"Alerts: {alerts}.\n" - f"Proposal: {proposal_text}. 
Decision: {decision_text}.\n" - f"Causal edges (mirror these in explanation): {explainer}.\n" - f"Do NOT claim effects via edges with near-zero strength: {list(weak_edges.keys())}.\n" - f"Provide the 7-section output per instructions." - ) - # Multi-round LLM-led decision loop - ai_analysis, proposal = self._llm_decision_loop( - panel=panel, - s2=s2, - proposal=proposal, - decision=decision, - strengths=strengths, - kpis=kpis, - rounds=3, - ) - - # Feasibility check and quantified impact - feasibility_flag = False - impact = None - if isinstance(proposal, dict): - # Gate logistics levers by learned DAG support - allow_logistics = self._logistics_support_from_strengths(strengths, tol=0.05) - allow_price = (abs(float(strengths.get("B->p", 0.0))) > 0.05) and (abs(float(strengths.get("p->D", 0.0))) > 0.05) - if not allow_logistics: - proposal["reroute_share"] = 0.0 - proposal["expedite_share"] = 0.0 - if not allow_price: - proposal["price_adjust"] = 0.0 - else: - proposal.setdefault("price_adjust", 0.0) - feasibility_flag = self._feasible(proposal) - z_new = float(proposal.get("z_alpha_new", self.policy.z_alpha)) - rr = float(proposal.get("reroute_share", 0.0)) - ex = float(proposal.get("expedite_share", 0.0)) - price_adj = float(proposal.get("price_adjust", 0.0)) - impact = self._quantified_impact(z_new, rr, ex, trials=50, price_adjust=price_adj) - # auto de-risk actions on red tier or excessive cost - if s2.get("tier") == "red" or (impact and impact.get("expected", {}).get("cost_proxy", 0.0) > 0): - # freeze increases to expedite/reroute - proposal["expedite_share"] = min(float(proposal.get("expedite_share", 0.0)), self.last_controls.get("expedite_share", 0.0)) - proposal["reroute_share"] = min(float(proposal.get("reroute_share", 0.0)), self.last_controls.get("reroute_share", 0.0)) - # Optional: refine via constrained MPC if feasible - if feasibility_flag: - mpc = constrained_mpc_policy( - last=self.last_controls, - limits=self.max_weekly_change, - lane_cap=self.lane_capacity, - weights=self.mpc_weights, - impact=impact, - ) - if "error" not in mpc: - proposal.update({k: v for k, v in mpc.items() if k in ["z_alpha_new", "reroute_share", "expedite_share", "dual_source_share"]}) - # Final hard-feasibility polish via CP-SAT - cps = cpsat_policy(self.last_controls, self.max_weekly_change, self.lane_capacity) - if "error" not in cps: - proposal.update({k: v for k, v in cps.items() if k in ["z_alpha_new", "reroute_share", "expedite_share", "dual_source_share"]}) - # CVaR neighborhood selection - cvar_pick = self.cvar_select_from_grid(proposal, alpha=0.9, eps=0.05, trials=30, weights=self.mpc_weights) - if cvar_pick.get("choice"): - proposal.update(cvar_pick["choice"]) - - # UPGRADED: Try gradient-based optimization for refinement - try: - # Use current state as initial for gradient optimization - current_state = { - "z_alpha": z_new, - "reroute_share": rr, - "expedite_share": ex, - "B": float(panel.get("B", pd.Series([0.0])).iloc[-1]), - "I": float(panel.get("I", pd.Series([120.0])).iloc[-1]), - "p": float(panel.get("p", pd.Series([15.0])).iloc[-1]), - } - - # Optimize z_alpha to minimize backlog (via gradient) - if "B" in panel.columns: - opt_result = self.crca.gradient_based_intervention_optimization( - initial_state=current_state, - target="B", # Minimize backlog - intervention_vars=["z_alpha"], - constraints={"z_alpha": (0.5, 3.0)}, - method="L-BFGS-B", - ) - if opt_result.get("success") and opt_result.get("optimal_intervention"): - # Refine z_alpha if gradient optimization suggests 
improvement - opt_z = opt_result["optimal_intervention"].get("z_alpha", z_new) - if abs(opt_z - z_new) < 0.3: # Within rate limit - proposal["z_alpha_new"] = float(opt_z) - logger.info(f"Gradient optimization refined z_alpha: {z_new:.2f} → {opt_z:.2f}") - except Exception as e: - logger.debug(f"Gradient optimization failed: {e}") - - # Provide minimal Pareto frontier for transparency - pareto = self.pareto_front(base_z=z_new, allow_logistics=allow_logistics, trials=20, allow_price=allow_price) - else: - pareto = [] - else: - # Infeasible: rollback immediately - if self.action_history: - last = self.action_history[-1] - self.policy.z_alpha = float(last.get("z_alpha_prev", self.policy.z_alpha)) - self.last_controls["z_alpha_new"] = self.policy.z_alpha - for k in ["reroute_share", "expedite_share", "dual_source_share"]: - self.last_controls[k] = max(0.0, self.last_controls.get(k, 0.0) * 0.5) - pareto = [] - - # Apply approved proposal to live policy (LLM primacy) after safety gate - if isinstance(proposal, dict) and feasibility_flag: - decision = self.vsm.s5_policy_gate(proposal, s2, audit, risk_cap_cvar=0.15) - if decision.get("approved"): - self.policy.z_alpha = float(proposal.get("z_alpha_new", self.policy.z_alpha)) - # persist last controls for rate-limit checks - self.last_controls = { - "z_alpha_new": self.policy.z_alpha, - "reroute_share": float(proposal.get("reroute_share", 0.0)), - "expedite_share": float(proposal.get("expedite_share", 0.0)), - } - # record action for possible rollback and RL - self.action_history.append({ - "z_alpha_prev": float(self.last_controls["z_alpha_new"]), - "reroute_share": float(self.last_controls["reroute_share"]), - "expedite_share": float(self.last_controls["expedite_share"]), - }) - if impact and impact.get("expected"): - self.reinforce_from_outcome(impact["expected"]) - - # Advanced causal analysis using upgraded methods - advanced_causal = {} - try: - advanced_causal = self.advanced_causal_analysis(df) - logger.info(f"Advanced causal analysis completed: {len([k for k, v in advanced_causal.items() if v and 'error' not in str(v)])} methods succeeded") - except Exception as e: - logger.debug(f"Advanced causal analysis failed: {e}") - - # Human-readable causal summary via CR-CA agent (enhanced with upgraded insights) - try: - sensitivity_note = "" - if advanced_causal.get("sensitivity_analysis"): - sens_svc = advanced_causal["sensitivity_analysis"].get("service_drivers", {}) - sens_cost = advanced_causal["sensitivity_analysis"].get("cost_drivers", {}) - most_influential_svc = sens_svc.get("most_influential_variable", "N/A") - most_influential_cost = sens_cost.get("most_influential_variable", "N/A") - sensitivity_note = f" Sensitivity analysis shows {most_influential_svc} most drives service, {most_influential_cost} most drives cost." - - granger_note = "" - if advanced_causal.get("granger_causality"): - gc = advanced_causal["granger_causality"] - if gc.get("demand_granger_causes_orders"): - granger_note = " Granger causality: D→O confirmed. " - if gc.get("backlog_granger_causes_price"): - granger_note += "B→p temporally confirmed." - - summary_prompt = ( - f"Summarize key drivers (B→p, I→p, dcost→p, L→R) and their implications.{sensitivity_note}{granger_note} " - f"Reference learned strengths: {dict(list(strengths.items())[:5])}." 
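# Illustrative sketch (editor's addition, not from the deleted file):
# reinforce_from_outcome(), invoked above once a proposal is approved, scores
# an outcome as r = dService - a*max(0, dCost) - b*max(0, dBullwhip) with
# a = 1.0, b = 0.5, then nudges the MPC weights: positive reward raises the
# service weight, negative reward raises the cost/bullwhip penalties.
def outcome_reward(d_service: float, d_cost: float, d_bullwhip: float,
                   a: float = 1.0, b: float = 0.5) -> float:
    # Only cost/bullwhip *increases* are penalised; decreases ride free.
    return d_service - a * max(0.0, d_cost) - b * max(0.0, d_bullwhip)

print(outcome_reward(0.03, 0.01, 0.0))   # 0.02: small cost rise still nets positive
print(outcome_reward(0.0, 0.10, 0.05))   # -0.125: pure cost/bullwhip blow-up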
- ) - causal_summary = self.crca.run(summary_prompt) - except Exception as e: - causal_summary = f"causal_unavailable: {e}" - - return { - "s2": s2, - "proposal": proposal, - "audit": audit, - "decision": decision, - "kpis": kpis, - "causal_strengths": strengths, - "ai_analysis": ai_analysis, - "causal_summary": causal_summary, - "feasible": feasibility_flag, - "impact": impact, - "pareto_front": pareto, - "z_service_curve": self.z_service_curve(), - # Upgraded CR-CA analysis results - "advanced_causal": advanced_causal, - # Advanced hooks (stubs returning diagnostics) - "estimation": { - "ms_filter": ms_regime_filter(panel), - "bsts_nowcast": bsts_nowcast(panel), - "svar": svar_identification(panel), - }, - "robust_optimization": { - "dro_mpc": dro_mpc_plan(panel), - "chance_mpc": chance_constrained_mpc(panel), - "h_infinity": h_infinity_controller(panel), - "sddp": sddp_policy_stub(panel), - }, - "multi_echelon": { - "clark_scarf": clark_scarf_baseline(panel), - "risk_newsvendor": risk_averse_newsvendor_stub(panel), - }, - "network_risk": { - "percolation": percolation_stub(panel), - "eisenberg_noe": eisenberg_noe_stub(panel), - "k_cuts": k_cut_sets_stub(), - }, - "pricing": { - "logit": logit_share_stub(panel), - "dp_pricing": dynamic_pricing_dp_stub(panel), - "ramsey": ramsey_pricing_stub(panel), - }, - "policy_eval": { - "synth_control": synthetic_control_stub(panel), - "did_iv": did_iv_stub(panel), - }, - "security": { - "secure_state": secure_state_l1_stub(panel), - "spectral": spectral_shift_stub(panel), - }, - "investment": { - "real_options": real_options_stub(), - "supplier_portfolio": supplier_portfolio_stub(), - }, - "advanced2": { - "transport_modes": transport_modes_sim_stub(), - "online_em_ms": online_em_ms(panel), - "hier_bsts": hierarchical_bsts_stub(panel), - "multi_stage_mpc": multi_stage_mpc_stub(panel), - "iot_fusion": iot_fusion_stub(), - "nested_logit": nested_logit_stub(), - "kcut_hardening": kcut_hardening_stub(), - "linucb_policy": linucb_policy_stub(panel), - "l1_observer": l1_observer_stub(panel), - "fan_charts": fan_charts_stub(panel), - "async_ingest": {"kafka": True, "duckdb": True} - } - } - - -# ===== Viable System Overlay (S2–S5) ===== -class VSMOverlay: - def __init__(self) -> None: - self.state: Dict[str, Any] = {"R_posterior": np.array([1.0])} - - # Telemetry ingest (stubs) - def ingest_s1_flow(self, df: pd.DataFrame, events: List[Dict[str, Any]]) -> None: - # Example event schema documented; here we could append/merge into df - # For now we no-op (upgrade path to Kafka/Timescale later) - pass - - def ingest_s4_external(self, events: List[Dict[str, Any]]) -> None: - # Store the latest intel snapshot - self.state["intel_last"] = events[-1] if events else None - - # S2: Stability/coordination - def s2_monitor(self, panel: pd.DataFrame) -> Dict[str, Any]: - out: Dict[str, Any] = {"alerts": [], "stable": True, "tier": "green"} - # EWMA residuals on key KPIs - for col in [c for c in ["L", "I", "B"] if c in panel.columns]: - z, breaches = ewma_monitor(panel[col].values, lam=0.2, k=3.0) - if breaches > 0: - out["alerts"].append({"type": "ewma", "signal": col, "breaches": breaches}) - # CUSUM on lead time - if "L" in panel.columns: - plus, minus, trips = cusum(panel["L"].values, mu0=float(panel["L"].head(5).mean()), k=0.1, h=5.0) - if trips: - out["alerts"].append({"type": "cusum", "signal": "L", "trips": len(trips)}) - # Page-Hinkley on demand - if "D" in panel.columns and len(panel["D"]) > 20: - ph = page_hinkley(panel["D"].astype(float).values) - if 
ph["alarm"]: - out["alerts"].append({"type": "page_hinkley", "signal": "D", "mT": ph["mT"]}) - # BOCPD change-point minimal - if "D" in panel.columns: - p_break = bocpd_break_prob(panel["D"].values, hazard=0.02) - if p_break > 0.5: - out["alerts"].append({"type": "bocpd", "p_break": p_break}) - # Queueing sanity - if set(["D", "K"]).issubset(panel.columns): - lam = float(max(1e-6, panel["D"].iloc[-1])) - mu = float(max(1e-6, panel["K"].iloc[-1])) - rho = lam / mu - if rho > 0.85: - out["alerts"].append({"type": "utilization", "rho": rho}) - # Stable if few alerts; tiering - n_alerts = len(out["alerts"]) - out["stable"] = n_alerts == 0 - if n_alerts == 0: - out["tier"] = "green" - elif n_alerts < 3: - out["tier"] = "yellow" - else: - out["tier"] = "red" - return out - - # S3: Optimizers (stubs) - def s3_optimize(self, panel: pd.DataFrame, policy: PolicyParams) -> Dict[str, Any]: - # Heuristic constrained optimizer proxy; prefer stability - z = policy.z_alpha - rr = 0.0 - ex = 0.05 - ds = 0.0 - if "B" in panel.columns: - b_trend = float(np.polyfit(np.arange(len(panel)), panel["B"].values, 1)[0]) if len(panel) >= 5 else 0.0 - z = float(np.clip(z + 0.05 * np.sign(b_trend), 0.5, 2.5)) - if self.state.get("intel_last"): - rr = 0.1 - return {"z_alpha_new": z, "reroute_share": rr, "expedite_share": ex, "dual_source_share": ds} - - # S3★: Audit - def s3_star_audit(self, panel: pd.DataFrame) -> Dict[str, Any]: - out: Dict[str, Any] = {} - if set(["O", "D"]).issubset(panel.columns): - varO = float(panel["O"].var()) - varD = float(panel["D"].var()) - out["BWE"] = float(varO / max(varD, 1e-6)) - # Simple receipts cross-check stub (noisy) - out["receipts_delta_sigma"] = 0.0 - return out - - # S5: Policy gate - def s5_policy_gate( - self, - proposal: Optional[Dict[str, Any]], - s2: Dict[str, Any], - audit: Dict[str, Any], - risk_cap_cvar: float = 0.2, - ) -> Dict[str, Any]: - if proposal is None: - return {"approved": False, "reason": "no_proposal"} - if not s2.get("stable", False): - return {"approved": False, "reason": "unstable_S2"} - if audit.get("BWE", 1.0) > 1.3: - # tighten smoothing recommendation by halving expedite/reroute - proposal = {**proposal, "expedite_share": proposal.get("expedite_share", 0.0) * 0.5, "reroute_share": proposal.get("reroute_share", 0.0) * 0.5} - return {"approved": True, "proposal": proposal} - - -# ===== Detectors (S2) ===== -def ewma_monitor(x: np.ndarray, lam: float = 0.2, k: float = 3.0) -> Tuple[np.ndarray, int]: - z = np.zeros_like(x, dtype=float) - z[0] = x[0] - for t in range(1, len(x)): - z[t] = lam * x[t] + (1 - lam) * z[t - 1] - resid = x - z - sigma = np.std(resid[max(1, len(resid)//10):]) or 1.0 - breaches = int(np.sum(np.abs(resid) > k * sigma)) - return z, breaches - - -def cusum(x: np.ndarray, mu0: float, k: float, h: float) -> Tuple[np.ndarray, np.ndarray, List[int]]: - s_plus = np.zeros_like(x, dtype=float) - s_minus = np.zeros_like(x, dtype=float) - trips: List[int] = [] - for t in range(1, len(x)): - s_plus[t] = max(0.0, s_plus[t - 1] + (x[t] - mu0 - k)) - s_minus[t] = max(0.0, s_minus[t - 1] + (mu0 - x[t] - k)) - if s_plus[t] > h or s_minus[t] > h: - trips.append(t) - s_plus[t] = 0.0 - s_minus[t] = 0.0 - return s_plus, s_minus, trips - - -def bocpd_break_prob(x: np.ndarray, hazard: float = 0.02) -> float: - # Minimal BOCPD: approximate break prob by normalized absolute diff of recent means with hazard weight - if len(x) < 10: - return 0.0 - n = len(x) - m1 = float(np.mean(x[: n // 2])) - m2 = float(np.mean(x[n // 2 :])) - delta = abs(m2 - m1) / 
(np.std(x) or 1.0) - p = 1.0 - math.exp(-hazard * delta) - return float(np.clip(p, 0.0, 1.0)) - - -def page_hinkley(x: np.ndarray, delta: float = 0.005, lamb: float = 50.0, alpha: float = 1.0) -> Dict[str, Any]: - # Minimal Page-Hinkley drift detector - mean = 0.0 - mT = 0.0 - MT = 0.0 - alarm = False - for i, xi in enumerate(x): - mean = mean + (xi - mean) / (i + 1) - mT = mT + xi - mean - delta - MT = min(MT, mT) - if mT - MT > lamb * alpha: - alarm = True - break - return {"alarm": alarm, "mT": float(mT)} - - -# ===== Advanced Estimation (stubs) ===== -def ms_regime_filter(panel: pd.DataFrame) -> Dict[str, Any]: - """Two-regime Markov-switching on demand using statsmodels MarkovRegression. - - Returns current regime probabilities and smoothed prediction for next step. - """ - try: - from statsmodels.tsa.regime_switching.markov_regression import MarkovRegression - if "D" not in panel.columns or len(panel) < 20: - return {"regime": "insufficient", "p_regime": {}} - y = panel["D"].astype(float).values - # Fit a simple mean-switching model with 2 regimes - with warnings.catch_warnings(): - warnings.simplefilter("ignore") - mod = MarkovRegression(y, k_regimes=2, trend='c', switching_variance=True) - res = mod.fit(disp=False) - p_t = res.smoothed_marginal_probabilities.values[:, -1] if hasattr(res.smoothed_marginal_probabilities, 'values') else res.smoothed_marginal_probabilities - p_reg1 = float(p_t[-1]) - regime = "shock" if p_reg1 > 0.5 else "normal" - return {"regime": regime, "p_regime": {"regime1": p_reg1, "regime0": 1 - p_reg1}} - except Exception as e: - return {"regime": "error", "error": str(e)} - - -def bsts_nowcast(panel: pd.DataFrame) -> Dict[str, Any]: - """Dynamic factor nowcast for demand using statsmodels DynamicFactor (FAVAR-like).""" - try: - from statsmodels.tsa.statespace.dynamic_factor import DynamicFactor - cols = [c for c in ["D", "R", "I", "B", "O"] if c in panel.columns] - if len(cols) < 2 or len(panel) < 20: - mu = float(panel.get("D", pd.Series([100.0])).iloc[-1]) - return {"D_nowcast": mu, "uncertainty": 0.2, "cols": cols} - endog = panel[cols].astype(float) - with warnings.catch_warnings(): - warnings.simplefilter("ignore") - mod = DynamicFactor(endog, k_factors=1, factor_order=1) - res = mod.fit(disp=False) - # One-step ahead forecast for demand - fc = res.get_forecast(steps=1) - d_idx = cols.index("D") - d_mean = float(fc.predicted_mean.iloc[0, d_idx]) - d_var = float(fc.var_pred_mean.iloc[0, d_idx]) if hasattr(fc, 'var_pred_mean') else 0.2 - return {"D_nowcast": d_mean, "uncertainty": max(0.05, min(0.5, d_var ** 0.5)), "cols": cols} - except Exception as e: - mu = float(panel.get("D", pd.Series([100.0])).iloc[-1]) - return {"D_nowcast": mu, "uncertainty": 0.3, "error": str(e)} - - -def svar_identification(panel: pd.DataFrame) -> Dict[str, Any]: - """Estimate a small VAR and report impulse responses as proxy for shocks.""" - try: - from statsmodels.tsa.api import VAR - cols = [c for c in ["D", "R", "I", "B", "p"] if c in panel.columns] - if len(cols) < 3 or len(panel) < 30: - return {"irf": {}, "cols": cols} - endog = panel[cols].astype(float) - model = VAR(endog) - res = model.fit(maxlags=2, ic='aic') - irf = res.irf(5) - irf_dict = {f"{src}->{dst}": float(irf.irfs[1, cols.index(src), cols.index(dst)]) for src in cols for dst in cols} - return {"irf_h1": irf_dict, "cols": cols} - except Exception as e: - return {"error": str(e)} - - -# ===== Robust Optimization & Control (stubs) ===== -def dro_mpc_plan(panel: pd.DataFrame) -> Dict[str, Any]: - 
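# Illustrative sketch (editor's addition, not from the deleted file): the S2
# detectors above follow the textbook recursions. For CUSUM:
#   S+_t = max(0, S+_{t-1} + (x_t - mu0 - k))
#   S-_t = max(0, S-_{t-1} + (mu0 - x_t - k))
# with an alarm (and reset) whenever either side exceeds h. Demo on a series
# whose mean jumps mid-stream:
import numpy as np

def cusum_trips(x, mu0, k=0.1, h=5.0):
    s_plus = s_minus = 0.0
    trips = []
    for t, xt in enumerate(x):
        s_plus = max(0.0, s_plus + (xt - mu0 - k))
        s_minus = max(0.0, s_minus + (mu0 - xt - k))
        if s_plus > h or s_minus > h:
            trips.append(t)
            s_plus = s_minus = 0.0  # restart after each alarm
    return trips

rng = np.random.default_rng(1)
x = np.concatenate([rng.normal(2.0, 0.3, 30), rng.normal(3.5, 0.3, 30)])
print(cusum_trips(x, mu0=2.0))  # alarms cluster shortly after the shift at t=30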
"""Single-variable DRO-style MPC for z_alpha using cvxpy. - - Minimize holding/backorder proxy under Wasserstein penalty. - """ - try: - import cvxpy as cp - from scipy.stats import norm - D = float(panel.get("D", pd.Series([100.0])).iloc[-1]) - muL = float(panel.get("L", pd.Series([2.0])).iloc[-1]) - sigL = max(0.2, 0.5 * muL) - z = cp.Variable() - # Proxy cost: holding ~ z, backlog ~ max(0, Phi^{-1}(0.95)-z) - z_req = norm.ppf(0.95) - backlog_short = cp.pos(z_req - z) - cost = 0.1 * z + 0.5 * backlog_short - # DRO penalty - rho = 0.1 - objective = cp.Minimize(cost + rho * cp.abs(z)) - constraints = [z >= 0.5, z <= 3.0] - prob = cp.Problem(objective, constraints) - prob.solve(solver=cp.ECOS, warm_start=True) - return {"type": "DRO-MPC", "z_alpha": float(z.value), "status": prob.status, "rho": rho} - except Exception as e: - return {"type": "DRO-MPC", "error": str(e)} - - -def constrained_mpc_policy( - last: Dict[str, float], - limits: Dict[str, float], - lane_cap: float, - weights: Dict[str, float], - impact: Optional[Dict[str, Any]] = None, -) -> Dict[str, Any]: - # Optimize z, r, e, ds under caps and rate limits to minimize weighted proxy cost - try: - import cvxpy as cp - z = cp.Variable() - r = cp.Variable() - e = cp.Variable() - ds = cp.Variable() - # Objective: weights over expected deltas if available, else regularization - if impact and "expected" in impact: - exp = impact["expected"] - svc = exp.get("service", 0.0) - cst = exp.get("cost_proxy", 0.0) - bwe = exp.get("bullwhip", 0.0) - obj = weights.get("cost", 1.0) * cst + weights.get("service", 1.0) * (-svc) + weights.get("bullwhip", 1.0) * bwe - else: - obj = 0.1 * (z - last.get("z_alpha_new", 1.28)) ** 2 + 0.05 * (r - last.get("reroute_share", 0.0)) ** 2 + 0.05 * (e - last.get("expedite_share", 0.0)) ** 2 + 0.05 * (ds - last.get("dual_source_share", 0.0)) ** 2 - constraints = [ - z >= 0.5, z <= 3.0, - r >= 0.0, e >= 0.0, ds >= 0.0, - r + e + ds <= lane_cap, - cp.abs(z - last.get("z_alpha_new", 1.28)) <= limits.get("z_alpha_new", 0.3), - cp.abs(r - last.get("reroute_share", 0.0)) <= limits.get("reroute_share", 0.15), - cp.abs(e - last.get("expedite_share", 0.0)) <= limits.get("expedite_share", 0.15), - cp.abs(ds - last.get("dual_source_share", 0.0)) <= limits.get("dual_source_share", 0.2), - ] - prob = cp.Problem(cp.Minimize(obj), constraints) - prob.solve(solver=cp.ECOS_BB, mi_max_iterations=1000) - return {"z_alpha_new": float(z.value), "reroute_share": float(r.value), "expedite_share": float(e.value), "dual_source_share": float(ds.value), "status": prob.status} - except Exception as e: - return {"error": str(e)} - - -def cpsat_policy( - last: Dict[str, float], - limits: Dict[str, float], - lane_cap: float, -) -> Dict[str, Any]: - """Hard-feasibility projection using cvxpy (no OR-Tools). - - Minimizes squared distance to last controls subject to rate and capacity limits. 
- """ - try: - import cvxpy as cp - z = cp.Variable() - r = cp.Variable() - e = cp.Variable() - ds = cp.Variable() - # Objective: keep close to last (stability) - obj = (z - last.get("z_alpha_new", 1.28)) ** 2 + (r - last.get("reroute_share", 0.0)) ** 2 + (e - last.get("expedite_share", 0.0)) ** 2 + (ds - last.get("dual_source_share", 0.0)) ** 2 - cons = [ - z >= 0.5, z <= 3.0, - r >= 0.0, e >= 0.0, ds >= 0.0, - r + e + ds <= lane_cap, - cp.abs(z - last.get("z_alpha_new", 1.28)) <= limits.get("z_alpha_new", 0.3), - cp.abs(r - last.get("reroute_share", 0.0)) <= limits.get("reroute_share", 0.15), - cp.abs(e - last.get("expedite_share", 0.0)) <= limits.get("expedite_share", 0.15), - cp.abs(ds - last.get("dual_source_share", 0.0)) <= limits.get("dual_source_share", 0.2), - ] - prob = cp.Problem(cp.Minimize(obj), cons) - prob.solve(solver=cp.ECOS) - if z.value is None: - return {"error": "infeasible"} - return { - "z_alpha_new": float(z.value), - "reroute_share": float(r.value), - "expedite_share": float(e.value), - "dual_source_share": float(ds.value), - "status": prob.status, - } - except Exception as e: - return {"error": str(e)} - - -def chance_constrained_mpc(panel: pd.DataFrame) -> Dict[str, Any]: - """Closed-form chance constraint for service level: z >= Phi^{-1}(beta).""" - try: - from scipy.stats import norm - beta = 0.95 - z_req = float(norm.ppf(beta)) - return {"type": "Chance-MPC", "beta": beta, "z_min": z_req, "feasible": True} - except Exception as e: - return {"type": "Chance-MPC", "error": str(e)} - - -def h_infinity_controller(panel: pd.DataFrame) -> Dict[str, Any]: - """Approximate robust controller via discrete LQR (DARE) for inventory linearization.""" - try: - from scipy.linalg import solve_discrete_are - # Simple 1D: x_{t+1} = x_t - u_t + w_t - A = np.array([[1.0]]) - B = np.array([[1.0]]) - Q = np.array([[1.0]]) - R = np.array([[0.5]]) - P = solve_discrete_are(A, B, Q, R) - K = np.linalg.inv(B.T @ P @ B + R) @ (B.T @ P @ A) - gamma = float(np.sqrt(np.max(np.linalg.eigvals(P)))) - return {"type": "LQR", "K": float(K), "gamma_proxy": gamma} - except Exception as e: - return {"type": "LQR", "error": str(e)} - - -def sddp_policy_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"type": "SDDP", "stages": 3, "status": "ok"} - - -# ===== Multi-Echelon Inventory (stubs) ===== -def clark_scarf_baseline(panel: pd.DataFrame) -> Dict[str, Any]: - """Compute a simple echelon base-stock as I + mean(P) across time (proxy).""" - try: - if set(["I"]).issubset(panel.columns): - echelon = float(panel["I"].mean()) + float(panel.get("P", pd.Series([0.0])).mean()) - return {"echelon_base_stock": echelon} - return {"echelon_base_stock": 0.0} - except Exception as e: - return {"error": str(e)} - - -def risk_averse_newsvendor_stub(panel: pd.DataFrame) -> Dict[str, Any]: - """Entropic-risk newsvendor: grid search Q to minimize 1/theta log E[exp(theta*cost)].""" - try: - D = panel.get("D", pd.Series([100.0])).astype(float).values - if len(D) < 10: - return {"Q_star": float(np.percentile(D, 95)), "risk_measure": "entropic", "theta": 0.5} - theta = 0.5 - c_h, c_b = 0.1, 0.5 - Q_grid = np.linspace(np.percentile(D, 10), np.percentile(D, 99), 30) - best, bestQ = 1e9, Q_grid[0] - for Q in Q_grid: - cost = c_h * np.maximum(Q - D, 0.0) + c_b * np.maximum(D - Q, 0.0) - risk = (1.0 / theta) * np.log(np.mean(np.exp(theta * cost))) - if risk < best: - best, bestQ = risk, Q - return {"Q_star": float(bestQ), "risk_measure": "entropic", "theta": theta, "objective": float(best)} - except Exception as e: - 
return {"error": str(e)} - - -# ===== Digital twin gating scenarios ===== -def run_gating_scenarios(agent: "SupplyShockCRCAgent") -> Dict[str, Any]: - grid = [ - {"name": "baseline", "z": agent.policy.z_alpha, "r": 0.0, "e": 0.0}, - {"name": "z1.6_r0.20_e0.10", "z": 1.6, "r": 0.20, "e": 0.10}, - {"name": "z1.8_r0.15_e0.15", "z": 1.8, "r": 0.15, "e": 0.15}, - {"name": "z2.0_e0.20", "z": 2.0, "r": 0.00, "e": 0.20}, - ] - results: Dict[str, Any] = {} - base = agent.simulate() - base_kpi = agent.summarize(base) - for g in grid: - impact = agent._quantified_impact(g["z"], g["r"], g["e"], trials=50) - exp = impact.get("expected", {}) - svc_delta = float(exp.get("service", 0.0)) - cost_delta = float(exp.get("cost_proxy", 0.0)) - marginal_cost_per_pp = float(cost_delta / max(1e-6, svc_delta * 100.0)) if svc_delta > 0 else float("inf") - results[g["name"]] = { - "expected": exp, - "ci80": impact.get("ci80", {}), - "marginal_cost_per_1pp_service": marginal_cost_per_pp, - } - return {"baseline": base_kpi, "scenarios": results} - - -# ===== Network & Systemic Risk (stubs) ===== -def percolation_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"gc_threshold": 0.3, "expected_shortfall": 0.12} - - -def eisenberg_noe_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"clearing_vector_norm": 0.97} - - -def k_cut_sets_stub() -> Dict[str, Any]: - return {"min_k_cut": 2, "critical_arcs": ["lane_CN-EU", "lane_US-EU"]} - - -# ===== Pricing & Demand (stubs) ===== -def logit_share_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"alpha_price": 0.8, "elasticity": -1.2} - - -def dynamic_pricing_dp_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"policy": "approxDP", "discount": 0.98} - - -def ramsey_pricing_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"lambda": 0.2, "implied_markups": {"A": 0.1, "B": 0.05}} - - -# ===== Policy Evaluation (stubs) ===== -def synthetic_control_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"effect": -0.03, "weight_entropy": 0.9} - - -def did_iv_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"beta": -0.08, "se_robust": 0.04} - - -# ===== Security & Integrity (stubs) ===== -def secure_state_l1_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"attacks_detected": 0} - - -def spectral_shift_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return {"eig_drift": 0.05} - - -# ===== Investment under Uncertainty (stubs) ===== -def real_options_stub() -> Dict[str, Any]: - return {"LSM_value": 1.2} - - -def supplier_portfolio_stub() -> Dict[str, Any]: - return {"selected_suppliers": ["S1", "S3"], "service_prob": 0.97} - - -# ===== Further Advanced (realistic approximations or stubs) ===== -def transport_modes_sim_stub() -> Dict[str, Any]: - return {"modes": ["SEA", "AIR", "RAIL"], "schedules": {"SEA": 7, "AIR": 2, "RAIL": 5}} - - -def online_em_ms(panel: pd.DataFrame) -> Dict[str, Any]: - # Lightweight online update: adapt mean/var of L based on EWMA - if "L" not in panel.columns: - return {"mu": 2.0, "sigma": 1.0} - L = panel["L"].astype(float).values - lam = 0.2 - mu = L[0] - var = 1.0 - for x in L[1:]: - mu = lam * x + (1 - lam) * mu - var = lam * (x - mu) ** 2 + (1 - lam) * var - return {"mu": float(mu), "sigma": float(max(0.2, var ** 0.5))} - - -def hierarchical_bsts_stub(panel: pd.DataFrame) -> Dict[str, Any]: - # Placeholder summary for hierarchical pooling - groups = {"facilities": int(panel.shape[1] > 0)} - return {"pooled": True, "groups": groups} - - -def multi_stage_mpc_stub(panel: pd.DataFrame) -> Dict[str, Any]: - return 
{"horizon": 3, "reroute_share": 0.1, "expedite_share": 0.05} - - -def iot_fusion_stub() -> Dict[str, Any]: - return {"adjust_phi": -0.05, "adjust_L": +0.3} - - -def nested_logit_stub() -> Dict[str, Any]: - try: - from statsmodels.discrete.discrete_model import MNLogit # noqa: F401 - return {"available": True, "note": "Use MNLogit with inventory and price features"} - except Exception: - return {"available": False} - - -def kcut_hardening_stub() -> Dict[str, Any]: - return {"harden": ["lane_CN-EU"], "budget": 1} - - -def linucb_policy_stub(panel: pd.DataFrame) -> Dict[str, Any]: - # Simple LinUCB placeholders for reroute/expedite arms - alpha = 0.5 - arms = ["keep", "reroute", "expedite"] - scores = {a: 0.5 + alpha * 0.1 for a in arms} - choice = max(scores, key=scores.get) - return {"choice": choice, "scores": scores} - - -def l1_observer_stub(panel: pd.DataFrame) -> Dict[str, Any]: - try: - import cvxpy as cp # noqa: F401 - return {"feasible": True} - except Exception: - return {"feasible": False} - - -def fan_charts_stub(panel: pd.DataFrame) -> Dict[str, Any]: - if "D" not in panel.columns: - return {"quantiles": {}} - y = panel["D"].astype(float).values - q = { - "p10": float(np.percentile(y, 10)), - "p50": float(np.percentile(y, 50)), - "p90": float(np.percentile(y, 90)), - } - return {"quantiles": q} - - -async def main() -> None: - skus = [SKUKey("SKU1", "F1"), SKUKey("SKU2", "F1"), SKUKey("SKU3", "F2")] - agent = SupplyShockCRCAgent(skus=skus, T=40) - - # Baseline simulate - df = agent.simulate() - kpis = agent.summarize(df) - strengths = agent.causal_edges(df) - print("Baseline KPIs:", kpis) - print("Causal strengths:", strengths) - - # Example interventions - scenario_port = {"disruption_route": {"F1": 1}} - scenario_outage = {"outage_facility": {"F2": 1}} - cmp_port = agent.intervene_and_compare(scenario_port) - cmp_outage = agent.intervene_and_compare(scenario_outage) - print("Port disruption delta:", cmp_port["delta"]) - print("Facility outage delta:", cmp_outage["delta"]) - - # Full control cycle with AI narrative and upgraded CR-CA analysis - result = agent.control_cycle() - print("-" * 80) - print("AI Narrative Analysis:\n", result.get("ai_analysis")) - print("-" * 80) - print("Causal Summary:\n", result.get("causal_summary")) - - # Display upgraded analysis results - advanced = result.get("advanced_causal", {}) - if advanced and not advanced.get("error"): - print("\n" + "=" * 80) - print("UPGRADED CR-CA ANALYSIS RESULTS") - print("=" * 80) - - if advanced.get("sensitivity_analysis"): - sens = advanced["sensitivity_analysis"] - print("\n--- Sensitivity Analysis ---") - if sens.get("service_drivers"): - svc = sens["service_drivers"] - print(f"Service (backlog) drivers:") - print(f" Most influential: {svc.get('most_influential_variable', 'N/A')} (sensitivity: {svc.get('most_influential_sensitivity', 0.0):.4f})") - if sens.get("cost_drivers"): - cost = sens["cost_drivers"] - print(f"Cost (price) drivers:") - print(f" Most influential: {cost.get('most_influential_variable', 'N/A')} (sensitivity: {cost.get('most_influential_sensitivity', 0.0):.4f})") - - if advanced.get("granger_causality"): - gc = advanced["granger_causality"] - print("\n--- Granger Causality Tests ---") - print(f"D → O: {gc.get('demand_granger_causes_orders', False)} (F={gc.get('d_o_f_stat', 0.0):.2f})") - print(f"B → p: {gc.get('backlog_granger_causes_price', False)} (F={gc.get('b_p_f_stat', 0.0):.2f})") - - if advanced.get("information_theory") and advanced["information_theory"].get("entropies"): - it = 
advanced["information_theory"] - print("\n--- Information Theory ---") - print("Variable entropies:") - for var, entropy in list(it["entropies"].items())[:5]: - print(f" H({var}) = {entropy:.3f} bits") - if it.get("mutual_information"): - print("Top mutual information:") - mi_items = sorted(it["mutual_information"].items(), key=lambda x: x[1], reverse=True)[:3] - for pair, mi_val in mi_items: - print(f" I({pair}) = {mi_val:.3f} bits") - - if advanced.get("shapley_attribution"): - shap = advanced["shapley_attribution"] - if shap.get("backlog_drivers") and shap["backlog_drivers"].get("shapley_values"): - print("\n--- Shapley Value Attribution (Backlog Drivers) ---") - shap_b = shap["backlog_drivers"]["shapley_values"] - for var, value in sorted(shap_b.items(), key=lambda x: abs(x[1]), reverse=True)[:5]: - print(f" {var}: {value:+.4f}") - - if advanced.get("root_causes") and advanced["root_causes"].get("service_issues"): - rc = advanced["root_causes"]["service_issues"] - if rc.get("ultimate_root_causes"): - print("\n--- Deep Root Cause Analysis (Service Issues) ---") - print("Ultimate root causes of backlog:") - for root in rc["ultimate_root_causes"][:5]: - print(f" - {root.get('root_cause', 'N/A')} " - f"(path strength: {root.get('path_strength', 0.0):.3f}, depth: {root.get('depth', 0)})") - - if advanced.get("optimal_intervention") and advanced["optimal_intervention"].get("optimal_sequence"): - opt = advanced["optimal_intervention"] - print("\n--- Optimal Intervention Sequence (Bellman) ---") - print(f"Optimal {len(opt['optimal_sequence'])}-step sequence to minimize backlog:") - for i, step in enumerate(opt["optimal_sequence"][:3], 1): - print(f" Step {i}: {step}") - print(f"Expected total value: {opt.get('total_value', 0.0):.2f}") - - if advanced.get("alternate_realities") and advanced["alternate_realities"].get("best_reality"): - ar = advanced["alternate_realities"] - best = ar["best_reality"] - print("\n--- Alternate Realities Exploration ---") - print(f"Best alternate reality (minimize backlog):") - print(f" Interventions: {best.get('interventions', {})}") - print(f" Expected backlog: {best.get('target_value', 0.0):.2f}") - print(f" Improvement: {ar.get('improvement_potential', 0.0):+.2f}") - - if advanced.get("chain_reaction"): - cr = advanced["chain_reaction"] - print("\n--- Cascading Chain Reaction Analysis ---") - summary = cr.get("summary", {}) - print(f"Total paths found: {summary.get('total_paths_found', 0)}") - print(f"Feedback loops: {summary.get('feedback_loops_detected', 0)}") - if cr.get("final_predictions"): - print(f"Final predictions: {dict(list(cr['final_predictions'].items())[:5])}") - - if advanced.get("cross_validation"): - cv = advanced["cross_validation"] - print("\n--- Cross-Validation for Edge Reliability ---") - for edge, cv_data in list(cv.items())[:5]: - print(f" {edge}: CV error={cv_data.get('mean_cv_error', 0.0):.4f} ± {cv_data.get('standard_error', 0.0):.4f}") - - print("\n" + "=" * 80) - - -if __name__ == "__main__": - import asyncio - - logger.remove() - logger.add("crca_supply_shock.log", rotation="50 MB", retention="7 days", level="INFO") - try: - asyncio.run(main()) - except KeyboardInterrupt: - print("Stopped.") - - From b15f70ce8638467542eda90d38b608993f978ddb Mon Sep 17 00:00:00 2001 From: CI-DEV <154627941+IlumCI@users.noreply.github.com> Date: Fri, 5 Dec 2025 11:03:00 +0200 Subject: [PATCH 12/12] Update cr_ca_agent.md --- docs/swarms/agents/cr_ca_agent.md | 243 ++++++++++++++++++++++++++++-- 1 file changed, 230 insertions(+), 13 deletions(-) diff 
diff --git a/docs/swarms/agents/cr_ca_agent.md b/docs/swarms/agents/cr_ca_agent.md
index b471b732..3ecd9695 100644
--- a/docs/swarms/agents/cr_ca_agent.md
+++ b/docs/swarms/agents/cr_ca_agent.md
@@ -22,7 +22,7 @@ Canonical import
 Use the canonical agent import in application code:
 
 ```python
-from swarms.agents.cr_ca_agent import CRCAAgent
+from path.to.crca_agent import CRCAAgent
 ```
 
 Quickstart
@@ -30,7 +30,7 @@ Quickstart
 Minimal example — deterministic mode: initialize, add edges, evolve state and get counterfactuals:
 
 ```python
-from swarms.agents.cr_ca_agent import CRCAAgent
+from path.to.crca_agent import CRCAAgent
 
 agent = CRCAAgent(variables=["price", "demand", "inventory"])
 agent.add_causal_relationship("price", "demand", strength=-0.5)
@@ -48,7 +48,7 @@ LLM-based causal analysis example
 ----------------------------------
 
 ```python
-from swarms.agents.cr_ca_agent import CRCAAgent
+from path.to.crca_agent import CRCAAgent
 
 agent = CRCAAgent(
     variables=["price", "demand", "inventory"],
@@ -71,7 +71,7 @@ Agent-style JSON payload example (orchestrators)
 
 ```python
 import json
-from swarms.agents.cr_ca_agent import CRCAAgent
+from path.to.crca_agent import CRCAAgent
 
 agent = CRCAAgent(variables=["price","demand","inventory"])
 payload = json.dumps({"price": 100.0, "demand": 1000.0})
@@ -79,6 +79,230 @@ out = agent.run(initial_state=payload, target_variables=["price"], max_steps=1)
 print(out["evolved_state"])
 ```
 
+Complete example: Full workflow with system prompt
+--------------------------------------------------
+This example demonstrates a complete workflow from imports to execution, including
+system prompt configuration, causal graph construction, and both LLM and deterministic modes.
+
+```python
+"""
+Complete CRCAAgent example: Full workflow from initialization to execution
+"""
+
+# 1. Imports
+from typing import Dict, Any
+from path.to.crca_agent import CRCAAgent
+
+# 2. System prompt configuration
+# Define a custom system prompt for domain-specific causal reasoning
+SYSTEM_PROMPT = """You are an expert causal reasoning analyst specializing in economic systems.
+Your role is to:
+- Identify causal relationships between economic variables
+- Analyze how interventions affect system outcomes
+- Generate plausible counterfactual scenarios
+- Provide clear, evidence-based causal explanations
+
+When analyzing causal relationships:
+1. Consider both direct and indirect causal paths
+2. Account for confounding factors
+3. Evaluate intervention plausibility
+4. Quantify expected causal effects when possible
+
+Always ground your analysis in the provided causal graph structure and observed data."""
+
+# 3. Agent initialization with system prompt
+agent = CRCAAgent(
+    variables=["price", "demand", "inventory", "supply", "competition"],
+    agent_name="economic-causal-analyst",
+    agent_description="Expert economic causal reasoning agent",
+    model_name="gpt-4o",  # or "gpt-4o-mini" for faster/cheaper analysis
+    max_loops=3,  # Number of reasoning loops for LLM-based analysis
+    system_prompt=SYSTEM_PROMPT,
+    verbose=True,  # Enable detailed logging
+)
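+# NOTE: constructor keyword names can differ between the Lite and full
+# implementations (e.g. name/description vs agent_name/agent_description);
+# check the signature of the version you have installed.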
+
+# 4. Build causal graph: Add causal relationships
+# Price negatively affects demand (higher price → lower demand)
+agent.add_causal_relationship("price", "demand", strength=-0.5)
+
+# Demand negatively affects inventory (higher demand → lower inventory)
+agent.add_causal_relationship("demand", "inventory", strength=-0.2)
+
+# Supply positively affects inventory (higher supply → higher inventory)
+agent.add_causal_relationship("supply", "inventory", strength=0.3)
+
+# Competition negatively affects price (more competition → lower price)
+agent.add_causal_relationship("competition", "price", strength=-0.4)
+
+# Price positively affects supply (higher price → more supply)
+agent.add_causal_relationship("price", "supply", strength=0.2)
+
+# 5. Verify graph structure
+print("Causal Graph Nodes:", agent.get_nodes())
+print("Causal Graph Edges:", agent.get_edges())
+print("Is DAG:", agent.is_dag())
+
+# 6. Example 1: LLM-based causal analysis (sophisticated reasoning)
+print("\n" + "="*80)
+print("EXAMPLE 1: LLM-Based Causal Analysis")
+print("="*80)
+
+task = """
+Analyze the causal relationship between price increases and inventory levels.
+Consider both direct and indirect causal paths. What interventions could
+stabilize inventory while maintaining profitability?
+"""
+
+result = agent.run(task=task)
+
+print("\n--- Causal Analysis Report ---")
+print(result["causal_analysis"])
+
+print("\n--- Counterfactual Scenarios ---")
+for i, scenario in enumerate(result["counterfactual_scenarios"][:3], 1):
+    print(f"\nScenario {i}: {scenario.name}")
+    print(f"  Interventions: {scenario.interventions}")
+    print(f"  Expected Outcomes: {scenario.expected_outcomes}")
+    print(f"  Probability: {scenario.probability:.3f}")
+    print(f"  Reasoning: {scenario.reasoning}")
+
+print("\n--- Causal Graph Info ---")
+print(f"Nodes: {result['causal_graph_info']['nodes']}")
+print(f"Edges: {result['causal_graph_info']['edges']}")
+print(f"Is DAG: {result['causal_graph_info']['is_dag']}")
+
+# 7. Example 2: Deterministic simulation (script-style)
+print("\n" + "="*80)
+print("EXAMPLE 2: Deterministic Causal Simulation")
+print("="*80)
+
+# Initial state
+initial_state = {
+    "price": 100.0,
+    "demand": 1000.0,
+    "inventory": 5000.0,
+    "supply": 2000.0,
+    "competition": 5.0,
+}
+
+# Run deterministic evolution
+simulation_result = agent.run(
+    initial_state=initial_state,
+    target_variables=["price", "demand", "inventory"],
+    max_steps=3,  # Evolve for 3 time steps
+)
+
+print("\n--- Initial State ---")
+for var, value in initial_state.items():
+    print(f"  {var}: {value}")
+
+print("\n--- Evolved State (after 3 steps) ---")
+for var, value in simulation_result["evolved_state"].items():
+    print(f"  {var}: {value:.2f}")
+
+print("\n--- Counterfactual Scenarios ---")
+for i, scenario in enumerate(simulation_result["counterfactual_scenarios"][:3], 1):
+    print(f"\nScenario {i}: {scenario.name}")
+    print(f"  Interventions: {scenario.interventions}")
+    print(f"  Expected Outcomes: {scenario.expected_outcomes}")
+    print(f"  Probability: {scenario.probability:.3f}")
+
+# 8. Example 3: Causal chain identification
+print("\n" + "="*80)
+print("EXAMPLE 3: Causal Chain Analysis")
+print("="*80)
+
+chain = agent.identify_causal_chain("competition", "inventory")
+if chain:
+    print(f"Causal chain from 'competition' to 'inventory': {' → '.join(chain)}")
+else:
+    print("No direct causal chain found")
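+
+# Hedged aside: if path strength is the product of signed edge strengths along
+# the chain (an assumption, not confirmed by these docs), then the chain
+# competition → price → demand → inventory gives (-0.4)·(-0.5)·(-0.2) = -0.04:
+path_strength = 1.0
+for s in [-0.4, -0.5, -0.2]:  # edge strengths added in step 4 above
+    path_strength *= s
+print(f"Illustrative path strength: {path_strength:+.2f}")  # -0.04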
+
+# 9. Example 4: Analyze causal strength
+print("\n" + "="*80)
+print("EXAMPLE 4: Causal Strength Analysis")
+print("="*80)
+
+strength_analysis = agent.analyze_causal_strength("price", "inventory")
+print(f"Direct edge strength: {strength_analysis.get('direct_strength', 'N/A')}")
+print(f"Path strength: {strength_analysis.get('path_strength', 'N/A')}")
+
+# 10. Example 5: Custom intervention prediction
+print("\n" + "="*80)
+print("EXAMPLE 5: Custom Intervention Prediction")
+print("="*80)
+
+# What if we reduce price by 20%?
+interventions = {"price": 80.0}  # 20% reduction from 100
+predicted = agent._predict_outcomes(initial_state, interventions)
+
+print("\nIntervention: Reduce price from 100 to 80 (20% reduction)")
+print("Predicted outcomes:")
+for var, value in predicted.items():
+    if var in initial_state:
+        change = value - initial_state[var]
+        change_pct = (change / initial_state[var]) * 100 if initial_state[var] != 0 else 0
+        print(f"  {var}: {initial_state[var]:.2f} → {value:.2f} ({change_pct:+.1f}%)")
+
+print("\n" + "="*80)
+print("Example execution complete!")
+print("="*80)
+```
+
+Expected output structure
+-------------------------
+The `run()` method returns different structures depending on the mode:
+
+**LLM Mode** (task string):
+```python
+{
+    "task": str,  # The provided task string
+    "causal_analysis": str,  # Synthesized analysis report
+    "counterfactual_scenarios": List[CounterfactualScenario],  # Generated scenarios
+    "causal_graph_info": {
+        "nodes": List[str],
+        "edges": List[Tuple[str, str]],
+        "is_dag": bool
+    },
+    "analysis_steps": List[Dict[str, Any]]  # Step-by-step reasoning history
+}
+```
+
+**Deterministic Mode** (initial_state dict):
+```python
+{
+    "initial_state": Dict[str, float],  # Input state
+    "evolved_state": Dict[str, float],  # State after max_steps evolution
+    "counterfactual_scenarios": List[CounterfactualScenario],  # Generated scenarios
+    "causal_graph_info": {
+        "nodes": List[str],
+        "edges": List[Tuple[str, str]],
+        "is_dag": bool
+    },
+    "steps": int  # Number of evolution steps applied
+}
+```
+
+System prompt best practices
+-----------------------------
+1. **Domain-specific guidance**: Include domain knowledge relevant to your causal model
+2. **Causal reasoning principles**: Reference Pearl's causal hierarchy (association, intervention, counterfactual)
+3. **Output format**: Specify desired analysis structure and detail level
+4. **Plausibility constraints**: Guide the agent on what interventions are realistic
+5. **Quantification**: Encourage numerical estimates when appropriate
+
+Example system prompt template (a filled-in instance follows below):
+```python
+SYSTEM_PROMPT = """You are a {domain} causal reasoning expert.
+Your analysis should:
+- Identify {specific_relationships}
+- Consider {relevant_factors}
+- Generate {scenario_types}
+- Provide {output_format}
+
+Ground your reasoning in the causal graph structure provided."""
+```
+
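+A filled-in instance of the template (illustrative values only):
+```python
+SYSTEM_PROMPT = """You are a supply-chain causal reasoning expert.
+Your analysis should:
+- Identify lead-time and inventory relationships
+- Consider supplier reliability and demand seasonality
+- Generate plausible disruption counterfactuals
+- Provide ranked, quantified recommendations
+
+Ground your reasoning in the causal graph structure provided."""
+```
+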
 Why use `run()`
 --------------
 - **Dual-mode operation**: Automatically selects LLM mode (task string) or deterministic mode (initial_state dict)
@@ -145,8 +369,7 @@ flowchart TB
 Complete method index (quick)
 -----------------------------
 The following is the public surface implemented by `CRCAAgent` (Lite) in
-`ceca_lite/crca-lite.py` (canonical import: `swarms/agents/cr_ca_agent.py`).
-See the code for full docstrings and math.
+`ceca_lite/crca-lite.py`.
 
 LLM integration
 
 - `_get_cr_ca_schema()` — CR-CA function calling schema for structured reasoning
@@ -264,7 +487,7 @@ Design notes & limitations
 Extending & integration
 -----------------------
 For advanced capabilities (structure learning, Bayesian inference, optimization,
-extensive statistical methods), use the full `CRCAAgent` in `swarms/agents/cr_ca_agent.py`.
+extensive statistical methods), use the full CRCA Agent (work in progress).
 The Lite version provides core causal reasoning with LLM support while maintaining minimal dependencies.
 
 References
@@ -272,10 +495,4 @@ References
 - Pearl, J. (2009). *Causality: Models, Reasoning, and Inference*.
 - Pearl, J., & Mackenzie, D. (2018). *The Book of Why*.
 
----
-CRCAAgent (Lite) — lightweight causal reasoning Agent with LLM integration for Swarms.
-
-Implementation: `ceca_lite/crca-lite.py`
-Canonical import: `from swarms.agents.cr_ca_agent import CRCAAgent`
-