feat(aem): per-bucket MAE_MULT table + shadow logging completeness

AEM stays shadow-only this sprint (V7 drives live exits); changes affect what AEM *would have done*, logged to CH for future V7→AEM demotion analysis. adaptive_exit_engine.py: - Replace single MAE_MULT_TIER1=3.5 with MAE_MULT_BY_BUCKET dict (B3→None disables MAE stop, B4→2.0 strict, B6→6.0 wide band) - evaluate() return dict extended: mae_mult_applied, mae_threshold, atr, p_threshold, giveback_k (all params that drove the decision) - adaptive_exit_shadow schema extended (new Nullable columns added via ALTER TABLE IF NOT EXISTS — backward-compat with pre-sprint rows) - log_shadow() signature extended: v7_action, v7_exit_reason, naive_would_have (TP/STOP/MAX_HOLD counterfactual at same instant) dolphin_actor.py: - AEM shadow call now passes V7 head-to-head decision and naive counterfactual so future retrospective requires no offline replay - EsoF listener registered on DOLPHIN_FEATURES map (esof_advisor_latest key); label fed into engine._current_esof_label before each step_bar - S6/bucket loaders (_load_s6_size_table, _load_asset_bucket_data) and constructor wiring for the new GREEN engine kwargs Plan refs: Tasks 5, 7, 10 — V7 path untouched, AEM return value is never gated, CH shadow is best-effort (daemon thread). Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-04-22 06:07:46 +02:00
parent af5156f52d
commit 48dcf3fe13
2 changed files with 232 additions and 18 deletions
--- a/adaptive_exit/adaptive_exit_engine.py
+++ b/adaptive_exit/adaptive_exit_engine.py
@@ -35,7 +35,7 @@ import os
 import threading
 import time
 import urllib.request
-from typing import Optional
+from typing import Dict, Optional
 import numpy as np
@@ -45,11 +45,28 @@ from adaptive_exit.continuation_model import ContinuationModelBank, FEATURE_COLS
 # ── Config ────────────────────────────────────────────────────────────────────
 P_THRESHOLD = 0.40          # P(continuation) below this → consider exit
 GIVEBACK_K = 0.50           # MFE giveback fraction
-MAE_MULT_TIER1 = 3.5        # vol multiplier for tier-1 stop
+MAE_MULT_TIER1 = 3.5        # fallback multiplier when bucket-specific entry missing
 MAE_MULT_TIER2 = 7.0
 ATR_WINDOW = 20
 MIN_ATR = 1e-6
 # Per-bucket MAE multipliers — replaces single MAE_MULT_TIER1 in the stop check.
 # Shadow-only this sprint (AEM doesn't drive live exits; V7 does), so this shapes
 # what AEM *would have done* for data collection — not actual trade outcomes.
 # `None` disables the MAE_STOP gate entirely for that bucket (giveback/time still apply).
 #   B3 — natural winners; shadow shows 5.0–5.1 MAE peaks before FIXED_TP succeeds
 #   B4 — gross-negative alpha; cut fast before drawdown compounds
 #   B6 — extreme-vol assets; wide band or we trip on noise
 MAE_MULT_BY_BUCKET: Dict[int, Optional[float]] = {
    0: 3.5,
    1: 3.0,
    2: 3.5,
    3: None,
    4: 2.0,
    5: 4.0,
    6: 6.0,
 }
 _CH_URL = "http://localhost:8123/"
 _CH_HEADERS = {"X-ClickHouse-User": "dolphin", "X-ClickHouse-Key": "dolphin_ch_2026"}
@@ -72,7 +89,13 @@ def _ch_insert(row: dict, db: str = _SHADOW_DB) -> None:
 def _ensure_shadow_table() -> None:
-    """Create shadow table if it doesn't exist."""
+    """Create shadow table if it doesn't exist.
    Extended schema (2026-04-21, GREEN S6 sprint) captures the full AEM decision
    snapshot plus V7 action at the same instant, so a future AEM-vs-V7 demotion
    analysis can replay head-to-head without needing to re-simulate AEM.
    New columns are nullable — existing rows (pre-sprint) simply have NULL for them.
    """
    ddl = (
        f"CREATE TABLE IF NOT EXISTS {_SHADOW_DB}.{_SHADOW_TABLE} ("
        "ts            DateTime64(6, 'UTC'),"
@@ -90,19 +113,43 @@ def _ensure_shadow_table() -> None:
        "action        LowCardinality(String),"
        "exit_reason   LowCardinality(String),"
        "actual_exit   LowCardinality(String),"
-        "pnl_pct       Float32"
+        "pnl_pct       Float32,"
        # ── AEM decision params (Nullable to stay backward-compat) ──
        "mae_mult_applied   Nullable(Float32),"
        "mae_threshold      Nullable(Float32),"
        "atr                Nullable(Float32),"
        "p_threshold        Nullable(Float32),"
        "giveback_k         Nullable(Float32),"
        # ── V7 head-to-head (authoritative path) ──
        "v7_action          LowCardinality(Nullable(String)),"
        "v7_exit_reason     LowCardinality(Nullable(String)),"
        # ── Naive counterfactual (what the dumb TP/STOP/MAX_HOLD would have done) ──
        "naive_would_have   LowCardinality(Nullable(String))"
        ") ENGINE = MergeTree()"
        " ORDER BY (ts_day, asset, ts)"
        " TTL ts_day + INTERVAL 90 DAY"
    )
    # For pre-existing tables, add the new columns idempotently. CH treats
    # ADD COLUMN IF NOT EXISTS as a no-op when the column is already present.
    alters = [
        f"ALTER TABLE {_SHADOW_DB}.{_SHADOW_TABLE} ADD COLUMN IF NOT EXISTS mae_mult_applied Nullable(Float32)",
        f"ALTER TABLE {_SHADOW_DB}.{_SHADOW_TABLE} ADD COLUMN IF NOT EXISTS mae_threshold Nullable(Float32)",
        f"ALTER TABLE {_SHADOW_DB}.{_SHADOW_TABLE} ADD COLUMN IF NOT EXISTS atr Nullable(Float32)",
        f"ALTER TABLE {_SHADOW_DB}.{_SHADOW_TABLE} ADD COLUMN IF NOT EXISTS p_threshold Nullable(Float32)",
        f"ALTER TABLE {_SHADOW_DB}.{_SHADOW_TABLE} ADD COLUMN IF NOT EXISTS giveback_k Nullable(Float32)",
        f"ALTER TABLE {_SHADOW_DB}.{_SHADOW_TABLE} ADD COLUMN IF NOT EXISTS v7_action LowCardinality(Nullable(String))",
        f"ALTER TABLE {_SHADOW_DB}.{_SHADOW_TABLE} ADD COLUMN IF NOT EXISTS v7_exit_reason LowCardinality(Nullable(String))",
        f"ALTER TABLE {_SHADOW_DB}.{_SHADOW_TABLE} ADD COLUMN IF NOT EXISTS naive_would_have LowCardinality(Nullable(String))",
    ]
    try:
-        body = ddl.encode()
+        for stmt in (ddl, *alters):
            body = stmt.encode()
            req = urllib.request.Request(_CH_URL, data=body, method="POST")
            for k, v in _CH_HEADERS.items():
                req.add_header(k, v)
            urllib.request.urlopen(req, timeout=10)
    except Exception as e:
-        print(f"[AdaptiveExitEngine] Warning: could not create shadow table: {e}")
+        print(f"[AdaptiveExitEngine] Warning: could not create/alter shadow table: {e}")
 # ── Per-trade state ───────────────────────────────────────────────────────────
@@ -324,12 +371,14 @@ class AdaptiveExitEngine:
            bucket_id=st.bucket_id,
        )
-        # Decision logic
+        # Decision logic — per-bucket MAE multiplier. `None` entry disables the
-        mae_threshold = max(0.005, MAE_MULT_TIER1 * atr)
+        # MAE_STOP gate for that bucket (giveback + time checks still apply).
        mae_mult = MAE_MULT_BY_BUCKET.get(st.bucket_id, MAE_MULT_TIER1)
        mae_threshold = max(0.005, mae_mult * atr) if mae_mult is not None else None
        action = "HOLD"
        exit_reason = ""
-        if st.mae > mae_threshold:
+        if mae_threshold is not None and st.mae > mae_threshold:
            action = "EXIT"
            exit_reason = "AE_MAE_STOP"
        elif (st.peak_mfe > 0 and st.mfe < GIVEBACK_K * st.peak_mfe
@@ -352,10 +401,31 @@ class AdaptiveExitEngine:
            "bucket_id": st.bucket_id,
            "vel_div_entry": st.vel_div_entry,
            "vel_div_now": vel_div_now,
            "mae_mult_applied": mae_mult,
            "mae_threshold": mae_threshold,
            "atr": atr,
            "p_threshold": P_THRESHOLD,
            "giveback_k": GIVEBACK_K,
        }
-    def log_shadow(self, shadow: dict, actual_exit: str = "", pnl_pct: float = 0.0) -> None:
+    def log_shadow(
-        """Async log a shadow decision to ClickHouse."""
+        self,
        shadow: dict,
        actual_exit: str = "",
        pnl_pct: float = 0.0,
        v7_action: Optional[str] = None,
        v7_exit_reason: Optional[str] = None,
        naive_would_have: Optional[str] = None,
    ) -> None:
        """Async log a shadow decision to ClickHouse.
        V7 head-to-head + naive counterfactual are optional but should be passed
        from dolphin_actor whenever available — they enable the future AEM-vs-V7
        demotion analysis without needing an offline replay.
        """
        def _opt(v):
            return None if v is None else float(v)
        row = {
            "ts": int(time.time() * 1e6),
            "trade_id": shadow.get("trade_id", ""),
@@ -372,5 +442,15 @@ class AdaptiveExitEngine:
            "exit_reason": shadow.get("exit_reason_shadow", ""),
            "actual_exit": actual_exit,
            "pnl_pct": float(pnl_pct),
            # New AEM-decision params (Nullable-capable)
            "mae_mult_applied": _opt(shadow.get("mae_mult_applied")),
            "mae_threshold":    _opt(shadow.get("mae_threshold")),
            "atr":              _opt(shadow.get("atr")),
            "p_threshold":      _opt(shadow.get("p_threshold")),
            "giveback_k":       _opt(shadow.get("giveback_k")),
            # Head-to-head
            "v7_action":        v7_action,
            "v7_exit_reason":   v7_exit_reason,
            "naive_would_have": naive_would_have,
        }
        threading.Thread(target=_ch_insert, args=(row,), daemon=True).start()
--- a/nautilus_dolphin/nautilus_dolphin/nautilus/dolphin_actor.py
+++ b/nautilus_dolphin/nautilus_dolphin/nautilus/dolphin_actor.py
@@ -5,6 +5,7 @@ import threading
 import time
 from collections import deque, namedtuple
 from datetime import datetime, timezone
 from typing import Optional
 import numpy as np
 import pandas as pd
 from pathlib import Path
@@ -136,6 +137,7 @@ class DolphinActor(Strategy):
        self._v6_decisions: dict = {}    # trade_id → latest evaluate() result
        # EXF macro snapshot — updated from ACB payload, injected into V7 contexts each scan
        self._last_exf: dict = {}        # keys: funding, dvol, fear_greed, taker
        self._current_esof_label: Optional[str] = None  # cached from HZ esof_advisor_latest
        # Adaptive exit engine — parallel shadow mode (never executes real exits)
        self._adaptive_exit = None
        # Stablecoin symbols ÔÇö kept in eigen for purity, hard-blocked at picker
@@ -148,6 +150,57 @@ class DolphinActor(Strategy):
        self._bucket_assignments: dict = {}
        self._hibernate_protect_active: str | None = None
    # ── GREEN S6/EsoF/AEM loaders (BLUE skips these via absent config keys) ──
    def _load_s6_size_table(self):
        """Resolve GREEN S6 bucket→multiplier table.
        Precedence (first non-None wins):
          1) `s6_table_path` in config → YAML file's `buckets:` mapping
          2) `s6_size_table` inline in config
          3) None (BLUE no-op)
        """
        try:
            _path = self.dolphin_config.get('s6_table_path')
            if _path:
                import yaml  # local import — BLUE never reaches here
                _p = Path(_path)
                if not _p.is_absolute():
                    _p = Path.cwd() / _p
                if _p.exists():
                    with open(_p, 'r') as _f:
                        _doc = yaml.safe_load(_f) or {}
                    _b = _doc.get('buckets')
                    if isinstance(_b, dict):
                        return {int(k): float(v) for k, v in _b.items()}
            _inline = self.dolphin_config.get('s6_size_table')
            if isinstance(_inline, dict):
                return {int(k): float(v) for k, v in _inline.items()}
        except Exception as _e:
            self.log.warning(f"[S6] s6_size_table load failed: {_e} — feature disabled")
        return None
    def _load_asset_bucket_data(self):
        """Load KMeans bucket assignments from adaptive_exit/models/bucket_assignments.pkl.
        Returns the authoritative `{"assignments": {symbol: int, ...}, ...}` dict used by
        both the orchestrator (for S6 lookup) and the selector (for ban-set filtering).
        """
        try:
            import pickle
            _path = self.dolphin_config.get(
                'asset_bucket_pkl',
                'adaptive_exit/models/bucket_assignments.pkl',
            )
            _p = Path(_path)
            if not _p.is_absolute():
                _p = Path.cwd() / _p
            if _p.exists():
                with open(_p, 'rb') as _f:
                    return pickle.load(_f)
        except Exception as _e:
            self.log.warning(f"[S6] bucket_assignments load failed: {_e} — S6 + ban disabled")
        return None
    def on_start(self):
        # Read posture from HZ DOLPHIN_SAFETY
        self.hz_client = self._connect_hz()
@@ -206,8 +259,24 @@ class DolphinActor(Strategy):
            use_alpha_layers=eng_cfg.get('use_alpha_layers', True),
            use_dynamic_leverage=eng_cfg.get('use_dynamic_leverage', True),
            seed=eng_cfg.get('seed', 42),
            # GREEN S6/EsoF/AEM sprint — top-level config keys, not nested under engine.
            # BLUE leaves these unset → orchestrator reads None/False → BLUE no-op.
            s6_size_table=self._load_s6_size_table(),
            esof_sizing_table=self.dolphin_config.get('esof_sizing_table'),
            asset_bucket_data=self._load_asset_bucket_data(),
            use_int_leverage=bool(self.dolphin_config.get('use_int_leverage', False)),
        )
        self.engine = create_boost_engine(mode=boost_mode, **_engine_kwargs)
        # Wire asset selector ban-set (shared file, BLUE-invariant when ban_set is None).
        _ban = self.dolphin_config.get('asset_bucket_ban_set')
        _bucket_data = _engine_kwargs.get('asset_bucket_data') or {}
        if _ban:
            try:
                self.engine.asset_selector.asset_bucket_ban_set = set(int(b) for b in _ban)
                self.engine.asset_selector.asset_bucket_assignments = dict(_bucket_data.get('assignments', {}))
            except Exception as _e:
                self.log.warning(f"[S6] Failed to wire asset_bucket_ban_set: {_e}")
        self.engine.set_esoteric_hazard_multiplier(0.0)  # gold spec: init guard, MUST precede set_mc_forewarner
        # == MC-Forewarner injection ===========================================
@@ -509,10 +578,34 @@ class DolphinActor(Strategy):
                added_func=self._on_scan_event,
                updated_func=self._on_scan_event,
            )
-            self.log.info("[HZ] Push listeners registered: acb_boost + latest_eigen_scan")
+            # EsoF advisor listener — feeds orchestrator regime gate at _try_entry.
            # Callback is zero-work (JSON parse + dict write); the label is consumed
            # just before step_bar on the timer thread.
            features.add_entry_listener(
                include_value=True,
                key='esof_advisor_latest',
                added_func=self._on_esof_event,
                updated_func=self._on_esof_event,
            )
            self.log.info("[HZ] Push listeners registered: acb_boost + latest_eigen_scan + esof_advisor_latest")
        except Exception as e:
            self.log.error(f"Failed to setup ACB listener: {e}")
    def _on_esof_event(self, event):
        """Cache EsoF label for the orchestrator regime gate. Tolerates stale JSON
        schema — on any parse error we fall back to no label (orchestrator treats
        None as UNKNOWN, the new renamed conflict-state default)."""
        try:
            val = event.value
            if not val:
                return
            parsed = json.loads(val) if isinstance(val, str) else val
            label = parsed.get('advisory_label') if isinstance(parsed, dict) else None
            if isinstance(label, str) and label:
                self._current_esof_label = label
        except Exception:
            self._current_esof_label = None
    def _on_scan_event(self, event):
        """HZ reactor-thread callback -- fires immediately when NG7 writes to HZ.
        Zero-work: stores raw string + sets edge-trigger flag. No JSON parsing,
@@ -683,6 +776,13 @@ class DolphinActor(Strategy):
            getattr(self.engine, '_mc_gate_open', True),
        )
        # Feed EsoF label into orchestrator — consumed by regime gate at _try_entry top.
        # Engine tolerates None (treated as UNKNOWN under the NEUTRAL→UNKNOWN rename).
        try:
            self.engine._current_esof_label = self._current_esof_label
        except Exception:
            pass
        _step_start = time.monotonic()
        try:
            result = self.engine.step_bar(
@@ -1536,7 +1636,41 @@ class DolphinActor(Strategy):
                            exf=self._last_exf,
                        )
                        _shadow['asset'] = _pend_ae['asset']
-                        self._adaptive_exit.log_shadow(_shadow)
+
                        # V7 head-to-head: pull the authoritative-path decision for
                        # the same trade at the same instant (may be None if V7 not
                        # wired or hasn't decided yet — log_shadow tolerates None).
                        _v7_dec_ae = self._v6_decisions.get(_tid_ae) or {}
                        _v7_action    = _v7_dec_ae.get('action')
                        _v7_exit_reason = _v7_dec_ae.get('reason')
                        # Naive counterfactual: pure TP/STOP/MAX_HOLD at this bar.
                        _naive_would_have: Optional[str] = None
                        try:
                            _eng_cfg_ae = self.dolphin_config.get('engine', {})
                            _tp = float(_eng_cfg_ae.get('fixed_tp_pct', 0.0095))
                            _sl = float(_eng_cfg_ae.get('stop_pct', 0.0)) or 0.0
                            _mh = int(_eng_cfg_ae.get('max_hold_bars', 120))
                            _dir_ae = -1 if _pend_ae['side'] == 'SHORT' else 1
                            _ep_ae = float(_pend_ae['entry_price'] or 0.0)
                            _pnl_naive = (_dir_ae * (_ep_ae - float(_cur_px_ae)) / _ep_ae) if _ep_ae > 0 else 0.0
                            if _pnl_naive >= _tp:
                                _naive_would_have = 'TP'
                            elif _sl > 0 and _pnl_naive <= -_sl:
                                _naive_would_have = 'STOP'
                            elif _bars_ae >= _mh:
                                _naive_would_have = 'MAX_HOLD'
                            else:
                                _naive_would_have = 'HOLD'
                        except Exception:
                            _naive_would_have = None
                        self._adaptive_exit.log_shadow(
                            _shadow,
                            v7_action=_v7_action,
                            v7_exit_reason=_v7_exit_reason,
                            naive_would_have=_naive_would_have,
                        )
            except Exception:
                pass  # shadow must never affect live trading