initial: import DOLPHIN baseline 2026-04-21 from dolphinng5_predict working tree

Includes core prod + GREEN/BLUE subsystems:
- prod/ (BLUE harness, configs, scripts, docs)
- nautilus_dolphin/ (GREEN Nautilus-native impl + dvae/ preserved)
- adaptive_exit/ (AEM engine + models/bucket_assignments.pkl)
- Observability/ (EsoF advisor, TUI, dashboards)
- external_factors/ (EsoF producer)
- mc_forewarning_qlabs_fork/ (MC regime/envelope)

Excludes runtime caches, logs, backups, and reproducible artifacts per .gitignore.
Author: hjnormey
Date:   2026-04-21 16:58:38 +02:00
Commit: 01c19662cb
643 changed files with 260241 additions and 0 deletions

nautilus_dolphin/run_go1_ood.py Executable file

@@ -0,0 +1,259 @@
"""GO1 / GO2 OOD Dress Rehearsal - Baseline run on all available parquet data.
Run: python run_go1_ood.py
     python run_go1_ood.py --label GO2
"""
import sys, time, math, argparse
from pathlib import Path
import numpy as np
import pandas as pd
# Force UTF-8 output (Windows cp1252 safety)
if hasattr(sys.stdout, 'reconfigure'):
    sys.stdout.reconfigure(encoding='utf-8')
sys.path.insert(0, str(Path(__file__).parent))
# ── JIT warmup ─────────────────────────────────────────────────────────────
print("Compiling numba kernels...")
t0c = time.time()
from nautilus_dolphin.nautilus.alpha_asset_selector import compute_irp_nb, compute_ars_nb, rank_assets_irp_nb
from nautilus_dolphin.nautilus.alpha_bet_sizer import compute_sizing_nb
from nautilus_dolphin.nautilus.alpha_signal_generator import check_dc_nb
_p = np.array([1.0, 2.0, 3.0], dtype=np.float64)
compute_irp_nb(_p, -1); compute_ars_nb(1.0, 0.5, 0.01)
rank_assets_irp_nb(np.ones((10, 2), dtype=np.float64), 8, -1, 5, 500.0, 20, 0.20)
compute_sizing_nb(-0.03, -0.02, -0.05, 3.0, 0.5, 5.0, 0.20, True, True, 0.0,
                  np.zeros(4, dtype=np.int64), np.zeros(4, dtype=np.int64),
                  np.zeros(5, dtype=np.float64), 0, -1, 0.01, 0.04)
check_dc_nb(_p, 3, 1, 0.75)
print(f" JIT: {time.time() - t0c:.1f}s")
from nautilus_dolphin.nautilus.alpha_orchestrator import NDAlphaEngine
from nautilus_dolphin.nautilus.adaptive_circuit_breaker import AdaptiveCircuitBreaker
# ── Config ─────────────────────────────────────────────────────────────────
VBT_DIR = Path(r"C:\Users\Lenovo\Documents\- DOLPHIN NG HD HCM TSF Predict\vbt_cache")
META_COLS = {'timestamp', 'scan_number', 'v50_lambda_max_velocity', 'v150_lambda_max_velocity',
             'v300_lambda_max_velocity', 'v750_lambda_max_velocity', 'vel_div',
             'instability_50', 'instability_150'}
ENGINE_KWARGS = dict(
    initial_capital=25000.0, vel_div_threshold=-0.02, vel_div_extreme=-0.05,
    min_leverage=0.5, max_leverage=5.0, leverage_convexity=3.0,
    fraction=0.20, fixed_tp_pct=0.0099, stop_pct=1.0, max_hold_bars=120,
    use_direction_confirm=True, dc_lookback_bars=7, dc_min_magnitude_bps=0.75,
    dc_skip_contradicts=True, dc_leverage_boost=1.0, dc_leverage_reduce=0.5,
    use_asset_selection=True, min_irp_alignment=0.45,
    use_sp_fees=True, use_sp_slippage=True,
    sp_maker_entry_rate=0.62, sp_maker_exit_rate=0.50,
    use_ob_edge=True, ob_edge_bps=5.0, ob_confirm_rate=0.40,
    lookback=100, use_alpha_layers=True, use_dynamic_leverage=True, seed=42,
)
VD_THRESH = -0.02; VD_EXTREME = -0.05; CONVEXITY = 3.0
PAPER_CAPITAL = 10000.0 # user paper-trade capital
SIM_CAPITAL = 25000.0 # engine simulation capital
SCALE = PAPER_CAPITAL / SIM_CAPITAL # 0.40
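# Reporting note (descriptive, not part of the engine): the net P&L, capital, and daily
# breakdown figures printed at the end are rescaled by SCALE before display, so e.g. a
# simulated +$250.00 day on the $25k sim account shows as +$100.00 at the $10k paper
# scale (250 * 0.40 = 100); the engine itself always runs on SIM_CAPITAL.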
# ── Data load ──────────────────────────────────────────────────────────────
parquet_files = sorted(VBT_DIR.glob("*.parquet"))
parquet_files = [p for p in parquet_files if 'catalog' not in str(p)]
acb = AdaptiveCircuitBreaker()
date_strings = [pf.stem for pf in parquet_files]
acb.preload_w750(date_strings)
all_vols = []
for pf in parquet_files[:2]:
    df = pd.read_parquet(pf)
    if 'BTCUSDT' not in df.columns: continue
    pr = df['BTCUSDT'].values
    for i in range(60, len(pr)):
        seg = pr[max(0, i-50):i]
        if len(seg) < 10: continue
        v = float(np.std(np.diff(seg)/seg[:-1]))
        if v > 0: all_vols.append(v)
vol_p60 = float(np.percentile(all_vols, 60)) if all_vols else 0.0
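# Descriptive note: vol_p60 is the 60th-percentile rolling BTC return volatility sampled from
# the first two parquet days; run_engine() later sets vol_regime_ok=True only when a bar's own
# 50-bar rolling std exceeds this threshold and at least 100 bars of the day have elapsed.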
pq_data = {}
for pf in parquet_files:
    df = pd.read_parquet(pf)
    ac = [c for c in df.columns if c not in META_COLS]
    bp = df['BTCUSDT'].values if 'BTCUSDT' in df.columns else None
    dv = np.full(len(df), np.nan)
    if bp is not None:
        for i in range(50, len(bp)):
            seg = bp[max(0, i-50):i]
            if len(seg) < 10: continue
            dv[i] = float(np.std(np.diff(seg)/seg[:-1]))
    pq_data[pf.stem] = (df, ac, dv)
def strength_cubic(vel_div):
    if vel_div >= VD_THRESH: return 0.0
    raw = (VD_THRESH - vel_div) / (VD_THRESH - VD_EXTREME)
    return min(1.0, max(0.0, raw)) ** CONVEXITY
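# Worked example for the cubic strength curve (hypothetical vel_div, constants as above):
# vel_div = -0.035 -> raw = (-0.02 - -0.035) / (-0.02 - -0.05) = 0.5 -> strength = 0.5**3 = 0.125.
# Readings at or above VD_THRESH return 0.0; readings at or below VD_EXTREME saturate at 1.0.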
# ── Engine run ─────────────────────────────────────────────────────────────
def run_engine():
    import gc; gc.collect()
    engine = NDAlphaEngine(**ENGINE_KWARGS)
    bar_idx = 0; ph = {}; dstats = []
    for pf in parquet_files:
        ds = pf.stem; cs = engine.capital
        engine.regime_direction = -1
        engine.regime_dd_halt = False
        acb_info = acb.get_dynamic_boost_for_date(ds, ob_engine=None)
        base_boost = acb_info['boost']
        beta = acb_info['beta']
        df, acols, dvol = pq_data[ds]
        bid = 0
        for ri in range(len(df)):
            row = df.iloc[ri]; vd = row.get("vel_div")
            if vd is None or not np.isfinite(vd): bar_idx+=1; bid+=1; continue
            prices = {}
            for ac in acols:
                p = row[ac]
                if p and p > 0 and np.isfinite(p):
                    prices[ac] = float(p)
                    if ac not in ph: ph[ac] = []
                    ph[ac].append(float(p))
                    if len(ph[ac]) > 500: ph[ac] = ph[ac][-200:]
            if not prices: bar_idx+=1; bid+=1; continue
            vrok = False if bid < 100 else (np.isfinite(dvol[ri]) and dvol[ri] > vol_p60)
            if beta > 0 and base_boost > 1.0:
                ss = strength_cubic(float(vd))
                engine.regime_size_mult = base_boost * (1.0 + beta * ss)
            else:
                engine.regime_size_mult = base_boost
            engine.process_bar(bar_idx=bar_idx, vel_div=float(vd), prices=prices,
                               vol_regime_ok=vrok, price_histories=ph)
            bar_idx+=1; bid+=1
        dstats.append({'date': ds, 'pnl': engine.capital - cs, 'cap': engine.capital})
    tr = engine.trade_history
    w = [t for t in tr if t.pnl_absolute > 0]
    l = [t for t in tr if t.pnl_absolute <= 0]
    gw = sum(t.pnl_absolute for t in w) if w else 0.0
    gl = abs(sum(t.pnl_absolute for t in l)) if l else 0.0
    roi = (engine.capital - SIM_CAPITAL) / SIM_CAPITAL * 100
    pf_val = gw / gl if gl > 0 else 999.0
    dr = [s['pnl'] / SIM_CAPITAL * 100 for s in dstats]
    sharpe = np.mean(dr) / np.std(dr) * np.sqrt(365) if np.std(dr) > 0 else 0.0
    peak_cap = SIM_CAPITAL; max_dd = 0.0
    for s in dstats:
        peak_cap = max(peak_cap, s['cap'])
        dd = (peak_cap - s['cap']) / peak_cap * 100
        max_dd = max(max_dd, dd)
    wr = len(w) / len(tr) * 100 if tr else 0.0
    avg_win = float(np.mean([t.pnl_pct for t in w]) * 100) if w else 0.0
    avg_loss = float(np.mean([t.pnl_pct for t in l]) * 100) if l else 0.0
    return {
        'roi': roi, 'pf': pf_val, 'dd': max_dd, 'sharpe': sharpe,
        'trades': len(tr), 'capital': engine.capital,
        'wr': wr, 'avg_win': avg_win, 'avg_loss': avg_loss,
        'n_wins': len(w), 'n_losses': len(l),
        'dstats': dstats,
    }
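# Sanity check on the summary metrics (illustrative numbers only, not outputs of this run):
# gross wins of $300 against gross losses of $200 give pf_val = 1.5; a capital path peaking at
# $26,000 and later reading $25,220 gives a drawdown of (26000 - 25220) / 26000 * 100 = 3.0%,
# and max_dd keeps the largest such value across days. Sharpe annualizes the per-file daily
# returns with sqrt(365), i.e. each parquet file is treated as one calendar day.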
# ── Main ───────────────────────────────────────────────────────────────────
if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument('--label', default='GO1', help='Run label (GO1 or GO2)')
    args = parser.parse_args()
    label = args.label.upper()
    print(f"\n{'='*70}")
    print(f" DOLPHIN NG -- OOD DRESS REHEARSAL [{label}]")
    print(f"{'='*70}")
    print(f" Data: {date_strings[0]} to {date_strings[-1]} ({len(date_strings)} days)")
    print(f" Capital: ${PAPER_CAPITAL:,.0f} paper (sim at ${SIM_CAPITAL:,.0f}, scale={SCALE:.2f})")
    print(f" OB: BASELINE (no OB engine)")
    print(f" Mode: Eigenvalue signal only")
    print(f"{'='*70}")
    t0 = time.time()
    r = run_engine()
    elapsed = time.time() - t0
    net_pnl_paper = (r['capital'] - SIM_CAPITAL) * SCALE
    cap_paper = r['capital'] * SCALE
    print(f"\n [{label}] RESULT ({elapsed:.0f}s)")
    print(f" {'─'*66}")
    print(f" ROI: {r['roi']:+.2f}%")
    print(f" PF: {r['pf']:.3f}")
    print(f" Sharpe: {r['sharpe']:.2f}")
    print(f" Max DD: {r['dd']:.2f}%")
    print(f" Trades: {r['trades']} WR: {r['wr']:.1f}% AvgW: {r['avg_win']:+.3f}% AvgL: {r['avg_loss']:+.3f}%")
    print(f" W/L: {r['n_wins']}/{r['n_losses']}")
    print(f" Capital: ${cap_paper:,.2f} (net {net_pnl_paper:+,.2f} on $10k paper)")
    print(f" {'─'*66}")
    # Last 7 days breakdown
    tail = r['dstats'][-7:]
    print(f"\n Last {len(tail)} days daily P&L (paper $10k scale):")
    for s in tail:
        pnl_p = s['pnl'] * SCALE
        cap_p = s['cap'] * SCALE
        bar = '+' * int(abs(pnl_p) / 2) if pnl_p >= 0 else '-' * int(abs(pnl_p) / 2)
        sign = '+' if pnl_p >= 0 else ''
        print(f" {s['date']} {sign}${pnl_p:6.2f} cap ${cap_p:,.2f} {bar}")
    print(f"\n{'='*70}\n")
    # Save snapshot for GO2 delta calc
    import json
    snap = {
        'label': label,
        'dates': date_strings,
        'roi': r['roi'],
        'pf': r['pf'],
        'sharpe': r['sharpe'],
        'dd': r['dd'],
        'trades': r['trades'],
        'wr': r['wr'],
        'capital': r['capital'],
        'n_wins': r['n_wins'],
        'n_losses': r['n_losses'],
        'dstats': r['dstats'],
    }
    snap_path = Path(__file__).parent / f'ood_{label.lower()}_snap.json'
    with open(snap_path, 'w') as f:
        json.dump(snap, f, indent=2)
    print(f" Snapshot saved: {snap_path.name}")
    # If GO2, load GO1 snap and print delta
    if label == 'GO2':
        go1_path = Path(__file__).parent / 'ood_go1_snap.json'
        if go1_path.exists():
            with open(go1_path) as f:
                g1 = json.load(f)
            new_days = [d for d in date_strings if d not in g1['dates']]
            d_roi = r['roi'] - g1['roi']
            d_trades = r['trades'] - g1['trades']
            d_wr = r['wr'] - g1['wr']
            d_cap = (r['capital'] - g1['capital']) * SCALE
            print(f" {'='*66}")
            print(f" DELTA vs GO1")
            print(f" {'─'*66}")
            print(f" New days ingested: {new_days if new_days else '(none -- same dataset)'}")
            print(f" dROI: {d_roi:+.2f}%")
            print(f" dTrades: {d_trades:+d}")
            print(f" dWR: {d_wr:+.2f}%")
            print(f" dCapital: {d_cap:+,.2f} (paper $10k)")
            if new_days:
                print(f"\n New day(s) P&L:")
                new_dstats = [s for s in r['dstats'] if s['date'] in new_days]
                for s in new_dstats:
                    pnl_p = s['pnl'] * SCALE
                    sign = '+' if pnl_p >= 0 else ''
                    print(f" {s['date']} {sign}${pnl_p:.2f} (paper)")
            print(f" {'='*66}\n")
        else:
            print(" [GO2] No GO1 snapshot found -- run GO1 first.")