DOLPHIN/prod/diag_vol_gold.py

"""
Verify gold vol_ok methodology: compare static-threshold FIX vs gold-vol FIX.
Confirms ROI improvement and T=2155 maintained.
"""
import sys, math, pathlib
import numpy as np
import pandas as pd

sys.path.insert(0, '/mnt/dolphinng5_predict')
sys.path.insert(0, '/mnt/dolphinng5_predict/nautilus_dolphin')

print("Importing...", flush=True)
from nautilus_dolphin.nautilus.proxy_boost_engine import create_boost_engine
print("Import done.", flush=True)

PARQUET_DIR = pathlib.Path('/mnt/dolphinng5_predict/vbt_cache')
VOL_P60_INWINDOW = 0.00009868

ENG_KWARGS = dict(
    max_hold_bars=120, min_irp_alignment=0.45, max_leverage=8.0,
    vel_div_threshold=-0.02, vel_div_extreme=-0.05,
    min_leverage=0.5, leverage_convexity=3.0,
    fraction=0.20, fixed_tp_pct=0.0095, stop_pct=1.0,
    use_direction_confirm=True, dc_lookback_bars=7, dc_min_magnitude_bps=0.75,
    dc_skip_contradicts=True, dc_leverage_boost=1.0, dc_leverage_reduce=0.5,
    use_asset_selection=True, use_sp_fees=True, use_sp_slippage=True,
    sp_maker_entry_rate=0.62, sp_maker_exit_rate=0.50,
    use_ob_edge=True, ob_edge_bps=5.0, ob_confirm_rate=0.40,
    lookback=100, use_alpha_layers=True, use_dynamic_leverage=True, seed=42,
)

def make_engine(cap=25000.0):
    return create_boost_engine(mode='d_liq', initial_capital=cap, **ENG_KWARGS)

def compute_static_vol_ok(df):
    """Static threshold, 49-ret window, stored at j (old actor method)."""
    btc_f = df['BTCUSDT'].values.astype('float64')
    n = len(btc_f)
    vol_ok = np.zeros(n, dtype=bool)
    for j in range(50, n):
        seg = btc_f[max(0, j-50):j]
        diffs = np.diff(seg)
        denom = seg[:-1]
        if np.any(denom == 0):
            continue
        v = float(np.std(diffs / denom))
        if math.isfinite(v) and v > 0:
            vol_ok[j] = v > VOL_P60_INWINDOW
    return vol_ok

def compute_gold_vol_ok_all_days(parquet_files):
    """Gold vol_ok: 50-ret window, dvol[j+1], accumulating vp60. Returns {ts_ns: bool}."""
    all_vols = []
    result = {}

    for pf in parquet_files:
        df = pd.read_parquet(pf)
        ts_ns_arr = df['timestamp'].values.astype('int64') if 'timestamp' in df.columns else None
        if ts_ns_arr is None:
            continue

        bp = df['BTCUSDT'].values if 'BTCUSDT' in df.columns else None
        n = len(df)
        dvol = np.zeros(n, dtype=np.float64)

        if bp is not None and len(bp) > 1:
            rets = np.diff(bp.astype('float64')) / (bp[:-1].astype('float64') + 1e-9)
            for j in range(50, len(rets)):
                v = float(np.std(rets[j - 50:j]))
                dvol[j + 1] = v
                if v > 0:
                    all_vols.append(v)

        vp60 = float(np.percentile(all_vols, 60)) if len(all_vols) > 1000 else VOL_P60_INWINDOW

        for i in range(n):
            result[int(ts_ns_arr[i])] = bool(dvol[i] > 0 and dvol[i] > vp60)

    return result

def run_day(df, date_str, eng, vol_ok_arr, nan_fix=True):
    eng.begin_day(date_str)
    data_arr = df.values
    cols = df.columns.tolist()
    vd_idx = cols.index('vel_div') if 'vel_div' in cols else -1
    v50_idx = cols.index('v50_lambda_max_velocity') if 'v50_lambda_max_velocity' in cols else -1
    v750_idx = cols.index('v750_lambda_max_velocity') if 'v750_lambda_max_velocity' in cols else -1
    i50_idx = cols.index('instability_50') if 'instability_50' in cols else -1
    usdt_idxs = [(c, cols.index(c)) for c in cols if c.endswith('USDT')]
    trades = 0

    for i in range(len(df)):
        row_vals = data_arr[i]
        vd_raw = float(row_vals[vd_idx]) if vd_idx != -1 else float('nan')
        if not math.isfinite(vd_raw):
            if nan_fix:
                eng._global_bar_idx += 1
            continue

        v750 = float(row_vals[v750_idx]) if v750_idx != -1 and math.isfinite(float(row_vals[v750_idx])) else 0.0
        inst50 = float(row_vals[i50_idx]) if i50_idx != -1 and math.isfinite(float(row_vals[i50_idx])) else 0.0
        v50 = float(row_vals[v50_idx]) if v50_idx != -1 and math.isfinite(float(row_vals[v50_idx])) else 0.0
        prices = {sym: float(row_vals[ci]) for sym, ci in usdt_idxs
                  if math.isfinite(float(row_vals[ci])) and float(row_vals[ci]) > 0}

        prev_pos = eng.position
        if hasattr(eng, 'pre_bar_proxy_update'):
            eng.pre_bar_proxy_update(inst50, v750)

        eng.step_bar(
            bar_idx=i, vel_div=vd_raw, prices=prices,
            v50_vel=v50, v750_vel=v750,
            vol_regime_ok=bool(vol_ok_arr[i]),
        )
        if prev_pos is not None and eng.position is None:
            trades += 1

    eng.end_day()
    return trades

def main():
    files = sorted(PARQUET_DIR.glob('*.parquet'))
    print(f"Days: {len(files)}", flush=True)

    # Precompute gold vol_ok
    print("Precomputing gold vol_ok...", flush=True)
    gold_vol_ok = compute_gold_vol_ok_all_days(files)
    n_true = sum(1 for v in gold_vol_ok.values() if v)
    print(f"Gold vol_ok: {n_true:,}/{len(gold_vol_ok):,} True ({100*n_true/len(gold_vol_ok):.1f}%)", flush=True)

    static_eng = make_engine()
    gold_eng = make_engine()
    static_T = gold_T = 0

    for pf in files:
        date_str = pf.stem
        df = pd.read_parquet(pf)

        static_vol = compute_static_vol_ok(df)

        ts_ns_arr = df['timestamp'].values.astype('int64')
        gold_vol = np.array([gold_vol_ok.get(int(ts), False) for ts in ts_ns_arr], dtype=bool)

        ts = static_eng.capital
        tg = static_eng.capital
        ta = run_day(df, date_str, static_eng, static_vol, nan_fix=True)
        tb = run_day(df, date_str, gold_eng, gold_vol, nan_fix=True)
        static_T += ta; gold_T += tb

        print(f"{date_str}: STATIC+{ta:3d}(cum={static_T:4d} ${static_eng.capital:8.0f})  "
              f"GOLD+{tb:3d}(cum={gold_T:4d} ${gold_eng.capital:8.0f})", flush=True)

    ic = 25000.0
    print(f"\nSTATIC: T={static_T}, cap=${static_eng.capital:.2f}, ROI={100*(static_eng.capital/ic-1):.2f}%", flush=True)
    print(f"GOLD:   T={gold_T}, cap=${gold_eng.capital:.2f}, ROI={100*(gold_eng.capital/ic-1):.2f}%", flush=True)
    print(f"\nGold target: T=2155, ROI=+189.48%", flush=True)

if __name__ == '__main__':
    main()
initial: import DOLPHIN baseline 2026-04-21 from dolphinng5_predict working tree Includes core prod + GREEN/BLUE subsystems: - prod/ (BLUE harness, configs, scripts, docs) - nautilus_dolphin/ (GREEN Nautilus-native impl + dvae/ preserved) - adaptive_exit/ (AEM engine + models/bucket_assignments.pkl) - Observability/ (EsoF advisor, TUI, dashboards) - external_factors/ (EsoF producer) - mc_forewarning_qlabs_fork/ (MC regime/envelope) Excludes runtime caches, logs, backups, and reproducible artifacts per .gitignore. 2026-04-21 16:58:38 +02:00			`"""`
			`Verify gold vol_ok methodology: compare static-threshold FIX vs gold-vol FIX.`
			`Confirms ROI improvement and T=2155 maintained.`
			`"""`
			`import sys, math, pathlib`
			`import numpy as np`
			`import pandas as pd`

			`sys.path.insert(0, '/mnt/dolphinng5_predict')`
			`sys.path.insert(0, '/mnt/dolphinng5_predict/nautilus_dolphin')`

			`print("Importing...", flush=True)`
			`from nautilus_dolphin.nautilus.proxy_boost_engine import create_boost_engine`
			`print("Import done.", flush=True)`

			`PARQUET_DIR = pathlib.Path('/mnt/dolphinng5_predict/vbt_cache')`
			`VOL_P60_INWINDOW = 0.00009868`

			`ENG_KWARGS = dict(`
			`max_hold_bars=120, min_irp_alignment=0.45, max_leverage=8.0,`
			`vel_div_threshold=-0.02, vel_div_extreme=-0.05,`
			`min_leverage=0.5, leverage_convexity=3.0,`
			`fraction=0.20, fixed_tp_pct=0.0095, stop_pct=1.0,`
			`use_direction_confirm=True, dc_lookback_bars=7, dc_min_magnitude_bps=0.75,`
			`dc_skip_contradicts=True, dc_leverage_boost=1.0, dc_leverage_reduce=0.5,`
			`use_asset_selection=True, use_sp_fees=True, use_sp_slippage=True,`
			`sp_maker_entry_rate=0.62, sp_maker_exit_rate=0.50,`
			`use_ob_edge=True, ob_edge_bps=5.0, ob_confirm_rate=0.40,`
			`lookback=100, use_alpha_layers=True, use_dynamic_leverage=True, seed=42,`
			`)`

			`def make_engine(cap=25000.0):`
			`return create_boost_engine(mode='d_liq', initial_capital=cap, **ENG_KWARGS)`

			`def compute_static_vol_ok(df):`
			`"""Static threshold, 49-ret window, stored at j (old actor method)."""`
			`btc_f = df['BTCUSDT'].values.astype('float64')`
			`n = len(btc_f)`
			`vol_ok = np.zeros(n, dtype=bool)`
			`for j in range(50, n):`
			`seg = btc_f[max(0, j-50):j]`
			`diffs = np.diff(seg)`
			`denom = seg[:-1]`
			`if np.any(denom == 0):`
			`continue`
			`v = float(np.std(diffs / denom))`
			`if math.isfinite(v) and v > 0:`
			`vol_ok[j] = v > VOL_P60_INWINDOW`
			`return vol_ok`

			`def compute_gold_vol_ok_all_days(parquet_files):`
			`"""Gold vol_ok: 50-ret window, dvol[j+1], accumulating vp60. Returns {ts_ns: bool}."""`
			`all_vols = []`
			`result = {}`

			`for pf in parquet_files:`
			`df = pd.read_parquet(pf)`
			`ts_ns_arr = df['timestamp'].values.astype('int64') if 'timestamp' in df.columns else None`
			`if ts_ns_arr is None:`
			`continue`

			`bp = df['BTCUSDT'].values if 'BTCUSDT' in df.columns else None`
			`n = len(df)`
			`dvol = np.zeros(n, dtype=np.float64)`

			`if bp is not None and len(bp) > 1:`
			`rets = np.diff(bp.astype('float64')) / (bp[:-1].astype('float64') + 1e-9)`
			`for j in range(50, len(rets)):`
			`v = float(np.std(rets[j - 50:j]))`
			`dvol[j + 1] = v`
			`if v > 0:`
			`all_vols.append(v)`

			`vp60 = float(np.percentile(all_vols, 60)) if len(all_vols) > 1000 else VOL_P60_INWINDOW`

			`for i in range(n):`
			`result[int(ts_ns_arr[i])] = bool(dvol[i] > 0 and dvol[i] > vp60)`

			`return result`

			`def run_day(df, date_str, eng, vol_ok_arr, nan_fix=True):`
			`eng.begin_day(date_str)`
			`data_arr = df.values`
			`cols = df.columns.tolist()`
			`vd_idx = cols.index('vel_div') if 'vel_div' in cols else -1`
			`v50_idx = cols.index('v50_lambda_max_velocity') if 'v50_lambda_max_velocity' in cols else -1`
			`v750_idx = cols.index('v750_lambda_max_velocity') if 'v750_lambda_max_velocity' in cols else -1`
			`i50_idx = cols.index('instability_50') if 'instability_50' in cols else -1`
			`usdt_idxs = [(c, cols.index(c)) for c in cols if c.endswith('USDT')]`
			`trades = 0`

			`for i in range(len(df)):`
			`row_vals = data_arr[i]`
			`vd_raw = float(row_vals[vd_idx]) if vd_idx != -1 else float('nan')`
			`if not math.isfinite(vd_raw):`
			`if nan_fix:`
			`eng._global_bar_idx += 1`
			`continue`

			`v750 = float(row_vals[v750_idx]) if v750_idx != -1 and math.isfinite(float(row_vals[v750_idx])) else 0.0`
			`inst50 = float(row_vals[i50_idx]) if i50_idx != -1 and math.isfinite(float(row_vals[i50_idx])) else 0.0`
			`v50 = float(row_vals[v50_idx]) if v50_idx != -1 and math.isfinite(float(row_vals[v50_idx])) else 0.0`
			`prices = {sym: float(row_vals[ci]) for sym, ci in usdt_idxs`
			`if math.isfinite(float(row_vals[ci])) and float(row_vals[ci]) > 0}`

			`prev_pos = eng.position`
			`if hasattr(eng, 'pre_bar_proxy_update'):`
			`eng.pre_bar_proxy_update(inst50, v750)`

			`eng.step_bar(`
			`bar_idx=i, vel_div=vd_raw, prices=prices,`
			`v50_vel=v50, v750_vel=v750,`
			`vol_regime_ok=bool(vol_ok_arr[i]),`
			`)`
			`if prev_pos is not None and eng.position is None:`
			`trades += 1`

			`eng.end_day()`
			`return trades`

			`def main():`
			`files = sorted(PARQUET_DIR.glob('*.parquet'))`
			`print(f"Days: {len(files)}", flush=True)`

			`# Precompute gold vol_ok`
			`print("Precomputing gold vol_ok...", flush=True)`
			`gold_vol_ok = compute_gold_vol_ok_all_days(files)`
			`n_true = sum(1 for v in gold_vol_ok.values() if v)`
			`print(f"Gold vol_ok: {n_true:,}/{len(gold_vol_ok):,} True ({100*n_true/len(gold_vol_ok):.1f}%)", flush=True)`

			`static_eng = make_engine()`
			`gold_eng = make_engine()`
			`static_T = gold_T = 0`

			`for pf in files:`
			`date_str = pf.stem`
			`df = pd.read_parquet(pf)`

			`static_vol = compute_static_vol_ok(df)`

			`ts_ns_arr = df['timestamp'].values.astype('int64')`
			`gold_vol = np.array([gold_vol_ok.get(int(ts), False) for ts in ts_ns_arr], dtype=bool)`

			`ts = static_eng.capital`
			`tg = static_eng.capital`
			`ta = run_day(df, date_str, static_eng, static_vol, nan_fix=True)`
			`tb = run_day(df, date_str, gold_eng, gold_vol, nan_fix=True)`
			`static_T += ta; gold_T += tb`

			`print(f"{date_str}: STATIC+{ta:3d}(cum={static_T:4d} ${static_eng.capital:8.0f}) "`
			`f"GOLD+{tb:3d}(cum={gold_T:4d} ${gold_eng.capital:8.0f})", flush=True)`

			`ic = 25000.0`
			`print(f"\nSTATIC: T={static_T}, cap=${static_eng.capital:.2f}, ROI={100*(static_eng.capital/ic-1):.2f}%", flush=True)`
			`print(f"GOLD: T={gold_T}, cap=${gold_eng.capital:.2f}, ROI={100*(gold_eng.capital/ic-1):.2f}%", flush=True)`
			`print(f"\nGold target: T=2155, ROI=+189.48%", flush=True)`

			`if __name__ == '__main__':`
			`main()`