275 lines
11 KiB
Python
275 lines
11 KiB
Python
import argparse
|
|
|
|
import matplotlib.pyplot as plt
|
|
import numpy as np
|
|
import pandas as pd
|
|
|
|
import data_manager
|
|
import factor_attribution
|
|
import metrics
|
|
from strategies.adaptive_momentum import AdaptiveMomentumStrategy
|
|
from strategies.buy_and_hold import BuyAndHoldStrategy
|
|
from strategies.dual_momentum import DualMomentumStrategy
|
|
from strategies.inverse_vol import InverseVolatilityStrategy
|
|
from strategies.mean_reversion import MeanReversionStrategy
|
|
from strategies.momentum import MomentumStrategy
|
|
from strategies.momentum_quality import MomentumQualityStrategy
|
|
from strategies.multi_factor import MultiFactorStrategy
|
|
from strategies.recovery_momentum import RecoveryMomentumStrategy
|
|
from strategies.trend_following import TrendFollowingStrategy
|
|
from universe import UNIVERSES
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Backtest engine
|
|
# ---------------------------------------------------------------------------
|
|
|
|
def backtest(
|
|
strategy,
|
|
data: pd.DataFrame,
|
|
initial_capital: float = 100_000,
|
|
transaction_cost: float = 0.001,
|
|
fixed_fee: float = 0.0,
|
|
open_data: pd.DataFrame | None = None,
|
|
) -> pd.Series:
|
|
"""
|
|
Vectorized backtest.
|
|
|
|
Parameters
|
|
----------
|
|
strategy : Strategy
|
|
Any class implementing generate_signals(data) → DataFrame of weights.
|
|
data : pd.DataFrame
|
|
Adjusted close prices, one column per asset.
|
|
initial_capital : float
|
|
Starting portfolio value.
|
|
transaction_cost : float
|
|
One-way cost per unit of turnover (e.g. 0.001 = 10 bps).
|
|
fixed_fee : float
|
|
Fixed dollar cost per individual trade (each buy or sell).
|
|
open_data : pd.DataFrame, optional
|
|
Open prices. When provided, enables open-to-close execution mode:
|
|
- Morning: observe open prices → run strategy → decide weights
|
|
- Evening: execute all trades at close prices
|
|
Strategies have an internal shift(1) designed for close prices.
|
|
Since open prices are observable same-day (before close), we undo
|
|
that shift so signals use today's open and execute at today's close.
|
|
|
|
Returns
|
|
-------
|
|
pd.Series
|
|
Daily equity curve.
|
|
"""
|
|
if open_data is not None:
|
|
# Open-to-close mode:
|
|
# Strategy's shift(1) on open prices gives: weights[t] = f(open_{t-1})
|
|
# But open_t is known at morning of day t, so undo shift to get f(open_t)
|
|
# Then execute at close_t, earning close_t → close_{t+1}
|
|
weights = strategy.generate_signals(open_data)
|
|
weights = weights.shift(-1).fillna(0.0)
|
|
weights = weights.reindex(data.index).fillna(0.0)
|
|
positions = weights
|
|
|
|
# Returns earned: close[t] → close[t+1], weighted by positions decided at open[t]
|
|
close_returns = data.pct_change().fillna(0.0)
|
|
portfolio_returns = (close_returns * positions.shift(1).fillna(0.0)).sum(axis=1)
|
|
else:
|
|
# Classic close-to-close mode
|
|
weights = strategy.generate_signals(data)
|
|
weights = weights.reindex(data.index).fillna(0.0)
|
|
positions = weights
|
|
|
|
daily_returns = data.pct_change().fillna(0.0)
|
|
portfolio_returns = (daily_returns * positions).sum(axis=1)
|
|
|
|
# Turnover cost: sum of absolute weight changes each day
|
|
turnover = positions.diff().abs().sum(axis=1).fillna(0.0)
|
|
portfolio_returns -= turnover * transaction_cost
|
|
|
|
# Fixed per-trade fee: count positions with non-zero weight change
|
|
if fixed_fee > 0:
|
|
weight_changes = positions.diff().fillna(0.0)
|
|
n_trades = (weight_changes.abs() > 1e-8).sum(axis=1)
|
|
# Build running equity to convert dollar fees to return impact
|
|
equity_running = (1 + portfolio_returns).cumprod() * initial_capital
|
|
fee_impact = (n_trades * fixed_fee) / equity_running.shift(1).fillna(initial_capital)
|
|
portfolio_returns -= fee_impact
|
|
|
|
equity = (1 + portfolio_returns).cumprod() * initial_capital
|
|
return equity
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Visualization
|
|
# ---------------------------------------------------------------------------
|
|
|
|
def plot_results(results: pd.DataFrame) -> None:
|
|
"""Two-panel chart: equity curves (top) + drawdowns (bottom)."""
|
|
# Compute drawdowns
|
|
drawdowns = results.div(results.cummax()) - 1
|
|
|
|
fig, (ax1, ax2) = plt.subplots(2, 1, figsize=(14, 9), sharex=True,
|
|
gridspec_kw={"height_ratios": [3, 1]})
|
|
|
|
for col in results.columns:
|
|
ax1.plot(results.index, results[col], label=col, linewidth=1.5)
|
|
ax1.set_title("Strategy Comparison — Equity Curves", fontsize=14)
|
|
ax1.set_ylabel("Portfolio Value ($)")
|
|
ax1.legend(loc="upper left")
|
|
ax1.grid(True, alpha=0.3)
|
|
|
|
for col in drawdowns.columns:
|
|
ax2.plot(drawdowns.index, drawdowns[col] * 100, label=col, linewidth=1.0)
|
|
ax2.set_title("Drawdowns")
|
|
ax2.set_ylabel("Drawdown (%)")
|
|
ax2.set_xlabel("Date")
|
|
ax2.grid(True, alpha=0.3)
|
|
|
|
plt.tight_layout()
|
|
plt.show()
|
|
|
|
|
|
# ---------------------------------------------------------------------------
|
|
# Main
|
|
# ---------------------------------------------------------------------------
|
|
|
|
def main() -> None:
|
|
parser = argparse.ArgumentParser(description="Run strategy backtest")
|
|
parser.add_argument(
|
|
"--market", choices=UNIVERSES.keys(), default="us",
|
|
help="Market universe to backtest (default: us)",
|
|
)
|
|
parser.add_argument(
|
|
"--capital", type=float, default=None,
|
|
help="Initial capital (default: 10000)",
|
|
)
|
|
parser.add_argument(
|
|
"--top-n", type=int, default=None,
|
|
help="Number of stocks for selective strategies (default: ~10%% of universe)",
|
|
)
|
|
parser.add_argument(
|
|
"--years", type=int, default=None,
|
|
help="Limit backtest to last N years of data",
|
|
)
|
|
parser.add_argument(
|
|
"--no-plot", action="store_true",
|
|
help="Skip plotting charts",
|
|
)
|
|
parser.add_argument(
|
|
"--fixed-fee", type=float, default=0.0,
|
|
help="Fixed dollar cost per trade, e.g. 2.0 means $2 per buy or sell",
|
|
)
|
|
parser.add_argument(
|
|
"--execution", choices=["close", "open-close"], default="close",
|
|
help="Execution mode: 'close' (default, signal & execute on close) or "
|
|
"'open-close' (signal on morning open, execute at close)",
|
|
)
|
|
parser.add_argument(
|
|
"--attribution", action="store_true",
|
|
help="Run factor attribution after performance metrics",
|
|
)
|
|
parser.add_argument(
|
|
"--attribution-model", choices=["capm", "ff5", "ff5plus", "all"], default="all",
|
|
help="Factor model selection for attribution output",
|
|
)
|
|
parser.add_argument(
|
|
"--attribution-export", default=None,
|
|
help="Directory to export factor attribution CSVs",
|
|
)
|
|
args = parser.parse_args()
|
|
initial_capital = args.capital if args.capital is not None else 10_000
|
|
use_open = args.execution == "open-close"
|
|
|
|
universe = UNIVERSES[args.market]
|
|
tickers = universe["fetch"]()
|
|
benchmark = universe["benchmark"]
|
|
benchmark_label = universe["benchmark_label"]
|
|
all_tickers = sorted(set(tickers + [benchmark]))
|
|
|
|
result = data_manager.update(args.market, all_tickers, with_open=use_open)
|
|
if use_open:
|
|
data, open_data = result
|
|
else:
|
|
data = result
|
|
open_data = None
|
|
|
|
if args.years:
|
|
cutoff = data.index[-1] - pd.DateOffset(years=args.years)
|
|
data = data[data.index >= cutoff]
|
|
if open_data is not None:
|
|
open_data = open_data[open_data.index >= cutoff]
|
|
print(f"--- Sliced to last {args.years} years: {data.index[0].date()} to {data.index[-1].date()} ---")
|
|
|
|
# Filter tickers to only those in the data
|
|
tickers = [t for t in tickers if t in data.columns]
|
|
print(f"--- Universe: {len(tickers)} stocks + {benchmark} benchmark ---")
|
|
|
|
top_n = args.top_n if args.top_n else max(5, len(tickers) // 10)
|
|
print(f"--- Selective strategies will pick top {top_n} stocks ---")
|
|
if args.fixed_fee > 0:
|
|
print(f"--- Fixed fee: ${args.fixed_fee:.2f} per trade ---")
|
|
if use_open:
|
|
print(f"--- Execution: open-close (signal on open, execute at close) ---")
|
|
|
|
# Build strategy tuples: (strategy, close_data, open_data_or_None)
|
|
open_tickers = open_data[tickers] if open_data is not None else None
|
|
open_all = open_data if open_data is not None else None
|
|
|
|
strategies = {
|
|
# --- Original strategies ---
|
|
"Buy & Hold (EW)": (BuyAndHoldStrategy(), data[tickers], open_tickers),
|
|
"Momentum": (MomentumStrategy(lookback=252, skip=21, top_n=top_n), data[tickers], open_tickers),
|
|
"Inverse Volatility": (InverseVolatilityStrategy(vol_window=20), data[tickers], open_tickers),
|
|
"Multi-Factor": (MultiFactorStrategy(tickers=tickers, benchmark=benchmark, top_n=top_n), data, open_all),
|
|
# --- New strategies ---
|
|
"Mean Reversion": (MeanReversionStrategy(top_n=top_n), data[tickers], open_tickers),
|
|
"Trend Following": (TrendFollowingStrategy(ma_window=150, momentum_period=126, top_n=top_n), data[tickers], open_tickers),
|
|
"Dual Momentum": (DualMomentumStrategy(top_n=top_n), data[tickers], open_tickers),
|
|
"Momentum+Quality": (MomentumQualityStrategy(momentum_period=252, skip=21, top_n=top_n), data[tickers], open_tickers),
|
|
"Mom+InvVol": (AdaptiveMomentumStrategy(top_n=top_n), data[tickers], open_tickers),
|
|
"Recovery+Mom Top20": (RecoveryMomentumStrategy(top_n=min(20, top_n)), data[tickers], open_tickers),
|
|
"Recovery+Mom Top10": (RecoveryMomentumStrategy(top_n=10), data[tickers], open_tickers),
|
|
}
|
|
|
|
results: dict[str, pd.Series] = {}
|
|
for name, (strategy, strat_data, strat_open) in strategies.items():
|
|
print(f"\nRunning: {name}")
|
|
results[name] = backtest(strategy, strat_data, initial_capital=initial_capital,
|
|
fixed_fee=args.fixed_fee, open_data=strat_open)
|
|
|
|
# Add benchmark (normalized to same initial capital)
|
|
bench = data[benchmark].dropna()
|
|
results[benchmark_label] = (bench / bench.iloc[0]) * initial_capital
|
|
|
|
results_df = pd.DataFrame(results)
|
|
|
|
# --- Performance metrics ---
|
|
for name, equity in results_df.items():
|
|
eq = equity.dropna()
|
|
if len(eq) < 2:
|
|
print(f"\n {name}: insufficient data, skipping")
|
|
continue
|
|
metrics.summary(eq, name=name)
|
|
|
|
if args.attribution:
|
|
summary_df, loadings_df = factor_attribution.attribute_strategies(
|
|
results_df=results_df,
|
|
benchmark_label=benchmark_label,
|
|
benchmark=benchmark,
|
|
price_data=data,
|
|
market=args.market,
|
|
model_selection=args.attribution_model,
|
|
)
|
|
factor_attribution.print_attribution_summary(summary_df)
|
|
if args.attribution_export:
|
|
factor_attribution.export_attribution(summary_df, loadings_df, args.attribution_export)
|
|
print(f"Attribution CSVs written to {args.attribution_export}")
|
|
|
|
# --- Visualization ---
|
|
if not args.no_plot:
|
|
plot_results(results_df.dropna())
|
|
|
|
|
|
if __name__ == "__main__":
|
|
main()
|