import numpy as np
import pandas as pd
import yfinance as yf
import matplotlib.pyplot as plt
import seaborn as sns

from statsmodels.graphics.tsaplots import plot_acf
from scipy import stats
from sklearn.preprocessing import StandardScaler
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, LSTM, Conv2D, MaxPooling2D, Flatten
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from sklearn.metrics import mean_squared_error, r2_score

#step 1

np.random.seed(42)
sns.set_style("whitegrid")
plt.rcParams["figure.figsize"] = (14, 5)

# ---------------------------------------------------------
# PART (a): DATA ACQUISITION & DESCRIPTION
# ---------------------------------------------------------

ticker = "BTC-USD"
start_date = "2022-01-01"
end_date = "2025-12-01"

data = yf.download(
    ticker,
    start=start_date,
    end=end_date,
    auto_adjust=True,
    progress=False
)

prices = data["Close"].squeeze().dropna()
print(f"{ticker}: {len(prices)} daily observations")

plt.plot(prices, color="navy", linewidth=1.5)
plt.title("Figure 1: Bitcoin Daily Prices (USD)", fontweight="bold")
plt.ylabel("Price")
plt.xlabel("Date")
plt.tight_layout()
plt.show()

plot_acf(prices, lags=30)
plt.title("Figure 2: ACF of Bitcoin Returns")
plt.tight_layout()
plt.show()


print("\nTable 1. Statistical Summary – Price Levels")
print("-" * 50)
print(f"Mean:     {prices.mean():.2f}")
print(f"Std Dev:  {prices.std():.2f}")
print(f"Skewness: {stats.skew(prices):.2f}")
print(f"Kurtosis: {stats.kurtosis(prices):.2f}")

log_returns = np.log(prices / prices.shift(1)).dropna()

plt.plot(log_returns, color="orange", linewidth=1)
plt.title("Figure 3: Bitcoin Daily Log Returns", fontweight="bold")
plt.ylabel("Log Return")
plt.tight_layout()
plt.show()

plot_acf(log_returns, lags=30)
plt.title("Figure 4: ACF of Bitcoin Log Returns")
plt.tight_layout()
plt.show()


print("\nTable 2. Statistical Summary – Log Returns")
print("-" * 50)
print(f"Mean:     {log_returns.mean():.5f}")
print(f"Std Dev:  {log_returns.std():.5f}")
print(f"Skewness: {stats.skew(log_returns):.2f}")
print(f"Kurtosis: {stats.kurtosis(log_returns):.2f}")

BTC-USD: 1430 daily observations

Table 1. Statistical Summary – Price Levels
--------------------------------------------------
Mean:     55462.46
Std Dev:  32323.60
Skewness: 0.57
Kurtosis: -1.07

Table 2. Statistical Summary – Log Returns
--------------------------------------------------
Mean:     0.00045
Std Dev:  0.02711
Skewness: -0.16
Kurtosis: 4.45

#Part B-- Converting data to Leaky Data

#Build Leaky Label
HORIZON = 5  # 5-day forward average return

y = (
    log_returns
    .shift(-1)
    .rolling(window=HORIZON)
    .mean()
)

#Build lagged feature
N_LAGS = 20

X = pd.concat(
    [log_returns.shift(i) for i in range(N_LAGS)],
    axis=1
)

X.columns = [f"lag_{i}" for i in range(N_LAGS)]

data = pd.concat([X, y.rename("target")], axis=1).dropna()

X = data.drop(columns="target")
y = data["target"]

scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)   # <-- INFORMATION LEAKAGE

#Train Test Split
split = int(0.7 * len(X_scaled))

X_train = X_scaled[:split]
X_test  = X_scaled[split:]

y_train = y.values[:split]
y_test  = y.values[split:]

#Data Summary
print("Dataset Summary")
print("-" * 40)
print("Total observations:", len(X_scaled))
print("Train size:", len(X_train))
print("Test size:", len(X_test))

Dataset Summary
----------------------------------------
Total observations: 1409
Train size: 986
Test size: 423

#Part C-- Building model and prediction

#MLP
def build_mlp(input_dim):
    model = Sequential([
        Dense(128, activation="relu", input_shape=(input_dim,)),
        Dense(64, activation="relu"),
        Dense(1)
    ])
    model.compile(optimizer=Adam(0.001), loss="mse")
    return model

#LSTM
def build_lstm(timesteps):
    model = Sequential([
        LSTM(64, input_shape=(timesteps, 1)),
        Dense(32, activation="relu"),
        Dense(1)
    ])
    model.compile(optimizer=Adam(0.001), loss="mse")
    return model

#CNN with GAF
def gramian_angular_field(ts):
    ts = (ts - ts.min()) / (ts.max() - ts.min())
    ts = np.clip(ts, 0, 1)
    phi = np.arccos(ts)
    return np.cos(phi[:, None] + phi[None, :])

def build_gaf_images(X):
    images = [gramian_angular_field(row) for row in X]
    return np.array(images)[..., np.newaxis]

def build_cnn_gaf(input_shape):
    model = Sequential([
        Conv2D(32, (3,3), activation="relu", input_shape=input_shape),
        MaxPooling2D((2,2)),
        Conv2D(64, (3,3), activation="relu"),
        Flatten(),
        Dense(64, activation="relu"),
        Dense(1)
    ])
    model.compile(optimizer=Adam(0.001), loss="mse")
    return model

# LSTM reshaping
X_train_lstm = X_train.reshape(X_train.shape[0], X_train.shape[1], 1)
X_test_lstm  = X_test.reshape(X_test.shape[0],  X_test.shape[1],  1)

# CNN-GAF transformation
X_train_gaf = build_gaf_images(X_train)
X_test_gaf  = build_gaf_images(X_test)

es = EarlyStopping(patience=10, restore_best_weights=True)

# Initialize models
mlp  = build_mlp(X_train.shape[1])
lstm = build_lstm(X_train_lstm.shape[1])
cnn  = build_cnn_gaf(X_train_gaf.shape[1:])

# Train
history_mlp = mlp.fit(
    X_train, y_train,
    validation_split=0.2,
    epochs=100,
    batch_size=32,
    callbacks=[es],
    verbose=0
)

history_lstm = lstm.fit(
    X_train_lstm, y_train,
    validation_split=0.2,
    epochs=100,
    batch_size=32,
    callbacks=[es],
    verbose=0
)

history_cnn = cnn.fit(
    X_train_gaf, y_train,
    validation_split=0.2,
    epochs=50,
    batch_size=32,
    callbacks=[es],
    verbose=0
)

y_pred_mlp  = mlp.predict(X_test).flatten()
y_pred_lstm = lstm.predict(X_test_lstm).flatten()
y_pred_cnn  = cnn.predict(X_test_gaf).flatten()

/usr/local/lib/python3.12/dist-packages/keras/src/layers/core/dense.py:93: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)

14/14 ━━━━━━━━━━━━━━━━━━━━ 0s 5ms/step 
14/14 ━━━━━━━━━━━━━━━━━━━━ 0s 18ms/step
14/14 ━━━━━━━━━━━━━━━━━━━━ 0s 15ms/step

def report(name, y_true, y_pred):
    rmse = np.sqrt(mean_squared_error(y_true, y_pred))
    r2 = r2_score(y_true, y_pred)
    print(f"{name:<8} | RMSE: {rmse:.6f} | R²: {r2:.4f}")

print("\nPART (c): Prediction Performance (Leaky Setup)")
print("-" * 50)
report("MLP", y_test, y_pred_mlp)
report("LSTM", y_test, y_pred_lstm)
report("CNN-GAF", y_test, y_pred_cnn)

PART (c): Prediction Performance (Leaky Setup)
--------------------------------------------------
MLP      | RMSE: 0.049557 | R²: -23.9211
LSTM     | RMSE: 0.006783 | R²: 0.5331
CNN-GAF  | RMSE: 0.008722 | R²: 0.2281

results = [
    {
        "Model": "MLP",
        "y_true": y_test,
        "y_pred": y_pred_mlp,
        "hist": history_mlp.history,
        "r2": r2_score(y_test, y_pred_mlp)
    },
    {
        "Model": "LSTM",
        "y_true": y_test,
        "y_pred": y_pred_lstm,
        "hist": history_lstm.history,
        "r2": r2_score(y_test, y_pred_lstm)
    },
    {
        "Model": "CNN-GAF",
        "y_true": y_test,
        "y_pred": y_pred_cnn,
        "hist": history_cnn.history,
        "r2": r2_score(y_test, y_pred_cnn)
    }
]


for res in results:
    fig, axes = plt.subplots(1, 3, figsize=(24, 6))

    # --------------------------------------------------
    # Plot 1: Observed vs Predicted (Time Series)
    # --------------------------------------------------
    ax1 = axes[0]
    zoom = 200

    y_true = res["y_true"][-zoom:]
    y_pred = res["y_pred"][-zoom:]
    idx = np.arange(len(y_true))

    ax1.plot(
        idx, y_true,
        color="black", linewidth=2.0,
        label="Observed"
    )
    ax1.plot(
        idx, y_pred,
        color="crimson", linestyle="--", linewidth=2.0,
        label="Predicted"
    )

    ax1.set_title(
        f"{res['Model']} — Observed vs Predicted Forward Returns",
        fontsize=14, fontweight="bold"
    )
    ax1.set_xlabel("Test Time Index")
    ax1.set_ylabel("5-Day Forward Return")
    ax1.legend()
    ax1.grid(True, alpha=0.3)

    # --------------------------------------------------
    # Plot 2: Training & Validation Loss (Convergence)
    # --------------------------------------------------
    ax2 = axes[1]
    hist = res["hist"]

    ax2.plot(
        hist["loss"],
        color="steelblue", linewidth=2.0,
        label="Training Loss"
    )
    ax2.plot(
        hist["val_loss"],
        color="darkorange", linewidth=2.0,
        linestyle=":",
        label="Validation Loss"
    )

    ax2.set_title(
        "Training Convergence (MSE Loss)",
        fontsize=14, fontweight="bold"
    )
    ax2.set_xlabel("Epochs")
    ax2.set_ylabel("Loss")
    ax2.legend()
    ax2.grid(True, linestyle="--", alpha=0.4)

    # --------------------------------------------------
    # Plot 3: Actual vs Predicted (Scatter)
    # --------------------------------------------------
    ax3 = axes[2]

    ax3.scatter(
        res["y_true"],
        res["y_pred"],
        alpha=0.5,
        color="cyan",
        edgecolors="black"
    )

    min_val = min(res["y_true"].min(), res["y_pred"].min())
    max_val = max(res["y_true"].max(), res["y_pred"].max())
    ax3.plot(
        [min_val, max_val],
        [min_val, max_val],
        "k--", lw=2,
        label="Perfect Fit"
    )

    ax3.set_title(
        f"Prediction Accuracy (R² = {res['r2']:.4f})",
        fontsize=14, fontweight="bold"
    )
    ax3.set_xlabel("Observed Returns")
    ax3.set_ylabel("Predicted Returns")
    ax3.legend()
    ax3.grid(True, alpha=0.3)

    plt.tight_layout()
    plt.show()

#Part D
def backtest_strategy(y_true, y_pred, model_name):
    """
    Long–Short and Long-Only backtest for regression-based signals
    """

    df = pd.DataFrame({
        "Ret": y_true,
        "Pred": y_pred
    }).dropna()

    # --------------------------------------------------
    # Trading Signals (Regression-Based)
    # --------------------------------------------------
    df["Position"] = np.where(df["Pred"] > 0, 1, -1)

    # Shift positions to avoid look-ahead bias
    df["Position_shift"] = df["Position"].shift(1)

    # Long–Short strategy
    df["Strat_ret"] = df["Position_shift"] * df["Ret"]

    # Long-Only strategy
    df["Position_L"] = df["Position_shift"].clip(lower=0)
    df["Strat_ret_L"] = df["Position_L"] * df["Ret"]

    # --------------------------------------------------
    # Cumulative Returns
    # --------------------------------------------------
    df["Cum_LS"] = (1 + df["Strat_ret"]).cumprod() - 1
    df["Cum_L"] = (1 + df["Strat_ret_L"]).cumprod() - 1
    df["Cum_BH"] = (1 + df["Ret"]).cumprod() - 1

    # --------------------------------------------------
    # Performance Metrics
    # --------------------------------------------------
    results = {
        "Model": model_name,
        "Final_Return_LS": (1 + df["Strat_ret"]).prod() - 1,
        "Final_Return_L": (1 + df["Strat_ret_L"]).prod() - 1,
        "Final_Return_BH": (1 + df["Ret"]).prod() - 1,
        "Sharpe_LS": np.mean(df["Strat_ret"]) / np.std(df["Strat_ret"]) * np.sqrt(252),
        "Sharpe_L": np.mean(df["Strat_ret_L"]) / np.std(df["Strat_ret_L"]) * np.sqrt(252),
        "Data": df
    }

    return results

bt_mlp  = backtest_strategy(y_test, y_pred_mlp,  "MLP")
bt_lstm = backtest_strategy(y_test, y_pred_lstm, "LSTM")
bt_cnn  = backtest_strategy(y_test, y_pred_cnn,  "CNN-GAF")

backtests = [bt_mlp, bt_lstm, bt_cnn]

summary_df = pd.DataFrame([
    {
        "Model": bt["Model"],
        "Long–Short Return (%)": bt["Final_Return_LS"] * 100,
        "Long-Only Return (%)": bt["Final_Return_L"] * 100,
        "Buy & Hold Return (%)": bt["Final_Return_BH"] * 100,
        "Sharpe (LS)": bt["Sharpe_LS"],
        "Sharpe (L)": bt["Sharpe_L"]
    }
    for bt in backtests
])

print("\nPART (d): BACKTEST PERFORMANCE SUMMARY")
print("-" * 60)
print(summary_df.round(3).to_string(index=False))
print("-" * 60)

plt.figure(figsize=(14, 6))

for bt in backtests:
    plt.plot(bt["Data"]["Cum_LS"], label=f"{bt['Model']} (Long–Short)")

plt.plot(backtests[0]["Data"]["Cum_BH"],
         color="black", linestyle="--", linewidth=2,
         label="Buy & Hold")

plt.title("Figure 5: Equity Curves — Long–Short Strategies",
          fontsize=14, fontweight="bold")
plt.ylabel("Cumulative Return")
plt.xlabel("Test Time Index")
plt.legend()
plt.grid(alpha=0.3)
plt.tight_layout()
plt.show()

plt.figure(figsize=(14, 6))

for bt in backtests:
    plt.plot(bt["Data"]["Cum_L"], label=f"{bt['Model']} (Long-Only)")

plt.plot(backtests[0]["Data"]["Cum_BH"],
         color="black", linestyle="--", linewidth=2,
         label="Buy & Hold")

plt.title("Figure 6: Equity Curves — Long-Only Strategies",
          fontsize=14, fontweight="bold")
plt.ylabel("Cumulative Return")
plt.xlabel("Test Time Index")
plt.legend()
plt.grid(alpha=0.3)
plt.tight_layout()
plt.show()

PART (d): BACKTEST PERFORMANCE SUMMARY
------------------------------------------------------------
  Model  Long–Short Return (%)  Long-Only Return (%)  Buy & Hold Return (%)  Sharpe (LS)  Sharpe (L)
    MLP                 53.445                50.582                 42.923        1.705       2.328
   LSTM                581.519               216.856                 42.923        8.255       6.418
CNN-GAF                524.726               202.990                 42.923        7.793       5.790
------------------------------------------------------------

# STEP 2:
def build_lstm(timesteps):
    model = Sequential([
        LSTM(64, input_shape=(timesteps, 1)),
        Dense(32, activation='relu'),
        Dense(1)
    ])
    model.compile(optimizer=Adam(0.001), loss='mse')
    return model

def build_cnn_gaf(input_shape):
    model = Sequential([
        Conv2D(32, (3,3), activation='relu', input_shape=input_shape),
        MaxPooling2D((2,2)),
        Conv2D(64, (3,3), activation='relu'),
        Flatten(),
        Dense(64, activation='relu'),
        Dense(1)
    ])
    model.compile(optimizer=Adam(0.001), loss='mse')
    return model

def gramian_angular_field(ts):
    ts = (ts - ts.min()) / (ts.max() - ts.min())
    ts = np.clip(ts, 0, 1)
    phi = np.arccos(ts)
    return np.cos(phi[:, None] + phi[None, :])

def build_gaf_images(X):
    images = [gramian_angular_field(row) for row in X]
    return np.array(images)[..., np.newaxis]

# Walk-forward backtest function
def walk_forward_backtest(X, y, train_len, test_len, model_type='lstm'):
    """
    Non-anchored walk-forward backtest.
    X, y: full dataset (scaled features and target)
    train_len: length of training window
    test_len: length of testing window
    model_type: 'lstm' or 'cnn_gaf'
    """
    n = len(X)
    preds = []
    actuals = []

    for start in range(0, n - train_len - test_len + 1, test_len):
        train_end = start + train_len
        test_end = train_end + test_len

        X_train = X[start:train_end]
        y_train = y[start:train_end]
        X_test = X[train_end:test_end]
        y_test = y[train_end:test_end]

        if model_type == 'lstm':
            X_train_rs = X_train.reshape(X_train.shape[0], X_train.shape[1], 1)
            X_test_rs = X_test.reshape(X_test.shape[0], X_test.shape[1], 1)
            model = build_lstm(X_train_rs.shape[1])
            model.fit(X_train_rs, y_train, epochs=30, batch_size=32, verbose=0)
            y_pred = model.predict(X_test_rs, verbose=0).flatten()

        elif model_type == 'cnn_gaf':
            X_train_rs = build_gaf_images(X_train)
            X_test_rs = build_gaf_images(X_test)
            model = build_cnn_gaf(X_train_rs.shape[1:])
            model.fit(X_train_rs, y_train, epochs=30, batch_size=32, verbose=0)
            y_pred = model.predict(X_test_rs, verbose=0).flatten()

        preds.extend(y_pred)
        actuals.extend(y_test)

    return np.array(actuals), np.array(preds)

# Prepare data (same as Step 1)
N_LAGS = 20
HORIZON = 5

log_returns = np.log(prices / prices.shift(1)).dropna()
y = log_returns.shift(-HORIZON).rolling(HORIZON).mean().dropna()
X = pd.concat([log_returns.shift(i) for i in range(N_LAGS)], axis=1).dropna()
X.columns = [f'lag_{i}' for i in range(N_LAGS)]
df = pd.concat([X, y.rename('target')], axis=1).dropna()
X = df.drop(columns='target')
y = df['target'].values

# Scale features (WITH leakage, as per Step 1 setup)
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)

# Step 2a: Walk-forward with train=500, test=500
print("="*60)
print("STEP 2a: Walk-forward (train=500, test=500)")
print("="*60)

actuals_2a_lstm, preds_2a_lstm = walk_forward_backtest(X_scaled, y, train_len=500, test_len=500, model_type='lstm')
actuals_2a_cnn, preds_2a_cnn = walk_forward_backtest(X_scaled, y, train_len=500, test_len=500, model_type='cnn_gaf')

# Step 2b: Walk-forward with train=500, test=100
print("\n" + "="*60)
print("STEP 2b: Walk-forward (train=500, test=100)")
print("="*60)

actuals_2b_lstm, preds_2b_lstm = walk_forward_backtest(X_scaled, y, train_len=500, test_len=100, model_type='lstm')
actuals_2b_cnn, preds_2b_cnn = walk_forward_backtest(X_scaled, y, train_len=500, test_len=100, model_type='cnn_gaf')

# Performance metrics function
def evaluate_performance(actuals, preds, model_name, step_label):
    rmse = np.sqrt(np.mean((actuals - preds)**2))
    r2 = 1 - np.sum((actuals - preds)**2) / np.sum((actuals - np.mean(actuals))**2)
    print(f"{model_name} ({step_label}): RMSE = {rmse:.6f}, R² = {r2:.4f}")
    return rmse, r2

print("\nPerformance Summary:")
print("-"*50)
rmse_2a_lstm, r2_2a_lstm = evaluate_performance(actuals_2a_lstm, preds_2a_lstm, "LSTM", "2a")
rmse_2a_cnn, r2_2a_cnn = evaluate_performance(actuals_2a_cnn, preds_2a_cnn, "CNN-GAF", "2a")
rmse_2b_lstm, r2_2b_lstm = evaluate_performance(actuals_2b_lstm, preds_2b_lstm, "LSTM", "2b")
rmse_2b_cnn, r2_2b_cnn = evaluate_performance(actuals_2b_cnn, preds_2b_cnn, "CNN-GAF", "2b")

# Backtest strategy function (reuse from Step 1)
def backtest_strategy(y_true, y_pred, model_name):
    df = pd.DataFrame({'Ret': y_true, 'Pred': y_pred})
    df['Position'] = np.where(df['Pred'] > 0, 1, -1)
    df['Position_shift'] = df['Position'].shift(1)
    df['Strat_ret'] = df['Position_shift'] * df['Ret']
    df['Cum_LS'] = (1 + df['Strat_ret']).cumprod() - 1
    sharpe = np.mean(df['Strat_ret']) / np.std(df['Strat_ret']) * np.sqrt(252) if np.std(df['Strat_ret']) > 0 else 0
    final_return = (1 + df['Strat_ret']).prod() - 1
    return {
        'Model': model_name,
        'Final_Return': final_return,
        'Sharpe': sharpe,
        'Data': df
    }

# Run backtests for Step 2 results
bt_2a_lstm = backtest_strategy(actuals_2a_lstm, preds_2a_lstm, "LSTM (2a)")
bt_2a_cnn = backtest_strategy(actuals_2a_cnn, preds_2a_cnn, "CNN-GAF (2a)")
bt_2b_lstm = backtest_strategy(actuals_2b_lstm, preds_2b_lstm, "LSTM (2b)")
bt_2b_cnn = backtest_strategy(actuals_2b_cnn, preds_2b_cnn, "CNN-GAF (2b)")

# Plot equity curves
fig, axes = plt.subplots(2, 2, figsize=(14, 10))

for idx, (bt, title) in enumerate([(bt_2a_lstm, "LSTM 2a"), (bt_2a_cnn, "CNN-GAF 2a"),
                                    (bt_2b_lstm, "LSTM 2b"), (bt_2b_cnn, "CNN-GAF 2b")]):
    ax = axes[idx//2, idx%2]
    ax.plot(bt['Data']['Cum_LS'], label='Long-Short')
    ax.set_title(f"{title} - Equity Curve", fontweight='bold')
    ax.set_ylabel("Cumulative Return")
    ax.set_xlabel("Step")
    ax.legend()
    ax.grid(alpha=0.3)

plt.tight_layout()
plt.show()

# Summary table
summary = pd.DataFrame([
    {'Model': 'LSTM', 'Step': '2a', 'RMSE': rmse_2a_lstm, 'R2': r2_2a_lstm, 'Sharpe': bt_2a_lstm['Sharpe'], 'Final_Return': bt_2a_lstm['Final_Return']},
    {'Model': 'CNN-GAF', 'Step': '2a', 'RMSE': rmse_2a_cnn, 'R2': r2_2a_cnn, 'Sharpe': bt_2a_cnn['Sharpe'], 'Final_Return': bt_2a_cnn['Final_Return']},
    {'Model': 'LSTM', 'Step': '2b', 'RMSE': rmse_2b_lstm, 'R2': r2_2b_lstm, 'Sharpe': bt_2b_lstm['Sharpe'], 'Final_Return': bt_2b_lstm['Final_Return']},
    {'Model': 'CNN-GAF', 'Step': '2b', 'RMSE': rmse_2b_cnn, 'R2': r2_2b_cnn, 'Sharpe': bt_2b_cnn['Sharpe'], 'Final_Return': bt_2b_cnn['Final_Return']}
])

print("\n" + "="*60)
print("STEP 2 - PERFORMANCE SUMMARY TABLE")
print("="*60)
print(summary.round(4).to_string(index=False))

============================================================
STEP 2a: Walk-forward (train=500, test=500)
============================================================

/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)

============================================================
STEP 2b: Walk-forward (train=500, test=100)
============================================================

WARNING:tensorflow:5 out of the last 21 calls to <function TensorFlowTrainer.make_predict_function.<locals>.one_step_on_data_distributed at 0x7c53f2210220> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.
WARNING:tensorflow:6 out of the last 24 calls to <function TensorFlowTrainer.make_predict_function.<locals>.one_step_on_data_distributed at 0x7c53f2210220> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.

Performance Summary:
--------------------------------------------------
LSTM (2a): RMSE = 0.012118, R² = -0.2133
CNN-GAF (2a): RMSE = 0.014764, R² = -0.8010
LSTM (2b): RMSE = 0.012087, R² = -0.3099
CNN-GAF (2b): RMSE = 0.012618, R² = -0.4274

============================================================
STEP 2 - PERFORMANCE SUMMARY TABLE
============================================================
  Model Step   RMSE      R2  Sharpe  Final_Return
   LSTM   2a 0.0121 -0.2133 -0.7227       -0.2478
CNN-GAF   2a 0.0148 -0.8010 -0.2058       -0.0983
   LSTM   2b 0.0121 -0.3099 -0.3868       -0.2473
CNN-GAF   2b 0.0126 -0.4274  0.1422        0.0354

# Step 3

log_returns = np.log(prices / prices.shift(1)).dropna()
y_raw = log_returns.shift(-HORIZON).rolling(HORIZON).mean().dropna()
X_raw = pd.concat([log_returns.shift(i) for i in range(N_LAGS)], axis=1).dropna()
X_raw.columns = [f'lag_{i}' for i in range(N_LAGS)]

df_clean = pd.concat([X_raw, y_raw.rename('target')], axis=1).dropna()
X_clean = df_clean.drop(columns='target').values
y_clean = df_clean['target'].values

print(f"Data reset for Step 3. Shape: {X_clean.shape}")

# Modified Walk-Forward Function to Return History

def walk_forward_no_leakage_with_history(X, y, train_len, test_len, model_type='lstm'):
    """
    Performs non-anchored walk-forward backtest.
    Returns: actuals, predictions, and the history of the LAST training fold.
    """
    n = len(X)
    preds = []
    actuals = []
    last_history = None

    for start in range(0, n - train_len - test_len + 1, test_len):
        train_end = start + train_len
        test_end = train_end + test_len

        # 1. Slice Raw Data
        X_train_raw = X[start:train_end]
        y_train = y[start:train_end]
        X_test_raw = X[train_end:test_end]
        y_test = y[train_end:test_end]

        # Dynamic Normalization (No Leakage)
        local_scaler = StandardScaler()
        X_train_scaled = local_scaler.fit_transform(X_train_raw)
        X_test_scaled = local_scaler.transform(X_test_raw)

        # Model Training
        if model_type == 'lstm':
            X_train_rs = X_train_scaled.reshape(X_train_scaled.shape[0], X_train_scaled.shape[1], 1)
            X_test_rs = X_test_scaled.reshape(X_test_scaled.shape[0], X_test_scaled.shape[1], 1)

            # Re-build model to ensure clean slate
            model = build_lstm(X_train_rs.shape[1])
            # Capture history
            history = model.fit(
                X_train_rs, y_train,
                validation_split=0.2,
                epochs=30,
                batch_size=32,
                verbose=0
            )
            y_pred = model.predict(X_test_rs, verbose=0).flatten()

        elif model_type == 'cnn_gaf':
            X_train_rs = build_gaf_images(X_train_scaled)
            X_test_rs = build_gaf_images(X_test_scaled)

            model = build_cnn_gaf(X_train_rs.shape[1:])
            history = model.fit(
                X_train_rs, y_train,
                validation_split=0.2,
                epochs=30,
                batch_size=32,
                verbose=0
            )
            y_pred = model.predict(X_test_rs, verbose=0).flatten()

        preds.extend(y_pred)
        actuals.extend(y_test)
        last_history = history # Save last history for plotting

    return np.array(actuals), np.array(preds), last_history


# Run Backtests (Step 3b and 3c)

print("Running Step 3b (500/500)...")
y_3b_lstm, p_3b_lstm, h_3b_lstm = walk_forward_no_leakage_with_history(X_clean, y_clean, 500, 500, 'lstm')
y_3b_cnn,  p_3b_cnn,  h_3b_cnn  = walk_forward_no_leakage_with_history(X_clean, y_clean, 500, 500, 'cnn_gaf')

print("Running Step 3c (500/100)...")
y_3c_lstm, p_3c_lstm, h_3c_lstm = walk_forward_no_leakage_with_history(X_clean, y_clean, 500, 100, 'lstm')
y_3c_cnn,  p_3c_cnn,  h_3c_cnn  = walk_forward_no_leakage_with_history(X_clean, y_clean, 500, 100, 'cnn_gaf')

#
results_step3_plots = [
    {
        "Model": "LSTM (Step 3b: 500/500)",
        "y_true": y_3b_lstm,
        "y_pred": p_3b_lstm,
        "hist": h_3b_lstm.history,
        "r2": r2_score(y_3b_lstm, p_3b_lstm)
    },
    {
        "Model": "CNN-GAF (Step 3b: 500/500)",
        "y_true": y_3b_cnn,
        "y_pred": p_3b_cnn,
        "hist": h_3b_cnn.history,
        "r2": r2_score(y_3b_cnn, p_3b_cnn)
    },
    {
        "Model": "LSTM (Step 3c: 500/100)",
        "y_true": y_3c_lstm,
        "y_pred": p_3c_lstm,
        "hist": h_3c_lstm.history,
        "r2": r2_score(y_3c_lstm, p_3c_lstm)
    },
    {
        "Model": "CNN-GAF (Step 3c: 500/100)",
        "y_true": y_3c_cnn,
        "y_pred": p_3c_cnn,
        "hist": h_3c_cnn.history,
        "r2": r2_score(y_3c_cnn, p_3c_cnn)
    }
]

print("\nGenerating Loss and Performance Plots for Step 3...")

for res in results_step3_plots:
    fig, axes = plt.subplots(1, 3, figsize=(24, 6))

    #
    ax1 = axes[0]
    zoom = 150

    y_true = res["y_true"][-zoom:]
    y_pred = res["y_pred"][-zoom:]
    idx = np.arange(len(y_true))

    ax1.plot(idx, y_true, color="black", linewidth=2.0, label="Observed")
    ax1.plot(idx, y_pred, color="crimson", linestyle="--", linewidth=2.0, label="Predicted")

    ax1.set_title(f"{res['Model']} — Last {zoom} Days", fontsize=14, fontweight="bold")
    ax1.set_xlabel("Test Time Index")
    ax1.set_ylabel("5-Day Forward Return")
    ax1.legend()
    ax1.grid(True, alpha=0.3)

    #
    ax2 = axes[1]
    hist = res["hist"]

    ax2.plot(hist["loss"], color="steelblue", linewidth=2.0, label="Training Loss")

    if "val_loss" in hist:
        ax2.plot(hist["val_loss"], color="darkorange", linewidth=2.0, linestyle=":", label="Validation Loss")

    ax2.set_title("Training Convergence (Last Fold)", fontsize=14, fontweight="bold")
    ax2.set_xlabel("Epochs")
    ax2.set_ylabel("MSE Loss")
    ax2.legend()
    ax2.grid(True, linestyle="--", alpha=0.4)

    #
    ax3 = axes[2]

    ax3.scatter(res["y_true"], res["y_pred"], alpha=0.5, color="cyan", edgecolors="black")

    min_val = min(res["y_true"].min(), res["y_pred"].min())
    max_val = max(res["y_true"].max(), res["y_pred"].max())
    ax3.plot([min_val, max_val], [min_val, max_val], "k--", lw=2, label="Perfect Fit")

    ax3.set_title(f"Prediction Accuracy (R² = {res['r2']:.4f})", fontsize=14, fontweight="bold")
    ax3.set_xlabel("Observed Returns")
    ax3.set_ylabel("Predicted Returns")
    ax3.legend()
    ax3.grid(True, alpha=0.3)

    plt.tight_layout()
    plt.show()

#
metrics_summary = []
for res in results_step3_plots:
    # Calculate simple Sharpe for the table
    df_temp = pd.DataFrame({'ret': res['y_true'], 'pred': res['y_pred']})
    df_temp['pos'] = np.where(df_temp['pred'] > 0, 1, -1)
    df_temp['strat'] = df_temp['pos'].shift(1) * df_temp['ret']
    sharpe = (df_temp['strat'].mean() / df_temp['strat'].std() * np.sqrt(252)) if df_temp['strat'].std() > 0 else 0

    metrics_summary.append({
        "Model": res['Model'],
        "RMSE": np.sqrt(mean_squared_error(res['y_true'], res['y_pred'])),
        "R2": res['r2'],
        "Sharpe": sharpe
    })

print("\nStep 3 Final Metrics Summary:")
print(pd.DataFrame(metrics_summary).round(4).to_string(index=False))

Data reset for Step 3. Shape: (1405, 20)
Running Step 3b (500/500)...

/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)

Running Step 3c (500/100)...

/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/rnn/rnn.py:199: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(**kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
/usr/local/lib/python3.12/dist-packages/keras/src/layers/convolutional/base_conv.py:113: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)

Generating Loss and Performance Plots for Step 3...

Step 3 Final Metrics Summary:
                     Model   RMSE      R2  Sharpe
   LSTM (Step 3b: 500/500) 0.0141 -0.6367 -3.4770
CNN-GAF (Step 3b: 500/500) 0.0143 -0.6817  0.6595
   LSTM (Step 3c: 500/100) 0.0125 -0.4024 -0.9971
CNN-GAF (Step 3c: 500/100) 0.0138 -0.7189 -0.2966

Introduction¶

Step 1¶

Step d¶

Summary for Part (c) and (d)¶

Step 2¶

Step 3¶

Step 3d¶

Conclusion¶

Reference¶