theonegareth
/

GoldPricePredictor

+"""
+Inference script for Gold Price Direction Predictor
+This script demonstrates how to load the model and make predictions.
+"""
+import pandas as pd
+import numpy as np
+from joblib import load
+from huggingface_hub import hf_hub_download
+import warnings
+warnings.filterwarnings("ignore")
+def load_model():
+    """Load the trained model from Hugging Face"""
+    try:
+        model_path = hf_hub_download("theonegareth/GoldPricePredictor", "gold_direction_model.joblib")
+        model = load(model_path)
+        print("Model loaded successfully!")
+        return model
+    except Exception as e:
+        print(f"Error loading model: {e}")
+        return None
+def add_features_adaptive(data: pd.DataFrame, price='close') -> pd.DataFrame:
+    """
+    Feature engineering function (same as used in training)
+    """
+    out = data.copy()
+    n = len(out)
+    if n < 8:
+        raise ValueError(f"Dataset too small (n={n}). Need at least 8 rows.")
+    out['ret'] = out[price].pct_change()
+    out['log_ret'] = np.log1p(out['ret'])
+    # Adaptive lags and windows
+    max_lag = max(1, min(5, n // 6))
+    lag_list = list(range(1, max_lag + 1))
+    win_candidates = [3, 5, 10, 20]
+    win_list = [w for w in win_candidates if w < n-2]
+    if not win_list:
+        win_list = [3]
+    for L in lag_list:
+        out[f'ret_lag_{L}'] = out['ret'].shift(L)
+    for w in win_list:
+        out[f'roll_mean_{w}'] = out['ret'].rolling(w, min_periods=1).mean()
+        out[f'roll_std_{w}'] = out['ret'].rolling(w, min_periods=1).std()
+        out[f'roll_min_{w}'] = out['ret'].rolling(w, min_periods=1).min()
+        out[f'roll_max_{w}'] = out['ret'].rolling(w, min_periods=1).max()
+    # RSI
+    rsi_w = max(3, min(14, n // 6))
+    delta = out[price].diff()
+    gain = (delta.where(delta > 0, 0.0)).rolling(rsi_w, min_periods=1).mean()
+    loss = (-delta.where(delta < 0, 0.0)).rolling(rsi_w, min_periods=1).mean()
+    rs = gain / (loss + 1e-9)
+    out['rsi14'] = 100 - (100 / (1 + rs))
+    # MACD
+    fast = max(6, min(12, n // 5))
+    slow = max(fast+4, min(26, n // 3))
+    signal = max(5, min(9, n // 6))
+    ema_fast = out[price].ewm(span=fast, adjust=False).mean()
+    ema_slow = out[price].ewm(span=slow, adjust=False).mean()
+    out['macd'] = ema_fast - ema_slow
+    out['macd_signal'] = out['macd'].ewm(span=signal, adjust=False).mean()
+    out['macd_hist'] = out['macd'] - out['macd_signal']
+    # Bollinger
+    bb_w = max(5, min(20, n // 4))
+    ma = out[price].rolling(bb_w, min_periods=1).mean()
+    sd = out[price].rolling(bb_w, min_periods=1).std()
+    out['bb_mid'] = ma
+    out['bb_up'] = ma + 2*sd
+    out['bb_low'] = ma - 2*sd
+    out['bb_width'] = (out['bb_up'] - out['bb_low']) / (out['bb_mid'] + 1e-9)
+    # Calendar
+    out['dow'] = out['date'].dt.weekday
+    out['month'] = out['date'].dt.month
+    return out
+def predict_next_day_direction(model, historical_data: pd.DataFrame, threshold=0.52):
+    """
+    Predict next-day direction from historical price data
+    Parameters:
+    - model: Loaded sklearn model
+    - historical_data: DataFrame with 'date' and 'close' columns
+    - threshold: Probability threshold for prediction (optimized from training)
+    Returns:
+    - prediction: 1 for up, 0 for down
+    - probability: Probability of going up
+    """
+    # Ensure data is sorted
+    historical_data = historical_data.sort_values('date').reset_index(drop=True)
+    # Add features
+    feat = add_features_adaptive(historical_data, price='close')
+    # Drop rows with NaN (lags, etc.)
+    feat = feat.dropna(subset=[c for c in feat.columns if c.startswith('ret_lag_')])
+    if len(feat) == 0:
+        raise ValueError("Not enough data to compute features")
+    # Get latest features
+    latest_features = feat.iloc[[-1]]
+    # Select feature columns (exclude non-feature columns)
+    feature_cols = [c for c in latest_features.columns
+                   if c not in ['date','close','ret','log_ret','next_close','target']
+                   and not c.startswith('roll_') or c in ['roll_mean_3','roll_std_3','roll_min_3','roll_max_3',
+                                                        'roll_mean_5','roll_std_5','roll_min_5','roll_max_5']]
+    # Ensure we have the right columns (this might need adjustment based on training)
+    X = latest_features[feature_cols]
+    # Predict
+    proba_up = model.predict_proba(X)[:, 1][0]
+    prediction = int(proba_up >= threshold)
+    direction = "UP 📈" if prediction == 1 else "DOWN 📉"
+    return prediction, proba_up, direction
+if __name__ == "__main__":
+    # Example usage
+    model = load_model()
+    if model is None:
+        print("Failed to load model")
+        exit(1)
+    # Example historical data (replace with your data)
+    example_data = pd.DataFrame({
+        'date': pd.date_range('2023-01-01', periods=50, freq='D'),
+        'close': np.random.uniform(1000000, 1200000, 50)  # Random prices
+    })
+    try:
+        pred, proba, direction = predict_next_day_direction(model, example_data)
+        print(f"Next-day prediction: {direction}")
+        print(".3f")
+        print(f"Decision threshold: 0.52")
+    except Exception as e:
+        print(f"Error making prediction: {e}")