removed griffin-stuff

This commit is contained in:
klein panic
2025-01-29 19:24:55 -05:00
parent 5f8e3f4c68
commit c39d19a17a
28 changed files with 0 additions and 1935429 deletions

View File

@@ -1,246 +0,0 @@
import numpy as np
import pandas as pd
import yfinance as yf
from scipy.optimize import minimize

def ticker_info():
    ticker = "gush"
    return ticker.upper()

def fetch_expiration_dates(ticker):
    print(f"Fetching available expiration dates for {ticker}...")
    stock = yf.Ticker(ticker)
    expiration_dates = stock.options
    print(f"Available expiration dates: {expiration_dates}")
    return expiration_dates

def select_expiration_date(expiration_dates):
    print("Selecting the first available expiration date...")
    expiration_date = expiration_dates[0]
    print(f"Selected expiration date: {expiration_date}")
    return expiration_date

def fetch_option_chain(ticker, expiration_date):
    print(f"Fetching option chain for {ticker} with expiration date {expiration_date}...")
    stock = yf.Ticker(ticker)
    options_chain = stock.option_chain(expiration_date)
    print("Option chain fetched successfully!")
    return options_chain

def get_price_data(ticker, start_date, end_date):
    print(f"Fetching price data for {ticker} from {start_date} to {end_date}...")
    data = yf.download(ticker, start=start_date, end=end_date)
    print(f"Price data fetched successfully for {ticker}!")
    return data

def moving_average_strategy(data, short_window=20, long_window=50):
    data['Short_MA'] = data['Close'].rolling(window=short_window).mean()
    data['Long_MA'] = data['Close'].rolling(window=long_window).mean()
    data['Signal'] = np.where(data['Short_MA'] > data['Long_MA'], 1, -1)
    return data['Signal']

def rsi_strategy(data, window=14, overbought=70, oversold=30):
    delta = data['Close'].diff(1)
    gain = np.where(delta > 0, delta, 0).flatten()  # Flatten to 1D array
    loss = np.where(delta < 0, abs(delta), 0).flatten()  # Flatten to 1D array
    avg_gain = pd.Series(gain).rolling(window=window).mean()
    avg_loss = pd.Series(loss).rolling(window=window).mean()
    # Avoid division by zero by using np.where to replace 0 with np.nan in avg_loss
    rs = avg_gain / np.where(avg_loss == 0, np.nan, avg_loss)
    rsi = 100 - (100 / (1 + rs))
    signal = np.where(rsi < oversold, 1, np.where(rsi > overbought, -1, 0))
    return pd.Series(signal, index=data.index)

def bollinger_bands_strategy(data, window=20, num_std=2):
    # Calculate moving average
    data['Moving_Avg'] = data['Close'].rolling(window=window).mean()
    # Calculate rolling standard deviation and force it to be a Series
    rolling_std = data['Close'].rolling(window).std()
    rolling_std = rolling_std.squeeze()  # Ensure rolling_std is a Series
    # Print shapes for debugging
    print(f"Shape of Moving_Avg: {data['Moving_Avg'].shape}")
    print(f"Shape of Rolling Std: {rolling_std.shape}")
    # Calculate upper and lower bands
    data['Band_Upper'] = data['Moving_Avg'] + (num_std * rolling_std)
    data['Band_Lower'] = data['Moving_Avg'] - (num_std * rolling_std)
    # Print shapes after assignments for debugging
    print(f"Shape of Band_Upper: {data['Band_Upper'].shape}")
    print(f"Shape of Band_Lower: {data['Band_Lower'].shape}")
    # Check for NaN values
    print(f"NaNs in Close: {data['Close'].isna().sum()}")
    print(f"NaNs in Band_Upper: {data['Band_Upper'].isna().sum()}")
    print(f"NaNs in Band_Lower: {data['Band_Lower'].isna().sum()}")
    # Print the columns of the DataFrame
    print(f"Columns in data before dropping NaNs: {data.columns.tolist()}")
    # Optionally drop rows with NaNs
    data = data.dropna(subset=['Close', 'Band_Upper', 'Band_Lower'])
    # Generate signals based on the bands
    signal = np.where(data['Close'] < data['Band_Lower'], 1,
                      np.where(data['Close'] > data['Band_Upper'], -1, 0))
    return pd.Series(signal, index=data.index)

def generate_signals(data):
    ma_signal = moving_average_strategy(data)
    rsi_signal = rsi_strategy(data)
    bollinger_signal = bollinger_bands_strategy(data)
    return pd.DataFrame({'MA': ma_signal, 'RSI': rsi_signal, 'Bollinger': bollinger_signal})
def backtest_option_trades(option_chain, signals, stock_data):
    """
    Backtest option trades based on the given signals and stock data.
    """
    trades = []
    current_position = None
    # Ensure both stock_data and option_chain indices are sorted in ascending order
    stock_data = stock_data.sort_index()
    # Normalize signals to a single 1-D Series: both call sites pass an
    # already-weighted numpy array, so indexing it with ['MA'] would fail.
    # Accept a raw signal DataFrame too, using its 'MA' column.
    if isinstance(signals, pd.DataFrame):
        signals = signals['MA']
    sig_values = np.asarray(signals).ravel()
    signals = pd.Series(sig_values, index=stock_data.index[:len(sig_values)])
    # Convert 'lastTradeDate' or any date-related columns to datetime in option_chain
    if 'lastTradeDate' in option_chain.columns:
        option_chain['lastTradeDate'] = pd.to_datetime(option_chain['lastTradeDate'])
        option_chain = option_chain.set_index('lastTradeDate')
    # If option_chain index isn't datetime, convert it to datetime (ensuring compatibility)
    option_chain.index = pd.to_datetime(option_chain.index)
    # Remove the timezone from option_chain index
    option_chain.index = option_chain.index.tz_localize(None)
    # Now reindex the option chain to match the stock data index (forward fill missing option prices)
    option_chain = option_chain.sort_index()
    option_chain = option_chain.reindex(stock_data.index, method='ffill')
    for i in range(len(signals)):
        if signals.iloc[i] > 0 and current_position is None:
            # BUY signal (positive weighted signal, matching main_decision)
            entry_price = option_chain['lastPrice'].iloc[i]
            if pd.isna(entry_price):  # If price is nan, log the error and continue
                print(f"Missing entry price on {stock_data.index[i]}, skipping trade.")
                continue
            entry_date = stock_data.index[i]
            current_position = {
                'entry_price': entry_price,
                'entry_date': entry_date
            }
            print(f"BUY signal on {entry_date}: Entry Price = {entry_price}")
        elif signals.iloc[i] < 0 and current_position is not None:
            # SELL signal (negative weighted signal)
            exit_price = option_chain['lastPrice'].iloc[i]
            if pd.isna(exit_price):  # If price is nan, log the error and continue
                print(f"Missing exit price on {stock_data.index[i]}, skipping trade.")
                continue
            exit_date = stock_data.index[i]
            pnl = (exit_price - current_position['entry_price']) * 100
            print(f"SELL signal on {exit_date}: Exit Price = {exit_price}, P&L = {pnl}")
            trades.append({
                'entry_date': current_position['entry_date'],
                'entry_price': current_position['entry_price'],
                'exit_date': exit_date,
                'exit_price': exit_price,
                'pnl': pnl
            })
            current_position = None
    cumulative_pnl = sum(trade['pnl'] for trade in trades)
    total_wins = sum(1 for trade in trades if trade['pnl'] > 0)
    total_trades = len(trades)
    win_rate = total_wins / total_trades if total_trades > 0 else 0
    return cumulative_pnl, trades, win_rate
def objective_function_profit(weights, strategy_signals, data, option_chain):
    weights = np.array(weights)
    weights /= np.sum(weights)  # Normalize weights
    weighted_signals = np.sum([signal * weight for signal, weight in zip(strategy_signals.T.values, weights)], axis=0)
    # Since `backtest_option_trades` returns 3 values, we only unpack those
    cumulative_pnl, _, _ = backtest_option_trades(option_chain, weighted_signals, data)
    # Return negative cumulative P&L to maximize profit
    return -cumulative_pnl

def optimize_weights(strategy_signals, data, option_chain):
    initial_weights = [1 / len(strategy_signals.columns)] * len(strategy_signals.columns)
    constraints = ({'type': 'eq', 'fun': lambda weights: np.sum(weights) - 1})
    bounds = [(0, 1)] * len(strategy_signals.columns)
    result = minimize(objective_function_profit, initial_weights, args=(strategy_signals, data, option_chain),
                      method='SLSQP', bounds=bounds, constraints=constraints)
    return result.x  # Optimal weights

def weighted_signal_combination(strategy_signals, weights):
    weighted_signals = np.sum([signal * weight for signal, weight in zip(strategy_signals.T.values, weights)], axis=0)
    return weighted_signals

def main_decision(weighted_signals):
    last_signal = weighted_signals[-1]  # Latest signal
    if last_signal > 0:
        return "BUY"
    elif last_signal < 0:
        return "SELL"
    else:
        return "HOLD"

def run_backtest():
    ticker = ticker_info()
    expiration_dates = fetch_expiration_dates(ticker)
    expiration_date = select_expiration_date(expiration_dates)
    options_chain = fetch_option_chain(ticker, expiration_date)
    # Fetch training data
    train_data = get_price_data(ticker, '2010-01-01', '2022-01-01')
    # Generate signals
    strategy_signals_train = generate_signals(train_data)
    # Optimize weights
    optimal_weights = optimize_weights(strategy_signals_train, train_data, options_chain.calls)
    # Fetch test data
    test_data = get_price_data(ticker, '2022-01-02', '2024-01-01')
    # Generate test signals
    strategy_signals_test = generate_signals(test_data)
    # Combine signals and backtest
    weighted_signals = weighted_signal_combination(strategy_signals_test, optimal_weights)
    cumulative_pnl, trades, win_rate = backtest_option_trades(options_chain.calls, weighted_signals, test_data)
    # Make final decision
    decision = main_decision(weighted_signals)
    print(f"Final decision: {decision}")
    # Output results
    print(f"Cumulative P&L: {cumulative_pnl}")
    print(f"Win Rate: {win_rate * 100:.2f}%")

# Call the main function
run_backtest()
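The SLSQP weight search above is easy to sanity-check in isolation. Below is a minimal sketch, assuming a synthetic quadratic objective in place of objective_function_profit (the target mix [0.5, 0.3, 0.2] is made up for illustration); it exercises the same sum-to-one constraint and [0, 1] bounds that optimize_weights uses.

import numpy as np
from scipy.optimize import minimize

def toy_objective(weights):
    # Stand-in for objective_function_profit: distance from a hypothetical best mix
    target = np.array([0.5, 0.3, 0.2])
    return np.sum((np.array(weights) - target) ** 2)

n_strategies = 3
initial_weights = [1 / n_strategies] * n_strategies
constraints = ({'type': 'eq', 'fun': lambda w: np.sum(w) - 1})  # weights sum to 1
bounds = [(0, 1)] * n_strategies  # each weight stays in [0, 1]
result = minimize(toy_objective, initial_weights, method='SLSQP',
                  bounds=bounds, constraints=constraints)
print(result.x)  # should land near [0.5, 0.3, 0.2]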

File diff suppressed because it is too large

File diff suppressed because it is too large

View File

@@ -1,78 +0,0 @@
import pandas as pd
import numpy as np
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import mean_squared_error, mean_absolute_error
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
from tensorflow.keras.callbacks import EarlyStopping

# Load the training and testing data
training_data = pd.read_csv("3_years_training_data.csv")
testing_data = pd.read_csv("3_month_testing_data.csv")

# Drop unnecessary columns
training_data = training_data.drop(columns=["Unnamed: 0", "Date"])
testing_data = testing_data.drop(columns=["Unnamed: 0", "Date"])

# Create lagged features for the model
def create_lagged_features(data, n_lags=3):
    df = data.copy()
    for lag in range(1, n_lags + 1):
        df[f'Close_lag_{lag}'] = df['Close'].shift(lag)
    df.dropna(inplace=True)  # Remove rows with NaN values due to shifting
    return df

# Apply lagged features to the training and testing datasets
training_data = create_lagged_features(training_data)
testing_data = create_lagged_features(testing_data)

# Separate features and target
X_train = training_data.drop(columns=["Close"]).values
y_train = training_data["Close"].values
X_test = testing_data.drop(columns=["Close"]).values
y_test = testing_data["Close"].values

# Standardize the features
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# Build the neural network model
model = Sequential([
    Dense(64, activation='sigmoid', input_shape=(X_train.shape[1],)),
    Dense(32, activation='sigmoid'),
    Dense(16, activation='sigmoid'),
    Dense(1)  # Output layer for regression
])

# Compile the model
model.compile(optimizer='adam', loss='mse', metrics=['mae'])

# Use early stopping to prevent overfitting
early_stopping = EarlyStopping(monitor='val_loss', patience=10, restore_best_weights=True)

# Train the model
history = model.fit(
    X_train, y_train,
    epochs=100,
    batch_size=32,
    validation_split=0.2,
    callbacks=[early_stopping],
    verbose=1
)

# Evaluate the model on the test set
y_pred = model.predict(X_test).flatten()
mse = mean_squared_error(y_test, y_pred)
mae = mean_absolute_error(y_test, y_pred)
print(f"Neural Network MSE: {mse:.2f}")
print(f"Neural Network MAE: {mae:.2f}")

# Prepare the latest data to predict tomorrow's price
latest_data = testing_data.tail(1).drop(columns=["Close"])
latest_data_scaled = scaler.transform(latest_data)

# Predict tomorrow's close price
tomorrow_pred = model.predict(latest_data_scaled)
print(f"Predicted Close Price for Tomorrow: {tomorrow_pred[0][0]:.2f}")

View File

@@ -1,47 +0,0 @@
absl-py==2.1.0
astunparse==1.6.3
certifi==2024.8.30
charset-normalizer==3.4.0
flatbuffers==24.3.25
gast==0.6.0
google-pasta==0.2.0
grpcio==1.67.1
h5py==3.12.1
ibapi==9.81.1.post1
idna==3.10
importlib_metadata==8.5.0
joblib==1.4.2
keras==3.6.0
libclang==18.1.1
Markdown==3.7
markdown-it-py==3.0.0
MarkupSafe==3.0.2
mdurl==0.1.2
ml-dtypes==0.4.1
namex==0.0.8
numpy==2.0.2
opt_einsum==3.4.0
optree==0.13.0
packaging==24.1
pandas==2.2.3
protobuf==5.28.3
Pygments==2.18.0
python-dateutil==2.9.0.post0
pytz==2024.2
requests==2.32.3
rich==13.9.4
scikit-learn==1.5.2
scipy==1.13.1
six==1.16.0
tensorboard==2.18.0
tensorboard-data-server==0.7.2
tensorflow==2.18.0
tensorflow-io-gcs-filesystem==0.37.1
termcolor==2.5.0
threadpoolctl==3.5.0
typing_extensions==4.12.2
tzdata==2024.2
urllib3==2.2.3
Werkzeug==3.1.1
wrapt==1.16.0
zipp==3.20.2

View File

@@ -1,129 +0,0 @@
import pandas as pd
import matplotlib.pyplot as plt
import json
import os
import datetime
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score
from indicators import add_indicators
from strategy import generate_signals
from backtester import backtest
from optimizer import parameter_search
from indicator_sets import indicator_sets

def load_config(config_path="config.json"):
    with open(config_path, 'r') as f:
        return json.load(f)

def load_data(data_path):
    df = pd.read_csv(data_path, parse_dates=['Date'], index_col='Date')
    df = df.sort_index()
    required_cols = ['Open', 'High', 'Low', 'Close', 'Volume']
    if not all(col in df.columns for col in required_cols):
        raise ValueError("Data file must contain Date,Open,High,Low,Close,Volume columns.")
    return df

def visualize_data_with_indicators(df):
    fig, axes = plt.subplots(4, 1, figsize=(12, 10), sharex=True)
    axes[0].plot(df.index, df['Close'], label='Close', color='black')
    axes[0].plot(df.index, df['EMA'], label='EMA', color='blue', alpha=0.7)
    axes[0].set_title('Price and EMA')
    axes[0].legend()
    axes[1].plot(df.index, df['RSI'], label='RSI', color='green')
    axes[1].axhline(70, color='red', linestyle='--')
    axes[1].axhline(30, color='green', linestyle='--')
    axes[1].set_title('RSI')
    axes[2].plot(df.index, df['MACD'], label='MACD', color='purple')
    axes[2].axhline(0, color='red', linestyle='--')
    axes[2].set_title('MACD')
    axes[3].plot(df.index, df['ADX'], label='ADX', color='brown')
    axes[3].axhline(20, color='grey', linestyle='--')
    axes[3].axhline(25, color='grey', linestyle='--')
    axes[3].set_title('ADX')
    plt.tight_layout()
    plt.show()

def log_results(message, log_file="indicator_test_results.log"):
    timestamp = datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S")
    with open(log_file, "a") as f:
        f.write(f"{timestamp} - {message}\n")

def main():
    config = load_config("config.json")
    data_path = os.path.join("data", "SPY_5min_preprocessed.csv")
    df = load_data(data_path)
    # Add core indicators and visualize
    df = add_indicators(df, config)
    visualize_data_with_indicators(df)
    # Generate signals and backtest
    df = generate_signals(df, config)
    results = backtest(df, config)
    print("Backtest Results:")
    print(results)
    # Parameter optimization example
    param_grid = {
        "rsi_threshold_bearish": [65, 70, 75],
        "rsi_threshold_bullish": [25, 30, 35]
    }
    best_params, best_performance = parameter_search(df, config, param_grid)
    print("Best Parameters Found:", best_params)
    print("Best Performance (Final Equity):", best_performance)
    # Now test multiple indicator sets for classification accuracy
    log_file = "indicator_test_results.log"
    with open(log_file, "w") as f:
        f.write("Indicator Test Results Log\n")
    # Create prediction target: next candle up or down
    df['Future_Close'] = df['Close'].shift(-1)
    df['Up_Indicator'] = (df['Future_Close'] > df['Close']).astype(int)
    df = df.dropna(subset=['Future_Close'])
    train_size = int(len(df) * 0.7)
    df_train = df.iloc[:train_size].copy()
    df_test = df.iloc[train_size:].copy()
    for set_name, func in indicator_sets.items():
        # Apply the indicator set to train/test
        train = df_train.copy()
        test = df_test.copy()
        train = func(train)
        test = func(test)
        # Indicator warm-up periods leave NaNs; drop them before fitting
        train = train.dropna()
        # Ensure columns align
        test = test.reindex(columns=train.columns)
        test = test.dropna()
        if len(test) == 0 or len(train) == 0:
            log_results(f"{set_name}: Not enough data after adding indicators.", log_file)
            continue
        base_cols = ['Open', 'High', 'Low', 'Close', 'Volume', 'Future_Close', 'Up_Indicator']
        feature_cols = [c for c in train.columns if c not in base_cols]
        X_train = train[feature_cols]
        y_train = train['Up_Indicator']
        X_test = test[feature_cols]
        y_test = test['Up_Indicator']
        # Train a simple logistic regression model
        model = LogisticRegression(max_iter=1000)
        model.fit(X_train, y_train)
        y_pred = model.predict(X_test)
        acc = accuracy_score(y_test, y_pred)
        result_message = f"{set_name}: Accuracy = {acc:.4f}"
        print(result_message)
        log_results(result_message, log_file)

if __name__ == "__main__":
    main()

View File

@@ -1,32 +0,0 @@
{
  "data": {
    "input_csv": "data/SPY_5min_preprocessed.csv",
    "date_column": "Date",
    "price_column": "Close",
    "high_column": "High",
    "low_column": "Low",
    "volume_column": "Volume"
  },
  "indicators": {
    "trend": ["SMA", "EMA", "ADX"],
    "momentum": ["RSI", "MACD"],
    "volatility": ["BollingerBands"],
    "volume": ["OBV"],
    "mean_reversion": ["MeanReversionSignal"]
  },
  "parameters": {
    "SMA": {"window": 20},
    "EMA": {"window": 20},
    "ADX": {"window": 14},
    "RSI": {"window": 14, "overbought": 70, "oversold": 30},
    "MACD": {"fastperiod": 12, "slowperiod": 26, "signalperiod": 9},
    "BollingerBands": {"window": 20, "std_dev": 2},
    "OBV": {},
    "MeanReversionSignal": {"window": 10}
  },
  "evaluation": {
    "prediction_horizon": 1,
    "log_file": "logs/results.log"
  }
}

View File

@@ -1,32 +0,0 @@
{
  "data": {
    "input_csv": "data/price_data.csv",
    "date_column": "Date",
    "price_column": "Close",
    "high_column": "High",
    "low_column": "Low",
    "volume_column": "Volume"
  },
  "indicators": {
    "trend": ["SMA", "EMA", "ADX"],
    "momentum": ["RSI", "MACD"],
    "volatility": ["BollingerBands"],
    "volume": ["OBV"],
    "mean_reversion": ["MeanReversionSignal"]
  },
  "parameters": {
    "SMA": {"window": 20},
    "EMA": {"window": 20},
    "ADX": {"window": 14},
    "RSI": {"window": 14, "overbought": 70, "oversold": 30},
    "MACD": {"fastperiod": 12, "slowperiod": 26, "signalperiod": 9},
    "BollingerBands": {"window": 20, "std_dev": 2},
    "OBV": {},
    "MeanReversionSignal": {"window": 10}
  },
  "evaluation": {
    "prediction_horizon": 1,
    "log_file": "logs/results.log"
  }
}

File diff suppressed because it is too large

File diff suppressed because it is too large

File diff suppressed because it is too large

File diff suppressed because it is too large

View File

@@ -1,32 +0,0 @@
import numpy as np

def evaluate_indicator_accuracy(df, price_col="Close", horizon=1):
    """
    Evaluate how often indicator signals predict the correct next-day price direction.
    Logic:
    - If signal[i] = 1 (bullish), correct if price[i+horizon] > price[i].
    - If signal[i] = -1 (bearish), correct if price[i+horizon] < price[i].
    - If signal[i] = 0, skip.
    """
    correct = 0
    total = 0
    for i in range(len(df) - horizon):
        sig = df['signal'].iloc[i]
        if sig == 0:
            continue
        future_price = df[price_col].iloc[i + horizon]
        current_price = df[price_col].iloc[i]
        if sig == 1 and future_price > current_price:
            correct += 1
        elif sig == -1 and future_price < current_price:
            correct += 1
        total += 1  # every non-zero signal counts toward the total
    if total == 0:
        return np.nan  # No signals generated
    return correct / total
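The same accuracy can be computed without the Python loop; a minimal vectorized sketch under the same convention (it assumes a NaN-free price column, since the loop above treats NaN comparisons as incorrect rather than skipping them):

import numpy as np

def evaluate_indicator_accuracy_vectorized(df, price_col="Close", horizon=1):
    future = df[price_col].shift(-horizon)
    sig = df['signal']
    active = (sig != 0) & future.notna()  # non-zero signals with a known future price
    correct = ((sig == 1) & (future > df[price_col])) | ((sig == -1) & (future < df[price_col]))
    total = active.sum()
    return np.nan if total == 0 else (correct & active).sum() / total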

View File

@@ -1,96 +0,0 @@
import pandas as pd
import numpy as np
import ta

def calculate_indicator_signals(df, indicator_name, params, price_col="Close", high_col="High", low_col="Low", volume_col="Volume"):
    """
    Calculates indicator values and generates signals:
    Signal Convention: 1 = Bullish Prediction, -1 = Bearish Prediction, 0 = Neutral
    """
    if price_col not in df.columns:
        raise ValueError(f"{price_col} column not found in the dataframe.")
    if indicator_name == "SMA":
        # Trend: price > SMA => bullish, else bearish
        window = params.get("window", 20)
        df['SMA'] = df[price_col].rolling(window).mean()
        df['signal'] = np.where(df[price_col] > df['SMA'], 1, -1)
    elif indicator_name == "EMA":
        # Trend: price > EMA => bullish, else bearish
        window = params.get("window", 20)
        df['EMA'] = df[price_col].ewm(span=window, adjust=False).mean()
        df['signal'] = np.where(df[price_col] > df['EMA'], 1, -1)
    elif indicator_name == "ADX":
        # Trend: use ADXIndicator
        if high_col not in df.columns or low_col not in df.columns:
            raise ValueError("ADX calculation requires 'High' and 'Low' columns.")
        window = params.get("window", 14)
        adx_indicator = ta.trend.ADXIndicator(high=df[high_col], low=df[low_col], close=df[price_col], window=window)
        df['ADX'] = adx_indicator.adx()
        df['DIP'] = adx_indicator.adx_pos()  # +DI
        df['DIN'] = adx_indicator.adx_neg()  # -DI
        # If ADX > 25 and DI+ > DI- => bullish
        # If ADX > 25 and DI- > DI+ => bearish
        # Otherwise => no strong signal
        df['signal'] = 0
        trending_up = (df['DIP'] > df['DIN']) & (df['ADX'] > 25)
        trending_down = (df['DIN'] > df['DIP']) & (df['ADX'] > 25)
        df.loc[trending_up, 'signal'] = 1
        df.loc[trending_down, 'signal'] = -1
    elif indicator_name == "RSI":
        # Momentum: RSI > overbought => bearish, RSI < oversold => bullish
        window = params.get("window", 14)
        overbought = params.get("overbought", 70)
        oversold = params.get("oversold", 30)
        df['RSI'] = ta.momentum.rsi(df[price_col], window=window)
        conditions = [
            (df['RSI'] > overbought),
            (df['RSI'] < oversold)
        ]
        values = [-1, 1]
        df['signal'] = np.select(conditions, values, default=0)
    elif indicator_name == "MACD":
        # Momentum: MACD line > Signal line => bullish, else bearish
        fastperiod = params.get("fastperiod", 12)
        slowperiod = params.get("slowperiod", 26)
        signalperiod = params.get("signalperiod", 9)
        macd = ta.trend.MACD(df[price_col], window_slow=slowperiod, window_fast=fastperiod, window_sign=signalperiod)
        df['MACD'] = macd.macd()
        df['MACD_Signal'] = macd.macd_signal()
        df['signal'] = np.where(df['MACD'] > df['MACD_Signal'], 1, -1)
    elif indicator_name == "BollingerBands":
        # Volatility: price near upper band => bearish, near lower band => bullish
        window = params.get("window", 20)
        std_dev = params.get("std_dev", 2)
        bb = ta.volatility.BollingerBands(df[price_col], window=window, window_dev=std_dev)
        df['BB_High'] = bb.bollinger_hband()
        df['BB_Low'] = bb.bollinger_lband()
        df['signal'] = np.where(df[price_col] >= df['BB_High'], -1,
                                np.where(df[price_col] <= df['BB_Low'], 1, 0))
    elif indicator_name == "OBV":
        # Volume: Rising OBV => bullish, falling OBV => bearish
        if volume_col not in df.columns:
            raise ValueError(f"OBV calculation requires '{volume_col}' column.")
        df['OBV'] = ta.volume.on_balance_volume(df[price_col], df[volume_col])
        df['OBV_Change'] = df['OBV'].diff()
        df['signal'] = np.where(df['OBV_Change'] > 0, 1, np.where(df['OBV_Change'] < 0, -1, 0))
    elif indicator_name == "MeanReversionSignal":
        # Mean Reversion: price > mean => bearish, price < mean => bullish
        window = params.get("window", 10)
        df['mean'] = df[price_col].rolling(window).mean()
        df['signal'] = np.where(df[price_col] > df['mean'], -1,
                                np.where(df[price_col] < df['mean'], 1, 0))
    else:
        raise ValueError(f"Unknown indicator: {indicator_name}")
    return df
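A quick way to exercise one branch of calculate_indicator_signals, assuming the ta package is installed; the random-walk prices are synthetic and exist only to produce a plausible RSI series:

import numpy as np
import pandas as pd

rng = np.random.default_rng(0)
df = pd.DataFrame({"Close": 100 + np.cumsum(rng.normal(0, 1, 300))})
df = calculate_indicator_signals(df, "RSI", {"window": 14, "overbought": 70, "oversold": 30})
print(df['signal'].value_counts())  # counts of bullish (1), bearish (-1), and neutral (0) calls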

View File

@@ -1,24 +0,0 @@
2024-12-13 22:07:39,152 - INFO - Category: trend, Indicator: SMA, Accuracy: 0.3166
2024-12-13 22:07:40,855 - INFO - Category: trend, Indicator: EMA, Accuracy: 0.3160
2024-12-13 22:10:04,274 - INFO - Category: trend, Indicator: SMA, Accuracy: 0.3166
2024-12-13 22:10:05,997 - INFO - Category: trend, Indicator: EMA, Accuracy: 0.3160
2024-12-13 22:10:07,745 - INFO - Category: trend, Indicator: ADX, Accuracy: 0.2696
2024-12-13 22:10:08,484 - INFO - Category: momentum, Indicator: RSI, Accuracy: 0.2495
2024-12-13 22:10:09,096 - INFO - Category: volatility, Indicator: BollingerBands, Accuracy: 0.3114
2024-12-13 22:10:11,937 - INFO - Category: volume, Indicator: OBV, Accuracy: 0.3167
2024-12-13 22:10:15,386 - INFO - Category: mean_reversion, Indicator: MeanReversionSignal, Accuracy: 0.3330
2024-12-13 22:12:44,520 - INFO - Category: trend, Indicator: SMA, Accuracy: 0.3166
2024-12-13 22:12:45,874 - INFO - Category: trend, Indicator: EMA, Accuracy: 0.3160
2024-12-13 22:12:47,913 - INFO - Category: trend, Indicator: ADX, Accuracy: 0.2696
2024-12-13 22:12:48,530 - INFO - Category: momentum, Indicator: RSI, Accuracy: 0.2495
2024-12-13 22:12:49,173 - INFO - Category: volatility, Indicator: BollingerBands, Accuracy: 0.3114
2024-12-13 22:12:51,230 - INFO - Category: volume, Indicator: OBV, Accuracy: 0.3167
2024-12-13 22:12:54,504 - INFO - Category: mean_reversion, Indicator: MeanReversionSignal, Accuracy: 0.3330
2024-12-13 22:23:17,293 - INFO - Category: trend, Indicator: SMA, Accuracy: 0.3166
2024-12-13 22:23:18,087 - INFO - Category: trend, Indicator: EMA, Accuracy: 0.3160
2024-12-13 22:23:19,409 - INFO - Category: trend, Indicator: ADX, Accuracy: 0.2696
2024-12-13 22:23:19,797 - INFO - Category: momentum, Indicator: RSI, Accuracy: 0.2495
2024-12-13 22:23:20,669 - INFO - Category: momentum, Indicator: MACD, Accuracy: 0.3184
2024-12-13 22:23:20,993 - INFO - Category: volatility, Indicator: BollingerBands, Accuracy: 0.3114
2024-12-13 22:23:21,786 - INFO - Category: volume, Indicator: OBV, Accuracy: 0.3167
2024-12-13 22:23:22,678 - INFO - Category: mean_reversion, Indicator: MeanReversionSignal, Accuracy: 0.3330

View File

@@ -1,8 +0,0 @@
2024-12-13 22:23:17,293 - INFO - Category: trend, Indicator: SMA, Accuracy: 0.3166
2024-12-13 22:23:18,087 - INFO - Category: trend, Indicator: EMA, Accuracy: 0.3160
2024-12-13 22:23:19,409 - INFO - Category: trend, Indicator: ADX, Accuracy: 0.2696
2024-12-13 22:23:19,797 - INFO - Category: momentum, Indicator: RSI, Accuracy: 0.2495
2024-12-13 22:23:20,669 - INFO - Category: momentum, Indicator: MACD, Accuracy: 0.3184
2024-12-13 22:23:20,993 - INFO - Category: volatility, Indicator: BollingerBands, Accuracy: 0.3114
2024-12-13 22:23:21,786 - INFO - Category: volume, Indicator: OBV, Accuracy: 0.3167
2024-12-13 22:23:22,678 - INFO - Category: mean_reversion, Indicator: MeanReversionSignal, Accuracy: 0.3330

View File

@@ -1,65 +0,0 @@
import json
import logging
import pandas as pd
import os
from indicators import calculate_indicator_signals
from evaluation import evaluate_indicator_accuracy

def setup_logging(log_path):
    os.makedirs(os.path.dirname(log_path), exist_ok=True)
    logging.basicConfig(
        filename=log_path,
        level=logging.INFO,
        format='%(asctime)s - %(levelname)s - %(message)s'
    )

def load_config(config_path="config.json"):
    with open(config_path, 'r') as f:
        config = json.load(f)
    return config

def load_data(csv_path, date_col, price_col):
    df = pd.read_csv(csv_path)
    df[date_col] = pd.to_datetime(df[date_col])
    df = df.sort_values(date_col).reset_index(drop=True)
    df = df.dropna(subset=[date_col, price_col])
    return df

if __name__ == "__main__":
    config = load_config("config.json")
    setup_logging(config["evaluation"]["log_file"])
    # Load data
    df = load_data(config["data"]["input_csv"],
                   config["data"]["date_column"],
                   config["data"]["price_column"])
    # Calculate indicators and signals, evaluate accuracy
    all_results = []
    for category, indicators in config["indicators"].items():
        for ind_name in indicators:
            params = config["parameters"].get(ind_name, {})
            signals_df = calculate_indicator_signals(
                df.copy(),
                indicator_name=ind_name,
                params=params,
                price_col=config["data"]["price_column"],
                high_col=config["data"]["high_column"],
                low_col=config["data"]["low_column"],
                volume_col=config["data"]["volume_column"]
            )
            accuracy = evaluate_indicator_accuracy(
                signals_df,
                price_col=config["data"]["price_column"],
                horizon=config["evaluation"]["prediction_horizon"]
            )
            logging.info(f"Category: {category}, Indicator: {ind_name}, Accuracy: {accuracy:.4f}")
            all_results.append((category, ind_name, accuracy))
    # Print results to console as well
    for category, ind_name, acc in all_results:
        print(f"Category: {category}, Indicator: {ind_name}, Accuracy: {acc:.4f}")

View File

@@ -1,233 +0,0 @@
import signal
from ibapi.client import EClient
from ibapi.wrapper import EWrapper
from ibapi.contract import Contract
import threading
import time
import pandas as pd
from datetime import datetime, timedelta, timezone
from tqdm import tqdm  # For progress bar
import os

class IBApi(EWrapper, EClient):
    def __init__(self):
        EClient.__init__(self, self)
        self.data = []
        self.df = pd.DataFrame()
        self.data_retrieved = False

    def historicalData(self, reqId, bar):
        # Debug: Print each received bar
        print(f"Received bar: Date={bar.date}, Open={bar.open}, High={bar.high}, Low={bar.low}, Close={bar.close}, Volume={bar.volume}")
        self.data.append({
            "Date": bar.date,
            "Open": bar.open,
            "High": bar.high,
            "Low": bar.low,
            "Close": bar.close,
            "Volume": bar.volume
        })

    def historicalDataEnd(self, reqId, start, end):
        # Debug: Indicate end of data reception
        print(f"HistoricalDataEnd received. Start: {start}, End: {end}. Number of bars fetched: {len(self.data)}")
        chunk_df = pd.DataFrame(self.data)
        if not chunk_df.empty:
            self.df = pd.concat([self.df, chunk_df], ignore_index=True)
        else:
            print("No data received in this request.")
        self.data_retrieved = True
        self.data = []  # Reset data list for next request

class IBApp:
    def __init__(self):
        self.app = IBApi()

    def connect(self):
        # Connect to IB API (ensure IB Gateway or TWS is running)
        print("Connecting to IB API...")
        self.app.connect("127.0.0.1", 4002, clientId=1)
        # Start the API thread
        thread = threading.Thread(target=self.run_app, daemon=True)
        thread.start()
        time.sleep(1)  # Allow time for connection
        print("Connected to IB API.")

    def run_app(self):
        self.app.run()

    def request_data(self, contract, end_date, duration, bar_size):
        # Request historical data
        print(f"Requesting data: endDateTime={end_date}, durationStr={duration}, barSizeSetting={bar_size}")
        self.app.reqHistoricalData(
            reqId=1,
            contract=contract,
            endDateTime=end_date,
            durationStr=duration,
            barSizeSetting=bar_size,
            whatToShow="TRADES",
            useRTH=1,  # Use regular trading hours
            formatDate=1,
            keepUpToDate=False,
            chartOptions=[]
        )
        # Wait until data is retrieved
        while not self.app.data_retrieved:
            time.sleep(0.1)
        self.app.data_retrieved = False  # Reset flag for next request

    def fetch_historical_data_yearly(self, symbol, sec_type, exchange, currency, start_date, end_date, bar_size="1 day"):
        """
        Fetch historical data in yearly chunks to cover 3 years.
        """
        try:
            contract = Contract()
            contract.symbol = symbol
            contract.secType = sec_type
            contract.exchange = exchange
            contract.currency = currency
            delta = timedelta(days=365)
            current_end_date = end_date
            total_years = 3  # Fetch 3 years of data
            with tqdm(total=total_years, desc="Fetching Data", unit="year") as pbar:
                for _ in range(total_years):
                    current_start_date = current_end_date - delta
                    end_date_str = current_end_date.strftime("%Y%m%d %H:%M:%S UTC")
                    self.request_data(contract, end_date_str, "1 Y", bar_size)
                    pbar.update(1)
                    current_end_date = current_start_date
                    time.sleep(1)  # Respect IB API pacing
        except Exception as e:
            print(f"Error fetching data: {e}")

    def fetch_historical_data(self, symbol, sec_type, exchange, currency, existing_df=None):
        """
        Fetch historical data for the given symbol.
        If existing_df is provided, fetch data after the last date in existing_df.
        Otherwise, fetch the entire 3 years of data.
        """
        try:
            contract = Contract()
            contract.symbol = symbol
            contract.secType = sec_type
            contract.exchange = exchange
            contract.currency = currency
            bar_size = "1 day"  # Set bar size to 1 day for daily data
            duration = "1 Y"  # Fetch 1 year at a time
            if existing_df is not None and not existing_df.empty:
                # Get the last date from existing data
                last_date_str = existing_df['Date'].iloc[-1]
                # Collapse any double spaces so the date string has a single space
                last_date_str = last_date_str.strip().replace('  ', ' ')
                # Parse the last date as timezone-aware datetime (assuming UTC)
                try:
                    # Try parsing in 'YYYYMMDD HH:MM:SS' format
                    last_date = datetime.strptime(last_date_str, "%Y%m%d %H:%M:%S").replace(tzinfo=timezone.utc)
                except ValueError:
                    try:
                        # If that fails, try 'YYYY-MM-DD HH:MM:SS' format
                        last_date = datetime.strptime(last_date_str, "%Y-%m-%d %H:%M:%S").replace(tzinfo=timezone.utc)
                    except ValueError:
                        print(f"Error parsing last_date_str: {last_date_str}")
                        return
                # Remove any future dates if present
                current_time = datetime.now(timezone.utc)
                existing_df = existing_df[existing_df['Date'] <= current_time]
                print(f"Last valid date after cleaning: {last_date.strftime('%Y-%m-%d %H:%M:%S')}")
                # Fetch new data in yearly chunks
                # Since we need 3 years of data, and assuming existing_df has some, adjust accordingly
                # For simplicity, fetch the entire 3 years again
                # Alternatively, fetch data from last_date forward
                # Here, we'll fetch 3 years of data up to current_date
                end_date = datetime.now(timezone.utc)
                start_date = end_date - timedelta(days=365 * 3)
                self.fetch_historical_data_yearly(symbol, sec_type, exchange, currency, start_date, end_date, bar_size)
            else:
                # No existing data, fetch all 3 years
                end_date = datetime.now(timezone.utc)
                self.fetch_historical_data_yearly(symbol, sec_type, exchange, currency, end_date - timedelta(days=365 * 3), end_date, bar_size)
        except Exception as e:
            print(f"Error fetching data: {e}")

    def disconnect(self):
        self.app.disconnect()
        print("Disconnected from IB API.")

def get_user_input():
    print("Provide the stock details for historical data retrieval.")
    try:
        symbol = input("Enter the stock symbol (e.g., 'AAPL'): ").strip().upper()
        sec_type = "STK"  # Automatically set to Stock
        exchange = "SMART"  # Automatically set to SMART routing
        currency = "USD"  # Automatically set to USD
        if not symbol:
            raise ValueError("Stock symbol is required. Please try again.")
        return symbol, sec_type, exchange, currency
    except Exception as e:
        print(f"Input Error: {e}")
        return None

def graceful_exit(signal_received, frame):
    print("\nTerminating program...")
    app.disconnect()
    exit(0)

# Handle graceful exit on Ctrl+C
signal.signal(signal.SIGINT, graceful_exit)

# Initialize and connect the IBApp
app = IBApp()
app.connect()

try:
    user_input = get_user_input()
    if user_input:
        symbol, sec_type, exchange, currency = user_input
        # Define the filename (save directly in current directory)
        filename = f"{symbol}_3yr_daily_data.csv"
        # Fetch historical data
        app.fetch_historical_data(symbol, sec_type, exchange, currency)
        # Retrieve fetched data
        data = app.app.df
        if not data.empty:
            print(f"Number of data points fetched: {len(data)}")
            # Clean and parse the 'Date' column
            # Attempt multiple formats
            data['Date'] = pd.to_datetime(data['Date'], errors='coerce')
            # Check if timezone is present; if not, localize to UTC
            if data['Date'].dt.tz is None:
                data['Date'] = data['Date'].dt.tz_localize(timezone.utc, ambiguous='NaT', nonexistent='NaT')
            # Remove any rows with NaT in 'Date'
            data.dropna(subset=['Date'], inplace=True)
            # Sort by 'Date' ascending
            data.sort_values(by='Date', inplace=True)
            # Reset index
            data.reset_index(drop=True, inplace=True)
            # Save to CSV
            data.to_csv(filename, index=False)
            print(f"Data saved to {filename}.")
            print(data.head())
        else:
            print("No data retrieved.")
except Exception as e:
    print(f"Error: {e}")
finally:
    app.disconnect()

View File

@@ -1,144 +0,0 @@
import signal
from ibapi.client import EClient
from ibapi.wrapper import EWrapper
from ibapi.contract import Contract
import threading
import time
import pandas as pd
from datetime import datetime, timedelta, timezone
from tqdm import tqdm  # For progress bar

class IBApi(EWrapper, EClient):
    def __init__(self):
        EClient.__init__(self, self)
        self.data = []
        self.df = pd.DataFrame()
        self.data_retrieved = False

    def historicalData(self, reqId, bar):
        self.data.append({
            "Date": bar.date,
            "Open": bar.open,
            "High": bar.high,
            "Low": bar.low,
            "Close": bar.close,
            "Volume": bar.volume
        })

    def historicalDataEnd(self, reqId, start, end):
        chunk_df = pd.DataFrame(self.data)
        self.df = pd.concat([self.df, chunk_df], ignore_index=True)
        self.data_retrieved = True
        self.data = []

class IBApp:
    def __init__(self):
        self.app = IBApi()

    def connect(self):
        self.app.connect("127.0.0.1", 4002, clientId=1)
        thread = threading.Thread(target=self.run_app, daemon=True)
        thread.start()
        time.sleep(1)

    def run_app(self):
        self.app.run()
    def request_data(self, contract, end_date, duration, bar_size):
        self.app.reqHistoricalData(
            reqId=1,
            contract=contract,
            endDateTime=end_date,
            durationStr=duration,
            barSizeSetting=bar_size,
            whatToShow="TRADES",
            useRTH=0,
            formatDate=1,
            keepUpToDate=False,
            chartOptions=[]
        )
        # Ensure pacing between API calls
        while not self.app.data_retrieved:
            time.sleep(0.1)
        self.app.data_retrieved = False  # Reset the flag so the next request blocks correctly
    def fetch_historical_data(self, symbol, sec_type, exchange, currency):
        try:
            contract = Contract()
            contract.symbol = symbol
            contract.secType = sec_type
            contract.exchange = exchange
            contract.currency = currency
            # Set duration and bar size
            duration = "1 D"  # 1 day chunks
            bar_size = "5 mins"  # 5-minute intervals
            end_date = datetime.now(timezone.utc)
            start_date = end_date - timedelta(days=365)  # Can multiply for more years
            total_days = (end_date - start_date).days
            with tqdm(total=total_days, desc="Fetching Data", unit="day") as pbar:
                current_date = end_date
                while current_date > start_date:
                    end_date_str = current_date.strftime("%Y%m%d %H:%M:%S UTC")
                    try:
                        self.request_data(contract, end_date_str, duration, bar_size)
                        pbar.update(1)
                        time.sleep(5)  # Sleep to avoid pacing violations
                    except Exception as e:
                        print(f"Error fetching data for {end_date_str}: {e}")
                    current_date -= timedelta(days=1)
        except Exception as e:
            print(f"Error fetching data: {e}")
    def disconnect(self):
        self.app.disconnect()

def get_user_input():
    print("Provide the stock details for historical data retrieval.")
    try:
        symbol = input("Enter the stock symbol (e.g., 'AAPL'): ").strip().upper()
        sec_type = "STK"  # Automatically set to Stock
        exchange = "SMART"  # Automatically set to SMART routing
        currency = "USD"  # Automatically set to USD
        if not symbol:
            raise ValueError("Stock symbol is required. Please try again.")
        return symbol, sec_type, exchange, currency
    except Exception as e:
        print(f"Input Error: {e}")
        return None

def graceful_exit(signal_received, frame):
    print("\nTerminating program...")
    app.disconnect()
    exit(0)

signal.signal(signal.SIGINT, graceful_exit)

app = IBApp()
app.connect()

try:
    user_input = get_user_input()
    if user_input:
        symbol, sec_type, exchange, currency = user_input
        app.fetch_historical_data(symbol, sec_type, exchange, currency)
        data = app.app.df
        if not data.empty:
            filename = f"{symbol}_1yr_5min_data.csv"
            data.to_csv(filename, index=False)
            print(f"Data saved to {filename}.")
            print(data.head())
        else:
            print("No data retrieved.")
except Exception as e:
    print(f"Error: {e}")
finally:
    app.disconnect()

View File

@@ -1,24 +0,0 @@
import pandas as pd

# Step 1: Load the data
# Define the path to your CSV file
csv_file_path = 'C:/Users/gwitt/MidasTechnologies/API/SPY_3yr_5min_data.csv'  # Replace with your actual file path
df = pd.read_csv(csv_file_path)

# Step 2: Preprocess the data
# Parse the 'Date' column to datetime and set as index
df['Date'] = pd.to_datetime(df['Date'].str.strip(), format='%Y%m%d %H:%M:%S')
df.set_index('Date', inplace=True)
# Sort data in chronological order
df.sort_index(inplace=True)
# Handle missing data by forward filling
df.ffill(inplace=True)

# Step 3: Save preprocessed data to a new CSV file
preprocessed_file_path = 'SPY_5min_preprocessed.csv'  # Replace with your desired path
df.to_csv(preprocessed_file_path)
print(f"Preprocessed data saved to {preprocessed_file_path}")

View File

@@ -1,145 +0,0 @@
import signal
from ibapi.client import EClient
from ibapi.wrapper import EWrapper
from ibapi.contract import Contract
import threading
import time
import pandas as pd
from datetime import datetime, timezone
from tqdm import tqdm  # For progress bar

class IBApi(EWrapper, EClient):
    def __init__(self):
        EClient.__init__(self, self)
        self.data = []
        self.df = pd.DataFrame()
        self.data_retrieved = False

    def historicalData(self, reqId, bar):
        self.data.append({
            "Date": bar.date,
            "Open": bar.open,
            "High": bar.high,
            "Low": bar.low,
            "Close": bar.close,
            "Volume": bar.volume
        })

    def historicalDataEnd(self, reqId, start, end):
        chunk_df = pd.DataFrame(self.data)
        self.df = pd.concat([self.df, chunk_df], ignore_index=True)
        self.data_retrieved = True
        self.data = []

class IBApp:
    def __init__(self):
        self.app = IBApi()

    def connect(self):
        self.app.connect("127.0.0.1", 4002, clientId=1)
        thread = threading.Thread(target=self.run_app, daemon=True)
        thread.start()
        time.sleep(1)

    def run_app(self):
        self.app.run()
    def request_data(self, contract, end_date, duration, bar_size):
        self.app.reqHistoricalData(
            reqId=1,
            contract=contract,
            endDateTime=end_date,
            durationStr=duration,
            barSizeSetting=bar_size,
            whatToShow="TRADES",
            useRTH=0,
            formatDate=1,
            keepUpToDate=False,
            chartOptions=[]
        )
        # Ensure pacing between API calls
        while not self.app.data_retrieved:
            time.sleep(0.1)
        self.app.data_retrieved = False  # Reset the flag so the next request blocks correctly
    def fetch_options_data(self, symbol, exchange, currency, right, strike, expiry):
        try:
            contract = Contract()
            contract.symbol = symbol
            contract.secType = "OPT"  # Set security type to options
            contract.exchange = exchange
            contract.currency = currency
            contract.right = right  # 'C' for Call, 'P' for Put
            contract.strike = float(strike)  # Strike price
            contract.lastTradeDateOrContractMonth = expiry  # Expiry date in YYYYMMDD format
            # Set duration and bar size for options data
            duration = "1 D"  # 1 day chunks
            bar_size = "1 min"  # 1-minute intervals
            end_date = datetime.now(timezone.utc)
            # Since options data typically spans less than a year, we fetch for the expiry
            with tqdm(total=1, desc=f"Fetching {right} {strike} {expiry} data", unit="contract") as pbar:
                end_date_str = end_date.strftime("%Y%m%d %H:%M:%S UTC")
                try:
                    self.request_data(contract, end_date_str, duration, bar_size)
                    pbar.update(1)
                    time.sleep(15)  # Sleep to avoid pacing violations
                except Exception as e:
                    print(f"Error fetching data for contract {contract.symbol}: {e}")
        except Exception as e:
            print(f"Error fetching data: {e}")

    def disconnect(self):
        self.app.disconnect()

def get_user_input():
    print("Provide the options contract details for data retrieval.")
    try:
        symbol = input("Enter the stock symbol (e.g., 'AAPL'): ").strip().upper()
        exchange = "SMART"  # Automatically set to SMART routing
        currency = "USD"  # Automatically set to USD
        right = input("Enter the option type ('C' for Call, 'P' for Put): ").strip().upper()
        strike = input("Enter the strike price (e.g., '150'): ").strip()
        expiry = input("Enter the expiry date (YYYYMMDD): ").strip()
        if not all([symbol, right, strike, expiry]):
            raise ValueError("All fields are required. Please try again.")
        return symbol, exchange, currency, right, strike, expiry
    except Exception as e:
        print(f"Input Error: {e}")
        return None

def graceful_exit(signal_received, frame):
    print("\nTerminating program...")
    app.disconnect()
    exit(0)

signal.signal(signal.SIGINT, graceful_exit)

app = IBApp()
app.connect()

try:
    user_input = get_user_input()
    if user_input:
        symbol, exchange, currency, right, strike, expiry = user_input
        app.fetch_options_data(symbol, exchange, currency, right, strike, expiry)
        data = app.app.df
        if not data.empty:
            filename = f"{symbol}_{strike}_{right}_{expiry}_options_data.csv"
            data.to_csv(filename, index=False)
            print(f"Options data saved to {filename}.")
            print(data.head())
        else:
            print("No options data retrieved.")
except Exception as e:
    print(f"Error: {e}")
finally:
    app.disconnect()

View File

@@ -1,170 +0,0 @@
import signal
from ibapi.client import EClient
from ibapi.wrapper import EWrapper
from ibapi.contract import Contract
import threading
import time
import pandas as pd
from datetime import datetime, timedelta, timezone
import os

class IBApi(EWrapper, EClient):
    def __init__(self):
        EClient.__init__(self, self)
        self.data = []
        self.df = pd.DataFrame()
        self.data_retrieved = False

    def historicalData(self, reqId, bar):
        # Debug: Print each received bar
        print(f"Received bar: Date={bar.date}, Open={bar.open}, High={bar.high}, Low={bar.low}, Close={bar.close}, Volume={bar.volume}")
        self.data.append({
            "Date": bar.date,
            "Open": bar.open,
            "High": bar.high,
            "Low": bar.low,
            "Close": bar.close,
            "Volume": bar.volume
        })

    def historicalDataEnd(self, reqId, start, end):
        # Debug: Indicate end of data reception
        print(f"HistoricalDataEnd received. Start: {start}, End: {end}. Number of bars fetched: {len(self.data)}")
        chunk_df = pd.DataFrame(self.data)
        if not chunk_df.empty:
            self.df = pd.concat([self.df, chunk_df], ignore_index=True)
        else:
            print("No data received in this request.")
        self.data_retrieved = True
        self.data = []  # Reset data list for next request

class IBApp:
    def __init__(self):
        self.app = IBApi()

    def connect(self):
        # Connect to IB API (ensure IB Gateway or TWS is running)
        print("Connecting to IB API...")
        self.app.connect("127.0.0.1", 4002, clientId=1)
        # Start the API thread
        thread = threading.Thread(target=self.run_app, daemon=True)
        thread.start()
        time.sleep(1)  # Allow time for connection
        print("Connected to IB API.")

    def run_app(self):
        self.app.run()

    def request_data(self, contract, end_date, duration, bar_size):
        # Request historical data
        print(f"Requesting data: endDateTime={end_date}, durationStr={duration}, barSizeSetting={bar_size}")
        self.app.reqHistoricalData(
            reqId=1,
            contract=contract,
            endDateTime=end_date,
            durationStr=duration,
            barSizeSetting=bar_size,
            whatToShow="TRADES",
            useRTH=1,  # Use regular trading hours
            formatDate=1,
            keepUpToDate=False,
            chartOptions=[]
        )
        # Wait until data is retrieved
        while not self.app.data_retrieved:
            time.sleep(0.1)
        self.app.data_retrieved = False  # Reset flag for next request

    def fetch_recent_data(self, symbol, sec_type, exchange, currency):
        try:
            # Define the contract
            contract = Contract()
            contract.symbol = symbol
            contract.secType = sec_type
            contract.exchange = exchange
            contract.currency = currency
            # Set duration and bar size for last 2 days
            duration = "2 D"  # 2 days
            bar_size = "1 min"  # 1-minute intervals
            # Set end_date to now in UTC
            end_date = datetime.now(timezone.utc)
            end_date_str = end_date.strftime("%Y%m%d %H:%M:%S UTC")
            print(f"Fetching data up to {end_date_str} for the last {duration} with bar size {bar_size}")
            self.request_data(contract, end_date_str, duration, bar_size)
        except Exception as e:
            print(f"Error fetching data: {e}")

    def disconnect(self):
        self.app.disconnect()
        print("Disconnected from IB API.")

def get_user_input():
    print("Provide the stock details for historical data retrieval.")
    try:
        symbol = input("Enter the stock symbol (e.g., 'AAPL'): ").strip().upper()
        sec_type = "STK"  # Automatically set to Stock
        exchange = "SMART"  # Automatically set to SMART routing
        currency = "USD"  # Automatically set to USD
        if not symbol:
            raise ValueError("Stock symbol is required. Please try again.")
        return symbol, sec_type, exchange, currency
    except Exception as e:
        print(f"Input Error: {e}")
        return None

def graceful_exit(signal_received, frame):
    print("\nTerminating program...")
    app.disconnect()
    exit(0)

# Handle graceful exit on Ctrl+C
signal.signal(signal.SIGINT, graceful_exit)

# Initialize and connect the IBApp
app = IBApp()
app.connect()

try:
    user_input = get_user_input()
    if user_input:
        symbol, sec_type, exchange, currency = user_input
        # Define the filename (save directly in current directory)
        filename = f"{symbol}_recent_data.csv"
        # Fetch recent data (last 2 days)
        app.fetch_recent_data(symbol, sec_type, exchange, currency)
        # Retrieve fetched data
        data = app.app.df
        if not data.empty:
            print(f"Number of data points fetched: {len(data)}")
            # Clean and parse the 'Date' column
            # Attempt multiple formats
            data['Date'] = pd.to_datetime(data['Date'], errors='coerce')
            # Check if timezone is present; if not, localize to UTC
            if data['Date'].dt.tz is None:
                data['Date'] = data['Date'].dt.tz_localize(timezone.utc, ambiguous='NaT', nonexistent='NaT')
            # Remove any rows with NaT in 'Date'
            data.dropna(subset=['Date'], inplace=True)
            # Sort by 'Date' ascending
            data.sort_values(by='Date', inplace=True)
            # Save to CSV
            data.to_csv(filename, index=False)
            print(f"Data saved to {filename}.")
            print(data.tail())
        else:
            print("No new data fetched.")
except Exception as e:
    print(f"Error: {e}")
finally:
    app.disconnect()

View File

@@ -1,119 +0,0 @@
import ta
import pandas as pd
preprocessed_file_path = 'C:/Users/gwitt/MidasTechnologies/API/spy_1min_preprocessed.csv' # Replace with your file path
df = pd.read_csv(preprocessed_file_path, index_col='Date', parse_dates=True)
# **Trend Indicators**
# Simple Moving Averages
df['SMA_20'] = ta.trend.sma_indicator(close=df['Close'], window=20)
df['SMA_50'] = ta.trend.sma_indicator(close=df['Close'], window=50)
df['SMA_200'] = ta.trend.sma_indicator(close=df['Close'], window=200)
# Exponential Moving Averages
df['EMA_20'] = ta.trend.ema_indicator(close=df['Close'], window=20)
df['EMA_50'] = ta.trend.ema_indicator(close=df['Close'], window=50)
# MACD
macd = ta.trend.MACD(close=df['Close'], window_slow=26, window_fast=12, window_sign=9)
df['MACD'] = macd.macd()
df['MACD_Signal'] = macd.macd_signal()
df['MACD_Hist'] = macd.macd_diff()
# ADX
df['ADX_14'] = ta.trend.adx(high=df['High'], low=df['Low'], close=df['Close'], window=14)
# **Momentum Indicators**
# RSI
df['RSI_14'] = ta.momentum.rsi(close=df['Close'], window=14)
# Stochastic Oscillator
stoch = ta.momentum.StochasticOscillator(high=df['High'], low=df['Low'], close=df['Close'], window=14, smooth_window=3)
df['Stoch_%K'] = stoch.stoch()
df['Stoch_%D'] = stoch.stoch_signal()
# Rate of Change
df['ROC_10'] = ta.momentum.roc(close=df['Close'], window=10)
# **Volatility Indicators**
# Bollinger Bands
bollinger = ta.volatility.BollingerBands(close=df['Close'], window=20, window_dev=2)
df['Bollinger_High'] = bollinger.bollinger_hband()
df['Bollinger_Low'] = bollinger.bollinger_lband()
df['Bollinger_Middle'] = bollinger.bollinger_mavg()
# Average True Range
df['ATR_14'] = ta.volatility.average_true_range(high=df['High'], low=df['Low'], close=df['Close'], window=14)
# **Volume Indicators**
# On-Balance Volume
df['OBV'] = ta.volume.on_balance_volume(close=df['Close'], volume=df['Volume'])
# Volume Weighted Average Price
df['VWAP'] = ta.volume.volume_weighted_average_price(high=df['High'], low=df['Low'], close=df['Close'], volume=df['Volume'])
# Chaikin Money Flow
df['CMF_20'] = ta.volume.chaikin_money_flow(high=df['High'], low=df['Low'], close=df['Close'], volume=df['Volume'], window=20)
# **Composite Indicators**
# # Ichimoku Cloud
# ichimoku = ta.trend.IchimokuIndicator(high=df['High'], low=df['Low'], close=df['Close'], window1=9, window2=26, window3=52)
# df['Ichimoku_A'] = ichimoku.ichimoku_a()
# df['Ichimoku_B'] = ichimoku.ichimoku_b()
# df['Ichimoku_Base_Line'] = ichimoku.ichimoku_base_line()
# df['Ichimoku_Conversion_Line'] = ichimoku.ichimoku_conversion_line()
# Parabolic SAR
df['PSAR'] = ta.trend.psar_up(close=df['Close'], high=df['High'], low=df['Low'], step=0.02, max_step=0.2)
# **Classification Target:** 1 if next minute's close > current close, else 0
df['Target_Class'] = (df['Close'].shift(-1) > df['Close']).astype(int)
# **Regression Target:** Percentage change in close price
df['Target_Change'] = ((df['Close'].shift(-1) - df['Close']) / df['Close']) * 100
# Display targets
print("\nTarget Variables:")
print(df[['Close', 'Target_Class', 'Target_Change']].head())
# Define lag periods
lag_periods = [1, 2, 3]
# Create lagged features for key indicators
key_indicators = ['RSI_14', 'MACD', 'ADX_14', 'ATR_14', 'OBV', 'CMF_20']
for indicator in key_indicators:
    for lag in lag_periods:
        df[f'{indicator}_lag{lag}'] = df[indicator].shift(lag)
# Display lagged features
print("\nLagged Features:")
print(df[[f'RSI_14_lag{lag}' for lag in lag_periods]].head())
# Rolling mean of RSI over past 5 minutes
df['RSI_14_roll_mean_5'] = df['RSI_14'].rolling(window=5).mean()
# Rolling standard deviation of ATR over past 10 minutes
df['ATR_14_roll_std_10'] = df['ATR_14'].rolling(window=10).std()
# Display rolling features
print("\nRolling Features:")
print(df[['RSI_14_roll_mean_5', 'ATR_14_roll_std_10']].head())
# Interaction between MACD and RSI
df['MACD_RSI'] = df['MACD'] * df['RSI_14']
# Interaction between ATR and ADX
df['ATR_ADX'] = df['ATR_14'] * df['ADX_14']
# Display interaction features
print("\nInteraction Features:")
print(df[['MACD_RSI', 'ATR_ADX']].head())
# Save dataset with technical indicators
indicators_file_path = 'C:/Users/gwitt/MidasTechnologies/API/spy_1min_with_indicators.csv' # Replace with your desired path
df.to_csv(indicators_file_path)
print(f"Data with technical indicators saved to {indicators_file_path}")